``` ├── .all-contributorsrc ├── .cursorignore ├── .dockerignore ├── .github/ ├── workflows/ ├── ci-lume.yml ├── publish-agent.yml ├── publish-computer-server.yml ├── publish-computer.yml ├── publish-core.yml ├── publish-lume.yml ├── publish-mcp-server.yml ├── publish-pylume.yml ├── publish-som.yml ├── reusable-publish.yml ├── .gitignore ├── .vscode/ ├── launch.json ├── lume.code-workspace ├── py.code-workspace ├── CONTRIBUTING.md ├── Dockerfile ├── LICENSE.md ├── README.md ├── docs/ ├── Developer-Guide.md ├── FAQ.md ├── Telemetry.md ├── examples/ ├── agent_examples.py ├── agent_ui_examples.py ├── computer_examples.py ├── computer_ui_examples.py ├── pylume_examples.py ├── som_examples.py ├── utils.py ├── img/ ├── agent.png ├── agent_gradio_ui.png ├── cli.png ├── computer.png ├── logo_black.png ├── logo_white.png ├── libs/ ├── agent/ ├── README.md ├── agent/ ├── __init__.py ├── core/ ├── __init__.py ├── agent.py ├── base.py ├── callbacks.py ├── experiment.py ├── factory.py ├── messages.py ├── provider_config.py ├── telemetry.py ├── tools.py ├── tools/ ├── __init__.py ├── base.py ├── bash.py ├── collection.py ├── computer.py ├── edit.py ├── manager.py ├── types.py ├── visualization.py ``` ## /.all-contributorsrc ```all-contributorsrc path="/.all-contributorsrc" { "projectName": "cua", "projectOwner": "trycua", "files": [ "README.md" ], "commitType": "docs", "commitConvention": "angular", "contributorsPerLine": 7, "contributors": [ { "login": "f-trycua", "name": "f-trycua", "avatar_url": "https://avatars.githubusercontent.com/u/195596869?v=4", "profile": "https://github.com/f-trycua", "contributions": [ "code" ] }, { "login": "pepicrft", "name": "Pedro Piñera Buendía", "avatar_url": "https://avatars.githubusercontent.com/u/663605?v=4", "profile": "http://pepicrft.me", "contributions": [ "code" ] }, { "login": "aktech", "name": "Amit Kumar", "avatar_url": "https://avatars.githubusercontent.com/u/5647941?v=4", "profile": "https://iamit.in", "contributions": [ "code" ] }, 
{ "login": "jellydn", "name": "Dung Duc Huynh (Kaka)", "avatar_url": "https://avatars.githubusercontent.com/u/870029?v=4", "profile": "https://productsway.com/", "contributions": [ "code" ] }, { "login": "ShrootBuck", "name": "Zayd Krunz", "avatar_url": "https://avatars.githubusercontent.com/u/70227235?v=4", "profile": "http://zaydkrunz.com", "contributions": [ "code" ] }, { "login": "PrashantRaj18198", "name": "Prashant Raj", "avatar_url": "https://avatars.githubusercontent.com/u/23168997?v=4", "profile": "https://github.com/PrashantRaj18198", "contributions": [ "code" ] }, { "login": "Leland-Takamine", "name": "Leland Takamine", "avatar_url": "https://avatars.githubusercontent.com/u/847683?v=4", "profile": "https://www.mobile.dev", "contributions": [ "code" ] }, { "login": "ddupont808", "name": "ddupont", "avatar_url": "https://avatars.githubusercontent.com/u/3820588?v=4", "profile": "https://github.com/ddupont808", "contributions": [ "code" ] }, { "login": "Lizzard1123", "name": "Ethan Gutierrez", "avatar_url": "https://avatars.githubusercontent.com/u/46036335?v=4", "profile": "https://github.com/Lizzard1123", "contributions": [ "code" ] }, { "login": "RicterZ", "name": "Ricter Zheng", "avatar_url": "https://avatars.githubusercontent.com/u/5282759?v=4", "profile": "https://ricterz.me", "contributions": [ "code" ] }, { "login": "rahulkarajgikar", "name": "Rahul Karajgikar", "avatar_url": "https://avatars.githubusercontent.com/u/50844303?v=4", "profile": "https://www.trytruffle.ai/", "contributions": [ "code" ] }, { "login": "trospix", "name": "trospix", "avatar_url": "https://avatars.githubusercontent.com/u/81363696?v=4", "profile": "https://github.com/trospix", "contributions": [ "code" ] }, { "login": "eltociear", "name": "Ikko Eltociear Ashimine", "avatar_url": "https://avatars.githubusercontent.com/u/22633385?v=4", "profile": "https://wavee.world/invitation/b96d00e6-b802-4a1b-8a66-2e3854a01ffd", "contributions": [ "code" ] }, { "login": "dp221125", "name": 
"한석호(MilKyo)", "avatar_url": "https://avatars.githubusercontent.com/u/10572119?v=4", "profile": "https://github.com/dp221125", "contributions": [ "code" ] }, { "login": "rahimnathwani", "name": "Rahim Nathwani", "avatar_url": "https://avatars.githubusercontent.com/u/891558?v=4", "profile": "https://www.encona.com/", "contributions": [ "code" ] }, { "login": "mjspeck", "name": "Matt Speck", "avatar_url": "https://avatars.githubusercontent.com/u/20689127?v=4", "profile": "https://mjspeck.github.io/", "contributions": [ "code" ] } ] } ``` ## /.cursorignore ```cursorignore path="/.cursorignore" # Byte-compiled / optimized / DLL files __pycache__/ *.py[cod] *$py.class # C extensions *.so # Distribution / packaging .Python build/ !libs/lume/scripts/build/ develop-eggs/ dist/ downloads/ eggs/ .eggs/ lib/ lib64/ parts/ sdist/ var/ wheels/ share/python-wheels/ *.egg-info/ .installed.cfg *.egg MANIFEST # PyInstaller # Usually these files are written by a python script from a template # before PyInstaller builds the exe, so as to inject date/other infos into it. *.manifest *.spec # Installer logs pip-log.txt pip-delete-this-directory.txt # Unit test / coverage reports htmlcov/ .tox/ .nox/ .coverage .coverage.* .cache nosetests.xml coverage.xml *.cover *.py,cover .hypothesis/ .pytest_cache/ cover/ # Translations *.mo *.pot # Django stuff: *.log local_settings.py db.sqlite3 db.sqlite3-journal # Flask stuff: instance/ .webassets-cache # Scrapy stuff: .scrapy # Sphinx documentation docs/_build/ # PyBuilder .pybuilder/ target/ # Jupyter Notebook .ipynb_checkpoints # IPython profile_default/ ipython_config.py .pdm.toml .pdm-python .pdm-build/ # PEP 582; used by e.g. 
github.com/David-OConnor/pyflow and github.com/pdm-project/pdm __pypackages__/ # Celery stuff celerybeat-schedule celerybeat.pid # SageMath parsed files *.sage.py # Environments .env .venv env/ venv/ ENV/ env.bak/ venv.bak/ # Spyder project settings .spyderproject .spyproject # Rope project settings .ropeproject # mkdocs documentation /site # mypy .mypy_cache/ .dmypy.json dmypy.json # Scripts server/scripts/ # Pyre type checker .pyre/ # pytype static type analyzer .pytype/ # Cython debug symbols cython_debug/ # Ruff stuff: .ruff_cache/ # PyPI configuration file .pypirc # Conda .conda/ # Local environment .env.local # macOS DS_Store .DS_Store weights/ weights/icon_detect/ weights/icon_detect/model.pt weights/icon_detect/model.pt.zip weights/icon_detect/model.pt.zip.part* libs/omniparser/weights/icon_detect/model.pt # Example test data and output examples/test_data/ examples/output/ /screenshots/ /experiments/ /logs/ # Xcode # # gitignore contributors: remember to update Global/Xcode.gitignore, Objective-C.gitignore & Swift.gitignore ## User settings xcuserdata/ ## Obj-C/Swift specific *.hmap ## App packaging *.ipa *.dSYM.zip *.dSYM ## Playgrounds timeline.xctimeline playground.xcworkspace # Swift Package Manager # # Add this line if you want to avoid checking in source code from Swift Package Manager dependencies. # Packages/ # Package.pins # Package.resolved # *.xcodeproj # # Xcode automatically generates this directory with a .xcworkspacedata file and xcuserdata # hence it is not needed unless you have added a package configuration file to your project .swiftpm/ .build/ # CocoaPods # # We recommend against adding the Pods directory to your .gitignore. 
However # you should judge for yourself, the pros and cons are mentioned at: # https://guides.cocoapods.org/using/using-cocoapods.html#should-i-check-the-pods-directory-into-source-control # # Pods/ # # Add this line if you want to avoid checking in source code from the Xcode workspace # *.xcworkspace # Carthage # # Add this line if you want to avoid checking in source code from Carthage dependencies. # Carthage/Checkouts Carthage/Build/ # fastlane # # It is recommended to not store the screenshots in the git repo. # Instead, use fastlane to re-generate the screenshots whenever they are needed. # For more information about the recommended setup visit: # https://docs.fastlane.tools/best-practices/source-control/#source-control fastlane/report.xml fastlane/Preview.html fastlane/screenshots/**/*.png fastlane/test_output # Ignore folder ignore # .release .release/ ``` ## /.dockerignore ```dockerignore path="/.dockerignore" # Version control .git .github .gitignore # Environment and cache .venv .env .env.local __pycache__ *.pyc *.pyo *.pyd .Python .pytest_cache .pdm-build # Distribution / packaging dist build *.egg-info # Development .vscode .idea *.swp *.swo # Docs docs/site # Notebooks notebooks/.ipynb_checkpoints # Docker Dockerfile .dockerignore ``` ## /.github/workflows/ci-lume.yml ```yml path="/.github/workflows/ci-lume.yml" name: lume on: push: branches: - "main" pull_request: {} concurrency: group: lume-${{ github.workflow }}-${{ github.ref }} cancel-in-progress: true # Runner images: https://github.com/actions/runner-images jobs: test: name: Test runs-on: macos-15 steps: - uses: actions/checkout@v4 - run: uname -a - run: sudo xcode-select -s /Applications/Xcode_16.app # Swift 6.0 - run: swift test working-directory: ./libs/lume build: name: Release build runs-on: macos-15 steps: - uses: actions/checkout@v4 - run: uname -a - run: sudo xcode-select -s /Applications/Xcode_16.app # Swift 6.0 - run: swift build --configuration release working-directory: ./libs/lume 
``` ## /.github/workflows/publish-agent.yml ```yml path="/.github/workflows/publish-agent.yml" name: Publish Agent Package on: push: tags: - 'agent-v*' workflow_dispatch: inputs: version: description: 'Version to publish (without v prefix)' required: true default: '0.1.0' workflow_call: inputs: version: description: 'Version to publish' required: true type: string # Adding permissions at workflow level permissions: contents: write jobs: prepare: runs-on: macos-latest outputs: version: ${{ steps.get-version.outputs.version }} computer_version: ${{ steps.update-deps.outputs.computer_version }} som_version: ${{ steps.update-deps.outputs.som_version }} core_version: ${{ steps.update-deps.outputs.core_version }} steps: - uses: actions/checkout@v4 - name: Determine version id: get-version run: | if [ "${{ github.event_name }}" == "push" ]; then # Extract version from tag (for package-specific tags) if [[ "${{ github.ref }}" =~ ^refs/tags/agent-v([0-9]+\.[0-9]+\.[0-9]+) ]]; then VERSION=${BASH_REMATCH[1]} else echo "Invalid tag format for agent" exit 1 fi elif [ "${{ github.event_name }}" == "workflow_dispatch" ]; then # Use version from workflow dispatch VERSION=${{ github.event.inputs.version }} else # Use version from workflow_call VERSION=${{ inputs.version }} fi echo "VERSION=$VERSION" echo "version=$VERSION" >> $GITHUB_OUTPUT - name: Set up Python uses: actions/setup-python@v4 with: python-version: '3.10' - name: Update dependencies to latest versions id: update-deps run: | cd libs/agent # Install required package for PyPI API access pip install requests # Create a more robust Python script for PyPI version checking cat > get_latest_versions.py << 'EOF' import requests import json import sys def get_package_version(package_name, fallback="0.1.0"): try: response = requests.get(f'https://pypi.org/pypi/{package_name}/json') print(f"API Response Status for {package_name}: {response.status_code}", file=sys.stderr) if response.status_code != 200: print(f"API request 
failed for {package_name}, using fallback version", file=sys.stderr) return fallback data = json.loads(response.text) if 'info' not in data: print(f"Missing 'info' key in API response for {package_name}, using fallback version", file=sys.stderr) return fallback return data['info']['version'] except Exception as e: print(f"Error fetching version for {package_name}: {str(e)}", file=sys.stderr) return fallback # Get latest versions print(get_package_version('cua-computer')) print(get_package_version('cua-som')) print(get_package_version('cua-core')) EOF # Execute the script to get the versions VERSIONS=($(python get_latest_versions.py)) LATEST_COMPUTER=${VERSIONS[0]} LATEST_SOM=${VERSIONS[1]} LATEST_CORE=${VERSIONS[2]} echo "Latest cua-computer version: $LATEST_COMPUTER" echo "Latest cua-som version: $LATEST_SOM" echo "Latest cua-core version: $LATEST_CORE" # Output the versions for the next job echo "computer_version=$LATEST_COMPUTER" >> $GITHUB_OUTPUT echo "som_version=$LATEST_SOM" >> $GITHUB_OUTPUT echo "core_version=$LATEST_CORE" >> $GITHUB_OUTPUT # Determine major version for version constraint COMPUTER_MAJOR=$(echo $LATEST_COMPUTER | cut -d. -f1) SOM_MAJOR=$(echo $LATEST_SOM | cut -d. -f1) CORE_MAJOR=$(echo $LATEST_CORE | cut -d. 
-f1) NEXT_COMPUTER_MAJOR=$((COMPUTER_MAJOR + 1)) NEXT_SOM_MAJOR=$((SOM_MAJOR + 1)) NEXT_CORE_MAJOR=$((CORE_MAJOR + 1)) # Update dependencies in pyproject.toml if [[ "$OSTYPE" == "darwin"* ]]; then # macOS version of sed needs an empty string for -i sed -i '' "s/\"cua-computer>=.*,<.*\"/\"cua-computer>=$LATEST_COMPUTER,<$NEXT_COMPUTER_MAJOR.0.0\"/" pyproject.toml sed -i '' "s/\"cua-som>=.*,<.*\"/\"cua-som>=$LATEST_SOM,<$NEXT_SOM_MAJOR.0.0\"/" pyproject.toml sed -i '' "s/\"cua-core>=.*,<.*\"/\"cua-core>=$LATEST_CORE,<$NEXT_CORE_MAJOR.0.0\"/" pyproject.toml else # Linux version sed -i "s/\"cua-computer>=.*,<.*\"/\"cua-computer>=$LATEST_COMPUTER,<$NEXT_COMPUTER_MAJOR.0.0\"/" pyproject.toml sed -i "s/\"cua-som>=.*,<.*\"/\"cua-som>=$LATEST_SOM,<$NEXT_SOM_MAJOR.0.0\"/" pyproject.toml sed -i "s/\"cua-core>=.*,<.*\"/\"cua-core>=$LATEST_CORE,<$NEXT_CORE_MAJOR.0.0\"/" pyproject.toml fi # Display the updated dependencies echo "Updated dependencies in pyproject.toml:" grep -E "cua-computer|cua-som|cua-core" pyproject.toml publish: needs: prepare uses: ./.github/workflows/reusable-publish.yml with: package_name: "agent" package_dir: "libs/agent" version: ${{ needs.prepare.outputs.version }} is_lume_package: false base_package_name: "cua-agent" secrets: PYPI_TOKEN: ${{ secrets.PYPI_TOKEN }} set-env-variables: needs: [prepare, publish] runs-on: macos-latest steps: - name: Set environment variables for use in other jobs run: | echo "COMPUTER_VERSION=${{ needs.prepare.outputs.computer_version }}" >> $GITHUB_ENV echo "SOM_VERSION=${{ needs.prepare.outputs.som_version }}" >> $GITHUB_ENV echo "CORE_VERSION=${{ needs.prepare.outputs.core_version }}" >> $GITHUB_ENV ``` ## /.github/workflows/publish-computer-server.yml ```yml path="/.github/workflows/publish-computer-server.yml" name: Publish Computer Server Package on: push: tags: - 'computer-server-v*' workflow_dispatch: inputs: version: description: 'Version to publish (without v prefix)' required: true default: '0.1.0' workflow_call: 
inputs: version: description: 'Version to publish' required: true type: string outputs: version: description: "The version that was published" value: ${{ jobs.prepare.outputs.version }} # Adding permissions at workflow level permissions: contents: write jobs: prepare: runs-on: macos-latest outputs: version: ${{ steps.get-version.outputs.version }} steps: - uses: actions/checkout@v4 - name: Determine version id: get-version run: | if [ "${{ github.event_name }}" == "push" ]; then # Extract version from tag (for package-specific tags) if [[ "${{ github.ref }}" =~ ^refs/tags/computer-server-v([0-9]+\.[0-9]+\.[0-9]+) ]]; then VERSION=${BASH_REMATCH[1]} else echo "Invalid tag format for computer-server" exit 1 fi elif [ "${{ github.event_name }}" == "workflow_dispatch" ]; then # Use version from workflow dispatch VERSION=${{ github.event.inputs.version }} else # Use version from workflow_call VERSION=${{ inputs.version }} fi echo "VERSION=$VERSION" echo "version=$VERSION" >> $GITHUB_OUTPUT - name: Set up Python uses: actions/setup-python@v4 with: python-version: '3.10' publish: needs: prepare uses: ./.github/workflows/reusable-publish.yml with: package_name: "computer-server" package_dir: "libs/computer-server" version: ${{ needs.prepare.outputs.version }} is_lume_package: false base_package_name: "cua-computer-server" secrets: PYPI_TOKEN: ${{ secrets.PYPI_TOKEN }} set-env-variables: needs: [prepare, publish] runs-on: macos-latest steps: - name: Set environment variables for use in other jobs run: | echo "COMPUTER_VERSION=${{ needs.prepare.outputs.version }}" >> $GITHUB_ENV ``` ## /.github/workflows/publish-computer.yml ```yml path="/.github/workflows/publish-computer.yml" name: Publish Computer Package on: push: tags: - 'computer-v*' workflow_dispatch: inputs: version: description: 'Version to publish (without v prefix)' required: true default: '0.1.0' workflow_call: inputs: version: description: 'Version to publish' required: true type: string # Adding permissions at 
workflow level permissions: contents: write jobs: prepare: runs-on: macos-latest outputs: version: ${{ steps.get-version.outputs.version }} pylume_version: ${{ steps.update-deps.outputs.pylume_version }} core_version: ${{ steps.update-deps.outputs.core_version }} steps: - uses: actions/checkout@v4 - name: Determine version id: get-version run: | if [ "${{ github.event_name }}" == "push" ]; then # Extract version from tag (for package-specific tags) if [[ "${{ github.ref }}" =~ ^refs/tags/computer-v([0-9]+\.[0-9]+\.[0-9]+) ]]; then VERSION=${BASH_REMATCH[1]} else echo "Invalid tag format for computer" exit 1 fi elif [ "${{ github.event_name }}" == "workflow_dispatch" ]; then # Use version from workflow dispatch VERSION=${{ github.event.inputs.version }} else # Use version from workflow_call VERSION=${{ inputs.version }} fi echo "VERSION=$VERSION" echo "version=$VERSION" >> $GITHUB_OUTPUT - name: Set up Python uses: actions/setup-python@v4 with: python-version: '3.10' - name: Update dependencies to latest versions id: update-deps run: | cd libs/computer # Install required package for PyPI API access pip install requests # Create a more robust Python script for PyPI version checking cat > get_latest_versions.py << 'EOF' import requests import json import sys def get_package_version(package_name, fallback="0.1.0"): try: response = requests.get(f'https://pypi.org/pypi/{package_name}/json') print(f"API Response Status for {package_name}: {response.status_code}", file=sys.stderr) if response.status_code != 200: print(f"API request failed for {package_name}, using fallback version", file=sys.stderr) return fallback data = json.loads(response.text) if 'info' not in data: print(f"Missing 'info' key in API response for {package_name}, using fallback version", file=sys.stderr) return fallback return data['info']['version'] except Exception as e: print(f"Error fetching version for {package_name}: {str(e)}", file=sys.stderr) return fallback # Get latest versions 
print(get_package_version('pylume')) print(get_package_version('cua-core')) EOF # Execute the script to get the versions VERSIONS=($(python get_latest_versions.py)) LATEST_PYLUME=${VERSIONS[0]} LATEST_CORE=${VERSIONS[1]} echo "Latest pylume version: $LATEST_PYLUME" echo "Latest cua-core version: $LATEST_CORE" # Output the versions for the next job echo "pylume_version=$LATEST_PYLUME" >> $GITHUB_OUTPUT echo "core_version=$LATEST_CORE" >> $GITHUB_OUTPUT # Determine major version for version constraint CORE_MAJOR=$(echo $LATEST_CORE | cut -d. -f1) NEXT_CORE_MAJOR=$((CORE_MAJOR + 1)) # Update dependencies in pyproject.toml if [[ "$OSTYPE" == "darwin"* ]]; then # macOS version of sed needs an empty string for -i sed -i '' "s/\"pylume>=.*\"/\"pylume>=$LATEST_PYLUME\"/" pyproject.toml sed -i '' "s/\"cua-core>=.*,<.*\"/\"cua-core>=$LATEST_CORE,<$NEXT_CORE_MAJOR.0.0\"/" pyproject.toml else # Linux version sed -i "s/\"pylume>=.*\"/\"pylume>=$LATEST_PYLUME\"/" pyproject.toml sed -i "s/\"cua-core>=.*,<.*\"/\"cua-core>=$LATEST_CORE,<$NEXT_CORE_MAJOR.0.0\"/" pyproject.toml fi # Display the updated dependencies echo "Updated dependencies in pyproject.toml:" grep -E "pylume|cua-core" pyproject.toml publish: needs: prepare uses: ./.github/workflows/reusable-publish.yml with: package_name: "computer" package_dir: "libs/computer" version: ${{ needs.prepare.outputs.version }} is_lume_package: false base_package_name: "cua-computer" secrets: PYPI_TOKEN: ${{ secrets.PYPI_TOKEN }} set-env-variables: needs: [prepare, publish] runs-on: macos-latest steps: - name: Set environment variables for use in other jobs run: | echo "PYLUME_VERSION=${{ needs.prepare.outputs.pylume_version }}" >> $GITHUB_ENV echo "CORE_VERSION=${{ needs.prepare.outputs.core_version }}" >> $GITHUB_ENV ``` ## /.github/workflows/publish-core.yml ```yml path="/.github/workflows/publish-core.yml" name: Publish Core Package on: push: tags: - 'core-v*' workflow_dispatch: inputs: version: description: 'Version to publish 
(without v prefix)' required: true default: '0.1.0' workflow_call: inputs: version: description: 'Version to publish' required: true type: string # Adding permissions at workflow level permissions: contents: write jobs: prepare: runs-on: macos-latest outputs: version: ${{ steps.get-version.outputs.version }} steps: - uses: actions/checkout@v4 - name: Determine version id: get-version run: | if [ "${{ github.event_name }}" == "push" ]; then # Extract version from tag (for package-specific tags) if [[ "${{ github.ref }}" =~ ^refs/tags/core-v([0-9]+\.[0-9]+\.[0-9]+) ]]; then VERSION=${BASH_REMATCH[1]} else echo "Invalid tag format for core" exit 1 fi elif [ "${{ github.event_name }}" == "workflow_dispatch" ]; then # Use version from workflow dispatch VERSION=${{ github.event.inputs.version }} else # Use version from workflow_call VERSION=${{ inputs.version }} fi echo "VERSION=$VERSION" echo "version=$VERSION" >> $GITHUB_OUTPUT publish: needs: prepare uses: ./.github/workflows/reusable-publish.yml with: package_name: "core" package_dir: "libs/core" version: ${{ needs.prepare.outputs.version }} is_lume_package: false base_package_name: "cua-core" secrets: PYPI_TOKEN: ${{ secrets.PYPI_TOKEN }} ``` ## /.github/workflows/publish-lume.yml ```yml path="/.github/workflows/publish-lume.yml" name: Publish Notarized Lume on: push: tags: - 'lume-v*' workflow_dispatch: inputs: version: description: 'Version to notarize (without v prefix)' required: true default: '0.1.0' workflow_call: inputs: version: description: 'Version to notarize' required: true type: string secrets: APPLICATION_CERT_BASE64: required: true INSTALLER_CERT_BASE64: required: true CERT_PASSWORD: required: true APPLE_ID: required: true TEAM_ID: required: true APP_SPECIFIC_PASSWORD: required: true DEVELOPER_NAME: required: true permissions: contents: write env: APPLICATION_CERT_BASE64: ${{ secrets.APPLICATION_CERT_BASE64 }} INSTALLER_CERT_BASE64: ${{ secrets.INSTALLER_CERT_BASE64 }} CERT_PASSWORD: ${{ 
secrets.CERT_PASSWORD }} APPLE_ID: ${{ secrets.APPLE_ID }} TEAM_ID: ${{ secrets.TEAM_ID }} APP_SPECIFIC_PASSWORD: ${{ secrets.APP_SPECIFIC_PASSWORD }} DEVELOPER_NAME: ${{ secrets.DEVELOPER_NAME }} jobs: notarize: runs-on: macos-15 outputs: sha256_checksums: ${{ steps.generate_checksums.outputs.checksums }} version: ${{ steps.set_version.outputs.version }} steps: - uses: actions/checkout@v4 - name: Select Xcode 16 run: | sudo xcode-select -s /Applications/Xcode_16.app xcodebuild -version - name: Install dependencies run: | brew install cpio - name: Create .release directory run: mkdir -p .release - name: Set version id: set_version run: | # Determine version from tag or input (workflow_dispatch and workflow_call both surface the version via the inputs context) if [[ "$GITHUB_REF" == refs/tags/lume-v* ]]; then VERSION="${GITHUB_REF#refs/tags/lume-v}" echo "Using version from tag: $VERSION" elif [[ -n "${{ inputs.version }}" ]]; then VERSION="${{ inputs.version }}" echo "Using version from input: $VERSION" else echo "Error: No version found in tag or input" exit 1 fi # Update version in Main.swift echo "Updating version in Main.swift to $VERSION" sed -i '' "s/static let current: String = \".*\"/static let current: String = \"$VERSION\"/" libs/lume/src/Main.swift # Set output for later steps echo "version=$VERSION" >> $GITHUB_OUTPUT - name: Import Certificates env: APPLICATION_CERT_BASE64: ${{ secrets.APPLICATION_CERT_BASE64 }} INSTALLER_CERT_BASE64: ${{ secrets.INSTALLER_CERT_BASE64 }} CERT_PASSWORD: ${{ secrets.CERT_PASSWORD }} KEYCHAIN_PASSWORD: "temp_password" run: | # Create a temporary keychain security create-keychain -p "$KEYCHAIN_PASSWORD" build.keychain security default-keychain -s build.keychain security unlock-keychain -p "$KEYCHAIN_PASSWORD" build.keychain security set-keychain-settings -t 3600 -l build.keychain # Import certificates echo $APPLICATION_CERT_BASE64 | base64 --decode > application.p12 echo
$INSTALLER_CERT_BASE64 | base64 --decode > installer.p12 # Import certificates silently (minimize output) security import application.p12 -k build.keychain -P "$CERT_PASSWORD" -T /usr/bin/codesign -T /usr/bin/pkgbuild > /dev/null 2>&1 security import installer.p12 -k build.keychain -P "$CERT_PASSWORD" -T /usr/bin/codesign -T /usr/bin/pkgbuild > /dev/null 2>&1 # Allow codesign to access the certificates (minimal output) security set-key-partition-list -S apple-tool:,apple:,codesign: -s -k "$KEYCHAIN_PASSWORD" build.keychain > /dev/null 2>&1 # Verify certificates were imported but only show count, not details echo "Verifying signing identity (showing count only)..." security find-identity -v -p codesigning | grep -c "valid identities found" || true # Clean up certificate files rm application.p12 installer.p12 - name: Build and Notarize id: build_notarize env: APPLE_ID: ${{ secrets.APPLE_ID }} TEAM_ID: ${{ secrets.TEAM_ID }} APP_SPECIFIC_PASSWORD: ${{ secrets.APP_SPECIFIC_PASSWORD }} # These will now reference the imported certificates CERT_APPLICATION_NAME: "Developer ID Application: ${{ secrets.DEVELOPER_NAME }} (${{ secrets.TEAM_ID }})" CERT_INSTALLER_NAME: "Developer ID Installer: ${{ secrets.DEVELOPER_NAME }} (${{ secrets.TEAM_ID }})" VERSION: ${{ steps.set_version.outputs.version }} working-directory: ./libs/lume run: | # Minimal debug information echo "Starting build process..." echo "Swift version: $(swift --version | head -n 1)" echo "Building version: $VERSION" # Ensure .release directory exists mkdir -p .release chmod 755 .release # Build the project first (redirect verbose output) echo "Building project..." swift build --configuration release > build.log 2>&1 echo "Build completed." # Run the notarization script with LOG_LEVEL env var chmod +x scripts/build/build-release-notarized.sh cd scripts/build LOG_LEVEL=minimal ./build-release-notarized.sh # Return to the lume directory cd ../.. 
# Debug: List what files were actually created echo "Files in .release directory:" find .release -type f -name "*.tar.gz" -o -name "*.pkg.tar.gz" # Get architecture for output filename ARCH=$(uname -m) OS_IDENTIFIER="darwin-${ARCH}" # Output paths for later use echo "tarball_path=.release/lume-${VERSION}-${OS_IDENTIFIER}.tar.gz" >> $GITHUB_OUTPUT echo "pkg_path=.release/lume-${VERSION}-${OS_IDENTIFIER}.pkg.tar.gz" >> $GITHUB_OUTPUT - name: Generate SHA256 Checksums id: generate_checksums working-directory: ./libs/lume/.release run: | # Use existing checksums file if it exists, otherwise generate one if [ -f "checksums.txt" ]; then echo "Using existing checksums file" cat checksums.txt else echo "## SHA256 Checksums" > checksums.txt echo '\`\`\`' >> checksums.txt shasum -a 256 lume-*.tar.gz >> checksums.txt echo '\`\`\`' >> checksums.txt fi checksums=$(cat checksums.txt) echo "checksums<<EOF" >> $GITHUB_OUTPUT echo "$checksums" >> $GITHUB_OUTPUT echo "EOF" >> $GITHUB_OUTPUT # Debug: Show all files in the release directory echo "All files in release directory:" ls -la - name: Create Standard Version Releases working-directory: ./libs/lume/.release run: | VERSION=${{ steps.set_version.outputs.version }} ARCH=$(uname -m) OS_IDENTIFIER="darwin-${ARCH}" # Create OS-tagged symlinks ln -sf "lume-${VERSION}-${OS_IDENTIFIER}.tar.gz" "lume-darwin.tar.gz" ln -sf "lume-${VERSION}-${OS_IDENTIFIER}.pkg.tar.gz" "lume-darwin.pkg.tar.gz" # Create simple symlinks ln -sf "lume-${VERSION}-${OS_IDENTIFIER}.tar.gz" "lume.tar.gz" ln -sf "lume-${VERSION}-${OS_IDENTIFIER}.pkg.tar.gz" "lume.pkg.tar.gz" # List all files (including symlinks) echo "Files with symlinks in release directory:" ls -la - name: Upload Notarized Package (Tarball) uses: actions/upload-artifact@v4 with: name: lume-notarized-tarball path: ./libs/lume/${{ steps.build_notarize.outputs.tarball_path }} if-no-files-found: error - name: Upload Notarized Package (Installer) uses: actions/upload-artifact@v4 with: name:
lume-notarized-installer path: ./libs/lume/${{ steps.build_notarize.outputs.pkg_path }} if-no-files-found: error - name: Create Release if: startsWith(github.ref, 'refs/tags/lume-v') uses: softprops/action-gh-release@v1 with: files: | ./libs/lume/${{ steps.build_notarize.outputs.tarball_path }} ./libs/lume/${{ steps.build_notarize.outputs.pkg_path }} ./libs/lume/.release/lume-darwin.tar.gz ./libs/lume/.release/lume-darwin.pkg.tar.gz ./libs/lume/.release/lume.tar.gz ./libs/lume/.release/lume.pkg.tar.gz body: | ${{ steps.generate_checksums.outputs.checksums }} ### Installation with script /bin/bash -c "$(curl -fsSL https://raw.githubusercontent.com/trycua/cua/main/libs/lume/scripts/install.sh)" \`\`\` generate_release_notes: true make_latest: true ``` ## /.github/workflows/publish-mcp-server.yml ```yml path="/.github/workflows/publish-mcp-server.yml" name: Publish MCP Server Package on: push: tags: - 'mcp-server-v*' workflow_dispatch: inputs: version: description: 'Version to publish (without v prefix)' required: true default: '0.1.0' workflow_call: inputs: version: description: 'Version to publish' required: true type: string outputs: version: description: "The version that was published" value: ${{ jobs.prepare.outputs.version }} # Adding permissions at workflow level permissions: contents: write jobs: prepare: runs-on: macos-latest outputs: version: ${{ steps.get-version.outputs.version }} agent_version: ${{ steps.update-deps.outputs.agent_version }} computer_version: ${{ steps.update-deps.outputs.computer_version }} steps: - uses: actions/checkout@v4 - name: Determine version id: get-version run: | if [ "${{ github.event_name }}" == "push" ]; then # Extract version from tag (for package-specific tags) if [[ "${{ github.ref }}" =~ ^refs/tags/mcp-server-v([0-9]+\.[0-9]+\.[0-9]+) ]]; then VERSION=${BASH_REMATCH[1]} else echo "Invalid tag format for mcp-server" exit 1 fi elif [ "${{ github.event_name }}" == "workflow_dispatch" ]; then # Use version from workflow 
dispatch VERSION=${{ github.event.inputs.version }} else # Use version from workflow_call VERSION=${{ inputs.version }} fi echo "VERSION=$VERSION" echo "version=$VERSION" >> $GITHUB_OUTPUT - name: Set up Python uses: actions/setup-python@v4 with: python-version: '3.10' - name: Update dependencies to latest versions id: update-deps run: | cd libs/mcp-server # Install required package for PyPI API access pip install requests # Create a Python script for PyPI version checking cat > get_latest_versions.py << 'EOF' import requests import json import sys def get_package_version(package_name, fallback="0.1.0"): try: response = requests.get(f'https://pypi.org/pypi/{package_name}/json') print(f"API Response Status for {package_name}: {response.status_code}", file=sys.stderr) if response.status_code != 200: print(f"API request failed for {package_name}, using fallback version", file=sys.stderr) return fallback data = json.loads(response.text) if 'info' not in data: print(f"Missing 'info' key in API response for {package_name}, using fallback version", file=sys.stderr) return fallback return data['info']['version'] except Exception as e: print(f"Error fetching version for {package_name}: {str(e)}", file=sys.stderr) return fallback # Get latest versions print(get_package_version('cua-agent')) print(get_package_version('cua-computer')) EOF # Execute the script to get the versions VERSIONS=($(python get_latest_versions.py)) LATEST_AGENT=${VERSIONS[0]} LATEST_COMPUTER=${VERSIONS[1]} echo "Latest cua-agent version: $LATEST_AGENT" echo "Latest cua-computer version: $LATEST_COMPUTER" # Output the versions for the next job echo "agent_version=$LATEST_AGENT" >> $GITHUB_OUTPUT echo "computer_version=$LATEST_COMPUTER" >> $GITHUB_OUTPUT # Determine major version for version constraint AGENT_MAJOR=$(echo $LATEST_AGENT | cut -d. -f1) COMPUTER_MAJOR=$(echo $LATEST_COMPUTER | cut -d. 
-f1) NEXT_AGENT_MAJOR=$((AGENT_MAJOR + 1)) NEXT_COMPUTER_MAJOR=$((COMPUTER_MAJOR + 1)) # Update dependencies in pyproject.toml if [[ "$OSTYPE" == "darwin"* ]]; then # macOS version of sed needs an empty string for -i # Update cua-agent with all extras sed -i '' "s/\"cua-agent\[all\]>=.*,<.*\"/\"cua-agent[all]>=$LATEST_AGENT,<$NEXT_AGENT_MAJOR.0.0\"/" pyproject.toml sed -i '' "s/\"cua-computer>=.*,<.*\"/\"cua-computer>=$LATEST_COMPUTER,<$NEXT_COMPUTER_MAJOR.0.0\"/" pyproject.toml else # Linux version sed -i "s/\"cua-agent\[all\]>=.*,<.*\"/\"cua-agent[all]>=$LATEST_AGENT,<$NEXT_AGENT_MAJOR.0.0\"/" pyproject.toml sed -i "s/\"cua-computer>=.*,<.*\"/\"cua-computer>=$LATEST_COMPUTER,<$NEXT_COMPUTER_MAJOR.0.0\"/" pyproject.toml fi # Display the updated dependencies echo "Updated dependencies in pyproject.toml:" grep -E "cua-agent|cua-computer" pyproject.toml publish: needs: prepare uses: ./.github/workflows/reusable-publish.yml with: package_name: "mcp-server" package_dir: "libs/mcp-server" version: ${{ needs.prepare.outputs.version }} is_lume_package: false base_package_name: "cua-mcp-server" secrets: PYPI_TOKEN: ${{ secrets.PYPI_TOKEN }} set-env-variables: needs: [prepare, publish] runs-on: macos-latest steps: - name: Set environment variables for use in other jobs run: | echo "AGENT_VERSION=${{ needs.prepare.outputs.agent_version }}" >> $GITHUB_ENV echo "COMPUTER_VERSION=${{ needs.prepare.outputs.computer_version }}" >> $GITHUB_ENV ``` ## /.github/workflows/publish-pylume.yml ```yml path="/.github/workflows/publish-pylume.yml" name: Publish Pylume Package on: push: tags: - 'pylume-v*' workflow_dispatch: inputs: version: description: 'Version to publish (without v prefix)' required: true default: '0.1.0' workflow_call: inputs: version: description: 'Version to publish' required: true type: string outputs: version: description: "The version that was published" value: ${{ jobs.determine-version.outputs.version }} # Adding permissions at workflow level permissions: 
contents: write jobs: determine-version: runs-on: macos-latest outputs: version: ${{ steps.get-version.outputs.version }} steps: - uses: actions/checkout@v4 - name: Determine version id: get-version run: | if [ "${{ github.event_name }}" == "push" ]; then # Extract version from tag (for package-specific tags) if [[ "${{ github.ref }}" =~ ^refs/tags/pylume-v([0-9]+\.[0-9]+\.[0-9]+) ]]; then VERSION=${BASH_REMATCH[1]} else echo "Invalid tag format for pylume" exit 1 fi elif [ "${{ github.event_name }}" == "workflow_dispatch" ]; then # Use version from workflow dispatch VERSION=${{ github.event.inputs.version }} else # Use version from workflow_call VERSION=${{ inputs.version }} fi echo "VERSION=$VERSION" echo "version=$VERSION" >> $GITHUB_OUTPUT validate-version: runs-on: macos-latest needs: determine-version steps: - uses: actions/checkout@v4 - name: Validate version id: validate-version run: | CODE_VERSION=$(grep '__version__' libs/pylume/pylume/__init__.py | cut -d'"' -f2) if [ "${{ needs.determine-version.outputs.version }}" != "$CODE_VERSION" ]; then echo "Version mismatch: expected $CODE_VERSION, got ${{ needs.determine-version.outputs.version }}" exit 1 fi echo "Version validated: $CODE_VERSION" publish: needs: determine-version uses: ./.github/workflows/reusable-publish.yml with: package_name: "pylume" package_dir: "libs/pylume" version: ${{ needs.determine-version.outputs.version }} is_lume_package: true base_package_name: "pylume" secrets: PYPI_TOKEN: ${{ secrets.PYPI_TOKEN }} ``` ## /.github/workflows/publish-som.yml ```yml path="/.github/workflows/publish-som.yml" name: Publish SOM Package on: push: tags: - 'som-v*' workflow_dispatch: inputs: version: description: 'Version to publish (without v prefix)' required: true default: '0.1.0' workflow_call: inputs: version: description: 'Version to publish' required: true type: string outputs: version: description: "The version that was published" value: ${{ jobs.determine-version.outputs.version }} # Adding 
permissions at workflow level permissions: contents: write jobs: determine-version: runs-on: macos-latest outputs: version: ${{ steps.get-version.outputs.version }} steps: - uses: actions/checkout@v4 - name: Determine version id: get-version run: | if [ "${{ github.event_name }}" == "push" ]; then # Extract version from tag (for package-specific tags) if [[ "${{ github.ref }}" =~ ^refs/tags/som-v([0-9]+\.[0-9]+\.[0-9]+) ]]; then VERSION=${BASH_REMATCH[1]} else echo "Invalid tag format for som" exit 1 fi elif [ "${{ github.event_name }}" == "workflow_dispatch" ]; then # Use version from workflow dispatch VERSION=${{ github.event.inputs.version }} else # Use version from workflow_call VERSION=${{ inputs.version }} fi echo "VERSION=$VERSION" echo "version=$VERSION" >> $GITHUB_OUTPUT publish: needs: determine-version uses: ./.github/workflows/reusable-publish.yml with: package_name: "som" package_dir: "libs/som" version: ${{ needs.determine-version.outputs.version }} is_lume_package: false base_package_name: "cua-som" secrets: PYPI_TOKEN: ${{ secrets.PYPI_TOKEN }} ``` ## /.github/workflows/reusable-publish.yml ```yml path="/.github/workflows/reusable-publish.yml" name: Reusable Package Publish Workflow on: workflow_call: inputs: package_name: description: 'Name of the package (e.g. pylume, computer, agent)' required: true type: string package_dir: description: 'Directory containing the package relative to workspace root (e.g. libs/pylume)' required: true type: string version: description: 'Version to publish' required: true type: string is_lume_package: description: 'Whether this package includes the lume binary' required: false type: boolean default: false base_package_name: description: 'PyPI package name (e.g. 
pylume, cua-agent)' required: true type: string make_latest: description: 'Whether to mark this release as latest (should only be true for lume)' required: false type: boolean default: false secrets: PYPI_TOKEN: required: true outputs: version: description: "The version that was published" value: ${{ jobs.build-and-publish.outputs.version }} jobs: build-and-publish: runs-on: macos-latest permissions: contents: write # This permission is needed for creating releases outputs: version: ${{ steps.set-version.outputs.version }} steps: - uses: actions/checkout@v4 with: fetch-depth: 0 # Full history for release creation - name: Set up Python uses: actions/setup-python@v4 with: python-version: '3.10' - name: Create root pdm.lock file run: | # Create an empty pdm.lock file in the root touch pdm.lock - name: Install PDM uses: pdm-project/setup-pdm@v3 with: python-version: '3.10' cache: true - name: Set version id: set-version run: | echo "VERSION=${{ inputs.version }}" >> $GITHUB_ENV echo "version=${{ inputs.version }}" >> $GITHUB_OUTPUT - name: Initialize PDM in package directory run: | # Make sure we're working with a properly initialized PDM project cd ${{ inputs.package_dir }} # Create pdm.lock if it doesn't exist if [ ! -f "pdm.lock" ]; then echo "No pdm.lock found, initializing PDM project..." 
pdm lock fi - name: Set version in package run: | cd ${{ inputs.package_dir }} # Replace pdm bump with direct edit of pyproject.toml if [[ "$OSTYPE" == "darwin"* ]]; then # macOS version of sed needs an empty string for -i sed -i '' "s/version = \".*\"/version = \"$VERSION\"/" pyproject.toml else # Linux version sed -i "s/version = \".*\"/version = \"$VERSION\"/" pyproject.toml fi # Verify version was updated echo "Updated version in pyproject.toml:" grep "version =" pyproject.toml # Conditional step for lume binary download (only for pylume package) - name: Download and setup lume binary if: inputs.is_lume_package run: | # Create a temporary directory for extraction mkdir -p temp_lume # Download the latest lume release directly echo "Downloading latest lume version..." curl -sL "https://github.com/trycua/lume/releases/latest/download/lume.tar.gz" -o temp_lume/lume.tar.gz # Extract the tar file (ignore ownership and suppress warnings) cd temp_lume && tar --no-same-owner -xzf lume.tar.gz # Make the binary executable chmod +x lume # Copy the lume binary to the correct location in the pylume package mkdir -p "${GITHUB_WORKSPACE}/${{ inputs.package_dir }}/pylume" cp lume "${GITHUB_WORKSPACE}/${{ inputs.package_dir }}/pylume/lume" # Verify the binary exists and is executable test -x "${GITHUB_WORKSPACE}/${{ inputs.package_dir }}/pylume/lume" || { echo "lume binary not found or not executable"; exit 1; } # Get the version from the downloaded binary for reference LUME_VERSION=$(./lume --version | grep -oE '[0-9]+\.[0-9]+\.[0-9]+' || echo "unknown") echo "Using lume version: $LUME_VERSION" # Cleanup cd "${GITHUB_WORKSPACE}" && rm -rf temp_lume # Save the lume version for reference echo "LUME_VERSION=${LUME_VERSION}" >> $GITHUB_ENV - name: Build and publish env: PYPI_TOKEN: ${{ secrets.PYPI_TOKEN }} run: | cd ${{ inputs.package_dir }} # Build with PDM pdm build # For pylume package, verify the binary is in the wheel if [ "${{ inputs.is_lume_package }}" = "true" ]; then 
python -m pip install wheel wheel unpack dist/*.whl --dest temp_wheel echo "Listing contents of wheel directory:" find temp_wheel -type f test -f temp_wheel/pylume-*/pylume/lume || { echo "lume binary not found in wheel"; exit 1; } rm -rf temp_wheel echo "Publishing ${{ inputs.base_package_name }} ${VERSION} with lume ${LUME_VERSION}" else echo "Publishing ${{ inputs.base_package_name }} ${VERSION}" fi # Install and use twine directly instead of PDM publish echo "Installing twine for direct publishing..." pip install twine echo "Publishing to PyPI using twine..." TWINE_USERNAME="__token__" TWINE_PASSWORD="$PYPI_TOKEN" python -m twine upload dist/* # Save the wheel file path for the release WHEEL_FILE=$(ls dist/*.whl | head -1) echo "WHEEL_FILE=${WHEEL_FILE}" >> $GITHUB_ENV - name: Prepare Simple Release Notes if: startsWith(github.ref, 'refs/tags/') run: | # Create release notes based on package type echo "# ${{ inputs.base_package_name }} v${VERSION}" > release_notes.md echo "" >> release_notes.md if [ "${{ inputs.package_name }}" = "pylume" ]; then echo "## Python SDK for lume - run macOS and Linux VMs on Apple Silicon" >> release_notes.md echo "" >> release_notes.md echo "This package provides Python bindings for the lume virtualization tool." 
>> release_notes.md echo "" >> release_notes.md echo "## Dependencies" >> release_notes.md echo "* lume binary: v${LUME_VERSION}" >> release_notes.md elif [ "${{ inputs.package_name }}" = "computer" ]; then echo "## Computer control library for the Computer Universal Automation (CUA) project" >> release_notes.md echo "" >> release_notes.md echo "## Dependencies" >> release_notes.md echo "* pylume: ${PYLUME_VERSION:-latest}" >> release_notes.md elif [ "${{ inputs.package_name }}" = "agent" ]; then echo "## Dependencies" >> release_notes.md echo "* cua-computer: ${COMPUTER_VERSION:-latest}" >> release_notes.md echo "* cua-som: ${SOM_VERSION:-latest}" >> release_notes.md echo "" >> release_notes.md echo "## Installation Options" >> release_notes.md echo "" >> release_notes.md echo "### Basic installation with Anthropic" >> release_notes.md echo '\`\`\`bash' >> release_notes.md echo "pip install cua-agent[anthropic]==${VERSION}" >> release_notes.md echo '\`\`\`' >> release_notes.md echo "" >> release_notes.md echo "### With SOM (recommended)" >> release_notes.md echo '\`\`\`bash' >> release_notes.md echo "pip install cua-agent[som]==${VERSION}" >> release_notes.md echo '\`\`\`' >> release_notes.md echo "" >> release_notes.md echo "### All features" >> release_notes.md echo '\`\`\`bash' >> release_notes.md echo "pip install cua-agent[all]==${VERSION}" >> release_notes.md echo '\`\`\`' >> release_notes.md elif [ "${{ inputs.package_name }}" = "som" ]; then echo "## Computer Vision and OCR library for detecting and analyzing UI elements" >> release_notes.md echo "" >> release_notes.md echo "This package provides enhanced UI understanding capabilities through computer vision and OCR." >> release_notes.md elif [ "${{ inputs.package_name }}" = "computer-server" ]; then echo "## Computer Server for the Computer Universal Automation (CUA) project" >> release_notes.md echo "" >> release_notes.md echo "A FastAPI-based server implementation for computer control." 
>> release_notes.md echo "" >> release_notes.md echo "## Dependencies" >> release_notes.md echo "* cua-computer: ${COMPUTER_VERSION:-latest}" >> release_notes.md echo "" >> release_notes.md echo "## Usage" >> release_notes.md echo '\`\`\`bash' >> release_notes.md echo "# Run the server" >> release_notes.md echo "cua-computer-server" >> release_notes.md echo '\`\`\`' >> release_notes.md elif [ "${{ inputs.package_name }}" = "mcp-server" ]; then echo "## MCP Server for the Computer-Use Agent (CUA)" >> release_notes.md echo "" >> release_notes.md echo "This package provides MCP (Model Context Protocol) integration for CUA agents, allowing them to be used with Claude Desktop, Cursor, and other MCP clients." >> release_notes.md echo "" >> release_notes.md echo "## Dependencies" >> release_notes.md echo "* cua-computer: ${COMPUTER_VERSION:-latest}" >> release_notes.md echo "* cua-agent: ${AGENT_VERSION:-latest}" >> release_notes.md echo "" >> release_notes.md echo "## Usage" >> release_notes.md echo '\`\`\`bash' >> release_notes.md echo "# Run the MCP server directly" >> release_notes.md echo "cua-mcp-server" >> release_notes.md echo '\`\`\`' >> release_notes.md echo "" >> release_notes.md echo "## Claude Desktop Integration" >> release_notes.md echo "Add to your Claude Desktop configuration (~/.config/claude-desktop/claude_desktop_config.json or OS-specific location):" >> release_notes.md echo '\`\`\`json' >> release_notes.md echo '"mcpServers": {' >> release_notes.md echo ' "cua-agent": {' >> release_notes.md echo ' "command": "cua-mcp-server",' >> release_notes.md echo ' "args": [],' >> release_notes.md echo ' "env": {' >> release_notes.md echo ' "CUA_AGENT_LOOP": "OMNI",' >> release_notes.md echo ' "CUA_MODEL_PROVIDER": "ANTHROPIC",' >> release_notes.md echo ' "CUA_MODEL_NAME": "claude-3-opus-20240229",' >> release_notes.md echo ' "ANTHROPIC_API_KEY": "your-api-key",' >> release_notes.md echo ' "PYTHONIOENCODING": "utf-8"' >> release_notes.md echo ' }' >> 
release_notes.md echo ' }' >> release_notes.md echo '}' >> release_notes.md echo '\`\`\`' >> release_notes.md fi # Add installation section if not agent (which has its own installation section) if [ "${{ inputs.package_name }}" != "agent" ]; then echo "" >> release_notes.md echo "## Installation" >> release_notes.md echo '\`\`\`bash' >> release_notes.md echo "pip install ${{ inputs.base_package_name }}==${VERSION}" >> release_notes.md echo '\`\`\`' >> release_notes.md fi echo "Release notes created:" cat release_notes.md - name: Create GitHub Release uses: softprops/action-gh-release@v2 if: startsWith(github.ref, 'refs/tags/') with: name: "${{ inputs.base_package_name }} v${{ env.VERSION }}" body_path: release_notes.md files: ${{ inputs.package_dir }}/${{ env.WHEEL_FILE }} draft: false prerelease: false make_latest: ${{ inputs.package_name == 'lume' }} env: GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} ``` ## /.gitignore ```gitignore path="/.gitignore" # Byte-compiled / optimized / DLL files __pycache__/ *.py[cod] *$py.class # C extensions *.so # Distribution / packaging .Python build/ !libs/lume/scripts/build/ develop-eggs/ dist/ downloads/ eggs/ .eggs/ lib/ lib64/ parts/ sdist/ var/ wheels/ share/python-wheels/ *.egg-info/ .installed.cfg *.egg MANIFEST # PyInstaller # Usually these files are written by a python script from a template # before PyInstaller builds the exe, so as to inject date/other infos into it. 
*.manifest *.spec # Installer logs pip-log.txt pip-delete-this-directory.txt # Unit test / coverage reports htmlcov/ .tox/ .nox/ .coverage .coverage.* .cache nosetests.xml coverage.xml *.cover *.py,cover .hypothesis/ .pytest_cache/ cover/ # Translations *.mo *.pot # Django stuff: *.log local_settings.py db.sqlite3 db.sqlite3-journal # Flask stuff: instance/ .webassets-cache # Scrapy stuff: .scrapy # Sphinx documentation docs/_build/ # PyBuilder .pybuilder/ target/ # Jupyter Notebook .ipynb_checkpoints # IPython profile_default/ ipython_config.py .pdm.toml .pdm-python .pdm-build/ # PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm __pypackages__/ # Celery stuff celerybeat-schedule celerybeat.pid # SageMath parsed files *.sage.py # Environments .env .venv env/ venv/ ENV/ env.bak/ venv.bak/ # Spyder project settings .spyderproject .spyproject # Rope project settings .ropeproject # mkdocs documentation /site # mypy .mypy_cache/ .dmypy.json dmypy.json # Scripts server/scripts/ # Pyre type checker .pyre/ # pytype static type analyzer .pytype/ # Cython debug symbols cython_debug/ # Ruff stuff: .ruff_cache/ # PyPI configuration file .pypirc # Conda .conda/ # Local environment .env.local # macOS DS_Store .DS_Store weights/ weights/icon_detect/ weights/icon_detect/model.pt weights/icon_detect/model.pt.zip weights/icon_detect/model.pt.zip.part* libs/omniparser/weights/icon_detect/model.pt # Example test data and output examples/test_data/ examples/output/ /screenshots/ /experiments/ /logs/ # Xcode # # gitignore contributors: remember to update Global/Xcode.gitignore, Objective-C.gitignore & Swift.gitignore ## User settings xcuserdata/ ## Obj-C/Swift specific *.hmap ## App packaging *.ipa *.dSYM.zip *.dSYM ## Playgrounds timeline.xctimeline playground.xcworkspace # Swift Package Manager # # Add this line if you want to avoid checking in source code from Swift Package Manager dependencies. 
# Packages/ # Package.pins # Package.resolved # *.xcodeproj # # Xcode automatically generates this directory with a .xcworkspacedata file and xcuserdata # hence it is not needed unless you have added a package configuration file to your project .swiftpm/ .build/ # CocoaPods # # We recommend against adding the Pods directory to your .gitignore. However # you should judge for yourself, the pros and cons are mentioned at: # https://guides.cocoapods.org/using/using-cocoapods.html#should-i-check-the-pods-directory-into-source-control # # Pods/ # # Add this line if you want to avoid checking in source code from the Xcode workspace # *.xcworkspace # Carthage # # Add this line if you want to avoid checking in source code from Carthage dependencies. # Carthage/Checkouts Carthage/Build/ # fastlane # # It is recommended to not store the screenshots in the git repo. # Instead, use fastlane to re-generate the screenshots whenever they are needed. # For more information about the recommended setup visit: # https://docs.fastlane.tools/best-practices/source-control/#source-control fastlane/report.xml fastlane/Preview.html fastlane/screenshots/**/*.png fastlane/test_output # Ignore folder ignore # .release .release/ # Shared folder shared # Trajectories trajectories/ # Installation ID Storage .storage/ # Gradio settings .gradio_settings.json ``` ## /.vscode/launch.json ```json path="/.vscode/launch.json" { "configurations": [ { "name": "Run Computer Examples", "type": "debugpy", "request": "launch", "program": "examples/computer_examples.py", "console": "integratedTerminal", "justMyCode": true, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": "${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer:${workspaceFolder:cua-root}/libs/agent:${workspaceFolder:cua-root}/libs/som:${workspaceFolder:cua-root}/libs/pylume" } }, { "name": "Run Agent Examples", "type": "debugpy", "request": "launch", 
"program": "examples/agent_examples.py", "console": "integratedTerminal", "justMyCode": false, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": "${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer:${workspaceFolder:cua-root}/libs/agent:${workspaceFolder:cua-root}/libs/som:${workspaceFolder:cua-root}/libs/pylume" } }, { "name": "Run Agent UI Examples", "type": "debugpy", "request": "launch", "program": "examples/agent_ui_examples.py", "console": "integratedTerminal", "justMyCode": false, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": "${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer:${workspaceFolder:cua-root}/libs/agent:${workspaceFolder:cua-root}/libs/som:${workspaceFolder:cua-root}/libs/pylume" } }, { "name": "Run PyLume Examples", "type": "debugpy", "request": "launch", "program": "examples/pylume_examples.py", "console": "integratedTerminal", "justMyCode": true, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": "${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer:${workspaceFolder:cua-root}/libs/agent:${workspaceFolder:cua-root}/libs/som:${workspaceFolder:cua-root}/libs/pylume" } }, { "name": "SOM: Run Experiments (No OCR)", "type": "debugpy", "request": "launch", "program": "examples/som_examples.py", "args": [ "examples/test_data", "--output-dir", "examples/output", "--ocr", "none", "--mode", "experiment" ], "console": "integratedTerminal", "justMyCode": false, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": 
"${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer:${workspaceFolder:cua-root}/libs/agent:${workspaceFolder:cua-root}/libs/som:${workspaceFolder:cua-root}/libs/pylume" } }, { "name": "SOM: Run Experiments (EasyOCR)", "type": "debugpy", "request": "launch", "program": "examples/som_examples.py", "args": [ "examples/test_data", "--output-dir", "examples/output", "--ocr", "easyocr", "--mode", "experiment" ], "console": "integratedTerminal", "justMyCode": false, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": "${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer:${workspaceFolder:cua-root}/libs/agent:${workspaceFolder:cua-root}/libs/som:${workspaceFolder:cua-root}/libs/pylume" } }, { "name": "Run Computer Server", "type": "debugpy", "request": "launch", "program": "${workspaceFolder}/libs/computer-server/run_server.py", "console": "integratedTerminal", "justMyCode": true, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": "${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer:${workspaceFolder:cua-root}/libs/agent:${workspaceFolder:cua-root}/libs/som:${workspaceFolder:cua-root}/libs/pylume" } }, { "name": "Run Computer Server with Args", "type": "debugpy", "request": "launch", "program": "${workspaceFolder}/libs/computer-server/run_server.py", "args": [ "--host", "0.0.0.0", "--port", "8000", "--log-level", "debug" ], "console": "integratedTerminal", "justMyCode": false, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": "${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer-server" } }, { "type": "lldb", "request": "launch", "args": [], "cwd": "${workspaceFolder:cua-root}/libs/lume", "name": "Debug lume (libs/lume)", "program": 
"${workspaceFolder:cua-root}/libs/lume/.build/debug/lume", "preLaunchTask": "swift: Build Debug lume (libs/lume)" }, { "type": "lldb", "request": "launch", "args": [], "cwd": "${workspaceFolder:cua-root}/libs/lume", "name": "Release lume (libs/lume)", "program": "${workspaceFolder:cua-root}/libs/lume/.build/release/lume", "preLaunchTask": "swift: Build Release lume (libs/lume)" } ] } ``` ## /.vscode/lume.code-workspace ```code-workspace path="/.vscode/lume.code-workspace" { "folders": [ { "name": "lume", "path": "../libs/lume" } ], "settings": { "files.exclude": { "**/.git": true, "**/.svn": true, "**/.hg": true, "**/CVS": true, "**/.DS_Store": true }, "swift.path.swift_driver_bin": "/usr/bin/swift", "swift.enableLanguageServer": true, "files.associations": { "*.swift": "swift" }, "[swift]": { "editor.formatOnSave": true, "editor.detectIndentation": true, "editor.tabSize": 4 }, "swift.path": "/Applications/Xcode.app/Contents/Developer/Toolchains/XcodeDefault.xctoolchain/usr/bin", "swift.swiftEnvironmentVariables": { "DEVELOPER_DIR": "/Applications/Xcode.app" }, "lldb.library": "/Applications/Xcode.app/Contents/SharedFrameworks/LLDB.framework/Versions/A/LLDB", "lldb.launch.expressions": "native" }, "tasks": { "version": "2.0.0", "tasks": [ { "label": "build-debug", "type": "shell", "command": "${workspaceFolder:lume}/scripts/build/build-debug.sh", "options": { "cwd": "${workspaceFolder:lume}" }, "group": { "kind": "build", "isDefault": true }, "presentation": { "reveal": "silent", "panel": "shared" }, "problemMatcher": [] }, { "label": "swift: Build Debug lume", "type": "shell", "command": "${workspaceFolder:lume}/scripts/build/build-debug.sh", "options": { "cwd": "${workspaceFolder:lume}" }, "group": "build", "presentation": { "reveal": "silent", "panel": "shared" }, "problemMatcher": [] } ] }, "launch": { "configurations": [ { "type": "bashdb", "request": "launch", "name": "Bash-Debug (select script from list of sh files)", "cwd": "${workspaceFolder}", "program": 
"${command:SelectScriptName}", "pathBash": "/opt/homebrew/bin/bash", "args": [] }, { "type": "lldb", "request": "launch", "sourceLanguages": [ "swift" ], "args": [ "serve" ], "cwd": "${workspaceFolder:lume}", "name": "Debug lume serve", "program": "${workspaceFolder:lume}/.build/debug/lume", "preLaunchTask": "build-debug" }, { "type": "lldb", "request": "launch", "sourceLanguages": [ "swift" ], "args": [ "create", "macos-vm", "--cpu", "4", "--memory", "4GB", "--disk-size", "40GB", "--ipsw", "/Users//Downloads/UniversalMac_15.2_24C101_Restore.ipsw" ], "cwd": "${workspaceFolder:lume}", "name": "Debug lume create --os macos --ipsw 'path/to/ipsw' (macos)", "program": "${workspaceFolder:lume}/.build/debug/lume", "preLaunchTask": "build-debug" }, { "type": "lldb", "request": "launch", "sourceLanguages": [ "swift" ], "args": [ "create", "macos-vm", "--cpu", "4", "--memory", "4GB", "--disk-size", "20GB", "--ipsw", "latest" ], "cwd": "${workspaceFolder:lume}", "name": "Debug lume create --os macos --ipsw latest (macos)", "program": "${workspaceFolder:lume}/.build/debug/lume", "preLaunchTask": "build-debug" }, { "type": "lldb", "request": "launch", "sourceLanguages": [ "swift" ], "args": [ "create", "linux-vm", "--os", "linux", "--cpu", "4", "--memory", "4GB", "--disk-size", "20GB" ], "cwd": "${workspaceFolder:lume}", "name": "Debug lume create --os linux (linux)", "program": "${workspaceFolder:lume}/.build/debug/lume", "preLaunchTask": "build-debug" }, { "type": "lldb", "request": "launch", "sourceLanguages": [ "swift" ], "args": [ "pull", "macos-sequoia-vanilla:15.2", "--name", "macos-vm-cloned" ], "cwd": "${workspaceFolder:lume}", "name": "Debug lume pull (macos)", "program": "${workspaceFolder:lume}/.build/debug/lume", "preLaunchTask": "build-debug" }, { "type": "lldb", "request": "launch", "sourceLanguages": [ "swift" ], "args": [ "run", "macos-vm", "--shared-dir", "/Users//repos/trycua/lume/shared_folder:rw", "--start-vnc" ], "cwd": "${workspaceFolder:lume}", "name": 
"Debug lume run (macos)", "program": "${workspaceFolder:lume}/.build/debug/lume", "preLaunchTask": "build-debug" }, { "type": "lldb", "request": "launch", "sourceLanguages": [ "swift" ], "args": [ "run", "linux-vm", "--start-vnc", "--mount", "/Users//Downloads/ubuntu-24.04.1-live-server-arm64.iso" ], "cwd": "${workspaceFolder:lume}", "name": "Debug lume run with setup mount (linux)", "program": "${workspaceFolder:lume}/.build/debug/lume", "preLaunchTask": "build-debug" }, { "type": "lldb", "request": "launch", "sourceLanguages": [ "swift" ], "args": [ "run", "linux-vm", "--start-vnc" ], "cwd": "${workspaceFolder:lume}", "name": "Debug lume run (linux)", "program": "${workspaceFolder:lume}/.build/debug/lume", "preLaunchTask": "build-debug" }, { "type": "lldb", "request": "launch", "sourceLanguages": [ "swift" ], "args": [ "get", "macos-vm" ], "cwd": "${workspaceFolder:lume}", "name": "Debug lume get (macos)", "program": "${workspaceFolder:lume}/.build/debug/lume", "preLaunchTask": "build-debug" }, { "type": "lldb", "request": "launch", "sourceLanguages": [ "swift" ], "args": [ "ls" ], "cwd": "${workspaceFolder:lume}", "name": "Debug lume ls", "program": "${workspaceFolder:lume}/.build/debug/lume", "preLaunchTask": "build-debug" }, { "type": "lldb", "request": "launch", "sourceLanguages": [ "swift" ], "args": [ "images" ], "cwd": "${workspaceFolder:lume}", "name": "Debug lume images", "program": "${workspaceFolder:lume}/.build/debug/lume", "preLaunchTask": "build-debug" }, { "type": "lldb", "request": "launch", "sourceLanguages": [ "swift" ], "args": [ "stop", "macos-vm" ], "cwd": "${workspaceFolder:lume}", "name": "Debug lume stop (macos)", "program": "${workspaceFolder:lume}/.build/debug/lume", "preLaunchTask": "build-debug" }, { "type": "lldb", "request": "launch", "args": [], "cwd": "${workspaceFolder:lume}", "name": "Debug lume", "program": "${workspaceFolder:lume}/.build/debug/lume", "preLaunchTask": "swift: Build Debug lume" }, { "type": "lldb", "request": 
"launch", "args": [], "cwd": "${workspaceFolder:lume}", "name": "Release lume", "program": "${workspaceFolder:lume}/.build/release/lume", "preLaunchTask": "swift: Build Release lume" }, { "type": "bashdb", "request": "launch", "name": "Bash-Debug (select script)", "cwd": "${workspaceFolder:lume}", "program": "${command:SelectScriptName}", "pathBash": "/opt/homebrew/bin/bash", "args": [] } ] } } ``` ## /.vscode/py.code-workspace ```code-workspace path="/.vscode/py.code-workspace" { "folders": [ { "name": "cua-root", "path": ".." }, { "name": "computer", "path": "../libs/computer" }, { "name": "agent", "path": "../libs/agent" }, { "name": "som", "path": "../libs/som" }, { "name": "computer-server", "path": "../libs/computer-server" }, { "name": "pylume", "path": "../libs/pylume" }, { "name": "core", "path": "../libs/core" } ], "settings": { "files.exclude": { "**/.git": true, "**/.svn": true, "**/.hg": true, "**/CVS": true, "**/.DS_Store": true, "**/__pycache__": true, "**/.pytest_cache": true, "**/*.pyc": true }, "python.testing.pytestEnabled": true, "python.testing.unittestEnabled": false, "python.testing.nosetestsEnabled": false, "python.testing.pytestArgs": [ "libs" ], "python.analysis.extraPaths": [ "${workspaceFolder:cua-root}/libs/core", "${workspaceFolder:cua-root}/libs/computer", "${workspaceFolder:cua-root}/libs/agent", "${workspaceFolder:cua-root}/libs/som", "${workspaceFolder:cua-root}/libs/pylume", "${workspaceFolder:cua-root}/.vscode/typings" ], "python.envFile": "${workspaceFolder:cua-root}/.env", "python.defaultInterpreterPath": "${workspaceFolder:cua-root}/.venv/bin/python", "python.analysis.diagnosticMode": "workspace", "python.analysis.typeCheckingMode": "basic", "python.analysis.autoSearchPaths": true, "python.analysis.stubPath": "${workspaceFolder:cua-root}/.vscode/typings", "python.analysis.indexing": false, "python.analysis.exclude": [ "**/node_modules/**", "**/__pycache__/**", "**/.*/**", "**/venv/**", "**/.venv/**", "**/dist/**", 
"**/build/**", ".pdm-build/**", "**/.git/**", "examples/**", "notebooks/**", "logs/**", "screenshots/**" ], "python.analysis.packageIndexDepths": [ { "name": "computer", "depth": 2 }, { "name": "agent", "depth": 2 }, { "name": "som", "depth": 2 }, { "name": "pylume", "depth": 2 }, { "name": "core", "depth": 2 } ], "python.autoComplete.extraPaths": [ "${workspaceFolder:cua-root}/libs/core", "${workspaceFolder:cua-root}/libs/computer", "${workspaceFolder:cua-root}/libs/agent", "${workspaceFolder:cua-root}/libs/som", "${workspaceFolder:cua-root}/libs/pylume" ], "python.languageServer": "Pylance", "[python]": { "editor.formatOnSave": true, "editor.defaultFormatter": "ms-python.black-formatter", "editor.codeActionsOnSave": { "source.organizeImports": "explicit" } }, "files.associations": { "examples/computer_examples.py": "python", "examples/agent_examples.py": "python" }, "python.interpreterPaths": { "examples/computer_examples.py": "${workspaceFolder}/libs/computer/.venv/bin/python", "examples/agent_examples.py": "${workspaceFolder}/libs/agent/.venv/bin/python" } }, "tasks": { "version": "2.0.0", "tasks": [ { "label": "Build Dependencies", "type": "shell", "command": "${workspaceFolder}/scripts/build.sh", "presentation": { "reveal": "always", "panel": "new", "clear": true }, "group": { "kind": "build", "isDefault": true }, "options": { "shell": { "executable": "/bin/bash", "args": ["-l", "-c"] } }, "problemMatcher": [] } ] }, "launch": { "version": "0.2.0", "configurations": [ { "name": "Run Computer Examples", "type": "debugpy", "request": "launch", "program": "examples/computer_examples.py", "console": "integratedTerminal", "justMyCode": true, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": "${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer:${workspaceFolder:cua-root}/libs/agent:${workspaceFolder:cua-root}/libs/som:${workspaceFolder:cua-root}/libs/pylume" } }, { 
"name": "Run Agent Examples", "type": "debugpy", "request": "launch", "program": "examples/agent_examples.py", "console": "integratedTerminal", "justMyCode": false, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": "${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer:${workspaceFolder:cua-root}/libs/agent:${workspaceFolder:cua-root}/libs/som:${workspaceFolder:cua-root}/libs/pylume" } }, { "name": "Run PyLume Examples", "type": "debugpy", "request": "launch", "program": "examples/pylume_examples.py", "console": "integratedTerminal", "justMyCode": true, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": "${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer:${workspaceFolder:cua-root}/libs/agent:${workspaceFolder:cua-root}/libs/som:${workspaceFolder:cua-root}/libs/pylume" } }, { "name": "SOM: Run Experiments (No OCR)", "type": "debugpy", "request": "launch", "program": "examples/som_examples.py", "args": [ "examples/test_data", "--output-dir", "examples/output", "--ocr", "none", "--mode", "experiment" ], "console": "integratedTerminal", "justMyCode": false, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": "${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer:${workspaceFolder:cua-root}/libs/agent:${workspaceFolder:cua-root}/libs/som:${workspaceFolder:cua-root}/libs/pylume" } }, { "name": "SOM: Run Experiments (EasyOCR)", "type": "debugpy", "request": "launch", "program": "examples/som_examples.py", "args": [ "examples/test_data", "--output-dir", "examples/output", "--ocr", "easyocr", "--mode", "experiment" ], "console": "integratedTerminal", "justMyCode": false, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": 
"${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer:${workspaceFolder:cua-root}/libs/agent:${workspaceFolder:cua-root}/libs/som:${workspaceFolder:cua-root}/libs/pylume" } }, { "name": "Run Computer Server", "type": "debugpy", "request": "launch", "program": "${workspaceFolder}/libs/computer-server/run_server.py", "console": "integratedTerminal", "justMyCode": true, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": "${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer:${workspaceFolder:cua-root}/libs/agent:${workspaceFolder:cua-root}/libs/som:${workspaceFolder:cua-root}/libs/pylume" } }, { "name": "Run Computer Server with Args", "type": "debugpy", "request": "launch", "program": "${workspaceFolder}/libs/computer-server/run_server.py", "args": [ "--host", "0.0.0.0", "--port", "8000", "--log-level", "debug" ], "console": "integratedTerminal", "justMyCode": false, "python": "${workspaceFolder:cua-root}/.venv/bin/python", "cwd": "${workspaceFolder:cua-root}", "env": { "PYTHONPATH": "${workspaceFolder:cua-root}/libs/core:${workspaceFolder:cua-root}/libs/computer-server" } } ] }, "compounds": [ { "name": "Run Computer Examples + Server", "configurations": ["Run Computer Examples", "Run Computer Server"], "stopAll": true, "presentation": { "group": "Computer", "order": 1 } }, { "name": "Run Server with Keep-Alive Client", "configurations": ["Run Computer Server", "Test Server Connection (Keep Alive)"], "stopAll": true, "presentation": { "group": "Computer", "order": 2 } } ], "inputs": [ { "id": "imagePath", "type": "promptString", "description": "Path to the image file or directory for icon detection", "default": "${workspaceFolder}/examples/test_data" } ] } ``` ## /CONTRIBUTING.md # Contributing to cua We deeply appreciate your interest in contributing to cua! 
Whether you're reporting bugs, suggesting enhancements, improving docs, or submitting pull requests, your contributions help improve the project for everyone. ## Reporting Bugs If you've encountered a bug in the project, we encourage you to report it. Please follow these steps: 1. **Check the Issue Tracker**: Before submitting a new bug report, please check our issue tracker to see if the bug has already been reported. 2. **Create a New Issue**: If the bug hasn't been reported, create a new issue with: - A clear title and detailed description - Steps to reproduce the issue - Expected vs actual behavior - Your environment (macOS version, lume version) - Any relevant logs or error messages 3. **Label Your Issue**: Label your issue as a `bug` to help maintainers identify it quickly. ## Suggesting Enhancements We're always looking for suggestions to make lume better. If you have an idea: 1. **Check Existing Issues**: See if someone else has already suggested something similar. 2. **Create a New Issue**: If your enhancement is new, create an issue describing: - The problem your enhancement solves - How your enhancement would work - Any potential implementation details - Why this enhancement would benefit lume users ## Code Formatting We follow strict code formatting guidelines to ensure consistency across the codebase. Before submitting any code: 1. **Review Our Format Guide**: Please review our [Code Formatting Standards](docs/Developer-Guide.md#code-formatting-standards) section in the Getting Started guide. 2. **Configure Your IDE**: We recommend using the workspace settings provided in `.vscode/` for automatic formatting. 3. **Run Formatting Tools**: Always run the formatting tools before submitting a PR: ```bash # For Python code pdm run black . pdm run ruff check --fix . ``` 4. **Validate Your Code**: Ensure your code passes all checks: ```bash pdm run mypy . ``` ## Documentation Documentation improvements are always welcome. 
You can: - Fix typos or unclear explanations - Add examples and use cases - Improve API documentation - Add tutorials or guides For detailed instructions on setting up your development environment and submitting code contributions, please see our [Developer-Guide](./docs/Developer-Guide.md) guide. Feel free to join our [Discord community](https://discord.com/invite/mVnXXpdE85) to discuss ideas or get help with your contributions. ## /Dockerfile ``` path="/Dockerfile" FROM python:3.11-slim # Set environment variables ENV PYTHONUNBUFFERED=1 \ PYTHONDONTWRITEBYTECODE=1 \ PIP_NO_CACHE_DIR=1 \ PIP_DISABLE_PIP_VERSION_CHECK=1 \ PYTHONPATH="/app/libs/core:/app/libs/computer:/app/libs/agent:/app/libs/som:/app/libs/pylume:/app/libs/computer-server" # Install system dependencies for ARM architecture RUN apt-get update && apt-get install -y --no-install-recommends \ git \ build-essential \ libgl1-mesa-glx \ libglib2.0-0 \ libxcb-xinerama0 \ libxkbcommon-x11-0 \ cmake \ pkg-config \ curl \ iputils-ping \ net-tools \ sed \ && apt-get clean \ && rm -rf /var/lib/apt/lists/* # Set working directory WORKDIR /app # Copy the entire project temporarily # We'll mount the real source code over this at runtime COPY . /app/ # Create a simple .env.local file for build.sh RUN echo "PYTHON_BIN=python" > /app/.env.local # Modify build.sh to skip virtual environment creation RUN sed -i 's/python -m venv .venv/echo "Skipping venv creation in Docker"/' /app/scripts/build.sh && \ sed -i 's/source .venv\/bin\/activate/echo "Skipping venv activation in Docker"/' /app/scripts/build.sh && \ sed -i 's/find . 
-type d -name ".venv" -exec rm -rf {} +/echo "Skipping .venv removal in Docker"/' /app/scripts/build.sh && \ chmod +x /app/scripts/build.sh # Run the build script to install dependencies RUN cd /app && ./scripts/build.sh # Clean up the source files now that dependencies are installed # When we run the container, we'll mount the actual source code RUN rm -rf /app/* /app/.??* # Note: This Docker image doesn't contain the lume executable (macOS-specific) # Instead, it relies on connecting to a lume server running on the host machine # via host.docker.internal:3000 # Default command CMD ["bash"] ``` ## /LICENSE.md MIT License Copyright (c) 2025 trycua Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. ## /README.md
Cua logo [![Python](https://img.shields.io/badge/Python-333333?logo=python&logoColor=white&labelColor=333333)](#) [![Swift](https://img.shields.io/badge/Swift-F05138?logo=swift&logoColor=white)](#) [![macOS](https://img.shields.io/badge/macOS-000000?logo=apple&logoColor=F0F0F0)](#) [![Discord](https://img.shields.io/badge/Discord-%235865F2.svg?&logo=discord&logoColor=white)](https://discord.com/invite/mVnXXpdE85)
**TL;DR**: **c/ua** (pronounced "koo-ah", short for Computer-Use Agent) is a framework that enables AI agents to control full operating systems within high-performance, lightweight virtual containers. It delivers up to 97% native speed on Apple Silicon and works with any vision language models. ## What is c/ua? **c/ua** offers two primary capabilities in a single integrated framework: 1. **High-Performance Virtualization** - Create and run macOS/Linux virtual machines on Apple Silicon with near-native performance (up to 97% of native speed) using the **Lume CLI** with `Apple's Virtualization.Framework`. 2. **Computer-Use Interface & Agent** - A framework that allows AI systems to observe and control these virtual environments - interacting with applications, browsing the web, writing code, and performing complex workflows. ## Why Use c/ua? - **Security & Isolation**: Run AI agents in fully isolated virtual environments instead of giving them access to your main system - **Performance**: [Near-native performance](https://browser.geekbench.com/v6/cpu/compare/11283746?baseline=11102709) on Apple Silicon - **Flexibility**: Run macOS or Linux environments with the same framework - **Reproducibility**: Create consistent, deterministic environments for AI agent workflows - **LLM Integration**: Built-in support for connecting to various LLM providers ## System Requirements - Mac with Apple Silicon (M1/M2/M3/M4 series) - macOS 15 (Sequoia) or newer - Python 3.10+ (required for the Computer, Agent, and MCP libraries). We recommend using Conda (or Anaconda) to create an ad hoc Python environment. - Disk space for VM images (30GB+ recommended) ## Quick Start ### Option 1: Lume CLI Only (VM Management) If you only need the virtualization capabilities: ```bash /bin/bash -c "$(curl -fsSL https://raw.githubusercontent.com/trycua/cua/main/libs/lume/scripts/install.sh)" ``` For Lume usage instructions, refer to the [Lume documentation](./libs/lume/README.md). 
### Option 2: Full Computer-Use Agent Capabilities If you want to use AI agents with virtualized environments: 1. Install the Lume CLI: ```bash /bin/bash -c "$(curl -fsSL https://raw.githubusercontent.com/trycua/cua/main/libs/lume/scripts/install.sh)" ``` 2. Pull the latest macOS CUA image: ```bash lume pull macos-sequoia-cua:latest ``` 3. Start Lume daemon service: ```bash lume serve ``` 4. Install the Python libraries: ```bash pip install cua-computer cua-agent[all] ``` 5. Use the libraries in your Python code: ```python from computer import Computer from agent import ComputerAgent, LLM, AgentLoop, LLMProvider async with Computer(verbosity=logging.DEBUG) as macos_computer: agent = ComputerAgent( computer=macos_computer, loop=AgentLoop.OPENAI, # or AgentLoop.ANTHROPIC, or AgentLoop.OMNI model=LLM(provider=LLMProvider.OPENAI) # or LLM(provider=LLMProvider.ANTHROPIC) ) tasks = [ "Look for a repository named trycua/cua on GitHub.", ] for task in tasks: async for result in agent.run(task): print(result) ``` Explore the [Agent Notebook](./notebooks/) for a ready-to-run example. 6. Optionally, you can use the Agent with a Gradio UI: ```python from utils import load_dotenv_files load_dotenv_files() from agent.ui.gradio.app import create_gradio_ui app = create_gradio_ui() app.launch(share=False) ``` ### Option 3: Build from Source (Nightly) If you want to contribute to the project or need the latest nightly features: ```bash # Clone the repository git clone https://github.com/trycua/cua.git cd cua # Open the project in VSCode code ./.vscode/py.code-workspace # Build the project ./scripts/build.sh ``` See our [Developer-Guide](./docs/Developer-Guide.md) for more information. ## Monorepo Libraries | Library | Description | Installation | Version | |---------|-------------|--------------|---------| | [**Lume**](./libs/lume/README.md) | CLI for running macOS/Linux VMs with near-native performance using Apple's `Virtualization.Framework`. 
| [![Download](https://img.shields.io/badge/Download-333333?style=for-the-badge&logo=github&logoColor=white)](https://github.com/trycua/cua/releases/latest/download/lume.pkg.tar.gz) | [![GitHub release](https://img.shields.io/github/v/release/trycua/cua?color=333333)](https://github.com/trycua/cua/releases) | | [**Computer**](./libs/computer/README.md) | Computer-Use Interface (CUI) framework for interacting with macOS/Linux sandboxes | `pip install cua-computer` | [![PyPI](https://img.shields.io/pypi/v/cua-computer?color=333333)](https://pypi.org/project/cua-computer/) | | [**Agent**](./libs/agent/README.md) | Computer-Use Agent (CUA) framework for running agentic workflows in macOS/Linux dedicated sandboxes | `pip install cua-agent` | [![PyPI](https://img.shields.io/pypi/v/cua-agent?color=333333)](https://pypi.org/project/cua-agent/) | ## Docs For the best onboarding experience with the packages in this monorepo, we recommend starting with the [Computer](./libs/computer/README.md) documentation to cover the core functionality of the Computer sandbox, then exploring the [Agent](./libs/agent/README.md) documentation to understand Cua's AI agent capabilities, and finally working through the Notebook examples. - [Lume](./libs/lume/README.md) - [Computer](./libs/computer/README.md) - [Agent](./libs/agent/README.md) - [Notebooks](./notebooks/) ## Demos Demos of the Computer-Use Agent in action. Share your most impressive demos in Cua's [Discord community](https://discord.com/invite/mVnXXpdE85)!
MCP Server: Work with Claude Desktop and Tableau
AI-Gradio: multi-app workflow requiring browser, VS Code and terminal access
Notebook: Fix GitHub issue in Cursor
## Accessory Libraries | Library | Description | Installation | Version | |---------|-------------|--------------|---------| | [**Core**](./libs/core/README.md) | Core functionality and utilities used by other Cua packages | `pip install cua-core` | [![PyPI](https://img.shields.io/pypi/v/cua-core?color=333333)](https://pypi.org/project/cua-core/) | | [**PyLume**](./libs/pylume/README.md) | Python bindings for Lume | `pip install pylume` | [![PyPI](https://img.shields.io/pypi/v/pylume?color=333333)](https://pypi.org/project/pylume/) | | [**Computer Server**](./libs/computer-server/README.md) | Server component for the Computer-Use Interface (CUI) framework | `pip install cua-computer-server` | [![PyPI](https://img.shields.io/pypi/v/cua-computer-server?color=333333)](https://pypi.org/project/cua-computer-server/) | | [**SOM**](./libs/som/README.md) | Set-of-Mark library for Agent | `pip install cua-som` | [![PyPI](https://img.shields.io/pypi/v/cua-som?color=333333)](https://pypi.org/project/cua-som/) | ## Contributing We welcome and greatly appreciate contributions to Cua! Whether you're improving documentation, adding new features, fixing bugs, or adding new VM images, your efforts help make Cua better for everyone. For detailed instructions on how to contribute, please refer to our [Contributing Guidelines](CONTRIBUTING.md). Join our [Discord community](https://discord.com/invite/mVnXXpdE85) to discuss ideas or get assistance. ## License Cua is open-sourced under the MIT License - see the [LICENSE](LICENSE.md) file for details. Microsoft's OmniParser, which is used in this project, is licensed under the Creative Commons Attribution 4.0 International License (CC-BY-4.0) - see the [OmniParser LICENSE](https://github.com/microsoft/OmniParser/blob/master/LICENSE) file for details. ## Trademarks Apple, macOS, and Apple Silicon are trademarks of Apple Inc. Ubuntu and Canonical are registered trademarks of Canonical Ltd. 
Microsoft is a registered trademark of Microsoft Corporation. This project is not affiliated with, endorsed by, or sponsored by Apple Inc., Canonical Ltd., or Microsoft Corporation. ## Stargazers over time [![Stargazers over time](https://starchart.cc/trycua/cua.svg?variant=adaptive)](https://starchart.cc/trycua/cua) ## Contributors
f-trycua
f-trycua

💻
Pedro Piñera Buendía
Pedro Piñera Buendía

💻
Amit Kumar
Amit Kumar

💻
Dung Duc Huynh (Kaka)
Dung Duc Huynh (Kaka)

💻
Zayd Krunz
Zayd Krunz

💻
Prashant Raj
Prashant Raj

💻
Leland Takamine
Leland Takamine

💻
ddupont
ddupont

💻
Ethan Gutierrez
Ethan Gutierrez

💻
Ricter Zheng
Ricter Zheng

💻
Rahul Karajgikar
Rahul Karajgikar

💻
trospix
trospix

💻
Ikko Eltociear Ashimine
Ikko Eltociear Ashimine

💻
한석호(MilKyo)
한석호(MilKyo)

💻
Rahim Nathwani
Rahim Nathwani

💻
Matt Speck
Matt Speck

💻
## /docs/Developer-Guide.md # Getting Started ## Project Structure The project is organized as a monorepo with these main packages: - `libs/core/` - Base package with telemetry support - `libs/computer/` - Computer-use interface (CUI) library - `libs/agent/` - AI agent library with multi-provider support - `libs/som/` - Set-of-Mark parser - `libs/computer-server/` - Server component for VM - `libs/lume/` - Lume CLI - `libs/pylume/` - Python bindings for Lume Each package has its own virtual environment and dependencies, managed through PDM. ## Local Development Setup 1. Install Lume CLI: ```bash /bin/bash -c "$(curl -fsSL https://raw.githubusercontent.com/trycua/cua/main/libs/lume/scripts/install.sh)" ``` 2. Clone the repository: ```bash git clone https://github.com/trycua/cua.git cd cua ``` 3. Create a `.env.local` file in the root directory with your API keys: ```bash # Required for Anthropic provider ANTHROPIC_API_KEY=your_anthropic_key_here # Required for OpenAI provider OPENAI_API_KEY=your_openai_key_here ``` 4. Open the workspace in VSCode or Cursor: ```bash # For Cua Python development code .vscode/py.code-workspace # For Lume (Swift) development code .vscode/lume.code-workspace ``` Using the workspace file is strongly recommended as it: - Sets up correct Python environments for each package - Configures proper import paths - Enables debugging configurations - Maintains consistent settings across packages ## Lume Development Refer to the [Lume README](../libs/lume/docs/Development.md) for instructions on how to develop the Lume CLI. ## Python Development There are two ways to instal Lume: ### Run the build script Run the build script to set up all packages: ```bash ./scripts/build.sh ``` The build script creates a shared virtual environment for all packages. The workspace configuration automatically handles import paths with the correct Python path settings. 
This will: - Create a virtual environment for the project - Install all packages in development mode - Set up the correct Python path - Install development tools ### Install with PDM If PDM is not already installed, you can follow the installation instructions [here](https://pdm-project.org/en/latest/#installation). To install with PDM, simply run: ```console pdm install -G:all ``` This installs all the dependencies for development, testing, and building the docs. If you'd only like development dependencies, you can run: ```console pdm install -d ``` ## Running Examples The Python workspace includes launch configurations for all packages: - "Run Computer Examples" - Runs computer examples - "Run Computer API Server" - Runs the computer-server - "Run Agent Examples" - Runs agent examples - "SOM" configurations - Various settings for running SOM To run examples from VSCode / Cursor: 1. Press F5 or use the Run/Debug view 2. Select the desired configuration The workspace also includes compound launch configurations: - "Run Computer Examples + Server" - Runs both the Computer Examples and Server simultaneously ## Docker Development Environment As an alternative to installing directly on your host machine, you can use Docker for development. This approach has several advantages: ### Prerequisites - Docker installed on your machine - Lume server running on your host (port 3000): `lume serve` ### Setup and Usage 1. Build the development Docker image: ```bash ./scripts/run-docker-dev.sh build ``` 2. Run an example in the container: ```bash ./scripts/run-docker-dev.sh run computer_examples.py ``` 3. Get an interactive shell in the container: ```bash ./scripts/run-docker-dev.sh run --interactive ``` 4. 
Stop any running containers: ```bash ./scripts/run-docker-dev.sh stop ``` ### How it Works The Docker development environment: - Installs all required Python dependencies in the container - Mounts your source code from the host at runtime - Automatically configures the connection to use host.docker.internal:3000 for accessing the Lume server on your host machine - Preserves your code changes without requiring rebuilds (source code is mounted as a volume) > **Note**: The Docker container doesn't include the macOS-specific Lume executable. Instead, it connects to the Lume server running on your host machine via host.docker.internal:3000. Make sure to start the Lume server on your host before running examples in the container. ## Cleanup and Reset If you need to clean up the environment (non-docker) and start fresh: ```bash ./scripts/cleanup.sh ``` This will: - Remove all virtual environments - Clean Python cache files and directories - Remove build artifacts - Clean PDM-related files - Reset environment configurations ## Code Formatting Standards The cua project follows strict code formatting standards to ensure consistency across all packages. ### Python Code Formatting #### Tools The project uses the following tools for code formatting and linting: - **[Black](https://black.readthedocs.io/)**: Code formatter - **[Ruff](https://beta.ruff.rs/docs/)**: Fast linter and formatter - **[MyPy](https://mypy.readthedocs.io/)**: Static type checker These tools are automatically installed when you set up the development environment using the `./scripts/build.sh` script. 
#### Configuration The formatting configuration is defined in the root `pyproject.toml` file: ```toml [tool.black] line-length = 100 target-version = ["py310"] [tool.ruff] line-length = 100 target-version = "py310" select = ["E", "F", "B", "I"] fix = true [tool.ruff.format] docstring-code-format = true [tool.mypy] strict = true python_version = "3.10" ignore_missing_imports = true disallow_untyped_defs = true check_untyped_defs = true warn_return_any = true show_error_codes = true warn_unused_ignores = false ``` #### Key Formatting Rules - **Line Length**: Maximum of 100 characters - **Python Version**: Code should be compatible with Python 3.10+ - **Imports**: Automatically sorted (using Ruff's "I" rule) - **Type Hints**: Required for all function definitions (strict mypy mode) #### IDE Integration The repository includes VSCode workspace configurations that enable automatic formatting. When you open the workspace files (as recommended in the setup instructions), the correct formatting settings are automatically applied. Python-specific settings in the workspace files: ```json "[python]": { "editor.formatOnSave": true, "editor.defaultFormatter": "ms-python.black-formatter", "editor.codeActionsOnSave": { "source.organizeImports": "explicit" } } ``` Recommended VS Code extensions: - Black Formatter (ms-python.black-formatter) - Ruff (charliermarsh.ruff) - Pylance (ms-python.vscode-pylance) #### Manual Formatting To manually format code: ```bash # Format all Python files using Black pdm run black . # Run Ruff linter with auto-fix pdm run ruff check --fix . # Run type checking with MyPy pdm run mypy . ``` #### Pre-commit Validation Before submitting a pull request, ensure your code passes all formatting checks: ```bash # Run all checks pdm run black --check . pdm run ruff check . pdm run mypy . 
``` ### Swift Code (Lume) For Swift code in the `libs/lume` directory: - Follow the [Swift API Design Guidelines](https://www.swift.org/documentation/api-design-guidelines/) - Use SwiftFormat for consistent formatting - Code will be automatically formatted on save when using the lume workspace ## /docs/FAQ.md # FAQs ### Why a local sandbox? A local sandbox is a dedicated environment that is isolated from the rest of the system. As AI agents rapidly evolve towards 70-80% success rates on average tasks, having a controlled and secure environment becomes crucial. Cua's Computer-Use AI agents run in a local sandbox to ensure reliability, safety, and controlled execution. Benefits of using a local sandbox rather than running the Computer-Use AI agent in the host system: - **Reliability**: The sandbox provides a reproducible environment - critical for benchmarking and debugging agent behavior. Frameworks like [OSWorld](https://github.com/xlang-ai/OSWorld), [Simular AI](https://github.com/simular-ai/Agent-S), Microsoft's [OmniTool](https://github.com/microsoft/OmniParser/tree/master/omnitool), [WindowsAgentArena](https://github.com/microsoft/WindowsAgentArena) and more are using Computer-Use AI agents running in local sandboxes. - **Safety & Isolation**: The sandbox is isolated from the rest of the system, protecting sensitive data and system resources. As CUA agent capabilities grow, this isolation becomes increasingly important for preventing potential safety breaches. - **Control**: The sandbox can be easily monitored and terminated if needed, providing oversight for autonomous agent operation. ### Where are the sandbox images stored? Sandbox are stored in `~/.lume`, and cached images are stored in `~/.lume/cache`. ### Which image is Computer using? Computer uses an optimized macOS image for Computer-Use interactions, with pre-installed apps and settings for optimal performance. 
The image is available on our [ghcr registry](https://github.com/orgs/trycua/packages/container/package/macos-sequoia-cua). ### Are Sandbox disks taking up all the disk space? No, macOS uses sparse files, which only allocate space as needed. For example, VM disks totaling 50 GB may only use 20 GB on disk. ### How do I delete a VM? ```bash lume delete ``` ### How do I fix EasyOCR `[SSL: CERTIFICATE_VERIFY_FAILED]` errors? **Symptom:** When running an agent that uses OCR (e.g., with `AgentLoop.OMNI`), you might encounter an error during the first run or initialization phase that includes: ``` ssl.SSLCertVerificationError: [SSL: CERTIFICATE_VERIFY_FAILED] certificate verify failed: unable to get local issuer certificate (_ssl.c:1000) ``` **Cause:** This usually happens when EasyOCR attempts to download its language models over HTTPS for the first time. Python's SSL module cannot verify the server's certificate because it can't locate the necessary root Certificate Authority (CA) certificates in your environment's trust store. **Solution:** You need to explicitly tell Python where to find a trusted CA bundle. The `certifi` package provides one. Before running your Python agent script **the first time it needs to download models**, set the following environment variables in the *same terminal session*: ```bash # Ensure certifi is installed: pip show certifi export SSL_CERT_FILE=$(python -m certifi) export REQUESTS_CA_BUNDLE=$(python -m certifi) # Now run your Python script that uses the agent... # python your_agent_script.py ``` This directs Python to use the CA bundle provided by `certifi` for SSL verification. **Note:** Once EasyOCR has successfully downloaded its models, you typically do not need to set these environment variables before every subsequent run. ### How do I troubleshoot the agent failing to get the VM IP address or getting stuck on "VM status changed to: stopped"? 
**Symptom:** When running your agent script (e.g., using `Computer().run(...)`), the script might hang during the VM startup phase, logging messages like: * `Waiting for VM to be ready...` * `VM status changed to: stopped (after 0.0s)` * `Still waiting for VM IP address... (elapsed: XX.Xs)` * Eventually, it might time out, or you might notice the VM window never appears or closes quickly. **Cause:** This is typically due to known instability issues with the `lume serve` background daemon process, as documented in the main `README.md`: 1. **`lume serve` Crash:** The `lume serve` process might terminate unexpectedly shortly after launch or when the script tries to interact with it. If it's not running, the script cannot get VM status updates or the IP address. 2. **Incorrect Status Reporting:** Even if `lume serve` is running, its API sometimes incorrectly reports the VM status as `stopped` immediately after startup is initiated. While the underlying `Computer` library tries to poll and wait for the correct `running` status, this initial incorrect report can cause delays or failures if the status doesn't update correctly within the timeout or if `lume serve` crashes during the polling. **Troubleshooting Steps:** 1. **Check `lume serve`:** Is the `lume serve` process still running in its terminal? Did it print any errors or exit? If it's not running, stop your agent script (`Ctrl+C`) and proceed to step 2. 2. **Force Cleanup:** Before *every* run, perform a rigorous cleanup to ensure no old `lume` processes or VM states interfere. Open a **new terminal** and run: ```bash # Stop any running Lume VM gracefully first (replace if needed) lume stop macos-sequoia-cua_latest # Force kill lume serve and related processes pkill -f "lume serve" pkill -9 -f "lume" pkill -9 -f "VzVirtualMachine" # Kills underlying VM process # Optional: Verify they are gone # ps aux | grep -E 'lume|VzVirtualMachine' | grep -v grep ``` 3. 
**Restart Sequence:** * **Terminal 1:** Start `lume serve` cleanly: ```bash lume serve ``` *(Watch this terminal to ensure it stays running).* * **Terminal 2:** Run your agent script (including the `export SSL_CERT_FILE...` commands if *first time* using OCR): ```bash # export SSL_CERT_FILE=$(python -m certifi) # Only if first run with OCR # export REQUESTS_CA_BUNDLE=$(python -m certifi) # Only if first run with OCR python your_agent_script.py ``` 4. **Retry:** Due to the intermittent nature of the Lume issues, sometimes simply repeating steps 2 and 3 allows the run to succeed if the timing avoids the status reporting bug or the `lume serve` crash. **Related Issue: "No route to host" Error (macOS Sequoia+)** * **Symptom:** Even if the `Computer` library logs show the VM has obtained an IP address, you might encounter connection errors like `No route to host` when the agent tries to connect to the internal server, especially when running the agent script from within an IDE (like VS Code or Cursor). * **Cause:** This is often due to macOS Sequoia's enhanced local network privacy controls. Applications need explicit permission to access the local network, which includes communicating with the VM. * **Solution:** Grant "Local Network" access to the application you are running the script from (e.g., your IDE or terminal application). Go to **System Settings > Privacy & Security > Local Network**, find your application in the list, and toggle the switch ON. You might need to trigger a connection attempt from the application first for it to appear in the list. See [GitHub Issue #61](https://github.com/trycua/cua/issues/61) for more details and discussion. **Note:** Improving the stability of `lume serve` is an ongoing development area. ### How do I troubleshoot Computer not connecting to lume daemon? If you're experiencing connection issues between Computer and the lume daemon, it could be because the port 3000 (used by lume) is already in use by an orphaned process. 
You can diagnose this issue with:

```bash
sudo lsof -i :3000
```

This command will show all processes using port 3000. If you see a lume process already running, you can terminate it with:

```bash
kill <PID>
```

Where `<PID>` is the process ID shown in the output of the `lsof` command. After terminating the process, run `lume serve` again to start the lume daemon.

### What information does Cua track?

Cua tracks anonymized usage and error report statistics; we ascribe to Posthog's approach as detailed [here](https://posthog.com/blog/open-source-telemetry-ethical). If you would like to opt out of sending anonymized info, you can set `telemetry_enabled` to false in the Computer or Agent constructor. Check out our [Telemetry](Telemetry.md) documentation for more details.

## /docs/Telemetry.md

# Telemetry in CUA

This document explains how telemetry works in CUA libraries and how you can control it.

CUA tracks anonymized usage and error report statistics; we ascribe to Posthog's approach as detailed [here](https://posthog.com/blog/open-source-telemetry-ethical). If you would like to opt out of sending anonymized info, you can set `telemetry_enabled` to false.

## What telemetry data we collect

CUA libraries collect minimal anonymous usage data to help improve our software. The telemetry data we collect is specifically limited to:

- Basic system information:
  - Operating system (e.g., 'darwin', 'win32', 'linux')
  - Python version (e.g., '3.10.0')
- Module initialization events:
  - When a module (like 'computer' or 'agent') is imported
  - Version of the module being used

We do NOT collect:

- Personal information
- Contents of files
- Specific text being typed
- Actual screenshots or screen contents
- User-specific identifiers
- API keys
- File contents
- Application data or content
- User interactions with the computer
- Information about files being accessed

## Controlling Telemetry

We are committed to transparency and user control over telemetry.
There are two ways to control telemetry:

## 1. Environment Variable (Global Control)

Telemetry is enabled by default. To disable telemetry, set the `CUA_TELEMETRY_ENABLED` environment variable to a falsy value (`0`, `false`, `no`, or `off`):

```bash
# Disable telemetry before running your script
export CUA_TELEMETRY_ENABLED=false

# Or as part of the command
CUA_TELEMETRY_ENABLED=false python your_script.py
```

Or from Python:

```python
import os
os.environ["CUA_TELEMETRY_ENABLED"] = "false"
```

## 2. Instance-Level Control

You can control telemetry for specific CUA instances by setting `telemetry_enabled` when creating them:

```python
# Disable telemetry for a specific Computer instance
computer = Computer(telemetry_enabled=False)

# Enable telemetry for a specific Agent instance
agent = ComputerAgent(telemetry_enabled=True)
```

You can check if telemetry is enabled for an instance:

```python
print(computer.telemetry_enabled)  # Will print True or False
```

Note that telemetry settings must be configured during initialization and cannot be changed after the object is created.

## Transparency

We believe in being transparent about the data we collect. If you have any questions about our telemetry practices, please open an issue on our GitHub repository.
## /examples/agent_examples.py ```py path="/examples/agent_examples.py" """Example demonstrating the ComputerAgent capabilities with the Omni provider.""" import asyncio import logging import traceback import signal from computer import Computer # Import the unified agent class and types from agent import ComputerAgent, LLMProvider, LLM, AgentLoop # Import utility functions from utils import load_dotenv_files, handle_sigint # Set up logging logging.basicConfig(level=logging.INFO) logger = logging.getLogger(__name__) async def run_agent_example(): """Run example of using the ComputerAgent with OpenAI and Omni provider.""" print("\n=== Example: ComputerAgent with OpenAI and Omni provider ===") try: # Create Computer instance with async context manager async with Computer(verbosity=logging.DEBUG) as macos_computer: # Create agent with loop and provider agent = ComputerAgent( computer=macos_computer, # loop=AgentLoop.OPENAI, # loop=AgentLoop.ANTHROPIC, # loop=AgentLoop.UITARS, loop=AgentLoop.OMNI, # model=LLM(provider=LLMProvider.OPENAI), # No model name for Operator CUA # model=LLM(provider=LLMProvider.OPENAI, name="gpt-4o"), # model=LLM(provider=LLMProvider.ANTHROPIC, name="claude-3-7-sonnet-20250219"), # model=LLM(provider=LLMProvider.OLLAMA, name="gemma3:4b-it-q4_K_M"), model=LLM( provider=LLMProvider.OAICOMPAT, name="gemma-3-12b-it", provider_base_url="http://localhost:1234/v1", # LM Studio local endpoint ), save_trajectory=True, only_n_most_recent_images=3, verbosity=logging.DEBUG, ) tasks = [ "Look for a repository named trycua/cua on GitHub.", "Check the open issues, open the most recent one and read it.", "Clone the repository in users/lume/projects if it doesn't exist yet.", "Open the repository with an app named Cursor (on the dock, black background and white cube icon).", "From Cursor, open Composer if not already open.", "Focus on the Composer text area, then write and submit a task to help resolve the GitHub issue.", ] for i, task in enumerate(tasks): 
print(f"\nExecuting task {i}/{len(tasks)}: {task}") async for result in agent.run(task): print("Response ID: ", result.get("id")) # Print detailed usage information usage = result.get("usage") if usage: print("\nUsage Details:") print(f" Input Tokens: {usage.get('input_tokens')}") if "input_tokens_details" in usage: print(f" Input Tokens Details: {usage.get('input_tokens_details')}") print(f" Output Tokens: {usage.get('output_tokens')}") if "output_tokens_details" in usage: print(f" Output Tokens Details: {usage.get('output_tokens_details')}") print(f" Total Tokens: {usage.get('total_tokens')}") print("Response Text: ", result.get("text")) # Print tools information tools = result.get("tools") if tools: print("\nTools:") print(tools) # Print reasoning and tool call outputs outputs = result.get("output", []) for output in outputs: output_type = output.get("type") if output_type == "reasoning": print("\nReasoning Output:") print(output) elif output_type == "computer_call": print("\nTool Call Output:") print(output) print(f"\n✅ Task {i+1}/{len(tasks)} completed: {task}") except Exception as e: logger.error(f"Error in run_agent_example: {e}") traceback.print_exc() raise def main(): """Run the Anthropic agent example.""" try: load_dotenv_files() # Register signal handler for graceful exit signal.signal(signal.SIGINT, handle_sigint) asyncio.run(run_agent_example()) except Exception as e: print(f"Error running example: {e}") traceback.print_exc() if __name__ == "__main__": main() ``` ## /examples/agent_ui_examples.py ```py path="/examples/agent_ui_examples.py" #!/usr/bin/env python3 """ Simple example script for the Computer-Use Agent Gradio UI. This script launches the advanced Gradio UI for the Computer-Use Agent with full model selection and configuration options. It can be run directly from the command line. 
""" from utils import load_dotenv_files load_dotenv_files() # Import the create_gradio_ui function from agent.ui.gradio.app import create_gradio_ui if __name__ == "__main__": print("Launching Computer-Use Agent Gradio UI with advanced features...") app = create_gradio_ui() app.launch(share=False) ``` ## /examples/computer_examples.py ```py path="/examples/computer_examples.py" import os import asyncio from pathlib import Path import sys import json import traceback # Load environment variables from .env file project_root = Path(__file__).parent.parent env_file = project_root / ".env" print(f"Loading environment from: {env_file}") from dotenv import load_dotenv load_dotenv(env_file) # Add paths to sys.path if needed pythonpath = os.environ.get("PYTHONPATH", "") for path in pythonpath.split(":"): if path and path not in sys.path: sys.path.append(path) print(f"Added to sys.path: {path}") from computer.computer import Computer from computer.logger import LogLevel from computer.utils import get_image_size async def main(): try: print("\n=== Using direct initialization ===") # Create computer with configured host computer = Computer( display="1024x768", # Higher resolution memory="8GB", # More memory cpu="4", # More CPU cores os="macos", verbosity=LogLevel.NORMAL, # Use QUIET to suppress most logs use_host_computer_server=False, ) try: await computer.run() await computer.interface.hotkey("command", "space") # res = await computer.interface.run_command("touch ./Downloads/empty_file") # print(f"Run command result: {res}") accessibility_tree = await computer.interface.get_accessibility_tree() print(f"Accessibility tree: {accessibility_tree}") # Screen Actions Examples # print("\n=== Screen Actions ===") # screenshot = await computer.interface.screenshot() # with open("screenshot_direct.png", "wb") as f: # f.write(screenshot) screen_size = await computer.interface.get_screen_size() print(f"Screen size: {screen_size}") # Demonstrate coordinate conversion center_x, center_y = 
733, 736 print(f"Center in screen coordinates: ({center_x}, {center_y})") screenshot_center = await computer.to_screenshot_coordinates(center_x, center_y) print(f"Center in screenshot coordinates: {screenshot_center}") screen_center = await computer.to_screen_coordinates(*screenshot_center) print(f"Back to screen coordinates: {screen_center}") # Mouse Actions Examples print("\n=== Mouse Actions ===") await computer.interface.move_cursor(100, 100) await computer.interface.left_click() await computer.interface.right_click(300, 300) await computer.interface.double_click(400, 400) # Keyboard Actions Examples print("\n=== Keyboard Actions ===") await computer.interface.type_text("Hello, World!") await computer.interface.press_key("enter") # Clipboard Actions Examples print("\n=== Clipboard Actions ===") await computer.interface.set_clipboard("Test clipboard") content = await computer.interface.copy_to_clipboard() print(f"Clipboard content: {content}") finally: # Important to clean up resources pass # await computer.stop() except Exception as e: print(f"Error in main: {e}") traceback.print_exc() if __name__ == "__main__": asyncio.run(main()) ``` ## /examples/computer_ui_examples.py ```py path="/examples/computer_ui_examples.py" #!/usr/bin/env python3 """ Simple example script for the Computer Interface Gradio UI. This script launches the advanced Gradio UI for the Computer Interface with full model selection and configuration options. It can be run directly from the command line. 
""" from utils import load_dotenv_files load_dotenv_files() # Import the create_gradio_ui function from computer.ui.gradio.app import create_gradio_ui if __name__ == "__main__": print("Launching Computer Interface Gradio UI with advanced features...") app = create_gradio_ui() app.launch(share=False) # Optional: Using the saved dataset # import datasets # from computer.ui.utils import convert_to_unsloth # ds = datasets.load_dataset("ddupont/highquality-cua-demonstrations") # ds = convert_to_unsloth(ds) ``` ## /examples/pylume_examples.py ```py path="/examples/pylume_examples.py" import asyncio from pylume import PyLume, ImageRef, VMRunOpts, SharedDirectory, VMConfig, VMUpdateOpts async def main(): """Example usage of PyLume.""" async with PyLume(port=3000, use_existing_server=False, debug=True) as pylume: # Get latest IPSW URL print("\n=== Getting Latest IPSW URL ===") url = await pylume.get_latest_ipsw_url() print("Latest IPSW URL:", url) # Create a new VM print("\n=== Creating a new VM ===") vm_config = VMConfig( name="lume-vm-new", os="macOS", cpu=2, memory="4GB", disk_size="64GB", # type: ignore display="1024x768", ipsw="latest", ) await pylume.create_vm(vm_config) # Get latest IPSW URL print("\n=== Getting Latest IPSW URL ===") url = await pylume.get_latest_ipsw_url() print("Latest IPSW URL:", url) # List available images print("\n=== Listing Available Images ===") images = await pylume.get_images() print("Available Images:", images) # List all VMs to verify creation print("\n=== Listing All VMs ===") vms = await pylume.list_vms() print("VMs:", vms) # Get specific VM details print("\n=== Getting VM Details ===") vm = await pylume.get_vm("lume-vm") print("VM Details:", vm) # Update VM settings print("\n=== Updating VM Settings ===") update_opts = VMUpdateOpts(cpu=8, memory="4GB") await pylume.update_vm("lume-vm", update_opts) # Pull an image image_ref = ImageRef( image="macos-sequoia-vanilla", tag="latest", registry="ghcr.io", organization="trycua" ) await 
pylume.pull_image(image_ref, name="lume-vm-pulled") # Run with shared directory run_opts = VMRunOpts( no_display=False, # type: ignore shared_directories=[ # type: ignore SharedDirectory(host_path="~/shared", read_only=False) # type: ignore ], ) await pylume.run_vm("lume-vm", run_opts) # Or simpler: await pylume.run_vm("lume-vm") # Clone VM print("\n=== Cloning VM ===") await pylume.clone_vm("lume-vm", "lume-vm-cloned") # Stop VM print("\n=== Stopping VM ===") await pylume.stop_vm("lume-vm") # Delete VM print("\n=== Deleting VM ===") await pylume.delete_vm("lume-vm-cloned") if __name__ == "__main__": asyncio.run(main()) ``` ## /examples/som_examples.py ```py path="/examples/som_examples.py" #!/usr/bin/env python3 """ Example script demonstrating the usage of OmniParser's UI element detection functionality. This script shows how to: 1. Initialize the OmniParser 2. Load and process images 3. Visualize detection results 4. Compare performance between CPU and MPS (Apple Silicon) """ import argparse import logging import sys from pathlib import Path import time from PIL import Image from typing import Dict, Any, List, Optional import numpy as np import io import base64 import glob import os # Load environment variables from .env file project_root = Path(__file__).parent.parent env_file = project_root / ".env" print(f"Loading environment from: {env_file}") from dotenv import load_dotenv load_dotenv(env_file) # Add paths to sys.path if needed pythonpath = os.environ.get("PYTHONPATH", "") for path in pythonpath.split(":"): if path and path not in sys.path: sys.path.append(path) print(f"Added to sys.path: {path}") # Add the libs directory to the path to find som libs_path = project_root / "libs" if str(libs_path) not in sys.path: sys.path.append(str(libs_path)) print(f"Added to sys.path: {libs_path}") from som import OmniParser, ParseResult, IconElement, TextElement from som.models import UIElement, ParserMetadata, BoundingBox # Configure logging logging.basicConfig( 
level=logging.INFO, format="%(asctime)s - %(name)s - %(levelname)s - %(message)s", datefmt="%Y-%m-%d %H:%M:%S", ) logger = logging.getLogger(__name__) def setup_logging(): """Configure logging with a nice format.""" logging.basicConfig( level=logging.INFO, format="%(asctime)s - %(levelname)s - %(message)s", datefmt="%Y-%m-%d %H:%M:%S", ) class Timer: """Enhanced context manager for timing code blocks.""" def __init__(self, name: str, logger): self.name = name self.logger = logger self.start_time: float = 0.0 self.elapsed_time: float = 0.0 def __enter__(self): self.start_time = time.time() return self def __exit__(self, *args): self.elapsed_time = time.time() - self.start_time self.logger.info(f"{self.name}: {self.elapsed_time:.3f}s") return False def image_to_bytes(image: Image.Image) -> bytes: """Convert PIL Image to PNG bytes.""" buf = io.BytesIO() image.save(buf, format="PNG") return buf.getvalue() def process_image( parser: OmniParser, image_path: str, output_dir: Path, use_ocr: bool = False ) -> None: """Process a single image and save the result.""" try: # Load image logger.info(f"Processing image: {image_path}") image = Image.open(image_path).convert("RGB") logger.info(f"Image loaded successfully, size: {image.size}") # Create output filename input_filename = Path(image_path).stem output_path = output_dir / f"{input_filename}_analyzed.png" # Convert image to PNG bytes image_bytes = image_to_bytes(image) # Process image with Timer(f"Processing {input_filename}", logger): result = parser.parse(image_bytes, use_ocr=use_ocr) logger.info( f"Found {result.metadata.num_icons} icons and {result.metadata.num_text} text elements" ) # Save the annotated image logger.info(f"Saving annotated image to: {output_path}") try: # Save image from base64 img_data = base64.b64decode(result.annotated_image_base64) img = Image.open(io.BytesIO(img_data)) img.save(output_path) # Print detailed results logger.info("\nDetected Elements:") for elem in result.elements: if 
isinstance(elem, IconElement): logger.info( f"Icon: confidence={elem.confidence:.3f}, bbox={elem.bbox.coordinates}" ) elif isinstance(elem, TextElement): logger.info( f"Text: '{elem.content}', confidence={elem.confidence:.3f}, bbox={elem.bbox.coordinates}" ) # Verify file exists and log size if output_path.exists(): logger.info( f"Successfully saved image. File size: {output_path.stat().st_size} bytes" ) else: logger.error(f"Failed to verify file at {output_path}") except Exception as e: logger.error(f"Error saving image: {str(e)}", exc_info=True) except Exception as e: logger.error(f"Error processing image {image_path}: {str(e)}", exc_info=True) def run_detection_benchmark( input_path: str, output_dir: Path, use_ocr: bool = False, box_threshold: float = 0.01, iou_threshold: float = 0.1, ): """Run detection benchmark on images.""" logger.info( f"Starting benchmark with OCR enabled: {use_ocr}, box_threshold: {box_threshold}, iou_threshold: {iou_threshold}" ) try: # Initialize parser logger.info("Initializing OmniParser...") parser = OmniParser() # Create output directory output_dir.mkdir(parents=True, exist_ok=True) logger.info(f"Output directory created at: {output_dir}") # Get list of PNG files if os.path.isdir(input_path): image_files = glob.glob(os.path.join(input_path, "*.png")) else: image_files = [input_path] logger.info(f"Found {len(image_files)} images to process") # Process each image with specified thresholds for image_path in image_files: try: # Load image logger.info(f"Processing image: {image_path}") image = Image.open(image_path).convert("RGB") logger.info(f"Image loaded successfully, size: {image.size}") # Create output filename input_filename = Path(image_path).stem output_path = output_dir / f"{input_filename}_analyzed.png" # Convert image to PNG bytes image_bytes = image_to_bytes(image) # Process image with specified thresholds with Timer(f"Processing {input_filename}", logger): result = parser.parse( image_bytes, use_ocr=use_ocr, 
box_threshold=box_threshold, iou_threshold=iou_threshold, ) logger.info( f"Found {result.metadata.num_icons} icons and {result.metadata.num_text} text elements" ) # Save the annotated image logger.info(f"Saving annotated image to: {output_path}") try: # Save image from base64 img_data = base64.b64decode(result.annotated_image_base64) img = Image.open(io.BytesIO(img_data)) img.save(output_path) # Print detailed results logger.info("\nDetected Elements:") for elem in result.elements: if isinstance(elem, IconElement): logger.info( f"Icon: confidence={elem.confidence:.3f}, bbox={elem.bbox.coordinates}" ) elif isinstance(elem, TextElement): logger.info( f"Text: '{elem.content}', confidence={elem.confidence:.3f}, bbox={elem.bbox.coordinates}" ) # Verify file exists and log size if output_path.exists(): logger.info( f"Successfully saved image. File size: {output_path.stat().st_size} bytes" ) else: logger.error(f"Failed to verify file at {output_path}") except Exception as e: logger.error(f"Error saving image: {str(e)}", exc_info=True) except Exception as e: logger.error(f"Error processing image {image_path}: {str(e)}", exc_info=True) except Exception as e: logger.error(f"Benchmark failed: {str(e)}", exc_info=True) raise def run_experiments(input_path: str, output_dir: Path, use_ocr: bool = False): """Run experiments with different threshold combinations.""" # Define threshold values to test box_thresholds = [0.01, 0.05, 0.1, 0.3] iou_thresholds = [0.05, 0.1, 0.2, 0.5] logger.info("Starting threshold experiments...") logger.info("Box thresholds to test: %s", box_thresholds) logger.info("IOU thresholds to test: %s", iou_thresholds) # Create results directory for this experiment timestamp = time.strftime("%Y%m%d-%H%M%S") ocr_suffix = "_ocr" if use_ocr else "_no_ocr" exp_dir = output_dir / f"experiment_{timestamp}{ocr_suffix}" exp_dir.mkdir(parents=True, exist_ok=True) # Create a summary file summary_file = exp_dir / "results_summary.txt" with open(summary_file, "w") as f: 
f.write("Threshold Experiments Results\n") f.write("==========================\n\n") f.write(f"Input: {input_path}\n") f.write(f"OCR Enabled: {use_ocr}\n") f.write(f"Date: {time.strftime('%Y-%m-%d %H:%M:%S')}\n\n") f.write("Results:\n") f.write("-" * 80 + "\n") f.write( f"{'Box Thresh':^10} | {'IOU Thresh':^10} | {'Num Icons':^10} | {'Num Text':^10} | {'Time (s)':^10}\n" ) f.write("-" * 80 + "\n") # Initialize parser once for all experiments parser = OmniParser() # Run experiments with each combination for box_thresh in box_thresholds: for iou_thresh in iou_thresholds: logger.info(f"\nTesting box_threshold={box_thresh}, iou_threshold={iou_thresh}") # Create directory for this combination combo_dir = exp_dir / f"box_{box_thresh}_iou_{iou_thresh}" combo_dir.mkdir(exist_ok=True) try: # Process each image if os.path.isdir(input_path): image_files = glob.glob(os.path.join(input_path, "*.png")) else: image_files = [input_path] total_icons = 0 total_text = 0 total_time = 0 for image_path in image_files: # Load and process image image = Image.open(image_path).convert("RGB") image_bytes = image_to_bytes(image) # Process with current thresholds with Timer(f"Processing {Path(image_path).stem}", logger) as t: result = parser.parse( image_bytes, use_ocr=use_ocr, box_threshold=box_thresh, iou_threshold=iou_thresh, ) # Save annotated image output_path = combo_dir / f"{Path(image_path).stem}_analyzed.png" img_data = base64.b64decode(result.annotated_image_base64) img = Image.open(io.BytesIO(img_data)) img.save(output_path) # Update totals total_icons += result.metadata.num_icons total_text += result.metadata.num_text # Log detailed results detail_file = combo_dir / f"{Path(image_path).stem}_details.txt" with open(detail_file, "w") as detail_f: detail_f.write(f"Results for {Path(image_path).name}\n") detail_f.write("-" * 40 + "\n") detail_f.write(f"Number of icons: {result.metadata.num_icons}\n") detail_f.write( f"Number of text elements: {result.metadata.num_text}\n\n" ) 
detail_f.write("Icon Detections:\n") icon_count = 1 text_count = ( result.metadata.num_icons + 1 ) # Text boxes start after icons # First list all icons for elem in result.elements: if isinstance(elem, IconElement): detail_f.write(f"Box #{icon_count}: Icon\n") detail_f.write(f" - Confidence: {elem.confidence:.3f}\n") detail_f.write( f" - Coordinates: {elem.bbox.coordinates}\n" ) icon_count += 1 if use_ocr: detail_f.write("\nText Detections:\n") for elem in result.elements: if isinstance(elem, TextElement): detail_f.write(f"Box #{text_count}: Text\n") detail_f.write(f" - Content: '{elem.content}'\n") detail_f.write( f" - Confidence: {elem.confidence:.3f}\n" ) detail_f.write( f" - Coordinates: {elem.bbox.coordinates}\n" ) text_count += 1 # Update timing totals total_time += t.elapsed_time # Write summary for this combination avg_time = total_time / len(image_files) f.write( f"{box_thresh:^10.3f} | {iou_thresh:^10.3f} | {total_icons:^10d} | {total_text:^10d} | {avg_time:^10.3f}\n" ) except Exception as e: logger.error( f"Error in experiment box={box_thresh}, iou={iou_thresh}: {str(e)}" ) f.write( f"{box_thresh:^10.3f} | {iou_thresh:^10.3f} | {'ERROR':^10s} | {'ERROR':^10s} | {'ERROR':^10s}\n" ) # Write summary footer f.write("-" * 80 + "\n") f.write("\nExperiment completed successfully!\n") logger.info(f"\nExperiment results saved to {exp_dir}") logger.info(f"Summary file: {summary_file}") def main(): """Main entry point.""" parser = argparse.ArgumentParser(description="Run OmniParser benchmark") parser.add_argument("input_path", help="Path to input image or directory containing images") parser.add_argument( "--output-dir", default="examples/output", help="Output directory for annotated images" ) parser.add_argument( "--ocr", choices=["none", "easyocr"], default="none", help="OCR engine to use (default: none)", ) parser.add_argument( "--mode", choices=["single", "experiment"], default="single", help="Run mode: single run or threshold experiments (default: single)", ) 
parser.add_argument( "--box-threshold", type=float, default=0.01, help="Confidence threshold for detection (default: 0.01)", ) parser.add_argument( "--iou-threshold", type=float, default=0.1, help="IOU threshold for Non-Maximum Suppression (default: 0.1)", ) args = parser.parse_args() logger.info(f"Starting OmniParser with arguments: {args}") use_ocr = args.ocr != "none" output_dir = Path(args.output_dir) try: if args.mode == "experiment": run_experiments(args.input_path, output_dir, use_ocr) else: run_detection_benchmark( args.input_path, output_dir, use_ocr, args.box_threshold, args.iou_threshold ) except Exception as e: logger.error(f"Process failed: {str(e)}", exc_info=True) return 1 return 0 if __name__ == "__main__": sys.exit(main()) ``` ## /examples/utils.py ```py path="/examples/utils.py" """Utility functions for example scripts.""" import os import sys import signal from pathlib import Path from typing import Optional def load_env_file(path: Path) -> bool: """Load environment variables from a file. Args: path: Path to the .env file Returns: True if file was loaded successfully, False otherwise """ if not path.exists(): return False print(f"Loading environment from {path}") with open(path, "r") as f: for line in f: line = line.strip() if not line or line.startswith("#"): continue key, value = line.split("=", 1) os.environ[key] = value return True def load_dotenv_files(): """Load environment variables from .env files. Tries to load from .env.local first, then .env if .env.local doesn't exist. 
""" # Get the project root directory (parent of the examples directory) project_root = Path(__file__).parent.parent # Try loading .env.local first, then .env if .env.local doesn't exist env_local_path = project_root / ".env.local" env_path = project_root / ".env" # Load .env.local if it exists, otherwise try .env if not load_env_file(env_local_path): load_env_file(env_path) def handle_sigint(signum, frame): """Handle SIGINT (Ctrl+C) gracefully.""" print("\nExiting gracefully...") sys.exit(0) ``` ## /img/agent.png Binary file available at https://raw.githubusercontent.com/trycua/cua/refs/heads/main/img/agent.png ## /img/agent_gradio_ui.png Binary file available at https://raw.githubusercontent.com/trycua/cua/refs/heads/main/img/agent_gradio_ui.png ## /img/cli.png Binary file available at https://raw.githubusercontent.com/trycua/cua/refs/heads/main/img/cli.png ## /img/computer.png Binary file available at https://raw.githubusercontent.com/trycua/cua/refs/heads/main/img/computer.png ## /img/logo_black.png Binary file available at https://raw.githubusercontent.com/trycua/cua/refs/heads/main/img/logo_black.png ## /img/logo_white.png Binary file available at https://raw.githubusercontent.com/trycua/cua/refs/heads/main/img/logo_white.png ## /libs/agent/README.md

# cua-agent
[![Python](https://img.shields.io/badge/Python-333333?logo=python&logoColor=white&labelColor=333333)](#) [![macOS](https://img.shields.io/badge/macOS-000000?logo=apple&logoColor=F0F0F0)](#) [![Discord](https://img.shields.io/badge/Discord-%235865F2.svg?&logo=discord&logoColor=white)](https://discord.com/invite/mVnXXpdE85) [![PyPI](https://img.shields.io/pypi/v/cua-computer?color=333333)](https://pypi.org/project/cua-computer/)

**cua-agent** is a general Computer-Use framework for running multi-app agentic workflows targeting macOS and Linux sandbox created with Cua, supporting local (Ollama) and cloud model providers (OpenAI, Anthropic, Groq, DeepSeek, Qwen). ### Get started with Agent
## Install ```bash pip install "cua-agent[all]" # or install specific loop providers pip install "cua-agent[openai]" # OpenAI Cua Loop pip install "cua-agent[anthropic]" # Anthropic Cua Loop pip install "cua-agent[uitars]" # UI-Tars support pip install "cua-agent[omni]" # Cua Loop based on OmniParser (includes Ollama for local models) pip install "cua-agent[ui]" # Gradio UI for the agent ``` ## Run ```bash async with Computer() as macos_computer: # Create agent with loop and provider agent = ComputerAgent( computer=macos_computer, loop=AgentLoop.OPENAI, model=LLM(provider=LLMProvider.OPENAI) # or # loop=AgentLoop.ANTHROPIC, # model=LLM(provider=LLMProvider.ANTHROPIC) # or # loop=AgentLoop.OMNI, # model=LLM(provider=LLMProvider.OLLAMA, model="gemma3") # or # loop=AgentLoop.UITARS, # model=LLM(provider=LLMProvider.OAICOMPAT, model="tgi", provider_base_url="https://**************.us-east-1.aws.endpoints.huggingface.cloud/v1") ) tasks = [ "Look for a repository named trycua/cua on GitHub.", "Check the open issues, open the most recent one and read it.", "Clone the repository in users/lume/projects if it doesn't exist yet.", "Open the repository with an app named Cursor (on the dock, black background and white cube icon).", "From Cursor, open Composer if not already open.", "Focus on the Composer text area, then write and submit a task to help resolve the GitHub issue.", ] for i, task in enumerate(tasks): print(f"\nExecuting task {i}/{len(tasks)}: {task}") async for result in agent.run(task): print(result) print(f"\n✅ Task {i+1}/{len(tasks)} completed: {task}") ``` Refer to these notebooks for step-by-step guides on how to use the Computer-Use Agent (CUA): - [Agent Notebook](../../notebooks/agent_nb.ipynb) - Complete examples and workflows ## Using the Gradio UI The agent includes a Gradio-based user interface for easier interaction.
To use it: ```bash # Install with Gradio support pip install "cua-agent[ui]" ``` ### Create a simple launcher script ```python # launch_ui.py from agent.ui.gradio.app import create_gradio_ui app = create_gradio_ui() app.launch(share=False) ``` ### Setting up API Keys For the Gradio UI to show available models, you need to set API keys as environment variables: ```bash # For OpenAI models export OPENAI_API_KEY=your_openai_key_here # For Anthropic models export ANTHROPIC_API_KEY=your_anthropic_key_here # Launch with both keys set OPENAI_API_KEY=your_key ANTHROPIC_API_KEY=your_key python launch_ui.py ``` Without these environment variables, the UI will show "No models available" for the corresponding providers, but you can still use local models with the OMNI loop provider. ### Using Local Models You can use local models with the OMNI loop provider by selecting "Custom model..." from the dropdown. The default provider URL is set to `http://localhost:1234/v1` which works with LM Studio. If you're using a different local model server: - vLLM: `http://localhost:8000/v1` - LocalAI: `http://localhost:8080/v1` - Ollama with OpenAI compat API: `http://localhost:11434/v1` The Gradio UI provides: - Selection of different agent loops (OpenAI, Anthropic, OMNI) - Model selection for each provider - Configuration of agent parameters - Chat interface for interacting with the agent ### Using UI-TARS You can use UI-TARS by first following the [deployment guide](https://github.com/bytedance/UI-TARS/blob/main/README_deploy.md). This will give you a provider URL like this: `https://**************.us-east-1.aws.endpoints.huggingface.cloud/v1` which you can use in the gradio UI. 
## Agent Loops The `cua-agent` package provides three agent loops variations, based on different CUA models providers and techniques: | Agent Loop | Supported Models | Description | Set-Of-Marks | |:-----------|:-----------------|:------------|:-------------| | `AgentLoop.OPENAI` | • `computer_use_preview` | Use OpenAI Operator CUA model | Not Required | | `AgentLoop.ANTHROPIC` | • `claude-3-5-sonnet-20240620`
• `claude-3-7-sonnet-20250219` | Use Anthropic Computer-Use | Not Required | | `AgentLoop.UITARS` | • `ByteDance-Seed/UI-TARS-1.5-7B` | Uses ByteDance's UI-TARS 1.5 model | Not Required | | `AgentLoop.OMNI` | • `claude-3-5-sonnet-20240620`
• `claude-3-7-sonnet-20250219`
• `gpt-4.5-preview`
• `gpt-4o`
• `gpt-4`
• `phi4`
• `phi4-mini`
• `gemma3`
• `...`
• `Any Ollama or OpenAI-compatible model` | Use OmniParser for element pixel-detection (SoM) and any VLMs for UI Grounding and Reasoning | OmniParser | ## AgentResponse The `AgentResponse` class represents the structured output returned after each agent turn. It contains the agent's response, reasoning, tool usage, and other metadata. The response format aligns with the new [OpenAI Agent SDK specification](https://platform.openai.com/docs/api-reference/responses) for better consistency across different agent loops. ```python async for result in agent.run(task): print("Response ID: ", result.get("id")) # Print detailed usage information usage = result.get("usage") if usage: print("\nUsage Details:") print(f" Input Tokens: {usage.get('input_tokens')}") if "input_tokens_details" in usage: print(f" Input Tokens Details: {usage.get('input_tokens_details')}") print(f" Output Tokens: {usage.get('output_tokens')}") if "output_tokens_details" in usage: print(f" Output Tokens Details: {usage.get('output_tokens_details')}") print(f" Total Tokens: {usage.get('total_tokens')}") print("Response Text: ", result.get("text")) # Print tools information tools = result.get("tools") if tools: print("\nTools:") print(tools) # Print reasoning and tool call outputs outputs = result.get("output", []) for output in outputs: output_type = output.get("type") if output_type == "reasoning": print("\nReasoning Output:") print(output) elif output_type == "computer_call": print("\nTool Call Output:") print(output) ``` **Note on Settings Persistence:** * The Gradio UI automatically saves your configuration (Agent Loop, Model Choice, Custom Base URL, Save Trajectory state, Recent Images count) to a file named `.gradio_settings.json` in the project's root directory when you successfully run a task. * This allows your preferences to persist between sessions. * API keys entered into the custom provider field are **not** saved in this file for security reasons. 
Manage API keys using environment variables (e.g., `OPENAI_API_KEY`, `ANTHROPIC_API_KEY`) or a `.env` file. * It's recommended to add `.gradio_settings.json` to your `.gitignore` file. ## /libs/agent/agent/__init__.py ```py path="/libs/agent/agent/__init__.py" """CUA (Computer Use) Agent for AI-driven computer interaction.""" import sys import logging __version__ = "0.1.0" # Initialize logging logger = logging.getLogger("cua.agent") # Initialize telemetry when the package is imported try: # Import from core telemetry for basic functions from core.telemetry import ( is_telemetry_enabled, flush, record_event, ) # Import set_dimension from our own telemetry module from .core.telemetry import set_dimension # Check if telemetry is enabled if is_telemetry_enabled(): logger.info("Telemetry is enabled") # Record package initialization record_event( "module_init", { "module": "agent", "version": __version__, "python_version": sys.version, }, ) # Set the package version as a dimension set_dimension("agent_version", __version__) # Flush events to ensure they're sent flush() else: logger.info("Telemetry is disabled") except ImportError as e: # Telemetry not available logger.warning(f"Telemetry not available: {e}") except Exception as e: # Other issues with telemetry logger.warning(f"Error initializing telemetry: {e}") from .core.types import LLMProvider, LLM from .core.factory import AgentLoop from .core.agent import ComputerAgent __all__ = ["AgentLoop", "LLMProvider", "LLM", "ComputerAgent"] ``` ## /libs/agent/agent/core/__init__.py ```py path="/libs/agent/agent/core/__init__.py" """Core agent components.""" from .factory import BaseLoop from .messages import ( BaseMessageManager, ImageRetentionConfig, ) from .callbacks import ( CallbackManager, CallbackHandler, BaseCallbackManager, ContentCallback, ToolCallback, APICallback, ) __all__ = [ "BaseLoop", "CallbackManager", "CallbackHandler", "BaseMessageManager", "ImageRetentionConfig", "BaseCallbackManager", "ContentCallback", 
    "ToolCallback",
    "APICallback",
]
```

## /libs/agent/agent/core/agent.py

```py path="/libs/agent/agent/core/agent.py"
"""Main entry point for computer agents."""

import asyncio
import logging
import os
from typing import AsyncGenerator, Optional

from computer import Computer

from .types import LLM, AgentLoop
from .types import AgentResponse
from .factory import LoopFactory
from .provider_config import DEFAULT_MODELS, ENV_VARS

logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)


class ComputerAgent:
    """A computer agent that can perform automated tasks using natural language instructions."""

    def __init__(
        self,
        computer: Computer,
        model: LLM,
        loop: AgentLoop,
        max_retries: int = 3,
        screenshot_dir: Optional[str] = None,
        log_dir: Optional[str] = None,
        api_key: Optional[str] = None,
        save_trajectory: bool = True,
        trajectory_dir: str = "trajectories",
        only_n_most_recent_images: Optional[int] = None,
        verbosity: int = logging.INFO,
    ):
        """Initialize the ComputerAgent.

        Args:
            computer: Computer instance the agent will control.
            model: LLM object containing the provider and model name; if the name is
                empty, a provider default from DEFAULT_MODELS is used.
            loop: Which agent loop implementation to drive the session with
                (e.g. AgentLoop.OPENAI, AgentLoop.ANTHROPIC, AgentLoop.OMNI).
            max_retries: Maximum number of retry attempts.
            screenshot_dir: Directory to save screenshots.
            log_dir: Directory to save logs (set to None to disable logging to files).
            api_key: The API key for the provider. If not provided, will look for
                the provider's environment variable (see ENV_VARS).
            save_trajectory: Whether to save the trajectory.
            trajectory_dir: Directory to save the trajectory.
            only_n_most_recent_images: Maximum number of recent screenshots to include in API requests.
            verbosity: Logging level.

        Raises:
            ValueError: If no model name can be resolved for the provider, or if a
                required API key is missing, or if the loop factory rejects the config.
        """
        # Basic agent configuration
        self.max_retries = max_retries
        self.computer = computer
        self.queue = asyncio.Queue()
        self.screenshot_dir = screenshot_dir
        self.log_dir = log_dir
        self._retry_count = 0
        self._initialized = False
        self._in_context = False

        # Set logging level
        logger.setLevel(verbosity)

        # Setup logging
        if self.log_dir:
            os.makedirs(self.log_dir, exist_ok=True)
            logger.info(f"Created logs directory: {self.log_dir}")

        # Setup screenshots directory
        if self.screenshot_dir:
            os.makedirs(self.screenshot_dir, exist_ok=True)
            logger.info(f"Created screenshots directory: {self.screenshot_dir}")

        # Use the provided LLM object
        self.provider = model.provider
        actual_model_name = model.name or DEFAULT_MODELS.get(self.provider, "")
        self.provider_base_url = getattr(model, "provider_base_url", None)

        # Ensure we have a valid model name
        if not actual_model_name:
            actual_model_name = DEFAULT_MODELS.get(self.provider, "")
            if not actual_model_name:
                raise ValueError(
                    f"No model specified for provider {self.provider} and no default found"
                )

        # Get API key from environment if not provided
        actual_api_key = api_key or os.environ.get(ENV_VARS[self.provider], "")

        # Ollama and OpenAI-compatible APIs typically don't require an API key
        if (
            not actual_api_key
            and str(self.provider) not in ["ollama", "oaicompat"]
            and ENV_VARS[self.provider] != "none"
        ):
            raise ValueError(f"No API key provided for {self.provider}")

        # Create the appropriate loop using the factory
        try:
            # Let the factory create the appropriate loop with needed components
            self._loop = LoopFactory.create_loop(
                loop_type=loop,
                provider=self.provider,
                computer=self.computer,
                model_name=actual_model_name,
                api_key=actual_api_key,
                save_trajectory=save_trajectory,
                trajectory_dir=trajectory_dir,
                only_n_most_recent_images=only_n_most_recent_images,
                provider_base_url=self.provider_base_url,
            )
        except ValueError as e:
            logger.error(f"Failed to create loop: {str(e)}")
            raise

        # Initialize the message manager from the loop
        self.message_manager =
self._loop.message_manager logger.info( f"ComputerAgent initialized with provider: {self.provider}, model: {actual_model_name}" ) async def __aenter__(self): """Initialize the agent when used as a context manager.""" logger.info("Entering ComputerAgent context") self._in_context = True # In case the computer wasn't initialized try: # Initialize the computer only if not already initialized logger.info("Checking if computer is already initialized...") if not self.computer._initialized: logger.info("Initializing computer in __aenter__...") # Use the computer's __aenter__ directly instead of calling run() await self.computer.__aenter__() logger.info("Computer initialized in __aenter__") else: logger.info("Computer already initialized, skipping initialization") except Exception as e: logger.error(f"Error initializing computer in __aenter__: {str(e)}") raise await self.initialize() return self async def __aexit__(self, exc_type, exc_val, exc_tb): """Cleanup agent resources if needed.""" logger.info("Cleaning up agent resources") self._in_context = False # Do any necessary cleanup # We're not shutting down the computer here as it might be shared # Just log that we're exiting if exc_type: logger.error(f"Exiting agent context with error: {exc_type.__name__}: {exc_val}") else: logger.info("Exiting agent context normally") # If we have a queue, make sure to signal it's done if hasattr(self, "queue") and self.queue: await self.queue.put(None) # Signal that we're done async def initialize(self) -> None: """Initialize the agent and its components.""" if not self._initialized: # Always initialize the computer if available if self.computer and not self.computer._initialized: await self.computer.run() self._initialized = True async def run(self, task: str) -> AsyncGenerator[AgentResponse, None]: """Run a task using the computer agent. 
Args: task: Task description Yields: Agent response format """ try: logger.info(f"Running task: {task}") logger.info( f"Message history before task has {len(self.message_manager.messages)} messages" ) # Initialize the computer if needed if not self._initialized: await self.initialize() # Add task as a user message using the message manager self.message_manager.add_user_message([{"type": "text", "text": task}]) logger.info( f"Added task message. Message history now has {len(self.message_manager.messages)} messages" ) # Pass properly formatted messages to the loop if self._loop is None: logger.error("Loop not initialized properly") yield {"error": "Loop not initialized properly"} return # Execute the task and yield results async for result in self._loop.run(self.message_manager.messages): yield result except Exception as e: logger.error(f"Error in agent run method: {str(e)}") yield { "role": "assistant", "content": f"Error: {str(e)}", "metadata": {"title": "❌ Error"}, } ``` ## /libs/agent/agent/core/base.py ```py path="/libs/agent/agent/core/base.py" """Base loop definitions.""" import logging import asyncio from abc import ABC, abstractmethod from typing import Any, AsyncGenerator, Dict, List, Optional from agent.providers.omni.parser import ParseResult from computer import Computer from .messages import StandardMessageManager, ImageRetentionConfig from .types import AgentResponse from .experiment import ExperimentManager from .callbacks import CallbackManager, CallbackHandler logger = logging.getLogger(__name__) class BaseLoop(ABC): """Base class for agent loops that handle message processing and tool execution.""" def __init__( self, computer: Computer, model: str, api_key: str, max_tokens: int = 4096, max_retries: int = 3, retry_delay: float = 1.0, base_dir: Optional[str] = "trajectories", save_trajectory: bool = True, only_n_most_recent_images: Optional[int] = 2, callback_handlers: Optional[List[CallbackHandler]] = None, **kwargs, ): """Initialize base agent 
loop. Args: computer: Computer instance to control model: Model name to use api_key: API key for provider max_tokens: Maximum tokens to generate max_retries: Maximum number of retries retry_delay: Delay between retries in seconds base_dir: Base directory for saving experiment data save_trajectory: Whether to save trajectory data only_n_most_recent_images: Maximum number of recent screenshots to include in API requests **kwargs: Additional provider-specific arguments """ self.computer = computer self.model = model self.api_key = api_key self.max_tokens = max_tokens self.max_retries = max_retries self.retry_delay = retry_delay self.base_dir = base_dir self.save_trajectory = save_trajectory self.only_n_most_recent_images = only_n_most_recent_images self._kwargs = kwargs # Initialize message manager self.message_manager = StandardMessageManager( config=ImageRetentionConfig(num_images_to_keep=only_n_most_recent_images) ) # Initialize experiment manager if self.save_trajectory and self.base_dir: self.experiment_manager = ExperimentManager( base_dir=self.base_dir, only_n_most_recent_images=only_n_most_recent_images, ) # Track directories for convenience self.run_dir = self.experiment_manager.run_dir self.current_turn_dir = self.experiment_manager.current_turn_dir else: self.experiment_manager = None self.run_dir = None self.current_turn_dir = None # Initialize basic tracking self.turn_count = 0 # Initialize callback manager self.callback_manager = CallbackManager(handlers=callback_handlers or []) async def initialize(self) -> None: """Initialize both the API client and computer interface with retries.""" for attempt in range(self.max_retries): try: logger.info( f"Starting initialization (attempt {attempt + 1}/{self.max_retries})..." 
) # Initialize API client await self.initialize_client() logger.info("Initialization complete.") return except Exception as e: if attempt < self.max_retries - 1: logger.warning( f"Initialization failed (attempt {attempt + 1}/{self.max_retries}): {str(e)}. Retrying..." ) await asyncio.sleep(self.retry_delay) else: logger.error( f"Initialization failed after {self.max_retries} attempts: {str(e)}" ) raise RuntimeError(f"Failed to initialize: {str(e)}") ########################################### # ABSTRACT METHODS TO BE IMPLEMENTED BY SUBCLASSES ########################################### @abstractmethod async def initialize_client(self) -> None: """Initialize the API client and any provider-specific components. This method must be implemented by subclasses to set up provider-specific clients and tools. """ raise NotImplementedError @abstractmethod def run(self, messages: List[Dict[str, Any]]) -> AsyncGenerator[AgentResponse, None]: """Run the agent loop with provided messages. Args: messages: List of message objects Returns: An async generator that yields agent responses """ raise NotImplementedError ########################################### # EXPERIMENT AND TRAJECTORY MANAGEMENT ########################################### def _setup_experiment_dirs(self) -> None: """Setup the experiment directory structure.""" if self.experiment_manager: # Use the experiment manager to set up directories self.experiment_manager.setup_experiment_dirs() # Update local tracking variables self.run_dir = self.experiment_manager.run_dir self.current_turn_dir = self.experiment_manager.current_turn_dir def _create_turn_dir(self) -> None: """Create a new directory for the current turn.""" if self.experiment_manager: # Use the experiment manager to create the turn directory self.experiment_manager.create_turn_dir() # Update local tracking variables self.current_turn_dir = self.experiment_manager.current_turn_dir self.turn_count = self.experiment_manager.turn_count def _log_api_call( self, 
call_type: str, request: Any, response: Any = None, error: Optional[Exception] = None ) -> None: """Log API call details to file. Preserves provider-specific formats for requests and responses to ensure accurate logging for debugging and analysis purposes. Args: call_type: Type of API call (e.g., 'request', 'response', 'error') request: The API request data in provider-specific format response: Optional API response data in provider-specific format error: Optional error information """ if self.experiment_manager: # Use the experiment manager to log the API call provider = getattr(self, "provider", "unknown") provider_str = str(provider) if provider else "unknown" self.experiment_manager.log_api_call( call_type=call_type, request=request, provider=provider_str, model=self.model, response=response, error=error, ) def _save_screenshot(self, img_base64: str, action_type: str = "") -> None: """Save a screenshot to the experiment directory. Args: img_base64: Base64 encoded screenshot action_type: Type of action that triggered the screenshot """ if self.experiment_manager: self.experiment_manager.save_screenshot(img_base64, action_type) ########################################### # EVENT HOOKS / CALLBACKS ########################################### async def handle_screenshot(self, screenshot_base64: str, action_type: str = "", parsed_screen: Optional[ParseResult] = None) -> None: """Process a screenshot through callback managers Args: screenshot_base64: Base64 encoded screenshot action_type: Type of action that triggered the screenshot """ if hasattr(self, 'callback_manager'): await self.callback_manager.on_screenshot(screenshot_base64, action_type, parsed_screen) ``` ## /libs/agent/agent/core/callbacks.py ```py path="/libs/agent/agent/core/callbacks.py" """Callback handlers for agent.""" import json import logging from abc import ABC, abstractmethod from datetime import datetime from typing import Any, Dict, List, Optional, Protocol from agent.providers.omni.parser 
import ParseResult logger = logging.getLogger(__name__) class ContentCallback(Protocol): """Protocol for content callbacks.""" def __call__(self, content: Dict[str, Any]) -> None: ... class ToolCallback(Protocol): """Protocol for tool callbacks.""" def __call__(self, result: Any, tool_id: str) -> None: ... class APICallback(Protocol): """Protocol for API callbacks.""" def __call__(self, request: Any, response: Any, error: Optional[Exception] = None) -> None: ... class ScreenshotCallback(Protocol): """Protocol for screenshot callbacks.""" def __call__(self, screenshot_base64: str, action_type: str = "") -> Optional[str]: ... class BaseCallbackManager(ABC): """Base class for callback managers.""" def __init__( self, content_callback: ContentCallback, tool_callback: ToolCallback, api_callback: APICallback, ): """Initialize the callback manager. Args: content_callback: Callback for content updates tool_callback: Callback for tool execution results api_callback: Callback for API interactions """ self.content_callback = content_callback self.tool_callback = tool_callback self.api_callback = api_callback @abstractmethod def on_content(self, content: Any) -> None: """Handle content updates.""" raise NotImplementedError @abstractmethod def on_tool_result(self, result: Any, tool_id: str) -> None: """Handle tool execution results.""" raise NotImplementedError @abstractmethod def on_api_interaction( self, request: Any, response: Any, error: Optional[Exception] = None ) -> None: """Handle API interactions.""" raise NotImplementedError class CallbackManager: """Manager for callback handlers.""" def __init__(self, handlers: Optional[List["CallbackHandler"]] = None): """Initialize with optional handlers. Args: handlers: List of callback handlers """ self.handlers = handlers or [] def add_handler(self, handler: "CallbackHandler") -> None: """Add a callback handler. 
Args: handler: Callback handler to add """ self.handlers.append(handler) async def on_action_start(self, action: str, **kwargs) -> None: """Called when an action starts. Args: action: Action name **kwargs: Additional data """ for handler in self.handlers: await handler.on_action_start(action, **kwargs) async def on_action_end(self, action: str, success: bool, **kwargs) -> None: """Called when an action ends. Args: action: Action name success: Whether the action was successful **kwargs: Additional data """ for handler in self.handlers: await handler.on_action_end(action, success, **kwargs) async def on_error(self, error: Exception, **kwargs) -> None: """Called when an error occurs. Args: error: Exception that occurred **kwargs: Additional data """ for handler in self.handlers: await handler.on_error(error, **kwargs) async def on_screenshot(self, screenshot_base64: str, action_type: str = "", parsed_screen: Optional[ParseResult] = None) -> None: """Called when a screenshot is taken. Args: screenshot_base64: Base64 encoded screenshot action_type: Type of action that triggered the screenshot parsed_screen: Optional output from parsing the screenshot Returns: Modified screenshot or original if no modifications """ for handler in self.handlers: await handler.on_screenshot(screenshot_base64, action_type, parsed_screen) class CallbackHandler(ABC): """Base class for callback handlers.""" @abstractmethod async def on_action_start(self, action: str, **kwargs) -> None: """Called when an action starts. Args: action: Action name **kwargs: Additional data """ pass @abstractmethod async def on_action_end(self, action: str, success: bool, **kwargs) -> None: """Called when an action ends. Args: action: Action name success: Whether the action was successful **kwargs: Additional data """ pass @abstractmethod async def on_error(self, error: Exception, **kwargs) -> None: """Called when an error occurs. 
Args: error: Exception that occurred **kwargs: Additional data """ pass @abstractmethod async def on_screenshot(self, screenshot_base64: str, action_type: str = "", parsed_screen: Optional[ParseResult] = None) -> None: """Called when a screenshot is taken. Args: screenshot_base64: Base64 encoded screenshot action_type: Type of action that triggered the screenshot Returns: Optional modified screenshot """ pass class DefaultCallbackHandler(CallbackHandler): """Default implementation of CallbackHandler with no-op methods. This class implements all abstract methods from CallbackHandler, allowing subclasses to override only the methods they need. """ async def on_action_start(self, action: str, **kwargs) -> None: """Default no-op implementation.""" pass async def on_action_end(self, action: str, success: bool, **kwargs) -> None: """Default no-op implementation.""" pass async def on_error(self, error: Exception, **kwargs) -> None: """Default no-op implementation.""" pass async def on_screenshot(self, screenshot_base64: str, action_type: str = "") -> None: """Default no-op implementation.""" pass ``` ## /libs/agent/agent/core/experiment.py ```py path="/libs/agent/agent/core/experiment.py" """Core experiment management for agents.""" import os import logging import base64 from io import BytesIO from datetime import datetime from typing import Any, Dict, List, Optional from PIL import Image import json import re logger = logging.getLogger(__name__) class ExperimentManager: """Manages experiment directories and logging for the agent.""" def __init__( self, base_dir: Optional[str] = None, only_n_most_recent_images: Optional[int] = None, ): """Initialize the experiment manager. 
Args: base_dir: Base directory for saving experiment data only_n_most_recent_images: Maximum number of recent screenshots to include in API requests """ self.base_dir = base_dir self.only_n_most_recent_images = only_n_most_recent_images self.run_dir = None self.current_turn_dir = None self.turn_count = 0 self.screenshot_count = 0 # Track all screenshots for potential API request inclusion self.screenshot_paths = [] # Set up experiment directories if base_dir is provided if self.base_dir: self.setup_experiment_dirs() def setup_experiment_dirs(self) -> None: """Setup the experiment directory structure.""" if not self.base_dir: return # Create base experiments directory if it doesn't exist os.makedirs(self.base_dir, exist_ok=True) # Create timestamped run directory timestamp = datetime.now().strftime("%Y%m%d_%H%M%S") self.run_dir = os.path.join(self.base_dir, timestamp) os.makedirs(self.run_dir, exist_ok=True) logger.info(f"Created run directory: {self.run_dir}") # Create first turn directory self.create_turn_dir() def create_turn_dir(self) -> None: """Create a new directory for the current turn.""" if not self.run_dir: logger.warning("Cannot create turn directory: run_dir not set") return # Increment turn counter self.turn_count += 1 # Create turn directory with padded number turn_name = f"turn_{self.turn_count:03d}" self.current_turn_dir = os.path.join(self.run_dir, turn_name) os.makedirs(self.current_turn_dir, exist_ok=True) logger.info(f"Created turn directory: {self.current_turn_dir}") def sanitize_log_data(self, data: Any) -> Any: """Sanitize log data by replacing large binary data with placeholders. 
Args: data: Data to sanitize Returns: Sanitized copy of the data """ if isinstance(data, dict): result = {} for k, v in data.items(): # Special handling for 'data' field in Anthropic message source if k == "data" and isinstance(v, str) and len(v) > 1000: result[k] = f"[BASE64_DATA_LENGTH_{len(v)}]" # Special handling for the 'media_type' key which indicates we're in an image block elif k == "media_type" and "image" in str(v): result[k] = v # If we're in an image block, look for a sibling 'data' field with base64 content if ( "data" in result and isinstance(result["data"], str) and len(result["data"]) > 1000 ): result["data"] = f"[BASE64_DATA_LENGTH_{len(result['data'])}]" else: result[k] = self.sanitize_log_data(v) return result elif isinstance(data, list): return [self.sanitize_log_data(item) for item in data] elif isinstance(data, str) and len(data) > 1000 and "base64" in data.lower(): return f"[BASE64_DATA_LENGTH_{len(data)}]" else: return data def save_screenshot(self, img_base64: str, action_type: str = "") -> Optional[str]: """Save a screenshot to the experiment directory. 
Args: img_base64: Base64 encoded screenshot action_type: Type of action that triggered the screenshot Returns: Path to the saved screenshot or None if there was an error """ if not self.current_turn_dir: return None try: # Increment screenshot counter self.screenshot_count += 1 # Sanitize action_type to ensure valid filename # Replace characters that are not safe for filenames sanitized_action = "" if action_type: # Replace invalid filename characters with underscores sanitized_action = re.sub(r'[\\/*?:"<>|]', "_", action_type) # Limit the length to avoid excessively long filenames sanitized_action = sanitized_action[:50] # Create a descriptive filename timestamp = int(datetime.now().timestamp() * 1000) action_suffix = f"_{sanitized_action}" if sanitized_action else "" filename = f"screenshot_{self.screenshot_count:03d}{action_suffix}_{timestamp}.png" # Save directly to the turn directory filepath = os.path.join(self.current_turn_dir, filename) # Save the screenshot img_data = base64.b64decode(img_base64) with open(filepath, "wb") as f: f.write(img_data) # Keep track of the file path self.screenshot_paths.append(filepath) return filepath except Exception as e: logger.error(f"Error saving screenshot: {str(e)}") return None def save_action_visualization( self, img: Image.Image, action_name: str, details: str = "" ) -> str: """Save a visualization of an action. 
Args: img: Image to save action_name: Name of the action details: Additional details about the action Returns: Path to the saved image """ if not self.current_turn_dir: return "" try: # Create a descriptive filename timestamp = int(datetime.now().timestamp() * 1000) details_suffix = f"_{details}" if details else "" filename = f"vis_{action_name}{details_suffix}_{timestamp}.png" # Save directly to the turn directory filepath = os.path.join(self.current_turn_dir, filename) # Save the image img.save(filepath) # Keep track of the file path self.screenshot_paths.append(filepath) return filepath except Exception as e: logger.error(f"Error saving action visualization: {str(e)}") return "" def log_api_call( self, call_type: str, request: Any, provider: str = "unknown", model: str = "unknown", response: Any = None, error: Optional[Exception] = None, ) -> None: """Log API call details to file. Args: call_type: Type of API call (request, response, error) request: Request data provider: API provider name model: Model name response: Response data (for response logs) error: Error information (for error logs) """ if not self.current_turn_dir: logger.warning("Cannot log API call: current_turn_dir not set") return try: # Create a timestamp for the log file timestamp = datetime.now().strftime("%Y%m%d_%H%M%S") # Create filename based on log type filename = f"api_call_{timestamp}_{call_type}.json" filepath = os.path.join(self.current_turn_dir, filename) # Sanitize data before logging sanitized_request = self.sanitize_log_data(request) sanitized_response = self.sanitize_log_data(response) if response is not None else None # Prepare log data log_data = { "timestamp": timestamp, "provider": provider, "model": model, "type": call_type, "request": sanitized_request, } if sanitized_response is not None: log_data["response"] = sanitized_response if error is not None: log_data["error"] = str(error) # Write to file with open(filepath, "w") as f: json.dump(log_data, f, indent=2, default=str) 
logger.info(f"Logged API {call_type} to {filepath}") except Exception as e: logger.error(f"Error logging API call: {str(e)}") ``` ## /libs/agent/agent/core/factory.py ```py path="/libs/agent/agent/core/factory.py" """Base agent loop implementation.""" import logging import importlib.util from typing import Dict, Optional, Type, TYPE_CHECKING, Any, cast, Callable, Awaitable from computer import Computer from .types import AgentLoop from .base import BaseLoop logger = logging.getLogger(__name__) class LoopFactory: """Factory class for creating agent loops.""" # Registry to store loop implementations _loop_registry: Dict[AgentLoop, Type[BaseLoop]] = {} @classmethod def create_loop( cls, loop_type: AgentLoop, api_key: str, model_name: str, computer: Computer, provider: Any = None, save_trajectory: bool = True, trajectory_dir: str = "trajectories", only_n_most_recent_images: Optional[int] = None, acknowledge_safety_check_callback: Optional[Callable[[str], Awaitable[bool]]] = None, provider_base_url: Optional[str] = None, ) -> BaseLoop: """Create and return an appropriate loop instance based on type.""" if loop_type == AgentLoop.ANTHROPIC: # Lazy import AnthropicLoop only when needed try: from ..providers.anthropic.loop import AnthropicLoop except ImportError: raise ImportError( "The 'anthropic' provider is not installed. " "Install it with 'pip install cua-agent[anthropic]'" ) return AnthropicLoop( api_key=api_key, model=model_name, computer=computer, save_trajectory=save_trajectory, base_dir=trajectory_dir, only_n_most_recent_images=only_n_most_recent_images, ) elif loop_type == AgentLoop.OPENAI: # Lazy import OpenAILoop only when needed try: from ..providers.openai.loop import OpenAILoop except ImportError: raise ImportError( "The 'openai' provider is not installed. 
" "Install it with 'pip install cua-agent[openai]'" ) return OpenAILoop( api_key=api_key, model=model_name, computer=computer, save_trajectory=save_trajectory, base_dir=trajectory_dir, only_n_most_recent_images=only_n_most_recent_images, acknowledge_safety_check_callback=acknowledge_safety_check_callback, ) elif loop_type == AgentLoop.OMNI: # Lazy import OmniLoop and related classes only when needed try: from ..providers.omni.loop import OmniLoop from ..providers.omni.parser import OmniParser from .types import LLMProvider except ImportError: raise ImportError( "The 'omni' provider is not installed. " "Install it with 'pip install cua-agent[all]'" ) if provider is None: raise ValueError("Provider is required for OMNI loop type") # We know provider is the correct type at this point, so cast it provider_instance = cast(LLMProvider, provider) return OmniLoop( provider=provider_instance, api_key=api_key, model=model_name, computer=computer, save_trajectory=save_trajectory, base_dir=trajectory_dir, only_n_most_recent_images=only_n_most_recent_images, parser=OmniParser(), provider_base_url=provider_base_url, ) elif loop_type == AgentLoop.UITARS: # Lazy import UITARSLoop only when needed try: from ..providers.uitars.loop import UITARSLoop except ImportError: raise ImportError( "The 'uitars' provider is not installed. 
" "Install it with 'pip install cua-agent[all]'" ) return UITARSLoop( api_key=api_key, model=model_name, computer=computer, save_trajectory=save_trajectory, base_dir=trajectory_dir, only_n_most_recent_images=only_n_most_recent_images, provider_base_url=provider_base_url, ) else: raise ValueError(f"Unsupported loop type: {loop_type}") ``` ## /libs/agent/agent/core/messages.py ```py path="/libs/agent/agent/core/messages.py" """Message handling utilities for agent.""" import logging import json from typing import Any, Dict, List, Optional, Union, Tuple from dataclasses import dataclass import re from ..providers.omni.parser import ParseResult logger = logging.getLogger(__name__) @dataclass class ImageRetentionConfig: """Configuration for image retention in messages.""" num_images_to_keep: Optional[int] = None min_removal_threshold: int = 1 enable_caching: bool = True def should_retain_images(self) -> bool: """Check if image retention is enabled.""" return self.num_images_to_keep is not None and self.num_images_to_keep > 0 class BaseMessageManager: """Base class for message preparation and management.""" def __init__(self, image_retention_config: Optional[ImageRetentionConfig] = None): """Initialize the message manager. Args: image_retention_config: Configuration for image retention """ self.image_retention_config = image_retention_config or ImageRetentionConfig() if self.image_retention_config.min_removal_threshold < 1: raise ValueError("min_removal_threshold must be at least 1") # Track provider for message formatting self.provider = "openai" # Default provider def set_provider(self, provider: str) -> None: """Set the current provider to format messages for. Args: provider: Provider name (e.g., 'openai', 'anthropic') """ self.provider = provider.lower() def prepare_messages(self, messages: List[Dict[str, Any]]) -> List[Dict[str, Any]]: """Prepare messages by applying image retention and caching as configured. 
Args: messages: List of messages to prepare Returns: Prepared messages """ if self.image_retention_config.should_retain_images(): self._filter_images(messages) if self.image_retention_config.enable_caching: self._inject_caching(messages) return messages def _filter_images(self, messages: List[Dict[str, Any]]) -> None: """Filter messages to retain only the specified number of most recent images. Args: messages: Messages to filter """ # Find all tool result blocks that contain images tool_results = [ item for message in messages for item in (message["content"] if isinstance(message["content"], list) else []) if isinstance(item, dict) and item.get("type") == "tool_result" ] # Count total images total_images = sum( 1 for result in tool_results for content in result.get("content", []) if isinstance(content, dict) and content.get("type") == "image" ) # Calculate how many images to remove images_to_remove = total_images - (self.image_retention_config.num_images_to_keep or 0) images_to_remove -= images_to_remove % self.image_retention_config.min_removal_threshold # Remove oldest images first for result in tool_results: if isinstance(result.get("content"), list): new_content = [] for content in result["content"]: if isinstance(content, dict) and content.get("type") == "image": if images_to_remove > 0: images_to_remove -= 1 continue new_content.append(content) result["content"] = new_content def _inject_caching(self, messages: List[Dict[str, Any]]) -> None: """Inject caching control for recent message turns. 
Args: messages: Messages to inject caching into """ # Only apply cache_control for Anthropic API, not OpenAI if self.provider != "anthropic": return # Default to caching last 3 turns turns_to_cache = 3 for message in reversed(messages): if message["role"] == "user" and isinstance(content := message["content"], list): if turns_to_cache: turns_to_cache -= 1 content[-1]["cache_control"] = {"type": "ephemeral"} else: content[-1].pop("cache_control", None) break class StandardMessageManager: """Manages messages in a standardized OpenAI format across different providers.""" def __init__(self, config: Optional[ImageRetentionConfig] = None): """Initialize message manager. Args: config: Configuration for image retention """ self.messages: List[Dict[str, Any]] = [] self.config = config or ImageRetentionConfig() def add_user_message(self, content: Union[str, List[Dict[str, Any]]]) -> None: """Add a user message. Args: content: Message content (text or multimodal content) """ self.messages.append({"role": "user", "content": content}) def add_assistant_message(self, content: Union[str, List[Dict[str, Any]]]) -> None: """Add an assistant message. Args: content: Message content (text or multimodal content) """ self.messages.append({"role": "assistant", "content": content}) def add_system_message(self, content: str) -> None: """Add a system message. Args: content: System message content """ self.messages.append({"role": "system", "content": content}) def get_messages(self) -> List[Dict[str, Any]]: """Get all messages in standard format. Returns: List of messages """ # If image retention is configured, apply it if self.config.num_images_to_keep is not None: return self._apply_image_retention(self.messages) return self.messages def _apply_image_retention(self, messages: List[Dict[str, Any]]) -> List[Dict[str, Any]]: """Apply image retention policy to messages. 
Args: messages: List of messages Returns: List of messages with image retention applied """ if not self.config.num_images_to_keep: return messages # Find user messages with images image_messages = [] for msg in messages: if msg["role"] == "user" and isinstance(msg["content"], list): has_image = any( item.get("type") == "image_url" or item.get("type") == "image" for item in msg["content"] ) if has_image: image_messages.append(msg) # If we don't have more images than the limit, return all messages if len(image_messages) <= self.config.num_images_to_keep: return messages # Get the most recent N images to keep images_to_keep = image_messages[-self.config.num_images_to_keep :] images_to_remove = image_messages[: -self.config.num_images_to_keep] # Create a new message list without the older images result = [] for msg in messages: if msg in images_to_remove: # Skip this message continue result.append(msg) return result def to_anthropic_format( self, messages: List[Dict[str, Any]] ) -> Tuple[List[Dict[str, Any]], str]: """Convert standard OpenAI format messages to Anthropic format. 
        Args:
            messages: List of messages in OpenAI format

        Returns:
            Tuple containing (anthropic_messages, system_content)
        """
        result = []
        system_content = ""

        # Process messages in order to maintain conversation flow
        previous_assistant_tool_use_ids = (
            set()
        )  # Track tool_use_ids in the previous assistant message

        for i, msg in enumerate(messages):
            role = msg.get("role", "")
            content = msg.get("content", "")

            if role == "system":
                # Collect system messages for later use (Anthropic takes the
                # system prompt as a separate parameter, not as a message).
                system_content += content + "\n"
                continue

            if role == "assistant":
                # Track tool_use_ids in this assistant message for the next user message
                previous_assistant_tool_use_ids = set()
                if isinstance(content, list):
                    for item in content:
                        if (
                            isinstance(item, dict)
                            and item.get("type") == "tool_use"
                            and "id" in item
                        ):
                            previous_assistant_tool_use_ids.add(item["id"])
                logger.info(
                    f"Tool use IDs in assistant message #{i}: {previous_assistant_tool_use_ids}"
                )

            if role in ["user", "assistant"]:
                anthropic_msg = {"role": role}

                # Convert content based on type
                if isinstance(content, str):
                    # Simple text content
                    anthropic_msg["content"] = [{"type": "text", "text": content}]
                elif isinstance(content, list):
                    # Convert complex content
                    anthropic_content = []
                    for item in content:
                        item_type = item.get("type", "")

                        if item_type == "text":
                            anthropic_content.append({"type": "text", "text": item.get("text", "")})
                        elif item_type == "image_url":
                            # Convert OpenAI image format to Anthropic
                            image_url = item.get("image_url", {}).get("url", "")
                            if image_url.startswith("data:"):
                                # Extract base64 data and media type
                                match = re.match(r"data:(.+);base64,(.+)", image_url)
                                if match:
                                    media_type, data = match.groups()
                                    anthropic_content.append(
                                        {
                                            "type": "image",
                                            "source": {
                                                "type": "base64",
                                                "media_type": media_type,
                                                "data": data,
                                            },
                                        }
                                    )
                                # NOTE(review): a data: URL that does not match the
                                # regex is silently dropped — confirm intended.
                            else:
                                # Regular URL
                                anthropic_content.append(
                                    {
                                        "type": "image",
                                        "source": {
                                            "type": "url",
                                            "url": image_url,
                                        },
                                    }
                                )
                        elif item_type == "tool_use":
                            # Always include tool_use blocks
                            anthropic_content.append(item)
                        elif item_type == "tool_result":
                            # Check if this is a user message AND if the tool_use_id exists in the previous assistant message
                            tool_use_id = item.get("tool_use_id")

                            # Only include tool_result if it references a tool_use from the immediately preceding assistant message
                            if (
                                role == "user"
                                and tool_use_id
                                and tool_use_id in previous_assistant_tool_use_ids
                            ):
                                anthropic_content.append(item)
                                logger.info(
                                    f"Including tool_result with tool_use_id: {tool_use_id}"
                                )
                            else:
                                # Convert to text to preserve information
                                # (an orphaned tool_result would be rejected by
                                # the Anthropic API).
                                logger.warning(
                                    f"Converting tool_result to text. Tool use ID {tool_use_id} not found in previous assistant message"
                                )
                                content_text = "Tool Result: "
                                if "content" in item:
                                    if isinstance(item["content"], list):
                                        for content_item in item["content"]:
                                            if (
                                                isinstance(content_item, dict)
                                                and content_item.get("type") == "text"
                                            ):
                                                content_text += content_item.get("text", "")
                                    elif isinstance(item["content"], str):
                                        content_text += item["content"]
                                anthropic_content.append({"type": "text", "text": content_text})

                    anthropic_msg["content"] = anthropic_content

                result.append(anthropic_msg)

        return result, system_content

    def from_anthropic_format(self, messages: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
        """Convert Anthropic format messages to standard OpenAI format.
        Args:
            messages: List of messages in Anthropic format

        Returns:
            List of messages in OpenAI format
        """
        result = []

        for msg in messages:
            role = msg.get("role", "")
            # NOTE(review): assumes Anthropic content is always a list of
            # blocks — confirm no callers pass plain-string content.
            content = msg.get("content", [])

            if role in ["user", "assistant"]:
                openai_msg = {"role": role}

                # Simple case: single text block
                if len(content) == 1 and content[0].get("type") == "text":
                    openai_msg["content"] = content[0].get("text", "")
                else:
                    # Complex case: multiple blocks or non-text
                    openai_content = []
                    for item in content:
                        item_type = item.get("type", "")

                        if item_type == "text":
                            openai_content.append({"type": "text", "text": item.get("text", "")})
                        elif item_type == "image":
                            # Convert Anthropic image to OpenAI format
                            source = item.get("source", {})
                            if source.get("type") == "base64":
                                media_type = source.get("media_type", "image/png")
                                data = source.get("data", "")
                                openai_content.append(
                                    {
                                        "type": "image_url",
                                        "image_url": {"url": f"data:{media_type};base64,{data}"},
                                    }
                                )
                            else:
                                # URL
                                openai_content.append(
                                    {
                                        "type": "image_url",
                                        "image_url": {"url": source.get("url", "")},
                                    }
                                )
                        elif item_type in ["tool_use", "tool_result"]:
                            # Pass through tool-related content
                            openai_content.append(item)

                    openai_msg["content"] = openai_content

                result.append(openai_msg)

        return result
```

## /libs/agent/agent/core/provider_config.py

```py path="/libs/agent/agent/core/provider_config.py"
"""Provider-specific configurations and constants."""

from .types import LLMProvider

# Default models for different providers
DEFAULT_MODELS = {
    LLMProvider.OPENAI: "gpt-4o",
    LLMProvider.ANTHROPIC: "claude-3-7-sonnet-20250219",
    LLMProvider.OLLAMA: "gemma3:4b-it-q4_K_M",
    LLMProvider.OAICOMPAT: "Qwen2.5-VL-7B-Instruct",
}

# Map providers to their environment variable names
ENV_VARS = {
    LLMProvider.OPENAI: "OPENAI_API_KEY",
    LLMProvider.ANTHROPIC: "ANTHROPIC_API_KEY",
    LLMProvider.OLLAMA: "none",
    LLMProvider.OAICOMPAT: "none",  # OpenAI-compatible API typically doesn't require an API key
}
```

## /libs/agent/agent/core/telemetry.py

```py
path="/libs/agent/agent/core/telemetry.py"
"""Agent telemetry for tracking anonymous usage and feature usage."""

import logging
import os
import platform
import sys
from typing import Dict, Any, Callable

# Import the core telemetry module
TELEMETRY_AVAILABLE = False


# Local fallbacks in case core telemetry isn't available
def _noop(*args: Any, **kwargs: Any) -> None:
    """No-op function for when telemetry is not available."""
    pass


# Define default functions with unique names to avoid shadowing
_default_record_event = _noop
_default_increment_counter = _noop
_default_set_dimension = _noop
_default_get_telemetry_client = lambda: None
_default_flush = _noop
_default_is_telemetry_enabled = lambda: False
_default_is_telemetry_globally_disabled = lambda: True

# Set the actual functions to the defaults initially
record_event = _default_record_event
increment_counter = _default_increment_counter
set_dimension = _default_set_dimension
get_telemetry_client = _default_get_telemetry_client
flush = _default_flush
is_telemetry_enabled = _default_is_telemetry_enabled
is_telemetry_globally_disabled = _default_is_telemetry_globally_disabled

logger = logging.getLogger("cua.agent.telemetry")

try:
    # Import from core telemetry
    from core.telemetry import (
        record_event as core_record_event,
        increment as core_increment,
        get_telemetry_client as core_get_telemetry_client,
        flush as core_flush,
        is_telemetry_enabled as core_is_telemetry_enabled,
        is_telemetry_globally_disabled as core_is_telemetry_globally_disabled,
    )

    # Override the default functions with actual implementations
    record_event = core_record_event
    get_telemetry_client = core_get_telemetry_client
    flush = core_flush
    is_telemetry_enabled = core_is_telemetry_enabled
    is_telemetry_globally_disabled = core_is_telemetry_globally_disabled

    def increment_counter(counter_name: str, value: int = 1) -> None:
        """Wrapper for increment to maintain backward compatibility."""
        if is_telemetry_enabled():
            core_increment(counter_name, value)

    def set_dimension(name: str, value: Any) -> None:
        """Set a dimension that will be attached to all events."""
        # NOTE(review): this only logs; nothing is forwarded to the telemetry
        # backend here — confirm that is intended.
        logger.debug(f"Setting dimension {name}={value}")

    TELEMETRY_AVAILABLE = True
    logger.info("Successfully imported telemetry")
except ImportError as e:
    logger.warning(f"Could not import telemetry: {e}")
    logger.debug("Telemetry not available, using no-op functions")

# Get system info once to use in telemetry
SYSTEM_INFO = {
    "os": platform.system().lower(),
    "os_version": platform.release(),
    "python_version": platform.python_version(),
}


def enable_telemetry() -> bool:
    """Enable telemetry if available.

    Returns:
        bool: True if telemetry was successfully enabled, False otherwise
    """
    global TELEMETRY_AVAILABLE, record_event, increment_counter, get_telemetry_client, flush, is_telemetry_enabled, is_telemetry_globally_disabled

    # Check if globally disabled using core function
    if TELEMETRY_AVAILABLE and is_telemetry_globally_disabled():
        logger.info("Telemetry is globally disabled via environment variable - cannot enable")
        return False

    # Already enabled
    if TELEMETRY_AVAILABLE:
        return True

    # Try to import and enable
    try:
        # NOTE(review): this imports `increment` (not `increment_counter`), so
        # the global `increment_counter` is NOT rebound on this late-enable
        # path and stays a no-op — confirm whether that is intended.
        from core.telemetry import (
            record_event,
            increment,
            get_telemetry_client,
            flush,
            is_telemetry_globally_disabled,
        )

        # Check again after import
        if is_telemetry_globally_disabled():
            logger.info("Telemetry is globally disabled via environment variable - cannot enable")
            return False

        TELEMETRY_AVAILABLE = True
        logger.info("Telemetry successfully enabled")
        return True
    except ImportError as e:
        logger.warning(f"Could not enable telemetry: {e}")
        return False


# NOTE(review): this module-level def shadows the `is_telemetry_enabled`
# alias imported at the top of the file.
def is_telemetry_enabled() -> bool:
    """Check if telemetry is enabled.

    Returns:
        bool: True if telemetry is enabled, False otherwise
    """
    # Use the core function if available, otherwise use our local flag
    if TELEMETRY_AVAILABLE:
        from core.telemetry import is_telemetry_enabled as core_is_enabled

        return core_is_enabled()
    return False


def record_agent_initialization() -> None:
    """Record when an agent instance is initialized."""
    if TELEMETRY_AVAILABLE and is_telemetry_enabled():
        record_event("agent_initialized", SYSTEM_INFO)

        # Set dimensions that will be attached to all events
        set_dimension("os", SYSTEM_INFO["os"])
        set_dimension("os_version", SYSTEM_INFO["os_version"])
        set_dimension("python_version", SYSTEM_INFO["python_version"])
```

## /libs/agent/agent/core/tools.py

```py path="/libs/agent/agent/core/tools.py"
"""Tool-related type definitions."""

from enum import Enum
from typing import Dict, Any, Optional
from pydantic import BaseModel, ConfigDict


class ToolInvocationState(str, Enum):
    """States for tool invocation."""

    CALL = 'call'
    PARTIAL_CALL = 'partial-call'
    RESULT = 'result'


class ToolInvocation(BaseModel):
    """Tool invocation type."""

    model_config = ConfigDict(extra='forbid')
    state: Optional[str] = None
    toolCallId: str
    toolName: Optional[str] = None
    args: Optional[Dict[str, Any]] = None


class ClientAttachment(BaseModel):
    """Client attachment type."""

    name: str
    contentType: str
    url: str


class ToolResult(BaseModel):
    """Result of a tool execution."""

    model_config = ConfigDict(extra='forbid')
    output: Optional[str] = None
    error: Optional[str] = None
    metadata: Optional[Dict[str, Any]] = None
```

## /libs/agent/agent/core/tools/__init__.py

```py path="/libs/agent/agent/core/tools/__init__.py"
"""Core tools package."""

from .base import BaseTool, ToolResult, ToolError, ToolFailure, CLIResult
from .bash import BaseBashTool
from .collection import ToolCollection
from .computer import BaseComputerTool
from .edit import BaseEditTool
from .manager import BaseToolManager

__all__ = [
    "BaseTool",
    "ToolResult",
    "ToolError",
    "ToolFailure",
"CLIResult", "BaseBashTool", "BaseComputerTool", "BaseEditTool", "ToolCollection", "BaseToolManager", ] ``` ## /libs/agent/agent/core/tools/base.py ```py path="/libs/agent/agent/core/tools/base.py" """Abstract base classes for tools that can be used with any provider.""" from abc import ABCMeta, abstractmethod from dataclasses import dataclass, fields, replace from typing import Any, Dict class BaseTool(metaclass=ABCMeta): """Abstract base class for provider-agnostic tools.""" name: str @abstractmethod async def __call__(self, **kwargs) -> Any: """Executes the tool with the given arguments.""" ... @abstractmethod def to_params(self) -> Dict[str, Any]: """Convert tool to provider-specific API parameters. Returns: Dictionary with tool parameters specific to the LLM provider """ raise NotImplementedError @dataclass(kw_only=True, frozen=True) class ToolResult: """Represents the result of a tool execution.""" output: str | None = None error: str | None = None base64_image: str | None = None system: str | None = None content: list[dict] | None = None def __bool__(self): return any(getattr(self, field.name) for field in fields(self)) def __add__(self, other: "ToolResult"): def combine_fields(field: str | None, other_field: str | None, concatenate: bool = True): if field and other_field: if concatenate: return field + other_field raise ValueError("Cannot combine tool results") return field or other_field return ToolResult( output=combine_fields(self.output, other.output), error=combine_fields(self.error, other.error), base64_image=combine_fields(self.base64_image, other.base64_image, False), system=combine_fields(self.system, other.system), content=self.content or other.content, # Use first non-None content ) def replace(self, **kwargs): """Returns a new ToolResult with the given fields replaced.""" return replace(self, **kwargs) class CLIResult(ToolResult): """A ToolResult that can be rendered as a CLI output.""" class ToolFailure(ToolResult): """A ToolResult that 
represents a failure.""" class ToolError(Exception): """Raised when a tool encounters an error.""" def __init__(self, message): self.message = message ``` ## /libs/agent/agent/core/tools/bash.py ```py path="/libs/agent/agent/core/tools/bash.py" """Abstract base bash/shell tool implementation.""" import asyncio import logging from abc import abstractmethod from typing import Any, Dict, Tuple from computer.computer import Computer from .base import BaseTool, ToolResult class BaseBashTool(BaseTool): """Base class for bash/shell command execution tools across different providers.""" name = "bash" logger = logging.getLogger(__name__) computer: Computer def __init__(self, computer: Computer): """Initialize the BashTool. Args: computer: Computer instance, may be used for related operations """ self.computer = computer async def run_command(self, command: str) -> Tuple[int, str, str]: """Run a shell command and return exit code, stdout, and stderr. Args: command: Shell command to execute Returns: Tuple containing (exit_code, stdout, stderr) """ try: process = await asyncio.create_subprocess_shell( command, stdout=asyncio.subprocess.PIPE, stderr=asyncio.subprocess.PIPE, ) stdout, stderr = await process.communicate() return process.returncode or 0, stdout.decode(), stderr.decode() except Exception as e: self.logger.error(f"Error running command: {str(e)}") return 1, "", str(e) @abstractmethod async def __call__(self, **kwargs) -> ToolResult: """Execute the tool with the provided arguments.""" raise NotImplementedError ``` ## /libs/agent/agent/core/tools/collection.py ```py path="/libs/agent/agent/core/tools/collection.py" """Collection classes for managing multiple tools.""" from typing import Any, Dict, List, Type from .base import ( BaseTool, ToolError, ToolFailure, ToolResult, ) class ToolCollection: """A collection of tools that can be used with any provider.""" def __init__(self, *tools: BaseTool): self.tools = tools self.tool_map = {tool.name: tool for tool in tools} 
    def to_params(self) -> List[Dict[str, Any]]:
        """Convert all tools to provider-specific parameters.

        Returns:
            List of dictionaries with tool parameters
        """
        return [tool.to_params() for tool in self.tools]

    async def run(self, *, name: str, tool_input: Dict[str, Any]) -> ToolResult:
        """Run a tool with the given input.

        Args:
            name: Name of the tool to run
            tool_input: Input parameters for the tool

        Returns:
            Result of the tool execution; failures are returned as ToolFailure
            rather than raised.
        """
        tool = self.tool_map.get(name)
        if not tool:
            return ToolFailure(error=f"Tool {name} is invalid")
        try:
            return await tool(**tool_input)
        except ToolError as e:
            return ToolFailure(error=e.message)
        except Exception as e:
            return ToolFailure(error=f"Unexpected error in tool {name}: {str(e)}")
```

## /libs/agent/agent/core/tools/computer.py

```py path="/libs/agent/agent/core/tools/computer.py"
"""Abstract base computer tool implementation."""

import asyncio
import base64
import io
import logging
from abc import abstractmethod
from typing import Any, Dict, Optional, Tuple

from PIL import Image

from computer.computer import Computer

from .base import BaseTool, ToolError, ToolResult


class BaseComputerTool(BaseTool):
    """Base class for computer interaction tools across different providers."""

    name = "computer"
    logger = logging.getLogger(__name__)

    # Screen dimensions; populated by initialize_dimensions().
    width: Optional[int] = None
    height: Optional[int] = None
    display_num: Optional[int] = None

    computer: Computer

    _screenshot_delay = 1.0  # Default delay for most platforms
    _scaling_enabled = True

    def __init__(self, computer: Computer):
        """Initialize the ComputerTool.

        Args:
            computer: Computer instance for screen interactions
        """
        self.computer = computer

    async def initialize_dimensions(self):
        """Initialize screen dimensions from the computer interface."""
        display_size = await self.computer.interface.get_screen_size()
        self.width = display_size["width"]
        self.height = display_size["height"]
        self.logger.info(f"Initialized screen dimensions to {self.width}x{self.height}")

    @property
    def options(self) -> Dict[str, Any]:
        """Get the options for the tool.

        Returns:
            Dictionary with tool options

        Raises:
            RuntimeError: If initialize_dimensions() has not been called.
        """
        if self.width is None or self.height is None:
            raise RuntimeError(
                "Screen dimensions not initialized. Call initialize_dimensions() first."
            )
        return {
            "display_width_px": self.width,
            "display_height_px": self.height,
            "display_number": self.display_num,
        }

    async def resize_screenshot_if_needed(self, screenshot: bytes) -> bytes:
        """Resize a screenshot to match the expected dimensions.

        Args:
            screenshot: Raw screenshot data

        Returns:
            Resized screenshot data

        Raises:
            ToolError: If dimensions are uninitialized or resizing fails.
        """
        if self.width is None or self.height is None:
            raise ToolError("Screen dimensions not initialized")
        try:
            img = Image.open(io.BytesIO(screenshot))
            # Flatten alpha/palette images to RGB before re-encoding.
            if img.mode in ("RGBA", "LA") or (img.mode == "P" and "transparency" in img.info):
                img = img.convert("RGB")
            # Resize if dimensions don't match
            if img.size != (self.width, self.height):
                self.logger.info(
                    f"Scaling image from {img.size} to {self.width}x{self.height} to match screen dimensions"
                )
                img = img.resize((self.width, self.height), Image.Resampling.LANCZOS)
                # Save back to bytes
                buffer = io.BytesIO()
                img.save(buffer, format="PNG")
                return buffer.getvalue()
            # NOTE(review): when sizes already match, the original bytes are
            # returned and any RGB conversion above is discarded — confirm
            # that is intended.
            return screenshot
        except Exception as e:
            self.logger.error(f"Error during screenshot resizing: {str(e)}")
            raise ToolError(f"Failed to resize screenshot: {str(e)}")

    async def screenshot(self) -> ToolResult:
        """Take a screenshot and return it as a ToolResult with base64-encoded image.

        Returns:
            ToolResult with the screenshot, or an error ToolResult on failure.
        """
        try:
            screenshot = await self.computer.interface.screenshot()
            screenshot = await self.resize_screenshot_if_needed(screenshot)
            return ToolResult(base64_image=base64.b64encode(screenshot).decode())
        except Exception as e:
            self.logger.error(f"Error taking screenshot: {str(e)}")
            return ToolResult(error=f"Failed to take screenshot: {str(e)}")

    @abstractmethod
    async def __call__(self, **kwargs) -> ToolResult:
        """Execute the tool with the provided arguments."""
        raise NotImplementedError
```

## /libs/agent/agent/core/tools/edit.py

```py path="/libs/agent/agent/core/tools/edit.py"
"""Abstract base edit tool implementation."""

import asyncio
import logging
import os
from abc import abstractmethod
from pathlib import Path
from typing import Any, Dict, Optional

from computer.computer import Computer

from .base import BaseTool, ToolError, ToolResult


class BaseEditTool(BaseTool):
    """Base class for text editor tools across different providers."""

    name = "edit"
    logger = logging.getLogger(__name__)
    computer: Computer

    def __init__(self, computer: Computer):
        """Initialize the EditTool.

        Args:
            computer: Computer instance, may be used for related operations
        """
        self.computer = computer

    async def read_file(self, path: str) -> str:
        """Read a file and return its contents.

        Args:
            path: Path to the file to read

        Returns:
            File contents as a string

        Raises:
            ToolError: If the file does not exist or cannot be read.
        """
        try:
            path_obj = Path(path)
            if not path_obj.exists():
                raise ToolError(f"File does not exist: {path}")
            return path_obj.read_text()
        # NOTE(review): this also catches the ToolError raised just above and
        # re-wraps it in a second ToolError — confirm intended.
        except Exception as e:
            self.logger.error(f"Error reading file: {str(e)}")
            raise ToolError(f"Failed to read file: {str(e)}")

    async def write_file(self, path: str, content: str) -> None:
        """Write content to a file.
        Args:
            path: Path to the file to write
            content: Content to write to the file

        Raises:
            ToolError: If the file cannot be written.
        """
        try:
            path_obj = Path(path)
            # Create parent directories if they don't exist
            path_obj.parent.mkdir(parents=True, exist_ok=True)
            path_obj.write_text(content)
        except Exception as e:
            self.logger.error(f"Error writing file: {str(e)}")
            raise ToolError(f"Failed to write file: {str(e)}")

    @abstractmethod
    async def __call__(self, **kwargs) -> ToolResult:
        """Execute the tool with the provided arguments."""
        raise NotImplementedError
```

## /libs/agent/agent/core/tools/manager.py

```py path="/libs/agent/agent/core/tools/manager.py"
"""Tool manager for initializing and running tools."""

from abc import ABC, abstractmethod
from typing import Any, Dict, List

from computer.computer import Computer

from .base import BaseTool, ToolResult
from .collection import ToolCollection


class BaseToolManager(ABC):
    """Base class for tool managers across different providers."""

    def __init__(self, computer: Computer):
        """Initialize the tool manager.

        Args:
            computer: Computer instance for computer-related tools
        """
        self.computer = computer
        # Populated by initialize(); None until then.
        self.tools: ToolCollection | None = None

    @abstractmethod
    def _initialize_tools(self) -> ToolCollection:
        """Initialize all available tools."""
        ...

    async def initialize(self) -> None:
        """Initialize tool-specific requirements and create tool collection."""
        # Provider-specific setup must run before the collection is built.
        await self._initialize_tools_specific()
        self.tools = self._initialize_tools()

    @abstractmethod
    async def _initialize_tools_specific(self) -> None:
        """Initialize provider-specific tool requirements."""
        ...

    @abstractmethod
    def get_tool_params(self) -> List[Dict[str, Any]]:
        """Get tool parameters for API calls."""
        ...

    async def execute_tool(self, name: str, tool_input: Dict[str, Any]) -> ToolResult:
        """Execute a tool with the given input.

        Args:
            name: Name of the tool to execute
            tool_input: Input parameters for the tool

        Returns:
            Result of the tool execution

        Raises:
            RuntimeError: If initialize() has not been called yet.
        """
        if self.tools is None:
            raise RuntimeError("Tools not initialized. Call initialize() first.")
        return await self.tools.run(name=name, tool_input=tool_input)
```

## /libs/agent/agent/core/types.py

```py path="/libs/agent/agent/core/types.py"
"""Core type definitions."""

from typing import Any, Dict, List, Optional, TypedDict, Union
from enum import Enum, StrEnum, auto
from dataclasses import dataclass


class AgentLoop(Enum):
    """Enumeration of available loop types."""

    ANTHROPIC = auto()  # Anthropic implementation
    OMNI = auto()  # OmniLoop implementation
    OPENAI = auto()  # OpenAI implementation
    OLLAMA = auto()  # OLLAMA implementation
    UITARS = auto()  # UI-TARS implementation
    # Add more loop types as needed


class LLMProvider(StrEnum):
    """Supported LLM providers."""

    ANTHROPIC = "anthropic"
    OPENAI = "openai"
    OLLAMA = "ollama"
    OAICOMPAT = "oaicompat"


@dataclass
class LLM:
    """Configuration for LLM model and provider."""

    provider: LLMProvider
    name: Optional[str] = None
    provider_base_url: Optional[str] = None

    def __post_init__(self):
        """Set default model name if not provided."""
        if self.name is None:
            # Imported lazily to avoid a circular import with provider_config.
            from .provider_config import DEFAULT_MODELS

            self.name = DEFAULT_MODELS.get(self.provider)

        # Set default provider URL if none provided
        if self.provider_base_url is None and self.provider == LLMProvider.OAICOMPAT:
            # Default for vLLM
            self.provider_base_url = "http://localhost:8000/v1"
            # Common alternatives:
            # - LM Studio: "http://localhost:1234/v1"
            # - LocalAI: "http://localhost:8080/v1"
            # - Ollama with OpenAI compatible API: "http://localhost:11434/v1"


# For backward compatibility
LLMModel = LLM
Model = LLM


class AgentResponse(TypedDict, total=False):
    """Agent response format."""

    id: str
    object: str
    created_at: int
    status: str
    error: Optional[str]
    incomplete_details: Optional[Any]
    instructions: Optional[Any]
    max_output_tokens: Optional[int]
    model: str
    output: List[Dict[str, Any]]
    parallel_tool_calls: bool
    previous_response_id: Optional[str]
    reasoning: Dict[str, str]
    store: bool
    temperature: float
    text: Dict[str, Dict[str, str]]
    tool_choice: str
    tools:
List[Dict[str, Union[str, int]]] top_p: float truncation: str usage: Dict[str, Any] user: Optional[str] metadata: Dict[str, Any] response: Dict[str, List[Dict[str, Any]]] # Additional fields for error responses role: str content: Union[str, List[Dict[str, Any]]] ``` The content has been capped at 50000 tokens, and oversized files have been omitted. You can apply additional filters to refine the result. The better and more specific the context, the better the LLM can follow instructions. If the context seems verbose, refine the filter using uithub. Thank you for using https://uithub.com - Perfect LLM context for any GitHub repo.