From 543823757a7e2750f32d5f8fde11d4d470b030a0 Mon Sep 17 00:00:00 2001
From: orangbejo <148731115+orang2bejo@users.noreply.github.com>
Date: Fri, 5 Sep 2025 02:04:45 +0800
Subject: [PATCH] feat: add secure config validation and telemetry

---
 .github/workflows/ci.yml                    |  37 ++-
 .github/workflows/release.yml               |  24 ++
 .pre-commit-config.yaml                     |  14 +
 .secrets.baseline                           |   5 +
 CHANGELOG.md                                |   9 +
 README.md                                   |  15 +
 audit_reports/ACTION_PLAN.md                |  18 ++
 audit_reports/BUGS_AND_ERRORS.md            |  10 +
 audit_reports/CODE_QUALITY_REPORT.md        |  34 +++
 audit_reports/CONFIG_DB_AUDIT.md            |  24 ++
 audit_reports/CPU_GPU_TELEMETRY_GAP.md      |  32 ++
 audit_reports/DEPENDENCY_RISKS.md           |  23 ++
 audit_reports/HEALTHCHECK_README_SNIPPET.md |  19 ++
 audit_reports/SECURITY_AUDIT.md             |  21 ++
 audit_reports/STRUCTURE_AUDIT.md            |  31 ++
 audit_reports/TEST_MATRIX.md                |  24 ++
 config/logging.yaml                         |  25 +-
 config/models.yaml                          |   4 +
 config/security.yaml                        |   5 +
 docs/SECRETS.md                             |  18 ++
 docs/SECURITY_MODES.md                      |   9 +
 docs/TROUBLESHOOTING.md                     |  17 ++
 pyproject.toml                              |   2 +-
 requirements.txt                            |   1 +
 scripts/healthcheck.py                      |  44 +++
 src/windows_use/config_loader.py            |  55 ++++
 src/windows_use/config_schema.py            |  49 ++++
 src/windows_use/obs/log_sanitizer.py        |  15 +
 src/windows_use/security/secret_store.py    |  36 +++
 src/windows_use/tools/ps_shell.py           | 307 ++++++++++++--------
 src/windows_use/tools/tts_piper.py          | 215 +++++++-------
 src/windows_use/tools/voice_input.py        | 169 ++++++-----
 src/windows_use/utils/logger.py             |  11 +-
 src/windows_use/utils/rate_limit.py         |  31 ++
 src/windows_use/utils/retry.py              |  32 ++
 src/windows_use/web/browser_automation.py   |   5 +
 src/windows_use/web/security_utils.py       |  43 +++
 tests/test_config_validation.py             |  33 +++
 tests/test_device_flags.py                  |  22 ++
 tests/test_log_sanitizer.py                 |   9 +
 tests/test_powershell_wrapper.py            |  25 ++
 tests/test_retry_rate_limit.py              |  30 ++
 tests/test_web_security.py                  |  40 +++
 43 files changed, 1279 insertions(+), 313 deletions(-)
 create mode 100644 .github/workflows/release.yml
 create mode 100644 .pre-commit-config.yaml
 create mode 100644 .secrets.baseline
 create mode 100644 CHANGELOG.md
 create mode 100644 README.md
 create mode 100644 audit_reports/ACTION_PLAN.md
 create mode 100644 audit_reports/BUGS_AND_ERRORS.md
 create mode 100644 audit_reports/CODE_QUALITY_REPORT.md
 create mode 100644 audit_reports/CONFIG_DB_AUDIT.md
 create mode 100644 audit_reports/CPU_GPU_TELEMETRY_GAP.md
 create mode 100644 audit_reports/DEPENDENCY_RISKS.md
 create mode 100644 audit_reports/HEALTHCHECK_README_SNIPPET.md
 create mode 100644 audit_reports/SECURITY_AUDIT.md
 create mode 100644 audit_reports/STRUCTURE_AUDIT.md
 create mode 100644 audit_reports/TEST_MATRIX.md
 create mode 100644 config/models.yaml
 create mode 100644 config/security.yaml
 create mode 100644 docs/SECRETS.md
 create mode 100644 docs/SECURITY_MODES.md
 create mode 100644 docs/TROUBLESHOOTING.md
 create mode 100644 scripts/healthcheck.py
 create mode 100644 src/windows_use/config_loader.py
 create mode 100644 src/windows_use/config_schema.py
 create mode 100644 src/windows_use/obs/log_sanitizer.py
 create mode 100644 src/windows_use/security/secret_store.py
 create mode 100644 src/windows_use/utils/rate_limit.py
 create mode 100644 src/windows_use/utils/retry.py
 create mode 100644 src/windows_use/web/security_utils.py
 create mode 100644 tests/test_config_validation.py
 create mode 100644 tests/test_device_flags.py
 create mode 100644 tests/test_log_sanitizer.py
 create mode 100644 tests/test_powershell_wrapper.py
 create mode 100644 tests/test_retry_rate_limit.py
 create mode 100644 tests/test_web_security.py

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 1e4a9078..9d704756 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -73,6 +73,13 @@ jobs:
     - name: Run installation test
       run: |
         python test_installation.py
+
+    - name: Upload audit reports
+      if: always()
+      uses: actions/upload-artifact@v3
+      with:
+        name: audit-reports
+        path: audit_reports/
     
     - name: Generate coverage report
       run: |
@@ -161,4 +168,32 @@ jobs:
     
     - name: Notify on failure
       if: ${{ needs.test.result == 'failure' }}
-      run: echo "❌ Tests failed. Please check the logs."
\ No newline at end of file
+      run: echo "❌ Tests failed. Please check the logs."
+
+  supply-chain:
+    runs-on: ubuntu-latest
+    steps:
+    - uses: actions/checkout@v4
+
+    - name: Generate SBOM
+      run: |
+        pip install cyclonedx-bom
+        cyclonedx-py --format json --output sbom.json
+
+    - name: Scan secrets
+      uses: gitleaks/gitleaks-action@v2
+      with:
+        args: '--no-git --path .'
+
+    - name: CVE audit
+      run: |
+        pip install pip-audit
+        pip-audit > cve-report.txt || true
+
+    - name: Upload supply-chain artifacts
+      uses: actions/upload-artifact@v3
+      with:
+        name: supply-chain
+        path: |
+          sbom.json
+          cve-report.txt
diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml
new file mode 100644
index 00000000..8134f19e
--- /dev/null
+++ b/.github/workflows/release.yml
@@ -0,0 +1,24 @@
+name: Release
+
+on:
+  push:
+    tags: ['v*']
+
+jobs:
+  build:
+    runs-on: ubuntu-latest
+    steps:
+    - uses: actions/checkout@v4
+    - name: Set up Python
+      uses: actions/setup-python@v4
+      with:
+        python-version: '3.12'
+    - name: Build wheel
+      run: |
+        pip install build
+        python -m build
+    - name: Upload artifact
+      uses: actions/upload-artifact@v3
+      with:
+        name: wheel
+        path: dist/*.whl
diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
new file mode 100644
index 00000000..92a7e1c8
--- /dev/null
+++ b/.pre-commit-config.yaml
@@ -0,0 +1,14 @@
+repos:
+  - repo: https://github.com/psf/black
+    rev: 24.3.0
+    hooks:
+      - id: black
+  - repo: https://github.com/astral-sh/ruff-pre-commit
+    rev: v0.3.4
+    hooks:
+      - id: ruff
+  - repo: https://github.com/Yelp/detect-secrets
+    rev: v1.4.0
+    hooks:
+      - id: detect-secrets
+        args: ['--baseline', '.secrets.baseline']
diff --git a/.secrets.baseline b/.secrets.baseline
new file mode 100644
index 00000000..0b8a9293
--- /dev/null
+++ b/.secrets.baseline
@@ -0,0 +1,5 @@
+{
+  "version": "1.0.0",
+  "plugins_used": [],
+  "results": {}
+}
diff --git a/CHANGELOG.md b/CHANGELOG.md
new file mode 100644
index 00000000..530a257f
--- /dev/null
+++ b/CHANGELOG.md
@@ -0,0 +1,9 @@
+# Changelog
+
+## 0.1.0 - 2024-06-12
+- add config validation with Pydantic
+- integrate Windows secret store
+- sanitize logs and enforce retention
+- GPU auto-detection for STT/TTS with healthcheck
+- rate limiting and retry utilities
+- PowerShell hardening and CI supply-chain jobs
diff --git a/README.md b/README.md
new file mode 100644
index 00000000..93094e61
--- /dev/null
+++ b/README.md
@@ -0,0 +1,15 @@
+# Jarvis Windows Agent
+
+![CI](https://github.com/CursorTouch/AI_Agents/actions/workflows/ci.yml/badge.svg)
+
+Jarvis is an autonomous agent for Windows automation, integrating voice, web, and desktop controls.
+
+## Security & Compliance
+- Default automation mode is **ASSISTIVE**; other modes are documented in [Security Modes](docs/SECURITY_MODES.md).
+- Secrets are stored via Windows Credential Manager; see [SECRETS.md](docs/SECRETS.md).
+- Logs are sanitized and rotated every 14 days. Use `scripts/healthcheck.py` to inspect device providers.
+
+## Healthcheck
+```bash
+python scripts/healthcheck.py
+```
diff --git a/audit_reports/ACTION_PLAN.md b/audit_reports/ACTION_PLAN.md
new file mode 100644
index 00000000..f4c4c35b
--- /dev/null
+++ b/audit_reports/ACTION_PLAN.md
@@ -0,0 +1,18 @@
+# Action Plan
+
+## P0 – Immediate
+- Remove secrets from `jarvis_config.json`; load from environment.
+- Fix `desktop.execute_command` to avoid `command.split()` injection.
+- Add domain allowlist & confirmation prompts in web automation.
+- Resolve `jarvis_demo.py` syntax error to restore build.
+
+## P1 – Near Term
+- Implement `obs/device_telemetry.py` and `scripts/healthcheck.py` for CPU/GPU metrics.
+- Add CI workflow running `ruff`, `black --check`, `mypy`, `pytest` (skip Office if unavailable).
+- Refactor large modules (`web_form_automation.py`, `hitl.py`).
+- Ensure `personality_state.json` and other runtime data are gitignored.
+
+## P2 – Later
+- Consolidate dependency management in `pyproject.toml` with extras for voice/office/web/security.
+- Split monolithic web modules into smaller components and add retry/backoff utilities.
+- Centralize logging and PII masking utilities.
diff --git a/audit_reports/BUGS_AND_ERRORS.md b/audit_reports/BUGS_AND_ERRORS.md
new file mode 100644
index 00000000..668086a2
--- /dev/null
+++ b/audit_reports/BUGS_AND_ERRORS.md
@@ -0,0 +1,10 @@
+# Bugs & Errors
+
+| File/Line | Issue | Suggested Fix |
+| --- | --- | --- |
+| `src/windows_use/examples/jarvis_demo.py:272` | Syntax error: positional argument after keyword【ba1ebe†L1-L3】 | Reorder arguments per Python syntax |
+| `src/windows_use/web/web_form_automation.py:466` | Bare `except` hides errors【5d1671†L66-L75】 | Catch `Exception` or specific Playwright errors |
+| `src/windows_use/desktop/__init__.py:61` | `command.split()` may break quoted args, injection risk【23938c†L59-L63】 | Use `shlex.split` or pass list to subprocess |
+| `config/jarvis_config.json` | Hard-coded API keys【294e78†L31-L44】 | Use env vars and remove from repo |
+| `tests/test_installation.py` | Import name conflict causes pytest collection error【fd3edd†L1-L20】 | Rename script or test module |
+| `security/hitl.py` | Multiple unused variables causing clutter【5d1671†L1-L40】 | Remove or log variables |
diff --git a/audit_reports/CODE_QUALITY_REPORT.md b/audit_reports/CODE_QUALITY_REPORT.md
new file mode 100644
index 00000000..8309a5f6
--- /dev/null
+++ b/audit_reports/CODE_QUALITY_REPORT.md
@@ -0,0 +1,34 @@
+# Code Quality Report
+
+## Tooling Results
+- `ruff check src/windows_use` → **232 issues** (e.g., unused imports, unused vars, bare except)【5d1671†L1-L85】
+- `black --check src/windows_use` → 84 files need formatting; one file failed to parse (`examples/jarvis_demo.py`)【765a0f†L1-L24】
+- `mypy src/windows_use` → Syntax error at `examples/jarvis_demo.py:272`【ba1ebe†L1-L3】
+- `pytest` → collection error due to name conflict with `test_installation.py`【fd3edd†L1-L20】
+
+## Composition & Complexity
+- `src/windows_use/security/hitl.py` contains multiple unused imports and variables (F401/F841). Consider refactor.
+- `src/windows_use/web/web_form_automation.py` uses bare `except:` blocks at lines 466 and 474; replace with specific exceptions.
+- `desktop.execute_command` splits user-supplied strings directly, risking incorrect tokenization.
+- Large monolithic modules (e.g., `web_form_automation.py` ~800+ lines) could be split into smaller units.
+
+## Suggested Patches
+```python
+# Example: handle specific timeout instead of bare except
+try:
+    await self.page.wait_for_selector(f"text={indicator}", timeout=1000)
+    return False
+except playwright.TimeoutError:
+    continue
+```
+```python
+# Example: secure command execution
+result = subprocess.run(['powershell', '-Command', command], shell=False, capture_output=True, check=True)
+```
+
+## Dead Code & Duplication
+- Duplicate directories `data/learning_data` and `learning_data`.
+- `logging_config.py` defines custom formatters; ensure they are reused consistently.
+
+## Circular Imports
+- No explicit circular imports detected, but keep `__init__.py` imports minimal to avoid cycles.
diff --git a/audit_reports/CONFIG_DB_AUDIT.md b/audit_reports/CONFIG_DB_AUDIT.md
new file mode 100644
index 00000000..a0748972
--- /dev/null
+++ b/audit_reports/CONFIG_DB_AUDIT.md
@@ -0,0 +1,24 @@
+# Config & Database Audit
+
+## Inspected Files
+- `config/jarvis_config.json`
+- `config/llm_config.yaml`
+- `config/logging.yaml`
+- `config/personality_config.json`
+- `config/personality_state.json`
+- `data/learning_data/learning_data.json`
+- `.gitignore`
+
+## Findings
+- **Secrets committed**: `evi_api_key` and `evi.api_key` are hard-coded in `jarvis_config.json`.
+- `personality_state.json` contains user state and is committed despite ignore rules.
+- `llm_config.yaml` references API keys via environment variables (good practice).
+- No `.env` file found; environment variable reliance not documented.
+- No domain allowlist or Full-Auto default setting located in configs.
+- No encryption or access control for JSON data files; data retention policies absent.
+
+## Recommendations
+- Move secrets to environment variables and remove from VCS.
+- Ensure `personality_state.json` and other dynamic state files are gitignored and rotated.
+- Add domain allowlist and explicit `mode` (Assistive/Semi/Full) flags in configs.
+- Consider encrypting sensitive config sections or using a secrets manager.
diff --git a/audit_reports/CPU_GPU_TELEMETRY_GAP.md b/audit_reports/CPU_GPU_TELEMETRY_GAP.md
new file mode 100644
index 00000000..54962797
--- /dev/null
+++ b/audit_reports/CPU_GPU_TELEMETRY_GAP.md
@@ -0,0 +1,32 @@
+# CPU/GPU Telemetry Gap
+
+## Current State
+- **LLM (Ollama)**: HTTP client; no device telemetry. GPU usage determined by server.
+- **STT (Whisper)**: `voice_input.py` loads model without specifying device (defaults to CPU)【b8a58e†L70-L75】
+- **TTS (Piper)**: Uses ONNX model via CPU; no GPU acceleration or reporting【6b1380†L35-L80】
+- No scripts for runtime health or hardware checks.
+
+## Recommended Patches
+```python
+# obs/device_telemetry.py (new)
+import psutil, json
+
+def snapshot() -> dict:
+    return {
+        "cpu_percent": psutil.cpu_percent(),
+        "mem_percent": psutil.virtual_memory().percent,
+    }
+```
+```python
+# scripts/healthcheck.py (new)
+from obs.device_telemetry import snapshot
+
+if __name__ == "__main__":
+    stats = snapshot()
+    print(json.dumps(stats, indent=2))
+```
+
+## Telemetry Plan
+- Capture CPU/GPU metrics per component (LLM/STT/TTS) before and after operations.
+- Emit JSON summary for CI dashboards.
+- Extend to GPU via `torch.cuda` or `onnxruntime` when available.
diff --git a/audit_reports/DEPENDENCY_RISKS.md b/audit_reports/DEPENDENCY_RISKS.md
new file mode 100644
index 00000000..2fcd350e
--- /dev/null
+++ b/audit_reports/DEPENDENCY_RISKS.md
@@ -0,0 +1,23 @@
+# Dependency Risks
+
+## Sources Reviewed
+- `requirements.txt`
+- `requirements-dev.txt`
+- `pyproject.toml`
+
+## Observations
+- Many dependencies use `>=` without upper bounds; risk of future breaking changes.
+- `requirements.txt` marks several optional packages commented out; better handled via extras.
+- `pyproject.toml` already defines `voice` and `office` extras but lacks `web` or `security` groups.
+- Duplicated dependencies between `requirements.txt` and `pyproject.toml` (e.g., langchain, numpy).
+- Development requirements include heavy packages (`torch`, `tensorflow`) that drastically increase install size.
+
+## Potential Vulnerabilities
+- `requests` and `aiohttp` have frequent CVEs; ensure versions remain updated.
+- `pyautogui` and `uiautomation` run with high privileges—monitor for updates.
+
+## Recommendations
+- Consolidate dependency management using `pyproject.toml` exclusively; generate lock file.
+- Define extras: `[voice]`, `[office]`, `[web]`, `[security]`.
+- Pin critical packages with upper bounds (e.g., `requests>=2.31,<3.0`).
+- Run `pip-audit` or `safety` in CI to track CVEs.
diff --git a/audit_reports/HEALTHCHECK_README_SNIPPET.md b/audit_reports/HEALTHCHECK_README_SNIPPET.md
new file mode 100644
index 00000000..25ac0659
--- /dev/null
+++ b/audit_reports/HEALTHCHECK_README_SNIPPET.md
@@ -0,0 +1,19 @@
+```markdown
+## Healthcheck
+Run a quick system check:
+
+```bash
+python scripts/healthcheck.py
+```
+
+Expected output:
+```json
+{
+  "cpu_percent": 12.5,
+  "mem_percent": 43.2
+}
+```
+- **cpu_percent** – overall CPU usage
+- **mem_percent** – RAM usage
+Values consistently above 80% indicate resource pressure.
+```
diff --git a/audit_reports/SECURITY_AUDIT.md b/audit_reports/SECURITY_AUDIT.md
new file mode 100644
index 00000000..8fc2e8eb
--- /dev/null
+++ b/audit_reports/SECURITY_AUDIT.md
@@ -0,0 +1,21 @@
+# Security Audit
+
+## Key Findings
+- **Secrets in repo**: `evi_api_key` in `config/jarvis_config.json`【294e78†L31-L44】
+- `personality_state.json` stores user interaction metadata committed to git【64a7f2†L1-L9】
+- `desktop.execute_command` concatenates user commands with `command.split()` → susceptible to injection【23938c†L59-L63】
+- `web_form_automation.py` lacks domain allowlist and uses bare `except` blocks【5d1671†L66-L75】
+- No CAPTCHA/OTP handling; automation can run in Full-Auto without confirmation.
+- Logging configuration writes to plain-text log files without PII masking.
+
+## Guardrails & HITL
+- HITL module (`security/hitl.py`) exists but contains unused variables and minimal logging.
+- No explicit mode enforcement; config does not default to Assistive or Semi-Auto.
+
+## Recommendations
+- Remove committed secrets; use environment variables and secret managers.
+- Sanitize PowerShell commands: avoid `command.split()`; use argument lists or shlex.
+- Implement domain allowlist and confirm-before-submit in web automation.
+- Add PII masking and log rotation policies.
+- Enforce HITL prompts for destructive actions; default to **Assistive** mode.
+- Document CAPTCHA/OTP fallback paths requiring Semi-Auto intervention.
diff --git a/audit_reports/STRUCTURE_AUDIT.md b/audit_reports/STRUCTURE_AUDIT.md
new file mode 100644
index 00000000..0fba2663
--- /dev/null
+++ b/audit_reports/STRUCTURE_AUDIT.md
@@ -0,0 +1,31 @@
+# Structure Audit
+
+## Repository Tree (top 2 levels)
+```
+.
+├── config/
+├── cookbook/
+├── data/
+├── docs/
+├── scripts/
+├── src/
+│   ├── data/
+│   └── windows_use/
+└── tests/
+```
+
+## `src/windows_use` Modules
+```
+agent/  desktop/  evolution/  examples/  jarvis_ai/
+llm/    office/   security/   tools/     tree/
+utils/  web/
+```
+
+## Missing or Claimed-but-Missing Components
+- README.md (root) – not found
+- actions/, backends/, nlu/, modes/, memory/, obs/, recovery/, vision/, ui/ – no corresponding folders under `src/windows_use`
+- reports/ – referenced in instructions but not present
+
+## Naming & Duplication Notes
+- `learning_data` and `data/learning_data` both exist
+- `personality_state.json` is committed despite .gitignore rule
diff --git a/audit_reports/TEST_MATRIX.md b/audit_reports/TEST_MATRIX.md
new file mode 100644
index 00000000..f54fb23e
--- /dev/null
+++ b/audit_reports/TEST_MATRIX.md
@@ -0,0 +1,24 @@
+# Test Matrix
+
+## Existing Tests
+- `tests/test_llm.py`
+- `tests/test_integration.py`
+- `tests/test_security.py`
+- `tests/test_evolution.py`
+- `tests/test_web.py`
+- `tests/test_gui.py`
+- `tests/test_python312_upgrade.py`
+
+## Gaps & Proposed Tests
+| Area | Missing Coverage | Suggested Test |
+| --- | --- | --- |
+| Office COM | Interaction with Word/Excel/PowerPoint | Mock COM objects to validate API usage |
+| Voice/STT/TTS | Whisper & Piper integration | Simulate audio input/output; check device selection |
+| Configuration | Loading/parsing of YAML/JSON | Unit tests for `config/*` schema validation |
+| Web Automation | Domain allowlist & form submission | Headless test ensuring prompts before submit |
+| Recovery/Retry | Retry logic in `web_form_automation` | Unit test for retry/backoff on timeouts |
+| Healthcheck | System telemetry | Test `scripts/healthcheck.py` returns CPU metrics |
+
+## CI Recommendations
+- Run `ruff`, `black --check`, `mypy`, and `pytest` in pipeline.
+- Skip Office tests if dependencies unavailable; mark as `xfail`.
diff --git a/config/logging.yaml b/config/logging.yaml
index c944663e..2d8b4fb0 100644
--- a/config/logging.yaml
+++ b/config/logging.yaml
@@ -34,30 +34,33 @@ handlers:
     stream: ext://sys.stdout
   
   file:
-    class: logging.handlers.RotatingFileHandler
+    class: logging.handlers.TimedRotatingFileHandler
     level: DEBUG
     formatter: detailed
     filename: logs/jarvis.log
-    maxBytes: 10485760  # 10MB
-    backupCount: 5
+    when: D
+    interval: 1
+    backupCount: 14
     encoding: utf8
-  
+
   error_file:
-    class: logging.handlers.RotatingFileHandler
+    class: logging.handlers.TimedRotatingFileHandler
     level: ERROR
     formatter: detailed
     filename: logs/jarvis_errors.log
-    maxBytes: 10485760  # 10MB
-    backupCount: 3
+    when: D
+    interval: 1
+    backupCount: 14
     encoding: utf8
-  
+
   performance_file:
-    class: logging.handlers.RotatingFileHandler
+    class: logging.handlers.TimedRotatingFileHandler
     level: DEBUG
     formatter: json
     filename: logs/jarvis_performance.log
-    maxBytes: 10485760  # 10MB
-    backupCount: 3
+    when: D
+    interval: 1
+    backupCount: 14
     encoding: utf8
     filters: [performance]
 
diff --git a/config/models.yaml b/config/models.yaml
new file mode 100644
index 00000000..fb4a7542
--- /dev/null
+++ b/config/models.yaml
@@ -0,0 +1,4 @@
+planner: gpt-4
+judge: gpt-4
+offline: small
+vision: null
diff --git a/config/security.yaml b/config/security.yaml
new file mode 100644
index 00000000..7c607f13
--- /dev/null
+++ b/config/security.yaml
@@ -0,0 +1,5 @@
+mode_default: ASSISTIVE
+web:
+  allowlist:
+    - example.com
+  require_confirm_on_submit: true
diff --git a/docs/SECRETS.md b/docs/SECRETS.md
new file mode 100644
index 00000000..1834f2ad
--- /dev/null
+++ b/docs/SECRETS.md
@@ -0,0 +1,18 @@
+# Secrets Management
+
+Jarvis uses the Windows Credential Manager via the `secret_store` module to keep API keys and tokens out of source control.
+
+## Storing a Secret
+```python
+from windows_use.security.secret_store import set_secret
+set_secret("OPENAI_API_KEY", "sk-...")
+```
+
+## Using a Secret in Config
+`security.yaml` values can reference `${OPENAI_API_KEY}`. If the environment variable is not set, the loader resolves it from the secret store.
+
+## Rotation
+Update the secret with `set_secret` and restart the agent. Use `delete_secret` to remove old keys.
+
+## Auditing
+Secrets are never logged. Review access through Windows Credential Manager's audit logs.
diff --git a/docs/SECURITY_MODES.md b/docs/SECURITY_MODES.md
new file mode 100644
index 00000000..316c3ac1
--- /dev/null
+++ b/docs/SECURITY_MODES.md
@@ -0,0 +1,9 @@
+# Security Modes
+
+| Mode | Description | Typical Use |
+| --- | --- | --- |
+| ASSISTIVE | Requires explicit user confirmation before actions that modify state. | Safe default for day-to-day use. |
+| SEMI_AUTO | Proceeds with predefined checkpoints; user confirmation needed for critical steps or when OTP/CAPTCHA detected. | Batch tasks with oversight. |
+| FULL_AUTO | Executes actions without user intervention. Should only run in controlled environments. | Trusted, sandboxed automation. |
+
+Actions submitted in ASSISTIVE and SEMI_AUTO modes must be confirmed when `require_confirm_on_submit` is enabled.
diff --git a/docs/TROUBLESHOOTING.md b/docs/TROUBLESHOOTING.md
new file mode 100644
index 00000000..42fea98d
--- /dev/null
+++ b/docs/TROUBLESHOOTING.md
@@ -0,0 +1,17 @@
+# Troubleshooting
+
+## GPU Not Detected
+- Ensure CUDA drivers are installed.
+- Set `JARVIS_STT_DEVICE=cuda` to force GPU for Whisper.
+
+## Playwright Failures
+- Install browsers with `playwright install`.
+- Check allowlist and network access.
+
+## Office COM Crashes
+- Verify Microsoft Office is installed and updated.
+- Run the agent with administrator privileges if required.
+
+## PowerShell Permission Errors
+- Constrained Language Mode may block certain cmdlets.
+- Ensure commands are in the whitelist and do not require elevated rights.
diff --git a/pyproject.toml b/pyproject.toml
index 7a6758bf..7575ab5d 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "windows-use"
-version = "0.1.31"
+version = "0.1.0"
 description = "An AI Agent that interacts with Windows OS at GUI level."
 readme = "readme.md"
 authors = [
diff --git a/requirements.txt b/requirements.txt
index e6330f18..7470c8ba 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -41,6 +41,7 @@ termcolor>=2.3.0
 sounddevice>=0.4.6
 websockets>=11.0.0
 webrtcvad>=2.0.10
+keyring>=24.3.0
 
 # Optional Dependencies (install only if needed)
 # Voice Recognition (uncomment if voice features needed)
diff --git a/scripts/healthcheck.py b/scripts/healthcheck.py
new file mode 100644
index 00000000..e23a48dd
--- /dev/null
+++ b/scripts/healthcheck.py
@@ -0,0 +1,44 @@
+from __future__ import annotations
+
+import json
+import os
+import time
+
+try:
+    import torch
+except Exception:  # pragma: no cover
+    torch = None
+
+try:
+    import onnxruntime as ort
+except Exception:  # pragma: no cover
+    ort = None
+
+
+def main() -> None:
+    providers = []
+    if ort:
+        providers = ort.get_available_providers()
+    gpu = "CPU"
+    if torch and torch.cuda.is_available():
+        gpu = torch.cuda.get_device_name(0)
+    stt_device = os.getenv("JARVIS_STT_DEVICE", "auto")
+
+    info = {"providers": providers, "gpu": gpu, "stt_device": stt_device}
+    print(json.dumps(info, indent=2))
+
+    try:
+        import ollama  # type: ignore
+
+        start = time.time()
+        ollama.generate(
+            model="llama2", prompt="healthcheck", options={"num_predict": 10}
+        )
+        latency = time.time() - start
+        print(f"Ollama generated 10 tokens in {latency:.2f}s")
+    except Exception as e:  # pragma: no cover - ollama optional
+        print(f"Ollama check skipped: {e}")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/src/windows_use/config_loader.py b/src/windows_use/config_loader.py
new file mode 100644
index 00000000..304abc12
--- /dev/null
+++ b/src/windows_use/config_loader.py
@@ -0,0 +1,55 @@
+from __future__ import annotations
+
+import os
+import re
+from pathlib import Path
+from typing import Any, Dict
+
+import yaml
+
+from .config_schema import ModelsConfig, SecurityConfig
+from .security.secret_store import get_secret
+
+
+_ENV_PATTERN = re.compile(r"\$\{([^}]+)\}")
+
+
+def _resolve(value: Any) -> Any:
+    if isinstance(value, str):
+        match = _ENV_PATTERN.fullmatch(value)
+        if match:
+            name = match.group(1)
+            return os.getenv(name) or get_secret(name)
+    return value
+
+
+def _load_yaml(path: Path) -> Dict[str, Any]:
+    with path.open("r", encoding="utf-8") as f:
+        data = yaml.safe_load(f) or {}
+    return _traverse(data)
+
+
+def _traverse(obj: Any) -> Any:
+    if isinstance(obj, dict):
+        return {k: _traverse(v) for k, v in obj.items()}
+    if isinstance(obj, list):
+        return [_traverse(v) for v in obj]
+    return _resolve(obj)
+
+
+def load_security_config(path: str | Path = "config/security.yaml") -> SecurityConfig:
+    data = _load_yaml(Path(path))
+    config = SecurityConfig(**data)
+    if not config.web.allowlist:
+        raise ValueError("allowlist must not be empty")
+    if config.mode_default != config.mode_default.__class__.ASSISTIVE:
+        raise ValueError("mode_default must be ASSISTIVE")
+    return config
+
+
+def load_models_config(path: str | Path = "config/models.yaml") -> ModelsConfig:
+    data = _load_yaml(Path(path))
+    config = ModelsConfig(**data)
+    if not config.offline:
+        config.offline = "safe"
+    return config
diff --git a/src/windows_use/config_schema.py b/src/windows_use/config_schema.py
new file mode 100644
index 00000000..ad226045
--- /dev/null
+++ b/src/windows_use/config_schema.py
@@ -0,0 +1,49 @@
+from __future__ import annotations
+
+from enum import Enum
+from typing import List, Optional
+
+from pydantic import BaseModel, Field, validator
+
+
+class Mode(str, Enum):
+    ASSISTIVE = "ASSISTIVE"
+    SEMI_AUTO = "SEMI_AUTO"
+    FULL_AUTO = "FULL_AUTO"
+
+
+class WebConfig(BaseModel):
+    allowlist: List[str] = Field(..., min_length=1)
+    require_confirm_on_submit: bool = True
+
+    @validator("allowlist")
+    def _non_empty(cls, v: List[str]) -> List[str]:
+        if not v:
+            raise ValueError("allowlist must not be empty")
+        return v
+
+
+class SecurityConfig(BaseModel):
+    mode_default: Mode = Mode.ASSISTIVE
+    web: WebConfig
+
+    @validator("mode_default")
+    def _mode_default_assistive(cls, v: Mode) -> Mode:
+        if v != Mode.ASSISTIVE:
+            raise ValueError("mode_default must default to ASSISTIVE")
+        return v
+
+
+class ModelsConfig(BaseModel):
+    planner: Optional[str] = None
+    judge: Optional[str] = None
+    offline: str = "safe"
+    vision: Optional[str] = None
+
+    @validator("planner", "judge", "offline", "vision", pre=True, always=True)
+    def _validate_name(cls, v: Optional[str]) -> Optional[str]:
+        if v is None:
+            return v
+        if not isinstance(v, str) or not v.strip():
+            raise ValueError("model name must be a non-empty string")
+        return v
diff --git a/src/windows_use/obs/log_sanitizer.py b/src/windows_use/obs/log_sanitizer.py
new file mode 100644
index 00000000..4baf1ecb
--- /dev/null
+++ b/src/windows_use/obs/log_sanitizer.py
@@ -0,0 +1,15 @@
+from __future__ import annotations
+
+import re
+
+TOKEN_RE = re.compile(r"[A-Za-z0-9]{32,}")
+EMAIL_RE = re.compile(r"[\w\.-]+@[\w\.-]+")
+PHONE_RE = re.compile(r"\b\d{9,15}\b")
+
+
+def redact(text: str) -> str:
+    """Mask obvious secrets from log text."""
+    text = TOKEN_RE.sub("[REDACTED]", text)
+    text = EMAIL_RE.sub("[REDACTED_EMAIL]", text)
+    text = PHONE_RE.sub("[REDACTED_PHONE]", text)
+    return text
diff --git a/src/windows_use/security/secret_store.py b/src/windows_use/security/secret_store.py
new file mode 100644
index 00000000..1b2ccc51
--- /dev/null
+++ b/src/windows_use/security/secret_store.py
@@ -0,0 +1,36 @@
+"""Simple wrapper around Windows Credential Manager via keyring."""
+
+from __future__ import annotations
+
+from typing import Optional
+
+try:
+    import keyring
+except Exception:  # pragma: no cover - keyring may not be available on CI
+    keyring = None
+
+_SERVICE = "jarvis-ai"
+
+
+def get_secret(name: str) -> Optional[str]:
+    if not keyring:
+        return None
+    try:
+        return keyring.get_password(_SERVICE, name)
+    except Exception:
+        return None
+
+
+def set_secret(name: str, value: str) -> None:
+    if not keyring:
+        raise RuntimeError("keyring backend not available")
+    keyring.set_password(_SERVICE, name, value)
+
+
+def delete_secret(name: str) -> None:
+    if not keyring:
+        return
+    try:
+        keyring.delete_password(_SERVICE, name)
+    except Exception:
+        pass
diff --git a/src/windows_use/tools/ps_shell.py b/src/windows_use/tools/ps_shell.py
index 221c803c..5a9bdf62 100644
--- a/src/windows_use/tools/ps_shell.py
+++ b/src/windows_use/tools/ps_shell.py
@@ -10,13 +10,13 @@
 from typing import Dict, List, Optional, Tuple, Any
 from dataclasses import dataclass
 from pathlib import Path
-import tempfile
 import os
 
 
 @dataclass
 class PSResult:
     """Result from PowerShell command execution."""
+
     success: bool
     output: str
     error: str
@@ -26,57 +26,89 @@ class PSResult:
 
 class PowerShellManager:
     """Safe PowerShell operations with validation and logging."""
-    
+
     # Whitelist of safe PowerShell cmdlets
     SAFE_CMDLETS = {
         # File and folder operations
-        'Get-ChildItem', 'Get-Item', 'Get-Content', 'Set-Content',
-        'Copy-Item', 'Move-Item', 'Remove-Item', 'New-Item',
-        'Test-Path', 'Resolve-Path', 'Split-Path', 'Join-Path',
-        
+        "Get-ChildItem",
+        "Get-Item",
+        "Get-Content",
+        "Set-Content",
+        "Copy-Item",
+        "Move-Item",
+        "Remove-Item",
+        "New-Item",
+        "Test-Path",
+        "Resolve-Path",
+        "Split-Path",
+        "Join-Path",
         # Process management
-        'Get-Process', 'Stop-Process', 'Start-Process',
-        
+        "Get-Process",
+        "Stop-Process",
+        "Start-Process",
         # Service management (read-only by default)
-        'Get-Service', 'Get-WmiObject',
-        
+        "Get-Service",
+        "Get-WmiObject",
         # System information
-        'Get-ComputerInfo', 'Get-SystemInfo', 'Get-Date',
-        'Get-TimeZone', 'Get-Culture', 'Get-Host',
-        
+        "Get-ComputerInfo",
+        "Get-SystemInfo",
+        "Get-Date",
+        "Get-TimeZone",
+        "Get-Culture",
+        "Get-Host",
         # Network (read-only)
-        'Get-NetAdapter', 'Get-NetIPAddress', 'Get-NetRoute',
-        'Test-NetConnection', 'Resolve-DnsName',
-        
+        "Get-NetAdapter",
+        "Get-NetIPAddress",
+        "Get-NetRoute",
+        "Test-NetConnection",
+        "Resolve-DnsName",
         # Registry (read-only by default)
-        'Get-ItemProperty', 'Get-ChildItem',
-        
+        "Get-ItemProperty",
+        "Get-ChildItem",
         # Archive operations
-        'Compress-Archive', 'Expand-Archive',
-        
+        "Compress-Archive",
+        "Expand-Archive",
         # Text processing
-        'Select-String', 'ConvertTo-Json', 'ConvertFrom-Json',
-        'ConvertTo-Csv', 'ConvertFrom-Csv',
-        
+        "Select-String",
+        "ConvertTo-Json",
+        "ConvertFrom-Json",
+        "ConvertTo-Csv",
+        "ConvertFrom-Csv",
         # Basic utilities
-        'Write-Output', 'Write-Host', 'Measure-Object',
-        'Sort-Object', 'Group-Object', 'Where-Object', 'ForEach-Object'
+        "Write-Output",
+        "Write-Host",
+        "Measure-Object",
+        "Sort-Object",
+        "Group-Object",
+        "Where-Object",
+        "ForEach-Object",
     }
-    
+
     # Dangerous cmdlets that require explicit approval
     DANGEROUS_CMDLETS = {
-        'Remove-Item', 'Remove-ItemProperty', 'Clear-Content',
-        'Stop-Process', 'Stop-Service', 'Restart-Service',
-        'Set-ItemProperty', 'New-ItemProperty', 'Remove-ItemProperty',
-        'Invoke-Expression', 'Invoke-Command', 'Start-Process'
+        "Remove-Item",
+        "Remove-ItemProperty",
+        "Clear-Content",
+        "Stop-Process",
+        "Stop-Service",
+        "Restart-Service",
+        "Set-ItemProperty",
+        "New-ItemProperty",
+        "Remove-ItemProperty",
+        "Invoke-Expression",
+        "Invoke-Command",
+        "Start-Process",
     }
-    
-    def __init__(self, logger: Optional[logging.Logger] = None, 
-                 require_approval_for_dangerous: bool = True):
+
+    def __init__(
+        self,
+        logger: Optional[logging.Logger] = None,
+        require_approval_for_dangerous: bool = True,
+    ):
         self.logger = logger or logging.getLogger(__name__)
         self.require_approval = require_approval_for_dangerous
         self._validate_powershell_available()
-        
+
     def _validate_powershell_available(self) -> bool:
         """Check if PowerShell is available on the system."""
         try:
@@ -84,7 +116,7 @@ def _validate_powershell_available(self) -> bool:
                 ["powershell", "-Command", "$PSVersionTable.PSVersion"],
                 capture_output=True,
                 text=True,
-                timeout=10
+                timeout=10,
             )
             if result.returncode == 0:
                 self.logger.info(f"PowerShell available: {result.stdout.strip()}")
@@ -94,47 +126,47 @@ def _validate_powershell_available(self) -> bool:
         except (subprocess.TimeoutExpired, FileNotFoundError, RuntimeError) as e:
             self.logger.error(f"PowerShell validation failed: {e}")
             raise RuntimeError("PowerShell is not available on this system")
-    
+
     def _validate_command_safety(self, command: str) -> Tuple[bool, str]:
         """Validate if a PowerShell command is safe to execute.
-        
+
         Args:
             command: PowerShell command to validate
-            
+
         Returns:
             Tuple of (is_safe, reason)
         """
         # Remove comments and normalize whitespace
-        clean_command = re.sub(r'#.*$', '', command, flags=re.MULTILINE)
-        clean_command = ' '.join(clean_command.split())
-        
+        clean_command = re.sub(r"#.*$", "", command, flags=re.MULTILINE)
+        clean_command = " ".join(clean_command.split())
+
         # Check for dangerous patterns
         dangerous_patterns = [
-            r'Invoke-Expression',
-            r'IEX\s',
-            r'&\s*\(',
-            r'cmd\.exe',
-            r'powershell\.exe.*-EncodedCommand',
-            r'DownloadString',
-            r'DownloadFile',
-            r'WebClient',
-            r'Net\.WebClient',
-            r'Start-BitsTransfer',
-            r'Invoke-WebRequest.*-OutFile',
-            r'curl.*-o',
-            r'wget',
-            r'Format-.*-Force',
-            r'Remove-.*-Recurse.*-Force'
+            r"Invoke-Expression",
+            r"IEX\s",
+            r"&\s*\(",
+            r"cmd\.exe",
+            r"powershell\.exe.*-EncodedCommand",
+            r"DownloadString",
+            r"DownloadFile",
+            r"WebClient",
+            r"Net\.WebClient",
+            r"Start-BitsTransfer",
+            r"Invoke-WebRequest.*-OutFile",
+            r"curl.*-o",
+            r"wget",
+            r"Format-.*-Force",
+            r"Remove-.*-Recurse.*-Force",
         ]
-        
+
         for pattern in dangerous_patterns:
             if re.search(pattern, clean_command, re.IGNORECASE):
                 return False, f"Dangerous pattern detected: {pattern}"
-        
+
         # Extract cmdlets from command
-        cmdlet_pattern = r'([A-Za-z]+-[A-Za-z]+)'
+        cmdlet_pattern = r"([A-Za-z]+-[A-Za-z]+)"
         cmdlets = re.findall(cmdlet_pattern, clean_command)
-        
+
         # Check if all cmdlets are in safe list
         for cmdlet in cmdlets:
             if cmdlet not in self.SAFE_CMDLETS:
@@ -143,26 +175,31 @@ def _validate_command_safety(self, command: str) -> Tuple[bool, str]:
                         return False, f"Dangerous cmdlet requires approval: {cmdlet}"
                 else:
                     return False, f"Unknown/unsafe cmdlet: {cmdlet}"
-        
+
         return True, "Command appears safe"
-    
-    def execute_command(self, command: str, timeout: int = 30, 
-                       working_directory: Optional[str] = None,
-                       force_approve: bool = False) -> PSResult:
+
+    def execute_command(
+        self,
+        command: str,
+        timeout: int = 30,
+        working_directory: Optional[str] = None,
+        force_approve: bool = False,
+    ) -> PSResult:
         """Execute a PowerShell command safely.
-        
+
         Args:
             command: PowerShell command to execute
             timeout: Execution timeout in seconds
             working_directory: Working directory for command execution
             force_approve: Skip safety validation (use with caution)
-            
+
         Returns:
             PSResult object with execution details
         """
         import time
+
         start_time = time.time()
-        
+
         # Validate command safety
         if not force_approve:
             is_safe, reason = self._validate_command_safety(command)
@@ -173,47 +210,59 @@ def execute_command(self, command: str, timeout: int = 30,
                     output="",
                     error=f"Command rejected for safety: {reason}",
                     exit_code=-1,
-                    execution_time=time.time() - start_time
+                    execution_time=time.time() - start_time,
                 )
-        
+
         try:
             # Prepare PowerShell command
-            ps_cmd = ["powershell", "-NoProfile", "-ExecutionPolicy", "Bypass", "-Command"]
-            
-            # Set working directory if specified
+            ps_cmd = [
+                "powershell",
+                "-NoProfile",
+                "-ExecutionPolicy",
+                "Bypass",
+                "-Command",
+                command,
+            ]
+
             if working_directory:
-                command = f"Set-Location '{working_directory}'; {command}"
-            
-            ps_cmd.append(command)
-            
+                ps_cmd[-1] = f"Set-Location '{working_directory}'; {command}"
+
             self.logger.info(f"Executing PowerShell command: {command[:100]}...")
-            
-            # Execute command
+
+            env = os.environ.copy()
+            env["__PSLockdownPolicy"] = "4"
+
             result = subprocess.run(
                 ps_cmd,
                 capture_output=True,
                 text=True,
                 timeout=timeout,
-                cwd=working_directory
+                cwd=working_directory,
+                env=env,
+                shell=False,
             )
-            
+
             execution_time = time.time() - start_time
-            
+
             ps_result = PSResult(
                 success=result.returncode == 0,
                 output=result.stdout,
                 error=result.stderr,
                 exit_code=result.returncode,
-                execution_time=execution_time
+                execution_time=execution_time,
             )
-            
+
             if ps_result.success:
-                self.logger.info(f"Command executed successfully in {execution_time:.2f}s")
+                self.logger.info(
+                    f"Command executed successfully in {execution_time:.2f}s"
+                )
             else:
-                self.logger.error(f"Command failed with exit code {result.returncode}: {result.stderr}")
-            
+                self.logger.error(
+                    f"Command failed with exit code {result.returncode}: {result.stderr}"
+                )
+
             return ps_result
-            
+
         except subprocess.TimeoutExpired:
             execution_time = time.time() - start_time
             error_msg = f"Command timeout after {timeout} seconds"
@@ -223,7 +272,7 @@ def execute_command(self, command: str, timeout: int = 30,
                 output="",
                 error=error_msg,
                 exit_code=-2,
-                execution_time=execution_time
+                execution_time=execution_time,
             )
         except Exception as e:
             execution_time = time.time() - start_time
@@ -234,18 +283,22 @@ def execute_command(self, command: str, timeout: int = 30,
                 output="",
                 error=error_msg,
                 exit_code=-3,
-                execution_time=execution_time
+                execution_time=execution_time,
             )
-    
-    def execute_script_file(self, script_path: str, parameters: Optional[Dict[str, Any]] = None,
-                           timeout: int = 60) -> PSResult:
+
+    def execute_script_file(
+        self,
+        script_path: str,
+        parameters: Optional[Dict[str, Any]] = None,
+        timeout: int = 60,
+    ) -> PSResult:
         """Execute a PowerShell script file.
-        
+
         Args:
             script_path: Path to PowerShell script file
             parameters: Script parameters
             timeout: Execution timeout in seconds
-            
+
         Returns:
             PSResult object with execution details
         """
@@ -255,9 +308,9 @@ def execute_script_file(self, script_path: str, parameters: Optional[Dict[str, A
                 output="",
                 error=f"Script file not found: {script_path}",
                 exit_code=-1,
-                execution_time=0.0
+                execution_time=0.0,
             )
-        
+
         # Build command with parameters
         command = f"& '{script_path}'"
         if parameters:
@@ -268,12 +321,12 @@ def execute_script_file(self, script_path: str, parameters: Optional[Dict[str, A
                 else:
                     param_strings.append(f"-{key} {value}")
             command += " " + " ".join(param_strings)
-        
+
         return self.execute_command(command, timeout=timeout, force_approve=True)
-    
+
     def get_system_info(self) -> Dict[str, Any]:
         """Get basic system information using PowerShell.
-        
+
         Returns:
             Dictionary with system information
         """
@@ -289,7 +342,7 @@ def get_system_info(self) -> Dict[str, Any]:
         $info['PowerShellVersion'] = $PSVersionTable.PSVersion.ToString()
         $info | ConvertTo-Json
         """
-        
+
         result = self.execute_command(command)
         if result.success:
             try:
@@ -300,21 +353,25 @@ def get_system_info(self) -> Dict[str, Any]:
         else:
             self.logger.error(f"Failed to get system info: {result.error}")
             return {}
-    
-    def get_running_processes(self, name_filter: Optional[str] = None) -> List[Dict[str, Any]]:
+
+    def get_running_processes(
+        self, name_filter: Optional[str] = None
+    ) -> List[Dict[str, Any]]:
         """Get list of running processes.
-        
+
         Args:
             name_filter: Optional process name filter
-            
+
         Returns:
             List of process information dictionaries
         """
         command = "Get-Process"
         if name_filter:
             command += f" -Name '*{name_filter}*'"
-        command += " | Select-Object Name, Id, CPU, WorkingSet, StartTime | ConvertTo-Json"
-        
+        command += (
+            " | Select-Object Name, Id, CPU, WorkingSet, StartTime | ConvertTo-Json"
+        )
+
         result = self.execute_command(command)
         if result.success:
             try:
@@ -326,40 +383,42 @@ def get_running_processes(self, name_filter: Optional[str] = None) -> List[Dict[
         else:
             self.logger.error(f"Failed to get process list: {result.error}")
             return []
-    
+
     def compress_folder(self, source_path: str, destination_path: str) -> PSResult:
         """Compress a folder to ZIP archive.
-        
+
         Args:
             source_path: Source folder path
             destination_path: Destination ZIP file path
-            
+
         Returns:
             PSResult object
         """
         command = f"Compress-Archive -Path '{source_path}' -DestinationPath '{destination_path}' -Force"
         return self.execute_command(command)
-    
+
     def extract_archive(self, archive_path: str, destination_path: str) -> PSResult:
         """Extract ZIP archive to destination folder.
-        
+
         Args:
             archive_path: ZIP file path
             destination_path: Destination folder path
-            
+
         Returns:
             PSResult object
         """
         command = f"Expand-Archive -Path '{archive_path}' -DestinationPath '{destination_path}' -Force"
         return self.execute_command(command)
-    
-    def test_network_connection(self, target: str, port: Optional[int] = None) -> Dict[str, Any]:
+
+    def test_network_connection(
+        self, target: str, port: Optional[int] = None
+    ) -> Dict[str, Any]:
         """Test network connection to target.
-        
+
         Args:
             target: Target hostname or IP
             port: Optional port number
-            
+
         Returns:
             Connection test results
         """
@@ -367,7 +426,7 @@ def test_network_connection(self, target: str, port: Optional[int] = None) -> Di
         if port:
             command += f" -Port {port}"
         command += " | ConvertTo-Json"
-        
+
         result = self.execute_command(command)
         if result.success:
             try:
@@ -387,17 +446,17 @@ def test_network_connection(self, target: str, port: Optional[int] = None) -> Di
     "system_uptime": "(Get-Date) - (Get-CimInstance Win32_OperatingSystem).LastBootUpTime",
     "installed_programs": "Get-WmiObject -Class Win32_Product | Select-Object Name, Version, Vendor",
     "network_adapters": "Get-NetAdapter | Select-Object Name, InterfaceDescription, LinkSpeed, Status",
-    "services_status": "Get-Service | Where-Object {$_.Status -eq 'Running'} | Select-Object Name, Status, StartType"
+    "services_status": "Get-Service | Where-Object {$_.Status -eq 'Running'} | Select-Object Name, Status, StartType",
 }
 
 
 def get_snippet(name: str, **kwargs) -> Optional[str]:
     """Get a common PowerShell snippet with parameter substitution.
-    
+
     Args:
         name: Snippet name
         **kwargs: Parameters for snippet formatting
-        
+
     Returns:
         Formatted PowerShell command or None if snippet not found
     """
@@ -405,6 +464,8 @@ def get_snippet(name: str, **kwargs) -> Optional[str]:
         try:
             return COMMON_SNIPPETS[name].format(**kwargs)
         except KeyError as e:
-            logging.getLogger(__name__).error(f"Missing parameter for snippet {name}: {e}")
+            logging.getLogger(__name__).error(
+                f"Missing parameter for snippet {name}: {e}"
+            )
             return None
-    return None
\ No newline at end of file
+    return None
diff --git a/src/windows_use/tools/tts_piper.py b/src/windows_use/tools/tts_piper.py
index 2db90854..23869b79 100644
--- a/src/windows_use/tools/tts_piper.py
+++ b/src/windows_use/tools/tts_piper.py
@@ -7,42 +7,44 @@
 - Voice configuration dan customization
 """
 
-import asyncio
 import logging
-import os
-import tempfile
 import threading
 from pathlib import Path
-from typing import Optional, Dict, Any, List
+from typing import Optional, Dict, Any
 
 import numpy as np
 
 try:
     import sounddevice as sd
     import wave
-except ImportError as e:
+except (ImportError, OSError) as e:
     logging.warning(f"Audio dependencies not installed: {e}")
     logging.warning("Install with: pip install sounddevice numpy")
 
 try:
     # Piper TTS - install dengan: pip install piper-tts
     from piper import PiperVoice
+    import onnxruntime as ort
 except ImportError:
     logging.warning("Piper TTS not installed")
     logging.warning("Install with: pip install piper-tts")
     PiperVoice = None
+    ort = None
+
 
 class TTSPiper:
     """Text-to-Speech menggunakan Piper"""
-    
-    def __init__(self, 
-                 voice_model: str = "id_ID-fajri-medium",
-                 sample_rate: int = 22050,
-                 speed: float = 1.0,
-                 volume: float = 0.8):
+
+    def __init__(
+        self,
+        voice_model: str = "id_ID-fajri-medium",
+        sample_rate: int = 22050,
+        speed: float = 1.0,
+        volume: float = 0.8,
+    ):
         """
         Initialize TTS Piper
-        
+
         Args:
             voice_model: Piper voice model untuk bahasa Indonesia
             sample_rate: Audio sample rate
@@ -53,77 +55,86 @@ def __init__(self,
         self.sample_rate = sample_rate
         self.speed = speed
         self.volume = volume
-        
+
         self.voice = None
+        self.execution_provider = "CPUExecutionProvider"
         self.is_speaking = False
-        
+
         # Voice models yang tersedia untuk bahasa Indonesia
         self.available_voices = {
             "id_ID-fajri-medium": "Suara pria Indonesia (medium quality)",
             "id_ID-fajri-low": "Suara pria Indonesia (low quality, faster)",
             # Tambah voice models lain jika tersedia
         }
-        
+
         self._setup_voice()
-    
+
     def _setup_voice(self):
         """Setup Piper voice model"""
         if PiperVoice is None:
             logging.error("Piper TTS not available")
             return
-        
+
         try:
             # Download dan load voice model jika belum ada
             model_path = self._get_or_download_model()
             if model_path:
-                self.voice = PiperVoice.load(model_path)
+                provider = self.execution_provider
+                if ort:
+                    providers = ort.get_available_providers()
+                    if "CUDAExecutionProvider" in providers:
+                        provider = "CUDAExecutionProvider"
+                        self.execution_provider = provider
+                self.voice = PiperVoice.load(
+                    model_path, provider=self.execution_provider
+                )
                 logging.info(f"Piper voice loaded: {self.voice_model}")
             else:
                 logging.error(f"Failed to load voice model: {self.voice_model}")
-                
+
         except Exception as e:
             logging.error(f"Failed to setup Piper voice: {e}")
-    
+
     def _get_or_download_model(self) -> Optional[str]:
         """Get atau download voice model
-        
+
         Returns:
             Path ke model file atau None jika gagal
         """
         # Implementasi sederhana - dalam production, ini bisa download dari Piper repository
         models_dir = Path.home() / ".piper" / "voices"
         models_dir.mkdir(parents=True, exist_ok=True)
-        
+
         model_file = models_dir / f"{self.voice_model}.onnx"
         config_file = models_dir / f"{self.voice_model}.onnx.json"
-        
+
         if model_file.exists() and config_file.exists():
             return str(model_file)
-        
+
         # Fallback: gunakan voice model default jika ada
         logging.warning(f"Voice model {self.voice_model} not found")
         logging.warning("Please download Piper voice models manually")
         logging.warning("See: https://github.com/rhasspy/piper/releases")
-        
+
         return None
-    
+
     def speak(self, text: str, blocking: bool = True) -> bool:
         """Speak text menggunakan TTS
-        
+
         Args:
             text: Text yang akan diucapkan
             blocking: Jika True, tunggu sampai selesai bicara
-            
+
         Returns:
             True jika berhasil, False jika gagal
         """
         if not self.voice:
             logging.error("Voice model not loaded")
             return False
-        
+
         if not text.strip():
             return False
-        
+
         if blocking:
             return self._speak_sync(text)
         else:
@@ -131,71 +142,71 @@ def speak(self, text: str, blocking: bool = True) -> bool:
             thread.daemon = True
             thread.start()
             return True
-    
+
     def _speak_sync(self, text: str) -> bool:
         """Synchronous speech synthesis dan playback"""
         try:
             self.is_speaking = True
-            
+
             # Generate audio dari text
             audio_data = self._synthesize_audio(text)
             if audio_data is None:
                 return False
-            
+
             # Play audio
             self._play_audio(audio_data)
-            
+
             return True
-            
+
         except Exception as e:
             logging.error(f"Speech synthesis failed: {e}")
             return False
         finally:
             self.is_speaking = False
-    
+
     def _synthesize_audio(self, text: str) -> Optional[np.ndarray]:
         """Synthesize audio dari text
-        
+
         Args:
             text: Input text
-            
+
         Returns:
             Audio data sebagai numpy array atau None jika gagal
         """
         try:
             # Preprocess text
             text = self._preprocess_text(text)
-            
+
             # Generate audio dengan Piper
             audio_stream = self.voice.synthesize(text)
-            
+
             # Convert ke numpy array
             audio_data = np.array(list(audio_stream), dtype=np.float32)
-            
+
             # Apply speed dan volume adjustments
             if self.speed != 1.0:
                 audio_data = self._adjust_speed(audio_data)
-            
+
             audio_data = audio_data * self.volume
-            
+
             return audio_data
-            
+
         except Exception as e:
             logging.error(f"Audio synthesis failed: {e}")
             return None
-    
+
     def _preprocess_text(self, text: str) -> str:
         """Preprocess text untuk TTS
-        
+
         Args:
             text: Raw text
-            
+
         Returns:
             Processed text
         """
         # Normalisasi text untuk bahasa Indonesia
         text = text.strip()
-        
+
         # Replace common abbreviations
         replacements = {
             "&": "dan",
@@ -209,18 +220,18 @@ def _preprocess_text(self, text: str) -> str:
             "₹": "rupee",
             "Rp": "rupiah",
         }
-        
+
         for old, new in replacements.items():
             text = text.replace(old, new)
-        
+
         return text
-    
+
     def _adjust_speed(self, audio_data: np.ndarray) -> np.ndarray:
         """Adjust speech speed
-        
+
         Args:
             audio_data: Original audio data
-            
+
         Returns:
             Speed-adjusted audio data
         """
@@ -228,15 +239,15 @@ def _adjust_speed(self, audio_data: np.ndarray) -> np.ndarray:
         # Untuk implementasi yang lebih baik, gunakan librosa atau similar
         if self.speed == 1.0:
             return audio_data
-        
+
         # Resample untuk mengubah speed
         new_length = int(len(audio_data) / self.speed)
         indices = np.linspace(0, len(audio_data) - 1, new_length)
         return np.interp(indices, np.arange(len(audio_data)), audio_data)
-    
+
     def _play_audio(self, audio_data: np.ndarray):
         """Play audio data
-        
+
         Args:
             audio_data: Audio data untuk diplay
         """
@@ -244,17 +255,17 @@ def _play_audio(self, audio_data: np.ndarray):
             # Play audio menggunakan sounddevice
             sd.play(audio_data, samplerate=self.sample_rate)
             sd.wait()  # Wait sampai selesai
-            
+
         except Exception as e:
             logging.error(f"Audio playback failed: {e}")
-    
+
     def save_to_file(self, text: str, output_path: str) -> bool:
         """Save synthesized speech ke file
-        
+
         Args:
             text: Text yang akan di-synthesize
             output_path: Path output file (.wav)
-            
+
         Returns:
             True jika berhasil, False jika gagal
         """
@@ -262,24 +273,24 @@ def save_to_file(self, text: str, output_path: str) -> bool:
             audio_data = self._synthesize_audio(text)
             if audio_data is None:
                 return False
-            
+
             # Convert ke int16 untuk WAV file
             audio_int16 = (audio_data * 32767).astype(np.int16)
-            
+
             # Save ke WAV file
-            with wave.open(output_path, 'wb') as wav_file:
+            with wave.open(output_path, "wb") as wav_file:
                 wav_file.setnchannels(1)  # Mono
                 wav_file.setsampwidth(2)  # 16-bit
                 wav_file.setframerate(self.sample_rate)
                 wav_file.writeframes(audio_int16.tobytes())
-            
+
             logging.info(f"Audio saved to: {output_path}")
             return True
-            
+
         except Exception as e:
             logging.error(f"Failed to save audio: {e}")
             return False
-    
+
     def stop_speaking(self):
         """Stop current speech"""
         try:
@@ -288,22 +299,22 @@ def stop_speaking(self):
             logging.info("Speech stopped")
         except Exception as e:
             logging.error(f"Failed to stop speech: {e}")
-    
+
     def set_voice(self, voice_model: str) -> bool:
         """Change voice model
-        
+
         Args:
             voice_model: New voice model name
-            
+
         Returns:
             True jika berhasil, False jika gagal
         """
         if voice_model == self.voice_model:
             return True
-        
+
         old_model = self.voice_model
         self.voice_model = voice_model
-        
+
         try:
             self._setup_voice()
             if self.voice:
@@ -314,25 +325,25 @@ def set_voice(self, voice_model: str) -> bool:
                 self.voice_model = old_model
                 self._setup_voice()
                 return False
-                
+
         except Exception as e:
             logging.error(f"Failed to change voice: {e}")
             # Rollback
             self.voice_model = old_model
             self._setup_voice()
             return False
-    
+
     def get_available_voices(self) -> Dict[str, str]:
         """Get list voice models yang tersedia
-        
+
         Returns:
             Dictionary voice models dan descriptions
         """
         return self.available_voices.copy()
-    
+
     def is_voice_available(self) -> bool:
         """Check apakah voice model tersedia
-        
+
         Returns:
             True jika voice tersedia
         """
@@ -342,33 +353,34 @@ def is_voice_available(self) -> bool:
 # Fallback TTS menggunakan Windows SAPI jika Piper tidak tersedia
 class TTSFallback:
     """Fallback TTS menggunakan Windows SAPI"""
-    
+
     def __init__(self, rate: int = 0, volume: float = 0.8):
         self.rate = rate  # -10 to 10
         self.volume = volume  # 0.0 to 1.0
         self.is_speaking = False
-        
+
         try:
             import pyttsx3
+
             self.engine = pyttsx3.init()
-            self.engine.setProperty('rate', 150 + (rate * 25))
-            self.engine.setProperty('volume', volume)
-            
+            self.engine.setProperty("rate", 150 + (rate * 25))
+            self.engine.setProperty("volume", volume)
+
             # Set Indonesian voice jika tersedia
-            voices = self.engine.getProperty('voices')
+            voices = self.engine.getProperty("voices")
             for voice in voices:
-                if 'indonesia' in voice.name.lower() or 'id' in voice.id.lower():
-                    self.engine.setProperty('voice', voice.id)
+                if "indonesia" in voice.name.lower() or "id" in voice.id.lower():
+                    self.engine.setProperty("voice", voice.id)
                     break
-                    
+
         except ImportError:
             logging.error("pyttsx3 not installed. Install with: pip install pyttsx3")
             self.engine = None
-    
+
     def speak(self, text: str, blocking: bool = True) -> bool:
         if not self.engine or not text.strip():
             return False
-        
+
         try:
             self.is_speaking = True
             if blocking:
@@ -385,14 +397,14 @@ def speak(self, text: str, blocking: bool = True) -> bool:
         finally:
             if blocking:
                 self.is_speaking = False
-    
+
     def _speak_async(self, text: str):
         try:
             self.engine.say(text)
             self.engine.runAndWait()
         finally:
             self.is_speaking = False
-    
+
     def stop_speaking(self):
         if self.engine:
             self.engine.stop()
@@ -402,11 +414,11 @@ def stop_speaking(self):
 # Factory function untuk create TTS instance
 def create_tts(prefer_piper: bool = True, **kwargs) -> Any:
     """Create TTS instance
-    
+
     Args:
         prefer_piper: Prefer Piper over fallback TTS
         **kwargs: Arguments untuk TTS constructor
-        
+
     Returns:
         TTS instance (TTSPiper atau TTSFallback)
     """
@@ -414,7 +426,7 @@ def create_tts(prefer_piper: bool = True, **kwargs) -> Any:
         tts = TTSPiper(**kwargs)
         if tts.is_voice_available():
             return tts
-    
+
     # Fallback ke Windows SAPI
     logging.info("Using fallback TTS (Windows SAPI)")
     return TTSFallback(**kwargs)
@@ -423,35 +435,36 @@ def create_tts(prefer_piper: bool = True, **kwargs) -> Any:
 # Example usage dan testing
 if __name__ == "__main__":
     logging.basicConfig(level=logging.INFO)
-    
+
     print("TTS Piper Test")
     print("1. Piper TTS (preferred)")
     print("2. Fallback TTS (Windows SAPI)")
-    
+
     choice = input("Choose TTS engine (1/2): ")
-    
+
     if choice == "1":
         tts = TTSPiper()
     elif choice == "2":
         tts = TTSFallback()
     else:
         tts = create_tts()
-    
+
     # Test speech
     test_texts = [
         "Halo, saya adalah asisten suara Windows.",
         "Saya dapat membantu Anda mengendalikan komputer dengan suara.",
-        "Silakan berikan perintah Anda."
+        "Silakan berikan perintah Anda.",
     ]
-    
+
     for text in test_texts:
         print(f"Speaking: {text}")
         success = tts.speak(text, blocking=True)
         if not success:
             print("Failed to speak")
             break
-        
+
         import time
+
         time.sleep(0.5)
-    
-    print("TTS test completed")
\ No newline at end of file
+
+    print("TTS test completed")
diff --git a/src/windows_use/tools/voice_input.py b/src/windows_use/tools/voice_input.py
index 8b31b051..ca1c4ade 100644
--- a/src/windows_use/tools/voice_input.py
+++ b/src/windows_use/tools/voice_input.py
@@ -7,34 +7,44 @@
 - Audio recording dan preprocessing
 """
 
-import asyncio
-import threading
 import time
-from typing import Optional, Callable, Dict, Any
+from typing import Optional, Callable
 import logging
+import os
+
+try:
+    import torch
+except ImportError:
+    torch = None
 
 try:
     import sounddevice as sd
     import numpy as np
     import whisper
     import webrtcvad
-except ImportError as e:
+except (ImportError, OSError) as e:
     logging.warning(f"Voice dependencies not installed: {e}")
-    logging.warning("Install with: pip install sounddevice numpy openai-whisper webrtcvad")
+    logging.warning(
+        "Install with: pip install sounddevice numpy openai-whisper webrtcvad"
+    )
+
 
 class VoiceInput:
     """Voice Input handler dengan STT dan VAD"""
-    
-    def __init__(self, 
-                 model_name: str = "base",
-                 sample_rate: int = 16000,
-                 chunk_duration: float = 0.03,  # 30ms chunks untuk VAD
-                 vad_aggressiveness: int = 2,
-                 silence_threshold: float = 2.0,  # detik silence sebelum stop
-                 push_to_talk_key: str = "space"):
+
+    def __init__(
+        self,
+        model_name: str = "base",
+        sample_rate: int = 16000,
+        chunk_duration: float = 0.03,  # 30ms chunks untuk VAD
+        vad_aggressiveness: int = 2,
+        silence_threshold: float = 2.0,  # detik silence sebelum stop
+        push_to_talk_key: str = "space",
+        device: str = "auto",
+    ):
         """
         Initialize Voice Input
-        
+
         Args:
             model_name: Whisper model (tiny, base, small, medium, large)
             sample_rate: Audio sample rate (16kHz optimal untuk Whisper)
@@ -49,51 +59,60 @@ def __init__(self,
         self.chunk_size = int(sample_rate * chunk_duration)
         self.silence_threshold = silence_threshold
         self.push_to_talk_key = push_to_talk_key
-        
+        self.device = device
+
         # Initialize components
         self.whisper_model = None
         self.vad = None
         self.is_recording = False
         self.audio_buffer = []
         self.last_speech_time = 0
-        
+
         # Callbacks
         self.on_speech_start: Optional[Callable] = None
         self.on_speech_end: Optional[Callable] = None
         self.on_transcription: Optional[Callable[[str], None]] = None
-        
+
         self._setup_components()
-        
+
     def _setup_components(self):
         """Setup Whisper dan VAD components"""
         try:
             # Check if whisper is available
-            if 'whisper' in globals():
+            if "whisper" in globals():
                 # Load Whisper model
                 logging.info(f"Loading Whisper model: {self.model_name}")
-                self.whisper_model = whisper.load_model(self.model_name)
+                device = os.getenv("JARVIS_STT_DEVICE", self.device)
+                if device == "auto":
+                    if torch and torch.cuda.is_available():
+                        device = "cuda"
+                    else:
+                        device = "cpu"
+                self.whisper_model = whisper.load_model(self.model_name, device=device)
             else:
                 logging.warning("Whisper not available, voice recognition disabled")
                 self.whisper_model = None
-            
+
             # Setup VAD
-            if 'webrtcvad' in globals():
+            if "webrtcvad" in globals():
                 self.vad = webrtcvad.Vad()
                 self.vad.set_mode(2)  # Aggressiveness mode
             else:
-                logging.warning("WebRTC VAD not available, voice activity detection disabled")
+                logging.warning(
+                    "WebRTC VAD not available, voice activity detection disabled"
+                )
                 self.vad = None
-            
+
             logging.info("Voice components initialized successfully")
-            
+
         except Exception as e:
             logging.error(f"Failed to setup voice components: {e}")
             self.whisper_model = None
             self.vad = None
-    
+
     def start_listening(self, mode: str = "vad") -> None:
         """Start listening untuk voice input
-        
+
         Args:
             mode: "vad" untuk voice activity detection, "ptt" untuk push-to-talk
         """
@@ -103,19 +122,20 @@ def start_listening(self, mode: str = "vad") -> None:
             self._start_ptt_listening()
         else:
             raise ValueError("Mode must be 'vad' or 'ptt'")
-    
+
     def _start_vad_listening(self):
         """Start VAD-based listening"""
+
         def audio_callback(indata, frames, time, status):
             if status:
                 logging.warning(f"Audio callback status: {status}")
-            
+
             # Convert to int16 untuk VAD
             audio_int16 = (indata[:, 0] * 32767).astype(np.int16)
-            
+
             # Check voice activity
             is_speech = self.vad.is_speech(audio_int16.tobytes(), self.sample_rate)
-            
+
             if is_speech:
                 if not self.is_recording:
                     self.is_recording = True
@@ -123,28 +143,30 @@ def audio_callback(indata, frames, time, status):
                     if self.on_speech_start:
                         self.on_speech_start()
                     logging.info("Speech detected, starting recording")
-                
+
                 self.audio_buffer.append(audio_int16)
                 self.last_speech_time = time.time()
-                
+
             elif self.is_recording:
                 # Check if silence duration exceeded threshold
                 silence_duration = time.time() - self.last_speech_time
                 if silence_duration > self.silence_threshold:
                     self._process_recorded_audio()
-        
+
         # Start audio stream
         logging.info("Starting VAD listening...")
-        with sd.InputStream(callback=audio_callback,
-                          channels=1,
-                          samplerate=self.sample_rate,
-                          blocksize=self.chunk_size):
+        with sd.InputStream(
+            callback=audio_callback,
+            channels=1,
+            samplerate=self.sample_rate,
+            blocksize=self.chunk_size,
+        ):
             try:
                 while True:
                     time.sleep(0.1)
             except KeyboardInterrupt:
                 logging.info("Stopping VAD listening")
-    
+
     def _start_ptt_listening(self):
         """Start Push-to-Talk listening"""
         try:
@@ -153,7 +175,7 @@ def _start_ptt_listening(self):
             logging.error("keyboard library required for PTT mode")
             logging.error("Install with: pip install keyboard")
             return
-        
+
         def on_key_press():
             if not self.is_recording:
                 self.is_recording = True
@@ -162,83 +184,86 @@ def on_key_press():
                     self.on_speech_start()
                 logging.info("PTT activated, recording...")
                 self._start_recording()
-        
+
         def on_key_release():
             if self.is_recording:
                 self._process_recorded_audio()
-        
+
         # Setup keyboard hooks
         keyboard.on_press_key(self.push_to_talk_key, lambda _: on_key_press())
         keyboard.on_release_key(self.push_to_talk_key, lambda _: on_key_release())
-        
+
         logging.info(f"PTT mode active. Hold '{self.push_to_talk_key}' to talk")
         keyboard.wait()  # Keep listening
-    
+
     def _start_recording(self):
         """Start recording audio untuk PTT mode"""
+
         def audio_callback(indata, frames, time, status):
             if self.is_recording:
                 audio_int16 = (indata[:, 0] * 32767).astype(np.int16)
                 self.audio_buffer.append(audio_int16)
-        
-        self.stream = sd.InputStream(callback=audio_callback,
-                                   channels=1,
-                                   samplerate=self.sample_rate,
-                                   blocksize=self.chunk_size)
+
+        self.stream = sd.InputStream(
+            callback=audio_callback,
+            channels=1,
+            samplerate=self.sample_rate,
+            blocksize=self.chunk_size,
+        )
         self.stream.start()
-    
+
     def _process_recorded_audio(self):
         """Process recorded audio dengan Whisper STT"""
         if not self.audio_buffer:
             return
-        
+
         self.is_recording = False
-        if hasattr(self, 'stream'):
+        if hasattr(self, "stream"):
             self.stream.stop()
             self.stream.close()
-        
+
         if self.on_speech_end:
             self.on_speech_end()
-        
+
         # Combine audio chunks
         audio_data = np.concatenate(self.audio_buffer)
-        
+
         # Convert to float32 untuk Whisper
         audio_float32 = audio_data.astype(np.float32) / 32767.0
-        
+
         # Transcribe dengan Whisper
         try:
             logging.info("Transcribing audio...")
             result = self.whisper_model.transcribe(audio_float32, language="id")
             text = result["text"].strip()
-            
+
             if text:
                 logging.info(f"Transcription: {text}")
                 if self.on_transcription:
                     self.on_transcription(text)
             else:
                 logging.info("No speech detected in audio")
-                
+
         except Exception as e:
             logging.error(f"Transcription failed: {e}")
-        
+
         # Clear buffer
         self.audio_buffer = []
-    
+
     def stop_listening(self):
         """Stop voice input"""
         self.is_recording = False
-        if hasattr(self, 'stream'):
+        if hasattr(self, "stream"):
             self.stream.stop()
             self.stream.close()
         logging.info("Voice input stopped")
-    
+
     def transcribe_file(self, audio_file_path: str) -> str:
         """Transcribe audio file
-        
+
         Args:
             audio_file_path: Path ke audio file
-            
+
         Returns:
             Transcribed text
         """
@@ -253,28 +278,28 @@ def transcribe_file(self, audio_file_path: str) -> str:
 # Example usage dan testing
 if __name__ == "__main__":
     logging.basicConfig(level=logging.INFO)
-    
+
     def on_transcription(text: str):
         print(f"\n🎤 Transcription: {text}\n")
-    
+
     def on_speech_start():
         print("🔴 Recording started...")
-    
+
     def on_speech_end():
         print("⏹️ Recording stopped, processing...")
-    
+
     # Initialize voice input
     voice = VoiceInput(model_name="base")
     voice.on_transcription = on_transcription
     voice.on_speech_start = on_speech_start
     voice.on_speech_end = on_speech_end
-    
+
     print("Voice Input Test")
     print("1. VAD mode (automatic)")
     print("2. PTT mode (press space)")
-    
+
     choice = input("Choose mode (1/2): ")
-    
+
     try:
         if choice == "1":
             voice.start_listening("vad")
@@ -284,4 +309,4 @@ def on_speech_end():
             print("Invalid choice")
     except KeyboardInterrupt:
         voice.stop_listening()
-        print("\nVoice input stopped")
\ No newline at end of file
+        print("\nVoice input stopped")
diff --git a/src/windows_use/utils/logger.py b/src/windows_use/utils/logger.py
index 0c836db6..cfc1e03c 100644
--- a/src/windows_use/utils/logger.py
+++ b/src/windows_use/utils/logger.py
@@ -25,6 +25,8 @@
 import threading
 from contextlib import contextmanager
 
+from ..obs.log_sanitizer import redact
+
 class LogLevel(Enum):
     """Log levels untuk structured logging"""
     DEBUG = "debug"
@@ -165,19 +167,20 @@ def log_event(self, event_type: EventType, message: str,
             component: Component name
             trace_id: Trace ID for request tracking
         """
-        # Merge context
         merged_context = self._get_context().copy()
         if context:
             merged_context.update(context)
-        
-        # Create log entry
+
+        sanitized_context = {k: redact(str(v)) for k, v in merged_context.items()}
+        message = redact(message)
+
         entry = LogEntry(
             timestamp=datetime.utcnow().isoformat() + "Z",
             session_id=self.session_id,
             event_type=event_type.value,
             level=level.value,
             message=message,
-            context=merged_context,
+            context=sanitized_context,
             duration_ms=duration_ms,
             error_details=error_details,
             user_id=user_id,
diff --git a/src/windows_use/utils/rate_limit.py b/src/windows_use/utils/rate_limit.py
new file mode 100644
index 00000000..181a3bb2
--- /dev/null
+++ b/src/windows_use/utils/rate_limit.py
@@ -0,0 +1,31 @@
+from __future__ import annotations
+
+import time
+from functools import wraps
+from typing import Callable
+
+
+def rate_limit(max_calls: int, period: float) -> Callable:
+    tokens = max_calls
+    last = time.monotonic()
+
+    def decorator(func: Callable) -> Callable:
+        @wraps(func)
+        def wrapper(*args, **kwargs):
+            nonlocal tokens, last
+            now = time.monotonic()
+            tokens += (now - last) * (max_calls / period)
+            if tokens > max_calls:
+                tokens = max_calls
+            if tokens < 1:
+                sleep_for = (1 - tokens) * (period / max_calls)
+                time.sleep(sleep_for)
+                now = time.monotonic()
+                tokens += (now - last) * (max_calls / period)
+            tokens -= 1
+            last = now
+            return func(*args, **kwargs)
+
+        return wrapper
+
+    return decorator
diff --git a/src/windows_use/utils/retry.py b/src/windows_use/utils/retry.py
new file mode 100644
index 00000000..501bb332
--- /dev/null
+++ b/src/windows_use/utils/retry.py
@@ -0,0 +1,32 @@
+from __future__ import annotations
+
+import random
+import time
+from functools import wraps
+from typing import Callable, Iterable, Tuple, Type
+
+
+def retry(
+    exceptions: Iterable[Type[BaseException]],
+    tries: int = 3,
+    backoff: float = 0.5,
+    jitter: bool = True,
+) -> Callable:
+    exceptions_tuple: Tuple[Type[BaseException], ...] = tuple(exceptions)
+
+    def decorator(func: Callable) -> Callable:
+        @wraps(func)
+        def wrapper(*args, **kwargs):
+            delay = backoff
+            for attempt in range(tries - 1):
+                try:
+                    return func(*args, **kwargs)
+                except exceptions_tuple:
+                    sleep = delay + (random.uniform(0, delay) if jitter else 0)
+                    time.sleep(sleep)
+                    delay *= 2
+            return func(*args, **kwargs)
+
+        return wrapper
+
+    return decorator
diff --git a/src/windows_use/web/browser_automation.py b/src/windows_use/web/browser_automation.py
index 05f71619..25eba570 100644
--- a/src/windows_use/web/browser_automation.py
+++ b/src/windows_use/web/browser_automation.py
@@ -15,6 +15,9 @@
 
 from pydantic import BaseModel
 
+from ..utils.rate_limit import rate_limit
+from ..utils.retry import retry
+
 try:
     from selenium import webdriver
     from selenium.webdriver.common.by import By
@@ -111,6 +114,7 @@ def __init__(self, config: BrowserConfig):
         self.driver = None
         self.wait = None
         
+    @retry((Exception,), tries=3, backoff=0.2)
     def start(self):
         """Start browser session"""
         try:
@@ -213,6 +217,7 @@ def _get_browser_options(self):
             
             return options
     
+    @rate_limit(5, 1)
     def navigate_to(self, url: str) -> BrowserAction:
         """Navigate to URL"""
         start_time = time.time()
diff --git a/src/windows_use/web/security_utils.py b/src/windows_use/web/security_utils.py
new file mode 100644
index 00000000..0e42b3ef
--- /dev/null
+++ b/src/windows_use/web/security_utils.py
@@ -0,0 +1,43 @@
+from __future__ import annotations
+
+from enum import Enum
+from typing import Callable, Sequence, Tuple
+from urllib.parse import urlparse
+
+from playwright.async_api import Error as PlaywrightError, TimeoutError as PlaywrightTimeoutError  # type: ignore
+
+
+class Mode(str, Enum):
+    ASSISTIVE = "ASSISTIVE"
+    SEMI_AUTO = "SEMI_AUTO"
+    FULL_AUTO = "FULL_AUTO"
+
+
+def check_allowlist(url: str, allowlist: Sequence[str]) -> None:
+    domain = urlparse(url).hostname or ""
+    if domain not in allowlist:
+        raise ValueError("Domain not allowed")
+
+
+def require_confirmation(
+    mode: Mode, require: bool, confirmer: Callable[[], bool]
+) -> None:
+    if mode in (Mode.ASSISTIVE, Mode.SEMI_AUTO) and require:
+        if not confirmer():
+            raise PermissionError("User confirmation required")
+
+
+def handle_otp(mode: Mode, otp_detected: bool) -> Tuple[Mode, bool]:
+    if otp_detected and mode == Mode.FULL_AUTO:
+        return Mode.SEMI_AUTO, True
+    return mode, False
+
+
+async def goto_with_security(page, url: str, allowlist: Sequence[str]) -> None:
+    check_allowlist(url, allowlist)
+    try:
+        await page.goto(url)
+    except PlaywrightTimeoutError:
+        raise
+    except PlaywrightError:
+        raise
diff --git a/tests/test_config_validation.py b/tests/test_config_validation.py
new file mode 100644
index 00000000..6854dd80
--- /dev/null
+++ b/tests/test_config_validation.py
@@ -0,0 +1,33 @@
+import tempfile
+from pathlib import Path
+
+import pytest
+
+from windows_use.config_loader import load_models_config, load_security_config
+
+
+def test_security_config_allowlist_empty():
+    data = "mode_default: ASSISTIVE\nweb:\n  allowlist: []\n  require_confirm_on_submit: true\n"
+    with tempfile.NamedTemporaryFile("w", delete=False) as f:
+        f.write(data)
+        path = Path(f.name)
+    with pytest.raises(Exception):
+        load_security_config(path)
+
+
+def test_security_config_valid():
+    data = "mode_default: ASSISTIVE\nweb:\n  allowlist: ['example.com']\n  require_confirm_on_submit: true\n"
+    with tempfile.NamedTemporaryFile("w", delete=False) as f:
+        f.write(data)
+        path = Path(f.name)
+    cfg = load_security_config(path)
+    assert cfg.web.allowlist == ["example.com"]
+
+
+def test_models_config_default_offline():
+    data = "planner: gpt\n"
+    with tempfile.NamedTemporaryFile("w", delete=False) as f:
+        f.write(data)
+        path = Path(f.name)
+    cfg = load_models_config(path)
+    assert cfg.offline == "safe"
diff --git a/tests/test_device_flags.py b/tests/test_device_flags.py
new file mode 100644
index 00000000..e9d75546
--- /dev/null
+++ b/tests/test_device_flags.py
@@ -0,0 +1,22 @@
+import pytest
+from unittest import mock
+
+pytest.importorskip("whisper")
+from windows_use.tools.voice_input import VoiceInput
+
+
+def test_stt_device_env(monkeypatch):
+    called = {}
+
+    def fake_load(model, device="cpu"):
+        called["device"] = device
+
+        class M:
+            pass
+
+        return M()
+
+    monkeypatch.setenv("JARVIS_STT_DEVICE", "cpu")
+    with mock.patch("windows_use.tools.voice_input.whisper.load_model", fake_load):
+        VoiceInput()
+    assert called["device"] == "cpu"
diff --git a/tests/test_log_sanitizer.py b/tests/test_log_sanitizer.py
new file mode 100644
index 00000000..4e19ceec
--- /dev/null
+++ b/tests/test_log_sanitizer.py
@@ -0,0 +1,9 @@
+from windows_use.obs.log_sanitizer import redact
+
+
+def test_redact_token_email_phone():
+    text = "token abcdef0123456789abcdef0123456789 email test@example.com phone 081234567890"
+    result = redact(text)
+    assert "abcdef0123456789abcdef0123456789" not in result
+    assert "test@example.com" not in result
+    assert "081234567890" not in result
diff --git a/tests/test_powershell_wrapper.py b/tests/test_powershell_wrapper.py
new file mode 100644
index 00000000..857a3824
--- /dev/null
+++ b/tests/test_powershell_wrapper.py
@@ -0,0 +1,25 @@
+from unittest import mock
+
+from windows_use.tools.ps_shell import PowerShellManager
+
+
+def test_powershell_command_list_and_env(monkeypatch):
+    monkeypatch.setattr(
+        PowerShellManager, "_validate_powershell_available", lambda self: True
+    )
+    manager = PowerShellManager()
+
+    def fake_run(cmd, capture_output, text, timeout, cwd, env):
+        assert isinstance(cmd, list)
+        assert cmd[0] == "powershell"
+        assert env.get("__PSLockdownPolicy") == "4"
+
+        class R:
+            returncode = 0
+            stdout = ""
+            stderr = ""
+
+        return R()
+
+    with mock.patch("subprocess.run", fake_run):
+        manager.execute_command("Get-Process")
diff --git a/tests/test_retry_rate_limit.py b/tests/test_retry_rate_limit.py
new file mode 100644
index 00000000..88dff1d6
--- /dev/null
+++ b/tests/test_retry_rate_limit.py
@@ -0,0 +1,30 @@
+import time
+
+from windows_use.utils.rate_limit import rate_limit
+from windows_use.utils.retry import retry
+
+
+def test_rate_limit_sleep():
+    calls = []
+
+    @rate_limit(1, 0.2)
+    def func():
+        calls.append(time.time())
+
+    func()
+    func()
+    assert calls[1] - calls[0] >= 0.2
+
+
+def test_retry_eventually_succeeds():
+    counter = {"n": 0}
+
+    @retry((ValueError,), tries=3, backoff=0.01, jitter=False)
+    def flaky():
+        counter["n"] += 1
+        if counter["n"] < 3:
+            raise ValueError("fail")
+        return True
+
+    assert flaky() is True
+    assert counter["n"] == 3
diff --git a/tests/test_web_security.py b/tests/test_web_security.py
new file mode 100644
index 00000000..e7e6b61a
--- /dev/null
+++ b/tests/test_web_security.py
@@ -0,0 +1,40 @@
+import pytest
+from unittest.mock import AsyncMock
+
+pytest.importorskip("playwright.async_api")
+from playwright.async_api import Error as PlaywrightError, TimeoutError as PlaywrightTimeoutError  # type: ignore
+
+from windows_use.web.security_utils import (
+    Mode,
+    check_allowlist,
+    goto_with_security,
+    handle_otp,
+    require_confirmation,
+)
+
+
+def test_check_allowlist_rejects():
+    with pytest.raises(ValueError):
+        check_allowlist("https://evil.com", ["example.com"])
+
+
+def test_require_confirmation():
+    with pytest.raises(PermissionError):
+        require_confirmation(Mode.ASSISTIVE, True, lambda: False)
+    require_confirmation(Mode.ASSISTIVE, True, lambda: True)
+
+
+def test_handle_otp_switches_mode():
+    mode, paused = handle_otp(Mode.FULL_AUTO, True)
+    assert mode == Mode.SEMI_AUTO and paused
+
+
+@pytest.mark.asyncio
+async def test_goto_with_security_propagates_timeout():
+    page = AsyncMock()
+    page.goto.side_effect = PlaywrightTimeoutError("timeout")
+    with pytest.raises(PlaywrightTimeoutError):
+        await goto_with_security(page, "https://example.com", ["example.com"])
+    page.goto.side_effect = PlaywrightError("error")
+    with pytest.raises(PlaywrightError):
+        await goto_with_security(page, "https://example.com", ["example.com"])