diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 1e8b3bc..e089376 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -4,6 +4,8 @@ on:
   push:
     branches:
       - main
+    tags:
+      - 'v*'
 
 concurrency:
   group: fastfetchbot
@@ -24,6 +26,9 @@ jobs:
           - service: telegram-bot
             dockerfile: apps/telegram-bot/Dockerfile
             image_suffix: tgbot
+          - service: worker
+            dockerfile: apps/worker/Dockerfile
+            image_suffix: worker
     steps:
       - name: Checkout
         uses: actions/checkout@v4
@@ -33,13 +38,29 @@ jobs:
       - name: Check commit message
         id: check_message
         run: |
-          MESSAGE=$(git log --format=%B -n 1 ${{ github.sha }})
+          MESSAGE=$(git log --format=%B -n 1 "$GITHUB_SHA")
           if [[ "$MESSAGE" == *"[github-action]"* ]]; then
             echo "skip=true" >> "$GITHUB_OUTPUT"
           else
             echo "skip=false" >> "$GITHUB_OUTPUT"
           fi
 
+      - name: Determine Environment Tags
+        id: env_vars
+        run: |
+          # Check if the workflow was triggered by a tag or a branch push
+          if [[ "$GITHUB_REF" == refs/tags/* ]]; then
+            # Production Environment (Tag Trigger)
+            VERSION_TAG=${GITHUB_REF#refs/tags/}
+            echo "docker_tag=latest" >> "$GITHUB_OUTPUT"
+            echo "version_tag=$VERSION_TAG" >> "$GITHUB_OUTPUT"
+          else
+            # Staging Environment (Main Branch Trigger)
+            echo "docker_tag=stage" >> "$GITHUB_OUTPUT"
+            # Use the short commit SHA as a secondary tag for tracking
+            echo "version_tag=$(git rev-parse --short HEAD)" >> "$GITHUB_OUTPUT"
+          fi
+
       - name: Set up QEMU
         uses: docker/setup-qemu-action@v3
 
@@ -67,12 +88,24 @@ jobs:
           build-args: |
             APP_VERSION=${{ env.APP_VERSION }}
           tags: |
-            ghcr.io/${{ github.repository_owner }}/fastfetchbot-${{ matrix.image_suffix }}:latest
+            ghcr.io/${{ github.repository_owner }}/fastfetchbot-${{ matrix.image_suffix }}:${{ steps.env_vars.outputs.docker_tag }}
+            ghcr.io/${{ github.repository_owner }}/fastfetchbot-${{ matrix.image_suffix }}:${{ steps.env_vars.outputs.version_tag }}
 
-  deploy:
-    needs: build
-    runs-on: ubuntu-latest
-    steps:
-      - name: Trigger Watchtower deployment
-        run: |
-          curl -H "Authorization: Bearer ${{ secrets.WATCHTOWER_TOKEN }}" ${{ secrets.WATCHTOWER_WEBHOOK_URL }}
+#  deploy:
+#    needs: build
+#    runs-on: ubuntu-latest
+#    steps:
+#      - name: Trigger Watchtower deployment
+#        run: |
+#          # Route the webhook to the appropriate server based on the trigger
+#          if [[ "$GITHUB_REF" == refs/tags/* ]]; then
+#            echo "Deploying to Production..."
+#            TOKEN="${{ secrets.PROD_WATCHTOWER_TOKEN }}"
+#            WEBHOOK_URL="${{ secrets.PROD_WATCHTOWER_WEBHOOK_URL }}"
+#          else
+#            echo "Deploying to Staging..."
+#            TOKEN="${{ secrets.STAGE_WATCHTOWER_TOKEN }}"
+#            WEBHOOK_URL="${{ secrets.STAGE_WATCHTOWER_WEBHOOK_URL }}"
+#          fi
+#
+#          curl -H "Authorization: Bearer $TOKEN" "$WEBHOOK_URL"
\ No newline at end of file
diff --git a/.gitignore b/.gitignore
index d9fa219..e9d466b 100644
--- a/.gitignore
+++ b/.gitignore
@@ -258,3 +258,4 @@ conf/*
 /.run/
 .DS_Store
 /.claude/
+/apps/worker/conf/
diff --git a/CLAUDE.md b/CLAUDE.md
index 207372d..09eb0e0 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -2,143 +2,162 @@
 
 ## Project Overview
 
-FastFetchBot is a social media content fetching API built with FastAPI, designed to scrape and archive content from various social media platforms. It includes a Telegram Bot as the default client interface and supports multiple social media platforms including Twitter, Weibo, Xiaohongshu, Reddit, Bluesky, Instagram, Zhihu, Douban, YouTube, and Bilibili.
+FastFetchBot is a social media content fetching service built as a **UV workspace monorepo** with three microservices: a FastAPI server (API), a Telegram Bot client, and a Celery worker for file operations. It scrapes and archives content from various social media platforms including Twitter, Weibo, Xiaohongshu, Reddit, Bluesky, Instagram, Zhihu, Douban, YouTube, and Bilibili.
+
+## Architecture
+
+```
+FastFetchBot/
+├── packages/shared/          # fastfetchbot-shared: common models, utilities, logger
+├── packages/file-export/     # fastfetchbot-file-export: video download, PDF export, transcription
+├── apps/api/                 # FastAPI server: scrapers, storage, routing
+├── apps/telegram-bot/        # Telegram Bot: webhook/polling, message handling
+├── apps/worker/              # Celery worker: async file operations (video, PDF, audio)
+├── app/                      # Legacy re-export wrappers (backward compatibility)
+├── pyproject.toml            # Root workspace configuration
+└── uv.lock                   # Lockfile for the entire workspace
+```
+
+| Service | Package Name | Port | Entry Point |
+|---------|-------------|------|-------------|
+| **API Server** (`apps/api/src/`) | `fastfetchbot-api` | 10450 | `gunicorn -k uvicorn.workers.UvicornWorker src.main:app --preload` |
+| **Telegram Bot** (`apps/telegram-bot/core/`) | `fastfetchbot-telegram-bot` | 10451 | `python -m core.main` |
+| **Worker** (`apps/worker/worker_core/`) | `fastfetchbot-worker` | — | `celery -A worker_core.main:app worker --loglevel=info --concurrency=2` |
+| **Shared Library** (`packages/shared/fastfetchbot_shared/`) | `fastfetchbot-shared` | — | — |
+| **File Export Library** (`packages/file-export/fastfetchbot_file_export/`) | `fastfetchbot-file-export` | — | — |
+
+The Telegram Bot communicates with the API server over HTTP (`API_SERVER_URL`). In Docker, this is `http://api:10450`.
+
+### API Server (`apps/api/src/`)
+
+- **`main.py`** — FastAPI app setup, Sentry integration, lifecycle management
+- **`config.py`** — Environment variable handling, platform credentials
+- **`routers/`** — `scraper.py` (generic endpoint), `scraper_routers.py` (platform-specific), `inoreader.py`, `wechat.py`
+- **`services/scrapers/`** — `scraper_manager.py` orchestrates platform scrapers (twitter, weibo, bluesky, xiaohongshu, reddit, instagram, zhihu, douban, threads, wechat, general)
+- **`services/file_export/`** — PDF generation, audio transcription (OpenAI), video download
+- **`services/amazon/s3.py`** — S3 storage integration
+- **`services/telegraph/`** — Telegraph content publishing
+- **`templates/`** — Jinja2 templates for platform-specific output formatting
+
+### Telegram Bot (`apps/telegram-bot/core/`)
+
+- **`main.py`** — Entry point
+- **`api_client.py`** — HTTP client calling the API server
+- **`handlers/`** — `messages.py`, `buttons.py`, `url_process.py`
+- **`services/`** — `bot_app.py`, `message_sender.py`, `constants.py`
+- **`webhook/server.py`** — Webhook/polling server
+- **`templates/`** — Jinja2 templates for bot messages
+
+### Shared Library (`packages/shared/fastfetchbot_shared/`)
+
+- **`config.py`** — URL patterns (SOCIAL_MEDIA_WEBSITE_PATTERNS, VIDEO_WEBSITE_PATTERNS, BANNED_PATTERNS)
+- **`models/`** — `classes.py` (NamedBytesIO), `metadata_item.py`, `telegraph_item.py`, `url_metadata.py`
+- **`utils/`** — `parse.py` (URL parsing, HTML processing, `get_env_bool`), `image.py`, `logger.py`, `network.py`
+
+### Legacy `app/` Directory
+
+Re-export wrappers providing backward compatibility. Actual code lives in `apps/api/src/` and `packages/shared/`. For example, `app/config.py` imports `get_env_bool` from `fastfetchbot_shared.utils.parse`.
 
 ## Development Commands
 
 ### Package Management
-- `uv sync` - Install all dependencies (including dev)
-- `uv sync --no-dev` - Install production dependencies only
-- `uv sync --extra windows` - Install with Windows extras
-- `uv lock` - Regenerate the lock file after pyproject.toml changes
+- `uv sync` — Install all dependencies (including dev)
+- `uv lock` — Regenerate the lock file after pyproject.toml changes
 
-### Running the Application
-- **Production**: `uv run gunicorn -k uvicorn.workers.UvicornWorker app.main:app --preload`
-- **Development**: `uv run gunicorn -k uvicorn.workers.UvicornWorker --bind 0.0.0.0:10450 wsgi:app`
+### Running Locally
 
-### Docker Commands
-- `docker-compose up -d` - Start all services (FastFetchBot, Telegram Bot API, File Exporter)
-- `docker-compose build` - Build the FastFetchBot container
+```bash
+# API server
+cd apps/api
+uv run gunicorn -k uvicorn.workers.UvicornWorker src.main:app --preload
 
-> **uv version in Docker**: The Dockerfile pins uv to `0.8.18` via `COPY --from=ghcr.io/astral-sh/uv:0.8.18`.
-> To upgrade, update that tag in `Dockerfile` line 24 and verify the build with `docker build -t fastfetchbot-test .`.
+# Telegram Bot (separate terminal)
+cd apps/telegram-bot
+uv run python -m core.main
+```
 
 ### Testing
-- `uv run pytest` - Run all tests
-- `uv run pytest tests/test_bluesky.py` - Run specific test file
-- `uv run pytest -v` - Run tests with verbose output
+- `uv run pytest` — Run all tests
+- `uv run pytest tests/test_bluesky.py` — Run specific test file
+- `uv run pytest -v` — Verbose output
 
 ### Code Formatting
-- `uv run black .` - Format all Python code using Black formatter
-
-## Architecture Overview
-
-### Core Components
-
-**FastAPI Application (`app/main.py`)**
-- Main application entry point with FastAPI instance
-- Configures routers, middleware, and lifecycle management
-- Integrates Sentry for error monitoring
-- Handles Telegram bot webhook setup on startup
-
-**Scraper Architecture (`app/services/scrapers/`)**
-- `ScraperManager`: Centralized manager for all platform scrapers
-- Individual scraper modules for each platform (twitter, weibo, bluesky, etc.)
-- Each scraper implements platform-specific content extraction logic
-- Common scraping utilities in `common.py`
-
-**Router Structure (`app/routers/`)**
-- Platform-specific routers (twitter.py, weibo.py, etc.)
-- Generic scraper router for unified API endpoints
-- Telegram bot webhook handler
-- Feed processing and Inoreader integration
-
-**Data Models (`app/models/`)**
-- `classes.py`: Core data structures (NamedBytesIO)
-- `database_model.py`: MongoDB/Beanie models
-- Platform-specific metadata models
-- Telegram chat and Telegraph item models
-
-**Configuration (`app/config.py`)**
-- Comprehensive environment variable handling
-- Platform-specific API credentials and cookies
-- Database, storage, and service configurations
-- Template and localization settings
-
-### Key Services
-
-**Telegram Bot Service (`app/services/telegram_bot/`)**
-- Handles webhook setup and message processing
-- Integrates with local Telegram Bot API server for large file support
-- Channel and admin management
-
-**File Export Service (`app/services/file_export/`)**
-- Document export (PDF generation)
-- Audio transcription (OpenAI integration)
-- Video download capabilities
-
-**Storage Services**
-- Amazon S3 integration for media storage
-- Local file system management
-- Telegraph integration for content publishing
-
-### Platform Support
-
-**Supported Social Media Platforms:**
-- Twitter (requires ct0 and auth_token cookies)
-- Weibo (requires cookies)
-- Xiaohongshu (requires a1, webid, websession cookies)
-- Bluesky (requires username/password)
-- Reddit (requires API credentials)
-- Instagram (requires X-RapidAPI key)
-- Zhihu (requires cookies in conf/zhihu_cookies.json)
-- Douban
-- YouTube, Bilibili (video content)
+- `uv run black .` — Format all Python code
+
+### Docker
+
+```bash
+# Start all services (uses pre-built images from GHCR)
+docker-compose up -d
+
+# Build locally
+docker build -f apps/api/Dockerfile -t fastfetchbot-api .
+docker build -f apps/telegram-bot/Dockerfile -t fastfetchbot-telegram-bot .
+docker build -f apps/worker/Dockerfile -t fastfetchbot-worker .
+```
+
+> **uv version in Docker**: All three Dockerfiles pin uv to `0.10.4` via `COPY --from=ghcr.io/astral-sh/uv:0.10.4`.
+> To upgrade, update that tag in `apps/api/Dockerfile`, `apps/telegram-bot/Dockerfile`, and `apps/worker/Dockerfile`.
+
+Docker Compose services (see `docker-compose.template.yml`):
+- **api** — API server (port 10450)
+- **telegram-bot** — Telegram Bot (port 10451)
+- **telegram-bot-api** — Local Telegram Bot API for large file support (ports 8081-8082)
+- **redis** — Message broker and result backend for Celery (port 6379)
+- **worker** — Celery worker for file operations (video download, PDF export, audio transcription)
 
 ## Environment Configuration
 
-### Required Variables
-- `BASE_URL`: Server base URL
-- `TELEGRAM_BOT_TOKEN`: Telegram bot token
-- `TELEGRAM_CHAT_ID`: Default chat ID for bot
+See `template.env` for a complete reference. Key variables:
+
+### Required
+| Variable | Description |
+|----------|-------------|
+| `BASE_URL` | Public server domain (used for webhook URL construction) |
+| `TELEGRAM_BOT_TOKEN` | Bot token from @BotFather |
+| `TELEGRAM_CHAT_ID` | Default chat ID for the bot |
 
-### Critical Setup Notes
-- Most social media scrapers require authentication cookies/tokens
+### Service Communication (Docker)
+| Variable | Default | Description |
+|----------|---------|-------------|
+| `API_SERVER_URL` | `http://localhost:10450` | URL the Telegram Bot uses to call the API. `http://api:10450` in Docker. |
+| `TELEGRAM_BOT_CALLBACK_URL` | `http://localhost:10451` | URL the API uses to call the Telegram Bot. `http://telegram-bot:10451` in Docker. |
+| `TELEGRAM_BOT_MODE` | `polling` | `polling` (dev) or `webhook` (production with HTTPS) |
+
+### Platform Credentials
+- Most scrapers require authentication cookies/tokens
 - Use browser extension "Get cookies.txt LOCALLY" to extract cookies
 - Store Zhihu cookies in `conf/zhihu_cookies.json`
-- Template environment file available at `template.env`
+- See `template.env` for all platform-specific variables (Twitter, Weibo, Xiaohongshu, Reddit, Instagram, Bluesky, etc.)
 
-### Database Integration
-- Optional MongoDB integration (set `DATABASE_ON=true`)
-- Uses Beanie ODM for async MongoDB operations
-- Database initialization handled in app lifecycle
+### Database
+- Optional MongoDB integration (`DATABASE_ON=true`)
+- Uses Beanie ODM for async operations
 
-### Docker Services
-- **fastfetchbot**: Main application container
-- **telegram-bot-api**: Local Telegram Bot API for large file support
-- **fast-yt-downloader**: Separate service for video downloads
+## CI/CD
 
-## Development Guidelines
+GitHub Actions (`.github/workflows/ci.yml`) builds and pushes all three images. A push to `main` tags them `:stage` plus the short commit SHA (staging); pushing a `v*` git tag tags them `:latest` plus the version tag (production):
+- `ghcr.io/aturret/fastfetchbot-api`
+- `ghcr.io/aturret/fastfetchbot-tgbot`
+- `ghcr.io/aturret/fastfetchbot-worker`
 
-### Cookie Management
-- Platform scrapers depend on valid authentication cookies
-- Store sensitive cookies in environment variables, never in code
-- Test scraper functionality after cookie updates
+The Watchtower webhook `deploy` job is currently commented out in the workflow, so no deployment is triggered automatically after builds complete. Include `[github-action]` in a commit message to skip the build.
 
-### Adding New Platform Support
-1. Create new scraper module in `app/services/scrapers/[platform]/`
+## Development Guidelines
+
+### Adding a New Platform Scraper
+1. Create scraper module in `apps/api/src/services/scrapers/<platform>/`
 2. Implement scraper class following existing patterns
-3. Add platform-specific router in `app/routers/`
-4. Update ScraperManager to include new scraper
-5. Add configuration variables in `app/config.py`
+3. Add platform-specific router in `apps/api/src/routers/`
+4. Register the scraper in `ScraperManager`
+5. Add configuration variables in `apps/api/src/config.py`
 6. Create tests in `tests/cases/`
 
-### Template System
-- Jinja2 templates in `app/templates/` for content formatting
-- Platform-specific templates for different output formats
-- Supports internationalization via gettext
-
-### Error Handling and Logging
-- Loguru for comprehensive logging
-- Sentry integration for production error monitoring
-- Platform-specific error handling in scrapers
\ No newline at end of file
+### Key Conventions
+- Shared models and utilities go in `packages/shared/fastfetchbot_shared/`
+- API-specific code goes in `apps/api/src/`
+- Telegram bot code goes in `apps/telegram-bot/core/`
+- The bot communicates with the API only via HTTP — no direct imports of API code
+- Jinja2 templates for output formatting, with i18n support via Babel
+- Loguru for logging, Sentry for production error monitoring
+- Store sensitive cookies/tokens in environment variables, never in code
diff --git a/app/auth.py b/app/auth.py
deleted file mode 100644
index 815218e..0000000
--- a/app/auth.py
+++ /dev/null
@@ -1,33 +0,0 @@
-import secrets
-
-from fastapi import HTTPException, Security, status
-from fastapi.security.api_key import APIKeyQuery, APIKeyHeader
-
-from app.config import API_KEY_NAME, API_KEY, TELEGRAM_BOT_SECRET_TOKEN
-
-api_key_query = APIKeyQuery(name=API_KEY_NAME, auto_error=False)
-telegram_secret_token_query = APIKeyHeader(
-    name="X-Telegram-Bot-Api-Secret-Token", auto_error=False
-)
-
-
-def verify_key(input_key: str, true_key: str):
-    if api_key_query is None or not secrets.compare_digest(input_key, true_key):
-        raise HTTPException(
-            status_code=status.HTTP_401_UNAUTHORIZED, detail="API Key Invalid"
-        )
-
-
-def verify_api_key(api_key_query: str = Security(api_key_query)):
-    verify_key(api_key_query, API_KEY)
-
-
-def verify_telegram_api_header(
-    api_header_query: str = Security(telegram_secret_token_query),
-):
-    if api_header_query is None or not secrets.compare_digest(
-        api_header_query, TELEGRAM_BOT_SECRET_TOKEN
-    ):
-        raise HTTPException(
-            status_code=status.HTTP_401_UNAUTHORIZED, detail="API Key Invalid"
-        )
diff --git a/app/config.py b/app/config.py
deleted file mode 100644
index ca0db5d..0000000
--- a/app/config.py
+++ /dev/null
@@ -1,233 +0,0 @@
-import json
-import os
-import tempfile
-
-from jinja2 import Environment, FileSystemLoader
-import gettext
-import secrets
-
-from fastfetchbot_shared.utils.parse import get_env_bool
-
-env = os.environ
-current_directory = os.path.dirname(os.path.abspath(__file__))
-conf_dir = os.path.join(current_directory, "..", "conf")
-
-# FastAPI environment variables
-BASE_URL = env.get("BASE_URL", "localhost")
-API_KEY_NAME = env.get("API_KEY_NAME", "pwd")
-API_KEY = env.get("API_KEY", secrets.token_urlsafe(32))
-
-# Filesystem environment variables
-TEMP_DIR = env.get("TEMP_DIR", tempfile.gettempdir())
-WORK_DIR = env.get("WORK_DIR", os.getcwd())
-DOWNLOAD_DIR = env.get("DOWNLOAD_DIR", os.path.join(WORK_DIR, "download"))
-DEBUG_MODE = get_env_bool(env, "DEBUG_MODE", False)
-
-# Logging environment variables
-LOG_FILE_PATH = env.get("LOG_FILE_PATH", TEMP_DIR)
-LOG_LEVEL = env.get("LOG_LEVEL", "DEBUG")
-
-# MongoDB environment variables
-DATABASE_ON = get_env_bool(env, "DATABASE_ON", False)
-MONGODB_PORT = int(env.get("MONGODB_PORT", 27017)) or 27017
-MONGODB_HOST = env.get("MONGODB_HOST", "localhost")
-MONGODB_URL = env.get("MONGODB_URL", f"mongodb://{MONGODB_HOST}:{MONGODB_PORT}")
-
-# Telegram bot environment variables
-TELEGRAM_BOT_ON = get_env_bool(env, "TELEGRAM_BOT_ON", True)
-TELEGRAM_BOT_MODE = env.get("TELEGRAM_BOT_MODE", "polling")
-TELEGRAM_BOT_TOKEN = env.get("TELEGRAM_BOT_TOKEN", None)
-TELEGRAM_BOT_SECRET_TOKEN = env.get(
-    "TELEGRAM_BOT_SECRET_TOKEN", secrets.token_urlsafe(32)
-)
-
-TELEGRAM_CHANNEL_ID = []
-telegram_channel_id = env.get("TELEGRAM_CHANNEL_ID", "").split(",")
-for single_telegram_channel_id in telegram_channel_id:
-    if single_telegram_channel_id.startswith("@"):
-        TELEGRAM_CHANNEL_ID.append(single_telegram_channel_id)
-    elif single_telegram_channel_id.startswith("-1"):
-        TELEGRAM_CHANNEL_ID.append(int(single_telegram_channel_id))
-if len(TELEGRAM_CHANNEL_ID) == 0:
-    TELEGRAM_CHANNEL_ID = None
-telebot_debug_channel = env.get("TELEBOT_DEBUG_CHANNEL", "")
-if telebot_debug_channel.startswith("@"):
-    TELEBOT_DEBUG_CHANNEL = telebot_debug_channel
-elif telebot_debug_channel.startswith("-1"):
-    TELEBOT_DEBUG_CHANNEL = int(telebot_debug_channel)
-else:
-    TELEBOT_DEBUG_CHANNEL = None
-telegram_channel_admin_list = env.get("TELEGRAM_CHANNEL_ADMIN_LIST", "")
-TELEGRAM_CHANNEL_ADMIN_LIST = [
-    admin_id for admin_id in telegram_channel_admin_list.split(",")
-]
-if not TELEGRAM_CHANNEL_ADMIN_LIST:
-    TELEGRAM_CHANNEL_ADMIN_LIST = None
-
-TELEGRAM_WEBHOOK_URL = f"https://{BASE_URL}/telegram/bot/webhook"
-
-TELEBOT_API_SERVER_HOST = env.get("TELEBOT_API_SERVER_HOST", None)
-TELEBOT_API_SERVER_PORT = env.get("TELEBOT_API_SERVER_PORT", None)
-TELEBOT_API_SERVER = (
-    f"http://{TELEBOT_API_SERVER_HOST}:{TELEBOT_API_SERVER_PORT}" + "/bot"
-    if (TELEBOT_API_SERVER_HOST and TELEBOT_API_SERVER_PORT)
-    else "https://api.telegram.org/bot"
-)
-TELEBOT_API_SERVER_FILE = (
-    f"http://{TELEBOT_API_SERVER_HOST}:{TELEBOT_API_SERVER_PORT}" + "/file/bot"
-    if (TELEBOT_API_SERVER_HOST and TELEBOT_API_SERVER_PORT)
-    else "https://api.telegram.org/file/bot"
-)
-TELEBOT_LOCAL_FILE_MODE = (
-    False if TELEBOT_API_SERVER == "https://api.telegram.org/bot" else True
-)
-TELEBOT_CONNECT_TIMEOUT = int(env.get("TELEGRAM_CONNECT_TIMEOUT", 15)) or 15
-TELEBOT_READ_TIMEOUT = int(env.get("TELEGRAM_READ_TIMEOUT", 60)) or 60
-TELEBOT_WRITE_TIMEOUT = int(env.get("TELEGRAM_WRITE_TIMEOUT", 60)) or 60
-TELEBOT_MAX_RETRY = int(env.get("TELEGRAM_MAX_RETRY", 5)) or 5
-TELEGRAM_IMAGE_DIMENSION_LIMIT = int(env.get("TELEGRAM_IMAGE_SIZE_LIMIT", 1600)) or 1600
-TELEGRAM_IMAGE_SIZE_LIMIT = (
-    int(env.get("TELEGRAM_IMAGE_SIZE_LIMIT", 5242880)) or 5242880
-)
-telegram_group_message_ban_list = env.get("TELEGRAM_GROUP_MESSAGE_BAN_LIST", "")
-telegram_bot_message_ban_list = env.get("TELEGRAM_BOT_MESSAGE_BAN_LIST", "")
-
-
-def ban_list_resolver(ban_list_string: str) -> list:
-    ban_list = ban_list_string.split(",")
-    for item in ban_list:
-        if item == "social_media":
-            ban_list.extend(
-                [
-                    "weibo",
-                    "twitter",
-                    "instagram",
-                    "zhihu",
-                    "douban",
-                    "wechat",
-                    "xiaohongshu",
-                    "reddit",
-                ]
-            )
-        elif item == "video":
-            ban_list.extend(["youtube", "bilibili"])
-    return ban_list
-
-
-TELEGRAM_GROUP_MESSAGE_BAN_LIST = ban_list_resolver(telegram_group_message_ban_list)
-TELEGRAM_BOT_MESSAGE_BAN_LIST = ban_list_resolver(telegram_bot_message_ban_list)
-telegraph_token_list = env.get("TELEGRAPH_TOKEN_LIST", "")
-TELEGRAPH_TOKEN_LIST = telegraph_token_list.split(",") if telegraph_token_list else None
-
-# Youtube-dl environment variables
-FILE_EXPORTER_ON = get_env_bool(env, "FILE_EXPORTER_ON", True)
-FILE_EXPORTER_HOST = env.get("FILE_EXPORTER_HOST", "fast-yt-downloader")
-FILE_EXPORTER_PORT = env.get("FILE_EXPORTER_PORT", "4000")
-FILE_EXPORTER_URL = f"http://{FILE_EXPORTER_HOST}:{FILE_EXPORTER_PORT}"
-DOWNLOAD_VIDEO_TIMEOUT = env.get("DOWNLOAD_VIDEO_TIMEOUT", 600)
-
-# Services environment variables
-templates_directory = os.path.join(current_directory, "templates")
-JINJA2_ENV = Environment(
-    loader=FileSystemLoader(templates_directory), lstrip_blocks=True, trim_blocks=True
-)
-TEMPLATE_LANGUAGE = env.get(
-    "TEMPLATE_LANGUAGE", "zh_CN"
-)  # It is a workaround for translation system
-
-# X-RapidAPI (for instagram)
-X_RAPIDAPI_KEY = env.get("X_RAPIDAPI_KEY", None)
-
-# Twitter
-TWITTER_EMAIL = env.get("TWITTER_EMAIL", None)
-TWITTER_PASSWORD = env.get("TWITTER_PASSWORD", None)
-TWITTER_USERNAME = env.get("TWITTER_USERNAME", None)
-TWITTER_CT0 = env.get("TWITTER_CT0", None)
-TWITTER_AUTH_TOKEN = env.get("TWITTER_AUTH_TOKEN", None)
-TWITTER_COOKIES = {
-    "ct0": TWITTER_CT0,
-    "auth_token": TWITTER_AUTH_TOKEN,
-}
-
-# Bluesky
-BLUESKY_USERNAME = env.get("BLUESKY_USERNAME", None)
-BLUESKY_PASSWORD = env.get("BLUESKY_PASSWORD", None)
-
-# Weibo
-WEIBO_COOKIES = env.get("WEIBO_COOKIES", None)
-
-# Xiaohongshu
-XIAOHONGSHU_A1 = env.get("XIAOHONGSHU_A1", None)
-XIAOHONGSHU_WEBID = env.get("XIAOHONGSHU_WEBID", None)
-XIAOHONGSHU_WEBSESSION = env.get("XIAOHONGSHU_WEBSESSION", None)
-XIAOHONGSHU_COOKIES = {
-    "a1": XIAOHONGSHU_A1,
-    "web_id": XIAOHONGSHU_WEBID,
-    "web_session": XIAOHONGSHU_WEBSESSION,
-}
-XHS_PHONE_LIST = env.get("XHS_PHONE_LIST", "").split(",")
-XHS_IP_PROXY_LIST = env.get("XHS_IP_PROXY_LIST", "").split(",")
-XHS_ENABLE_IP_PROXY = get_env_bool(env, "XHS_ENABLE_IP_PROXY", False)
-XHS_SAVE_LOGIN_STATE = get_env_bool(env, "XHS_SAVE_LOGIN_STATE", True)
-
-# Zhihu
-FXZHIHU_HOST = env.get("FXZHIHU_HOST", "fxzhihu.com")
-
-zhihu_cookie_path = os.path.join(conf_dir, "zhihu_cookies.json")
-if os.path.exists(zhihu_cookie_path):
-    try:
-        with open(zhihu_cookie_path, "r") as f:
-            ZHIHU_COOKIES_JSON = json.load(f)
-    except json.JSONDecodeError:
-        print("Error: The file is not in a valid JSON format.")
-        ZHIHU_COOKIES_JSON = None
-    except FileNotFoundError:
-        print("Error: The file does not exist.")
-        ZHIHU_COOKIES_JSON = None
-else:
-    print("Error: We cannot find it.")
-    ZHIHU_COOKIES_JSON = None
-
-# Reddit
-REDDIT_CLIENT_ID = env.get("REDDIT_CLIENT_ID", None)
-REDDIT_CLIENT_SECRET = env.get("REDDIT_CLIENT_SECRET", None)
-REDDIT_PASSWORD = env.get("REDDIT_PASSWORD", None)
-REDDIT_USERNAME = env.get("REDDIT_USERNAME", None)
-
-# AWS storage
-AWS_STORAGE_ON = get_env_bool(env, "AWS_STORAGE_ON", False)
-AWS_ACCESS_KEY_ID = env.get("AWS_ACCESS_KEY_ID", None)
-AWS_SECRET_ACCESS_KEY = env.get("AWS_SECRET_ACCESS_KEY", None)
-AWS_S3_BUCKET_NAME = env.get("AWS_S3_BUCKET_NAME", "")
-AWS_REGION_NAME = env.get("AWS_REGION_NAME", "")
-AWS_DOMAIN_HOST = env.get("AWS_DOMAIN_HOST", None)
-if not (AWS_ACCESS_KEY_ID and AWS_SECRET_ACCESS_KEY and AWS_S3_BUCKET_NAME):
-    AWS_STORAGE_ON = False
-INOREADER_APP_ID = env.get("INOREADER_APP_ID", None)
-INOREADER_APP_KEY = env.get("INOREADER_APP_KEY", None)
-INOREADER_EMAIL = env.get("INOREADER_EMAIL", None)
-INOREADER_PASSWORD = env.get("INOREADER_PASSWORD", None)
-
-# Open AI API
-OPENAI_API_KEY = env.get("OPENAI_API_KEY", None)
-
-# General webpage scraping
-GENERAL_SCRAPING_ON = get_env_bool(env, "GENERAL_SCRAPING_ON", False)
-GENERAL_SCRAPING_API = env.get("GENERAL_SCRAPING_API", "FIRECRAWL")
-
-# Firecrawl API
-FIRECRAWL_API_URL = os.getenv("FIRECRAWL_API_URL", "")
-FIRECRAWL_API_KEY = os.getenv("FIRECRAWL_API_KEY", "")
-FIRECRAWL_WAIT_FOR = int(env.get("FIRECRAWL_WAIT_FOR", 3000))  # milliseconds to wait for JS rendering
-
-
-# Zyte API
-ZYTE_API_KEY = env.get("ZYTE_API_KEY", None)
-
-# Locale directories environment variables
-localedir = os.path.join(os.path.dirname(__file__), "locale")
-translation = gettext.translation("messages", localedir=localedir, fallback=True)
-_ = translation.gettext
-
-# Utils environment variables
-HTTP_REQUEST_TIMEOUT = env.get("HTTP_REQUEST_TIMEOUT", 30)
\ No newline at end of file
diff --git a/app/database.py b/app/database.py
deleted file mode 100644
index f78488a..0000000
--- a/app/database.py
+++ /dev/null
@@ -1,37 +0,0 @@
-from typing import Optional, Union, List
-
-from motor.motor_asyncio import AsyncIOMotorClient
-from beanie import init_beanie, Document, Indexed
-
-from app.config import MONGODB_URL
-from app.models.database_model import document_list
-from app.utils.logger import logger
-
-
-async def startup() -> None:
-    client = AsyncIOMotorClient(MONGODB_URL)
-    await init_beanie(database=client["telegram_bot"], document_models=document_list)
-
-
-async def shutdown() -> None:
-    pass
-
-
-async def save_instances(instances: Union[Document, List[Document]], *args) -> None:
-    if instances is None:
-        raise TypeError("instances must be a Model or a list of Model")
-
-    if isinstance(instances, Document):
-        instance_type = type(instances)
-        await instance_type.insert(instances)
-    elif isinstance(instances, list):
-        instance_type = type(instances[0])
-        await instance_type.insert_many(instances)
-    else:
-        raise TypeError("instances must be a Model or a list of Model")
-
-    for arg in args:
-        if not isinstance(arg, Document):
-            raise TypeError("args must be a Model")
-        instance_type = type(arg)
-        await instance_type.insert_one(arg)
diff --git a/app/main.py b/app/main.py
deleted file mode 100644
index 1fae5b2..0000000
--- a/app/main.py
+++ /dev/null
@@ -1,72 +0,0 @@
-import asyncio
-
-import sentry_sdk
-
-from fastapi import FastAPI, Request
-from contextlib import asynccontextmanager
-from starlette.middleware.base import BaseHTTPMiddleware
-
-from app import auth, database
-from app.routers import telegram_bot, inoreader, scraper_routers, scraper
-from app.services import telegram_bot as telegram_bot_service
-from app.config import TELEGRAM_BOT_TOKEN, DATABASE_ON
-from app.utils.logger import logger
-
-SENTRY_DSN = ""
-
-# https://docs.sentry.io/platforms/python/guides/fastapi/
-sentry_sdk.init(
-    dsn=SENTRY_DSN,
-    # Set traces_sample_rate to 1.0 to capture 100%
-    # of transactions for performance monitoring.
-    # We recommend adjusting this value in production,
-    traces_sample_rate=1.0,
-)
-
-started = False
-lock = asyncio.Lock()
-
-
-@asynccontextmanager
-async def lifespan(app: FastAPI):
-    global started
-    async with lock:
-        if not started:
-            started = True
-            await telegram_bot_service.set_webhook()
-            await telegram_bot_service.startup()
-    if DATABASE_ON:
-        await database.startup()
-    try:
-        yield
-    finally:
-        if DATABASE_ON:
-            await database.shutdown()
-        await telegram_bot_service.shutdown()
-
-
-class LogMiddleware(BaseHTTPMiddleware):
-    def __init__(self, app):
-        super().__init__(app)
-
-    async def dispatch(self, request: Request, call_next):
-        logger.info(f"{request.method} {request.url}")
-        response = await call_next(request)
-        return response
-
-
-def create_app():
-    fastapi_app = FastAPI(lifespan=lifespan)
-    fastapi_app.add_middleware(LogMiddleware)
-    if TELEGRAM_BOT_TOKEN is not None:
-        fastapi_app.include_router(telegram_bot.router)
-    else:
-        logger.warning("Telegram bot token not set, telegram bot disabled")
-    fastapi_app.include_router(inoreader.router)
-    fastapi_app.include_router(scraper.router)
-    for router in scraper_routers.scraper_routers:
-        fastapi_app.include_router(router)
-    return fastapi_app
-
-
-app = create_app()
diff --git a/app/models/classes.py b/app/models/classes.py
deleted file mode 100644
index e89bcf7..0000000
--- a/app/models/classes.py
+++ /dev/null
@@ -1,2 +0,0 @@
-# Re-export from shared package
-from fastfetchbot_shared.models.classes import NamedBytesIO  # noqa: F401
diff --git a/app/models/database_model.py b/app/models/database_model.py
deleted file mode 100644
index 7143d8d..0000000
--- a/app/models/database_model.py
+++ /dev/null
@@ -1,43 +0,0 @@
-from typing import Optional, Any
-from datetime import datetime
-
-from pydantic import BaseModel, Field
-from beanie import Document, Indexed, Insert, after_event, before_event
-
-from app.models.metadata_item import MediaFile, MessageType
-from app.models.telegram_chat import document_list as telegram_chat_document_list
-from app.utils.logger import logger
-from app.utils.parse import get_html_text_length
-
-
-class Metadata(Document):
-    title: str = Field(default="untitled")
-    message_type: MessageType = MessageType.SHORT
-    url: str
-    author: Optional[str] = None
-    author_url: Optional[str] = None
-    text: Optional[str] = None
-    text_length: Optional[int] = Field(ge=0)
-    content: Optional[str] = None
-    content_length: Optional[int] = Field(ge=0)
-    category: Optional[str] = None
-    source: Optional[str] = None
-    media_files: Optional[list[MediaFile]] = None
-    telegraph_url: Optional[str] = None
-    timestamp: datetime = Field(default_factory=datetime.utcnow)
-    scrape_status: bool = False
-
-    @before_event(Insert)
-    def get_text_length(self):
-        self.text_length = get_html_text_length(self.text)
-        self.content_length = get_html_text_length(self.content)
-
-    #
-    @staticmethod
-    def from_dict(obj: Any) -> "Metadata":
-        assert isinstance(obj, dict)
-        return Metadata(**obj)
-
-
-document_list = [Metadata]
-document_list.extend(telegram_chat_document_list)
diff --git a/app/models/media_type.py b/app/models/media_type.py
deleted file mode 100644
index 8b1c761..0000000
--- a/app/models/media_type.py
+++ /dev/null
@@ -1,7 +0,0 @@
-from enum import Enum
-
-
-class MediaType(Enum):
-    PHOTO = 1
-    VIDEO = 2
-    ANIMATION = 3
diff --git a/app/models/metadata_item.py b/app/models/metadata_item.py
deleted file mode 100644
index 5bce9fa..0000000
--- a/app/models/metadata_item.py
+++ /dev/null
@@ -1,12 +0,0 @@
-# Re-export from shared package
-from fastfetchbot_shared.models.metadata_item import *  # noqa: F401,F403
-from fastfetchbot_shared.models.metadata_item import (  # noqa: F401
-    MetadataItem,
-    MediaFile,
-    MessageType,
-    from_str,
-    from_list,
-    to_class,
-    metadata_item_from_dict,
-    metadata_item_to_dict,
-)
diff --git a/app/models/telegram_chat.py b/app/models/telegram_chat.py
deleted file mode 100644
index 8261c96..0000000
--- a/app/models/telegram_chat.py
+++ /dev/null
@@ -1,33 +0,0 @@
-from typing import Optional, Any
-from datetime import datetime
-
-from pydantic import BaseModel, Field
-from beanie import Document, Indexed
-
-
-class TelegramUser(BaseModel):
-    id: int
-    is_bot: bool
-    first_name: str
-    last_name: Optional[str] = None
-    username: Optional[str] = None
-    language_code: Optional[str] = None
-
-
-class TelegramChat(BaseModel):
-    id: int
-    type: str
-    title: Optional[str] = None
-    username: Optional[str] = None
-    first_name: Optional[str] = None
-    last_name: Optional[str] = None
-
-
-class TelegramMessage(Document):
-    date: Indexed(datetime) = Field(default_factory=datetime.utcnow)
-    chat: TelegramChat
-    user: TelegramUser
-    text: str = Field(default="unknown")
-
-
-document_list = [TelegramMessage]
diff --git a/app/models/telegraph_item.py b/app/models/telegraph_item.py
deleted file mode 100644
index 2b4b2f0..0000000
--- a/app/models/telegraph_item.py
+++ /dev/null
@@ -1,7 +0,0 @@
-# Re-export from shared package
-from fastfetchbot_shared.models.telegraph_item import *  # noqa: F401,F403
-from fastfetchbot_shared.models.telegraph_item import (  # noqa: F401
-    TelegraphItem,
-    telegraph_item_from_dict,
-    telegraph_item_to_dict,
-)
diff --git a/app/models/url_metadata.py b/app/models/url_metadata.py
deleted file mode 100644
index 020d120..0000000
--- a/app/models/url_metadata.py
+++ /dev/null
@@ -1,7 +0,0 @@
-# Re-export from shared package
-from fastfetchbot_shared.models.url_metadata import *  # noqa: F401,F403
-from fastfetchbot_shared.models.url_metadata import (  # noqa: F401
-    UrlMetadata,
-    url_metadata_from_dict,
-    url_metadata_to_dict,
-)
diff --git a/app/routers/feed_push.py b/app/routers/feed_push.py
deleted file mode 100644
index 997fdb1..0000000
--- a/app/routers/feed_push.py
+++ /dev/null
@@ -1,53 +0,0 @@
-# TODO: this script is now unused, will be removed in the future
-
-from fastapi import APIRouter
-from fastapi.requests import Request
-
-from app.config import TELEGRAM_CHANNEL_ID
-from app.services.telegram_bot import send_item_message
-from app.services.scrapers.common import InfoExtractService
-from fastapi import Security
-from app.auth import verify_api_key
-from app.utils.logger import logger
-from app.utils.parse import get_url_metadata
-
-router = APIRouter(prefix="/feedPush")
-
-
-async def get_feed_item(url: str, channel_id: str, **kwargs):
-    try:
-        channel_id = int(channel_id) if channel_id.startswith("-") else channel_id
-        url_metadata = await get_url_metadata(url)
-        item = InfoExtractService(url_metadata, **kwargs)
-        metadata_item = await item.get_item()
-        if channel_id not in TELEGRAM_CHANNEL_ID:
-            logger.error(f"channel_id {channel_id} not found")
-            return
-        await send_item_message(metadata_item, chat_id=channel_id)
-    except Exception as e:
-        logger.error(f"Error while getting item: {e}")
-
-
-@router.post("/", dependencies=[Security(verify_api_key)])
-async def push_feed_item(
-    request: Request,
-):
-    try:
-        data = await request.json()
-        params = request.query_params
-        url = (
-            data.get("url")
-            or data.get("aurl")
-            or params.get("url")
-            or params.get("aurl")
-        )
-        if not url:
-            return f"Error: url is required"
-        channel_id = data.get("channelId") or params.get("channelId")
-        if not channel_id:
-            return f"Error: channelId is required"
-        kwargs = data.get("kwargs", {})
-        await get_feed_item(url, channel_id, **kwargs)
-        return "ok"
-    except Exception as e:
-        return f"Error: {e}"
diff --git a/app/routers/inoreader.py b/app/routers/inoreader.py
deleted file mode 100644
index dd5d671..0000000
--- a/app/routers/inoreader.py
+++ /dev/null
@@ -1,38 +0,0 @@
-from fastapi import APIRouter
-from fastapi.requests import Request
-
-from app.config import INOREADER_APP_ID, INOREADER_APP_KEY
-from app.services.inoreader import Inoreader
-from app.services.inoreader.telegram_process import (
-    get_inoreader_item_async,
-    process_inoreader_data,
-    default_telegram_channel_id
-)
-from fastapi import Security
-from app.auth import verify_api_key
-
-router = APIRouter(prefix="/inoreader")
-
-
-async def get_inoreader_webhook_data(data: dict):
-    result = data["items"]
-    return result
-
-
-@router.post("/triggerAsync", dependencies=[Security(verify_api_key)])
-async def inoreader_trigger_webhook(request: Request):
-    if not INOREADER_APP_ID or not INOREADER_APP_KEY:
-        return "inoreader app id or key not set"
-    params = request.query_params
-    await get_inoreader_item_async(trigger=True, params=params)
-    return "ok"
-
-
-@router.post("/webhook", dependencies=[Security(verify_api_key)])
-async def inoreader_tag_webhook(request: Request):
-    data = await request.json()
-    data = await Inoreader.process_items_data(data)
-    params = request.query_params
-    telegram_channel_id = params.get("channel_id", default_telegram_channel_id)
-    await process_inoreader_data(data=data, use_inoreader_content=True, telegram_channel_id=telegram_channel_id)
-    return "ok"
diff --git a/app/routers/scraper.py b/app/routers/scraper.py
deleted file mode 100644
index ff1f576..0000000
--- a/app/routers/scraper.py
+++ /dev/null
@@ -1,37 +0,0 @@
-import asyncio
-
-from fastapi import APIRouter
-from fastapi.requests import Request
-
-from app.config import API_KEY_NAME
-from app.services.scrapers.common import InfoExtractService
-from fastapi import Security
-from app.auth import verify_api_key
-from app.utils.logger import logger
-from app.utils.parse import get_url_metadata
-
-router = APIRouter(prefix="/scraper")
-
-
-@router.post("/getItem", dependencies=[Security(verify_api_key)])
-async def get_item_route(request: Request):
-    logger.debug("A scraper getItem request received")
-    query_params = dict(request.query_params)
-    url = query_params.pop("url")
-    ban_list = query_params.pop("ban_list", None)
-    logger.debug(f"get_item_route: url: {url}, query_params: {query_params}")
-    if API_KEY_NAME in query_params:
-        query_params.pop(API_KEY_NAME)
-    url_metadata = await get_url_metadata(url, ban_list)
-    item = InfoExtractService(url_metadata, **query_params)
-    result = await item.get_item()
-    logger.debug(f"getItem result: {result}")
-    return result
-
-
-@router.post("/getUrlMetadata", dependencies=[Security(verify_api_key)])
-async def get_url_metadata_route(request: Request):
-    url = request.query_params.get("url")
-    ban_list = request.query_params.get("ban_list")
-    url_metadata = await get_url_metadata(url, ban_list)
-    return url_metadata.to_dict()
diff --git a/app/routers/scraper_routers.py b/app/routers/scraper_routers.py
deleted file mode 100644
index 66316c7..0000000
--- a/app/routers/scraper_routers.py
+++ /dev/null
@@ -1,6 +0,0 @@
-from .wechat import router as wechat_router
-
-
-scraper_routers = [
-    wechat_router,
-]
diff --git a/app/routers/telegram_bot.py b/app/routers/telegram_bot.py
deleted file mode 100644
index 3a4f9c9..0000000
--- a/app/routers/telegram_bot.py
+++ /dev/null
@@ -1,34 +0,0 @@
-import asyncio
-
-from fastapi import APIRouter, HTTPException
-from fastapi.requests import Request
-
-from app.services.telegram_bot import set_webhook, process_telegram_update
-from app.config import TELEGRAM_WEBHOOK_URL, TELEGRAM_BOT_SECRET_TOKEN
-from app.utils.logger import logger
-from fastapi import Security, BackgroundTasks
-from app.auth import verify_api_key, verify_telegram_api_header
-
-router = APIRouter(prefix="/telegram")
-
-
-@router.post("/bot/webhook", dependencies=[Security(verify_telegram_api_header)])
-async def telegram_bot_webhook(request: Request, background_tasks: BackgroundTasks):
-    logger.debug("A telegram bot webhook received")
-    data = await request.json()
-    background_tasks.add_task(process_telegram_update, data)
-    logger.debug(f"telegram bot webhook data received, background task added: {data}")
-    return "ok"
-
-
-@router.get("/bot/set_webhook", dependencies=[Security(verify_api_key)])
-async def telegram_bot_set_webhook():
-    # mask api key
-    logger.debug(
-        f"set telegram webhook: {TELEGRAM_WEBHOOK_URL}\nsecret token: {TELEGRAM_BOT_SECRET_TOKEN[:2]}{'*' * (len(TELEGRAM_BOT_SECRET_TOKEN) - 4)}{TELEGRAM_BOT_SECRET_TOKEN[-2:]}"
-    )
-    if await set_webhook():
-        return "ok"
-    else:
-        logger.error("set telegram webhook failed")
-        raise HTTPException(status_code=500, detail="set telegram webhook failed") 
diff --git a/app/routers/twitter.py b/app/routers/twitter.py
deleted file mode 100644
index b15763c..0000000
--- a/app/routers/twitter.py
+++ /dev/null
@@ -1,20 +0,0 @@
-from fastapi import APIRouter
-
-from app.services.scrapers.common import InfoExtractService
-from fastapi import Security
-from app.auth import verify_api_key
-
-
-router = APIRouter(prefix="/twitter")
-
-
-@router.post("/repost", dependencies=[Security(verify_api_key)])
-async def twitter_repost_webhook(url: str):
-    url_metadata = {
-        "url": url,
-        "type": "social_media",
-        "source": "twitter",
-    }
-    item = InfoExtractService(url_metadata)
-    await item.get_item()
-    return "ok"
diff --git a/app/routers/wechat.py b/app/routers/wechat.py
deleted file mode 100644
index fb17df1..0000000
--- a/app/routers/wechat.py
+++ /dev/null
@@ -1,29 +0,0 @@
-from fastapi import APIRouter
-from fastapi.requests import Request
-
-from app.models.url_metadata import UrlMetadata
-from app.services.scrapers.common import InfoExtractService
-from fastapi import Security
-from app.auth import verify_api_key
-
-router = APIRouter(prefix="/wechat")
-
-
-@router.post("/gzh", dependencies=[Security(verify_api_key)])
-async def wechat_gzh_scrape(request: Request):
-    url = request.query_params.get("url")
-    if url:
-        url_metadata = UrlMetadata.from_dict({
-            "url": url,
-            "type": "social_media",
-            "source": "wechat",
-        })
-    else:
-        customized_url_metadata = request.json()
-        if customized_url_metadata:
-            url_metadata = UrlMetadata.from_dict(customized_url_metadata)
-        else:
-            return "url or url metadata not found"
-    item = InfoExtractService(url_metadata)
-    result = await item.get_item()
-    return result
diff --git a/app/services/amazon/s3.py b/app/services/amazon/s3.py
deleted file mode 100644
index 4cd347a..0000000
--- a/app/services/amazon/s3.py
+++ /dev/null
@@ -1,67 +0,0 @@
-import asyncio
-import uuid
-from datetime import datetime
-from urllib.parse import urlparse, quote
-
-import aiofiles.os
-from pathlib import Path
-
-import aioboto3
-from botocore.exceptions import ClientError
-
-from app.utils.logger import logger
-from app.utils.network import download_file_to_local
-from app.config import AWS_S3_BUCKET_NAME, AWS_REGION_NAME, AWS_DOMAIN_HOST
-
-session = aioboto3.Session()
-image_url_host = (
-    AWS_DOMAIN_HOST
-    if AWS_DOMAIN_HOST
-    else f"{AWS_S3_BUCKET_NAME}.s3.{AWS_REGION_NAME}.amazonaws.com"
-)
-
-
-async def download_and_upload(url: str, referer: str = None, suite: str = "test") -> str:
-    urlparser = urlparse(url)
-    file_name = (urlparser.netloc + urlparser.path).replace("/", "-")
-    local_path = await download_file_to_local(url=url, referer=referer, file_name=file_name)
-    local_path = Path(local_path)
-    file_name = local_path.name
-    if not local_path:
-        return ""
-    s3_path = await upload(
-        suite=suite,
-        staging_path=local_path,
-        file_name=file_name,
-    )
-    await aiofiles.os.remove(local_path)
-    return s3_path
-
-
-async def upload(
-        staging_path: Path,
-        bucket: str = AWS_S3_BUCKET_NAME,
-        suite: str = "test",
-        release: str = datetime.now().strftime("%Y-%m-%d"),
-        file_name: str = None,
-) -> str:
-    if not file_name:
-        file_name = uuid.uuid4().hex
-    blob_s3_key = f"{suite}/{release}/{file_name}"
-    async with session.client("s3") as s3:
-        try:
-            with staging_path.open("rb") as spfp:
-                logger.info(f"Uploading {blob_s3_key}")
-                await s3.upload_fileobj(
-                    spfp,
-                    bucket,
-                    blob_s3_key,
-                )
-                logger.info(f"Uploaded {file_name} to {suite}/{release}")
-        except Exception as e:
-            logger.error(f"Failed to upload {file_name} to {suite}/{release}, {e}")
-            return ""
-        image_url = f"https://{image_url_host}/{blob_s3_key}"
-        urlparser = urlparse(image_url)
-        quoted_url = urlparser.scheme + "://" + urlparser.netloc + quote(urlparser.path)
-        return quoted_url
diff --git a/app/services/file_export/__init__.py b/app/services/file_export/__init__.py
deleted file mode 100644
index e69de29..0000000
diff --git a/app/services/file_export/audio_transcribe/__init__.py b/app/services/file_export/audio_transcribe/__init__.py
deleted file mode 100644
index 2290b3e..0000000
--- a/app/services/file_export/audio_transcribe/__init__.py
+++ /dev/null
@@ -1,30 +0,0 @@
-import httpx
-
-from app.config import OPENAI_API_KEY, FILE_EXPORTER_URL, DOWNLOAD_VIDEO_TIMEOUT
-from app.utils.logger import logger
-from app.utils.parse import wrap_text_into_html
-
-TRANSCRIBE_MODEL = "whisper-1"
-SEGMENT_LENGTH = 5 * 60
-
-
-class AudioTranscribe:
-    def __init__(self, audio_file: str):
-        self.audio_file = audio_file
-
-    async def transcribe(self):
-        return await self._get_audio_text(self.audio_file)
-
-    @staticmethod
-    async def _get_audio_text(audio_file: str):
-        async with httpx.AsyncClient() as client:
-            body = {
-                "audio_file": audio_file,
-                "openai_api_key": OPENAI_API_KEY,
-            }
-            request_url = FILE_EXPORTER_URL + "/transcribe"
-            response = await client.post(
-                url=request_url, json=body, timeout=DOWNLOAD_VIDEO_TIMEOUT
-            )
-            transcript = response.json().get("transcript")
-            return transcript
diff --git a/app/services/file_export/document_export/__init__.py b/app/services/file_export/document_export/__init__.py
deleted file mode 100644
index 282167d..0000000
--- a/app/services/file_export/document_export/__init__.py
+++ /dev/null
@@ -1,10 +0,0 @@
-from . import pdf_export
-
-
-class DocumentExport(object):
-    def __init__(self, document):
-        self.document = document
-
-    def export(self):
-        if self.document["type"] == "pdf":
-            return pdf_export.PdfExport(self.document["content"]).export()
diff --git a/app/services/file_export/document_export/pdf_export.py b/app/services/file_export/document_export/pdf_export.py
deleted file mode 100644
index 22d5df7..0000000
--- a/app/services/file_export/document_export/pdf_export.py
+++ /dev/null
@@ -1,109 +0,0 @@
-import asyncio
-import functools
-
-# import gc
-import os
-import uuid
-from pathlib import Path
-
-import aiofiles
-import aiofiles.os
-import httpx
-from bs4 import BeautifulSoup
-
-from app.config import DOWNLOAD_DIR, FILE_EXPORTER_URL, DOWNLOAD_VIDEO_TIMEOUT, TEMP_DIR, AWS_STORAGE_ON
-from app.services.amazon.s3 import upload as upload_to_s3
-from app.utils.logger import logger
-
-current_directory = os.path.dirname(os.path.abspath(__file__))
-
-PDF_STYLESHEET = os.path.join(current_directory, "pdf_export.css")
-
-
-async def upload_file_to_s3(output_filename):
-    return await upload_to_s3(
-        staging_path=output_filename,
-        suite="documents",
-        file_name=output_filename.name,
-    )
-
-
-class PdfExport:
-    def __init__(self, title: str, html_string: str = None):
-        self.title = title
-        self.html_string = html_string
-
-    async def export(self, method: str = "file") -> str:
-        body = {
-            "method": method
-        }
-        html_string = self.wrap_html_string(self.html_string)
-        if method == "string":
-            body["html_string"] = html_string,
-            logger.debug(
-                f"""
-                    html_string: {html_string}
-                    """
-            )
-        elif method == "file":
-            filename = f"{self.title}-{uuid.uuid4()}.html"
-            filename = os.path.join(TEMP_DIR, filename)
-            async with aiofiles.open(
-                filename, "w", encoding="utf-8"
-            ) as f:
-                await f.write(html_string)
-                html_file = filename
-                logger.debug(html_file)
-            body["html_file"] = html_file
-        output_filename = f"{self.title}-{uuid.uuid4()}.pdf"
-        body["output_filename"] = output_filename
-
-        async with httpx.AsyncClient() as client:
-            request_url = FILE_EXPORTER_URL + "/pdfExport"
-            logger.info(f"requesting pdf export from pdf server: {body}")
-            resp = await client.post(
-                request_url, json=body, timeout=DOWNLOAD_VIDEO_TIMEOUT
-            )
-        output_filename = resp.json().get("output_filename")
-        logger.info(f"pdf export success: {output_filename}")
-        await aiofiles.os.remove(html_file)
-        if AWS_STORAGE_ON:
-            local_filename = output_filename
-            output_filename = await upload_file_to_s3(Path(output_filename))
-            await aiofiles.os.remove(local_filename)
-        return output_filename
-
-    @staticmethod
-    def wrap_html_string(html_string: str) -> str:
-        soup = BeautifulSoup(
-            '<html><head><meta http-equiv="Content-Type" content="text/html; charset=utf-8">'
-            '<meta charset="UTF-8"></head><body></body></html>',
-            "html.parser",
-        )
-        soup.body.append(BeautifulSoup(html_string, "html.parser"))
-        for tag in soup.find_all(True):
-            if "style" in tag.attrs:
-                del tag["style"]
-        for style_tag in soup.find_all("style"):
-            style_tag.decompose()
-        return soup.prettify()
-
-    # @staticmethod
-    # async def convert_html_to_pdf(
-    #     html_string: str, css_string: str, output_filename: str
-    # ) -> None:
-    #     font_config = FontConfiguration()
-    #     css_item = CSS(string=css_string, font_config=font_config)
-    #     html_item = HTML(string=html_string)
-    #     loop = asyncio.get_event_loop()
-    #     pdf_obj = await loop.run_in_executor(
-    #         None,
-    #         functools.partial(
-    #             html_item.write_pdf, output_filename, stylesheets=[css_item]
-    #         ),
-    #     )
-    #     del font_config
-    #     del css_item
-    #     del html_item
-    #     del pdf_obj
-    #     gc.collect()
diff --git a/app/services/file_export/document_export/simsun.ttc b/app/services/file_export/document_export/simsun.ttc
deleted file mode 100644
index 6ca8de3..0000000
Binary files a/app/services/file_export/document_export/simsun.ttc and /dev/null differ
diff --git a/app/services/file_export/video_download/__init__.py b/app/services/file_export/video_download/__init__.py
deleted file mode 100644
index ca3bd4e..0000000
--- a/app/services/file_export/video_download/__init__.py
+++ /dev/null
@@ -1,232 +0,0 @@
-from typing import Any, Optional
-
-import httpx
-from urllib.parse import urlparse, parse_qs
-
-from app.models.metadata_item import MetadataItem, MessageType, MediaFile
-from app.services.file_export.audio_transcribe import AudioTranscribe
-from app.config import FILE_EXPORTER_URL, DOWNLOAD_VIDEO_TIMEOUT
-from app.utils.parse import unix_timestamp_to_utc, second_to_time, wrap_text_into_html
-from app.utils.logger import logger
-from app.config import JINJA2_ENV
-
-video_info_template = JINJA2_ENV.get_template("video_info.jinja2")
-
-
-class VideoDownloader(MetadataItem):
-    def __init__(
-            self,
-            url: str,
-            category: str,
-            data: Optional[Any] = None,
-            download: bool = True,
-            audio_only: bool = False,
-            hd: bool = False,
-            transcribe: bool = False,
-            **kwargs,
-    ):
-        self.extractor = category
-        self.url = url
-        self.author_url = ""
-        self.download = download
-        self.audio_only = audio_only
-        self.transcribe = transcribe
-        self.hd = hd
-        self.message_type = MessageType.SHORT
-        self.file_path = None
-        # metadata variables
-        self.category = category
-        self.media_files = []
-        # auxiliary variables
-        self.created = None
-        self.duration = None
-
-    @classmethod
-    async def create(cls, *args, **kwargs):
-        instance = cls(*args, **kwargs)
-        instance.url = await instance._parse_url(instance.url)
-        return instance
-
-    async def get_item(self) -> dict:
-        self.url = await self._parse_url(self.url)
-        await self.get_video()
-        return self.to_dict()
-
-    async def get_video(self) -> None:
-        content_info = await self.get_video_info()
-        self.file_path = content_info["file_path"]
-        video_info_funcs = {
-            "youtube": self._youtube_info_parse,
-            "bilibili": self._bilibili_info_parse,
-        }
-        meta_info = video_info_funcs[self.extractor](content_info)
-        self._video_info_formatting(meta_info)
-        # AI transcribe
-        if self.transcribe:
-            audio_content_info = await self.get_video_info(audio_only=True)
-            audio_file_path = audio_content_info["file_path"]
-            audio_transcribe = AudioTranscribe(audio_file_path)
-            transcribe_text = await audio_transcribe.transcribe()
-            if self.download is False:
-                self.message_type = MessageType.LONG
-            self.text += "\nAI全文摘录：" + transcribe_text
-            self.content += "<hr>" + wrap_text_into_html(transcribe_text)
-
-    async def _parse_url(self, url: str) -> str:
-        async def _get_redirected_url(original_url: str) -> str:
-            async with httpx.AsyncClient(follow_redirects=False) as client:
-                resp = await client.get(original_url)
-                if resp.status_code == 200:
-                    original_url = resp.url
-                elif resp.status_code == 302:
-                    original_url = resp.headers["Location"]
-                return original_url
-
-        def _remove_youtube_link_tracing(original_url: str) -> str:
-            original_url_parser = urlparse(original_url)
-            original_url_hostname = str(original_url_parser.hostname)
-
-            if "youtu.be" in original_url_hostname:
-                # remove all queries
-                original_url = original_url.split("?")[0]
-            if "youtube.com" in original_url_hostname:
-                # remove all queries except "?v=" part
-                original_url = original_url_parser.scheme + "://" + original_url_parser.netloc + original_url_parser.path
-                if original_url_parser.query:
-                    v_part_query = [item for item in original_url_parser.query.split("&") if "v=" in item]
-                    if v_part_query:
-                        original_url += "?" + v_part_query[0]
-            return original_url
-
-        def _remove_bilibili_link_tracing(original_url: str) -> str:
-            original_url_parser = urlparse(original_url)
-            original_url_hostname = str(original_url_parser.hostname)
-            query_dict = parse_qs(original_url_parser.query)
-            bilibili_p_query_string = "?p=" + query_dict["p"][0] if 'p' in query_dict else ""
-
-            if "bilibili.com" in original_url_hostname:
-                original_url = original_url_parser.scheme + "://" + original_url_parser.netloc + original_url_parser.path
-            return original_url + bilibili_p_query_string
-
-        logger.info(f"parsing original video url: {url} for {self.extractor}")
-
-        url_parser = urlparse(url)
-        url_hostname = str(url_parser.hostname)
-
-        if self.extractor == "bilibili":
-            if "b23.tv" in url_hostname:
-                url = await _get_redirected_url(url)
-            if "m.bilibili.com" in url_hostname:
-                url = url.replace("m.bilibili.com", "www.bilibili.com")
-            url = _remove_bilibili_link_tracing(url)
-        elif self.extractor == "youtube":
-            if "youtu.be" in url_hostname:
-                url = await _get_redirected_url(url)
-            url = _remove_youtube_link_tracing(url)
-
-        logger.info(f"parsed video url: {url} for {self.extractor}")
-        return url
-
-    async def get_video_info(
-            self,
-            url: str = None,
-            download: bool = None,
-            extractor: str = None,
-            audio_only: bool = None,
-            hd: bool = None,
-    ) -> dict:
-        """
-        make a request to youtube-dl server to get video info
-        :return: video info dict
-        """
-        if url is None:
-            url = self.url
-        if download is None:
-            download = self.download
-        if extractor is None:
-            extractor = self.extractor
-        if audio_only is None:
-            audio_only = self.audio_only
-        if hd is None:
-            hd = self.hd
-        async with httpx.AsyncClient() as client:
-            body = {
-                "url": url,
-                "download": download,
-                "extractor": extractor,
-                "audio_only": audio_only,
-                "hd": hd,
-            }
-            request_url = FILE_EXPORTER_URL + "/videoDownload"
-            logger.info(f"requesting video info from youtube-dl server: {body}")
-            if download is True:
-                logger.info(f"video downloading... it may take a while")
-                if hd is True:
-                    logger.info(f"downloading HD video, it may take longer")
-                elif audio_only is True:
-                    logger.info(f"downloading audio only")
-            logger.debug(f"downloading video timeout: {DOWNLOAD_VIDEO_TIMEOUT}")
-            resp = await client.post(
-                request_url, json=body, timeout=DOWNLOAD_VIDEO_TIMEOUT
-            )
-            content_info = resp.json().get("content_info")
-            file_path = resp.json().get("file_path")
-            content_info["file_path"] = file_path
-            return content_info
-
-    def _video_info_formatting(self, meta_info: dict):
-        self.title = meta_info["title"]
-        self.author = meta_info["author"]
-        self.author_url = meta_info["author_url"]
-        if len(meta_info["description"]) > 800:
-            meta_info["description"] = meta_info["description"][:800] + "..."
-        self.created = meta_info["upload_date"]
-        self.duration = meta_info["duration"]
-        self.text = video_info_template.render(
-            data={
-                "url": self.url,
-                "title": self.title,
-                "author": self.author,
-                "author_url": self.author_url,
-                "duration": self.duration,
-                "created": self.created,
-                "playback_data": meta_info["playback_data"],
-                "description": meta_info["description"],
-            }
-        )
-        self.content = self.text.replace("\n", "<br>")
-        if self.download:
-            media_type = "video"
-            if self.audio_only:
-                media_type = "audio"
-            self.media_files = [MediaFile(media_type, self.file_path, "")]
-
-    @staticmethod
-    def _youtube_info_parse(video_info: dict) -> dict:
-        return {
-            "id": video_info["id"],
-            "title": video_info["title"],
-            "author": video_info["uploader"],
-            "author_url": video_info["uploader_url"] or video_info["channel_url"],
-            "description": video_info["description"],
-            "playback_data": f"视频播放量：{video_info['view_count']} 评论数：{video_info['comment_count']}",
-            "author_avatar": video_info["thumbnail"],
-            "upload_date": str(video_info["upload_date"]),
-            "duration": second_to_time(round(video_info["duration"])),
-        }
-
-    @staticmethod
-    def _bilibili_info_parse(video_info: dict) -> dict:
-        return {
-            "id": video_info["id"],
-            "title": video_info["title"],
-            "author": video_info["uploader"],
-            "author_url": "https://space.bilibili.com/"
-                          + str(video_info["uploader_id"]),
-            "author_avatar": video_info["thumbnail"],
-            "ext": video_info["ext"],
-            "description": video_info["description"],
-            "playback_data": f"视频播放量：{video_info['view_count']} 弹幕数：{video_info['comment_count']} 点赞数：{video_info['like_count']}",
-            "upload_date": unix_timestamp_to_utc(video_info["timestamp"]),
-            "duration": second_to_time(round(video_info["duration"])),
-        }
diff --git a/app/services/inoreader/__init__.py b/app/services/inoreader/__init__.py
deleted file mode 100644
index 55fc3c7..0000000
--- a/app/services/inoreader/__init__.py
+++ /dev/null
@@ -1,170 +0,0 @@
-from typing import Optional
-from urllib.parse import quote
-
-import httpx
-from bs4 import BeautifulSoup
-import jmespath
-from httpx import Response
-
-from app.models.metadata_item import MetadataItem, MediaFile, MessageType
-from app.utils.network import HEADERS
-from app.utils.logger import logger
-from app.utils.parse import get_html_text_length
-from app.config import (
-    INOREADER_APP_ID,
-    INOREADER_APP_KEY,
-    INOREADER_EMAIL,
-    INOREADER_PASSWORD,
-)
-
-INOREADER_CONTENT_URL = "https://www.inoreader.com/reader/api/0/stream/contents/"
-TAG_PATH = "user/-/label/"
-OTHER_PATH = "user/-/state/com.google/"
-INOREADER_LOGIN_URL = "https://www.inoreader.com/accounts/ClientLogin"
-
-
-class Inoreader(MetadataItem):
-    def __init__(self, url: str = None, data: dict = None, **kwargs):
-        if url:
-            self.url = url
-        if data:
-            self.title = data.get("title", "")
-            self.message = data.get("message", "")
-            self.author = data.get("author", "")
-            self.author_url = data.get("author_url", "")
-            self.category = data.get("category", "")
-            self.raw_content = data.get("content", "")
-            self.content = self.raw_content
-        if kwargs.get("category"):
-            self.category = kwargs["category"]
-        self.media_files = []
-        self.message_type = MessageType.LONG
-
-    def _from_data(self, data: dict):
-        self.title = data.get("title", "")
-        self.message = data.get("message", "")
-        self.author = data.get("author", "")
-        self.author_url = data.get("author_url", "")
-        self.category = data.get("category", "")
-        self.raw_content = data.get("content", "")
-        self.content = self.raw_content
-
-    async def get_item(self, api: bool = False) -> dict:
-        if api:
-            data = await self.get_api_item_data()
-        self._resolve_media_files()
-        if get_html_text_length(self.content) < 400:
-            self.message_type = MessageType.SHORT
-        metadata_dict = self.to_dict()
-        metadata_dict["message"] = self.message
-        return metadata_dict
-
-    def _resolve_media_files(self):
-        soup = BeautifulSoup(self.raw_content, "html.parser")
-        for img in soup.find_all("img"):
-            self.media_files.append(MediaFile(url=img["src"], media_type="image"))
-            img.extract()
-        for video in soup.find_all("video"):
-            self.media_files.append(MediaFile(url=video["src"], media_type="video"))
-            video.extract()
-        for tags in soup.find_all(["p", "span"]):
-            tags.unwrap()
-        self.text = str(soup)
-        self.text = '<a href="' + self.url + '">' + self.author + "</a>: " + self.text
-
-    @staticmethod
-    def get_stream_id(
-            stream_type: str = "broadcast", tag: str = None, feed: str = None
-    ) -> str:
-        if stream_type == "feed":
-            stream_id = feed
-        elif stream_type == "tag":
-            stream_id = TAG_PATH + tag
-        else:
-            stream_id = OTHER_PATH + stream_type
-        stream_id = quote(stream_id)
-        return stream_id
-
-    @staticmethod
-    async def mark_all_as_read(stream_id: str, timestamp: int = 0) -> None:
-        request_url = "https://www.inoreader.com/reader/api/0/mark-all-as-read"
-        params = {"s": stream_id, "ts": timestamp}
-        resp = await Inoreader.get_api_info(url=request_url, params=params)
-        logger.debug(resp.text)
-
-    @staticmethod
-    async def get_api_item_data(
-            stream_type: str = "broadcast",
-            tag: str = None,
-            feed: str = None,
-            params: dict = None,
-    ) -> Optional[dict | list]:
-        stream_id = Inoreader.get_stream_id(stream_type=stream_type, tag=tag, feed=feed)
-        request_url = INOREADER_CONTENT_URL + stream_id
-        default_params = {
-            "comments": 1,
-            "n": 10,
-            "r": "o",
-            "xt": "user/-/state/com.google/read",
-        }
-        if params:
-            default_params.update(params)
-        params = default_params
-        resp = await Inoreader.get_api_info(url=request_url, params=params)
-        logger.debug(resp.text)
-        data = resp.json()
-        data = await Inoreader.process_items_data(data)
-        return data
-
-    @staticmethod
-    async def process_items_data(data: dict) -> Optional[dict | list]:
-        expression = """
-                            items[].{
-                            "aurl": canonical[0].href,
-                            "title": title,
-                            "author": origin.title,
-                            "author_url": origin.htmlUrl,
-                            "content": summary.content,
-                            "category": categories[-1],
-                            "message": comments[0].commentBody,
-                            "timestamp": updated
-                            }
-                        """
-        data = jmespath.search(expression, data)
-        for item in data:
-            item["category"] = item["category"].split("/")[-1]
-        return data
-
-    @staticmethod
-    async def get_api_info(
-            url: str,
-            params=None,
-    ) -> Response:
-        async with httpx.AsyncClient() as client:
-            resp = await client.post(
-                INOREADER_LOGIN_URL,
-                params={
-                    "Email": INOREADER_EMAIL,
-                    "Passwd": INOREADER_PASSWORD,
-                },
-            )
-            authorization = resp.text.split("\n")[2].split("=")[1]
-
-        async with httpx.AsyncClient() as client:
-            headers = HEADERS
-            headers["Authorization"] = f"GoogleLogin auth={authorization}"
-            params = params or {}
-            params.update(
-                {
-                    "AppId": INOREADER_APP_ID,
-                    "AppKey": INOREADER_APP_KEY,
-                }
-            )
-            resp = await client.get(
-                url=url,
-                params=params,
-                headers=headers,
-            )
-            return resp
-
-
diff --git a/app/services/inoreader/telegram_process.py b/app/services/inoreader/telegram_process.py
deleted file mode 100644
index 975e894..0000000
--- a/app/services/inoreader/telegram_process.py
+++ /dev/null
@@ -1,102 +0,0 @@
-from typing import Union, Optional, Dict, Callable, Awaitable
-
-from app.config import TELEGRAM_CHANNEL_ID
-from app.models.url_metadata import UrlMetadata
-from app.services.inoreader import Inoreader
-from app.services.scrapers.common import InfoExtractService
-from app.utils.logger import logger
-from app.utils.parse import get_url_metadata, get_bool
-
-default_telegram_channel_id = TELEGRAM_CHANNEL_ID[0] if TELEGRAM_CHANNEL_ID else None
-
-# Type alias for the message callback
-MessageCallback = Callable[[dict, Union[int, str]], Awaitable[None]]
-
-
-async def _default_message_callback(metadata_item: dict, chat_id: Union[int, str]) -> None:
-    """Default callback that sends via Telegram bot. Used when no callback is provided."""
-    from app.services.telegram_bot import send_item_message
-    await send_item_message(metadata_item, chat_id=chat_id)
-
-
-async def process_inoreader_data(
-        data: list,
-        use_inoreader_content: bool,
-        telegram_channel_id: Union[int, str] = default_telegram_channel_id,
-        stream_id: str = None,
-        message_callback: MessageCallback = None,
-):
-    if message_callback is None:
-        message_callback = _default_message_callback
-
-    for item in data:
-        url_type_item = await get_url_metadata(item["aurl"])
-        url_type_dict = url_type_item.to_dict()
-        logger.debug(f"ino original: {use_inoreader_content}")
-        if (
-                use_inoreader_content is True
-                or url_type_dict["content_type"] == "unknown"
-        ):
-            is_video = url_type_dict["content_type"] == "video"
-            content_type = url_type_dict["content_type"] if is_video else "social_media"
-            source = url_type_dict["source"] if is_video else "inoreader"
-            url_metadata = UrlMetadata(
-                url=item["aurl"],
-                content_type=content_type,
-                source=source,
-            )
-            metadata_item = InfoExtractService(
-                url_metadata=url_metadata,
-                data=item,
-                store_document=True,
-                category=item["category"],
-            )
-        else:
-            metadata_item = InfoExtractService(
-                url_metadata=url_type_item,
-                data=item,
-                store_document=True,
-            )
-        message_metadata_item = await metadata_item.get_item()
-        await message_callback(message_metadata_item, telegram_channel_id)
-        if stream_id:
-            await Inoreader.mark_all_as_read(
-                stream_id=stream_id, timestamp=item["timestamp"] - 1
-            )
-
-
-async def get_inoreader_item_async(
-        data: Optional[Dict] = None,
-        trigger: bool = False,
-        params: Optional[Dict] = None,
-        message_callback: MessageCallback = None,
-) -> None:
-    stream_id = None
-    use_inoreader_content = True
-    telegram_channel_id = default_telegram_channel_id
-    if trigger and params and not data:
-        logger.debug(f"params:{params}")
-        use_inoreader_content = get_bool(params.get("useInoreaderContent"), True)
-        stream_type = params.get("streamType", "broadcast")
-        telegram_channel_id = params.get("channelId", default_telegram_channel_id)
-        tag = params.get("tag", None)
-        feed = params.get("feed", None)
-        the_remaining_params = {
-            k: v
-            for k, v in params.items()
-            if k not in ["streamType", "channelId", "tag", "feed"]
-        }
-        data = await Inoreader.get_api_item_data(
-            stream_type=stream_type, tag=tag, params=the_remaining_params, feed=feed
-        )
-        if not data:
-            return
-        stream_id = Inoreader.get_stream_id(stream_type=stream_type, tag=tag, feed=feed)
-    if type(data) is dict:
-        data = [data]
-    await process_inoreader_data(
-        data, use_inoreader_content, telegram_channel_id, stream_id,
-        message_callback=message_callback,
-    )
-    if stream_id:
-        await Inoreader.mark_all_as_read(stream_id=stream_id)
diff --git a/app/services/scrapers/__init__.py b/app/services/scrapers/__init__.py
deleted file mode 100644
index e69de29..0000000
diff --git a/app/services/scrapers/bluesky/__init__.py b/app/services/scrapers/bluesky/__init__.py
deleted file mode 100644
index cb11b74..0000000
--- a/app/services/scrapers/bluesky/__init__.py
+++ /dev/null
@@ -1,45 +0,0 @@
-import traceback
-from dataclasses import dataclass
-from urllib.parse import urlparse
-from typing import Dict, Optional, Any
-
-import httpx
-import jmespath
-
-from app.models.metadata_item import MetadataItem, MediaFile, MessageType
-from app.utils.parse import get_html_text_length, wrap_text_into_html
-
-
-@dataclass
-class Bluesky(MetadataItem):
-    cid: str = ""
-    author_did: str = ""
-    retweet_post: Optional["Bluesky"] = None
-
-    @staticmethod
-    def from_dict(obj: Any) -> "Bluesky":
-        bluesky_item = MetadataItem.from_dict(obj)
-        bluesky_item.cid = obj.get("cid")
-        bluesky_item.author_did = obj.get("author_did")
-        return Bluesky(
-            url=bluesky_item.url,
-            title=bluesky_item.title,
-            author=bluesky_item.author,
-            author_url=bluesky_item.author_url,
-            telegraph_url=bluesky_item.telegraph_url,
-            text=bluesky_item.text,
-            content=bluesky_item.content,
-            media_files=bluesky_item.media_files,
-            category=bluesky_item.category,
-            message_type=bluesky_item.message_type,
-            cid=bluesky_item.cid,
-            author_did=bluesky_item.author_did,
-        )
-
-    def to_dict(self) -> dict:
-        result: dict = super().to_dict()
-        result["cid"] = self.cid
-        result["author_did"] = self.author_did
-        if self.retweet_post:
-            result["retweet_post"] = self.retweet_post.to_dict()
-        return result
diff --git a/app/services/scrapers/bluesky/config.py b/app/services/scrapers/bluesky/config.py
deleted file mode 100644
index 3183639..0000000
--- a/app/services/scrapers/bluesky/config.py
+++ /dev/null
@@ -1,3 +0,0 @@
-BLUESKY_HOST = "https://bsky.app"
-
-BLUESKY_MAX_LENGTH = 800
diff --git a/app/services/scrapers/bluesky/scraper.py b/app/services/scrapers/bluesky/scraper.py
deleted file mode 100644
index 06f09d9..0000000
--- a/app/services/scrapers/bluesky/scraper.py
+++ /dev/null
@@ -1,191 +0,0 @@
-from typing import Optional
-from urllib.parse import urlparse
-
-from atproto import AsyncClient, IdResolver, AtUri
-from atproto_client.models.app.bsky.embed.record import ViewRecord
-from atproto_client.models.app.bsky.feed.defs import ThreadViewPost, PostView
-
-from app.config import JINJA2_ENV
-from app.models.metadata_item import MediaFile, MessageType
-from app.services.scrapers.scraper import Scraper, DataProcessor
-from app.services.scrapers.bluesky import Bluesky
-from app.services.scrapers.bluesky.config import BLUESKY_HOST, BLUESKY_MAX_LENGTH
-from app.utils.logger import logger
-from app.utils.parse import wrap_text_into_html
-
-telegram_text_template = JINJA2_ENV.get_template("bluesky_telegram_text.jinja2")
-content_template = JINJA2_ENV.get_template("bluesky_content.jinja2")
-
-
-class BlueskyPost:
-    def __init__(self, bluesky_url: str):
-        self.url: str = bluesky_url
-        bluesky_url_parser = urlparse(bluesky_url)
-        self.bluesky_host: Optional[str] = bluesky_url_parser.netloc
-        bluesky_path = bluesky_url_parser.path
-        self.handle: Optional[str] = bluesky_path.split("/")[2]
-        self.post_rkey: Optional[str] = bluesky_path.split("/")[-1]
-        self.did: str = BlueskyScraper.id_resolver.handle.resolve(self.handle)
-
-
-class BlueskyDataProcessor(DataProcessor):
-
-    def __init__(self, url: str, bluesky_thread_data: ThreadViewPost):
-        self.url: str = url
-        self.bluesky_thread_data: ThreadViewPost = bluesky_thread_data
-        logger.debug(
-            f"BlueskyDataProcessor initialized with url: {url}\n and bluesky_thread_data: \n{bluesky_thread_data}")
-        self._data: dict = {}
-
-    async def get_item(self) -> dict:
-        await self.process_data()
-        bluesky_item = Bluesky.from_dict(self._data)
-        return bluesky_item.to_dict()
-        pass
-
-    async def process_data(self):
-        await self._resolve_thread_data()
-
-    async def _resolve_thread_data(self) -> None:
-        base_post_view_data = await BlueskyDataProcessor._resolve_single_post_data(self.bluesky_thread_data.post)
-        base_post_view_data["url"] = self.url
-
-        post_author_did = base_post_view_data["author_did"]
-
-        parent_posts_text = ""
-        parent_posts_content = ""
-        parent_posts_media_files = []
-        replies_posts_text = ""
-        replies_posts_content = ""
-        replies_posts_media_files = []
-        # get post data from the parent posts whose author is the same as the base post author
-        if self.bluesky_thread_data.parent:
-            parent_posts_data = []
-            parent_post_view = self.bluesky_thread_data.parent
-            await BlueskyDataProcessor._get_parent_posts_data(parent_post_view, parent_posts_data)
-            if parent_posts_data:
-                for post_data in parent_posts_data:
-                    parent_posts_text += "\n" + post_data["text"]
-                    parent_posts_content += post_data["content"]
-                    parent_posts_media_files.extend(post_data["media_files"])
-        # get post data from the replies whose author is the same as the base post author
-        if self.bluesky_thread_data.replies:
-            replies_posts_data = []
-            for post_thread_view in self.bluesky_thread_data.replies:
-                post_view = post_thread_view.post
-                if post_author_did == post_view.author.did:
-                    post_data = await BlueskyDataProcessor._resolve_single_post_data(post_view)
-                    replies_posts_data.append(post_data)
-            if replies_posts_data:
-                for post_data in replies_posts_data:
-                    replies_posts_text += "\n" + post_data["text"]
-                    replies_posts_content += post_data["content"]
-                    replies_posts_media_files.extend(post_data["media_files"])
-        base_post_view_data["text"] = parent_posts_text + base_post_view_data["text"] + replies_posts_text
-        base_post_view_data["content"] = parent_posts_content + base_post_view_data["content"] + replies_posts_content
-        base_post_view_data["media_files"] = parent_posts_media_files + base_post_view_data[
-            "media_files"] + replies_posts_media_files
-
-        if len(base_post_view_data["text"]) > BLUESKY_MAX_LENGTH:
-            base_post_view_data["message_type"] = MessageType.LONG
-        else:
-            base_post_view_data["message_type"] = MessageType.SHORT
-
-        self._data = base_post_view_data
-
-    @staticmethod
-    async def _get_parent_posts_data(parent_post_view: ThreadViewPost, parent_posts_data_list: list) -> None:
-        parent_post_data = await BlueskyDataProcessor._resolve_single_post_data(parent_post_view.post)
-        parent_posts_data_list.append(parent_post_data)
-        if parent_post_view.parent:
-            await BlueskyDataProcessor._get_parent_posts_data(parent_post_view.parent, parent_posts_data_list)
-
-    @staticmethod
-    async def _resolve_single_post_data(post_data: PostView) -> dict:
-        at_uri = AtUri.from_str(post_data.uri)
-        url = BLUESKY_HOST + "/profile/" + post_data.author.handle + "/post/" + at_uri.rkey
-        author = post_data.author.display_name
-        author_url = BLUESKY_HOST + "/profile/" + post_data.author.handle
-        author_did = post_data.author.did
-        text = post_data.record.text
-        created_at = post_data.record.created_at
-
-        parsed_post_data = {
-            "url": url,
-            "title": author + "\'s Bluesky post",
-            "author": author,
-            "author_url": author_url,
-            "text": text,
-            "category": "bluesky",
-            "media_files": [],
-            "created_at": created_at,
-            "author_did": author_did,
-        }
-
-        media_files = []
-        if post_data.embed is not None:
-            # images and videos
-            if "images" in post_data.embed.__dict__:
-                for image in post_data.embed.images:
-                    img_url = image.fullsize
-                    img_item = {
-                        "media_type": "image",
-                        "url": img_url,
-                        "caption": "",
-                    }
-                    media_files.append(img_item)
-            # TODO: handle video, which is in m3u8 format that needs to be downloaded and converted to mp4
-            parsed_post_data["media_files"] = media_files
-            # retweet post
-            if "record" in post_data.embed.__dict__ and post_data.embed.record is ViewRecord:
-                retweet_post_data = await BlueskyDataProcessor._resolve_single_post_data(post_data.embed.record)
-                parsed_post_data["retweet_post"] = retweet_post_data
-
-        content = await BlueskyDataProcessor._generate_html_content(parsed_post_data)
-        text = await BlueskyDataProcessor._generate_telegram_text(parsed_post_data)
-        parsed_post_data["content"] = content
-        parsed_post_data["text"] = text
-
-        return parsed_post_data
-
-    @staticmethod
-    async def _generate_html_content(data: dict) -> str:
-        html_content_text = wrap_text_into_html(data["text"])
-        data["html_content_text"] = html_content_text
-        content = content_template.render(data=data)
-        return content
-
-    @staticmethod
-    async def _generate_telegram_text(data: dict) -> str:
-        text = telegram_text_template.render(data=data)
-        return text
-
-
-class BlueskyScraper(Scraper):
-    id_resolver = IdResolver()
-
-    def __init__(self, username: Optional[str] = None, password: Optional[str] = None):
-        self.client: AsyncClient = AsyncClient()
-        self.username: Optional[str] = username
-        self.password: Optional[str] = password
-        self.did: Optional[str] = None
-
-    async def init(self):
-        if self.username and self.password:
-            await self.client.login(self.username, self.password)
-            # self.did = await self.client.com
-
-    async def get_processor_by_url(self, url: str) -> BlueskyDataProcessor:
-        bluesky_post = BlueskyPost(url)
-        bluesky_post_data = await self._request_post_data(bluesky_post)
-        return BlueskyDataProcessor(url, bluesky_post_data)
-
-    async def _request_post_data(self, bluesky_post: BlueskyPost) -> ThreadViewPost:
-        profile_identify = bluesky_post.did or bluesky_post.handle
-        try:
-            post_data = await self.client.get_post(profile_identify=profile_identify, post_rkey=bluesky_post.post_rkey)
-            post_uri = post_data.uri
-            post_thread_data = await self.client.get_post_thread(uri=post_uri)
-            return post_thread_data.thread
-        except Exception as e:
-            logger.error(f"Error while getting post data: {e}")
diff --git a/app/services/scrapers/common.py b/app/services/scrapers/common.py
deleted file mode 100644
index bdb1a42..0000000
--- a/app/services/scrapers/common.py
+++ /dev/null
@@ -1,114 +0,0 @@
-from typing import Optional, Any
-
-from app.models.database_model import Metadata
-from app.models.url_metadata import UrlMetadata
-from app.models.metadata_item import MessageType
-from app.services import (
-    telegraph,
-    inoreader
-)
-from app.services.file_export import video_download, document_export
-from app.services.scrapers import twitter, wechat, reddit, weibo, zhihu, douban, instagram, xiaohongshu, threads
-from app.services.scrapers.scraper_manager import ScraperManager
-from app.database import save_instances
-from app.utils.logger import logger
-from app.config import DATABASE_ON
-
-
-class InfoExtractService(object):
-    service_classes: dict = {
-        "twitter": twitter.Twitter,
-        "threads": threads.Threads,
-        "reddit": reddit.Reddit,
-        "weibo": weibo.Weibo,
-        "wechat": wechat.Wechat,
-        "instagram": instagram.Instagram,
-        "douban": douban.Douban,
-        "zhihu": zhihu.Zhihu,
-        "xiaohongshu": xiaohongshu.Xiaohongshu,
-        "youtube": video_download.VideoDownloader,
-        "bilibili": video_download.VideoDownloader,
-        "inoreader": inoreader.Inoreader,
-    }
-
-    def __init__(
-            self,
-            url_metadata: UrlMetadata,
-            data: Any = None,
-            store_database: Optional[bool] = DATABASE_ON,
-            store_telegraph: Optional[bool] = True,
-            store_document: Optional[bool] = False,
-            **kwargs,
-    ):
-        url_metadata = url_metadata.to_dict()
-        self.url = url_metadata["url"]
-        self.content_type = url_metadata["content_type"]
-        self.source = url_metadata["source"]
-        self.data = data
-        self.kwargs = kwargs
-        self.store_database = store_database
-        self.store_telegraph = store_telegraph
-        self.store_document = store_document
-
-    @property
-    def category(self) -> str:
-        return self.source
-
-    async def get_item(self, metadata_item: Optional[dict] = None) -> dict:
-        if self.content_type == "video":
-            if not self.kwargs.get("category"):
-                self.kwargs["category"] = self.category
-        if not metadata_item:
-            try:
-                if self.category in ["bluesky", "weibo", "other", "unknown"]:  # it is a workaround before the code refactor
-                    await ScraperManager.init_scraper(self.category)
-                    item_data_processor = await ScraperManager.scrapers[self.category].get_processor_by_url(url=self.url)
-                    metadata_item = await item_data_processor.get_item()
-                else:
-                    scraper_item = InfoExtractService.service_classes[self.category](
-                        url=self.url, data=self.data, **self.kwargs
-                    )
-                    metadata_item = await scraper_item.get_item()
-            except Exception as e:
-                logger.error(f"Error while getting item: {e}")
-                raise e
-        logger.info(f"Got metadata item")
-        logger.debug(metadata_item)
-        metadata_item = await self.process_item(metadata_item)
-        return metadata_item
-
-    async def process_item(self, metadata_item: dict) -> dict:
-        if metadata_item.get("message_type") == MessageType.LONG:
-            self.store_telegraph = True
-            logger.info("message type is long, store in telegraph")
-        if self.store_telegraph:
-            telegraph_item = telegraph.Telegraph.from_dict(metadata_item)
-            try:
-                telegraph_url = await telegraph_item.get_telegraph()
-            except Exception as e:
-                logger.error(f"Error while getting telegraph: {e}")
-                telegraph_url = ""
-            metadata_item["telegraph_url"] = telegraph_url
-        if self.store_document or (
-                not self.store_document and metadata_item["telegraph_url"] == ""
-        ):
-            logger.info("store in document")
-            try:
-                pdf_document = document_export.pdf_export.PdfExport(
-                    title=metadata_item["title"], html_string=metadata_item["content"]
-                )
-                output_filename = await pdf_document.export(method="file")
-                metadata_item["media_files"].append(
-                    {
-                        "media_type": "document",
-                        "url": output_filename,
-                        "caption": "",
-                    }
-                )
-            except Exception as e:
-                logger.error(f"Error while exporting document: {e}")
-        metadata_item["title"] = metadata_item["title"].strip()
-        if self.store_database:
-            logger.info("store in database")
-            await save_instances(Metadata.model_construct(**metadata_item))
-        return metadata_item
diff --git a/app/services/scrapers/douban/__init__.py b/app/services/scrapers/douban/__init__.py
deleted file mode 100644
index feec305..0000000
--- a/app/services/scrapers/douban/__init__.py
+++ /dev/null
@@ -1,230 +0,0 @@
-import re
-from typing import Dict, Optional, Any
-from enum import Enum
-from urllib.parse import urlparse
-
-from bs4 import BeautifulSoup
-from lxml import etree
-
-from app.utils.parse import get_html_text_length, wrap_text_into_html
-from app.utils.network import get_selector, HEADERS
-from app.models.metadata_item import MetadataItem, MediaFile, MessageType
-from app.config import JINJA2_ENV
-
-SHORT_LIMIT = 600
-
-short_text_template = JINJA2_ENV.get_template("douban_short_text.jinja2")
-content_template = JINJA2_ENV.get_template("douban_content.jinja2")
-
-
-class DoubanType(str, Enum):
-    MOVIE_REVIEW = "movie_review"
-    BOOK_REVIEW = "book_review"
-    NOTE = "note"
-    STATUS = "status"
-    GROUP = "group"
-    UNKNOWN = "unknown"
-
-
-class Douban(MetadataItem):
-    item_title: Optional[str]
-    item_url: Optional[str]
-    group_name: Optional[str]
-    group_url: Optional[str]
-    douban_type: DoubanType
-    text_group: Optional[str]
-    raw_content: Optional[str]
-    date: Optional[str]
-
-    def __init__(self, url: str, data: Optional[Any] = None, **kwargs):
-        # metadata fields
-        self.url = url
-        self.title = ""
-        self.author = ""
-        self.author_url = ""
-        self.text = ""
-        self.content = ""
-        self.media_files = []
-        self.category = "douban"
-        self.message_type = MessageType.SHORT
-        # auxiliary fields
-        self.item_title: Optional[str] = None
-        self.item_url: Optional[str] = None
-        self.group_name: Optional[str] = None
-        self.group_url: Optional[str] = None
-        self.douban_type: DoubanType = DoubanType.UNKNOWN
-        self.text_group: Optional[str] = None
-        self.raw_content: Optional[str] = None
-        self.date: Optional[str] = None
-        # reqeust fields
-        self.headers = HEADERS
-        self.headers["Cookie"] = kwargs.get("cookie", "")
-
-    async def get_item(self) -> dict:
-        await self.get_douban()
-        return self.to_dict()
-
-    async def get_douban(self) -> None:
-        self.check_douban_type()
-        await self.get_douban_item()
-
-    def check_douban_type(self):
-        urlparser = urlparse(self.url)
-        host = urlparser.netloc
-        path = urlparser.path
-        if host.find("m.douban") != -1:  # parse the m.douban url
-            host = host.replace("m.douban", "douban")
-            if path.startswith("/movie/review"):
-                self.douban_type = DoubanType.MOVIE_REVIEW
-                host = host.replace("douban", "movie.douban")
-                path = path.replace("/movie/", "/")
-            elif path.startswith("/book/review"):
-                self.douban_type = DoubanType.BOOK_REVIEW
-                host = host.replace("douban", "book.douban")
-                path = path.replace("/book/", "/")
-        if path.startswith("/note/"):
-            self.douban_type = DoubanType.NOTE
-        elif path.startswith("/status/") or re.match(r"/people/\d+/status/\d+", path):
-            self.douban_type = DoubanType.STATUS
-        elif path.startswith("/group/topic/"):
-            self.douban_type = DoubanType.GROUP
-        elif host.startswith("movie.douban") and path.startswith("/review/"):
-            self.douban_type = DoubanType.MOVIE_REVIEW
-        elif host.startswith("book.douban") and path.startswith("/review/"):
-            self.douban_type = DoubanType.BOOK_REVIEW
-        else:
-            self.douban_type = DoubanType.UNKNOWN
-        self.url = f"https://{host}{path}"
-
-    async def get_douban_item(self):
-        function_dict = {
-            DoubanType.MOVIE_REVIEW: self._get_douban_movie_review,
-            DoubanType.BOOK_REVIEW: self._get_douban_book_review,
-            DoubanType.NOTE: self._get_douban_note,
-            DoubanType.STATUS: self._get_douban_status,
-            DoubanType.GROUP: self._get_douban_group_article,
-            DoubanType.UNKNOWN: None,
-        }
-        await function_dict[self.douban_type]()
-        short_text = self._douban_short_text_process()
-        if short_text.endswith("\n"):
-            short_text = short_text[:-1]
-        data = self.__dict__
-        data["short_text"] = short_text
-        self.text = short_text_template.render(data=data)
-        self.raw_content = self.raw_content_to_html(self.raw_content)
-        self.content = wrap_text_into_html(
-            content_template.render(data=data), is_html=True
-        )
-        if get_html_text_length(self.content) > SHORT_LIMIT:
-            self.message_type = MessageType.LONG
-        else:
-            self.message_type = MessageType.SHORT
-
-    async def _get_douban_movie_review(self):
-        selector = await get_selector(url=self.url, headers=self.headers)
-        self.title = selector.xpath('string(//div[@id="content"]//h1//span)')
-        self.author = selector.xpath('string(//header[@class="main-hd"]//span)')
-        self.author_url = selector.xpath('string(//header[@class="main-hd"]/a/@href)')
-        self.item_title = selector.xpath('string(//header[@class="main-hd"]/a[2])')
-        self.item_url = selector.xpath('string(//header[@class="main-hd"]/a[2]/@href)')
-        self.raw_content = str(
-            etree.tostring(
-                selector.xpath("//div[contains(@class,'review-content')]")[0],
-                encoding="utf-8",
-            ),
-            encoding="utf-8",
-        )
-
-    async def _get_douban_book_review(self):
-        selector = await get_selector(self.url, headers=self.headers)
-        self.title = selector.xpath('string(//div[@id="content"]//h1//span)')
-        self.author = selector.xpath('string(//header[@class="main-hd"]//span)')
-        self.author_url = selector.xpath('string(//header[@class="main-hd"]/a/@href)')
-        self.item_title = selector.xpath('string(//header[@class="main-hd"]/a[2])')
-        self.item_url = selector.xpath('string(//header[@class="main-hd"]/a[2]/@href)')
-        self.raw_content = str(
-            etree.tostring(
-                selector.xpath('//div[@id="link-report"]')[0], encoding="utf-8"
-            ),
-            encoding="utf-8",
-        )
-
-    async def _get_douban_note(self):
-        selector = await get_selector(self.url, headers=self.headers)
-        self.title = selector.xpath("string(//h1)")
-        self.author = selector.xpath('string(//div[@class="content"]/a)')
-        self.author_url = selector.xpath('string(//div[@class="content"]/a/@href)')
-        self.raw_content = str(
-            etree.tostring(
-                selector.xpath('//div[@id="link-report"]')[0], encoding="utf-8"
-            ),
-            encoding="utf-8",
-        )
-
-    async def _get_douban_status(self):
-        selector = await get_selector(self.url, headers=self.headers)
-        self.author = selector.xpath('string(//div[@class="content"]/a)')
-        self.author_url = selector.xpath('string(//div[@class="content"]/a/@href)')
-        self.title = self.author + "的广播"
-        self.raw_content = (
-            str(
-                etree.tostring(
-                    selector.xpath('//div[@class="status-saying"]')[0], encoding="utf-8"
-                ),
-                encoding="utf-8",
-            )
-            .replace("<blockquote>", "")
-            .replace("</blockquote>", "")
-            .replace(">+<", "><")
-            .replace("&#13;", "<br>")
-        )
-
-    async def _get_douban_group_article(self):
-        selector = await get_selector(self.url, headers=self.headers)
-        self.title = selector.xpath('string(//div[@id="content"]//h1)')
-        self.title = self.title.replace("\n", "").strip()
-        self.author = selector.xpath('string(//span[@class="from"]//a)')
-        self.author_url = selector.xpath('string(//span[@class="from"]//a/@href)')
-        self.group_name = selector.xpath(
-            'string(//div[@id="g-side-info"]//div[@class="title"]/a)'
-        )
-        self.group_url = selector.xpath(
-            'string(//div[@id="g-side-info"]//div[@class="title"]/a/@href)'
-        )
-        self.raw_content = str(
-            etree.tostring(
-                selector.xpath('//div[@id="link-report"]')[0], encoding="utf-8"
-            ),
-            encoding="utf-8",
-        )
-
-    def _douban_short_text_process(self) -> str:
-        soup = BeautifulSoup(self.raw_content, "html.parser")
-        for img in soup.find_all("img"):
-            media_item = {"media_type": "image", "url": img["src"], "caption": ""}
-            self.media_files.append(MediaFile.from_dict(media_item))
-            img.extract()
-        for item in soup.find_all(["p", "span", "div"]):
-            item.unwrap()
-        for item in soup.find_all(["link", "script"]):
-            item.decompose()
-        for item in soup.find_all("a"):
-            if item.get("title") == "查看原图":
-                item.decompose()
-        short_text = str(soup)
-        short_text = re.sub(r"\n{2,}", "\n", short_text)
-        short_text = re.sub(r"<br\s*/?>", "\n", short_text)
-        return short_text
-
-    @staticmethod
-    def raw_content_to_html(raw_content: str) -> str:
-        # Split the text into paragraphs based on double newlines
-        print(raw_content)
-        paragraphs = raw_content.split('<br>\n')
-        # Wrap each paragraph with <p> tags
-        print(paragraphs)
-        html_paragraphs = [f'<p>{paragraph.strip()}</p>' for paragraph in paragraphs]
-        # Join the paragraphs to form the final HTML string
-        html_string = ''.join(html_paragraphs)
-        return html_string
diff --git a/app/services/scrapers/general/__init__.py b/app/services/scrapers/general/__init__.py
deleted file mode 100644
index 94c0402..0000000
--- a/app/services/scrapers/general/__init__.py
+++ /dev/null
@@ -1,40 +0,0 @@
-from dataclasses import dataclass
-from typing import Any
-
-from app.models.metadata_item import MetadataItem
-
-
-@dataclass
-class GeneralItem(MetadataItem):
-    """
-    GeneralItem: Data class for scraped content from general webpage scrapers.
-    """
-    id: str = ""
-    raw_content: str = ""
-    scraper_type: str = ""  # Which scraper was used (e.g., "firecrawl", "zyte", etc.)
-
-    @staticmethod
-    def from_dict(obj: Any) -> "GeneralItem":
-        metadata_item = MetadataItem.from_dict(obj)
-        return GeneralItem(
-            url=metadata_item.url,
-            title=metadata_item.title,
-            author=metadata_item.author,
-            author_url=metadata_item.author_url,
-            telegraph_url=metadata_item.telegraph_url,
-            text=metadata_item.text,
-            content=metadata_item.content,
-            media_files=metadata_item.media_files,
-            category=metadata_item.category,
-            message_type=metadata_item.message_type,
-            id=obj.get("id", ""),
-            raw_content=obj.get("raw_content", ""),
-            scraper_type=obj.get("scraper_type", ""),
-        )
-
-    def to_dict(self) -> dict:
-        result: dict = super().to_dict()
-        result["id"] = self.id
-        result["raw_content"] = self.raw_content
-        result["scraper_type"] = self.scraper_type
-        return result
diff --git a/app/services/scrapers/general/base.py b/app/services/scrapers/general/base.py
deleted file mode 100644
index 1ab9360..0000000
--- a/app/services/scrapers/general/base.py
+++ /dev/null
@@ -1,208 +0,0 @@
-import hashlib
-from abc import abstractmethod
-from typing import Optional
-from urllib.parse import urlparse
-
-from bs4 import BeautifulSoup, Doctype
-from openai import AsyncOpenAI
-from openai.types.chat import ChatCompletionSystemMessageParam, ChatCompletionUserMessageParam
-
-from app.config import OPENAI_API_KEY
-from app.models.metadata_item import MediaFile, MessageType
-from app.services.scrapers.scraper import Scraper, DataProcessor
-from app.services.scrapers.general import GeneralItem
-from app.utils.parse import get_html_text_length, wrap_text_into_html
-from app.utils.logger import logger
-
-GENERAL_TEXT_LIMIT = 800
-
-DEFAULT_OPENAI_MODEL = "gpt-5-nano"
-
-# System prompt for LLM to extract article content
-ARTICLE_EXTRACTION_PROMPT = """You are an expert content extractor. Your task is to extract the main article content from the provided HTML.
-
-Instructions:
-1. Identify and extract ONLY the main article/post content
-2. Remove navigation, headers, footers, sidebars, ads, comments, and other non-article elements
-3. Preserve the article's structure (headings, paragraphs, lists, etc.)
-4. Keep important formatting like bold, italic, links, and images
-5. Return clean HTML containing only the article content
-6. If you cannot identify the main content, return the original HTML unchanged
-7. After all of the above, remove some basic HTML tags like <!DOCTYPE>, <html>, <script>, <body>
-
-Return ONLY the extracted HTML content, no explanations or markdown."""
-
-
-class BaseGeneralDataProcessor(DataProcessor):
-    """
-    Base class for general webpage data processors.
-    Each specific scraper (Firecrawl, Zyte, etc.) should inherit from this class.
-    """
-
-    def __init__(self, url: str):
-        self.url: str = url
-        self._data: dict = {}
-        self.url_parser = urlparse(url)
-        self.id = hashlib.md5(url.encode()).hexdigest()[:16]
-        self.scraper_type: str = "base"
-
-    async def get_item(self) -> dict:
-        await self.process_data()
-        general_item = GeneralItem.from_dict(self._data)
-        return general_item.to_dict()
-
-    async def process_data(self) -> None:
-        await self._get_page_content()
-
-    @abstractmethod
-    async def _get_page_content(self) -> None:
-        """Subclasses must implement this method to fetch page content."""
-        pass
-
-    async def _build_item_data(
-        self,
-        title: str,
-        author: str,
-        description: str,
-        markdown_content: str,
-        html_content: str,
-        og_image: Optional[str] = None,
-    ) -> None:
-        """
-        Common method to build item data from scraped content.
-        """
-        item_data = {
-            "id": self.id,
-            "category": "other",
-            "url": self.url,
-            "title": title or self.url,
-            "author": author or self.url_parser.netloc,
-            "author_url": f"{self.url_parser.scheme}://{self.url_parser.netloc}",
-            "scraper_type": self.scraper_type,
-        }
-
-        # Process text content - use description or first part of markdown
-        # Strip any HTML tags to ensure plain text for Telegram short messages
-        text = description if description else (markdown_content or "")[:500]
-        text = BeautifulSoup(text, "html.parser").get_text()
-        item_data["text"] = text
-
-        # Process HTML content with LLM if available, then sanitize deterministically
-        if html_content:
-            cleaned_html = await self.parsing_article_body_by_llm(html_content)
-            cleaned_html = self.sanitize_html(cleaned_html)
-            content = wrap_text_into_html(cleaned_html, is_html=True)
-        else:
-            content = wrap_text_into_html(markdown_content or "", is_html=False)
-        item_data["content"] = content
-        item_data["raw_content"] = markdown_content
-
-        # Process media files - extract og:image if available
-        media_files = []
-        if og_image:
-            media_files.append(MediaFile(url=og_image, media_type="image"))
-
-        item_data["media_files"] = [m.to_dict() for m in media_files]
-
-        # Determine the message type based on content length (not text length)
-        item_data["message_type"] = (
-            MessageType.LONG
-            if get_html_text_length(content) > GENERAL_TEXT_LIMIT
-            else MessageType.SHORT
-        )
-
-        self._data = item_data
-
-    @staticmethod
-    def sanitize_html(html_content: str) -> str:
-        """
-        Deterministic HTML sanitizer that removes all non-content tags.
-
-        This runs AFTER the LLM extraction as a safety net — the LLM is unreliable,
-        and when it fails (or when OPENAI_API_KEY is not set), raw Firecrawl HTML
-        (including <!DOCTYPE>, <script>, etc.) passes through unchanged.
-
-        Keeps content-meaningful tags: p, h1-h6, a, b/strong, i/em, u, ul, ol, li,
-        blockquote, pre, code, img, br, table, tr, td, th, thead, tbody.
-        """
-        if not html_content:
-            return html_content
-
-        soup = BeautifulSoup(html_content, "html.parser")
-
-        # Remove DOCTYPE declarations
-        for item in soup.contents:
-            if isinstance(item, Doctype):
-                item.extract()
-
-        # Remove tags that should be destroyed with all their content
-        for tag_name in ["script", "style", "head", "meta", "link", "noscript", "iframe", "svg", "form", "input", "button"]:
-            for tag in soup.find_all(tag_name):
-                tag.decompose()
-
-        # Unwrap structural/layout tags — keep their text content, discard the tag itself
-        for tag_name in ["html", "body", "div", "span", "section", "article", "nav",
-                         "header", "footer", "main", "aside", "figure", "figcaption",
-                         "details", "summary", "dd", "dt", "dl"]:
-            for tag in soup.find_all(tag_name):
-                tag.unwrap()
-
-        return str(soup).strip()
-
-    @staticmethod
-    async def parsing_article_body_by_llm(html_content: str) -> str:
-        """
-        Use LLM to extract the main article content from HTML.
-
-        Args:
-            html_content: Raw HTML content from a scraper
-
-        Returns:
-            Cleaned HTML containing only the main article content
-        """
-        if not html_content:
-            return html_content
-
-        if not OPENAI_API_KEY:
-            logger.warning("OPENAI_API_KEY not configured, skipping LLM parsing")
-            return html_content
-
-        try:
-            client = AsyncOpenAI(api_key=OPENAI_API_KEY)
-
-            # Truncate content if too long to avoid token limits
-            max_content_length = 50000
-            truncated_content = html_content[:max_content_length] if len(html_content) > max_content_length else html_content
-
-            response = await client.chat.completions.create(
-                model=DEFAULT_OPENAI_MODEL,
-                messages=[
-                    ChatCompletionSystemMessageParam(role="system", content=ARTICLE_EXTRACTION_PROMPT),
-                    ChatCompletionUserMessageParam(role="user", content=f"Extract the main article content from this HTML:\n\n{truncated_content}")
-                ],
-                temperature=0.1,
-                max_completion_tokens=10000,
-            )
-
-            extracted_content = response.choices[0].message.content
-
-            if extracted_content:
-                logger.info("Successfully extracted article content using LLM")
-                return extracted_content.strip()
-            else:
-                logger.warning("LLM returned empty content, using original HTML")
-                return html_content
-
-        except Exception as e:
-            logger.error(f"Failed to parse article body with LLM: {e}")
-            return html_content
-
-
-class BaseGeneralScraper(Scraper):
-    """
-    Base class for general webpage scrapers.
-    """
-
-    @abstractmethod
-    async def get_processor_by_url(self, url: str) -> DataProcessor:
-        pass
diff --git a/app/services/scrapers/general/firecrawl.py b/app/services/scrapers/general/firecrawl.py
deleted file mode 100644
index 093fe75..0000000
--- a/app/services/scrapers/general/firecrawl.py
+++ /dev/null
@@ -1,65 +0,0 @@
-from app.config import FIRECRAWL_WAIT_FOR
-from app.services.scrapers.general.base import BaseGeneralDataProcessor, BaseGeneralScraper
-from app.services.scrapers.general.firecrawl_client import FirecrawlClient
-from app.services.scrapers.scraper import DataProcessor
-from app.utils.logger import logger
-
-# HTML tags to exclude from Firecrawl output at the source
-FIRECRAWL_EXCLUDE_TAGS = [
-    "nav", "footer", "aside", "script", "style",
-    "noscript", "iframe", "svg", "form",
-]
-
-
-class FirecrawlDataProcessor(BaseGeneralDataProcessor):
-    """
-    FirecrawlDataProcessor: Process URLs using Firecrawl to extract content.
-    """
-
-    def __init__(self, url: str):
-        super().__init__(url)
-        self.scraper_type = "firecrawl"
-        self._client: FirecrawlClient = FirecrawlClient.get_instance()
-
-    async def _get_page_content(self) -> None:
-        try:
-            result = await self._client.scrape_url(
-                url=self.url,
-                formats=["markdown", "html"],
-                only_main_content=True,
-                exclude_tags=FIRECRAWL_EXCLUDE_TAGS,
-                wait_for=FIRECRAWL_WAIT_FOR,
-            )
-            await self._process_firecrawl_result(result)
-        except Exception as e:
-            logger.error(f"Failed to scrape URL with Firecrawl: {e}")
-            raise
-
-    async def _process_firecrawl_result(self, result: dict) -> None:
-        metadata = result.get("metadata", {})
-        markdown_content = result.get("markdown", "")
-        html_content = result.get("html", "")
-
-        # Extract metadata fields
-        title = metadata.get("title", "") or metadata.get("ogTitle", "")
-        author = metadata.get("author", "") or metadata.get("ogSiteName", "")
-        description = metadata.get("description", "") or metadata.get("ogDescription", "")
-        og_image = metadata.get("ogImage")
-
-        await self._build_item_data(
-            title=title,
-            author=author,
-            description=description,
-            markdown_content=markdown_content,
-            html_content=html_content,
-            og_image=og_image,
-        )
-
-
-class FirecrawlScraper(BaseGeneralScraper):
-    """
-    FirecrawlScraper: Scraper implementation using Firecrawl for generic URL scraping.
-    """
-
-    async def get_processor_by_url(self, url: str) -> DataProcessor:
-        return FirecrawlDataProcessor(url)
diff --git a/app/services/scrapers/general/firecrawl_client.py b/app/services/scrapers/general/firecrawl_client.py
deleted file mode 100644
index b92e3bd..0000000
--- a/app/services/scrapers/general/firecrawl_client.py
+++ /dev/null
@@ -1,94 +0,0 @@
-from __future__ import annotations
-
-import threading
-from dataclasses import dataclass
-from typing import Any, Dict, List, Optional
-
-from firecrawl import AsyncFirecrawl
-
-from app.config import FIRECRAWL_API_URL, FIRECRAWL_API_KEY
-
-
-@dataclass(frozen=True)
-class FirecrawlSettings:
-    api_url: str
-    api_key: str
-
-
-class FirecrawlClient:
-    """
-    FirecrawlClient: 对 firecrawl python SDK 的封装 + 单例访问点。
-
-    - 提供 scrape / crawl 等常用方法，方便其他模块调用
-    - 线程安全单例（适合 Web 服务 / worker 多线程场景）
-    """
-
-    _instance: Optional["FirecrawlClient"] = None
-    _lock = threading.Lock()
-
-    def __init__(self, config: FirecrawlSettings):
-        self._settings: FirecrawlSettings = config
-        self._app: AsyncFirecrawl = self._create_app(config)
-
-    @staticmethod
-    def _create_app(config: FirecrawlSettings) -> AsyncFirecrawl:
-        return AsyncFirecrawl(api_url=config.api_url, api_key=config.api_key)
-
-    @classmethod
-    def get_instance(cls) -> "FirecrawlClient":
-        """
-        线程安全的单例获取。
-        - 首次调用可传 settings
-        - 之后重复调用可不传
-        """
-        if cls._instance is not None:
-            return cls._instance
-
-        with cls._lock:
-            if cls._instance is not None:
-                return cls._instance
-
-            config = FirecrawlSettings(
-                api_url=FIRECRAWL_API_URL,
-                api_key=FIRECRAWL_API_KEY,
-            )
-
-            cls._instance = cls(config)
-            return cls._instance
-
-    @classmethod
-    def reset_instance(cls) -> None:
-        """测试用：重置单例。"""
-        with cls._lock:
-            cls._instance = None
-
-    async def scrape_url(
-            self,
-            url: str,
-            formats: Optional[List[str]] = None,
-            only_main_content: bool = True,
-            timeout: Optional[int] = None,
-            exclude_tags: Optional[List[str]] = None,
-            wait_for: Optional[int] = None,
-    ) -> Dict[str, Any]:
-        """
-        Args:
-            url: The URL to scrape.
-            formats: Output formats (e.g. ["markdown", "html"]).
-            only_main_content: If True, extract only the main content.
-            timeout: Request timeout in milliseconds.
-            exclude_tags: HTML tag names to exclude from output (e.g. ["nav", "footer"]).
-            wait_for: Time in milliseconds to wait for JS rendering before scraping.
-        """
-        try:
-            result = await self._app.scrape(
-                url,
-                formats=formats,
-                only_main_content=only_main_content,
-                timeout=timeout,
-                exclude_tags=exclude_tags,
-                wait_for=wait_for,
-            )
-            return result.model_dump(exclude_none=True)
-        except Exception as e:
-            raise RuntimeError(f"Firecrawl scrape_url failed: url={url}") from e
diff --git a/app/services/scrapers/general/scraper.py b/app/services/scrapers/general/scraper.py
deleted file mode 100644
index 17d9c38..0000000
--- a/app/services/scrapers/general/scraper.py
+++ /dev/null
@@ -1,86 +0,0 @@
-from typing import Optional
-
-from app.config import GENERAL_SCRAPING_API
-from app.services.scrapers.scraper import Scraper, DataProcessor
-from app.services.scrapers.general.base import BaseGeneralScraper
-from app.services.scrapers.general.firecrawl import FirecrawlScraper
-from app.services.scrapers.general.zyte import ZyteScraper
-from app.utils.logger import logger
-
-
-class GeneralScraper(Scraper):
-    """
-    GeneralScraper: A wrapper scraper that delegates to the configured scraper implementation.
-
-    This class acts as a factory/facade that selects the appropriate scraper
-    based on the GENERAL_SCRAPING_API configuration.
-
-    Supported scrapers:
-    - FIRECRAWL: Uses Firecrawl API for scraping
-    - ZYTE: Uses Zyte API for scraping
-    """
-
-    # Registry of available scrapers
-    SCRAPER_REGISTRY: dict[str, type[BaseGeneralScraper]] = {
-        "FIRECRAWL": FirecrawlScraper,
-        "ZYTE": ZyteScraper,
-    }
-
-    def __init__(self, scraper_type: Optional[str] = None):
-        """
-        Initialize the GeneralScraper with a specific scraper type.
-
-        Args:
-            scraper_type: The type of scraper to use. If None, uses GENERAL_SCRAPING_API config.
-        """
-        self.scraper_type = scraper_type or GENERAL_SCRAPING_API
-        self._scraper: Optional[BaseGeneralScraper] = None
-        self._init_scraper()
-
-    def _init_scraper(self) -> None:
-        """Initialize the underlying scraper based on scraper_type."""
-        scraper_class = self.SCRAPER_REGISTRY.get(self.scraper_type.upper())
-
-        if scraper_class is None:
-            available = ", ".join(self.SCRAPER_REGISTRY.keys())
-            logger.error(f"Unknown scraper type: {self.scraper_type}. Available: {available}")
-            # Fall back to Firecrawl as default
-            logger.info("Falling back to FIRECRAWL scraper")
-            scraper_class = FirecrawlScraper
-
-        self._scraper = scraper_class()
-        logger.info(f"Initialized GeneralScraper with {self.scraper_type} backend")
-
-    async def get_processor_by_url(self, url: str) -> DataProcessor:
-        """
-        Get the appropriate data processor for the given URL.
-
-        Args:
-            url: The URL to scrape
-
-        Returns:
-            DataProcessor instance for processing the URL
-        """
-        return await self._scraper.get_processor_by_url(url)
-
-    @classmethod
-    def register_scraper(cls, name: str, scraper_class: type[BaseGeneralScraper]) -> None:
-        """
-        Register a new scraper type.
-
-        Args:
-            name: The name to register the scraper under (e.g., "ZYTE")
-            scraper_class: The scraper class to register
-        """
-        cls.SCRAPER_REGISTRY[name.upper()] = scraper_class
-        logger.info(f"Registered new scraper: {name}")
-
-    @classmethod
-    def get_available_scrapers(cls) -> list[str]:
-        """
-        Get a list of available scraper types.
-
-        Returns:
-            List of registered scraper names
-        """
-        return list(cls.SCRAPER_REGISTRY.keys())
diff --git a/app/services/scrapers/general/zyte.py b/app/services/scrapers/general/zyte.py
deleted file mode 100644
index 1ff00a5..0000000
--- a/app/services/scrapers/general/zyte.py
+++ /dev/null
@@ -1,78 +0,0 @@
-from zyte_api import AsyncZyteAPI
-
-from app.config import ZYTE_API_KEY
-from app.services.scrapers.general.base import BaseGeneralDataProcessor, BaseGeneralScraper
-from app.services.scrapers.scraper import DataProcessor
-from app.utils.logger import logger
-
-
-class ZyteDataProcessor(BaseGeneralDataProcessor):
-    """
-    ZyteDataProcessor: Process URLs using Zyte API to extract content.
-    """
-
-    def __init__(self, url: str):
-        super().__init__(url)
-        self.scraper_type = "zyte"
-
-    async def _get_page_content(self) -> None:
-        if not ZYTE_API_KEY:
-            raise RuntimeError("ZYTE_API_KEY is not configured")
-
-        try:
-            client = AsyncZyteAPI(api_key=ZYTE_API_KEY)
-            result = await client.get(
-                {
-                    "url": self.url,
-                    "browserHtml": True,
-                    "article": True,
-                    "articleOptions": {"extractFrom": "browserHtml"},
-                }
-            )
-            await self._process_zyte_result(result)
-        except Exception as e:
-            logger.error(f"Failed to scrape URL with Zyte: {e}")
-            raise
-
-    async def _process_zyte_result(self, result: dict) -> None:
-        article = result.get("article", {})
-        browser_html = result.get("browserHtml", "")
-
-        # Extract metadata fields from article
-        title = article.get("headline", "") or article.get("name", "")
-
-        # Extract author information
-        authors = article.get("authors", [])
-        author = authors[0].get("name", "") if authors else ""
-
-        description = article.get("description", "") or article.get("articleBodyRaw", "")[:500]
-
-        # Get article body as HTML
-        article_body_html = article.get("articleBodyHtml", "")
-        article_body_raw = article.get("articleBodyRaw", "")
-
-        # Use article body HTML if available, otherwise fall back to browser HTML
-        html_content = article_body_html if article_body_html else browser_html
-        markdown_content = article_body_raw
-
-        # Extract main image
-        main_image = article.get("mainImage", {})
-        og_image = main_image.get("url") if main_image else None
-
-        await self._build_item_data(
-            title=title,
-            author=author,
-            description=description,
-            markdown_content=markdown_content,
-            html_content=html_content,
-            og_image=og_image,
-        )
-
-
-class ZyteScraper(BaseGeneralScraper):
-    """
-    ZyteScraper: Scraper implementation using Zyte API for generic URL scraping.
-    """
-
-    async def get_processor_by_url(self, url: str) -> DataProcessor:
-        return ZyteDataProcessor(url)
diff --git a/app/services/scrapers/instagram/__init__.py b/app/services/scrapers/instagram/__init__.py
deleted file mode 100644
index 30cc7b1..0000000
--- a/app/services/scrapers/instagram/__init__.py
+++ /dev/null
@@ -1,271 +0,0 @@
-# TODO: https://rapidapi.com/arraybobo/api/instagram-scraper-2022
-import re
-from typing import Any, Optional
-from urllib.parse import urlparse
-
-from html import escape
-
-from app.models.metadata_item import MetadataItem, MessageType, MediaFile
-from app.utils.network import get_response
-from app.utils.parse import get_html_text_length
-from app.utils.logger import logger
-from .config import API_HEADERS_LIST, ALL_SCRAPERS
-from app.config import X_RAPIDAPI_KEY
-
-
-class Instagram(MetadataItem):
-    def __init__(self, url: str, data: Optional[Any] = None, **kwargs):
-        self.url = url
-        self.category = "instagram"
-        # auxiliary variables
-        self.urlparser = urlparse(url)
-        self.post_id = re.sub(r".*((/p/)|(/reel/))", "", self.urlparser.path).replace(
-            "/", ""
-        )
-        self.message_type = MessageType.SHORT
-
-    async def get_item(self):
-        await self.get_instagram()
-        return self.to_dict()
-
-    async def get_instagram(self):
-        self._check_instagram_url()
-        await self._get_instagram_info()
-
-    def _check_instagram_url(self):
-        if (
-            self.urlparser.path.find("p") != -1
-            or self.urlparser.path.find("reel") != -1
-        ):
-            self.ins_type = "post"
-        if self.urlparser.path.find("stories") != -1:
-            self.ins_type = "story"
-
-    async def _get_instagram_info(self):
-        ins_functions_dict = {
-            "post": self._get_post_info,
-            "story": self._get_story_info,
-        }
-        ins_info = await ins_functions_dict[self.ins_type]()
-        self._process_ins_info(ins_info)
-
-    async def _get_post_info(self) -> dict:
-        ins_info = {}
-        for scraper in ALL_SCRAPERS:
-            self.scraper = scraper
-            self.host = API_HEADERS_LIST[self.scraper]["host"]
-            self.headers = {
-                "X-RapidAPI-Key": X_RAPIDAPI_KEY,
-                "X-RapidAPI-Host": API_HEADERS_LIST[self.scraper]["top_domain"],
-                "content-type": "application/octet-stream",
-            }
-            params_value = self.url if self.scraper == "looter2" else self.post_id
-            self.params = {API_HEADERS_LIST[self.scraper]["params"]: params_value}
-            response = await get_response(
-                url=self.host, headers=self.headers, params=self.params
-            )
-            if response.status_code != 200:
-                logger.error(
-                    "get_ins_post_item error: %s %s", self.scraper, response.status_code
-                )
-                continue
-            else:
-                ins_data = response.json()
-                logger.debug("get_ins_post_item: %s %s", self.params, ins_data)
-                if type(ins_data) == dict and "graphql" in ins_data:
-                    ins_data = ins_data["graphql"]["shortcode_media"]
-                elif type(ins_data) == dict and "data" in ins_data:
-                    ins_data = ins_data["data"]
-                elif (
-                    type(ins_data) == dict
-                    and "status" in ins_data
-                    and ins_data["status"] is False
-                ):
-                    print("get_ins_post_item error: ", self.scraper)
-                    continue
-                elif type(ins_data) == str and "400" in ins_data:
-                    print("get_ins_post_item error: ", self.scraper, ins_data)
-                    continue
-            if (
-                self.scraper == "looter2"
-                or self.scraper == "ins191"
-                or self.scraper == "ins130"
-            ):
-                ins_info = self._get_ins_post_looter2(ins_data)
-            elif self.scraper == "ins28" or self.scraper == "scraper2" or self.scraper == "api2":
-                ins_info = self._get_ins_post_ins28_scraper2(ins_data)
-            break
-        return ins_info
-
-    def _process_ins_info(self, ins_info: dict):
-        self.__dict__.update(ins_info)
-        self.title = self.author + "'s Instagram post"
-        self.text = escape(self.text)
-        self.text = "<a href='" + self.url + "'>" + self.title + "</a>\n" + self.text
-        if get_html_text_length(self.text) > 500:
-            self.message_type = MessageType.LONG
-
-    @staticmethod
-    def _get_ins_post_looter2(ins_data: dict) -> dict:
-        ins_info = {}
-        ins_text_data = (
-            ins_data["edge_media_to_caption"]["edges"][0]["node"]["text"]
-            if ins_data["edge_media_to_caption"]["edges"]
-            else ""
-        )
-        ins_info["content"] = ""
-        ins_info["text"] = ins_text_data
-        ins_info["author"] = ins_data["owner"]["username"]
-        if ins_data["owner"]["full_name"]:
-            ins_info["author"] += "(" + ins_data["owner"]["full_name"] + ")"
-        ins_info["author_url"] = (
-            "https://www.instagram.com/" + ins_data["owner"]["username"] + "/"
-        )
-        ins_info["media_files"] = []
-        if ins_data["__typename"] == "GraphVideo":
-            ins_info["media_files"].append(
-                MediaFile.from_dict(
-                    {"media_type": "video", "url": ins_data["video_url"], "caption": ""}
-                )
-            ) if ins_data["video_url"] else []
-            ins_info["content"] += (
-                '<video controls src="' + ins_data["video_url"] + '"></video>'
-            )
-        elif ins_data["__typename"] == "GraphImage":
-            ins_info["media_files"].append(
-                MediaFile.from_dict(
-                    {
-                        "media_type": "image",
-                        "url": ins_data["display_url"],
-                        "caption": "",
-                    }
-                )
-            )
-            ins_info["content"] += (
-                '<img src="' + ins_data["display_url"] + '">'
-                if ins_data["display_url"]
-                else ""
-            )
-        elif ins_data["__typename"] == "GraphSidecar":
-            for item in ins_data["edge_sidecar_to_children"]["edges"]:
-                if item["node"]["__typename"] == "GraphVideo":
-                    ins_info["media_files"].append(
-                        MediaFile.from_dict(
-                            {
-                                "media_type": "video",
-                                "url": item["node"]["video_url"],
-                                "caption": "",
-                            }
-                        )
-                    )
-                    ins_info["content"] += (
-                        '<video controls src="'
-                        + item["node"]["video_url"]
-                        + '"></video>'
-                    )
-                elif item["node"]["__typename"] == "GraphImage":
-                    ins_info["media_files"].append(
-                        MediaFile.from_dict(
-                            {
-                                "media_type": "image",
-                                "url": item["node"]["display_url"],
-                                "caption": "",
-                            }
-                        )
-                    )
-                    ins_info["content"] += (
-                        '<img src="' + item["node"]["display_url"] + '">'
-                    )
-        ins_info["content"] += ins_text_data
-        ins_info["status"] = True
-        return ins_info
-
-    @staticmethod
-    def _get_ins_post_ins28_scraper2(ins_data):
-        ins_info = {}
-        ins_text_data = (
-            ins_data["items"][0]["caption"]["text"]
-            if ins_data["items"][0]["caption"]
-            else ""
-        )
-        ins_info["content"] = ""
-        ins_info["text"] = ins_text_data
-        ins_info["author"] = ins_data["items"][0]["user"]["username"]
-        if ins_data["items"][0]["user"]["full_name"]:
-            ins_info["author"] += "(" + ins_data["items"][0]["user"]["full_name"] + ")"
-        ins_info["author_url"] = (
-            "https://www.instagram.com/"
-            + ins_data["items"][0]["user"]["username"]
-            + "/"
-        )
-        ins_info["media_files"] = []
-        if ins_data["items"][0]["media_type"] == 2:
-            ins_info["media_files"].append(
-                MediaFile.from_dict(
-                    {
-                        "media_type": "video",
-                        "url": ins_data["items"][0]["video_versions"][0]["url"],
-                        "caption": "",
-                    }
-                )
-            )
-            ins_info["content"] += (
-                '<video controls src="'
-                + ins_data["items"][0]["video_versions"][0]["url"]
-                + '"></video>'
-            )
-        elif ins_data["items"][0]["media_type"] == 1:
-            ins_info["media_files"].append(
-                MediaFile.from_dict(
-                    {
-                        "media_type": "image",
-                        "url": ins_data["items"][0]["image_versions2"]["candidates"][0][
-                            "url"
-                        ],
-                        "caption": "",
-                    }
-                )
-            )
-            ins_info["content"] += (
-                '<img src="'
-                + ins_data["items"][0]["image_versions2"]["candidates"][0]["url"]
-                + '">'
-            )
-        elif ins_data["items"][0]["media_type"] == 8:
-            for item in ins_data["items"][0]["carousel_media"]:
-                if item["media_type"] == 2:
-                    ins_info["media_files"].append(
-                        MediaFile.from_dict(
-                            {
-                                "media_type": "video",
-                                "url": item["video_versions"][0]["url"],
-                                "caption": "",
-                            }
-                        )
-                    )
-                    ins_info["content"] += (
-                        '<video controls src="'
-                        + item["video_versions"][0]["url"]
-                        + '"></video>'
-                    )
-                elif item["media_type"] == 1:
-                    ins_info["media_files"].append(
-                        MediaFile.from_dict(
-                            {
-                                "media_type": "image",
-                                "url": item["image_versions2"]["candidates"][0]["url"],
-                                "caption": "",
-                            }
-                        )
-                    )
-                    ins_info["content"] += (
-                        '<img src="'
-                        + item["image_versions2"]["candidates"][0]["url"]
-                        + '">'
-                    )
-        ins_info["content"] += ins_text_data
-        ins_info["status"] = True
-        return ins_info
-
-    async def _get_story_info(self):
-        pass
diff --git a/app/services/scrapers/instagram/config.py b/app/services/scrapers/instagram/config.py
deleted file mode 100644
index e8dbdb9..0000000
--- a/app/services/scrapers/instagram/config.py
+++ /dev/null
@@ -1,33 +0,0 @@
-API_HEADERS_LIST = {
-    "looter2": {
-        "host": "https://instagram-looter2.p.rapidapi.com/post",
-        "top_domain": "instagram-looter2.p.rapidapi.com",
-        "params": "url",
-    },
-    "ins28": {
-        "host": "https://instagram28.p.rapidapi.com/media_info_v2",
-        "top_domain": "instagram28.p.rapidapi.com",
-        "params": "short_code",
-    },
-    "scraper2": {
-        "host": "https://instagram-scraper2.p.rapidapi.com/media_info_v2",
-        "top_domain": "instagram-scraper2.p.rapidapi.com",
-        "params": "short_code",
-    },
-    "ins191": {
-        "host": "https://instagram191.p.rapidapi.com/v2/post/details-by-shortcode",
-        "top_domain": "instagram191.p.rapidapi.com",
-        "params": "shortcode",
-    },
-    "ins130": {
-        "host": "https://instagram130.p.rapidapi.com/media-info",
-        "top_domain": "instagram130.p.rapidapi.com",
-        "params": "code",
-    },
-    "api2": {
-        "host": "https://instagram-scraper-api2.p.rapidapi.com/v1/post_info",
-        "top_domain": "instagram-scraper-api2.p.rapidapi.com",
-        "params": "code_or_id_or_url",
-    },
-}
-ALL_SCRAPERS = ["ins28", "scraper2", "looter2", "ins191", "ins130"]
diff --git a/app/services/scrapers/reddit/__init__.py b/app/services/scrapers/reddit/__init__.py
deleted file mode 100644
index 3621c97..0000000
--- a/app/services/scrapers/reddit/__init__.py
+++ /dev/null
@@ -1,124 +0,0 @@
-import re
-from typing import Optional, Any
-
-import asyncpraw
-from bs4 import BeautifulSoup
-
-from app.models.metadata_item import MetadataItem, MessageType, MediaFile
-from app.config import (
-    REDDIT_CLIENT_ID,
-    REDDIT_CLIENT_SECRET,
-    REDDIT_PASSWORD,
-    REDDIT_USERNAME,
-    JINJA2_ENV,
-)
-from app.utils.parse import unix_timestamp_to_utc, get_html_text_length
-from app.utils.network import get_redirect_url
-
-short_text_template = JINJA2_ENV.get_template("reddit_short_text.jinja2")
-content_template = JINJA2_ENV.get_template("reddit_content.jinja2")
-
-
-class Reddit(MetadataItem):
-    def __init__(self, url, data: Optional[Any] = None, **kwargs):
-        self.url = url
-        self.category = "reddit"
-        self.media_files = []
-        self.message_type = MessageType.LONG
-
-    async def get_item(self) -> dict:
-        await self.get_reddit()
-        return self.to_dict()
-
-    async def get_reddit(self) -> None:
-        self.url = await get_redirect_url(self.url)
-        reddit_data = await self._get_reddit_data()
-        await self._process_reddit_data(reddit_data)
-
-    async def _get_reddit_data(self) -> dict:
-        reddit_user_agent = f"testscript by u/{REDDIT_USERNAME}"
-        reddit = asyncpraw.Reddit(
-            client_id=REDDIT_CLIENT_ID,
-            client_secret=REDDIT_CLIENT_SECRET,
-            password=REDDIT_PASSWORD,
-            user_agent=reddit_user_agent,
-            username=REDDIT_USERNAME,
-        )
-        submission = await reddit.submission(url=self.url)
-        return submission.__dict__
-
-    async def _process_reddit_data(self, reddit_data) -> None:
-        self.url = "https://www.reddit.com" + reddit_data["permalink"]
-        self.title = reddit_data["title"]
-        self.author = reddit_data["author"].name
-        self.author_url = f"https://www.reddit.com/user/{self.author}"
-        self.raw_content = reddit_data["selftext_html"] or ""
-        self.created = unix_timestamp_to_utc(int(reddit_data["created_utc"]))
-        self.score = reddit_data["score"]
-        self.comments_count = reddit_data["num_comments"]
-        self.upvote_ratio = reddit_data["upvote_ratio"]
-        self.subreddit = reddit_data["subreddit"].display_name
-        self.subreddit_name_prefixed = reddit_data["subreddit_name_prefixed"]
-        self.subreddit_url = (
-            f"https://www.reddit.com/{reddit_data['subreddit_name_prefixed']}"
-        )
-        content_html = self.raw_content
-        if "media_metadata" in reddit_data:
-            for media_item in reddit_data["media_metadata"].values():
-                if media_item["e"] == "Image":
-                    media_type = "image"
-                    media_url = media_item["s"]["u"]
-                elif media_item["e"] == "AnimatedImage":
-                    media_type = "video"
-                    media_url = media_item["s"]["gif"]
-                elif media_item["e"] == "Video":
-                    media_type = "video"
-                    media_url = media_item["s"]["gif"]
-                else:
-                    continue
-                self.media_files.append(
-                    MediaFile(
-                        media_type=media_type,
-                        url=media_url,
-                        caption="",
-                    )
-                )
-        if reddit_data.get("post_hint", "") == "image":
-            preview_url = reddit_data["preview"]["images"][0]["source"]["url"]
-            self.media_files.append(
-                MediaFile(
-                    media_type="image",
-                    url=preview_url,
-                    caption="",
-                )
-            )
-            preview_image_html_tag = f"<img src='{preview_url}'>"
-            content_html += preview_image_html_tag
-        self.raw_content = re.sub(r"<!--.*?-->", "", self.raw_content, flags=re.DOTALL)
-        soup = BeautifulSoup(self.raw_content, "html.parser")
-        # resolve content
-        for p in soup.find_all("p"):
-            if p.text == "&#x200B;" or p.text == "\n\n":
-                p.decompose()
-        for a in soup.find_all("a"):
-            if a.text == "[removed]":
-                a.decompose()
-            if a.get("href", "").find("preview.redd.it") != -1:
-                img = soup.new_tag("img")
-                img["src"] = a["href"]
-                a.append(f"<p>{a.text}</p>")
-                a.replace_with(img)
-        self.content = str(soup)
-        # resolve short text
-        for tag in soup.find_all(["p", "span", "div"]):
-            # add '\n' after the tag and then unwrap it
-            tag.append("\n")
-            tag.unwrap()
-        for tag in soup.find_all(["strong"]):
-            tag.replace_with(f"<b>{tag.text}</b>")
-        self.text = str(soup)
-        data = self.__dict__
-        self.content = content_template.render(data=data)
-        self.text = short_text_template.render(data=data)
-        if get_html_text_length(self.text) < 800:
-            self.message_type = MessageType.SHORT
diff --git a/app/services/scrapers/scraper.py b/app/services/scrapers/scraper.py
deleted file mode 100644
index b314462..0000000
--- a/app/services/scrapers/scraper.py
+++ /dev/null
@@ -1,19 +0,0 @@
-from abc import abstractmethod
-
-
-class Scraper:
-
-    @abstractmethod
-    async def get_processor_by_url(self, url) -> object:
-        pass
-
-
-class DataProcessor:
-
-    @abstractmethod
-    async def get_item(self) -> dict:
-        pass
-
-    @abstractmethod
-    async def process_data(self) -> None:
-        pass
diff --git a/app/services/scrapers/scraper_manager.py b/app/services/scrapers/scraper_manager.py
deleted file mode 100644
index 0a010e5..0000000
--- a/app/services/scrapers/scraper_manager.py
+++ /dev/null
@@ -1,62 +0,0 @@
-from typing import Optional
-
-from app.utils.logger import logger
-from app.services.scrapers.bluesky.scraper import BlueskyScraper
-from app.services.scrapers.weibo.scraper import WeiboScraper
-from app.services.scrapers.general.scraper import GeneralScraper
-from app.config import (
-    BLUESKY_USERNAME, BLUESKY_PASSWORD
-)
-
-
-class ScraperManager:
-
-    bluesky_scraper: Optional[BlueskyScraper] = None
-    weibo_scraper: Optional[WeiboScraper] = None
-    general_scraper: Optional[GeneralScraper] = None
-
-    scrapers = {"bluesky": bluesky_scraper,
-                "weibo": weibo_scraper,
-                "other": general_scraper,
-                "unknown": general_scraper}
-
-    @classmethod
-    async def init_scrapers(cls):
-        await cls.init_bluesky_scraper()
-
-    @classmethod
-    async def init_scraper(cls, category: str) -> None:
-        if category in cls.scrapers.keys():
-            scraper = None
-            if category == "bluesky" and not cls.bluesky_scraper:
-                scraper = await cls.init_bluesky_scraper()
-            elif category == "weibo" and not cls.weibo_scraper:
-                scraper = await cls.init_weibo_scraper()
-            elif category in ["other", "unknown"] and not cls.general_scraper:
-                scraper = await cls.init_general_scraper()
-            if scraper:
-                cls.scrapers[category] = scraper
-                # general_scraper serves both "other" and "unknown" — keep both keys in sync
-                if category in ["other", "unknown"]:
-                    cls.scrapers["other"] = scraper
-                    cls.scrapers["unknown"] = scraper
-        else:
-            logger.error(f"Scraper {category} is not supported")
-            raise ValueError(f"Scraper {category} is not supported")
-
-    @classmethod
-    async def init_bluesky_scraper(cls) -> BlueskyScraper:
-        cls.bluesky_scraper = BlueskyScraper(username=BLUESKY_USERNAME, password=BLUESKY_PASSWORD)
-        await cls.bluesky_scraper.init()
-        return cls.bluesky_scraper
-
-    @classmethod
-    async def init_weibo_scraper(cls) -> WeiboScraper:
-        cls.weibo_scraper = WeiboScraper()
-        return cls.weibo_scraper
-
-    @classmethod
-    async def init_general_scraper(cls) -> GeneralScraper:
-        cls.general_scraper = GeneralScraper()
-        return cls.general_scraper
-
diff --git a/app/services/scrapers/threads/__init__.py b/app/services/scrapers/threads/__init__.py
deleted file mode 100644
index e1d4195..0000000
--- a/app/services/scrapers/threads/__init__.py
+++ /dev/null
@@ -1,191 +0,0 @@
-import json
-from typing import Dict, Any, Optional
-from urllib.parse import urlparse, unquote
-
-import jmespath
-from playwright.async_api import async_playwright
-
-from app.utils.logger import logger
-from app.utils.parse import get_html_text_length, unix_timestamp_to_utc, wrap_text_into_html
-from app.models.metadata_item import MetadataItem, MediaFile, MessageType
-
-SHORT_LIMIT = 600
-
-
-class Threads(MetadataItem):
-    def __init__(self, url: str, data: Optional[Any] = None, **kwargs):
-        # metadata fields
-        self.url = url
-        self.title = ""
-        self.author = ""
-        self.author_url = ""
-        self.text = ""
-        self.content = ""
-        self.media_files = []
-        self.category = "threads"
-        self.message_type = MessageType.SHORT
-        # auxiliary fields
-        self.text_group = ""
-        self.content_group = ""
-        self.code = urlparse(url).path.split("/")[2]
-        self.pics_url = []
-        self.videos_url = []
-
-    async def get_item(self) -> dict:
-        await self.get_threads()
-        return self.to_dict()
-
-    async def get_threads(self) -> None:
-        thread_data = await self.scrape_thread_data(self.url)
-        self.process_threads_item(thread_data)
-        logger.debug(thread_data)
-
-    @staticmethod
-    def parse_single_threads_data(data: Dict) -> Dict:
-        """The code is referenced from https://scrapfly.io/blog/how-to-scrape-threads/"""
-        """Parse Threads post JSON dataset for the most important fields"""
-        result = jmespath.search(
-            """{
-            text: caption.text,
-            published_on: taken_at,
-            id: id,
-            pk: pk,
-            code: code,
-            username: user.username,
-            user_pic: user.profile_pic_url,
-            user_verified: user.is_verified,
-            user_pk: user.pk,
-            user_id: user.id,
-            has_audio: has_audio,
-            reply_count: text_post_app_info.direct_reply_count,
-            like_count: like_count,
-            media_files: carousel_media[]
-            images: carousel_media[].image_versions2.candidates[1].url,
-            image: image_versions2.candidates[1].url,
-            video: video_versions[1].url,
-            media_count: carousel_media_count,
-            quoted_post: text_post_app_info.share_info.quoted_post,
-            link: text_post_app_info.link_preview_attachment
-        }""",
-            data,
-        )
-        return result
-
-    async def scrape_thread_data(self, url: str) -> dict:
-        """The code is referenced from https://scrapfly.io/blog/how-to-scrape-threads/"""
-        """Scrape Threads post and replies from a given URL"""
-        _xhr_calls = []
-
-        async def intercept_response(response):
-            """capture all background requests and save them"""
-            if response.request.resource_type == "xhr":
-                _xhr_calls.append(response)
-            return response
-
-        async with async_playwright() as pw:
-            browser = await pw.chromium.launch()
-            context = await browser.new_context(viewport={"width": 1920, "height": 1080})
-            page = await context.new_page()
-            page.on("response", intercept_response)  # enable background request intercepting
-            await page.goto(url)  # go to url and wait for the page to load
-            await page.wait_for_selector("[data-pressable-container=true]")  # wait for page to finish loading
-            # find all thread related background requests:
-            gql_calls = [f for f in _xhr_calls if "/api/graphql" in f.url]
-            thread_data = {
-                "threads": [],
-            }
-            for xhr in gql_calls:
-                text = await xhr.text()
-                data = json.loads(text)
-                print(json.dumps(data, indent=4, ensure_ascii=False))
-                threads = data["data"]["data"]["containing_thread"]["thread_items"]
-                for thread in threads:
-                    thread_data["threads"].append(self.parse_single_threads_data(thread["post"]))
-            return thread_data
-
-    def process_threads_item(self, thread_data: Dict) -> None:
-        for thread in thread_data["threads"]:
-            self.process_single_threads(thread)
-        self.text += self.text_group
-        self.content += self.content_group
-        self.message_type = MessageType.LONG if get_html_text_length(self.text) > SHORT_LIMIT else MessageType.SHORT
-
-    def process_single_threads(self, thread: Dict) -> None:
-        if thread["code"] == self.code:  # if the thread is the authoral post
-            self.title = thread["username"] + "'s Threads"
-            self.author = thread["username"]
-            self.author_url = f"https://threads.net/@{thread['username']}"
-            created_at = unix_timestamp_to_utc(thread["published_on"])
-            reply_count = thread["reply_count"]
-            like_count = thread["like_count"]
-            self.content += f"<p>Created at: {created_at} "
-            self.content += f" Reply count: {reply_count} "
-            self.content += f" Like count: {like_count}</p>"
-        thread_info = self.parse_single_threads(thread)
-        self.text_group += thread_info["text_group"]
-        self.content_group += thread_info["content_group"]
-        self.pics_url += thread_info["pics_url"]
-        self.videos_url += thread_info["videos_url"]
-        self.media_files += thread_info["media_files"]
-
-    @staticmethod
-    def parse_single_threads(thread: Dict) -> Dict:
-        thread_info = {
-            "pics_url": [],
-            "videos_url": [],
-            "media_files": [],
-            "text_group": "",
-            "content_group": "",
-        }
-        # make html components, and solve the pictures and videos
-        user_component = f"<a href='https://threads.net/@{thread['username']}'>@{thread['username']}</a>:"
-        thread_info["content_group"] += wrap_text_into_html(user_component + thread["text"])
-        thread_info["text_group"] += user_component + thread["text"] + "\n"
-        if not thread["media_count"]:  # if the thread doesn't have multiple media files
-            if thread["video"]:  # if the threads has only one video/gif
-                thread_info["videos_url"].append(thread["video"])
-                thread_info["media_files"].append(MediaFile(media_type="video", url=thread["video"], caption=""))
-                thread_info["content_group"] += f"<video controls=\"controls\" src=\"{thread['video']}\">"
-            elif thread["image"]:  # if the threads has only one picture
-                thread_info["pics_url"].append(thread["image"])
-                thread_info["media_files"].append(MediaFile(media_type="image", url=thread["image"], caption=""))
-                thread_info["content_group"] += f"<img src=\"{thread['image']}\">"
-        else:  # if the threads has more than one media files
-            for media in thread["media_files"]:
-                if len(media["video_versions"]) > 0:  # if the media is a video/gif
-                    thread_info["videos_url"].append(media["video_versions"][0]["url"])
-                    thread_info["media_files"].append(
-                        MediaFile(
-                            media_type="video",
-                            url=media["video_versions"][0]["url"],
-                            caption="",
-                        )
-                    )
-                    thread_info[
-                        "content_group"
-                    ] += f"<video controls=\"controls\" src=\"{media['video_versions'][0]['url']}\">"
-                else:  # if the media is a picture
-                    thread_info["pics_url"].append(media["image_versions2"]["candidates"][0]["url"])
-                    thread_info["media_files"].append(
-                        MediaFile(
-                            media_type="image",
-                            url=media["image_versions2"]["candidates"][0]["url"],
-                            caption="",
-                        )
-                    )
-                    thread_info["content_group"] += f"<img src=\"{media['image_versions2']['candidates'][0]['url']}\">"
-        thread_info["content_group"] += "<hr>"
-        if thread["link"]:  # process the link item in the threads
-            link_title = thread["link"]["title"]
-            link_url = unquote(urlparse(thread["link"]["url"]).query).split("=")[1].split("&")[0]
-            thread_info["text_group"] += f"<a href='{link_url}'>{link_title}</a>\n"
-            thread_info["content_group"] += f"<p><a href='{link_url}'>{link_title}</a></p><br>"
-        if thread["quoted_post"] is not None:  # solve possible retweeted threads
-            retweeted_thread = Threads.parse_single_threads_data(thread["quoted_post"])
-            retweeted_thread_info = Threads.parse_single_threads(retweeted_thread)
-            thread_info = {
-                key: (thread_info[key] + retweeted_thread_info[key])
-                for key in thread_info.keys()
-                if key in retweeted_thread_info
-            }
-        return thread_info
diff --git a/app/services/scrapers/twitter/__init__.py b/app/services/scrapers/twitter/__init__.py
deleted file mode 100644
index 6183f1c..0000000
--- a/app/services/scrapers/twitter/__init__.py
+++ /dev/null
@@ -1,381 +0,0 @@
-# TODO: https://rapidapi.com/Glavier/api/twitter135
-import asyncio
-import traceback
-from urllib.parse import urlparse
-from typing import Dict, List, Optional, Any, Tuple
-
-import httpx
-import jmespath
-
-from app.models.metadata_item import MetadataItem, MediaFile, MessageType
-from app.utils.parse import get_html_text_length, wrap_text_into_html
-from twitter.scraper import Scraper
-from .config import (
-    ALL_SCRAPER,
-    ALL_SINGLE_SCRAPER,
-    X_RAPIDAPI_HOST,
-    SCRAPER_INFO,
-    SHORT_LIMIT,
-)
-from app.config import X_RAPIDAPI_KEY, TWITTER_COOKIES, DEBUG_MODE
-from app.utils.logger import logger
-
-
-class Twitter(MetadataItem):
-    def __init__(
-            self,
-            url: str,
-            data: Optional[Any] = None,
-            scraper: Optional[str] = "Twitter135",
-            instruction: Optional[str] = "threads",
-            **kwargs,
-    ):
-        # metadata fields
-        self.url = url
-        self.title = ""
-        self.author = ""
-        self.author_url = ""
-        self.text = ""
-        self.content = ""
-        self.media_files: list[MediaFile] = []
-        self.category = "twitter"
-        self.message_type = MessageType.SHORT
-        # auxiliary fields
-        self.tid = urlparse(url).path.split("/")[-1]
-        self.text_group = ""
-        self.content_group = ""
-        self.date = ""
-        # reqeust fields
-        self.instruction = instruction
-        self.scraper = scraper
-        self.host = ""
-        self.headers = {}
-        self.params = {}
-        self.include_comments: bool = kwargs.get("include_comments", False)
-        self.article_tweet: bool = False
-
-    async def get_item(self) -> dict:
-        await self.get_twitter()
-        return self.to_dict()
-
-    async def get_twitter(self) -> None:
-        tweet_data = await self._get_response_tweet_data()
-        self._process_tweet(tweet_data)
-
-    async def _get_response_tweet_data(self) -> Dict:
-        scrapers = ALL_SCRAPER if self.instruction == "threads" else ALL_SINGLE_SCRAPER
-        for scraper in scrapers:
-            self.scraper = scraper
-            try:
-                if self.scraper.startswith("Twitter"):
-                    tweet_data = await self._rapidapi_get_response_tweet_data()
-                    return tweet_data
-                elif self.scraper == "api-client":
-                    tweet_data = await self._api_client_get_response_tweet_data()
-                    return tweet_data
-            except Exception as e:
-                logger.error(e)
-                traceback.print_exc()
-                continue
-        raise Exception("No valid response from all Twitter scrapers")
-
-    async def _rapidapi_get_response_tweet_data(self) -> Dict:
-        async with httpx.AsyncClient() as client:
-            self._get_request_headers()
-            response = await client.get(
-                url=self.host, headers=self.headers, params=self.params
-            )
-            if response.status_code == 200:
-                tweet_data = response.json()
-                if (
-                        type(tweet_data) == dict
-                        and ("errors" in tweet_data or "detail" in tweet_data)
-                ) or (
-                        type(tweet_data) == str
-                        and ("400" in tweet_data or "429" in tweet_data)
-                ):
-                    raise Exception("Invalid response from Twitter API")
-                else:
-                    return tweet_data
-            else:
-                raise Exception("Invalid response from Twitter API")
-
-    async def _api_client_get_response_tweet_data(self) -> Dict:
-        scraper = Scraper(
-            save=False,
-            pbar=False,
-            debug=0,
-            cookies=TWITTER_COOKIES
-        )
-        tweet_data = await asyncio.to_thread(scraper.tweets_details, [int(self.tid)], limit=1)
-        logger.debug(tweet_data)
-        return tweet_data[0]
-
-    def _process_tweet(self, tweet_data: Dict):
-        # if self.scraper == "api-client":
-        #     self.process_twitter_api_client(tweet_data)
-        if self.scraper in ["api-client", "Twitter135"]:
-            self._process_tweet_twitter135(tweet_data)
-        elif self.scraper in ["Twitter154", "twitter-v24"]:
-            self._process_tweet_Twitter154(tweet_data)
-
-    def _process_tweet_twitter135(self, tweet_data: Dict):
-        tweet_data_instructions = tweet_data["data"]["threaded_conversation_with_injections_v2"][
-            "instructions"
-        ]
-        entries_instruction = next(
-            (instr for instr in tweet_data_instructions if 'entries' in instr),
-            None
-        )
-        entries = entries_instruction['entries']
-        tweets = []
-        for entry in entries:
-            content = entry["content"]
-            entry_type = content.get("entryType", "")
-
-            if entry_type == "TimelineTimelineItem":
-                item_content = content.get("itemContent", {})
-                if item_content.get("itemType") == "TimelineTweet":
-                    result = item_content.get("tweet_results", {}).get("result")
-                    if result:
-                        tweets.append(result)
-
-            elif entry_type == "TimelineTimelineModule" and self.include_comments:
-                for module_item in content.get("items", []):
-                    item_content = module_item.get("item", {}).get("itemContent", {})
-                    if item_content.get("itemType") == "TimelineTweet":
-                        result = item_content.get("tweet_results", {}).get("result")
-                        if result:
-                            tweets.append(result)
-        for tweet in tweets:
-            if tweet["__typename"] == "TweetWithVisibilityResults":
-                tweet = tweet["tweet"]
-            parsed_tweet_data = self.parse_tweet_data_Twitter135(tweet)
-            self.process_single_tweet_Twitter135(parsed_tweet_data)
-        self.text += self.text_group
-        self.text = self.text[:-1]
-        self.content += self.content_group
-        self.message_type = (
-            MessageType.LONG if (get_html_text_length(self.text) > SHORT_LIMIT or self.article_tweet) else MessageType.SHORT
-        )
-
-    def process_single_tweet_Twitter135(self, tweet: Dict, retweeted=False) -> None:
-        if tweet.get("tid") == self.tid:
-            if tweet.get("article") and tweet["article"].get("title"):
-                self.title = tweet["article"]["title"]
-                self.article_tweet = True
-            else:
-                self.title = f"{tweet['name']}'s Tweet"
-            self.author = tweet["name"]
-            self.author_url = f"https://twitter.com/{tweet['username']}"
-            self.date = tweet["date"]
-        tweet_info = self.parse_single_tweet_Twitter135(tweet, retweeted=retweeted)
-        self.text_group += tweet_info["text_group"]
-        self.content_group += tweet_info["content_group"]
-        self.media_files += tweet_info["media_files"]
-        if tweet["quoted_tweet"]:
-            retweeted_tweet_info = self.parse_tweet_data_Twitter135(
-                tweet["quoted_tweet"]
-            )
-            self.process_single_tweet_Twitter135(retweeted_tweet_info, retweeted=True)
-        if tweet.get("tid") == self.tid:
-            self.content_group = self.content_group.replace("<hr>", "", 1)
-
-    @staticmethod
-    def parse_single_tweet_Twitter135(tweet: Dict, retweeted=False) -> Dict:
-        tweet_info = {
-            "media_files": [],
-            "text_group": "",
-            "content_group": "<hr>" if not retweeted else "<p>Quoted:</p>",
-        }
-        user_component = f"<a href='https://twitter.com/{tweet['username']}/status/{tweet['tid']}'>@{tweet['name']}</a>"
-
-        if tweet.get("article"):
-            article = tweet["article"]
-            article_title = article.get("title", "")
-            display_text = article_title if article_title else (
-                tweet["full_text"] if tweet.get("full_text") else tweet["text"]
-            )
-            tweet_info["content_group"] += wrap_text_into_html(f"{user_component}: {display_text}")
-            tweet_info["text_group"] += f"{user_component}: {display_text}\n"
-            article_html, article_media = Twitter.parse_article_content(article)
-            tweet_info["content_group"] += article_html
-            tweet_info["media_files"] += article_media
-        else:
-            text = tweet["full_text"] if tweet.get("full_text") else tweet["text"]
-            tweet_info["content_group"] += wrap_text_into_html(f"{user_component}: {text}")
-            tweet_info["text_group"] += f"{user_component}: {text}\n"
-
-        if tweet["media"]:
-            for media in tweet["media"]:
-                if media["type"] == "photo":
-                    photo_url = media["media_url_https"] + "?name=orig"
-                    tweet_info[
-                        "content_group"
-                    ] += f"<img src='{photo_url}'/>"
-                    tweet_info["media_files"].append(
-                        MediaFile(
-                            media_type="image",
-                            url=photo_url,
-                            caption="",
-                        )
-                    )
-                elif media["type"] == "video" or media["type"] == "animated_gif":
-                    highest_bitrate_item = max(
-                        media["video_info"]["variants"],
-                        key=lambda x: x.get("bitrate", 0),
-                    )
-                    tweet_info[
-                        "content_group"
-                    ] += f'<video controls="controls" src="{highest_bitrate_item["url"]}"></video>'
-                    tweet_info["media_files"].append(
-                        MediaFile(
-                            media_type="video",
-                            url=highest_bitrate_item["url"],
-                            caption="",
-                        )
-                    )
-        tweet_info["content_group"] = tweet_info["content_group"].replace("\n", "<br>")
-        return tweet_info
-
-    @staticmethod
-    def parse_tweet_data_Twitter135(data: Dict) -> Dict:
-        result = jmespath.search(
-            """{
-            tid: rest_id,
-            name: core.user_results.result.core.name || core.user_results.result.legacy.name,
-            username: core.user_results.result.core.screen_name || core.user_results.result.legacy.screen_name,
-            date: legacy.created_at,
-            full_text: note_tweet.note_tweet_results.result.text,
-            text: legacy.full_text,
-            media: legacy.extended_entities.media,
-            quoted_tweet: quoted_status_result.result,
-            article: article.article_results.result
-            }""",
-            data,
-        )
-        return result
-
-    def _process_tweet_Twitter154(self, tweet_data: Dict):
-        pass
-
-    @staticmethod
-    def parse_article_content(article: Dict) -> Tuple[str, List[MediaFile]]:
-        content_state = article.get("content_state", {})
-        blocks = content_state.get("blocks", [])
-        entity_map_list = content_state.get("entityMap", [])
-
-        entity_lookup = {}
-        for entry in entity_map_list:
-            entity_lookup[str(entry["key"])] = entry["value"]
-
-        html_parts = []
-        media_files = []
-
-        for block in blocks:
-            block_type = block.get("type", "unstyled")
-            text = block.get("text", "")
-            inline_style_ranges = block.get("inlineStyleRanges", [])
-            entity_ranges = block.get("entityRanges", [])
-
-            if block_type == "atomic":
-                for er in entity_ranges:
-                    entity = entity_lookup.get(str(er["key"]))
-                    if entity and entity.get("type") == "MEDIA":
-                        for media_item in entity.get("data", {}).get("mediaItems", []):
-                            media_id = media_item.get("mediaId", "")
-                            media_url = _find_article_media_url(article, media_id)
-                            if media_url:
-                                html_parts.append(f"<img src='{media_url}'/>")
-                                media_files.append(MediaFile(
-                                    media_type="image",
-                                    url=media_url,
-                                    caption="",
-                                ))
-                continue
-
-            styled_text = _apply_inline_formatting(
-                text, inline_style_ranges, entity_ranges, entity_lookup
-            )
-
-            if block_type == "header-two":
-                html_parts.append(f"<h2>{styled_text}</h2>")
-            else:
-                html_parts.append(f"<p>{styled_text}</p>")
-
-        return "".join(html_parts), media_files
-
-    def _get_request_headers(self):
-        self.host = SCRAPER_INFO[self.scraper]["host"]
-        self.headers = {
-            "X-RapidAPI-Key": X_RAPIDAPI_KEY,
-            "X-RapidAPI-Host": SCRAPER_INFO[self.scraper]["top_domain"]
-                               + X_RAPIDAPI_HOST,
-            "content-type": "application/octet-stream",
-        }
-        self.params = {
-            SCRAPER_INFO[self.scraper]["params"]: self.tid,
-        }
-
-
-def _find_article_media_url(article: Dict, media_id: str) -> str:
-    for entity in article.get("media_entities", []):
-        if str(entity.get("media_id")) == str(media_id):
-            media_info = entity.get("media_info", {})
-            url = media_info.get("original_img_url", "")
-            return url
-    return ""
-
-
-def _apply_inline_formatting(
-        text: str,
-        style_ranges: List[Dict],
-        entity_ranges: List[Dict],
-        entity_lookup: Dict,
-) -> str:
-    if not text or (not style_ranges and not entity_ranges):
-        return text
-
-    n = len(text)
-    bold = [False] * n
-    italic = [False] * n
-    link_url = [None] * n
-
-    for sr in style_ranges:
-        start = sr["offset"]
-        end = start + sr["length"]
-        for i in range(start, min(end, n)):
-            if sr["style"] == "Bold":
-                bold[i] = True
-            elif sr["style"] == "Italic":
-                italic[i] = True
-
-    for er in entity_ranges:
-        entity = entity_lookup.get(str(er["key"]))
-        if entity and entity.get("type") == "LINK":
-            url = entity.get("data", {}).get("url", "")
-            start = er["offset"]
-            end = start + er["length"]
-            for i in range(start, min(end, n)):
-                link_url[i] = url
-
-    result = []
-    i = 0
-    while i < n:
-        cur_bold = bold[i]
-        cur_italic = italic[i]
-        cur_link = link_url[i]
-        j = i
-        while j < n and bold[j] == cur_bold and italic[j] == cur_italic and link_url[j] == cur_link:
-            j += 1
-        segment = text[i:j]
-        if cur_bold:
-            segment = f"<b>{segment}</b>"
-        if cur_italic:
-            segment = f"<i>{segment}</i>"
-        if cur_link:
-            segment = f"<a href='{cur_link}'>{segment}</a>"
-        result.append(segment)
-        i = j
-
-    return "".join(result)
diff --git a/app/services/scrapers/twitter/config.py b/app/services/scrapers/twitter/config.py
deleted file mode 100644
index 15b5278..0000000
--- a/app/services/scrapers/twitter/config.py
+++ /dev/null
@@ -1,31 +0,0 @@
-"""
-scaper infos
-"""
-
-ALL_SCRAPER = ["api-client", "Twitter135"]
-# ALL_SCRAPER = ["Twitter135", "Twitter154", "twitter-v24"]
-ALL_SINGLE_SCRAPER = ["Twitter154", "twitter-v24", "Twitter135", "api-client"]
-SCRAPER_INFO = {
-    "Twitter135": {
-        "host": "https://twitter135.p.rapidapi.com/v2/TweetDetail/",
-        "top_domain": "twitter135",
-        "params": "id",
-    },
-    "Twitter154": {
-        "host": "https://twitter154.p.rapidapi.com/tweet/details/",
-        "top_domain": "twitter154",
-        "params": "tweet_id",
-    },
-    "twitter-v24": {
-        "host": "https://twitter-v24.p.rapidapi.com/tweet/details",
-        "top_domain": "twitter-v24",
-        "params": "tweet_id",
-    },
-}
-X_RAPIDAPI_HOST = ".p.rapidapi.com"
-
-"""
-twitter constants
-"""
-
-SHORT_LIMIT = 600
diff --git a/app/services/scrapers/wechat/__init__.py b/app/services/scrapers/wechat/__init__.py
deleted file mode 100644
index 80ab0d2..0000000
--- a/app/services/scrapers/wechat/__init__.py
+++ /dev/null
@@ -1,102 +0,0 @@
-from typing import Dict, Any, Optional
-
-from lxml import etree
-from bs4 import BeautifulSoup, NavigableString
-
-from app.models.metadata_item import MetadataItem, MediaFile, MessageType
-from app.utils.logger import logger
-from app.utils.network import get_selector, HEADERS
-
-
-class Wechat(MetadataItem):
-    def __init__(self, url: str, data: Optional[Any] = None, **kwargs):
-        self.url = url
-        self.title = ""
-        self.author = ""
-        self.author_url = self.url
-        self.text = ""
-        self.content = ""
-        self.media_files: list[MediaFile] = []
-        self.category = "wechat"
-        self.message_type = MessageType.LONG
-        # auxiliary fields
-        self.sid = ""
-        self.official_account = ""
-        self.date = ""
-
-    async def get_item(self) -> dict:
-        await self.get_wechat()
-        return self.to_dict()
-
-    async def get_wechat(self) -> None:
-        wechat_data = await self._get_response_wechat_data()
-        self._process_wechat(wechat_data)
-        pass
-
-    async def _get_response_wechat_data(self) -> Dict:
-        wechat_data = await get_selector(self.url, headers=HEADERS)
-        wechat_data = self._wechat_data_parse(wechat_data)
-        return wechat_data
-
-    @staticmethod
-    def _wechat_data_parse(wechat_data: etree.HTML) -> Dict:
-        article = wechat_data.xpath('//div[@id="js_article"]')[0]
-        meta_data = {
-            "title": article.xpath('string(//h1[@id="activity-name"])'),
-            "author": article.xpath('string(//a[@id="js_name"])'),
-            "content": str(
-                etree.tostring(
-                    article.xpath('//div[@id="js_content"]')[0], encoding="utf-8"
-                ),
-                encoding="utf-8",
-            ),
-        }
-        for k, v in meta_data.items():
-            new_string = v.replace("\n", "")
-            meta_data[k] = new_string.strip()
-        return meta_data
-
-    def _process_wechat(self, wechat_data: Dict) -> None:
-        self.title = wechat_data["title"]
-        self.author = wechat_data["author"]
-        self.author_url = ""
-        soup = BeautifulSoup(wechat_data["content"], "lxml")
-        for img_item in soup.find_all("img"):
-            if img_item.get("class") and all(
-                    elem in img_item.get("class") for elem in ["rich_pages", "wxw-img"]
-            ):
-                img_url = img_item["data-src"]
-                img_item["src"] = img_url
-                img_item["data-src"] = img_url
-                self.media_files.append(MediaFile(url=img_url, media_type="image"))
-        for section_tag in soup.find_all("section"):
-            # if no p tag in section tag, then we consider that all text tags are span tags. We divide paragraphs by
-            # <br/><br/> tags pair, unwrap all other tags, and wrap them with <p> tags.
-            if not section_tag.find_all("section"):
-                new_p_tag = soup.new_tag("p")
-                contents = section_tag.contents[:]
-                for content in contents:
-                    content.extract()
-                for content in contents:
-                    if (
-                            content.name == "br"
-                            and content.next_sibling
-                            and content.next_sibling.name == "br"
-                    ):
-                        content.decompose()
-                        content.next_sibling.decompose()
-                        if new_p_tag.contents:
-                            section_tag.append(new_p_tag)
-                            new_p_tag = soup.new_tag("p")
-                    elif content.name == "p":
-                        if new_p_tag.contents:
-                            section_tag.append(new_p_tag)
-                            new_p_tag = soup.new_tag("p")
-                        section_tag.append(content)
-                    else:
-                        new_p_tag.append(content)
-                if new_p_tag.contents:
-                    section_tag.append(new_p_tag)
-        self.raw_content = str(soup)
-        self.content = self.raw_content
-        self.text = soup.get_text()
diff --git a/app/services/scrapers/weibo/__init__.py b/app/services/scrapers/weibo/__init__.py
deleted file mode 100644
index 5b4fcd9..0000000
--- a/app/services/scrapers/weibo/__init__.py
+++ /dev/null
@@ -1,55 +0,0 @@
-import json
-from dataclasses import dataclass
-from typing import Optional, Any
-from urllib.parse import urlparse
-
-import httpx
-import jmespath
-from bs4 import BeautifulSoup
-from lxml import html
-
-from app.models.metadata_item import MetadataItem, MediaFile, MessageType
-from app.utils.network import get_response_json, get_random_user_agent
-from app.utils.parse import get_html_text_length, wrap_text_into_html
-from .config import (
-    AJAX_HOST,
-    AJAX_LONGTEXT_HOST,
-    WEIBO_WEB_HOST,
-    WEIBO_HOST,
-    WEIBO_TEXT_LIMIT,
-)
-from app.config import JINJA2_ENV, WEIBO_COOKIES
-from app.utils.logger import logger
-
-short_text_template = JINJA2_ENV.get_template("weibo_short_text.jinja2")
-content_template = JINJA2_ENV.get_template("weibo_content.jinja2")
-
-
-@dataclass
-class Weibo(MetadataItem):
-    id: str = ""
-
-    @staticmethod
-    def from_dict(obj: Any) -> "Weibo":
-        weibo_item = MetadataItem.from_dict(obj)
-        weibo_item.id = obj.get("id")
-        return Weibo(
-            url=weibo_item.url,
-            title=weibo_item.title,
-            author=weibo_item.author,
-            author_url=weibo_item.author_url,
-            telegraph_url=weibo_item.telegraph_url,
-            text=weibo_item.text,
-            content=weibo_item.content,
-            media_files=weibo_item.media_files,
-            category=weibo_item.category,
-            message_type=weibo_item.message_type,
-            id=weibo_item.id,
-        )
-
-    def to_dict(self) -> dict:
-        result: dict = super().to_dict()
-        result["id"] = self.id
-        return result
-
-
diff --git a/app/services/scrapers/weibo/config.py b/app/services/scrapers/weibo/config.py
deleted file mode 100644
index bf21d7f..0000000
--- a/app/services/scrapers/weibo/config.py
+++ /dev/null
@@ -1,5 +0,0 @@
-AJAX_HOST = "https://weibo.com/ajax/statuses/show?id="
-AJAX_LONGTEXT_HOST = "https://weibo.com/ajax/statuses/longtext?id="
-WEIBO_WEB_HOST = "https://m.weibo.cn/status/"
-WEIBO_HOST = "https://weibo.com"
-WEIBO_TEXT_LIMIT = 700
diff --git a/app/services/scrapers/weibo/scraper.py b/app/services/scrapers/weibo/scraper.py
deleted file mode 100644
index 9aa0a67..0000000
--- a/app/services/scrapers/weibo/scraper.py
+++ /dev/null
@@ -1,501 +0,0 @@
-import json
-from typing import Optional, Any, Union
-from urllib.parse import urlparse
-
-import httpx
-import jmespath
-from bs4 import BeautifulSoup
-from lxml import html
-
-from app.models.metadata_item import MetadataItem, MediaFile, MessageType
-from app.services.scrapers.scraper import Scraper, DataProcessor
-from app.services.scrapers.weibo import Weibo
-from app.utils.network import get_response_json, get_random_user_agent
-from app.utils.parse import get_html_text_length, wrap_text_into_html
-from .config import (
-    AJAX_HOST,
-    AJAX_LONGTEXT_HOST,
-    WEIBO_WEB_HOST,
-    WEIBO_HOST,
-    WEIBO_TEXT_LIMIT,
-)
-from app.config import JINJA2_ENV, WEIBO_COOKIES
-from app.utils.logger import logger
-
-short_text_template = JINJA2_ENV.get_template("weibo_short_text.jinja2")
-content_template = JINJA2_ENV.get_template("weibo_content.jinja2")
-
-
-class WeiboDataProcessor(DataProcessor):
-
-    def __init__(
-            self,
-            url: str,
-            method: str = "webpage",
-            user_agent: dict = None,
-            cookies: str = WEIBO_COOKIES
-    ):
-        if not user_agent:
-            user_agent = get_random_user_agent()
-        self.url: str = url
-        self._data: dict = {}
-        self.url = url
-        self.method = method
-        self.text = ""
-        self.headers = {"User-Agent": user_agent, "Cookie": cookies if cookies else ""}
-        self.url_parser = urlparse(url)
-        self.id = self.url_parser.path.split("/")[-1]
-        self.ajax_url = AJAX_HOST + self.id
-        self.ajax_longtext_url = AJAX_LONGTEXT_HOST + self.id
-
-    async def get_item(self) -> dict:
-        await self.process_data()
-        weibo_item = Weibo.from_dict(self._data)
-        return weibo_item.to_dict()
-
-    async def process_data(self) -> None:
-        await self._get_weibo()
-
-    async def _get_weibo(self) -> None:
-        try:
-            weibo_info = await self._get_weibo_info()
-        except ConnectionError as e:
-            self.method = "webpage"
-            weibo_info = await self._get_weibo_info()
-            logger.error(f"Failed to get weibo info by api: {e}")
-            # TODO: a better exception handling
-        try:
-            await self._process_weibo_item(weibo_info)
-        except Exception as e:
-            logger.error(f"Failed to process weibo item: {e}")
-
-    async def _get_weibo_info(self, method=None) -> dict:
-        try:
-            if not method:
-                method = self.method
-            if method == "webpage":
-                weibo_info = await self._get_weibo_info_webpage()
-            elif method == "api":
-                weibo_info = await self._get_weibo_info_api()
-            else:
-                raise ValueError("method must be webpage or api")
-            weibo_info = self._parse_weibo_info(weibo_info)
-            return weibo_info
-        except ConnectionError as e:
-            raise ConnectionError(f"There are some network issues: {e}")
-
-    async def _get_weibo_info_webpage(self) -> dict:
-        url = WEIBO_WEB_HOST + self.id
-        async with httpx.AsyncClient() as client:
-            response = await client.get(url, headers=self.headers)
-            if response.status_code == 302:  # redirect
-                new_url = response.headers["Location"]
-                response = await client.get(new_url, headers=self.headers)
-        html_string = response.text
-        html_string = html_string[html_string.find('"status":'):]
-        html_string = html_string[: html_string.rfind('"hotScheme"')]
-        html_string = html_string[: html_string.rfind(",")]
-        html_string = html_string[: html_string.rfind("][0] || {};")]
-        html_string = "{" + html_string
-        try:
-            js = json.loads(html_string, strict=False)
-            print(js)
-            weibo_info = js.get("status")
-        except Exception as e:
-            logger.error(f"Failed to get weibo info by webpage scraping: {e}")
-            weibo_info = {}
-        return weibo_info
-
-    async def _get_weibo_info_api(self) -> dict:
-        try:
-            ajax_json = await get_response_json(self.ajax_url, headers=self.headers)
-            logger.debug(f"weibo ajax_json info by api: {ajax_json}")
-            if not ajax_json or ajax_json["ok"] == 0:
-                raise ConnectionError(f"Failed to get weibo info by api")
-            return ajax_json
-        except Exception as e:
-            raise ConnectionError(f"Failed to get weibo info by api: {e}")
-
-    async def _get_long_weibo_info_api(self) -> dict:
-        ajax_json = await get_response_json(
-            self.ajax_longtext_url, headers=self.headers
-        )
-        logger.debug(f"weibo ajax_json info by api: {ajax_json}")
-        return ajax_json
-
-    async def _process_weibo_item(self, weibo_info: dict) -> None:
-        # self.id = str(weibo_info.get("id"))
-        # get user info
-        weibo_item_data = {
-            "category": "weibo",
-            "url": self.url,
-            "user_id": weibo_info.get("user_id"),
-            "author": weibo_info.get("author"),
-            "author_url": weibo_info.get("author_url"),
-            "title": weibo_info.get("author") + "的微博",
-            "date": weibo_info.get("created", None),
-            "source": weibo_info.get("source", None),
-            "region_name": weibo_info.get("region_name", None),
-            "attitudes_count": self._string_to_int(weibo_info.get("attitudes_count", 0)),
-            "comments_count": self._string_to_int(weibo_info.get("comments_count", 0)),
-            "reposts_count": self._string_to_int(weibo_info.get("reposts_count", 0)),
-        }
-        # resolve text
-        # check if the weibo is longtext weibo (which means >140 characters so has an excerpt) or not
-        text = weibo_info.get("text", "")
-        if (
-                weibo_info["is_long_text"]
-                or text.endswith('<span class="expand">展开</span>')
-                or text.endswith("展开")
-                or not text
-        ):
-            # if a weibo has more than 9 pictures, the isLongText will be True even if it is not a longtext weibo
-            # however, we cannot get the full text of such kind of weibo from longtext api (it will return None)
-            # so, it is necessary to check if a weibo is a real longtext weibo or not for getting the full text
-            try:
-                longtext_info = await self._get_weibo_info(method="webpage")
-                # if longtext_info.get("is_long_text"):
-                #     raise Exception("Still a long text weibo, should go long text api.")
-                text = longtext_info.get("text")
-                if not text:
-                    raise Exception(
-                        "Failed to get longtext of weibo by webpage scraping."
-                    )
-            except Exception as e:
-                logger.error(f"Failed to get longtext of weibo by webpage scraping.{e}")
-                try:
-                    longtext_info = await self._get_long_weibo_info_api()
-                    longtext_info = longtext_info.get("data", {})
-                    text = longtext_info.get("longTextContent")
-                except Exception as e:
-                    logger.error(f"Failed to get longtext of weibo by api.{e}")
-            # The two methods can both fail in some cases. So, we need to check if the text is None or not.
-        else:
-            # TODO: to add a branch to get the fulltext without using the webpage scraping. This branch needs cookies.
-            pass
-        cleaned_text, fw_pics = WeiboDataProcessor._weibo_html_text_clean(text)
-        media_files = []
-        for pic in fw_pics:
-            media_files.append(MediaFile(url=pic, media_type="image"))
-        text = cleaned_text.replace("<br />", "<br>").replace("br/", "br")
-        raw_content = text.replace("<br/><br/>", "<br>")
-        # resolve medias
-        extra_medias = self._get_media_files(weibo_info)
-        if extra_medias:
-            media_files += extra_medias
-        # render the text and content
-        weibo_item_data["raw_content"] = raw_content
-        text = short_text_template.render(data=weibo_item_data).replace("<br />", "\n").replace("<br>", "\n")
-        text = text[:-1] if text.endswith("\n") else text
-        weibo_item_data["text"] = text
-        for i in media_files:
-            if i.media_type == "video":
-                raw_content += f'<video src="{i.url}" controls="controls"></video>'
-            elif i.media_type == "image":
-                raw_content += f'<img src="{i.url}">'
-        content = content_template.render(data=weibo_item_data)
-        content = wrap_text_into_html(
-            wrap_text_into_html(content, is_html=True), is_html=False
-        )
-        weibo_item_data["media_files"] = media_files
-        weibo_item_data["content"] = content
-        # resolve retweet
-        if weibo_info.get("retweeted_status"):
-            retweeted_weibo_id = (
-                    weibo_info["retweeted_status"].get("id")
-                    or weibo_info["retweeted_status"].get("mid")
-                    or weibo_info["retweeted_status"].get("idstr")
-            )
-            retweeted_weibo_item = WeiboDataProcessor(url=WEIBO_WEB_HOST + retweeted_weibo_id)
-            retweeted_info = await retweeted_weibo_item.get_item()
-            weibo_item_data["text"] += retweeted_info["text"]
-            weibo_item_data["content"] += "<hr>" + retweeted_info["content"]
-            weibo_item_data["media_files"] += retweeted_info["media_files"]
-        # type check
-        weibo_item_data["message_type"] = (
-            MessageType.LONG
-            if get_html_text_length(weibo_item_data["text"]) > WEIBO_TEXT_LIMIT
-            else MessageType.SHORT
-        )
-        media_file_dict = [i.to_dict() for i in media_files]
-        weibo_item_data["media_files"] = media_file_dict
-        self._data = weibo_item_data
-
-
-    @staticmethod
-    def _parse_weibo_info(data: dict) -> dict:
-        expression = f"""{{
-            "id": id,
-            "author": user.screen_name,
-            "author_url": user.profile_url,
-            "user_id": user.id,
-            "created": created_at,
-            "source": source,
-            "region_name": region_name,
-            "text": text,
-            "text_raw": text_raw,
-            "text_length": textLength,
-            "is_long_text": isLongText,
-            "pic_num": pic_num,
-            "pic_video": pic_video,
-            "pic_infos": pic_infos,
-            "page_info": page_info,
-            "pics": pics,
-            "mix_media_info": mix_media_info,
-            "url_struct": url_struct,
-            "attitudes_count": attitudes_count,
-            "comments_count": comments_count,
-            "reposts_count": reposts_count,
-            "retweeted_status": retweeted_status
-        }}"""
-        weibo_info = jmespath.search(expression, data)
-        return weibo_info
-
-    def _get_media_files(self, weibo_info: dict) -> list:
-        """
-        The function is used to get all media files (pictures, videos, live photos) from a weibo item
-        The design of weibo media files is very complicated and confusing. It can be divided from the following aspects:
-        1. pic_infos: the media files of a weibo item are stored in pic_infos. This key only appears when the weibo item
-        has only pictures. However, live photos, which is actually "videos", are also stored in pic_infos. So, we need
-        to check the type and add it into the media files list.
-        2. page_info: the media files of a weibo item are stored in page_info. This key only appears when the weibo item
-        has only one video.
-        3. mix_media_info: the media files of a weibo item are stored in mix_media_info. This key only appears when the
-        weibo item has both pictures and videos.
-        We separate the media files scraping process into three parts according to the above aspects. For keeping the
-        order of the media files, we use a list to store the media files.
-        :param weibo_info:
-        :return: media_files: a list of media files
-        """
-        media_files = []
-        media_files += self._get_pictures(weibo_info)
-        media_files += self._get_videos(weibo_info)
-        media_files += self._get_mix_media(weibo_info)
-        return media_files
-
-    @staticmethod
-    def _get_pictures(weibo_info: dict) -> list:
-        media_files = []
-        if weibo_info.get("pics"):
-            pic_info = weibo_info["pics"]
-            if pic_info:
-                for pic in pic_info:
-                    media_files.append(
-                        MediaFile(
-                            url=pic["large"]["url"], media_type="image", caption=""
-                        )
-                    )
-                    if pic.get("type") in ["gifvideos", "livephoto"]:
-                        media_files.append(
-                            MediaFile(
-                                url=pic["videoSrc"], media_type="video", caption=""
-                            )
-                        )
-        elif "pic_infos" in weibo_info and weibo_info.get("pic_num") > 0:
-            pic_info = weibo_info["pic_infos"]
-            if pic_info:
-                for pic in pic_info:
-                    if pic_info[pic].get("type") == "pic":
-                        media_files.append(
-                            MediaFile(
-                                url=pic_info[pic]["original"]["url"],
-                                media_type="image",
-                                caption="",
-                            )
-                        ) if pic_info[pic]["original"] else media_files.append(
-                            MediaFile(
-                                url=pic_info[pic]["large"]["url"],
-                                media_type="image",
-                                caption="",
-                            )
-                        )
-                    elif pic_info[pic].get("type") in ["live_photo", "livephoto"]:
-                        media_files.append(
-                            MediaFile(
-                                url=pic_info[pic]["original"]["url"], media_type="image"
-                            )
-                        ) if pic_info[pic]["original"] else media_files.append(
-                            MediaFile(pic_info[pic]["large"]["url"])
-                        )
-                        live_pic_url = pic_info[pic]["video"]["url"]
-                        if not (live_pic_url[-4] == "." and live_pic_url[-3:] != "mp4"):
-                            media_files.append(
-                                MediaFile(
-                                    url=pic_info[pic]["video"], media_type="video"
-                                )
-                            )
-                    elif pic_info[pic].get("type") == "gif":
-                        media_files.append(
-                            MediaFile(url=pic_info[pic]["video"], media_type="video")
-                        )
-        else:
-            return media_files
-        return media_files
-
-    @staticmethod
-    def _get_videos(weibo_info: dict) -> list:
-        media_files, video_url_list = [], []
-        if weibo_info.get("page_info"):
-            if (
-                    weibo_info["page_info"].get("urls")
-                    or weibo_info["page_info"].get("media_info")
-            ) and (
-                    weibo_info["page_info"].get("type") == "video"
-                    or weibo_info["page_info"].get("object_type") == "video"
-            ):
-                media_info = (
-                    weibo_info["page_info"]["urls"]
-                    if weibo_info["page_info"].get("urls")
-                    else ""
-                )
-                if not media_info:
-                    media_info = weibo_info["page_info"]["media_info"]
-                video_url_keys = [
-                    "mp4_720p_mp4",
-                    "mp4_hd_url",
-                    "hevc_mp4_hd",
-                    "mp4_sd_url",
-                    "mp4_ld_mp4",
-                    "stream_url_hd",
-                    "stream_url",
-                ]
-                for key in video_url_keys:
-                    video_url = media_info.get(key)
-                    if video_url:
-                        break
-                video_url_list.append(video_url)
-        for url in video_url_list:
-            media_files.append(MediaFile(url=url, media_type="video"))
-        return media_files
-
-    @staticmethod
-    def _get_mix_media(weibo_info: dict) -> list:
-        media_files = []
-        if weibo_info.get("mix_media_info"):
-            for item in weibo_info["mix_media_info"]["items"]:
-                if item.get("type") == "pic":
-                    media_files.append(
-                        MediaFile(
-                            url=item["data"]["original"]["url"], media_type="image"
-                        )
-                    ) if item["data"]["original"] else media_files.append(
-                        MediaFile(url=item["data"]["large"]["url"], media_type="image")
-                    )
-                elif item.get("type") in ["live_photo", "livephoto"]:
-                    media_files.append(
-                        MediaFile(
-                            url=item["data"]["original"]["url"], media_type="image"
-                        )
-                    ) if item["data"]["original"] else media_files.append(
-                        MediaFile(url=item["data"]["large"]["url"], media_type="image")
-                    )
-                    media_files.append(
-                        MediaFile(url=item["data"]["video"]["url"], media_type="video")
-                    )
-                elif item.get("type") == "gif":
-                    media_files.append(
-                        MediaFile(url=item["data"]["video"]["url"], media_type="video")
-                    )
-                elif item.get("type") == "video":
-                    video_url = item.get("stream_url_hd")
-                    video_keys = [
-                        "mp4_720p_mp4",
-                        "mp4_hd_url",
-                        "hevc_mp4_hd",
-                        "mp4_sd_url",
-                        "mp4_ld_mp4",
-                        "stream_url_hd",
-                        "stream_url",
-                    ]
-                    for key in video_keys:
-                        video_url = item["data"]["media_info"].get(key)
-                        if video_url:
-                            break
-                    media_files.append(MediaFile(url=video_url, media_type="video"))
-        return media_files
-
-    @staticmethod
-    def _string_to_int(string: Union[str | int]) -> int:
-        """
-        Convert Chinese numeric string to int
-        :param string: str
-        :return: int: int value of the string
-        """
-        if isinstance(string, int):
-            return string
-        elif string.endswith("万+"):
-            string = string[:-2] + "0000"
-        elif string.endswith("万"):
-            string = float(string[:-1]) * 10000
-        elif string.endswith("亿"):
-            string = float(string[:-1]) * 100000000
-        return int(string)
-
-    @staticmethod
-    def _get_live_photo(weibo_info: dict) -> list:
-        live_photo_list = []
-        live_photo = weibo_info.get("pic_video")
-        if live_photo:
-            prefix = "https://video.weibo.com/media/play?livephoto=//us.sinaimg.cn/"
-            for i in live_photo.split(","):
-                if len(i.split(":")) == 2:
-                    url = prefix + i.split(":")[1] + ".mov"
-                    live_photo_list.append(url)
-            return live_photo_list
-
-    @staticmethod
-    def _weibo_html_text_clean(text, method="bs4"):
-        if method == "bs4":
-            return WeiboDataProcessor._weibo_html_text_clean_bs4(text)
-        elif method == "lxml":
-            return WeiboDataProcessor._weibo_html_text_clean_lxml(text)
-        else:
-            raise ValueError("method must be bs4 or lxml")
-
-    @staticmethod
-    def _weibo_html_text_clean_bs4(text):
-        fw_pics = []
-        soup = BeautifulSoup(text, "html.parser")
-        for img in soup.find_all("img"):
-            alt_text = img.get("alt", "")
-            img.replace_with(alt_text)
-        for image in soup.find_all("image"):
-            if image.get("src") == "https://h5.sinaimg.cn/upload/2015/09/25/3/timeline_card_small_web_default.png":
-                image.replace_with("")
-        for a in soup.find_all("a"):
-            if a.text == "查看图片":
-                fw_pics.append(a.attrs.get("href"))
-            if "/n/" in a.get("href") and a.get("usercard"):
-                a["href"] = "https://weibo.com" + a.attrs.get("href")
-        for i in soup.find_all("span"):
-            i.unwrap()
-        res = (
-            str(soup)
-            .replace('href="//', 'href="http://')
-            .replace('href="/n/', 'href="http://weibo.com/n/')
-        )
-        return res, fw_pics
-
-    @staticmethod
-    def _weibo_html_text_clean_lxml(text):
-        selector = html.fromstring(text)
-        # remove all img tags and replace with alt text
-        for img in selector.xpath("//img"):
-            alt_text = img.get("alt", "")
-            # get innerhtml pure text of the parent tag
-            parent_text = img.getparent().text_content() if img.getparent() else ""
-            replace_text = alt_text + parent_text
-            text_node = html.fromstring(replace_text)
-            img.addprevious(text_node)
-            img.getparent().remove(img)
-            # make text_node become pure text
-            text_node.text = text_node.text_content()
-        # return the html document after cleaning
-        return html.tostring(selector, encoding="unicode")
-
-
-class WeiboScraper(Scraper):
-    weibo_cookies = WEIBO_COOKIES
-
-    async def get_processor_by_url(self, url) -> DataProcessor:
-        return WeiboDataProcessor(url, cookies=self.weibo_cookies)
diff --git a/app/services/scrapers/weibo/testcase b/app/services/scrapers/weibo/testcase
deleted file mode 100644
index 7a8e13b..0000000
--- a/app/services/scrapers/weibo/testcase
+++ /dev/null
@@ -1,4 +0,0 @@
-single video with tags: https://m.weibo.cn/status/4884946584077604
-weibo with emoji tag: https://m.weibo.cn/status/MCAqGFsQL
-weibo with multiple videos: https://m.weibo.cn/status/MBY95pZ2g
-forwarding weibo with image link: https://m.weibo.cn/status/MCAOYhYM3
diff --git a/app/services/scrapers/xiaohongshu/__init__.py b/app/services/scrapers/xiaohongshu/__init__.py
deleted file mode 100644
index 55507b7..0000000
--- a/app/services/scrapers/xiaohongshu/__init__.py
+++ /dev/null
@@ -1,153 +0,0 @@
-import asyncio
-from typing import Any
-from urllib.parse import urlparse
-
-import httpx
-import jmespath
-
-from app.models.metadata_item import MetadataItem, MediaFile, MessageType
-from app.utils.network import HEADERS
-from app.config import JINJA2_ENV, HTTP_REQUEST_TIMEOUT
-from .xhs.core import XiaoHongShuCrawler
-from .xhs.client import XHSClient
-from .xhs import proxy_account_pool
-
-from app.utils.logger import logger
-from app.utils.parse import (
-    unix_timestamp_to_utc,
-    get_html_text_length,
-    wrap_text_into_html,
-)
-
-environment = JINJA2_ENV
-short_text_template = environment.get_template("xiaohongshu_short_text.jinja2")
-content_template = environment.get_template("xiaohongshu_content.jinja2")
-
-
-class Xiaohongshu(MetadataItem):
-    def __init__(self, url: str, data: Any, **kwargs):
-        self.url = url
-        self.id = None
-        self.media_files = []
-        self.category = "xiaohongshu"
-        self.message_type = MessageType.SHORT
-        # auxiliary fields
-        self.ip_location = None
-        self.share_count = None
-        self.comment_count = None
-        self.collected_count = None
-        self.like_count = None
-        self.updated = None
-        self.created = None
-        self.raw_content = None
-
-    async def get_item(self) -> dict:
-        await self.get_xiaohongshu()
-        return self.to_dict()
-
-    async def get_xiaohongshu(self) -> None:
-        if self.url.find("xiaohongshu.com") == -1:
-            async with httpx.AsyncClient() as client:
-                resp = await client.get(
-                    self.url,
-                    headers=HEADERS,
-                    follow_redirects=True,
-                    timeout=HTTP_REQUEST_TIMEOUT,
-                )
-                if (
-                    resp.history
-                ):  # if there is a redirect, the request will have a response chain
-                    for h in resp.history:
-                        print(h.status_code, h.url)
-                    self.url = str(resp.url)
-        urlparser = urlparse(self.url)
-        self.id = urlparser.path.split("/")[-1]
-        crawler = XiaoHongShuCrawler()
-        account_pool = proxy_account_pool.create_account_pool()
-        crawler.init_config("xhs", "cookie", account_pool)
-        note_detail = None
-        for _ in range(5):
-            try:
-                note_detail = await crawler.start(id=self.id)
-                break
-            except Exception as e:
-                await asyncio.sleep(3)
-                logger.error(f"error: {e}")
-                logger.error(f"retrying...")
-        if not note_detail:
-            raise Exception("重试了这么多次还是无法签名成功，寄寄寄")
-        # logger.debug(f"json_data: {json.dumps(note_detail, ensure_ascii=False, indent=4)}")
-        parsed_data = self.process_note_json(note_detail)
-        await self.process_xiaohongshu_note(parsed_data)
-
-    async def process_xiaohongshu_note(self, json_data: dict):
-        self.title = json_data.get("title")
-        self.author = json_data.get("author")
-        if not self.title and self.author:
-            self.title = f"{self.author}的小红书笔记"
-        self.author_url = "https://www.xiaohongshu.com/user/profile/" + json_data.get(
-            "user_id"
-        )
-        self.raw_content = json_data.get("raw_content")
-        logger.debug(f"{json_data.get('created')}")
-        self.created = (
-            unix_timestamp_to_utc(json_data.get("created") / 1000)
-            if json_data.get("created")
-            else None
-        )
-        self.updated = (
-            unix_timestamp_to_utc(json_data.get("updated") / 1000)
-            if json_data.get("updated")
-            else None
-        )
-        self.like_count = json_data.get("like_count")
-        self.collected_count = json_data.get("collected_count")
-        self.comment_count = json_data.get("comment_count")
-        self.share_count = json_data.get("share_count")
-        self.ip_location = json_data.get("ip_location")
-        if json_data.get("image_list"):
-            for image_url in json_data.get("image_list"):
-                self.media_files.append(MediaFile(url=image_url, media_type="image"))
-        if json_data.get("video"):
-            self.media_files.append(
-                MediaFile(url=json_data.get("video"), media_type="video")
-            )
-        data = self.__dict__
-        data["raw_content"] = data["raw_content"].replace("\t", "")
-        if data["raw_content"].endswith("\n"):
-            data["raw_content"] = data["raw_content"][:-1]
-        self.text = short_text_template.render(data=data)
-        if get_html_text_length(self.text) > 500:
-            self.message_type = MessageType.LONG
-        data["raw_content"] = wrap_text_into_html(self.raw_content)
-        for media_file in self.media_files:
-            if media_file.media_type == "image":
-                data["raw_content"] += f'<p><img src="{media_file.url}" alt=""/></p>'
-            elif media_file.media_type == "video":
-                data[
-                    "raw_content"
-                ] += (
-                    f'<p><video src="{media_file.url}" controls="controls"></video></p>'
-                )
-        self.content = content_template.render(data=data)
-
-    @staticmethod
-    def process_note_json(json_data: dict):
-        expression = """
-        {
-        title: title,
-        raw_content: desc,
-        author: user.nickname,
-        user_id: user.user_id,
-        image_list: image_list[*].url,
-        video: video.media.stream.h264[0].master_url,
-        like_count: interact_info.liked_count,
-        collected_count: interact_info.collected_count,
-        comment_count: interact_info.comment_count,
-        share_count: interact_info.share_count,
-        ip_location: ip_location,
-        created: time,
-        updated: last_update_time
-        }
-        """
-        return jmespath.search(expression, json_data)
diff --git a/app/services/scrapers/xiaohongshu/xhs/__init__.py b/app/services/scrapers/xiaohongshu/xhs/__init__.py
deleted file mode 100644
index 947f034..0000000
--- a/app/services/scrapers/xiaohongshu/xhs/__init__.py
+++ /dev/null
@@ -1,2 +0,0 @@
-from .core import XiaoHongShuCrawler
-from .field import *
diff --git a/app/services/scrapers/xiaohongshu/xhs/base_crawler.py b/app/services/scrapers/xiaohongshu/xhs/base_crawler.py
deleted file mode 100644
index d00b38a..0000000
--- a/app/services/scrapers/xiaohongshu/xhs/base_crawler.py
+++ /dev/null
@@ -1,35 +0,0 @@
-from abc import ABC, abstractmethod
-
-from .proxy_account_pool import AccountPool
-
-
-class AbstractCrawler(ABC):
-    @abstractmethod
-    def init_config(self, platform: str, login_type: str, account_pool: AccountPool):
-        pass
-
-    @abstractmethod
-    async def start(self):
-        pass
-
-    @abstractmethod
-    async def search(self):
-        pass
-
-
-class AbstractLogin(ABC):
-    @abstractmethod
-    async def begin(self):
-        pass
-
-    @abstractmethod
-    async def login_by_qrcode(self):
-        pass
-
-    @abstractmethod
-    async def login_by_mobile(self):
-        pass
-
-    @abstractmethod
-    async def login_by_cookies(self):
-        pass
diff --git a/app/services/scrapers/xiaohongshu/xhs/client.py b/app/services/scrapers/xiaohongshu/xhs/client.py
deleted file mode 100644
index b83074d..0000000
--- a/app/services/scrapers/xiaohongshu/xhs/client.py
+++ /dev/null
@@ -1,217 +0,0 @@
-import asyncio
-import json
-from typing import Dict
-
-import httpx
-from playwright.async_api import BrowserContext, Page
-
-from app.utils.logger import logger
-from .exception import DataFetchError, IPBlockError
-from .field import SearchNoteType, SearchSortType
-from .help import get_search_id, sign
-from . import utils
-
-
-class XHSClient:
-    def __init__(
-        self,
-        timeout=10,
-        proxies=None,
-        *,
-        headers: Dict[str, str],
-        playwright_page: Page,
-        cookie_dict: Dict[str, str],
-    ):
-        self.proxies = proxies
-        self.timeout = timeout
-        self.headers = headers
-        self._host = "https://edith.xiaohongshu.com"
-        self.IP_ERROR_STR = "网络连接异常，请检查网络设置或重启试试"
-        self.IP_ERROR_CODE = 300012
-        self.NOTE_ABNORMAL_STR = "笔记状态异常，请稍后查看"
-        self.NOTE_ABNORMAL_CODE = -510001
-        self.playwright_page = playwright_page
-        self.cookie_dict = cookie_dict
-
-    async def _pre_headers(self, url: str, data=None):
-        encrypt_params = await self.playwright_page.evaluate(
-            "([url, data]) => window._webmsxyw(url,data)", [url, data]
-        )
-        local_storage = await self.playwright_page.evaluate("() => window.localStorage")
-        signs = sign(
-            a1=self.cookie_dict.get("a1", ""),
-            b1=local_storage.get("b1", ""),
-            x_s=encrypt_params.get("X-s", ""),
-            x_t=str(encrypt_params.get("X-t", "")),
-        )
-
-        headers = {
-            "X-S": signs["x-s"],
-            "X-T": signs["x-t"],
-            "x-S-Common": signs["x-s-common"],
-            "X-B3-Traceid": signs["x-b3-traceid"],
-        }
-        self.headers.update(headers)
-        return self.headers
-
-    async def request(self, method, url, **kwargs) -> Dict:
-        async with httpx.AsyncClient(proxies=self.proxies) as client:
-            response = await client.request(method, url, timeout=self.timeout, **kwargs)
-        data: Dict = response.json()
-        if data["success"]:
-            return data.get("data", data.get("success", {}))
-        elif data["code"] == self.IP_ERROR_CODE:
-            raise IPBlockError(self.IP_ERROR_STR)
-        else:
-            raise DataFetchError(data.get("msg", None))
-
-    async def get(self, uri: str, params=None) -> Dict:
-        final_uri = uri
-        if isinstance(params, dict):
-            final_uri = f"{uri}?" f"{'&'.join([f'{k}={v}' for k, v in params.items()])}"
-        headers = await self._pre_headers(final_uri)
-        return await self.request(
-            method="GET", url=f"{self._host}{final_uri}", headers=headers
-        )
-
-    async def post(self, uri: str, data: dict) -> Dict:
-        headers = await self._pre_headers(uri, data)
-        json_str = json.dumps(data, separators=(",", ":"), ensure_ascii=False)
-        return await self.request(
-            method="POST", url=f"{self._host}{uri}", data=json_str, headers=headers
-        )
-
-    async def ping(self) -> bool:
-        """get a note to check if login state is ok"""
-        logger.info("Begin to ping xhs...")
-        ping_flag = False
-        try:
-            note_card: Dict = await self.get_note_by_keyword(keyword="小红书")
-            if note_card.get("items"):
-                ping_flag = True
-        except Exception as e:
-            logger.error(f"Ping xhs failed: {e}, and try to login again...")
-            ping_flag = False
-        return ping_flag
-
-    async def update_cookies(self, browser_context: BrowserContext):
-        cookie_str, cookie_dict = utils.convert_cookies(await browser_context.cookies())
-        self.headers["Cookie"] = cookie_str
-        self.cookie_dict = cookie_dict
-
-    async def get_note_by_keyword(
-        self,
-        keyword: str,
-        page: int = 1,
-        page_size: int = 20,
-        sort: SearchSortType = SearchSortType.GENERAL,
-        note_type: SearchNoteType = SearchNoteType.ALL,
-    ) -> Dict:
-        """search note by keyword
-
-        :param keyword: what notes you want to search
-        :param page: page number, defaults to 1
-        :param page_size: page size, defaults to 20
-        :param sort: sort ordering, defaults to SearchSortType.GENERAL
-        :param note_type: note type, defaults to SearchNoteType.ALL
-        :return: {has_more: true, items: []}
-        """
-        uri = "/api/sns/web/v1/search/notes"
-        data = {
-            "keyword": keyword,
-            "page": page,
-            "page_size": page_size,
-            "search_id": get_search_id(),
-            "sort": sort.value,
-            "note_type": note_type.value,
-        }
-        return await self.post(uri, data)
-
-    async def get_note_by_id(self, note_id: str) -> Dict:
-        """
-        :param note_id: note_id you want to fetch
-        :return: {"time":1679019883000,"user":{"nickname":"nickname","avatar":"avatar","user_id":"user_id"},"image_list":[{"url":"https://sns-img-qc.xhscdn.com/c8e505ca-4e5f-44be-fe1c-ca0205a38bad","trace_id":"1000g00826s57r6cfu0005ossb1e9gk8c65d0c80","file_id":"c8e505ca-4e5f-44be-fe1c-ca0205a38bad","height":1920,"width":1440}],"tag_list":[{"id":"5be78cdfdb601f000100d0bc","name":"jk","type":"topic"}],"desc":"裙裙","interact_info":{"followed":false,"liked":false,"liked_count":"1732","collected":false,"collected_count":"453","comment_count":"30","share_count":"41"},"at_user_list":[],"last_update_time":1679019884000,"note_id":"6413cf6b00000000270115b5","type":"normal","title":"title"}
-        """
-        data = {"source_note_id": note_id}
-        uri = "/api/sns/web/v1/feed"
-        res = await self.post(uri, data)
-        res_dict: Dict = res["items"][0]["note_card"]
-        return res_dict
-
-    async def get_note_comments(self, note_id: str, cursor: str = "") -> Dict:
-        """get note comments
-        :param note_id: note id you want to fetch
-        :param cursor: last you get cursor, defaults to ""
-        :return: {"has_more": true,"cursor": "6422442d000000000700dcdb",comments: [],"user_id": "63273a77000000002303cc9b","time": 1681566542930}
-        """
-        uri = "/api/sns/web/v2/comment/page"
-        params = {"note_id": note_id, "cursor": cursor}
-        return await self.get(uri, params)
-
-    async def get_note_sub_comments(
-        self, note_id: str, root_comment_id: str, num: int = 30, cursor: str = ""
-    ):
-        """
-        get note sub comments
-        :param note_id: note id you want to fetch
-        :param root_comment_id: parent comment id
-        :param num: recommend 30, if num greater 30, it only return 30 comments
-        :param cursor: last you get cursor, defaults to ""
-        :return: {"has_more": true,"cursor": "6422442d000000000700dcdb",comments: [],"user_id": "63273a77000000002303cc9b","time": 1681566542930}
-        """
-        uri = "/api/sns/web/v2/comment/sub/page"
-        params = {
-            "note_id": note_id,
-            "root_comment_id": root_comment_id,
-            "num": num,
-            "cursor": cursor,
-        }
-        return await self.get(uri, params)
-
-    async def get_note_all_comments(
-        self, note_id: str, crawl_interval: float = 1.0, is_fetch_sub_comments=False
-    ):
-        """
-        get note all comments include sub comments
-        :param note_id:
-        :param crawl_interval:
-        :param is_fetch_sub_comments:
-        :return:
-        """
-
-        result = []
-        comments_has_more = True
-        comments_cursor = ""
-        while comments_has_more:
-            comments_res = await self.get_note_comments(note_id, comments_cursor)
-            comments_has_more = comments_res.get("has_more", False)
-            comments_cursor = comments_res.get("cursor", "")
-            comments = comments_res["comments"]
-            if not is_fetch_sub_comments:
-                result.extend(comments)
-                continue
-            # handle get sub comments
-            for comment in comments:
-                result.append(comment)
-                cur_sub_comment_count = int(comment["sub_comment_count"])
-                cur_sub_comments = comment["sub_comments"]
-                result.extend(cur_sub_comments)
-                sub_comments_has_more = (
-                    comment["sub_comment_has_more"]
-                    and len(cur_sub_comments) < cur_sub_comment_count
-                )
-                sub_comment_cursor = comment["sub_comment_cursor"]
-                while sub_comments_has_more:
-                    page_num = 30
-                    sub_comments_res = await self.get_note_sub_comments(
-                        note_id, comment["id"], num=page_num, cursor=sub_comment_cursor
-                    )
-                    sub_comments = sub_comments_res["comments"]
-                    sub_comments_has_more = (
-                        sub_comments_res["has_more"] and len(sub_comments) == page_num
-                    )
-                    sub_comment_cursor = sub_comments_res["cursor"]
-                    result.extend(sub_comments)
-                    await asyncio.sleep(crawl_interval)
-            await asyncio.sleep(crawl_interval)
-        return result
diff --git a/app/services/scrapers/xiaohongshu/xhs/core.py b/app/services/scrapers/xiaohongshu/xhs/core.py
deleted file mode 100644
index 00f0a54..0000000
--- a/app/services/scrapers/xiaohongshu/xhs/core.py
+++ /dev/null
@@ -1,225 +0,0 @@
-import asyncio
-import random
-from asyncio import Task
-from typing import Dict, List, Optional, Tuple
-
-from playwright.async_api import BrowserContext, BrowserType, Page, async_playwright
-
-from .base_crawler import AbstractCrawler
-from .proxy_account_pool import AccountPool
-
-# import xiaohongshu as xhs_model
-from app.utils.logger import logger
-from app import config
-
-# from var import request_keyword_var
-from .client import XHSClient
-from .exception import DataFetchError
-from .login import XHSLogin
-from . import utils
-
-
-class XiaoHongShuCrawler(AbstractCrawler):
-    platform: str
-    login_type: str
-    context_page: Page
-    xhs_client: XHSClient
-    account_pool: AccountPool
-    browser_context: BrowserContext
-
-    def __init__(self) -> None:
-        self.index_url = "https://www.xiaohongshu.com"
-        self.user_agent = utils.get_user_agent()
-
-    def init_config(
-        self, platform: str, login_type: str, account_pool: AccountPool
-    ) -> None:
-        self.platform = platform
-        self.login_type = login_type
-        self.account_pool = account_pool
-
-    async def start(self, id: str) -> dict:
-        account_phone, playwright_proxy, httpx_proxy = self.create_proxy_info()
-        async with async_playwright() as playwright:
-            # Launch a browser context.
-            chromium = playwright.chromium
-            self.browser_context = await self.launch_browser(
-                chromium, playwright_proxy, self.user_agent, headless=True
-            )
-            # stealth.min.js is a js script to prevent the website from detecting the crawler.
-            await self.browser_context.add_init_script(path="app/utils/stealth.min.js")
-            # add a cookie attribute webId to avoid the appearance of a sliding captcha on the webpage
-            await self.browser_context.add_cookies(
-                [
-                    {
-                        "name": "webId",
-                        "value": "xxx123",  # any value
-                        "domain": ".xiaohongshu.com",
-                        "path": "/",
-                    }
-                ]
-            )
-            await asyncio.sleep(1)
-            self.context_page = await self.browser_context.new_page()
-            await asyncio.sleep(1)
-            await self.context_page.goto(self.index_url)
-            await asyncio.sleep(1)
-            # Create a client to interact with the xiaohongshu website.
-            self.xhs_client = await self.create_xhs_client(httpx_proxy)
-            if not await self.xhs_client.ping():
-                login_obj = XHSLogin(
-                    login_type=self.login_type,
-                    login_phone=account_phone,
-                    browser_context=self.browser_context,
-                    context_page=self.context_page,
-                    cookie_str=config.XIAOHONGSHU_COOKIES,
-                )
-                await asyncio.sleep(1)
-                await login_obj.begin()
-                await asyncio.sleep(1)
-                await self.xhs_client.update_cookies(
-                    browser_context=self.browser_context
-                )
-
-            # Search for notes and retrieve their comment information.
-            # await self.search()
-
-            logger.info("Xhs Crawler finished ...")
-            return await self.xhs_client.get_note_by_id(id)
-
-    async def search(self) -> None:
-        """Search for notes and retrieve their comment information."""
-        logger.info("Begin search xiaohongshu keywords")
-        xhs_limit_count = 20  # xhs limit page fixed value
-        for keyword in config.KEYWORDS.split(","):
-            # set keyword to context var
-            # request_keyword_var.set(keyword)
-            logger.info(f"Current search keyword: {keyword}")
-            page = 1
-            while page * xhs_limit_count <= config.CRAWLER_MAX_NOTES_COUNT:
-                note_id_list: List[str] = []
-                notes_res = await self.xhs_client.get_note_by_keyword(
-                    keyword=keyword,
-                    page=page,
-                )
-                semaphore = asyncio.Semaphore(config.MAX_CONCURRENCY_NUM)
-                task_list = [
-                    self.get_note_detail(post_item.get("id"), semaphore)
-                    for post_item in notes_res.get("items", {})
-                    if post_item.get("model_type") not in ("rec_query", "hot_query")
-                ]
-                note_details = await asyncio.gather(*task_list)
-                for note_detail in note_details:
-                    if note_detail is not None:
-                        # await xhs_model.update_xhs_note(note_detail)
-                        note_id_list.append(note_detail.get("note_id"))
-                page += 1
-                logger.info(f"Note details: {note_details}")
-                await self.batch_get_note_comments(note_id_list)
-
-    async def get_note_detail(
-        self, note_id: str, semaphore: asyncio.Semaphore
-    ) -> Optional[Dict]:
-        """Get note detail"""
-        async with semaphore:
-            try:
-                return await self.xhs_client.get_note_by_id(note_id)
-            except DataFetchError as ex:
-                logger.error(f"Get note detail error: {ex}")
-                return None
-
-    async def batch_get_note_comments(self, note_list: List[str]):
-        """Batch get note comments"""
-        logger.info(f"Begin batch get note comments, note list: {note_list}")
-        semaphore = asyncio.Semaphore(config.MAX_CONCURRENCY_NUM)
-        task_list: List[Task] = []
-        for note_id in note_list:
-            task = asyncio.create_task(
-                self.get_comments(note_id, semaphore), name=note_id
-            )
-            task_list.append(task)
-        await asyncio.gather(*task_list)
-
-    async def get_comments(self, note_id: str, semaphore: asyncio.Semaphore):
-        """Get note comments"""
-        async with semaphore:
-            logger.info(f"Begin get note id comments {note_id}")
-            all_comments = await self.xhs_client.get_note_all_comments(
-                note_id=note_id, crawl_interval=random.random()
-            )
-            # for comment in all_comments:
-            #     await xhs_model.update_xhs_note_comment(
-            #         note_id=note_id, comment_item=comment
-            #     )
-
-    def create_proxy_info(self) -> Tuple[Optional[str], Optional[Dict], Optional[str]]:
-        """Create proxy info for playwright and httpx"""
-        # phone: 13012345671  ip_proxy: 111.122.xx.xx1:8888
-        phone, ip_proxy = self.account_pool.get_account()
-        if not config.XHS_ENABLE_IP_PROXY:
-            return phone, None, None
-        logger.info("Begin proxy info for playwright and httpx ...")
-        playwright_proxy = {
-            "server": f"{config.IP_PROXY_PROTOCOL}{ip_proxy}",
-            "username": config.IP_PROXY_USER,
-            "password": config.IP_PROXY_PASSWORD,
-        }
-        httpx_proxy = f"{config.IP_PROXY_PROTOCOL}{config.IP_PROXY_USER}:{config.IP_PROXY_PASSWORD}@{ip_proxy}"
-        return phone, playwright_proxy, httpx_proxy
-
-    async def create_xhs_client(self, httpx_proxy: Optional[str]) -> XHSClient:
-        """Create xhs client"""
-        logger.info("Begin create xiaohongshu API client ...")
-        cookie_str, cookie_dict = utils.convert_cookies(
-            await self.browser_context.cookies()
-        )
-        xhs_client_obj = XHSClient(
-            proxies=httpx_proxy,
-            headers={
-                "User-Agent": self.user_agent,
-                "Cookie": cookie_str,
-                "Origin": "https://www.xiaohongshu.com",
-                "Referer": "https://www.xiaohongshu.com",
-                "Content-Type": "application/json;charset=UTF-8",
-            },
-            playwright_page=self.context_page,
-            cookie_dict=cookie_dict,
-        )
-        return xhs_client_obj
-
-    async def launch_browser(
-        self,
-        chromium: BrowserType,
-        playwright_proxy: Optional[Dict],
-        user_agent: Optional[str],
-        headless: bool = True,
-    ) -> BrowserContext:
-        """Launch browser and create browser context"""
-        logger.info("Begin create browser context ...")
-        if config.XHS_SAVE_LOGIN_STATE:
-            # feat issue #14
-            # we will save login state to avoid login every time
-            user_data_dir = config.TEMP_DIR
-            # user_data_dir = os.path.join(
-            #     os.getcwd(), "browser_data",  self.platform
-            # )  # type: ignore
-            browser_context = await chromium.launch_persistent_context(
-                user_data_dir=user_data_dir,
-                accept_downloads=True,
-                headless=headless,
-                proxy=playwright_proxy,  # type: ignore
-                viewport={"width": 1920, "height": 1080},
-                user_agent=user_agent,
-            )
-            return browser_context
-        else:
-            browser = await chromium.launch(headless=headless, proxy=playwright_proxy)  # type: ignore
-            browser_context = await browser.new_context(
-                viewport={"width": 1920, "height": 1080}, user_agent=user_agent
-            )
-            return browser_context
-
-    async def close(self):
-        """Close browser context"""
-        await self.browser_context.close()
-        logger.info("Browser context closed ...")
diff --git a/app/services/scrapers/xiaohongshu/xhs/exception.py b/app/services/scrapers/xiaohongshu/xhs/exception.py
deleted file mode 100644
index 1a8642e..0000000
--- a/app/services/scrapers/xiaohongshu/xhs/exception.py
+++ /dev/null
@@ -1,9 +0,0 @@
-from httpx import RequestError
-
-
-class DataFetchError(RequestError):
-    """something error when fetch"""
-
-
-class IPBlockError(RequestError):
-    """fetch so fast that the server block us ip"""
diff --git a/app/services/scrapers/xiaohongshu/xhs/field.py b/app/services/scrapers/xiaohongshu/xhs/field.py
deleted file mode 100644
index fbac0d2..0000000
--- a/app/services/scrapers/xiaohongshu/xhs/field.py
+++ /dev/null
@@ -1,72 +0,0 @@
-from enum import Enum
-from typing import NamedTuple
-
-
-class FeedType(Enum):
-    # 推荐
-    RECOMMEND = "homefeed_recommend"
-    # 穿搭
-    FASION = "homefeed.fashion_v3"
-    # 美食
-    FOOD = "homefeed.food_v3"
-    # 彩妆
-    COSMETICS = "homefeed.cosmetics_v3"
-    # 影视
-    MOVIE = "homefeed.movie_and_tv_v3"
-    # 职场
-    CAREER = "homefeed.career_v3"
-    # 情感
-    EMOTION = "homefeed.love_v3"
-    # 家居
-    HOURSE = "homefeed.household_product_v3"
-    # 游戏
-    GAME = "homefeed.gaming_v3"
-    # 旅行
-    TRAVEL = "homefeed.travel_v3"
-    # 健身
-    FITNESS = "homefeed.fitness_v3"
-
-
-class NoteType(Enum):
-    NORMAL = "normal"
-    VIDEO = "video"
-
-
-class SearchSortType(Enum):
-    """search sort type"""
-    # default
-    GENERAL = "general"
-    # most popular
-    MOST_POPULAR = "popularity_descending"
-    # Latest
-    LATEST = "time_descending"
-
-
-class SearchNoteType(Enum):
-    """search note type
-    """
-    # default
-    ALL = 0
-    # only video
-    VIDEO = 1
-    # only image
-    IMAGE = 2
-
-
-class Note(NamedTuple):
-    """note tuple"""
-    note_id: str
-    title: str
-    desc: str
-    type: str
-    user: dict
-    img_urls: list
-    video_url: str
-    tag_list: list
-    at_user_list: list
-    collected_count: str
-    comment_count: str
-    liked_count: str
-    share_count: str
-    time: int
-    last_update_time: int
diff --git a/app/services/scrapers/xiaohongshu/xhs/help.py b/app/services/scrapers/xiaohongshu/xhs/help.py
deleted file mode 100644
index c1e191f..0000000
--- a/app/services/scrapers/xiaohongshu/xhs/help.py
+++ /dev/null
@@ -1,262 +0,0 @@
-import ctypes
-import json
-import random
-import time
-import urllib.parse
-
-
-def sign(a1="", b1="", x_s="", x_t=""):
-    """
-    takes in a URI (uniform resource identifier), an optional data dictionary, and an optional ctime parameter. It returns a dictionary containing two keys: "x-s" and "x-t".
-    """
-    common = {
-        "s0": 5,  # getPlatformCode
-        "s1": "",
-        "x0": "1",  # localStorage.getItem("b1b1")
-        "x1": "3.3.0",  # version
-        "x2": "Windows",
-        "x3": "xhs-pc-web",
-        "x4": "1.4.4",
-        "x5": a1,  # cookie of a1
-        "x6": x_t,
-        "x7": x_s,
-        "x8": b1,  # localStorage.getItem("b1")
-        "x9": mrc(x_t + x_s + b1),
-        "x10": 1,  # getSigCount
-    }
-    encode_str = encodeUtf8(json.dumps(common, separators=(',', ':')))
-    x_s_common = b64Encode(encode_str)
-    x_b3_traceid = get_b3_trace_id()
-    return {
-        "x-s": x_s,
-        "x-t": x_t,
-        "x-s-common": x_s_common,
-        "x-b3-traceid": x_b3_traceid
-    }
-
-
-def get_b3_trace_id():
-    re = "abcdef0123456789"
-    je = 16
-    e = ""
-    for t in range(16):
-        e += re[random.randint(0, je - 1)]
-    return e
-
-
-def mrc(e):
-    ie = [
-        0, 1996959894, 3993919788, 2567524794, 124634137, 1886057615, 3915621685,
-        2657392035, 249268274, 2044508324, 3772115230, 2547177864, 162941995,
-        2125561021, 3887607047, 2428444049, 498536548, 1789927666, 4089016648,
-        2227061214, 450548861, 1843258603, 4107580753, 2211677639, 325883990,
-        1684777152, 4251122042, 2321926636, 335633487, 1661365465, 4195302755,
-        2366115317, 997073096, 1281953886, 3579855332, 2724688242, 1006888145,
-        1258607687, 3524101629, 2768942443, 901097722, 1119000684, 3686517206,
-        2898065728, 853044451, 1172266101, 3705015759, 2882616665, 651767980,
-        1373503546, 3369554304, 3218104598, 565507253, 1454621731, 3485111705,
-        3099436303, 671266974, 1594198024, 3322730930, 2970347812, 795835527,
-        1483230225, 3244367275, 3060149565, 1994146192, 31158534, 2563907772,
-        4023717930, 1907459465, 112637215, 2680153253, 3904427059, 2013776290,
-        251722036, 2517215374, 3775830040, 2137656763, 141376813, 2439277719,
-        3865271297, 1802195444, 476864866, 2238001368, 4066508878, 1812370925,
-        453092731, 2181625025, 4111451223, 1706088902, 314042704, 2344532202,
-        4240017532, 1658658271, 366619977, 2362670323, 4224994405, 1303535960,
-        984961486, 2747007092, 3569037538, 1256170817, 1037604311, 2765210733,
-        3554079995, 1131014506, 879679996, 2909243462, 3663771856, 1141124467,
-        855842277, 2852801631, 3708648649, 1342533948, 654459306, 3188396048,
-        3373015174, 1466479909, 544179635, 3110523913, 3462522015, 1591671054,
-        702138776, 2966460450, 3352799412, 1504918807, 783551873, 3082640443,
-        3233442989, 3988292384, 2596254646, 62317068, 1957810842, 3939845945,
-        2647816111, 81470997, 1943803523, 3814918930, 2489596804, 225274430,
-        2053790376, 3826175755, 2466906013, 167816743, 2097651377, 4027552580,
-        2265490386, 503444072, 1762050814, 4150417245, 2154129355, 426522225,
-        1852507879, 4275313526, 2312317920, 282753626, 1742555852, 4189708143,
-        2394877945, 397917763, 1622183637, 3604390888, 2714866558, 953729732,
-        1340076626, 3518719985, 2797360999, 1068828381, 1219638859, 3624741850,
-        2936675148, 906185462, 1090812512, 3747672003, 2825379669, 829329135,
-        1181335161, 3412177804, 3160834842, 628085408, 1382605366, 3423369109,
-        3138078467, 570562233, 1426400815, 3317316542, 2998733608, 733239954,
-        1555261956, 3268935591, 3050360625, 752459403, 1541320221, 2607071920,
-        3965973030, 1969922972, 40735498, 2617837225, 3943577151, 1913087877,
-        83908371, 2512341634, 3803740692, 2075208622, 213261112, 2463272603,
-        3855990285, 2094854071, 198958881, 2262029012, 4057260610, 1759359992,
-        534414190, 2176718541, 4139329115, 1873836001, 414664567, 2282248934,
-        4279200368, 1711684554, 285281116, 2405801727, 4167216745, 1634467795,
-        376229701, 2685067896, 3608007406, 1308918612, 956543938, 2808555105,
-        3495958263, 1231636301, 1047427035, 2932959818, 3654703836, 1088359270,
-        936918000, 2847714899, 3736837829, 1202900863, 817233897, 3183342108,
-        3401237130, 1404277552, 615818150, 3134207493, 3453421203, 1423857449,
-        601450431, 3009837614, 3294710456, 1567103746, 711928724, 3020668471,
-        3272380065, 1510334235, 755167117,
-    ]
-    o = -1
-
-    def right_without_sign(num: int, bit: int=0) -> int:
-        val = ctypes.c_uint32(num).value >> bit
-        MAX32INT = 4294967295
-        return (val + (MAX32INT + 1)) % (2 * (MAX32INT + 1)) - MAX32INT - 1
-
-    for n in range(57):
-        o = ie[(o & 255) ^ ord(e[n])] ^ right_without_sign(o, 8)
-    return o ^ -1 ^ 3988292384
-
-
-lookup = [
-    "Z",
-    "m",
-    "s",
-    "e",
-    "r",
-    "b",
-    "B",
-    "o",
-    "H",
-    "Q",
-    "t",
-    "N",
-    "P",
-    "+",
-    "w",
-    "O",
-    "c",
-    "z",
-    "a",
-    "/",
-    "L",
-    "p",
-    "n",
-    "g",
-    "G",
-    "8",
-    "y",
-    "J",
-    "q",
-    "4",
-    "2",
-    "K",
-    "W",
-    "Y",
-    "j",
-    "0",
-    "D",
-    "S",
-    "f",
-    "d",
-    "i",
-    "k",
-    "x",
-    "3",
-    "V",
-    "T",
-    "1",
-    "6",
-    "I",
-    "l",
-    "U",
-    "A",
-    "F",
-    "M",
-    "9",
-    "7",
-    "h",
-    "E",
-    "C",
-    "v",
-    "u",
-    "R",
-    "X",
-    "5",
-]
-
-
-def tripletToBase64(e):
-    return (
-            lookup[63 & (e >> 18)] +
-            lookup[63 & (e >> 12)] +
-            lookup[(e >> 6) & 63] +
-            lookup[e & 63]
-    )
-
-
-def encodeChunk(e, t, r):
-    m = []
-    for b in range(t, r, 3):
-        n = (16711680 & (e[b] << 16)) + \
-            ((e[b + 1] << 8) & 65280) + (e[b + 2] & 255)
-        m.append(tripletToBase64(n))
-    return ''.join(m)
-
-
-def b64Encode(e):
-    P = len(e)
-    W = P % 3
-    U = []
-    z = 16383
-    H = 0
-    Z = P - W
-    while H < Z:
-        U.append(encodeChunk(e, H, Z if H + z > Z else H + z))
-        H += z
-    if 1 == W:
-        F = e[P - 1]
-        U.append(lookup[F >> 2] + lookup[(F << 4) & 63] + "==")
-    elif 2 == W:
-        F = (e[P - 2] << 8) + e[P - 1]
-        U.append(lookup[F >> 10] + lookup[63 & (F >> 4)] +
-                 lookup[(F << 2) & 63] + "=")
-    return "".join(U)
-
-
-def encodeUtf8(e):
-    b = []
-    m = urllib.parse.quote(e, safe='~()*!.\'')
-    w = 0
-    while w < len(m):
-        T = m[w]
-        if T == "%":
-            E = m[w + 1] + m[w + 2]
-            S = int(E, 16)
-            b.append(S)
-            w += 2
-        else:
-            b.append(ord(T[0]))
-        w += 1
-    return b
-
-
-def base36encode(number, alphabet='0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ'):
-    """Converts an integer to a base36 string."""
-    if not isinstance(number, int):
-        raise TypeError('number must be an integer')
-
-    base36 = ''
-    sign = ''
-
-    if number < 0:
-        sign = '-'
-        number = -number
-
-    if 0 <= number < len(alphabet):
-        return sign + alphabet[number]
-
-    while number != 0:
-        number, i = divmod(number, len(alphabet))
-        base36 = alphabet[i] + base36
-
-    return sign + base36
-
-
-def base36decode(number):
-    return int(number, 36)
-
-
-def get_search_id():
-    e = int(time.time() * 1000) << 64
-    t = int(random.uniform(0, 2147483646))
-    return base36encode((e + t))
-
-
-if __name__ == '__main__':
-    a = get_b3_trace_id()
-    print(a)
diff --git a/app/services/scrapers/xiaohongshu/xhs/login.py b/app/services/scrapers/xiaohongshu/xhs/login.py
deleted file mode 100644
index 44b2826..0000000
--- a/app/services/scrapers/xiaohongshu/xhs/login.py
+++ /dev/null
@@ -1,198 +0,0 @@
-import asyncio
-import functools
-import sys
-from typing import Optional
-
-# import redis
-from playwright.async_api import BrowserContext, Page
-from tenacity import RetryError, retry, retry_if_result, stop_after_attempt, wait_fixed
-
-from app.utils.logger import logger
-
-# import config
-from .base_crawler import AbstractLogin
-from . import utils
-
-
-class XHSLogin(AbstractLogin):
-    def __init__(
-        self,
-        login_type: str,
-        browser_context: BrowserContext,
-        context_page: Page,
-        login_phone: Optional[str] = "",
-        cookie_str: dict = {},
-    ):
-        self.login_type = login_type
-        self.browser_context = browser_context
-        self.context_page = context_page
-        self.login_phone = login_phone
-        self.cookie_str = cookie_str
-
-    @retry(
-        stop=stop_after_attempt(20),
-        wait=wait_fixed(1),
-        retry=retry_if_result(lambda value: value is False),
-    )
-    async def check_login_state(self, no_logged_in_session: str) -> bool:
-        """
-        Check if the current login status is successful and return True otherwise return False
-        retry decorator will retry 20 times if the return value is False, and the retry interval is 1 second
-        if max retry times reached, raise RetryError
-        """
-        current_cookie = await self.browser_context.cookies()
-        _, cookie_dict = utils.convert_cookies(current_cookie)
-        current_web_session = cookie_dict.get("web_session")
-        if current_web_session != no_logged_in_session:
-            return True
-        return False
-
-    async def begin(self):
-        """Start login xiaohongshu"""
-        logger.info("Begin login xiaohongshu ...")
-        if self.login_type == "qrcode":
-            await self.login_by_qrcode()
-        elif self.login_type == "phone":
-            await self.login_by_mobile()
-        elif self.login_type == "cookie":
-            await self.login_by_cookies()
-        else:
-            raise ValueError(
-                "Invalid Login Type Currently only supported qrcode or phone or cookies ..."
-            )
-
-    async def login_by_mobile(self):
-        pass
-    #     """Login xiaohongshu by mobile"""
-    #     logger.info("Begin login xiaohongshu by mobile ...")
-    #     await asyncio.sleep(1)
-    #     try:
-    #         # 小红书进入首页后，有可能不会自动弹出登录框，需要手动点击登录按钮
-    #         login_button_ele = await self.context_page.wait_for_selector(
-    #             selector="xpath=//*[@id='app']/div[1]/div[2]/div[1]/ul/div[1]/button",
-    #             timeout=5000
-    #         )
-    #         await login_button_ele.click()
-    #         # 弹窗的登录对话框也有两种形态，一种是直接可以看到手机号和验证码的
-    #         # 另一种是需要点击切换到手机登录的
-    #         element = await self.context_page.wait_for_selector(
-    #             selector='xpath=//div[@class="login-container"]//div[@class="other-method"]/div[1]',
-    #             timeout=5000
-    #         )
-    #         await element.click()
-    #     except Exception as e:
-    #         logger.info("have not found mobile button icon and keep going ...")
-    #
-    #     await asyncio.sleep(1)
-    #     login_container_ele = await self.context_page.wait_for_selector("div.login-container")
-    #     input_ele = await login_container_ele.query_selector("label.phone > input")
-    #     await input_ele.fill(self.login_phone)
-    #     await asyncio.sleep(0.5)
-    #
-    #     send_btn_ele = await login_container_ele.query_selector("label.auth-code > span")
-    #     await send_btn_ele.click()  # 点击发送验证码
-    #     sms_code_input_ele = await login_container_ele.query_selector("label.auth-code > input")
-    #     submit_btn_ele = await login_container_ele.query_selector("div.input-container > button")
-    #     redis_obj = redis.Redis(host=config.REDIS_DB_HOST, password=config.REDIS_DB_PWD)
-    #     max_get_sms_code_time = 60 * 2  # 最长获取验证码的时间为2分钟
-    #     no_logged_in_session = ""
-    #     while max_get_sms_code_time > 0:
-    #         logger.info(f"get sms code from redis remaining time {max_get_sms_code_time}s ...")
-    #         await asyncio.sleep(1)
-    #         sms_code_key = f"xhs_{self.login_phone}"
-    #         sms_code_value = redis_obj.get(sms_code_key)
-    #         if not sms_code_value:
-    #             max_get_sms_code_time -= 1
-    #             continue
-    #
-    #         current_cookie = await self.browser_context.cookies()
-    #         _, cookie_dict = utils.convert_cookies(current_cookie)
-    #         no_logged_in_session = cookie_dict.get("web_session")
-    #
-    #         await sms_code_input_ele.fill(value=sms_code_value.decode())  # 输入短信验证码
-    #         await asyncio.sleep(0.5)
-    #         agree_privacy_ele = self.context_page.locator("xpath=//div[@class='agreements']//*[local-name()='svg']")
-    #         await agree_privacy_ele.click()  # 点击同意隐私协议
-    #         await asyncio.sleep(0.5)
-    #
-    #         await submit_btn_ele.click()  # 点击登录
-    #
-    #         # todo ... 应该还需要检查验证码的正确性有可能输入的验证码不正确
-    #         break
-    #
-    #     try:
-    #         await self.check_login_state(no_logged_in_session)
-    #     except RetryError:
-    #         logger.info("Login xiaohongshu failed by mobile login method ...")
-    #         sys.exit()
-    #
-    #     wait_redirect_seconds = 5
-    #     logger.info(f"Login successful then wait for {wait_redirect_seconds} seconds redirect ...")
-    #     await asyncio.sleep(wait_redirect_seconds)
-
-    async def login_by_qrcode(self):
-        """login xiaohongshu website and keep webdriver login state"""
-        logger.info("Begin login xiaohongshu by qrcode ...")
-        # login_selector = "div.login-container > div.left > div.qrcode > img"
-        qrcode_img_selector = "xpath=//img[@class='qrcode-img']"
-        # find login qrcode
-        base64_qrcode_img = await utils.find_login_qrcode(
-            self.context_page, selector=qrcode_img_selector
-        )
-        if not base64_qrcode_img:
-            logger.info("login failed , have not found qrcode please check ....")
-            # if this website does not automatically popup login dialog box, we will manual click login button
-            await asyncio.sleep(0.5)
-            login_button_ele = self.context_page.locator(
-                "xpath=//*[@id='app']/div[1]/div[2]/div[1]/ul/div[1]/button"
-            )
-            await login_button_ele.click()
-            base64_qrcode_img = await utils.find_login_qrcode(
-                self.context_page, selector=qrcode_img_selector
-            )
-            if not base64_qrcode_img:
-                sys.exit()
-
-        # get not logged session
-        current_cookie = await self.browser_context.cookies()
-        _, cookie_dict = utils.convert_cookies(current_cookie)
-        no_logged_in_session = cookie_dict.get("web_session")
-
-        # show login qrcode
-        # fix issue #12
-        # we need to use partial function to call show_qrcode function and run in executor
-        # then current asyncio event loop will not be blocked
-        partial_show_qrcode = functools.partial(utils.show_qrcode, base64_qrcode_img)
-        asyncio.get_running_loop().run_in_executor(
-            executor=None, func=partial_show_qrcode
-        )
-
-        logger.info(f"waiting for scan code login, remaining time is 20s")
-        try:
-            await self.check_login_state(no_logged_in_session)
-        except RetryError:
-            logger.info("Login xiaohongshu failed by qrcode login method ...")
-            sys.exit()
-
-        wait_redirect_seconds = 5
-        logger.info(
-            f"Login successful then wait for {wait_redirect_seconds} seconds redirect ..."
-        )
-        await asyncio.sleep(wait_redirect_seconds)
-
-    async def login_by_cookies(self):
-        """login xiaohongshu website by cookies"""
-        logger.info("Begin login xiaohongshu by cookie ...")
-        for key, value in self.cookie_str.items():
-            if key != "web_session":  # only set web_session cookie attr
-                continue
-            await self.browser_context.add_cookies(
-                [
-                    {
-                        "name": key,
-                        "value": value,
-                        "domain": ".xiaohongshu.com",
-                        "path": "/",
-                    }
-                ]
-            )
diff --git a/app/services/scrapers/xiaohongshu/xhs/proxy_account_pool.py b/app/services/scrapers/xiaohongshu/xhs/proxy_account_pool.py
deleted file mode 100644
index 59f9b32..0000000
--- a/app/services/scrapers/xiaohongshu/xhs/proxy_account_pool.py
+++ /dev/null
@@ -1,132 +0,0 @@
-from typing import List, Optional, Set, Tuple
-
-from app import config
-
-
-class PhonePool:
-    """phone pool class"""
-
-    def __init__(self) -> None:
-        self.phones: List[str] = []
-        self.used_phones: Set[str] = set()
-
-    def add_phone(self, phone: str) -> bool:
-        """add phone to the pool"""
-        if phone not in self.phones:
-            self.phones.append(phone)
-            return True
-        return False
-
-    def remove_phone(self, phone: str) -> bool:
-        """remove phone from the pool"""
-        if phone in self.used_phones:
-            self.phones.remove(phone)
-            self.used_phones.remove(phone)
-            return True
-        return False
-
-    def get_phone(self) -> Optional[str]:
-        """get phone and mark as used"""
-        if self.phones:
-            left_phone = self.phones.pop(0)
-            self.used_phones.add(left_phone)
-            return left_phone
-        return None
-
-    def clear(self):
-        """clear phone pool"""
-        self.phones = []
-        self.used_phones = set()
-
-
-class IPPool:
-    def __init__(self) -> None:
-        self.ips: List[str] = []
-        self.used_ips: Set[str] = set()
-
-    def add_ip(self, ip):
-        """添加ip"""
-        if ip not in self.ips:
-            self.ips.append(ip)
-            return True
-        return False
-
-    def remove_ip(self, ip: str) -> bool:
-        """remove ip"""
-        if ip in self.used_ips:
-            self.ips.remove(ip)
-            self.used_ips.remove(ip)
-            return True
-        return False
-
-    def get_ip(self) -> Optional[str]:
-        """get ip and mark as used"""
-        if self.ips:
-            left_ips = self.ips.pop(0)
-            self.used_ips.add(left_ips)
-            return left_ips
-        return None
-
-    def clear(self):
-        """clear ip pool"""
-        self.ips = []
-        self.used_ips = set()
-
-
-class AccountPool:
-    """account pool class"""
-
-    def __init__(self):
-        self.phone_pool = PhonePool()
-        self.ip_pool = IPPool()
-
-    def add_account(self, phone: str, ip: str) -> bool:
-        """add account to pool with phone and ip"""
-        if self.phone_pool.add_phone(phone) and self.ip_pool.add_ip(ip):
-            return True
-        return False
-
-    def remove_account(self, phone: str, ip: str) -> bool:
-        """remove account from pool"""
-        if self.phone_pool.remove_phone(phone) and self.ip_pool.remove_ip(ip):
-            return True
-        return False
-
-    def get_account(self) -> Tuple[str, str]:
-        """get account if no account, reload account pool"""
-        phone = self.phone_pool.get_phone()
-        ip = self.ip_pool.get_ip()
-        # if not phone or not ip:
-        #     reload_account_pool(self)
-        #     return self.get_account()
-        return phone, ip
-
-    def clear_account(self):
-        """clear account pool"""
-        self.phone_pool.clear()
-        self.ip_pool.clear()
-
-
-def reload_account_pool(apo: AccountPool):
-    """reload account pool"""
-    apo.clear_account()
-    for phone, ip in zip(config.XHS_PHONE_LIST, config.XHS_IP_PROXY_LIST):
-        apo.add_account(phone, ip)
-
-
-def create_account_pool() -> AccountPool:
-    """create account pool"""
-    apo = AccountPool()
-    reload_account_pool(apo=apo)
-    return apo
-
-
-if __name__ == "__main__":
-    import time
-
-    ac_pool = create_account_pool()
-    p, i = ac_pool.get_account()
-    while p:
-        print(f"get phone:{p}, ip proxy:{i} from account pool")
-        p, i = ac_pool.get_account()
-        time.sleep(1)
diff --git a/app/services/scrapers/xiaohongshu/xhs/utils.py b/app/services/scrapers/xiaohongshu/xhs/utils.py
deleted file mode 100644
index 446d83f..0000000
--- a/app/services/scrapers/xiaohongshu/xhs/utils.py
+++ /dev/null
@@ -1,272 +0,0 @@
-import base64
-import logging
-import os
-import random
-import re
-import time
-from io import BytesIO
-from typing import Dict, List, Optional, Tuple
-from urllib.parse import urlparse
-
-import httpx
-
-from PIL import Image, ImageDraw
-from playwright.async_api import Cookie, Page
-
-
-async def find_login_qrcode(page: Page, selector: str) -> str:
-    """find login qrcode image from target selector"""
-    try:
-        elements = await page.wait_for_selector(
-            selector=selector,
-        )
-        login_qrcode_img = await elements.get_property("src")  # type: ignore
-        return str(login_qrcode_img)
-
-    except Exception as e:
-        print(e)
-        return ""
-
-
-def show_qrcode(qr_code) -> None:  # type: ignore
-    """parse base64 encode qrcode image and show it"""
-    qr_code = qr_code.split(",")[1]
-    qr_code = base64.b64decode(qr_code)
-    image = Image.open(BytesIO(qr_code))
-
-    # Add a square border around the QR code and display it within the border to improve scanning accuracy.
-    width, height = image.size
-    new_image = Image.new("RGB", (width + 20, height + 20), color=(255, 255, 255))
-    new_image.paste(image, (10, 10))
-    draw = ImageDraw.Draw(new_image)
-    draw.rectangle((0, 0, width + 19, height + 19), outline=(0, 0, 0), width=1)
-    new_image.show()
-
-
-def get_user_agent() -> str:
-    ua_list = [
-        "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/114.0.0.0 Safari/537.36",
-        "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.5112.79 Safari/537.36",
-        "Mozilla/5.0 (Windows NT 10.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.0.0 Safari/537.36",
-        "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_6) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.0.0 Safari/537.36",
-        "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/103.0.5060.53 Safari/537.36",
-        "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_3) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/99.0.4844.84 Safari/537.36",
-    ]
-    return random.choice(ua_list)
-
-
-def convert_cookies(cookies: Optional[List[Cookie]]) -> Tuple[str, Dict]:
-    if not cookies:
-        return "", {}
-    cookies_str = ";".join(
-        [f"{cookie.get('name')}={cookie.get('value')}" for cookie in cookies]
-    )
-    cookie_dict = dict()
-    for cookie in cookies:
-        cookie_dict[cookie.get("name")] = cookie.get("value")
-    return cookies_str, cookie_dict
-
-
-def convert_str_cookie_to_dict(cookie_str: str) -> Dict:
-    cookie_dict: Dict[str, str] = dict()
-    if not cookie_str:
-        return cookie_dict
-    for cookie in cookie_str.split(";"):
-        cookie = cookie.strip()
-        if not cookie:
-            continue
-        cookie_list = cookie.split("=")
-        if len(cookie_list) != 2:
-            continue
-        cookie_value = cookie_list[1]
-        if isinstance(cookie_value, list):
-            cookie_value = "".join(cookie_value)
-        cookie_dict[cookie_list[0]] = cookie_value
-    return cookie_dict
-
-
-def get_current_timestamp():
-    return int(time.time() * 1000)
-
-
-def match_interact_info_count(count_str: str) -> int:
-    if not count_str:
-        return 0
-
-    match = re.search(r"\d+", count_str)
-    if match:
-        number = match.group()
-        return int(number)
-    else:
-        return 0
-
-
-def init_loging_config():
-    level = logging.INFO
-    logging.basicConfig(
-        level=level,
-        format="%(asctime)s %(name)s %(levelname)s %(message)s ",
-        datefmt="%Y-%m-%d  %H:%M:%S",
-    )
-    _logger = logging.getLogger("MediaCrawler")
-    _logger.setLevel(level)
-    return _logger
-
-
-logger = init_loging_config()
-
-
-# class Slide:
-#     """
-#     copy from https://blog.csdn.net/weixin_43582101 thanks for author
-#     update: relakkes
-#     """
-#
-#     def __init__(self, gap, bg, gap_size=None, bg_size=None, out=None):
-#         """
-#         :param gap: 缺口图片链接或者url
-#         :param bg: 带缺口的图片链接或者url
-#         """
-#         self.img_dir = os.path.join(os.getcwd(), 'temp_image')
-#         if not os.path.exists(self.img_dir):
-#             os.makedirs(self.img_dir)
-#
-#         bg_resize = bg_size if bg_size else (340, 212)
-#         gap_size = gap_size if gap_size else (68, 68)
-#         self.bg = self.check_is_img_path(bg, 'bg', resize=bg_resize)
-#         self.gap = self.check_is_img_path(gap, 'gap', resize=gap_size)
-#         self.out = out if out else os.path.join(self.img_dir, 'out.jpg')
-#
-#     @staticmethod
-#     def check_is_img_path(img, img_type, resize):
-#         if img.startswith('http'):
-#             headers = {
-#                 "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;"
-#                           "q=0.8,application/signed-exchange;v=b3;q=0.9",
-#                 "Accept-Encoding": "gzip, deflate, br",
-#                 "Accept-Language": "zh-CN,zh;q=0.9,en-GB;q=0.8,en;q=0.7,ja;q=0.6",
-#                 "Cache-Control": "max-age=0",
-#                 "Connection": "keep-alive",
-#                 "Host": urlparse(img).hostname,
-#                 "Upgrade-Insecure-Requests": "1",
-#                 "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) "
-#                               "Chrome/91.0.4472.164 Safari/537.36",
-#             }
-#             img_res = httpx.get(img, headers=headers)
-#             if img_res.status_code == 200:
-#                 img_path = f'./temp_image/{img_type}.jpg'
-#                 image = np.asarray(bytearray(img_res.content), dtype="uint8")
-#                 image = cv2.imdecode(image, cv2.IMREAD_COLOR)
-#                 if resize:
-#                     image = cv2.resize(image, dsize=resize)
-#                 cv2.imwrite(img_path, image)
-#                 return img_path
-#             else:
-#                 raise Exception(f"保存{img_type}图片失败")
-#         else:
-#             return img
-#
-#     @staticmethod
-#     def clear_white(img):
-#         """清除图片的空白区域，这里主要清除滑块的空白"""
-#         img = cv2.imread(img)
-#         rows, cols, channel = img.shape
-#         min_x = 255
-#         min_y = 255
-#         max_x = 0
-#         max_y = 0
-#         for x in range(1, rows):
-#             for y in range(1, cols):
-#                 t = set(img[x, y])
-#                 if len(t) >= 2:
-#                     if x <= min_x:
-#                         min_x = x
-#                     elif x >= max_x:
-#                         max_x = x
-#
-#                     if y <= min_y:
-#                         min_y = y
-#                     elif y >= max_y:
-#                         max_y = y
-#         img1 = img[min_x:max_x, min_y: max_y]
-#         return img1
-#
-#     def template_match(self, tpl, target):
-#         th, tw = tpl.shape[:2]
-#         result = cv2.matchTemplate(target, tpl, cv2.TM_CCOEFF_NORMED)
-#         # 寻找矩阵(一维数组当作向量,用Mat定义) 中最小值和最大值的位置
-#         min_val, max_val, min_loc, max_loc = cv2.minMaxLoc(result)
-#         tl = max_loc
-#         br = (tl[0] + tw, tl[1] + th)
-#         # 绘制矩形边框，将匹配区域标注出来
-#         # target：目标图像
-#         # tl：矩形定点
-#         # br：矩形的宽高
-#         # (0,0,255)：矩形边框颜色
-#         # 1：矩形边框大小
-#         cv2.rectangle(target, tl, br, (0, 0, 255), 2)
-#         cv2.imwrite(self.out, target)
-#         return tl[0]
-#
-#     @staticmethod
-#     def image_edge_detection(img):
-#         edges = cv2.Canny(img, 100, 200)
-#         return edges
-#
-#     def discern(self):
-#         img1 = self.clear_white(self.gap)
-#         img1 = cv2.cvtColor(img1, cv2.COLOR_RGB2GRAY)
-#         slide = self.image_edge_detection(img1)
-#
-#         back = cv2.imread(self.bg, cv2.COLOR_RGB2GRAY)
-#         back = self.image_edge_detection(back)
-#
-#         slide_pic = cv2.cvtColor(slide, cv2.COLOR_GRAY2RGB)
-#         back_pic = cv2.cvtColor(back, cv2.COLOR_GRAY2RGB)
-#         x = self.template_match(slide_pic, back_pic)
-#         # 输出横坐标, 即 滑块在图片上的位置
-#         return x
-#
-
-
-def get_track_simple(distance) -> List[int]:
-    # 有的检测移动速度的 如果匀速移动会被识别出来，来个简单点的 渐进
-    # distance为传入的总距离
-    # 移动轨迹
-    track: List[int] = []
-    # 当前位移
-    current = 0
-    # 减速阈值
-    mid = distance * 4 / 5
-    # 计算间隔
-    t = 0.2
-    # 初速度
-    v = 1
-
-    while current < distance:
-        if current < mid:
-            # 加速度为2
-            a = 4
-        else:
-            # 加速度为-2
-            a = -3
-        v0 = v
-        # 当前速度
-        v = v0 + a * t  # type: ignore
-        # 移动距离
-        move = v0 * t + 1 / 2 * a * t * t
-        # 当前位移
-        current += move  # type: ignore
-        # 加入轨迹
-        track.append(round(move))
-    return track
-
-
-def get_tracks(distance: int, level: str = "easy") -> List[int]:
-    if level == "easy":
-        return get_track_simple(distance)
-    else:
-        from . import easing
-
-        _, tricks = easing.get_tracks(distance, seconds=2, ease_func="ease_out_expo")
-        return tricks
diff --git a/app/services/scrapers/zhihu/__init__.py b/app/services/scrapers/zhihu/__init__.py
deleted file mode 100644
index 949acfc..0000000
--- a/app/services/scrapers/zhihu/__init__.py
+++ /dev/null
@@ -1,792 +0,0 @@
-import json
-import re
-import traceback
-from typing import Dict, Optional, Any
-from urllib.parse import urlparse
-
-import httpx
-import jmespath
-from bs4 import BeautifulSoup
-from lxml import etree, html
-
-from app.utils.parse import (
-    get_html_text_length,
-    format_telegram_short_text,
-    unix_timestamp_to_utc,
-    wrap_text_into_html,
-)
-from app.utils.network import get_selector, get_redirect_url, get_response_json, get_random_user_agent, \
-    get_content_async, get_response
-from app.models.metadata_item import MetadataItem, MediaFile, MessageType
-from app.config import JINJA2_ENV, FXZHIHU_HOST
-from .config import (
-    SHORT_LIMIT,
-    ZHIHU_COLUMNS_API_HOST,
-    ZHIHU_API_HOST,
-    ZHIHU_HOST,
-    ALL_METHODS,
-    ZHIHU_COOKIES,
-    ZHIHU_API_ANSWER_PARAMS
-)
-from app.utils.logger import logger
-
-environment = JINJA2_ENV
-short_text_template = environment.get_template("zhihu_short_text.jinja2")
-content_template = environment.get_template("zhihu_content.jinja2")
-zhihu_client = httpx.AsyncClient()
-
-
-def _parse_answer_api_json_data(data: Dict) -> Dict:
-    expression = f"""{{
-            question_id: question.id,
-            title: question.title,
-            question_detail: question.detail,
-            answer_count: question.answer_count,
-            follower_count: question.follower_count,
-            question_created: question.created,
-            question_updated: question.updated_time,
-            author: author.name,
-            author_url_token: author.url_token,
-            content: content,
-            created: created_time
-            updated: updated_time,
-            comment_count: comment_count,
-            voteup_count: voteup_count,
-            ip_info: ipInfo
-        }}"""
-    result = jmespath.search(expression, data)
-    return result
-
-
-def _fix_json_quotes(raw_str):
-    """
-        通用修复函数：
-        1. 修复物理换行
-        2. 修复 key: value 结构中 value 内部未正确转义的引号
-        3. 修复特殊的 href="null" 等非法结构
-        """
-
-    raw_str = raw_str.replace('\n', '\\n').replace('\r', '\\r')
-    raw_str = re.sub(r'href="([^\\].*?)"', r'href=\\"\1\\"', raw_str)
-
-    target_keys = ['content','detail']
-
-    for key in target_keys:
-        pattern = r'("' + key + r'":\s*")(.*?)("(?=,"[a-z_]+":))'
-
-        def replace_inner_quotes(match):
-            prefix = match.group(1)
-            body = match.group(2)
-            suffix = match.group(3)
-
-            fixed_body = body.replace('\\"', '"').replace('\\&quot;', '').replace('"', '\\"')
-
-            return prefix + fixed_body + suffix
-
-        raw_str = re.sub(pattern, replace_inner_quotes, raw_str, flags=re.DOTALL)
-
-    return raw_str
-
-
-class Zhihu(MetadataItem):
-    def __init__(self, url: str, data: Optional[Any] = None, **kwargs):
-        # metadata fields
-        self.url: url = url
-        self.title: str = ""
-        self.author: str = ""
-        self.author_url: str = ""
-        self.text: str = ""
-        self.content: str = ""
-        self.media_files: list[MediaFile] = []
-        self.category = "zhihu"
-        self.message_type: MessageType = MessageType.SHORT
-        # auxiliary fields
-        self.item_title = ""
-        self.item_url = ""
-        self.group_name = ""
-        self.group_url = ""
-        self.zhihu_type = ""
-        self.text_group = ""
-        self.raw_content = ""
-        self.date = ""
-        self.updated = ""
-        self.retweet_html = ""
-        self.upvote: int = 0
-        self.retweeted: bool = False
-        # reqeust fields
-        self.httpx_client = zhihu_client
-        self.headers = {"User-Agent": get_random_user_agent(),
-                        "Accept": "*/*",
-                        "Referer": self.url,
-                        "Connection": "keep-alive",
-                        }
-        if kwargs.get("cookie"):
-            self.headers["Cookie"] = kwargs.get("cookie")
-        if ZHIHU_COOKIES:
-            self.headers["Cookie"] = ZHIHU_COOKIES
-        self.method = kwargs.get("method", "fxzhihu")
-        self.urlparser = urlparse(self.url)
-        self.api_url = ""
-        self.status_id = ""
-        self.answer_id = ""
-        self.question_id = ""
-        # other hard-coded fields
-        self.zhihu_type_translate = {
-            "article": "专栏文章",
-            "answer": "回答",
-            "status": "想法",
-        }
-
-    async def get_item(self) -> dict:
-        await self.get_zhihu()
-        return self.to_dict()
-
-    async def get_zhihu(self) -> None:
-        """
-        Main function.
-        Get the zhihu item and return the metadata dict.
-        :return: Dict
-        """
-        await self._get_zhihu_item()
-
-    async def _get_zhihu_item(self) -> None:
-        """
-        Get zhihu item via the corresponding method according to the zhihu type.
-        """
-        await self._check_zhihu_type()
-        function_dict = {
-            "answer": self._get_zhihu_answer,
-            "article": self._get_zhihu_article,
-            "status": self._get_zhihu_status,
-            "unknown": None,
-        }
-        for method in ALL_METHODS:
-            try:
-                if self.method not in ALL_METHODS:
-                    self.method = "json"
-                else:
-                    self.method = method
-                await self._get_request_url()
-                await function_dict[self.zhihu_type]()
-                if self.title != "":
-                    break
-            except Exception as e:
-                traceback.print_exc()
-                if method == ALL_METHODS[-1]:
-                    print("all methods failed")
-                    raise e
-                else:
-                    print(
-                        f"zhihu {self.zhihu_type} {self.method} failed, try the next method"
-                    )
-                continue
-        self._zhihu_short_text_process()
-        self._zhihu_content_process()
-        self.message_type = (
-            MessageType.LONG
-            if get_html_text_length(self.text) > SHORT_LIMIT
-            else MessageType.SHORT
-        )
-
-    async def _check_zhihu_type(self) -> None:
-        """
-        Check the zhihu type of the url. The zhihu type can be one of the following:
-        - answer (example: https://www.zhihu.com/question/19998424/answer/603067076)
-        - article (example: https://zhuanlan.zhihu.com/p/35142635)
-        - status (example: https://www.zhihu.com/pin/1667965059081945088)
-        """
-        host = self.urlparser.netloc
-        path = self.urlparser.path
-        logger.debug(
-            f"""
-        host: {host}
-        path: {path}
-        """
-        )
-        if host.startswith("zhuanlan."):
-            self.zhihu_type = "article"
-            self.article_id = self.urlparser.path.split("/")[-1]
-        elif path.startswith("/answer/") or (path.startswith("/question/") and path.find("/answer/") != -1):
-            self.zhihu_type = "answer"
-            self.answer_id = self.urlparser.path.split("/")[-1]
-            if path.find("/question/") != -1:
-                self.question_id = self.urlparser.path.split("/")[-3]
-            # self.method = "json"
-        elif path.startswith("/pin/"):
-            self.zhihu_type = "status"
-            self.status_id = self.urlparser.path.split("/")[-1]
-            # self.method = "api"
-        else:
-            self.zhihu_type = "unknown"
-        self.url = f"https://{host}{path}"
-
-    async def _get_request_url(self) -> None:
-        host = self.urlparser.netloc
-        path = self.urlparser.path
-        request_url_path = path
-        if self.method == "fxzhihu":
-            self.headers["Content-Type"] = "text/html"
-            if self.zhihu_type == "answer":
-                if self.question_id:
-                    self.request_url = (
-                            "https://" + FXZHIHU_HOST + '/question/' + self.question_id + '/answer/' + self.answer_id
-                    )
-                    return
-                self.request_url = (
-                        "https://" + FXZHIHU_HOST + '/answer/' + self.answer_id
-                )
-                return
-            elif self.zhihu_type == "article":
-                self.request_url = (
-                        "https://" + FXZHIHU_HOST + '/p/' + self.article_id
-                )
-                return
-            elif self.zhihu_type == "status":
-                self.request_url = (
-                        "https://" + FXZHIHU_HOST + '/pin/' + self.status_id
-                )
-                return
-        if self.zhihu_type == "answer":
-            if self.method == "api":
-                self.request_url = (
-                        ZHIHU_API_HOST
-                        + "/answers/"
-                        + self.answer_id
-                        + "?"
-                        + ZHIHU_API_ANSWER_PARAMS
-                )
-                return
-            else:
-                if path.find("question") != -1:
-                    self.question_id = self.urlparser.path.split("/")[-3]
-                else:
-                    await self._get_question_id()
-                request_url_path = "/aria/question/" + self.question_id + "/answer/" + self.answer_id
-        elif self.zhihu_type == "article":
-            if self.method == "api":
-                self.request_url = (
-                        ZHIHU_COLUMNS_API_HOST
-                        + "/articles/"
-                        + self.article_id
-                        + "?"
-                        + ZHIHU_API_ANSWER_PARAMS
-                )
-                return
-                # TODO: There are two api url to get a single article. The first one may fail in the future.
-                # Therefore, I remain the second one.
-                # self.request_url = (
-                #    ZHIHU_COLUMNS_API_HOST_V2 + self.article_id + "?" + ZHIHU_API_ANSWER_PARAMS)
-        elif self.zhihu_type == "status":
-            if self.method == "api":
-                self.request_url = (
-                        "https://www.zhihu.com/api/v4/pins/"
-                        + self.urlparser.path.split("/")[-1]
-                )
-                return
-        self.request_url = f"https://{host}{request_url_path}"
-
-    async def _get_zhihu_answer(self) -> None:
-        """
-        parse the zhihu answer page and get the metadata.
-        support methods: html, json. Recommend: json
-        """
-        if self.method in ["api", "json", "fxzhihu"]:
-            answer_data = {}
-            if self.method == "api":
-                try:
-                    json_data = await get_response_json(self.request_url, headers=self.headers,
-                                                        client=self.httpx_client)
-                    logger.debug(f"json data: {json_data}")
-                    answer_data = _parse_answer_api_json_data(json_data)
-                    logger.debug(f"answer data: {answer_data}")
-                except Exception as e:
-                    raise Exception("Cannot get the answer by API")
-            elif self.method == "fxzhihu":
-                try:
-                    resp = await get_response(url=self.request_url, headers=self.headers, client=self.httpx_client)
-                    json_data = json.loads(_fix_json_quotes(resp.text))
-                    logger.debug(f"json data: {json_data}")
-                    answer_data = _parse_answer_api_json_data(json_data)
-                    logger.debug(f"answer data: {answer_data}")
-                except Exception as e:
-                    raise Exception("Cannot get the answer by fxzhihu, error: " + str(e))
-            elif self.method == "json":
-                try:
-                    selector = await get_selector(self.request_url, headers=self.headers)
-                    json_data = selector.xpath('string(//script[@id="js-initialData"])')
-                    json_data = json.loads(json_data)
-                    json_data = json_data["initialState"]["entities"]
-                    answer_data = self._parse_answer_json_data(json_data)
-                except Exception as e:
-                    raise Exception("Cannot get the selector")
-            if answer_data == {}:
-                raise Exception("Cannot get the answer")
-            self._resolve_answer_json_data(answer_data)
-        else:
-            try:
-                selector = await get_selector(self.request_url, headers=self.headers)
-                self.upvote = selector.xpath(
-                    'string(//button[contains(@class,"VoteButton")])'
-                )
-                self.raw_content = str(
-                    etree.tostring(
-                        selector.xpath(
-                            '//div[contains(@class,"RichContent-inner")]//span[contains(@class,"RichText") and @itemprop="text"]'
-                        )[0],
-                        encoding="utf-8",
-                    ),
-                    encoding="utf-8",
-                )
-                self.title = selector.xpath("string(//h1)")
-                self.author = selector.xpath(
-                    'string(//div[@class="AuthorInfo"]//meta[@itemprop="name"]/@content)'
-                )
-                self.author_url = selector.xpath(
-                    'string(//div[@class="AuthorInfo"]//meta[@itemprop="url"]/@content)'
-                )
-                if self.author_url == "https://www.zhihu.com/people/":
-                    self.author_url = ""
-            except Exception as e:
-                raise Exception("Cannot get the answer")
-        if (
-                self.title == ""
-        ):  # TODO: this is not a good way to check if the scraping is successful. To be improved.
-            raise Exception("Cannot get the answer")
-
-    async def _get_zhihu_status(self):
-        """
-        parse the zhihu status page and get the metadata.
-        support methods: api, html
-        """
-        if self.method in ["api", "fxzhihu"]:
-            json_data = await get_response_json(self.request_url, headers=self.headers, client=self.httpx_client)
-            data = self._resolve_status_api_data(json_data)  # TODO: separate the function to resolve the api data
-            self.author = data["author"]
-            self.author_url = data["author_url"]
-            self.title = data["author"] + "的想法"
-            self.raw_content = json_data["content_html"]
-            self.media_files.extend(data["media_files"])
-            self.date = unix_timestamp_to_utc(data["created"])
-            self.updated = unix_timestamp_to_utc(data["updated"])
-            self.upvote = data["like_count"]
-            if data["origin_pin_id"]:
-                self.retweeted = True
-                self.origin_pin_url = ZHIHU_HOST + "/pin/" + data["origin_pin_id"]
-                self.origin_pin_author = data["origin_pin_data"]["author"]
-                self.origin_pin_author_url = data["origin_pin_data"]["author_url"]
-                self.origin_pin_raw_content = data["origin_pin_data"]["raw_content"]
-                self.origin_pin_date = unix_timestamp_to_utc(data["origin_pin_data"]["created"])
-                self.origin_pin_updated = unix_timestamp_to_utc(data["origin_pin_data"]["updated"])
-                self.origin_pin_upvote = data["origin_pin_data"]["like_count"]
-                self.origin_pin_comment_count = data["origin_pin_data"]["comment_count"]
-                self.media_files.extend(data["origin_pin_data"]["media_files"])
-        else:
-            try:
-                selector = await get_selector(self.request_url, headers=self.headers)
-            except:
-                raise Exception("zhihu request failed")
-            if self.method == "json":
-                def _process_picture(pictures, content_attr):
-                    if not hasattr(self, content_attr):
-                        setattr(self, content_attr, "")
-                    for pic in pictures:
-                        if pic["type"] == "image":
-                            if pic["isGif"]:
-                                media_type = "gif"
-                                setattr(
-                                    self,
-                                    content_attr,
-                                    getattr(self, content_attr)
-                                    + f'<br><video controls="controls" src="{pic["originalUrl"]}"><br>',
-                                )
-                            else:
-                                media_type = "image"
-                                setattr(
-                                    self,
-                                    content_attr,
-                                    getattr(self, content_attr)
-                                    + f'<br><img src="{pic["originalUrl"]}"><br>',
-                                )
-                        elif pic["type"] == "video":
-                            media_type = "video"
-                            setattr(
-                                self,
-                                content_attr,
-                                getattr(self, content_attr)
-                                + f'<br><video controls="controls" src="{pic["originalUrl"]}"><br>',
-                            )
-                        media_item = MediaFile.from_dict(
-                            {
-                                "media_type": media_type,
-                                "url": pic["originalUrl"],
-                                "caption": "",
-                            }
-                        )
-                        self.media_files.append(media_item)
-
-                json_data = selector.xpath('string(//script[@id="js-initialData"])')
-                json_data = json.loads(json_data)["initialState"]["entities"]
-                status_data = self._parse_status_json_data(json_data)
-                if status_data["origin_pin_url"] is not None:
-                    self.retweeted = True
-                    self.origin_pin_url = status_data["origin_pin_url"]
-                    self.origin_pin_author = status_data["origin_pin_author"]
-                    self.origin_pin_author_url = (
-                            ZHIHU_HOST
-                            + "/people/"
-                            + status_data["origin_pin_author_url_token"]
-                    )
-                    self.origin_pin_raw_content = status_data["origin_pin_content"]
-                    self.origin_pin_date = unix_timestamp_to_utc(
-                        status_data["origin_pin_created"]
-                    )
-                    self.origin_pin_updated = unix_timestamp_to_utc(
-                        status_data["origin_pin_updated"]
-                    )
-                    self.origin_pin_upvote = status_data["origin_pin_like_count"]
-                    self.origin_pin_comment_count = status_data[
-                        "origin_pin_comment_count"
-                    ]
-                    _process_picture(
-                        status_data["origin_pin_pictures"], "origin_pin_pic_content"
-                    )
-                self.title = status_data["author"] + "的想法"
-                self.author = status_data["author"]
-                self.author_url = (
-                        ZHIHU_HOST + "/people/" + status_data["author_url_token"]
-                )
-                self.raw_content = status_data["content"]
-                self.date = unix_timestamp_to_utc(status_data["created"])
-                self.updated = unix_timestamp_to_utc(status_data["updated"])
-                self.upvote = status_data["like_count"]
-                self.comment_count = status_data["comment_count"]
-                _process_picture(status_data["pictures"], "pic_content")
-            elif self.method == "html":
-                self.raw_content = str(
-                    etree.tostring(
-                        selector.xpath(
-                            '//span[contains(@class,"RichText") and @itemprop="text"]'
-                        )[0],
-                        encoding="utf-8",
-                    ),
-                    encoding="utf-8",
-                )
-                self.upvote = selector.xpath(
-                    'string(//button[contains(@class,"VoteButton")]//span)'
-                )
-                self.date = selector.xpath(
-                    'string(//div[@class="ContentItem-time"]//span)'
-                )
-                if (
-                        selector.xpath(
-                            'string(//div[@class="RichContent"]/div[2]/div[2]/@class)'
-                        ).find("PinItem-content-originpin")
-                        != -1
-                ):  # check if the status is a retweet
-                    if (
-                            str(
-                                etree.tostring(
-                                    selector.xpath(
-                                        '//div[contains(@class,"PinItem-content-originpin")]/div[3]'
-                                    )[0],
-                                    encoding="utf-8",
-                                ),
-                                encoding="utf-8",
-                            )
-                            != '<div class="RichText ztext PinItem-remainContentRichText"/>'
-                    ):  # if the retweet content including pictures
-                        pic_html = html.fromstring(
-                            str(
-                                etree.tostring(
-                                    selector.xpath(
-                                        '//div[contains(@class,"PinItem-content-originpin")]'
-                                    )[0],
-                                    encoding="utf-8",
-                                ),
-                                encoding="utf-8",
-                            )
-                        )
-                        self.retweet_html = str(
-                            html.tostring(pic_html, pretty_print=True)
-                        ).replace("b'<div", "<div")
-                        print(type(self.retweet_html))
-                        print(self.retweet_html)
-                    else:
-                        self.retweet_html = str(
-                            etree.tostring(
-                                selector.xpath(
-                                    '//div[contains(@class,"PinItem-content-originpin")]'
-                                )[0],
-                                encoding="utf-8",
-                            ),
-                            encoding="utf-8",
-                        )
-                        print(self.retweet_html)
-                self.author = selector.xpath(
-                    'string(//div[@class="AuthorInfo"]//meta[@itemprop="name"]/@content)'
-                )
-                self.author_url = selector.xpath(
-                    'string(//div[@class="AuthorInfo"]//meta[@itemprop="url"]/@content)'
-                )
-                self.title = self.author + "的想法"
-
-    async def _get_zhihu_article(self):
-        self.zhihu_type = "article"
-        if self.method in ["api", "fxzhihu"]:
-            try:
-                json_data = await get_response_json(self.request_url, headers=self.headers, client=self.httpx_client)
-                self.title = json_data["title"]
-                self.raw_content = json_data["content"]
-                self.author = json_data["author"]["name"]
-                self.author_url = json_data["author"]["url"]
-                self.upvote = json_data["voteup_count"]
-            except Exception as e:
-                raise Exception("zhihu request failed")
-        else:
-            try:
-                selector = await get_selector(self.request_url, headers=self.headers)
-            except Exception as e:
-                raise Exception("zhihu request failed")
-            if self.method == "json":
-                json_data = selector.xpath('string(//script[@id="js-initialData"])')
-                json_data = json.loads(json_data)
-                json_data = json_data["initialState"]["entities"]
-                article_data = self._parse_article_json_data(json_data)
-                self.title = article_data["title"]
-                self.raw_content = article_data["content"]
-                self.author = article_data["author"]
-                self.author_url = (
-                        ZHIHU_HOST + "/people/" + article_data["author_url_token"]
-                )
-                self.upvote = article_data["voteup_count"]
-                self.comment_count = article_data["comment_count"]
-                self.date = unix_timestamp_to_utc(article_data["created"])
-                self.updated = unix_timestamp_to_utc(article_data["updated"])
-                self.column = article_data["column"]
-                self.column_url = article_data["column_url"]
-                self.column_intro = article_data["column_intro"]
-            elif self.method == "html":
-                self.title = selector.xpath("string(//h1)")
-                self.upvote = selector.xpath(
-                    'string(//button[@class="Button VoteButton VoteButton--up"])'
-                )
-                self.raw_content = str(
-                    etree.tostring(
-                        selector.xpath(
-                            '//div[contains(@class,"RichText") and contains(@class,"ztext")]'
-                        )[0],
-                        encoding="utf-8",
-                    ),
-                    encoding="utf-8",
-                )
-                self.author = selector.xpath(
-                    'string(//div[contains(@class,"AuthorInfo-head")]//a)'
-                )
-                self.author_url = "https:" + selector.xpath(
-                    'string(//a[@class="UserLink-link"]/@href)'
-                )
-
-    def _zhihu_short_text_process(self):
-        def _html_process(raw_html: str) -> str:
-            soup = BeautifulSoup(raw_html, "html.parser")
-            for img_tag in soup.find_all("img"):
-                if img_tag["src"].find("data:image") != -1:
-                    continue
-                if self.zhihu_type != "status":
-                    media_item = MediaFile.from_dict(
-                        {"media_type": "image", "url": img_tag["src"], "caption": ""}
-                    )
-                    self.media_files.append(media_item)
-                src_value = img_tag["src"]
-                img_tag.attrs.clear()
-                img_tag["src"] = src_value
-            for figure in soup.find_all("figure"):
-                figure.append(BeautifulSoup("<br>", "html.parser"))
-                figure.decompose()
-            for a_tag in soup.find_all("a"):
-                if not a_tag.has_attr("href"):
-                    a_tag.unwrap()
-                    continue
-                href_value = a_tag["href"]
-                a_tag.attrs.clear()
-                a_tag["href"] = href_value
-            for br_tag in soup.find_all("br"):
-                br_tag.replace_with("\n")
-            return str(soup)
-
-        data = self.__dict__
-        data["translated_zhihu_type"] = self.zhihu_type_translate[self.zhihu_type]
-        raw_content = self.raw_content.replace("</br></br>", "\n")
-        raw_content = _html_process(raw_content)
-        data["content"] = raw_content
-        if self.zhihu_type == "status" and self.retweeted:
-            origin_pin_content = self.origin_pin_raw_content.replace("</br></br>", "\n")
-            origin_pin_content = _html_process(origin_pin_content)
-            data["origin_pin_content"] = origin_pin_content
-        self.text = short_text_template.render(data=data)
-        soup = BeautifulSoup(self.text, "html.parser")
-        soup = format_telegram_short_text(soup)
-        for h_tag in soup.find_all(["h1", "h2", "h3", "h4", "h5", "h6"]):
-            if h_tag.text != "":
-                h_tag.append(BeautifulSoup("<br>", "html.parser"))
-            h_tag.unwrap()
-        for p in soup.find_all("p"):
-            if p.text != "":
-                p.append(BeautifulSoup("<br>", "html.parser"))
-            p.unwrap()
-        self.text = (
-            str(soup)
-            .replace("<br/>", "\n")
-            .replace("<br>", "\n")
-            .replace("<br />", "")
-            .replace("<hr/>", "\n")
-        )
-        if self.text.endswith("\n"):
-            self.text = self.text[:-1]
-
-    def _zhihu_content_process(self):
-        data = self.__dict__
-        data["raw_content"] = wrap_text_into_html(
-            data["raw_content"].replace("\n", "<br>"), True
-        )
-        self.content = content_template.render(data=data)
-
-    def _parse_answer_json_data(self, data: Dict) -> Dict:
-        expression = f"""{{
-                question_id: answers."{self.answer_id}".question.id,
-                author: answers."{self.answer_id}".author.name,
-                author_url_token: answers."{self.answer_id}".author.urlToken,
-                content: answers."{self.answer_id}".content,
-                created: answers."{self.answer_id}".createdTime
-                updated: answers."{self.answer_id}".updatedTime,
-                comment_count: answers."{self.answer_id}".commentCount,
-                voteup_count: answers."{self.answer_id}".voteupCount,
-                ip_info: answers."{self.answer_id}".ipInfo
-            }}"""
-        result = jmespath.search(expression, data)
-        self.question_id = result["question_id"]
-        expression = f"""{{
-                        "title": questions."{self.question_id}".title,
-                        "question_detail": questions."{self.question_id}".detail,
-                        "answer_count": questions."{self.question_id}".answerCount,
-                        "follower_count": questions."{self.question_id}".followerCount,
-                        "question_created": questions."{self.question_id}".created,
-                        "question_updated": questions."{self.question_id}".updatedTime
-                    }}"""
-        result.update(jmespath.search(expression, data))
-        return result
-
-    def _resolve_answer_json_data(self, answer_data: Dict) -> None:
-        self.question = answer_data["question_detail"] or ""
-        self.question_date = unix_timestamp_to_utc(
-            answer_data["question_created"] or ""
-        ) or ""
-        self.question_updated = unix_timestamp_to_utc(
-            answer_data["question_updated"] or ""
-        ) or ""
-        self.question_follower_count = answer_data["follower_count"] or 0
-        self.question_answer_count = answer_data["answer_count"] or 0
-        self.title = answer_data["title"] or ""
-        self.author = answer_data["author"] or ""
-        self.author_url = (
-                                  ZHIHU_HOST + "/people/" + answer_data["author_url_token"] or ""
-                          ) or ""
-        self.raw_content = answer_data["content"] or ""
-        self.date = unix_timestamp_to_utc(answer_data["created"] or "") or ""
-        self.updated = unix_timestamp_to_utc(answer_data["updated"] or "") or ""
-        self.comment_count = answer_data["comment_count"] or 0
-        self.upvote = answer_data["voteup_count"] or 0
-        self.ip_info = answer_data["ip_info"] or ""
-
-    def _parse_article_json_data(self, data: Dict) -> Dict:
-        expression = f"""{{
-            "title": articles."{self.article_id}".title,
-            "content": articles."{self.article_id}".content,
-            "author": articles."{self.article_id}".author.name,
-            "author_url_token": articles."{self.article_id}".author.urlToken,
-            "voteup_count": articles."{self.article_id}".voteupCount,
-            "comment_count": articles."{self.article_id}".commentCount,
-            "created": articles."{self.article_id}".created,
-            "updated": articles."{self.article_id}".updated,
-            "column": articles."{self.article_id}".column.title,
-            "column_url": articles."{self.article_id}".column.url,
-            "column_intro": articles."{self.article_id}".column.intro
-        }}"""
-        result = jmespath.search(expression, data)
-        return result
-
-    @staticmethod
-    def _resolve_status_api_data(data: Dict) -> Dict:
-        result = {
-            "author": data["author"]["name"],
-            "author_url": ZHIHU_HOST + "/people/" + data["author"]["url_token"],
-            "created": data["created"],
-            "updated": data["updated"],
-            "text": None,
-            "raw_content": data["content_html"],
-            "like_count": data["like_count"],
-            "comment_count": data["comment_count"],
-            "media_files": [],
-            "origin_pin_id": None,
-        }
-        for content in data["content"]:
-            if content["type"] == "text":
-                result["text"] = content["content"]
-            elif content["type"] == "image":
-                media_item = MediaFile.from_dict(
-                    {
-                        "media_type": "image",
-                        "url": content["original_url"],
-                        "caption": "",
-                    }
-                )
-                result["media_files"].append(media_item)
-            elif content["type"] == "video":
-                media_item = MediaFile.from_dict(
-                    {
-                        "media_type": "video",
-                        "url": content["video_info"]["playlist"]["hd"]["play_url"],
-                        "caption": "",
-                    }
-                )
-                result["media_files"].append(media_item)
-        if "origin_pin" in data:
-            result["origin_pin_id"] = data["origin_pin"]["id"]
-            result["origin_pin_data"] = Zhihu._resolve_status_api_data(data["origin_pin"])
-        return result
-
-    def _parse_status_json_data(self, data: Dict) -> Dict:
-        expression = f"""{{
-                "author_url_token": pins."{self.status_id}".author,
-                "created": pins."{self.status_id}".created,
-                "updated": pins."{self.status_id}".updated,
-                "content": pins."{self.status_id}".content[0].content,
-                "pictures": pins."{self.status_id}".content[1:],
-                "like_count": pins."{self.status_id}".likeCount,
-                "comment_count": pins."{self.status_id}".commentCount,
-                "origin_pin_url": pins."{self.status_id}".originPin.url,
-                "origin_pin_author": pins."{self.status_id}".originPin.author.name,
-                "origin_pin_author_url_token": pins."{self.status_id}".originPin.author.urlToken,
-                "origin_pin_created": pins."{self.status_id}".originPin.created,
-                "origin_pin_updated": pins."{self.status_id}".originPin.updated,
-                "origin_pin_content": pins."{self.status_id}".originPin.content[0].content,
-                "origin_pin_pictures": pins."{self.status_id}".originPin.content[1:],
-                "origin_pin_like_count": pins."{self.status_id}".originPin.likeCount,
-                "origin_pin_comment_count": pins."{self.status_id}".originPin.commentCount
-                }}"""
-        result = jmespath.search(expression, data)
-        print(result)
-        author_url_token = result["author_url_token"]
-        expression = f"""{{
-                        "author": users."{author_url_token}".name
-                        }}"""
-        result.update(jmespath.search(expression, data))
-        return result
-
-    async def _get_question_id(self):
-        redirected_url = await get_redirect_url(self.url)
-        self.question_id = urlparse(redirected_url).path.split("/")[2]
-
-    def _generate_zhihu_cookie(self):
-        # TODO: a more elegant way to generate the zhihu cookie
-        pass
diff --git a/app/services/scrapers/zhihu/config.py b/app/services/scrapers/zhihu/config.py
deleted file mode 100644
index 922a18b..0000000
--- a/app/services/scrapers/zhihu/config.py
+++ /dev/null
@@ -1,23 +0,0 @@
-from app.config import ZHIHU_COOKIES_JSON
-
-SHORT_LIMIT = 600
-ZHIHU_COLUMNS_API_HOST = "https://zhuanlan.zhihu.com/api"
-ZHIHU_COLUMNS_API_HOST_V2 = "https://api.zhihu.com/article/"
-ZHIHU_API_HOST = "https://www.zhihu.com/api/v4"
-ZHIHU_API_ANSWER_PARAMS = ("include=content%2Cexcerpt%2Cauthor%2Cvoteup_count%2Ccomment_count%2Cquestion%2Ccreated_time"
-                    "%2Cquestion.detail")
-ZHIHU_HOST = "https://www.zhihu.com"
-ALL_METHODS = ["fxzhihu"]
-"""
-There are three methods to get zhihu item: from zhihu v4 api(api), a json object in the html script(json),
- or parsing the html page content directly.
- For most occasions, the api method is the best choice. But Zhihu official api only opens for status and article.
- Therefore, we must use the json method to get the answer. And if one of the above two methods fails, the get_item method
- would try to parse the html page content directly.
- You can also pass the method as a parameter when initializing the Zhihu object. If not, the default method is api.
-"""
-
-if ZHIHU_COOKIES_JSON:
-    ZHIHU_COOKIES = ';'.join(f"{cookie['name']}={cookie['value']}" for cookie in ZHIHU_COOKIES_JSON)
-else:
-    ZHIHU_COOKIES = None
diff --git a/app/services/telegram_bot/__init__.py b/app/services/telegram_bot/__init__.py
deleted file mode 100755
index 0fe696e..0000000
--- a/app/services/telegram_bot/__init__.py
+++ /dev/null
@@ -1,144 +0,0 @@
-# TODO: Implement Telegram Service
-# example: https://docs.python-telegram-bot.org/en/stable/examples.customwebhookbot.html
-import mimetypes
-
-mimetypes.init()
-
-from telegram import (
-    Update,
-    MessageEntity,
-)
-from telegram.ext import (
-    Application,
-    MessageHandler,
-    CallbackQueryHandler,
-    filters,
-    InvalidCallbackData,
-    AIORateLimiter,
-)
-
-from app.utils.logger import logger
-from app.config import (
-    TELEGRAM_BOT_TOKEN,
-    TELEGRAM_WEBHOOK_URL,
-    TELEGRAM_BOT_SECRET_TOKEN,
-    TELEBOT_API_SERVER,
-    TELEBOT_API_SERVER_FILE,
-    TELEBOT_LOCAL_FILE_MODE,
-    TELEBOT_CONNECT_TIMEOUT,
-    TELEBOT_READ_TIMEOUT,
-    TELEBOT_WRITE_TIMEOUT,
-    TELEBOT_MAX_RETRY,
-)
-
-# Re-export for external consumers
-from app.services.telegram_bot.message_sender import send_item_message  # noqa: F401
-from app.services.telegram_bot.handlers import (  # noqa: F401
-    https_url_process,
-    https_url_auto_process,
-    all_messages_process,
-    buttons_process,
-    invalid_buttons,
-    error_process,
-    content_process_function,
-)
-
-"""
-application and handlers initialization
-"""
-
-
-async def set_webhook() -> bool:
-    logger.debug(f"set_webhook: {TELEGRAM_WEBHOOK_URL}, secret_token: {TELEGRAM_BOT_SECRET_TOKEN}")
-    return await application.bot.set_webhook(
-        url=TELEGRAM_WEBHOOK_URL, secret_token=TELEGRAM_BOT_SECRET_TOKEN
-    )
-
-
-if TELEGRAM_BOT_TOKEN is not None:
-    application = (
-        Application.builder()
-        .token(TELEGRAM_BOT_TOKEN)
-        .updater(None)
-        .arbitrary_callback_data(True)
-        .connect_timeout(TELEBOT_CONNECT_TIMEOUT)
-        .read_timeout(TELEBOT_READ_TIMEOUT)
-        .write_timeout(TELEBOT_WRITE_TIMEOUT)
-        .base_url(TELEBOT_API_SERVER)
-        .base_file_url(TELEBOT_API_SERVER_FILE)
-        .local_mode(TELEBOT_LOCAL_FILE_MODE)
-        .rate_limiter(AIORateLimiter(max_retries=TELEBOT_MAX_RETRY))
-        .build()
-    )
-else:
-    logger.error("TELEGRAM_BOT_TOKEN is not set!")
-
-
-async def startup() -> None:
-    await application.initialize()
-    # initialize handlers
-    all_messages_handler = MessageHandler(
-        filters=filters.ALL,
-        callback=all_messages_process,
-    )
-    https_url_process_handler = MessageHandler(
-        filters=filters.ChatType.PRIVATE
-                & filters.Entity(MessageEntity.URL)
-                & (~filters.FORWARDED)
-                & filters.USER,
-        callback=https_url_process,
-    )
-    https_url_auto_process_handler = MessageHandler(
-        filters=(
-                        filters.ChatType.SUPERGROUP
-                        | filters.ChatType.GROUP
-                        | filters.ChatType.GROUPS
-                )
-                & filters.Entity(MessageEntity.URL)
-                & (~filters.FORWARDED)
-                & filters.USER,
-        callback=https_url_auto_process,
-    )
-    invalid_buttons_handler = CallbackQueryHandler(
-        callback=invalid_buttons,
-        pattern=InvalidCallbackData,
-    )
-    buttons_process_handler = CallbackQueryHandler(
-        callback=buttons_process, pattern=dict
-    )
-    # add handlers
-    application.add_handlers(
-        [
-            https_url_process_handler,
-            https_url_auto_process_handler,
-            all_messages_handler,
-            invalid_buttons_handler,
-            buttons_process_handler,
-        ]
-    )
-    application.add_error_handler(error_process)
-    if application.post_init:
-        await application.post_init()
-    await application.start()
-
-
-async def shutdown() -> None:
-    await application.stop()
-    if application.post_stop:
-        await application.post_stop()
-    await application.shutdown()
-    if application.post_shutdown:
-        await application.post_shutdown()
-
-
-async def process_telegram_update(
-        data: dict,
-) -> None:
-    """
-    Process telegram update, put it to the update queue.
-    :param data:
-    :return:
-    """
-    update = Update.de_json(data=data, bot=application.bot)
-    application.bot.insert_callback_data(update)
-    await application.update_queue.put(update)
diff --git a/app/services/telegram_bot/config.py b/app/services/telegram_bot/config.py
deleted file mode 100644
index 75cd5bb..0000000
--- a/app/services/telegram_bot/config.py
+++ /dev/null
@@ -1,40 +0,0 @@
-"""
-set variables for functions
-"""
-HTTPS_URL_REGEX = r"(http|https)://([\w.!@#$%^&*()_+-=])*\s*"
-
-"""
-telegram bot api constants
-"""
-TELEGRAM_SINGLE_MESSAGE_MEDIA_LIMIT = 10
-TELEGRAM_TEXT_LIMIT = 900
-TELEGRAM_FILE_UPLOAD_LIMIT = 52428800  # 50MB
-TELEGRAM_FILE_UPLOAD_LIMIT_LOCAL_API = 2147483648  # 2GB
-
-"""
-function constants
-"""
-REFERER_REQUIRED = ["douban", "weibo"]
-
-"""
-template translation(just a workaround)
-"""
-TEMPLATE_TRANSLATION = {
-    "en": {
-        "online_snapshot": "Online Snapshot",
-        "original_webpage": "Original Webpage",
-    },
-    "zh_CN": {
-        "online_snapshot": "原文备份",
-        "original_webpage": "阅读原文",
-    },
-    "zh_TW": {
-        "online_snapshot": "原文備份",
-        "original_webpage": "閱讀原文",
-    },
-}
-
-
-def template_translation(key: str, language: str = "zh_CN") -> str:
-    lang_dict = TEMPLATE_TRANSLATION.get(language, TEMPLATE_TRANSLATION["zh_CN"])
-    return lang_dict.get(key, key)
diff --git a/app/services/telegram_bot/handlers.py b/app/services/telegram_bot/handlers.py
deleted file mode 100644
index 73bd5b9..0000000
--- a/app/services/telegram_bot/handlers.py
+++ /dev/null
@@ -1,359 +0,0 @@
-import html
-import json
-import traceback
-
-from telegram import (
-    Update,
-    MessageEntity,
-    InlineKeyboardButton,
-    InlineKeyboardMarkup,
-)
-from telegram.constants import ParseMode
-from telegram.ext import (
-    CallbackContext,
-    ContextTypes,
-)
-
-from app.database import save_instances
-from app.models.metadata_item import MessageType
-from app.models.telegram_chat import TelegramMessage, TelegramUser, TelegramChat
-from app.models.url_metadata import UrlMetadata
-from app.services.scrapers.common import InfoExtractService
-from app.services.telegram_bot.message_sender import send_item_message
-from app.utils.parse import get_url_metadata
-from app.utils.config import SOCIAL_MEDIA_WEBSITE_PATTERNS, VIDEO_WEBSITE_PATTERNS
-from app.utils.logger import logger
-from app.config import (
-    TELEGRAM_CHANNEL_ID,
-    TELEGRAM_CHANNEL_ADMIN_LIST,
-    TELEBOT_DEBUG_CHANNEL,
-    TELEGRAM_GROUP_MESSAGE_BAN_LIST,
-    TELEGRAM_BOT_MESSAGE_BAN_LIST,
-    FILE_EXPORTER_ON,
-    OPENAI_API_KEY,
-    DATABASE_ON,
-    GENERAL_SCRAPING_ON,
-)
-
-
-async def content_process_function(url_metadata: UrlMetadata, **kwargs) -> dict:
-    item = InfoExtractService(url_metadata, **kwargs)
-    metadata_item = await item.get_item()
-    return metadata_item
-
-
-async def https_url_process(update: Update, context: CallbackContext) -> None:
-    message = update.message
-    welcome_message = await message.reply_text(
-        text="Processing...",
-    )
-    url_dict: dict = message.parse_entities(types=["url"])
-    await welcome_message.delete()
-    for i, url in enumerate(url_dict.values()):
-        process_message = await message.reply_text(
-            text=f"Processing the {i + 1}th url...",
-        )
-        url_metadata = await get_url_metadata(url, ban_list=TELEGRAM_BOT_MESSAGE_BAN_LIST)
-        if url_metadata.source == "banned":
-            await process_message.edit_text(
-                text=f"For the {i + 1} th url, the url is banned."
-            )
-            return
-        if url_metadata.source == "unknown":
-            if GENERAL_SCRAPING_ON:
-                await process_message.edit_text(
-                    text=f"Uncategorized url found. General webpage parser is on, Processing..."
-                )
-                metadata_item = await content_process_function(url_metadata=url_metadata)
-                await send_item_message(
-                    metadata_item, chat_id=message.chat_id
-                )
-            await process_message.edit_text(
-                text=f"For the {i + 1} th url, no supported url found."
-            )
-            return
-        else:
-            await process_message.edit_text(
-                text=f"{url_metadata.source} url found. Processing..."
-            )
-            # create the inline keyboard
-            special_function_keyboard = []
-            basic_function_keyboard = []
-            if TELEGRAM_CHANNEL_ID and (
-                    TELEGRAM_CHANNEL_ADMIN_LIST
-                    and str(message.from_user.id) in TELEGRAM_CHANNEL_ADMIN_LIST
-            ):
-                special_function_keyboard.append(
-                    InlineKeyboardButton(
-                        "Send to Channel",
-                        callback_data={
-                            "type": "channel",
-                            "metadata": url_metadata,
-                            "extra_args": {"store_document": True},
-                        },
-                    ),
-                )
-            # video content url buttons
-            if url_metadata.content_type == "video":
-                basic_function_keyboard.extend(
-                    [
-                        InlineKeyboardButton(
-                            "Get Info",
-                            callback_data={
-                                "type": "video",
-                                "metadata": url_metadata,
-                                "extra_args": {"download": False},
-                            },
-                        ),
-                        InlineKeyboardButton(
-                            "Download",
-                            callback_data={
-                                "type": "video",
-                                "metadata": url_metadata,
-                            },
-                        ),
-                    ]
-                )
-                if FILE_EXPORTER_ON:
-                    special_function_keyboard.extend(
-                        [
-                            InlineKeyboardButton(
-                                "Audio Only",
-                                callback_data={
-                                    "type": "video",
-                                    "metadata": url_metadata,
-                                    "extra_args": {
-                                        "audio_only": True,
-                                    },
-                                },
-                            ),
-                            InlineKeyboardButton(
-                                "Download HD",
-                                callback_data={
-                                    "type": "video",
-                                    "metadata": url_metadata,
-                                    "extra_args": {"hd": True},
-                                },
-                            ),
-                        ]
-                    )
-                    if OPENAI_API_KEY:
-                        special_function_keyboard.append(
-                            InlineKeyboardButton(
-                                "Transcribe Text",
-                                callback_data={
-                                    "type": "video",
-                                    "metadata": url_metadata,
-                                    "extra_args": {
-                                        "audio_only": True,
-                                        "transcribe": True,
-                                        "store_document": True,
-                                    },
-                                },
-                            ),
-                        )
-            elif url_metadata.content_type == "social_media":
-                basic_function_keyboard.extend(
-                    [
-                        InlineKeyboardButton(
-                            "Send to Me",
-                            callback_data={"type": "private", "metadata": url_metadata},
-                        ),
-                        InlineKeyboardButton(
-                            "Force Send in Chat",
-                            callback_data={"type": "force", "metadata": url_metadata},
-                        ),
-                    ]
-                )
-                if FILE_EXPORTER_ON:
-                    special_function_keyboard.append(
-                        InlineKeyboardButton(
-                            "Send with PDF",
-                            callback_data={
-                                "type": "pdf",
-                                "metadata": url_metadata,
-                                "extra_args": {"store_document": True},
-                            },
-                        ),
-                    )
-            basic_function_keyboard.append(
-                InlineKeyboardButton(
-                    "Cancel",
-                    callback_data={"type": "cancel"},
-                ),
-            )
-            keyboard = [
-                special_function_keyboard,
-                basic_function_keyboard,
-            ]
-            reply_markup = InlineKeyboardMarkup(keyboard)
-            await process_message.reply_text(
-                f"For the {i + 1}th url: {url}, please choose the function you want to use:",
-                reply_markup=reply_markup,
-            )
-            await process_message.delete()
-
-
-async def https_url_auto_process(update: Update, context: CallbackContext) -> None:
-    message = update.message
-    url_dict = message.parse_entities(types=["url"])
-    for i, url in enumerate(url_dict.values()):
-        url_metadata = await get_url_metadata(
-            url, ban_list=TELEGRAM_GROUP_MESSAGE_BAN_LIST
-        )
-        if url_metadata.source == "unknown" and GENERAL_SCRAPING_ON:
-            metadata_item = await content_process_function(url_metadata=url_metadata)
-            await send_item_message(
-                metadata_item, chat_id=message.chat_id, message=message
-            )
-        elif url_metadata.source == "unknown" or url_metadata.source == "banned":
-            logger.debug(f"for the {i + 1}th url {url}, no supported url found.")
-            return
-        if url_metadata.to_dict().get("source") in SOCIAL_MEDIA_WEBSITE_PATTERNS.keys():
-            metadata_item = await content_process_function(url_metadata=url_metadata)
-            await send_item_message(
-                metadata_item, chat_id=message.chat_id, message=message
-            )
-        if url_metadata.to_dict().get("source") in VIDEO_WEBSITE_PATTERNS.keys():
-            metadata_item = await content_process_function(url_metadata=url_metadata)
-            await send_item_message(
-                metadata_item, chat_id=message.chat_id, message=message
-            )
-
-
-async def all_messages_process(update: Update, context: CallbackContext) -> None:
-    message = update.message
-    logger.debug(message)
-    if message and DATABASE_ON:
-        telegram_chat = TelegramChat.construct(**message.chat.to_dict())
-        telegram_user = TelegramUser.construct(**message.from_user.to_dict())
-        telegram_message = TelegramMessage(
-            datetime=message.date,
-            chat=telegram_chat,
-            user=telegram_user,
-            text=message.text or "",
-        )
-        await save_instances(telegram_message)
-
-
-async def buttons_process(update: Update, context: CallbackContext) -> None:
-    from app.services.telegram_bot import application
-
-    query = update.callback_query
-    data = query.data
-    chat_id = None
-    if data["type"] == "cancel":
-        await query.answer("Canceled")
-    else:
-        if data["type"] == "private" or data["type"] == "force":
-            await query.answer("Sending to you...")
-        if data["type"] == "channel":
-            if data.get("channel_id") or len(TELEGRAM_CHANNEL_ID) == 1:
-                channel_chat = await application.bot.get_chat(
-                    chat_id=data.get("channel_id")
-                    if data.get("channel_id")
-                    else TELEGRAM_CHANNEL_ID[0]
-                )
-                await query.answer("Sending to channel...")
-                if channel_chat.type == "channel":
-                    chat_id = channel_chat.id
-                else:
-                    await query.message.reply_text(
-                        text="Sorry, the provided channel id does not exist or is not a channel."
-                    )
-                    chat_id = query.message.chat_id
-            elif len(TELEGRAM_CHANNEL_ID) > 1:
-                choose_channel_keyboard = await _create_choose_channel_keyboard(
-                    data=data
-                )
-                await query.message.reply_text(
-                    text="Please choose the channel you want to send:",
-                    reply_markup=InlineKeyboardMarkup(choose_channel_keyboard),
-                )
-                await query.message.delete()
-                context.drop_callback_data(query)
-                return
-        else:
-            chat_id = query.message.chat_id
-        if data["type"] == "video":
-            await query.answer("Video processing...")
-        replying_message = await query.message.reply_text(
-            text=f"Item processing...",
-        )
-        extra_args = data["extra_args"] if "extra_args" in data else {}
-        metadata_item = await content_process_function(
-            url_metadata=data["metadata"], **extra_args
-        )
-        await replying_message.edit_text(
-            text=f"Item processed. Sending to the target...",
-        )
-        if data["type"] == "force":
-            metadata_item["message_type"] = MessageType.SHORT
-        await send_item_message(metadata_item, chat_id=chat_id)
-        if data["type"] == "channel":
-            await query.message.reply_text(
-                text=f"Item sent to the channel.",
-            )
-        await replying_message.delete()
-    await query.message.delete()
-    context.drop_callback_data(query)
-
-
-async def _create_choose_channel_keyboard(data: dict) -> list:
-    from app.services.telegram_bot import application
-
-    choose_channel_keyboard = []
-    for i, channel_id in enumerate(TELEGRAM_CHANNEL_ID):
-        channel_chat = await application.bot.get_chat(chat_id=channel_id)
-        choose_channel_keyboard.append(
-            [
-                InlineKeyboardButton(
-                    channel_chat.title,
-                    callback_data={
-                        "type": "channel",
-                        "metadata": data["metadata"],
-                        "extra_args": data["extra_args"],
-                        "channel_id": channel_id,
-                    },
-                )
-            ]
-        )
-    choose_channel_keyboard.append(
-        [
-            InlineKeyboardButton(
-                "Cancel",
-                callback_data={"type": "cancel"},
-            )
-        ]
-    )
-    return choose_channel_keyboard
-
-
-async def invalid_buttons(update: Update, context: CallbackContext) -> None:
-    await update.callback_query.answer("Invalid button!")
-    await update.effective_message.edit_text(
-        "Sorry, Error Occurred, I could not process this button click 😕."
-    )
-
-
-async def error_process(update: object, context: ContextTypes.DEFAULT_TYPE) -> None:
-    logger.error("Exception while handling an update:", exc_info=context.error)
-    tb_list = traceback.format_exception(
-        None, context.error, context.error.__traceback__
-    )
-    tb_string = "".join(tb_list)
-    update_str = update.to_dict() if isinstance(update, Update) else str(update)
-    message = (
-        f"An exception was raised while handling an update\n"
-        f"<pre>update = {html.escape(json.dumps(update_str, indent=2, ensure_ascii=False))}"
-        "</pre>\n\n"
-        f"<pre>context.chat_data = {html.escape(str(context.chat_data))}</pre>\n\n"
-        f"<pre>context.user_data = {html.escape(str(context.user_data))}</pre>\n\n"
-        f"<pre>{html.escape(tb_string)}</pre>"
-    )
-    debug_chat_id = update.message.chat_id
-    if TELEBOT_DEBUG_CHANNEL is not None:
-        debug_chat_id = TELEBOT_DEBUG_CHANNEL
-    await context.bot.send_message(
-        chat_id=debug_chat_id, text=message, parse_mode=ParseMode.HTML
-    )
diff --git a/app/services/telegram_bot/message_sender.py b/app/services/telegram_bot/message_sender.py
deleted file mode 100644
index 8b60f8f..0000000
--- a/app/services/telegram_bot/message_sender.py
+++ /dev/null
@@ -1,345 +0,0 @@
-import asyncio
-import os
-import traceback
-from io import BytesIO
-from urllib.parse import urlparse
-from urllib.request import url2pathname
-from typing import Union
-
-import aiofiles
-from telegram import (
-    Message,
-    InputMediaPhoto,
-    InputMediaVideo,
-    InputMediaDocument,
-    InputMediaAnimation,
-    InputMediaAudio,
-)
-from telegram.constants import ParseMode
-
-from app.models.metadata_item import MessageType
-from app.models.classes import NamedBytesIO
-from app.utils.parse import telegram_message_html_trim
-from app.utils.network import download_file_by_metadata_item
-from app.utils.image import Image, image_compressing, check_image_type
-from app.utils.logger import logger
-from app.config import (
-    TELEBOT_API_SERVER,
-    TELEBOT_WRITE_TIMEOUT,
-    TELEGRAM_IMAGE_DIMENSION_LIMIT,
-    TELEGRAM_IMAGE_SIZE_LIMIT,
-    JINJA2_ENV,
-    TEMPLATE_LANGUAGE,
-)
-from app.services.telegram_bot.config import (
-    TELEGRAM_SINGLE_MESSAGE_MEDIA_LIMIT,
-    TELEGRAM_FILE_UPLOAD_LIMIT,
-    TELEGRAM_FILE_UPLOAD_LIMIT_LOCAL_API,
-    TEMPLATE_TRANSLATION,
-)
-
-environment = JINJA2_ENV
-template = environment.get_template("social_media_message.jinja2")
-template_text = TEMPLATE_TRANSLATION.get(
-    TEMPLATE_LANGUAGE, TEMPLATE_TRANSLATION["zh_CN"]
-)
-
-
-def _get_application():
-    """Lazy import to avoid circular dependency."""
-    from app.services.telegram_bot import application
-    return application
-
-
-async def send_item_message(
-        data: dict, chat_id: Union[int, str] = None, message: Message = None
-) -> None:
-    """
-    :param data: (dict) metadata of the item
-    :param chat_id: (int) any chat id for sending
-    :param message: (Message) any message to reply
-    :return:
-    """
-    application = _get_application()
-    logger.debug(f"send_item_message: {data}, {chat_id}, {message}")
-    if not chat_id and not message:
-        raise ValueError("must provide chat_id or message")
-    if (
-            not chat_id
-    ) and message:  # this function supports direct reply to a message even if the chat_id is None
-        chat_id = message.chat.id
-    discussion_chat_id = chat_id
-    the_chat = await application.bot.get_chat(chat_id=chat_id)
-    logger.debug(f"the chat of sending message: {the_chat}")
-    if the_chat.type == "channel" and the_chat.linked_chat_id:
-        discussion_chat_id = the_chat.linked_chat_id
-    try:
-        caption_text = message_formatting(data)
-        if len(data["media_files"]) > 0:
-            # if the message type is short and there are some media files, send media group
-            reply_to_message_id = None
-            media_message_group, file_message_group = await media_files_packaging(
-                media_files=data["media_files"], data=data
-            )
-            if (
-                    len(media_message_group) > 0
-            ):  # if there are some media groups to send, send it
-                for i, media_group in enumerate(media_message_group):
-                    caption_text = (
-                        caption_text
-                        if i == 0
-                        else f"the {i + 1}th part of the media item:"
-                    )
-                    logger.debug(f"media group: {media_group}")
-                    logger.debug(
-                        f"caption text: {caption_text},length={len(caption_text)}"
-                    )
-                    sent_media_files_message = await application.bot.send_media_group(
-                        chat_id=chat_id,
-                        media=media_group,
-                        parse_mode=ParseMode.HTML,
-                        caption=caption_text,
-                        write_timeout=TELEBOT_WRITE_TIMEOUT,
-                        reply_to_message_id=message.message_id if message else None,
-                    )
-                    if sent_media_files_message is tuple:
-                        reply_to_message_id = sent_media_files_message[0].message_id
-                    elif sent_media_files_message is Message:
-                        reply_to_message_id = sent_media_files_message.message_id
-                    logger.debug(f"sent media files message: {sent_media_files_message}")
-            else:
-                sent_message = await application.bot.send_message(
-                    chat_id=chat_id,
-                    text=caption_text,
-                    parse_mode=ParseMode.HTML,
-                    reply_to_message_id=message.message_id if message else None,
-                    disable_web_page_preview=True
-                    if data["message_type"] == MessageType.SHORT
-                    else False,
-                    disable_notification=True,
-                )
-            if discussion_chat_id != chat_id:
-                await asyncio.sleep(
-                    3
-                )  # wait for several seconds to avoid missing the target message
-                # if the chat is a channel, get the latest pinned message from the channel and reply to it
-                group_chat = await application.bot.get_chat(chat_id=discussion_chat_id)
-                logger.debug(f"the group chat: {group_chat}")
-                pinned_message = group_chat.pinned_message
-                logger.debug(f"the pinned message: {pinned_message}")
-                if len(media_message_group) > 0:
-                    if (
-                            pinned_message.forward_origin.message_id
-                            == sent_media_files_message[-1].message_id
-                    ):
-                        reply_to_message_id = (
-                                group_chat.pinned_message.id
-                                - len(sent_media_files_message)
-                                + 1
-                        )
-                    else:
-                        reply_to_message_id = group_chat.pinned_message.id + 1
-                elif pinned_message.forward_origin.message_id == sent_message.message_id:
-                    reply_to_message_id = group_chat.pinned_message.id
-                else:
-                    reply_to_message_id = group_chat.pinned_message.id + 1
-            if (
-                    len(file_message_group) > 0
-            ):  # to send files, the files messages should be replied to the message sent before
-                logger.debug(f"reply_to_message_id: {reply_to_message_id}")
-                for file_group in file_message_group:
-                    logger.debug(f"file group: {file_group}")
-                    await application.bot.send_media_group(
-                        chat_id=discussion_chat_id,
-                        media=file_group,
-                        reply_to_message_id=reply_to_message_id,
-                        parse_mode=ParseMode.HTML,
-                        disable_notification=True,
-                    )
-        else:
-            await application.bot.send_message(
-                chat_id=chat_id,
-                text=caption_text,
-                parse_mode=ParseMode.HTML,
-                reply_to_message_id=message.message_id if message else None,
-                disable_web_page_preview=True
-                if data["message_type"] == "short"
-                else False,
-                disable_notification=True,
-            )
-    except Exception as e:
-        logger.error(e)
-        traceback.print_exc()
-        await send_debug_channel(traceback.format_exc())
-
-
-async def send_debug_channel(message: str) -> None:
-    from app.config import TELEBOT_DEBUG_CHANNEL
-    application = _get_application()
-    if TELEBOT_DEBUG_CHANNEL is not None:
-        await application.bot.send_message(
-            chat_id=TELEBOT_DEBUG_CHANNEL, text=message, parse_mode=ParseMode.HTML
-        )
-
-
-def message_formatting(data: dict) -> str:
-    """
-    Format the message to be sent to the user.
-    :param data:
-    :return: text (str) the formatted text for telegram bot api sending message.
-    """
-    if data["message_type"] == "short":
-        data["text"] = telegram_message_html_trim(data["text"])
-    message_template = template
-    text = message_template.render(data=data, template_text=template_text)
-    logger.debug(f"message text: \n{text}")
-    return text
-
-
-async def media_files_packaging(media_files: list, data: dict) -> tuple:
-    """
-    Download the media files from data["media_files"] and package them into a list of media group or file group for
-    sending them by send_media_group method or send_document method.
-    :param data: (dict) metadata of the item
-    :param media_files: (list) a list of media files,
-    :return: (tuple) a tuple of media group and file group
-        media_message_group: (list) a list of media items, the type of each item is InputMediaPhoto or InputMediaVideo
-        file_group: (list) a list of file items, the type of each item is InputFile
-    TODO: It's not a good practice for this function. This method will still download all the media files even when
-        media files are too large and it can be memory consuming even if we use a database to store the media files.
-        The function should be optimized to resolve the media files one group by one group and send each group
-        immediately after it is resolved.
-        This processing method should be optimized in the future.
-    """
-    media_counter, file_counter = 0, 0
-    media_message_group, media_group, file_message_group, file_group = [], [], [], []
-    for (
-            media_item
-    ) in media_files:  # To traverse all media items in the media files list
-        # check if we need to create a new media group
-        if media_counter == TELEGRAM_SINGLE_MESSAGE_MEDIA_LIMIT:
-            # the limitation of media item for a single telegram media group message is 10
-            media_message_group.append(media_group)
-            media_group = []
-            media_counter = 0
-        if file_counter == TELEGRAM_SINGLE_MESSAGE_MEDIA_LIMIT:
-            # the limitation of media item for a single telegram media group message is 10
-            file_message_group.append(file_group)
-            file_group = []
-            file_counter = 0
-        if not (
-                media_item["media_type"] in ["image", "gif", "video"]
-                and data["message_type"] == "long"
-        ):
-            # check the url validity
-            url_parser = urlparse(media_item["url"])
-            if url_parser.scheme in [
-                "http",
-                "https",
-            ]:  # if the url is a http url, download the file
-                file_format = "mp4" if media_item["media_type"] == "video" else None
-                io_object = await download_file_by_metadata_item(
-                    media_item["url"], data=data, file_format=file_format
-                )
-                filename = io_object.name
-                file_size = io_object.size
-            else:  # if the url is a local file path, just add it to the media group
-                try:
-                    file_path = url2pathname(media_item["url"])
-                    async with aiofiles.open(file_path, mode="rb") as f:
-                        filename = os.path.basename(file_path)
-                        content = await f.read()
-                        io_object = NamedBytesIO(content=content, name=filename)
-                    file_size = io_object.size
-                except Exception as e:  # the url is not a valid file path
-                    logger.error(e)
-                    continue
-            # check the file size
-            if (
-                    not TELEBOT_API_SERVER
-            ):  # the official telegram bot api server only supports 50MB file
-                if file_size > TELEGRAM_FILE_UPLOAD_LIMIT:
-                    # if the size is over 50MB, skip this file
-                    continue
-            else:
-                if file_size > TELEGRAM_FILE_UPLOAD_LIMIT_LOCAL_API:
-                    # for local api sever, if the size is over 2GB, skip this file
-                    continue
-            # check media files' type and process them by their type
-            if media_item["media_type"] == "image":
-                image_url = media_item["url"]
-                ext = await check_image_type(io_object)
-                # jpg to jpeg, ignore case
-                if ext.lower() == "jpg":
-                    ext = "JPEG"
-                io_object.seek(0)
-                image = Image.open(io_object, formats=[ext])
-                img_width, img_height = image.size
-                ratio = float(max(img_height, img_width)) / float(
-                    min(img_height, img_width)
-                )
-                # don't try to resize image if the ratio is too large
-                if (
-                        ratio < 5
-                        or max(img_height, img_width) < TELEGRAM_IMAGE_DIMENSION_LIMIT
-                ):
-                    image = image_compressing(image, TELEGRAM_IMAGE_DIMENSION_LIMIT)
-                    with BytesIO() as buffer:
-                        # mime_type file format
-                        image.save(buffer, format=ext)
-                        buffer.seek(0)
-                        resized_ratio = max(image.height, image.width) / min(
-                            image.height, image.width
-                        )
-                        logger.debug(
-                            f"resized image size: {buffer.getbuffer().nbytes}, ratio: {resized_ratio}, width: {image.width}, height: {image.height}"
-                        )
-                        media_group.append(InputMediaPhoto(buffer, filename=filename))
-                # the image is not able to get json serialized
-                logger.debug(
-                    f"image size: {file_size}, ratio: {ratio}, width: {img_width}, height: {img_height}"
-                )
-                if (
-                        file_size > TELEGRAM_IMAGE_SIZE_LIMIT
-                        or img_width > TELEGRAM_IMAGE_DIMENSION_LIMIT
-                        or img_height > TELEGRAM_IMAGE_DIMENSION_LIMIT
-                ) and data["category"] not in ["xiaohongshu"]:
-                    io_object = await download_file_by_metadata_item(
-                        url=image_url, data=data
-                    )
-                    if not io_object.name.endswith(".gif"):
-                        if not io_object.name.endswith(ext.lower()):
-                            io_object.name = io_object.name + "." + ext.lower()
-                        # TODO: it is not a good way to judge whether it is a gif...
-                        file_group.append(
-                            InputMediaDocument(io_object, parse_mode=ParseMode.HTML)
-                        )
-                        file_counter += 1
-            elif media_item["media_type"] == "gif":
-                io_object = await download_file_by_metadata_item(
-                    url=media_item["url"],
-                    data=data,
-                    file_name="gif_image-" + str(media_counter) + ".gif",
-                )
-                io_object.name = io_object.name + ".gif"
-                media_group.append(InputMediaAnimation(io_object))
-            elif media_item["media_type"] == "video":
-                media_group.append(InputMediaVideo(io_object, supports_streaming=True))
-            # TODO: not have any services to store audio files for now, just a placeholder
-            elif media_item["media_type"] == "audio":
-                media_group.append(InputMediaAudio(io_object))
-            elif media_item["media_type"] == "document":
-                file_group.append(
-                    InputMediaDocument(io_object, parse_mode=ParseMode.HTML)
-                )
-                file_counter += 1
-            media_counter += 1
-            logger.info(
-                f"get the {media_counter}th media item,type: {media_item['media_type']}, url: {media_item['url']}"
-            )
-    # check if the media group is empty, if it is, return None
-    if len(media_group) > 0:  # append the last media group
-        media_message_group.append(media_group)
-    if len(file_group) > 0:
-        file_message_group.append(file_group)
-    return media_message_group, file_message_group
diff --git a/app/services/telegraph/__init__.py b/app/services/telegraph/__init__.py
deleted file mode 100644
index 1b2995d..0000000
--- a/app/services/telegraph/__init__.py
+++ /dev/null
@@ -1,74 +0,0 @@
-# TODO: copy the html-to-telegraph package and modify it to fit the asynchronous model
-import random
-import traceback
-from typing import Any
-
-from html_telegraph_poster_v2.async_poster import (
-    AsyncTelegraphPoster,
-)
-from html_telegraph_poster_v2.async_poster.utils import DocumentPreprocessor
-
-from app.config import TELEGRAPH_TOKEN_LIST
-from app.models.telegraph_item import TelegraphItem, from_str
-from app.utils.logger import logger
-
-
-class Telegraph(TelegraphItem):
-    def __init__(
-        self,
-        title: str,
-        url: str,
-        author: str,
-        author_url: str,
-        category: str,
-        content: str,
-    ):
-        self.telegraph = AsyncTelegraphPoster(use_api=True)
-        self.title = title
-        self.url = url
-        self.author = author
-        self.author_url = author_url
-        self.category = category
-        self.content = content
-
-    @staticmethod
-    def from_dict(obj: Any) -> "Telegraph":
-        assert isinstance(obj, dict)
-        title = from_str(obj.get("title"))
-        url = from_str(obj.get("url"))
-        author = from_str(obj.get("author"))
-        author_url = from_str(obj.get("author_url"))
-        category = from_str(obj.get("category"))
-        content = from_str(obj.get("content"))
-        return Telegraph(title, url, author, author_url, category, content)
-
-    async def get_telegraph(self, upload_images: bool = True) -> str:
-        try:
-            if upload_images:
-                temp_html = DocumentPreprocessor(self.content, url=self.url)
-                logger.info("Telegraph: Uploading images to telegraph...")
-                await temp_html.upload_all_images()
-                self.content = temp_html.get_processed_html()
-            logger.info("Telegraph: Uploading to telegraph...")
-            if not TELEGRAPH_TOKEN_LIST:
-                await self.telegraph.create_api_token(
-                    short_name=self.author[0:14], author_name=self.author
-                )
-            else:
-                random_token = random.choice(TELEGRAPH_TOKEN_LIST)
-                await self.telegraph.set_token(random_token)
-
-            telegraph_post = await self.telegraph.post(
-                title=self.title,
-                author=self.author,
-                author_url=self.author_url,
-                text=self.content,
-            )
-            logger.info(
-                f"Telegraph: Uploaded to telegraph. Link: {telegraph_post['url']}"
-            )
-            telegraph_url = telegraph_post["url"]
-            return telegraph_url
-        except Exception as e:
-            traceback.print_exc()
-            return ""
diff --git a/app/templates/bluesky_content.jinja2 b/app/templates/bluesky_content.jinja2
deleted file mode 100644
index b987047..0000000
--- a/app/templates/bluesky_content.jinja2
+++ /dev/null
@@ -1,19 +0,0 @@
-<p><a href="{{ data.url }}">@{{ data.author }}</a>: </p>
-<p>created at {{ data.created_at }}</p>
-{#<p>Comments: {{ data.comments_count }} Likes: {{ data.likes_count }}</p>#}
-{{ data.html_content_text }}
-{% for media_file in data.media_files %}
-    {% if media_file.type == "image" %}
-        <img src="{{ media_file.url }}" alt="{{ media_file.caption }}" />
-    {% elif media_file.type == "video" %}
-        <video controls>
-            <source src="{{ media_file.url }}" type="video/mp4">
-            Your browser does not support the video tag.
-        </video>
-    {% endif %}
-{% endfor %}
-{% if data.retweet_post %}
-    <p>Repost:</p>
-    {{ data.retweet_post.content }}
-{% endif %}
-<hr>
\ No newline at end of file
diff --git a/app/templates/bluesky_telegram_text.jinja2 b/app/templates/bluesky_telegram_text.jinja2
deleted file mode 100644
index 73bfe84..0000000
--- a/app/templates/bluesky_telegram_text.jinja2
+++ /dev/null
@@ -1 +0,0 @@
-<a href="{{ data.url }}">@{{ data.author }}</a>：{{ data.text }}
diff --git a/app/templates/douban_content.jinja2 b/app/templates/douban_content.jinja2
deleted file mode 100644
index 00b7c1d..0000000
--- a/app/templates/douban_content.jinja2
+++ /dev/null
@@ -1,5 +0,0 @@
-{% if data.douban_type.value == 'group' %}
-    <p>作者：<a href="{{data.author_url}}">{{data.author}}</a></p>
-    <p>来自<a href="{{ data.group_url }}">{{data.group_name}}</a></p>
-{% endif %}
-{{ data.raw_content }}
\ No newline at end of file
diff --git a/app/templates/douban_short_text.jinja2 b/app/templates/douban_short_text.jinja2
deleted file mode 100644
index 9af5380..0000000
--- a/app/templates/douban_short_text.jinja2
+++ /dev/null
@@ -1,11 +0,0 @@
-{% if data.douban_type.value == 'note' %}
-<a href="{{ data.author }}">{{ data.author_url }}</a>的豆瓣日记：<a href="{{ data.url }}"><b>{{ data.title }}</b></a>
-{% elif data.douban_type.value == 'group' %}
-<a href="{{ data.group_url }}">{{ data.group_name }}</a>：
-<a href="{{ data.url }}"><b>{{ data.title }}</b></a>
-{% elif data.douban_type.value == 'status' %}
-<a href="{{data.url}}"><b>{{ data.title }}</b></a>：
-{% elif data.douban_type.value in ['movie_review','book_review'] %}
-<a href="{{ data.author }}">{{ data.author_url }}</a>对<a href="{{ data.item_url }}">{{ data.item_title }}</a>的{{ data.item_type }}：
-<a href="{{ data.url }}"><b>{{ data.title }}</b></a>
-{% endif %}{{ data.short_text }}
\ No newline at end of file
diff --git a/app/templates/reddit_content.jinja2 b/app/templates/reddit_content.jinja2
deleted file mode 100644
index 0292434..0000000
--- a/app/templates/reddit_content.jinja2
+++ /dev/null
@@ -1,7 +0,0 @@
-<h2><a href="{{ data.url }}">{{ data.title }}</a></h2>
-
-<p>From <a href="{{ data.subreddit_url }}">{{ data.subreddit }}</a><a href="{{ data.author_url }}">{{ author }}</a> created at {{ data.created }}</p>
-
-<p>Comments: {{ data.comments_count }} Score: {{ data.score }} Upvote ratio: {{ data.upvote_ratio }}</p>
-
-{{ data.content }}
\ No newline at end of file
diff --git a/app/templates/reddit_short_text.jinja2 b/app/templates/reddit_short_text.jinja2
deleted file mode 100644
index 1671e87..0000000
--- a/app/templates/reddit_short_text.jinja2
+++ /dev/null
@@ -1,3 +0,0 @@
-<a href="{{ data.url }}"><b>{{ data.title }}</b></a>
-From <a href="{{ data.subreddit_url }}">{{ data.subreddit_name_prefixed }}</a> - <a href="{{ data.author_url }}">{{ data.author }}</a>
-{{ data.text }}
\ No newline at end of file
diff --git a/app/templates/social_media_message.jinja2 b/app/templates/social_media_message.jinja2
deleted file mode 100644
index d3319b0..0000000
--- a/app/templates/social_media_message.jinja2
+++ /dev/null
@@ -1,32 +0,0 @@
-{# templates/social_media_message.html #}
-
-{% if data.message_type == "short" %}
-   {% if data.title and data.url and data.category in ['other','unknown'] %}
-<a href="{{ data.url }}">
-<b>{{ data.title }}</b>
-</a>
-   {% endif %}
-{{ data.text }}
-    {% if data.category in ['youtube', 'bilibili'] %}
-    {% endif %}
-
-#{{ data.category }}
-{% if data.telegraph_url %}
-<a href="{{ data.telegraph_url }}">{{ template_text.online_snapshot }}</a>
-{% endif %}
-{% else %}
-    {# title #}
-    {% if data.category in ['youtube', 'bilibili'] %}
-        <a href="{{ data.url }}">
-            <b>{{ data.title }}</b>
-        </a>
-    {% else %}<a href="{{ data.telegraph_url }}"><b>{{ data.title }}</b></a>{% endif %}
-
-via #{{ data.category }} - <a href="{{ data.author_url }}">{{ data.author }}</a>
-    {# the message, which is from inoreader comment or telegram bot comment function (todo) #}
-    {% if data.message %}{{ data.message }}
-    {% endif %}
-    {% if data.message_type == "long" %}<a href="{{ data.url }}">{{ template_text.original_webpage }}</a>{% endif %}
-{% endif %}
-
-{# the original page function only supports long type item #}
\ No newline at end of file
diff --git a/app/templates/video_info.jinja2 b/app/templates/video_info.jinja2
deleted file mode 100644
index 60e8fa0..0000000
--- a/app/templates/video_info.jinja2
+++ /dev/null
@@ -1,6 +0,0 @@
-<a href="{{ data.url }}"><b>{{ data.title }}</b></a>
-作者：<a href="{{ data.author_url }}">{{ data.author }}</a>
-视频时长：{{ data.duration }}
-视频上传日期：{{ data.created }}
-播放数据：{{ data.playback_data }}
-视频简介：{{ data.description }}
diff --git a/app/templates/weibo_content.jinja2 b/app/templates/weibo_content.jinja2
deleted file mode 100644
index 3e12141..0000000
--- a/app/templates/weibo_content.jinja2
+++ /dev/null
@@ -1,11 +0,0 @@
-<p>发布于{{ data.date }}</p>
-{% if data.source %}
-<p>通过{{ data.source }}发布</p>
-{% endif %}
-<p>转发：{{ data.reposts_count }} 评论：{{ data.comments_count }} 点赞：{{ data.attitudes_count }}
-{% if data.region_name %}
-来自{{ data.region_name }}
-{% endif %}
-</p>
-<p><a href="{{ data.author_url }}">@{{ data.author }}</a>：</p>
-{{ data.raw_content }}
\ No newline at end of file
diff --git a/app/templates/weibo_short_text.jinja2 b/app/templates/weibo_short_text.jinja2
deleted file mode 100644
index 377215e..0000000
--- a/app/templates/weibo_short_text.jinja2
+++ /dev/null
@@ -1,5 +0,0 @@
-<a href="{{ data.url }}">@{{ data.author }}</a>：{{ data.raw_content }}
-{% if data.retweeted_info %}
-
-<a href="{{ data.retweeted_info.url }}">@{{ data.retweeted_info.author }}</a>：{{ data.raw_content }}
-{% endif %}
\ No newline at end of file
diff --git a/app/templates/xiaohongshu_content.jinja2 b/app/templates/xiaohongshu_content.jinja2
deleted file mode 100644
index d26fbed..0000000
--- a/app/templates/xiaohongshu_content.jinja2
+++ /dev/null
@@ -1,10 +0,0 @@
-<h2>{{ data.title }}</h2>
-<p>作者：<a href="{{ author_url }}">{{ data.author }}</a></p>
-<p>发布于 {{ data.created }} 最近更新于 {{ data.updated }}</p>
-<p>收藏：{{ data.collected_count }} 转发：{{ data.share_count }} 评论：{{ data.comments_count }} 点赞：{{ data.like_count }}
-{% if data.ip_location %}
-来自{{ data.ip_location }}
-{% endif %}
-</p>
-<p><a href="{{ data.author_url }}">@{{ data.author }}</a>：</p>
-{{ data.raw_content }}
\ No newline at end of file
diff --git a/app/templates/xiaohongshu_short_text.jinja2 b/app/templates/xiaohongshu_short_text.jinja2
deleted file mode 100644
index 0f0e88a..0000000
--- a/app/templates/xiaohongshu_short_text.jinja2
+++ /dev/null
@@ -1,2 +0,0 @@
-<b><a href="{{ data.url }}">{{ data.title }}</a></b> - <a href="{{ data.author_url }}">{{ data.author }}</a>
-{{ data.raw_content }}
\ No newline at end of file
diff --git a/app/templates/zhihu_content.jinja2 b/app/templates/zhihu_content.jinja2
deleted file mode 100644
index 2ad8501..0000000
--- a/app/templates/zhihu_content.jinja2
+++ /dev/null
@@ -1,47 +0,0 @@
-{# templates/zhihu_short_text.html #}
-
-{% if data.zhihu_type == "answer" %}
-<h2><a href="https://www.zhihu.com/question/{{ data.question_id }}" target="_blank">{{ data.title }}</a></h2>
-{% if data.question is not none %}
-<p>{{ data.question }}</p>
-<p>发表于：{{ data.question_date }} 更新于：{{ data.question_updated }}<br>回答数：{{ data.question_answer_count }} 关注数：{{ data.question_follower_count }}</p>
-<hr>
-{% endif %}
-<p>回答作者：<a href="{{ data.author_url }}">{{ data.author }}</a></p>
-<p>发表于：{{ data.date }} 更新于：{{ data.updated }}
-<br>
-点赞数：{{ self.upvote }}
-{% if data.comment_count %}
-<br>
-评论数：{{ self.comment_count }}
-{% endif %}
-</p>
-{{ data.raw_content }}
-{% elif data.zhihu_type == "article" %}
-{% if data.column %}
-<p>所属专栏：<a href="{{ data.column_url }}">{{ data.column }}</a></p>
-<p>专栏简介：{{ data.column_intro }}</p>
-{% endif %}
-<p>作者：<a href="{{ data.author_url }}">{{ data.author }}</a></p>
-<p>发表于：{{ data.date }}
-{% if data.updated != data.date %}
-更新于：{{ data.updated }}
-{% endif %}</p>
-更新于：{{ data.updated }}
-<br>
-<p>{% if data.upvote %}点赞数：{{ data.upvote }}{% endif %}{% if data.comment_count %}评论数：{{ data.comment_count }}{% endif %}</p>
-<br>
-{{ data.raw_content }}
-{% elif data.zhihu_type == "status" %}
-<p>发表于{{ data.date }} 点赞数：{{ data.upvote }} 评论数：{{ data.comment_count }}</p>
-<p><a href="{{ data.author_url }}">@{{ data.author }}</a>：{{ data.raw_content }}</p>
-{{ data.pic_content }}
-{% if data.origin_pin_author %}
-<hr>
-<p>发表于{{ data.origin_pin_date }} 点赞数：{{ data.origin_pin_upvote }} 评论数：{{ data.origin_pin_comment_count }}</p>
-<p><a href="{{ data.origin_pin_author_url }}">@{{ data.origin_pin_author }}</a>：{{ data.origin_pin_content }}</p>
-{{ data.origin_pin_pic_content }}
-{% endif %}
-{% endif %}
-{#<hr>#}
-{#<a href="{{ data.url }}">阅读原文</a>#}
\ No newline at end of file
diff --git a/app/templates/zhihu_short_text.jinja2 b/app/templates/zhihu_short_text.jinja2
deleted file mode 100644
index eb247cb..0000000
--- a/app/templates/zhihu_short_text.jinja2
+++ /dev/null
@@ -1,11 +0,0 @@
-{# templates/zhihu_short_text.html #}
-
-{% if data.zhihu_type == "status" %}
-<a href="{{ data.url }}"><b>{{ data.title }}</b></a>：{{ data.content }}
-{% if data.origin_pin_url %}
-<a href="{{ data.origin_pin_url }}"><b>{{ data.origin_pin_author }}的想法</b></a>：{{ data.origin_pin_content }}
-{% endif %}
-{% else %}
-<a href="{{ data.url }}"><b>{{ data.title }}</b> - {{ data.author }}的{{ data.translated_zhihu_type }}</a>
-{{ data.content }}
-{% endif %}
\ No newline at end of file
diff --git a/app/utils/config.py b/app/utils/config.py
deleted file mode 100644
index ad3d691..0000000
--- a/app/utils/config.py
+++ /dev/null
@@ -1,7 +0,0 @@
-# Re-export from shared package
-from fastfetchbot_shared.utils.config import *  # noqa: F401,F403
-from fastfetchbot_shared.utils.config import (  # noqa: F401
-    SOCIAL_MEDIA_WEBSITE_PATTERNS,
-    VIDEO_WEBSITE_PATTERNS,
-    BANNED_PATTERNS,
-)
diff --git a/app/utils/image.py b/app/utils/image.py
deleted file mode 100644
index 500afcd..0000000
--- a/app/utils/image.py
+++ /dev/null
@@ -1,9 +0,0 @@
-# Re-export from shared package
-from fastfetchbot_shared.utils.image import *  # noqa: F401,F403
-from fastfetchbot_shared.utils.image import (  # noqa: F401
-    Image,
-    get_image_dimension,
-    image_compressing,
-    check_image_type,
-    DEFAULT_IMAGE_LIMITATION,
-)
diff --git a/app/utils/logger.py b/app/utils/logger.py
deleted file mode 100644
index 1d4ac5f..0000000
--- a/app/utils/logger.py
+++ /dev/null
@@ -1,2 +0,0 @@
-# Re-export from shared package
-from fastfetchbot_shared.utils.logger import logger  # noqa: F401
diff --git a/app/utils/network.py b/app/utils/network.py
deleted file mode 100644
index bb422db..0000000
--- a/app/utils/network.py
+++ /dev/null
@@ -1,13 +0,0 @@
-# Re-export from shared package
-from fastfetchbot_shared.utils.network import *  # noqa: F401,F403
-from fastfetchbot_shared.utils.network import (  # noqa: F401
-    get_response,
-    get_response_json,
-    get_selector,
-    get_redirect_url,
-    get_content_async,
-    download_file_by_metadata_item,
-    download_file_to_local,
-    get_random_user_agent,
-    HEADERS,
-)
diff --git a/app/utils/parse.py b/app/utils/parse.py
deleted file mode 100644
index 8843e7e..0000000
--- a/app/utils/parse.py
+++ /dev/null
@@ -1,16 +0,0 @@
-# Re-export from shared package
-from fastfetchbot_shared.utils.parse import *  # noqa: F401,F403
-from fastfetchbot_shared.utils.parse import (  # noqa: F401
-    get_html_text_length,
-    format_telegram_short_text,
-    unix_timestamp_to_utc,
-    second_to_time,
-    string_to_list,
-    get_url_metadata,
-    get_ext_from_url,
-    wrap_text_into_html,
-    telegram_message_html_trim,
-    get_bool,
-    get_env_bool,
-    TELEGRAM_TEXT_LIMIT,
-)
diff --git a/app/utils/stealth.min.js b/app/utils/stealth.min.js
deleted file mode 100644
index b4ca68f..0000000
--- a/app/utils/stealth.min.js
+++ /dev/null
@@ -1,7 +0,0 @@
-/*!
- * Note: Auto-generated, do not update manually.
- * Generated by: https://github.com/berstend/puppeteer-extra/tree/master/packages/extract-stealth-evasions
- * Generated on: Mon, 05 Jun 2023 06:17:57 GMT
- * License: MIT
- */
-(({_utilsFns:_utilsFns,_mainFunction:_mainFunction,_args:_args})=>{const utils=Object.fromEntries(Object.entries(_utilsFns).map((([key,value])=>[key,eval(value)])));utils.init(),eval(_mainFunction)(utils,..._args)})({_utilsFns:{init:"() => {\n  utils.preloadCache()\n}",stripProxyFromErrors:"(handler = {}) => {\n  const newHandler = {\n    setPrototypeOf: function (target, proto) {\n      if (proto === null)\n        throw new TypeError('Cannot convert object to primitive value')\n      if (Object.getPrototypeOf(target) === Object.getPrototypeOf(proto)) {\n        throw new TypeError('Cyclic __proto__ value')\n      }\n      return Reflect.setPrototypeOf(target, proto)\n    }\n  }\n  // We wrap each trap in the handler in a try/catch and modify the error stack if they throw\n  const traps = Object.getOwnPropertyNames(handler)\n  traps.forEach(trap => {\n    newHandler[trap] = function () {\n      try {\n        // Forward the call to the defined proxy handler\n        return handler[trap].apply(this, arguments || [])\n      } catch (err) {\n        // Stack traces differ per browser, we only support chromium based ones currently\n        if (!err || !err.stack || !err.stack.includes(`at `)) {\n          throw err\n        }\n\n        // When something throws within one of our traps the Proxy will show up in error stacks\n        // An earlier implementation of this code would simply strip lines with a blacklist,\n        // but it makes sense to be more surgical here and only remove lines related to our Proxy.\n        // We try to use a known \"anchor\" line for that and strip it with everything above it.\n        // If the anchor line cannot be found for some reason we fall back to our blacklist approach.\n\n        const stripWithBlacklist = (stack, stripFirstLine = true) => {\n          const blacklist = [\n            `at Reflect.${trap} `, // e.g. Reflect.get or Reflect.apply\n            `at Object.${trap} `, // e.g. 
Object.get or Object.apply\n            `at Object.newHandler.<computed> [as ${trap}] ` // caused by this very wrapper :-)\n          ]\n          return (\n            err.stack\n              .split('\\n')\n              // Always remove the first (file) line in the stack (guaranteed to be our proxy)\n              .filter((line, index) => !(index === 1 && stripFirstLine))\n              // Check if the line starts with one of our blacklisted strings\n              .filter(line => !blacklist.some(bl => line.trim().startsWith(bl)))\n              .join('\\n')\n          )\n        }\n\n        const stripWithAnchor = (stack, anchor) => {\n          const stackArr = stack.split('\\n')\n          anchor = anchor || `at Object.newHandler.<computed> [as ${trap}] ` // Known first Proxy line in chromium\n          const anchorIndex = stackArr.findIndex(line =>\n            line.trim().startsWith(anchor)\n          )\n          if (anchorIndex === -1) {\n            return false // 404, anchor not found\n          }\n          // Strip everything from the top until we reach the anchor line\n          // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. 
`TypeError`)\n          stackArr.splice(1, anchorIndex)\n          return stackArr.join('\\n')\n        }\n\n        // Special cases due to our nested toString proxies\n        err.stack = err.stack.replace(\n          'at Object.toString (',\n          'at Function.toString ('\n        )\n        if ((err.stack || '').includes('at Function.toString (')) {\n          err.stack = stripWithBlacklist(err.stack, false)\n          throw err\n        }\n\n        // Try using the anchor method, fallback to blacklist if necessary\n        err.stack = stripWithAnchor(err.stack) || stripWithBlacklist(err.stack)\n\n        throw err // Re-throw our now sanitized error\n      }\n    }\n  })\n  return newHandler\n}",stripErrorWithAnchor:"(err, anchor) => {\n  const stackArr = err.stack.split('\\n')\n  const anchorIndex = stackArr.findIndex(line => line.trim().startsWith(anchor))\n  if (anchorIndex === -1) {\n    return err // 404, anchor not found\n  }\n  // Strip everything from the top until we reach the anchor line (remove anchor line as well)\n  // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. `TypeError`)\n  stackArr.splice(1, anchorIndex)\n  err.stack = stackArr.join('\\n')\n  return err\n}",replaceProperty:"(obj, propName, descriptorOverrides = {}) => {\n  return Object.defineProperty(obj, propName, {\n    // Copy over the existing descriptors (writable, enumerable, configurable, etc)\n    ...(Object.getOwnPropertyDescriptor(obj, propName) || {}),\n    // Add our overrides (e.g. 
value, get())\n    ...descriptorOverrides\n  })\n}",preloadCache:"() => {\n  if (utils.cache) {\n    return\n  }\n  utils.cache = {\n    // Used in our proxies\n    Reflect: {\n      get: Reflect.get.bind(Reflect),\n      apply: Reflect.apply.bind(Reflect)\n    },\n    // Used in `makeNativeString`\n    nativeToStringStr: Function.toString + '' // => `function toString() { [native code] }`\n  }\n}",makeNativeString:"(name = '') => {\n  return utils.cache.nativeToStringStr.replace('toString', name || '')\n}",patchToString:"(obj, str = '') => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n      // `toString` targeted at our proxied Object detected\n      if (ctx === obj) {\n        // We either return the optional string verbatim or derive the most desired result automatically\n        return str || utils.makeNativeString(obj.name)\n      }\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",patchToStringNested:"(obj = {}) => {\n  return utils.execRecursively(obj, ['function'], utils.patchToString)\n}",redirectToString:"(proxyObj, originalObj) => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n\n      // `toString` targeted at our proxied Object detected\n      if (ctx === proxyObj) {\n        const fallback = () =>\n          originalObj && originalObj.name\n            ? utils.makeNativeString(originalObj.name)\n            : utils.makeNativeString(proxyObj.name)\n\n        // Return the toString representation of our original object if possible\n        return originalObj + '' || fallback()\n      }\n\n      if (typeof ctx === 'undefined' || ctx === null) {\n        return target.call(ctx)\n      }\n\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",replaceWithProxy:"(obj, propName, handler) => {\n  const originalObj = obj[propName]\n  const proxyObj = new Proxy(obj[propName], utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.redirectToString(proxyObj, originalObj)\n\n  return true\n}",replaceGetterWithProxy:"(obj, propName, handler) => {\n  const fn = Object.getOwnPropertyDescriptor(obj, propName).get\n  const fnStr = fn.toString() // special getter function string\n  const proxyObj = new Proxy(fn, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { get: proxyObj })\n  utils.patchToString(proxyObj, fnStr)\n\n  return true\n}",replaceGetterSetter:"(obj, propName, handlerGetterSetter) => {\n  const ownPropertyDescriptor = Object.getOwnPropertyDescriptor(obj, propName)\n  const handler = { ...ownPropertyDescriptor }\n\n  if (handlerGetterSetter.get !== undefined) {\n    const nativeFn = ownPropertyDescriptor.get\n    handler.get = function() {\n      return handlerGetterSetter.get.call(this, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.get, nativeFn)\n  }\n\n  if (handlerGetterSetter.set !== undefined) {\n    const nativeFn = ownPropertyDescriptor.set\n    handler.set = function(newValue) {\n      handlerGetterSetter.set.call(this, newValue, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.set, 
nativeFn)\n  }\n\n  Object.defineProperty(obj, propName, handler)\n}",mockWithProxy:"(obj, propName, pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.patchToString(proxyObj)\n\n  return true\n}",createProxy:"(pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n  utils.patchToString(proxyObj)\n\n  return proxyObj\n}",splitObjPath:"objPath => ({\n  // Remove last dot entry (property) ==> `HTMLMediaElement.prototype`\n  objName: objPath.split('.').slice(0, -1).join('.'),\n  // Extract last dot entry ==> `canPlayType`\n  propName: objPath.split('.').slice(-1)[0]\n})",replaceObjPathWithProxy:"(objPath, handler) => {\n  const { objName, propName } = utils.splitObjPath(objPath)\n  const obj = eval(objName) // eslint-disable-line no-eval\n  return utils.replaceWithProxy(obj, propName, handler)\n}",execRecursively:"(obj = {}, typeFilter = [], fn) => {\n  function recurse(obj) {\n    for (const key in obj) {\n      if (obj[key] === undefined) {\n        continue\n      }\n      if (obj[key] && typeof obj[key] === 'object') {\n        recurse(obj[key])\n      } else {\n        if (obj[key] && typeFilter.includes(typeof obj[key])) {\n          fn.call(this, obj[key])\n        }\n      }\n    }\n  }\n  recurse(obj)\n  return obj\n}",stringifyFns:"(fnObj = { hello: () => 'world' }) => {\n  // Object.fromEntries() ponyfill (in 6 lines) - supported only in Node v12+, modern browsers are fine\n  // https://github.com/feross/fromentries\n  function fromEntries(iterable) {\n    return [...iterable].reduce((obj, [key, val]) => {\n      obj[key] = val\n      return obj\n    }, {})\n  }\n  return (Object.fromEntries || fromEntries)(\n    Object.entries(fnObj)\n      .filter(([key, value]) => typeof value === 'function')\n      .map(([key, value]) => [key, value.toString()]) // eslint-disable-line 
no-eval\n  )\n}",materializeFns:"(fnStrObj = { hello: \"() => 'world'\" }) => {\n  return Object.fromEntries(\n    Object.entries(fnStrObj).map(([key, value]) => {\n      if (value.startsWith('function')) {\n        // some trickery is needed to make oldschool functions work :-)\n        return [key, eval(`() => ${value}`)()] // eslint-disable-line no-eval\n      } else {\n        // arrow functions just work\n        return [key, eval(value)] // eslint-disable-line no-eval\n      }\n    })\n  )\n}",makeHandler:"() => ({\n  // Used by simple `navigator` getter evasions\n  getterValue: value => ({\n    apply(target, ctx, args) {\n      // Let's fetch the value first, to trigger and escalate potential errors\n      // Illegal invocations like `navigator.__proto__.vendor` will throw here\n      utils.cache.Reflect.apply(...arguments)\n      return value\n    }\n  })\n})",arrayEquals:"(array1, array2) => {\n  if (array1.length !== array2.length) {\n    return false\n  }\n  for (let i = 0; i < array1.length; ++i) {\n    if (array1[i] !== array2[i]) {\n      return false\n    }\n  }\n  return true\n}",memoize:"fn => {\n  const cache = []\n  return function(...args) {\n    if (!cache.some(c => utils.arrayEquals(c.key, args))) {\n      cache.push({ key: args, value: fn.apply(this, args) })\n    }\n    return cache.find(c => utils.arrayEquals(c.key, args)).value\n  }\n}"},_mainFunction:'utils => {\n      if (!window.chrome) {\n        // Use the exact property descriptor found in headful Chrome\n        // fetch it via `Object.getOwnPropertyDescriptor(window, \'chrome\')`\n        Object.defineProperty(window, \'chrome\', {\n          writable: true,\n          enumerable: true,\n          configurable: false, // note!\n          value: {} // We\'ll extend that later\n        })\n      }\n\n      // That means we\'re running headful and don\'t need to mock anything\n      if (\'app\' in window.chrome) {\n        return // Nothing to do here\n      }\n\n      const makeError 
= {\n        ErrorInInvocation: fn => {\n          const err = new TypeError(`Error in invocation of app.${fn}()`)\n          return utils.stripErrorWithAnchor(\n            err,\n            `at ${fn} (eval at <anonymous>`\n          )\n        }\n      }\n\n      // There\'s a some static data in that property which doesn\'t seem to change,\n      // we should periodically check for updates: `JSON.stringify(window.app, null, 2)`\n      const STATIC_DATA = JSON.parse(\n        `\n{\n  "isInstalled": false,\n  "InstallState": {\n    "DISABLED": "disabled",\n    "INSTALLED": "installed",\n    "NOT_INSTALLED": "not_installed"\n  },\n  "RunningState": {\n    "CANNOT_RUN": "cannot_run",\n    "READY_TO_RUN": "ready_to_run",\n    "RUNNING": "running"\n  }\n}\n        `.trim()\n      )\n\n      window.chrome.app = {\n        ...STATIC_DATA,\n\n        get isInstalled() {\n          return false\n        },\n\n        getDetails: function getDetails() {\n          if (arguments.length) {\n            throw makeError.ErrorInInvocation(`getDetails`)\n          }\n          return null\n        },\n        getIsInstalled: function getDetails() {\n          if (arguments.length) {\n            throw makeError.ErrorInInvocation(`getIsInstalled`)\n          }\n          return false\n        },\n        runningState: function getDetails() {\n          if (arguments.length) {\n            throw makeError.ErrorInInvocation(`runningState`)\n          }\n          return \'cannot_run\'\n        }\n      }\n      utils.patchToStringNested(window.chrome.app)\n    }',_args:[]}),(({_utilsFns:_utilsFns,_mainFunction:_mainFunction,_args:_args})=>{const utils=Object.fromEntries(Object.entries(_utilsFns).map((([key,value])=>[key,eval(value)])));utils.init(),eval(_mainFunction)(utils,..._args)})({_utilsFns:{init:"() => {\n  utils.preloadCache()\n}",stripProxyFromErrors:"(handler = {}) => {\n  const newHandler = {\n    setPrototypeOf: function (target, proto) {\n      if (proto === null)\n    
    throw new TypeError('Cannot convert object to primitive value')\n      if (Object.getPrototypeOf(target) === Object.getPrototypeOf(proto)) {\n        throw new TypeError('Cyclic __proto__ value')\n      }\n      return Reflect.setPrototypeOf(target, proto)\n    }\n  }\n  // We wrap each trap in the handler in a try/catch and modify the error stack if they throw\n  const traps = Object.getOwnPropertyNames(handler)\n  traps.forEach(trap => {\n    newHandler[trap] = function () {\n      try {\n        // Forward the call to the defined proxy handler\n        return handler[trap].apply(this, arguments || [])\n      } catch (err) {\n        // Stack traces differ per browser, we only support chromium based ones currently\n        if (!err || !err.stack || !err.stack.includes(`at `)) {\n          throw err\n        }\n\n        // When something throws within one of our traps the Proxy will show up in error stacks\n        // An earlier implementation of this code would simply strip lines with a blacklist,\n        // but it makes sense to be more surgical here and only remove lines related to our Proxy.\n        // We try to use a known \"anchor\" line for that and strip it with everything above it.\n        // If the anchor line cannot be found for some reason we fall back to our blacklist approach.\n\n        const stripWithBlacklist = (stack, stripFirstLine = true) => {\n          const blacklist = [\n            `at Reflect.${trap} `, // e.g. Reflect.get or Reflect.apply\n            `at Object.${trap} `, // e.g. 
Object.get or Object.apply\n            `at Object.newHandler.<computed> [as ${trap}] ` // caused by this very wrapper :-)\n          ]\n          return (\n            err.stack\n              .split('\\n')\n              // Always remove the first (file) line in the stack (guaranteed to be our proxy)\n              .filter((line, index) => !(index === 1 && stripFirstLine))\n              // Check if the line starts with one of our blacklisted strings\n              .filter(line => !blacklist.some(bl => line.trim().startsWith(bl)))\n              .join('\\n')\n          )\n        }\n\n        const stripWithAnchor = (stack, anchor) => {\n          const stackArr = stack.split('\\n')\n          anchor = anchor || `at Object.newHandler.<computed> [as ${trap}] ` // Known first Proxy line in chromium\n          const anchorIndex = stackArr.findIndex(line =>\n            line.trim().startsWith(anchor)\n          )\n          if (anchorIndex === -1) {\n            return false // 404, anchor not found\n          }\n          // Strip everything from the top until we reach the anchor line\n          // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. 
`TypeError`)\n          stackArr.splice(1, anchorIndex)\n          return stackArr.join('\\n')\n        }\n\n        // Special cases due to our nested toString proxies\n        err.stack = err.stack.replace(\n          'at Object.toString (',\n          'at Function.toString ('\n        )\n        if ((err.stack || '').includes('at Function.toString (')) {\n          err.stack = stripWithBlacklist(err.stack, false)\n          throw err\n        }\n\n        // Try using the anchor method, fallback to blacklist if necessary\n        err.stack = stripWithAnchor(err.stack) || stripWithBlacklist(err.stack)\n\n        throw err // Re-throw our now sanitized error\n      }\n    }\n  })\n  return newHandler\n}",stripErrorWithAnchor:"(err, anchor) => {\n  const stackArr = err.stack.split('\\n')\n  const anchorIndex = stackArr.findIndex(line => line.trim().startsWith(anchor))\n  if (anchorIndex === -1) {\n    return err // 404, anchor not found\n  }\n  // Strip everything from the top until we reach the anchor line (remove anchor line as well)\n  // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. `TypeError`)\n  stackArr.splice(1, anchorIndex)\n  err.stack = stackArr.join('\\n')\n  return err\n}",replaceProperty:"(obj, propName, descriptorOverrides = {}) => {\n  return Object.defineProperty(obj, propName, {\n    // Copy over the existing descriptors (writable, enumerable, configurable, etc)\n    ...(Object.getOwnPropertyDescriptor(obj, propName) || {}),\n    // Add our overrides (e.g. 
value, get())\n    ...descriptorOverrides\n  })\n}",preloadCache:"() => {\n  if (utils.cache) {\n    return\n  }\n  utils.cache = {\n    // Used in our proxies\n    Reflect: {\n      get: Reflect.get.bind(Reflect),\n      apply: Reflect.apply.bind(Reflect)\n    },\n    // Used in `makeNativeString`\n    nativeToStringStr: Function.toString + '' // => `function toString() { [native code] }`\n  }\n}",makeNativeString:"(name = '') => {\n  return utils.cache.nativeToStringStr.replace('toString', name || '')\n}",patchToString:"(obj, str = '') => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n      // `toString` targeted at our proxied Object detected\n      if (ctx === obj) {\n        // We either return the optional string verbatim or derive the most desired result automatically\n        return str || utils.makeNativeString(obj.name)\n      }\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",patchToStringNested:"(obj = {}) => {\n  return utils.execRecursively(obj, ['function'], utils.patchToString)\n}",redirectToString:"(proxyObj, originalObj) => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n\n      // `toString` targeted at our proxied Object detected\n      if (ctx === proxyObj) {\n        const fallback = () =>\n          originalObj && originalObj.name\n            ? utils.makeNativeString(originalObj.name)\n            : utils.makeNativeString(proxyObj.name)\n\n        // Return the toString representation of our original object if possible\n        return originalObj + '' || fallback()\n      }\n\n      if (typeof ctx === 'undefined' || ctx === null) {\n        return target.call(ctx)\n      }\n\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",replaceWithProxy:"(obj, propName, handler) => {\n  const originalObj = obj[propName]\n  const proxyObj = new Proxy(obj[propName], utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.redirectToString(proxyObj, originalObj)\n\n  return true\n}",replaceGetterWithProxy:"(obj, propName, handler) => {\n  const fn = Object.getOwnPropertyDescriptor(obj, propName).get\n  const fnStr = fn.toString() // special getter function string\n  const proxyObj = new Proxy(fn, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { get: proxyObj })\n  utils.patchToString(proxyObj, fnStr)\n\n  return true\n}",replaceGetterSetter:"(obj, propName, handlerGetterSetter) => {\n  const ownPropertyDescriptor = Object.getOwnPropertyDescriptor(obj, propName)\n  const handler = { ...ownPropertyDescriptor }\n\n  if (handlerGetterSetter.get !== undefined) {\n    const nativeFn = ownPropertyDescriptor.get\n    handler.get = function() {\n      return handlerGetterSetter.get.call(this, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.get, nativeFn)\n  }\n\n  if (handlerGetterSetter.set !== undefined) {\n    const nativeFn = ownPropertyDescriptor.set\n    handler.set = function(newValue) {\n      handlerGetterSetter.set.call(this, newValue, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.set, 
nativeFn)\n  }\n\n  Object.defineProperty(obj, propName, handler)\n}",mockWithProxy:"(obj, propName, pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.patchToString(proxyObj)\n\n  return true\n}",createProxy:"(pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n  utils.patchToString(proxyObj)\n\n  return proxyObj\n}",splitObjPath:"objPath => ({\n  // Remove last dot entry (property) ==> `HTMLMediaElement.prototype`\n  objName: objPath.split('.').slice(0, -1).join('.'),\n  // Extract last dot entry ==> `canPlayType`\n  propName: objPath.split('.').slice(-1)[0]\n})",replaceObjPathWithProxy:"(objPath, handler) => {\n  const { objName, propName } = utils.splitObjPath(objPath)\n  const obj = eval(objName) // eslint-disable-line no-eval\n  return utils.replaceWithProxy(obj, propName, handler)\n}",execRecursively:"(obj = {}, typeFilter = [], fn) => {\n  function recurse(obj) {\n    for (const key in obj) {\n      if (obj[key] === undefined) {\n        continue\n      }\n      if (obj[key] && typeof obj[key] === 'object') {\n        recurse(obj[key])\n      } else {\n        if (obj[key] && typeFilter.includes(typeof obj[key])) {\n          fn.call(this, obj[key])\n        }\n      }\n    }\n  }\n  recurse(obj)\n  return obj\n}",stringifyFns:"(fnObj = { hello: () => 'world' }) => {\n  // Object.fromEntries() ponyfill (in 6 lines) - supported only in Node v12+, modern browsers are fine\n  // https://github.com/feross/fromentries\n  function fromEntries(iterable) {\n    return [...iterable].reduce((obj, [key, val]) => {\n      obj[key] = val\n      return obj\n    }, {})\n  }\n  return (Object.fromEntries || fromEntries)(\n    Object.entries(fnObj)\n      .filter(([key, value]) => typeof value === 'function')\n      .map(([key, value]) => [key, value.toString()]) // eslint-disable-line 
no-eval\n  )\n}",materializeFns:"(fnStrObj = { hello: \"() => 'world'\" }) => {\n  return Object.fromEntries(\n    Object.entries(fnStrObj).map(([key, value]) => {\n      if (value.startsWith('function')) {\n        // some trickery is needed to make oldschool functions work :-)\n        return [key, eval(`() => ${value}`)()] // eslint-disable-line no-eval\n      } else {\n        // arrow functions just work\n        return [key, eval(value)] // eslint-disable-line no-eval\n      }\n    })\n  )\n}",makeHandler:"() => ({\n  // Used by simple `navigator` getter evasions\n  getterValue: value => ({\n    apply(target, ctx, args) {\n      // Let's fetch the value first, to trigger and escalate potential errors\n      // Illegal invocations like `navigator.__proto__.vendor` will throw here\n      utils.cache.Reflect.apply(...arguments)\n      return value\n    }\n  })\n})",arrayEquals:"(array1, array2) => {\n  if (array1.length !== array2.length) {\n    return false\n  }\n  for (let i = 0; i < array1.length; ++i) {\n    if (array1[i] !== array2[i]) {\n      return false\n    }\n  }\n  return true\n}",memoize:"fn => {\n  const cache = []\n  return function(...args) {\n    if (!cache.some(c => utils.arrayEquals(c.key, args))) {\n      cache.push({ key: args, value: fn.apply(this, args) })\n    }\n    return cache.find(c => utils.arrayEquals(c.key, args)).value\n  }\n}"},_mainFunction:"utils => {\n      if (!window.chrome) {\n        // Use the exact property descriptor found in headful Chrome\n        // fetch it via `Object.getOwnPropertyDescriptor(window, 'chrome')`\n        Object.defineProperty(window, 'chrome', {\n          writable: true,\n          enumerable: true,\n          configurable: false, // note!\n          value: {} // We'll extend that later\n        })\n      }\n\n      // That means we're running headful and don't need to mock anything\n      if ('csi' in window.chrome) {\n        return // Nothing to do here\n      }\n\n      // Check that the 
Navigation Timing API v1 is available, we need that\n      if (!window.performance || !window.performance.timing) {\n        return\n      }\n\n      const { timing } = window.performance\n\n      window.chrome.csi = function() {\n        return {\n          onloadT: timing.domContentLoadedEventEnd,\n          startE: timing.navigationStart,\n          pageT: Date.now() - timing.navigationStart,\n          tran: 15 // Transition type or something\n        }\n      }\n      utils.patchToString(window.chrome.csi)\n    }",_args:[]}),(({_utilsFns:_utilsFns,_mainFunction:_mainFunction,_args:_args})=>{const utils=Object.fromEntries(Object.entries(_utilsFns).map((([key,value])=>[key,eval(value)])));utils.init(),eval(_mainFunction)(utils,..._args)})({_utilsFns:{init:"() => {\n  utils.preloadCache()\n}",stripProxyFromErrors:"(handler = {}) => {\n  const newHandler = {\n    setPrototypeOf: function (target, proto) {\n      if (proto === null)\n        throw new TypeError('Cannot convert object to primitive value')\n      if (Object.getPrototypeOf(target) === Object.getPrototypeOf(proto)) {\n        throw new TypeError('Cyclic __proto__ value')\n      }\n      return Reflect.setPrototypeOf(target, proto)\n    }\n  }\n  // We wrap each trap in the handler in a try/catch and modify the error stack if they throw\n  const traps = Object.getOwnPropertyNames(handler)\n  traps.forEach(trap => {\n    newHandler[trap] = function () {\n      try {\n        // Forward the call to the defined proxy handler\n        return handler[trap].apply(this, arguments || [])\n      } catch (err) {\n        // Stack traces differ per browser, we only support chromium based ones currently\n        if (!err || !err.stack || !err.stack.includes(`at `)) {\n          throw err\n        }\n\n        // When something throws within one of our traps the Proxy will show up in error stacks\n        // An earlier implementation of this code would simply strip lines with a blacklist,\n        // but it makes 
sense to be more surgical here and only remove lines related to our Proxy.\n        // We try to use a known \"anchor\" line for that and strip it with everything above it.\n        // If the anchor line cannot be found for some reason we fall back to our blacklist approach.\n\n        const stripWithBlacklist = (stack, stripFirstLine = true) => {\n          const blacklist = [\n            `at Reflect.${trap} `, // e.g. Reflect.get or Reflect.apply\n            `at Object.${trap} `, // e.g. Object.get or Object.apply\n            `at Object.newHandler.<computed> [as ${trap}] ` // caused by this very wrapper :-)\n          ]\n          return (\n            err.stack\n              .split('\\n')\n              // Always remove the first (file) line in the stack (guaranteed to be our proxy)\n              .filter((line, index) => !(index === 1 && stripFirstLine))\n              // Check if the line starts with one of our blacklisted strings\n              .filter(line => !blacklist.some(bl => line.trim().startsWith(bl)))\n              .join('\\n')\n          )\n        }\n\n        const stripWithAnchor = (stack, anchor) => {\n          const stackArr = stack.split('\\n')\n          anchor = anchor || `at Object.newHandler.<computed> [as ${trap}] ` // Known first Proxy line in chromium\n          const anchorIndex = stackArr.findIndex(line =>\n            line.trim().startsWith(anchor)\n          )\n          if (anchorIndex === -1) {\n            return false // 404, anchor not found\n          }\n          // Strip everything from the top until we reach the anchor line\n          // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. 
`TypeError`)\n          stackArr.splice(1, anchorIndex)\n          return stackArr.join('\\n')\n        }\n\n        // Special cases due to our nested toString proxies\n        err.stack = err.stack.replace(\n          'at Object.toString (',\n          'at Function.toString ('\n        )\n        if ((err.stack || '').includes('at Function.toString (')) {\n          err.stack = stripWithBlacklist(err.stack, false)\n          throw err\n        }\n\n        // Try using the anchor method, fallback to blacklist if necessary\n        err.stack = stripWithAnchor(err.stack) || stripWithBlacklist(err.stack)\n\n        throw err // Re-throw our now sanitized error\n      }\n    }\n  })\n  return newHandler\n}",stripErrorWithAnchor:"(err, anchor) => {\n  const stackArr = err.stack.split('\\n')\n  const anchorIndex = stackArr.findIndex(line => line.trim().startsWith(anchor))\n  if (anchorIndex === -1) {\n    return err // 404, anchor not found\n  }\n  // Strip everything from the top until we reach the anchor line (remove anchor line as well)\n  // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. `TypeError`)\n  stackArr.splice(1, anchorIndex)\n  err.stack = stackArr.join('\\n')\n  return err\n}",replaceProperty:"(obj, propName, descriptorOverrides = {}) => {\n  return Object.defineProperty(obj, propName, {\n    // Copy over the existing descriptors (writable, enumerable, configurable, etc)\n    ...(Object.getOwnPropertyDescriptor(obj, propName) || {}),\n    // Add our overrides (e.g. 
value, get())\n    ...descriptorOverrides\n  })\n}",preloadCache:"() => {\n  if (utils.cache) {\n    return\n  }\n  utils.cache = {\n    // Used in our proxies\n    Reflect: {\n      get: Reflect.get.bind(Reflect),\n      apply: Reflect.apply.bind(Reflect)\n    },\n    // Used in `makeNativeString`\n    nativeToStringStr: Function.toString + '' // => `function toString() { [native code] }`\n  }\n}",makeNativeString:"(name = '') => {\n  return utils.cache.nativeToStringStr.replace('toString', name || '')\n}",patchToString:"(obj, str = '') => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n      // `toString` targeted at our proxied Object detected\n      if (ctx === obj) {\n        // We either return the optional string verbatim or derive the most desired result automatically\n        return str || utils.makeNativeString(obj.name)\n      }\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",patchToStringNested:"(obj = {}) => {\n  return utils.execRecursively(obj, ['function'], utils.patchToString)\n}",redirectToString:"(proxyObj, originalObj) => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n\n      // `toString` targeted at our proxied Object detected\n      if (ctx === proxyObj) {\n        const fallback = () =>\n          originalObj && originalObj.name\n            ? utils.makeNativeString(originalObj.name)\n            : utils.makeNativeString(proxyObj.name)\n\n        // Return the toString representation of our original object if possible\n        return originalObj + '' || fallback()\n      }\n\n      if (typeof ctx === 'undefined' || ctx === null) {\n        return target.call(ctx)\n      }\n\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",replaceWithProxy:"(obj, propName, handler) => {\n  const originalObj = obj[propName]\n  const proxyObj = new Proxy(obj[propName], utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.redirectToString(proxyObj, originalObj)\n\n  return true\n}",replaceGetterWithProxy:"(obj, propName, handler) => {\n  const fn = Object.getOwnPropertyDescriptor(obj, propName).get\n  const fnStr = fn.toString() // special getter function string\n  const proxyObj = new Proxy(fn, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { get: proxyObj })\n  utils.patchToString(proxyObj, fnStr)\n\n  return true\n}",replaceGetterSetter:"(obj, propName, handlerGetterSetter) => {\n  const ownPropertyDescriptor = Object.getOwnPropertyDescriptor(obj, propName)\n  const handler = { ...ownPropertyDescriptor }\n\n  if (handlerGetterSetter.get !== undefined) {\n    const nativeFn = ownPropertyDescriptor.get\n    handler.get = function() {\n      return handlerGetterSetter.get.call(this, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.get, nativeFn)\n  }\n\n  if (handlerGetterSetter.set !== undefined) {\n    const nativeFn = ownPropertyDescriptor.set\n    handler.set = function(newValue) {\n      handlerGetterSetter.set.call(this, newValue, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.set, 
nativeFn)\n  }\n\n  Object.defineProperty(obj, propName, handler)\n}",mockWithProxy:"(obj, propName, pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.patchToString(proxyObj)\n\n  return true\n}",createProxy:"(pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n  utils.patchToString(proxyObj)\n\n  return proxyObj\n}",splitObjPath:"objPath => ({\n  // Remove last dot entry (property) ==> `HTMLMediaElement.prototype`\n  objName: objPath.split('.').slice(0, -1).join('.'),\n  // Extract last dot entry ==> `canPlayType`\n  propName: objPath.split('.').slice(-1)[0]\n})",replaceObjPathWithProxy:"(objPath, handler) => {\n  const { objName, propName } = utils.splitObjPath(objPath)\n  const obj = eval(objName) // eslint-disable-line no-eval\n  return utils.replaceWithProxy(obj, propName, handler)\n}",execRecursively:"(obj = {}, typeFilter = [], fn) => {\n  function recurse(obj) {\n    for (const key in obj) {\n      if (obj[key] === undefined) {\n        continue\n      }\n      if (obj[key] && typeof obj[key] === 'object') {\n        recurse(obj[key])\n      } else {\n        if (obj[key] && typeFilter.includes(typeof obj[key])) {\n          fn.call(this, obj[key])\n        }\n      }\n    }\n  }\n  recurse(obj)\n  return obj\n}",stringifyFns:"(fnObj = { hello: () => 'world' }) => {\n  // Object.fromEntries() ponyfill (in 6 lines) - supported only in Node v12+, modern browsers are fine\n  // https://github.com/feross/fromentries\n  function fromEntries(iterable) {\n    return [...iterable].reduce((obj, [key, val]) => {\n      obj[key] = val\n      return obj\n    }, {})\n  }\n  return (Object.fromEntries || fromEntries)(\n    Object.entries(fnObj)\n      .filter(([key, value]) => typeof value === 'function')\n      .map(([key, value]) => [key, value.toString()]) // eslint-disable-line 
no-eval\n  )\n}",materializeFns:"(fnStrObj = { hello: \"() => 'world'\" }) => {\n  return Object.fromEntries(\n    Object.entries(fnStrObj).map(([key, value]) => {\n      if (value.startsWith('function')) {\n        // some trickery is needed to make oldschool functions work :-)\n        return [key, eval(`() => ${value}`)()] // eslint-disable-line no-eval\n      } else {\n        // arrow functions just work\n        return [key, eval(value)] // eslint-disable-line no-eval\n      }\n    })\n  )\n}",makeHandler:"() => ({\n  // Used by simple `navigator` getter evasions\n  getterValue: value => ({\n    apply(target, ctx, args) {\n      // Let's fetch the value first, to trigger and escalate potential errors\n      // Illegal invocations like `navigator.__proto__.vendor` will throw here\n      utils.cache.Reflect.apply(...arguments)\n      return value\n    }\n  })\n})",arrayEquals:"(array1, array2) => {\n  if (array1.length !== array2.length) {\n    return false\n  }\n  for (let i = 0; i < array1.length; ++i) {\n    if (array1[i] !== array2[i]) {\n      return false\n    }\n  }\n  return true\n}",memoize:"fn => {\n  const cache = []\n  return function(...args) {\n    if (!cache.some(c => utils.arrayEquals(c.key, args))) {\n      cache.push({ key: args, value: fn.apply(this, args) })\n    }\n    return cache.find(c => utils.arrayEquals(c.key, args)).value\n  }\n}"},_mainFunction:"(utils, { opts }) => {\n        if (!window.chrome) {\n          // Use the exact property descriptor found in headful Chrome\n          // fetch it via `Object.getOwnPropertyDescriptor(window, 'chrome')`\n          Object.defineProperty(window, 'chrome', {\n            writable: true,\n            enumerable: true,\n            configurable: false, // note!\n            value: {} // We'll extend that later\n          })\n        }\n\n        // That means we're running headful and don't need to mock anything\n        if ('loadTimes' in window.chrome) {\n          return // Nothing to do 
here\n        }\n\n        // Check that the Navigation Timing API v1 + v2 is available, we need that\n        if (\n          !window.performance ||\n          !window.performance.timing ||\n          !window.PerformancePaintTiming\n        ) {\n          return\n        }\n\n        const { performance } = window\n\n        // Some stuff is not available on about:blank as it requires a navigation to occur,\n        // let's harden the code to not fail then:\n        const ntEntryFallback = {\n          nextHopProtocol: 'h2',\n          type: 'other'\n        }\n\n        // The API exposes some funky info regarding the connection\n        const protocolInfo = {\n          get connectionInfo() {\n            const ntEntry =\n              performance.getEntriesByType('navigation')[0] || ntEntryFallback\n            return ntEntry.nextHopProtocol\n          },\n          get npnNegotiatedProtocol() {\n            // NPN is deprecated in favor of ALPN, but this implementation returns the\n            // HTTP/2 or HTTP2+QUIC/39 requests negotiated via ALPN.\n            const ntEntry =\n              performance.getEntriesByType('navigation')[0] || ntEntryFallback\n            return ['h2', 'hq'].includes(ntEntry.nextHopProtocol)\n              ? 
ntEntry.nextHopProtocol\n              : 'unknown'\n          },\n          get navigationType() {\n            const ntEntry =\n              performance.getEntriesByType('navigation')[0] || ntEntryFallback\n            return ntEntry.type\n          },\n          get wasAlternateProtocolAvailable() {\n            // The Alternate-Protocol header is deprecated in favor of Alt-Svc\n            // (https://www.mnot.net/blog/2016/03/09/alt-svc), so technically this\n            // should always return false.\n            return false\n          },\n          get wasFetchedViaSpdy() {\n            // SPDY is deprecated in favor of HTTP/2, but this implementation returns\n            // true for HTTP/2 or HTTP2+QUIC/39 as well.\n            const ntEntry =\n              performance.getEntriesByType('navigation')[0] || ntEntryFallback\n            return ['h2', 'hq'].includes(ntEntry.nextHopProtocol)\n          },\n          get wasNpnNegotiated() {\n            // NPN is deprecated in favor of ALPN, but this implementation returns true\n            // for HTTP/2 or HTTP2+QUIC/39 requests negotiated via ALPN.\n            const ntEntry =\n              performance.getEntriesByType('navigation')[0] || ntEntryFallback\n            return ['h2', 'hq'].includes(ntEntry.nextHopProtocol)\n          }\n        }\n\n        const { timing } = window.performance\n\n        // Truncate number to specific number of decimals, most of the `loadTimes` stuff has 3\n        function toFixed(num, fixed) {\n          var re = new RegExp('^-?\\\\d+(?:.\\\\d{0,' + (fixed || -1) + '})?')\n          return num.toString().match(re)[0]\n        }\n\n        const timingInfo = {\n          get firstPaintAfterLoadTime() {\n            // This was never actually implemented and always returns 0.\n            return 0\n          },\n          get requestTime() {\n            return timing.navigationStart / 1000\n          },\n          get startLoadTime() {\n            return 
timing.navigationStart / 1000\n          },\n          get commitLoadTime() {\n            return timing.responseStart / 1000\n          },\n          get finishDocumentLoadTime() {\n            return timing.domContentLoadedEventEnd / 1000\n          },\n          get finishLoadTime() {\n            return timing.loadEventEnd / 1000\n          },\n          get firstPaintTime() {\n            const fpEntry = performance.getEntriesByType('paint')[0] || {\n              startTime: timing.loadEventEnd / 1000 // Fallback if no navigation occured (`about:blank`)\n            }\n            return toFixed(\n              (fpEntry.startTime + performance.timeOrigin) / 1000,\n              3\n            )\n          }\n        }\n\n        window.chrome.loadTimes = function() {\n          return {\n            ...protocolInfo,\n            ...timingInfo\n          }\n        }\n        utils.patchToString(window.chrome.loadTimes)\n      }",_args:[{opts:{}}]}),(({_utilsFns:_utilsFns,_mainFunction:_mainFunction,_args:_args})=>{const utils=Object.fromEntries(Object.entries(_utilsFns).map((([key,value])=>[key,eval(value)])));utils.init(),eval(_mainFunction)(utils,..._args)})({_utilsFns:{init:"() => {\n  utils.preloadCache()\n}",stripProxyFromErrors:"(handler = {}) => {\n  const newHandler = {\n    setPrototypeOf: function (target, proto) {\n      if (proto === null)\n        throw new TypeError('Cannot convert object to primitive value')\n      if (Object.getPrototypeOf(target) === Object.getPrototypeOf(proto)) {\n        throw new TypeError('Cyclic __proto__ value')\n      }\n      return Reflect.setPrototypeOf(target, proto)\n    }\n  }\n  // We wrap each trap in the handler in a try/catch and modify the error stack if they throw\n  const traps = Object.getOwnPropertyNames(handler)\n  traps.forEach(trap => {\n    newHandler[trap] = function () {\n      try {\n        // Forward the call to the defined proxy handler\n        return handler[trap].apply(this, arguments || 
[])\n      } catch (err) {\n        // Stack traces differ per browser, we only support chromium based ones currently\n        if (!err || !err.stack || !err.stack.includes(`at `)) {\n          throw err\n        }\n\n        // When something throws within one of our traps the Proxy will show up in error stacks\n        // An earlier implementation of this code would simply strip lines with a blacklist,\n        // but it makes sense to be more surgical here and only remove lines related to our Proxy.\n        // We try to use a known \"anchor\" line for that and strip it with everything above it.\n        // If the anchor line cannot be found for some reason we fall back to our blacklist approach.\n\n        const stripWithBlacklist = (stack, stripFirstLine = true) => {\n          const blacklist = [\n            `at Reflect.${trap} `, // e.g. Reflect.get or Reflect.apply\n            `at Object.${trap} `, // e.g. Object.get or Object.apply\n            `at Object.newHandler.<computed> [as ${trap}] ` // caused by this very wrapper :-)\n          ]\n          return (\n            err.stack\n              .split('\\n')\n              // Always remove the first (file) line in the stack (guaranteed to be our proxy)\n              .filter((line, index) => !(index === 1 && stripFirstLine))\n              // Check if the line starts with one of our blacklisted strings\n              .filter(line => !blacklist.some(bl => line.trim().startsWith(bl)))\n              .join('\\n')\n          )\n        }\n\n        const stripWithAnchor = (stack, anchor) => {\n          const stackArr = stack.split('\\n')\n          anchor = anchor || `at Object.newHandler.<computed> [as ${trap}] ` // Known first Proxy line in chromium\n          const anchorIndex = stackArr.findIndex(line =>\n            line.trim().startsWith(anchor)\n          )\n          if (anchorIndex === -1) {\n            return false // 404, anchor not found\n          }\n          // Strip everything from the top 
until we reach the anchor line\n          // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. `TypeError`)\n          stackArr.splice(1, anchorIndex)\n          return stackArr.join('\\n')\n        }\n\n        // Special cases due to our nested toString proxies\n        err.stack = err.stack.replace(\n          'at Object.toString (',\n          'at Function.toString ('\n        )\n        if ((err.stack || '').includes('at Function.toString (')) {\n          err.stack = stripWithBlacklist(err.stack, false)\n          throw err\n        }\n\n        // Try using the anchor method, fallback to blacklist if necessary\n        err.stack = stripWithAnchor(err.stack) || stripWithBlacklist(err.stack)\n\n        throw err // Re-throw our now sanitized error\n      }\n    }\n  })\n  return newHandler\n}",stripErrorWithAnchor:"(err, anchor) => {\n  const stackArr = err.stack.split('\\n')\n  const anchorIndex = stackArr.findIndex(line => line.trim().startsWith(anchor))\n  if (anchorIndex === -1) {\n    return err // 404, anchor not found\n  }\n  // Strip everything from the top until we reach the anchor line (remove anchor line as well)\n  // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. `TypeError`)\n  stackArr.splice(1, anchorIndex)\n  err.stack = stackArr.join('\\n')\n  return err\n}",replaceProperty:"(obj, propName, descriptorOverrides = {}) => {\n  return Object.defineProperty(obj, propName, {\n    // Copy over the existing descriptors (writable, enumerable, configurable, etc)\n    ...(Object.getOwnPropertyDescriptor(obj, propName) || {}),\n    // Add our overrides (e.g. 
value, get())\n    ...descriptorOverrides\n  })\n}",preloadCache:"() => {\n  if (utils.cache) {\n    return\n  }\n  utils.cache = {\n    // Used in our proxies\n    Reflect: {\n      get: Reflect.get.bind(Reflect),\n      apply: Reflect.apply.bind(Reflect)\n    },\n    // Used in `makeNativeString`\n    nativeToStringStr: Function.toString + '' // => `function toString() { [native code] }`\n  }\n}",makeNativeString:"(name = '') => {\n  return utils.cache.nativeToStringStr.replace('toString', name || '')\n}",patchToString:"(obj, str = '') => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n      // `toString` targeted at our proxied Object detected\n      if (ctx === obj) {\n        // We either return the optional string verbatim or derive the most desired result automatically\n        return str || utils.makeNativeString(obj.name)\n      }\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",patchToStringNested:"(obj = {}) => {\n  return utils.execRecursively(obj, ['function'], utils.patchToString)\n}",redirectToString:"(proxyObj, originalObj) => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n\n      // `toString` targeted at our proxied Object detected\n      if (ctx === proxyObj) {\n        const fallback = () =>\n          originalObj && originalObj.name\n            ? utils.makeNativeString(originalObj.name)\n            : utils.makeNativeString(proxyObj.name)\n\n        // Return the toString representation of our original object if possible\n        return originalObj + '' || fallback()\n      }\n\n      if (typeof ctx === 'undefined' || ctx === null) {\n        return target.call(ctx)\n      }\n\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",replaceWithProxy:"(obj, propName, handler) => {\n  const originalObj = obj[propName]\n  const proxyObj = new Proxy(obj[propName], utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.redirectToString(proxyObj, originalObj)\n\n  return true\n}",replaceGetterWithProxy:"(obj, propName, handler) => {\n  const fn = Object.getOwnPropertyDescriptor(obj, propName).get\n  const fnStr = fn.toString() // special getter function string\n  const proxyObj = new Proxy(fn, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { get: proxyObj })\n  utils.patchToString(proxyObj, fnStr)\n\n  return true\n}",replaceGetterSetter:"(obj, propName, handlerGetterSetter) => {\n  const ownPropertyDescriptor = Object.getOwnPropertyDescriptor(obj, propName)\n  const handler = { ...ownPropertyDescriptor }\n\n  if (handlerGetterSetter.get !== undefined) {\n    const nativeFn = ownPropertyDescriptor.get\n    handler.get = function() {\n      return handlerGetterSetter.get.call(this, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.get, nativeFn)\n  }\n\n  if (handlerGetterSetter.set !== undefined) {\n    const nativeFn = ownPropertyDescriptor.set\n    handler.set = function(newValue) {\n      handlerGetterSetter.set.call(this, newValue, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.set, 
nativeFn)\n  }\n\n  Object.defineProperty(obj, propName, handler)\n}",mockWithProxy:"(obj, propName, pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.patchToString(proxyObj)\n\n  return true\n}",createProxy:"(pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n  utils.patchToString(proxyObj)\n\n  return proxyObj\n}",splitObjPath:"objPath => ({\n  // Remove last dot entry (property) ==> `HTMLMediaElement.prototype`\n  objName: objPath.split('.').slice(0, -1).join('.'),\n  // Extract last dot entry ==> `canPlayType`\n  propName: objPath.split('.').slice(-1)[0]\n})",replaceObjPathWithProxy:"(objPath, handler) => {\n  const { objName, propName } = utils.splitObjPath(objPath)\n  const obj = eval(objName) // eslint-disable-line no-eval\n  return utils.replaceWithProxy(obj, propName, handler)\n}",execRecursively:"(obj = {}, typeFilter = [], fn) => {\n  function recurse(obj) {\n    for (const key in obj) {\n      if (obj[key] === undefined) {\n        continue\n      }\n      if (obj[key] && typeof obj[key] === 'object') {\n        recurse(obj[key])\n      } else {\n        if (obj[key] && typeFilter.includes(typeof obj[key])) {\n          fn.call(this, obj[key])\n        }\n      }\n    }\n  }\n  recurse(obj)\n  return obj\n}",stringifyFns:"(fnObj = { hello: () => 'world' }) => {\n  // Object.fromEntries() ponyfill (in 6 lines) - supported only in Node v12+, modern browsers are fine\n  // https://github.com/feross/fromentries\n  function fromEntries(iterable) {\n    return [...iterable].reduce((obj, [key, val]) => {\n      obj[key] = val\n      return obj\n    }, {})\n  }\n  return (Object.fromEntries || fromEntries)(\n    Object.entries(fnObj)\n      .filter(([key, value]) => typeof value === 'function')\n      .map(([key, value]) => [key, value.toString()]) // eslint-disable-line 
no-eval\n  )\n}",materializeFns:"(fnStrObj = { hello: \"() => 'world'\" }) => {\n  return Object.fromEntries(\n    Object.entries(fnStrObj).map(([key, value]) => {\n      if (value.startsWith('function')) {\n        // some trickery is needed to make oldschool functions work :-)\n        return [key, eval(`() => ${value}`)()] // eslint-disable-line no-eval\n      } else {\n        // arrow functions just work\n        return [key, eval(value)] // eslint-disable-line no-eval\n      }\n    })\n  )\n}",makeHandler:"() => ({\n  // Used by simple `navigator` getter evasions\n  getterValue: value => ({\n    apply(target, ctx, args) {\n      // Let's fetch the value first, to trigger and escalate potential errors\n      // Illegal invocations like `navigator.__proto__.vendor` will throw here\n      utils.cache.Reflect.apply(...arguments)\n      return value\n    }\n  })\n})",arrayEquals:"(array1, array2) => {\n  if (array1.length !== array2.length) {\n    return false\n  }\n  for (let i = 0; i < array1.length; ++i) {\n    if (array1[i] !== array2[i]) {\n      return false\n    }\n  }\n  return true\n}",memoize:"fn => {\n  const cache = []\n  return function(...args) {\n    if (!cache.some(c => utils.arrayEquals(c.key, args))) {\n      cache.push({ key: args, value: fn.apply(this, args) })\n    }\n    return cache.find(c => utils.arrayEquals(c.key, args)).value\n  }\n}"},_mainFunction:"(utils, { opts, STATIC_DATA }) => {\n        if (!window.chrome) {\n          // Use the exact property descriptor found in headful Chrome\n          // fetch it via `Object.getOwnPropertyDescriptor(window, 'chrome')`\n          Object.defineProperty(window, 'chrome', {\n            writable: true,\n            enumerable: true,\n            configurable: false, // note!\n            value: {} // We'll extend that later\n          })\n        }\n\n        // That means we're running headful and don't need to mock anything\n        const existsAlready = 'runtime' in window.chrome\n        // 
`chrome.runtime` is only exposed on secure origins\n        const isNotSecure = !window.location.protocol.startsWith('https')\n        if (existsAlready || (isNotSecure && !opts.runOnInsecureOrigins)) {\n          return // Nothing to do here\n        }\n\n        window.chrome.runtime = {\n          // There's a bunch of static data in that property which doesn't seem to change,\n          // we should periodically check for updates: `JSON.stringify(window.chrome.runtime, null, 2)`\n          ...STATIC_DATA,\n          // `chrome.runtime.id` is extension related and returns undefined in Chrome\n          get id() {\n            return undefined\n          },\n          // These two require more sophisticated mocks\n          connect: null,\n          sendMessage: null\n        }\n\n        const makeCustomRuntimeErrors = (preamble, method, extensionId) => ({\n          NoMatchingSignature: new TypeError(\n            preamble + `No matching signature.`\n          ),\n          MustSpecifyExtensionID: new TypeError(\n            preamble +\n              `${method} called from a webpage must specify an Extension ID (string) for its first argument.`\n          ),\n          InvalidExtensionID: new TypeError(\n            preamble + `Invalid extension id: '${extensionId}'`\n          )\n        })\n\n        // Valid Extension IDs are 32 characters in length and use the letter `a` to `p`:\n        // https://source.chromium.org/chromium/chromium/src/+/master:components/crx_file/id_util.cc;drc=14a055ccb17e8c8d5d437fe080faba4c6f07beac;l=90\n        const isValidExtensionID = str =>\n          str.length === 32 && str.toLowerCase().match(/^[a-p]+$/)\n\n        /** Mock `chrome.runtime.sendMessage` */\n        const sendMessageHandler = {\n          apply: function(target, ctx, args) {\n            const [extensionId, options, responseCallback] = args || []\n\n            // Define custom errors\n            const errorPreamble = `Error in invocation of 
runtime.sendMessage(optional string extensionId, any message, optional object options, optional function responseCallback): `\n            const Errors = makeCustomRuntimeErrors(\n              errorPreamble,\n              `chrome.runtime.sendMessage()`,\n              extensionId\n            )\n\n            // Check if the call signature looks ok\n            const noArguments = args.length === 0\n            const tooManyArguments = args.length > 4\n            const incorrectOptions = options && typeof options !== 'object'\n            const incorrectResponseCallback =\n              responseCallback && typeof responseCallback !== 'function'\n            if (\n              noArguments ||\n              tooManyArguments ||\n              incorrectOptions ||\n              incorrectResponseCallback\n            ) {\n              throw Errors.NoMatchingSignature\n            }\n\n            // At least 2 arguments are required before we even validate the extension ID\n            if (args.length < 2) {\n              throw Errors.MustSpecifyExtensionID\n            }\n\n            // Now let's make sure we got a string as extension ID\n            if (typeof extensionId !== 'string') {\n              throw Errors.NoMatchingSignature\n            }\n\n            if (!isValidExtensionID(extensionId)) {\n              throw Errors.InvalidExtensionID\n            }\n\n            return undefined // Normal behavior\n          }\n        }\n        utils.mockWithProxy(\n          window.chrome.runtime,\n          'sendMessage',\n          function sendMessage() {},\n          sendMessageHandler\n        )\n\n        /**\n         * Mock `chrome.runtime.connect`\n         *\n         * @see https://developer.chrome.com/apps/runtime#method-connect\n         */\n        const connectHandler = {\n          apply: function(target, ctx, args) {\n            const [extensionId, connectInfo] = args || []\n\n            // Define custom errors\n            const 
errorPreamble = `Error in invocation of runtime.connect(optional string extensionId, optional object connectInfo): `\n            const Errors = makeCustomRuntimeErrors(\n              errorPreamble,\n              `chrome.runtime.connect()`,\n              extensionId\n            )\n\n            // Behavior differs a bit from sendMessage:\n            const noArguments = args.length === 0\n            const emptyStringArgument = args.length === 1 && extensionId === ''\n            if (noArguments || emptyStringArgument) {\n              throw Errors.MustSpecifyExtensionID\n            }\n\n            const tooManyArguments = args.length > 2\n            const incorrectConnectInfoType =\n              connectInfo && typeof connectInfo !== 'object'\n\n            if (tooManyArguments || incorrectConnectInfoType) {\n              throw Errors.NoMatchingSignature\n            }\n\n            const extensionIdIsString = typeof extensionId === 'string'\n            if (extensionIdIsString && extensionId === '') {\n              throw Errors.MustSpecifyExtensionID\n            }\n            if (extensionIdIsString && !isValidExtensionID(extensionId)) {\n              throw Errors.InvalidExtensionID\n            }\n\n            // There's another edge-case here: extensionId is optional so we might find a connectInfo object as first param, which we need to validate\n            const validateConnectInfo = ci => {\n              // More than a first param connectInfo as been provided\n              if (args.length > 1) {\n                throw Errors.NoMatchingSignature\n              }\n              // An empty connectInfo has been provided\n              if (Object.keys(ci).length === 0) {\n                throw Errors.MustSpecifyExtensionID\n              }\n              // Loop over all connectInfo props an check them\n              Object.entries(ci).forEach(([k, v]) => {\n                const isExpected = ['name', 'includeTlsChannelId'].includes(k)\n          
      if (!isExpected) {\n                  throw new TypeError(\n                    errorPreamble + `Unexpected property: '${k}'.`\n                  )\n                }\n                const MismatchError = (propName, expected, found) =>\n                  TypeError(\n                    errorPreamble +\n                      `Error at property '${propName}': Invalid type: expected ${expected}, found ${found}.`\n                  )\n                if (k === 'name' && typeof v !== 'string') {\n                  throw MismatchError(k, 'string', typeof v)\n                }\n                if (k === 'includeTlsChannelId' && typeof v !== 'boolean') {\n                  throw MismatchError(k, 'boolean', typeof v)\n                }\n              })\n            }\n            if (typeof extensionId === 'object') {\n              validateConnectInfo(extensionId)\n              throw Errors.MustSpecifyExtensionID\n            }\n\n            // Unfortunately even when the connect fails Chrome will return an object with methods we need to mock as well\n            return utils.patchToStringNested(makeConnectResponse())\n          }\n        }\n        utils.mockWithProxy(\n          window.chrome.runtime,\n          'connect',\n          function connect() {},\n          connectHandler\n        )\n\n        function makeConnectResponse() {\n          const onSomething = () => ({\n            addListener: function addListener() {},\n            dispatch: function dispatch() {},\n            hasListener: function hasListener() {},\n            hasListeners: function hasListeners() {\n              return false\n            },\n            removeListener: function removeListener() {}\n          })\n\n          const response = {\n            name: '',\n            sender: undefined,\n            disconnect: function disconnect() {},\n            onDisconnect: onSomething(),\n            onMessage: onSomething(),\n            postMessage: function postMessage() {\n    
          if (!arguments.length) {\n                throw new TypeError(`Insufficient number of arguments.`)\n              }\n              throw new Error(`Attempting to use a disconnected port object`)\n            }\n          }\n          return response\n        }\n      }",_args:[{opts:{runOnInsecureOrigins:!1},STATIC_DATA:{OnInstalledReason:{CHROME_UPDATE:"chrome_update",INSTALL:"install",SHARED_MODULE_UPDATE:"shared_module_update",UPDATE:"update"},OnRestartRequiredReason:{APP_UPDATE:"app_update",OS_UPDATE:"os_update",PERIODIC:"periodic"},PlatformArch:{ARM:"arm",ARM64:"arm64",MIPS:"mips",MIPS64:"mips64",X86_32:"x86-32",X86_64:"x86-64"},PlatformNaclArch:{ARM:"arm",MIPS:"mips",MIPS64:"mips64",X86_32:"x86-32",X86_64:"x86-64"},PlatformOs:{ANDROID:"android",CROS:"cros",LINUX:"linux",MAC:"mac",OPENBSD:"openbsd",WIN:"win"},RequestUpdateCheckStatus:{NO_UPDATE:"no_update",THROTTLED:"throttled",UPDATE_AVAILABLE:"update_available"}}}]}),(({_utilsFns:_utilsFns,_mainFunction:_mainFunction,_args:_args})=>{const utils=Object.fromEntries(Object.entries(_utilsFns).map((([key,value])=>[key,eval(value)])));utils.init(),eval(_mainFunction)(utils,..._args)})({_utilsFns:{init:"() => {\n  utils.preloadCache()\n}",stripProxyFromErrors:"(handler = {}) => {\n  const newHandler = {\n    setPrototypeOf: function (target, proto) {\n      if (proto === null)\n        throw new TypeError('Cannot convert object to primitive value')\n      if (Object.getPrototypeOf(target) === Object.getPrototypeOf(proto)) {\n        throw new TypeError('Cyclic __proto__ value')\n      }\n      return Reflect.setPrototypeOf(target, proto)\n    }\n  }\n  // We wrap each trap in the handler in a try/catch and modify the error stack if they throw\n  const traps = Object.getOwnPropertyNames(handler)\n  traps.forEach(trap => {\n    newHandler[trap] = function () {\n      try {\n        // Forward the call to the defined proxy handler\n        return handler[trap].apply(this, arguments || [])\n      } catch 
(err) {\n        // Stack traces differ per browser, we only support chromium based ones currently\n        if (!err || !err.stack || !err.stack.includes(`at `)) {\n          throw err\n        }\n\n        // When something throws within one of our traps the Proxy will show up in error stacks\n        // An earlier implementation of this code would simply strip lines with a blacklist,\n        // but it makes sense to be more surgical here and only remove lines related to our Proxy.\n        // We try to use a known \"anchor\" line for that and strip it with everything above it.\n        // If the anchor line cannot be found for some reason we fall back to our blacklist approach.\n\n        const stripWithBlacklist = (stack, stripFirstLine = true) => {\n          const blacklist = [\n            `at Reflect.${trap} `, // e.g. Reflect.get or Reflect.apply\n            `at Object.${trap} `, // e.g. Object.get or Object.apply\n            `at Object.newHandler.<computed> [as ${trap}] ` // caused by this very wrapper :-)\n          ]\n          return (\n            err.stack\n              .split('\\n')\n              // Always remove the first (file) line in the stack (guaranteed to be our proxy)\n              .filter((line, index) => !(index === 1 && stripFirstLine))\n              // Check if the line starts with one of our blacklisted strings\n              .filter(line => !blacklist.some(bl => line.trim().startsWith(bl)))\n              .join('\\n')\n          )\n        }\n\n        const stripWithAnchor = (stack, anchor) => {\n          const stackArr = stack.split('\\n')\n          anchor = anchor || `at Object.newHandler.<computed> [as ${trap}] ` // Known first Proxy line in chromium\n          const anchorIndex = stackArr.findIndex(line =>\n            line.trim().startsWith(anchor)\n          )\n          if (anchorIndex === -1) {\n            return false // 404, anchor not found\n          }\n          // Strip everything from the top until we reach the 
anchor line\n          // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. `TypeError`)\n          stackArr.splice(1, anchorIndex)\n          return stackArr.join('\\n')\n        }\n\n        // Special cases due to our nested toString proxies\n        err.stack = err.stack.replace(\n          'at Object.toString (',\n          'at Function.toString ('\n        )\n        if ((err.stack || '').includes('at Function.toString (')) {\n          err.stack = stripWithBlacklist(err.stack, false)\n          throw err\n        }\n\n        // Try using the anchor method, fallback to blacklist if necessary\n        err.stack = stripWithAnchor(err.stack) || stripWithBlacklist(err.stack)\n\n        throw err // Re-throw our now sanitized error\n      }\n    }\n  })\n  return newHandler\n}",stripErrorWithAnchor:"(err, anchor) => {\n  const stackArr = err.stack.split('\\n')\n  const anchorIndex = stackArr.findIndex(line => line.trim().startsWith(anchor))\n  if (anchorIndex === -1) {\n    return err // 404, anchor not found\n  }\n  // Strip everything from the top until we reach the anchor line (remove anchor line as well)\n  // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. `TypeError`)\n  stackArr.splice(1, anchorIndex)\n  err.stack = stackArr.join('\\n')\n  return err\n}",replaceProperty:"(obj, propName, descriptorOverrides = {}) => {\n  return Object.defineProperty(obj, propName, {\n    // Copy over the existing descriptors (writable, enumerable, configurable, etc)\n    ...(Object.getOwnPropertyDescriptor(obj, propName) || {}),\n    // Add our overrides (e.g. 
value, get())\n    ...descriptorOverrides\n  })\n}",preloadCache:"() => {\n  if (utils.cache) {\n    return\n  }\n  utils.cache = {\n    // Used in our proxies\n    Reflect: {\n      get: Reflect.get.bind(Reflect),\n      apply: Reflect.apply.bind(Reflect)\n    },\n    // Used in `makeNativeString`\n    nativeToStringStr: Function.toString + '' // => `function toString() { [native code] }`\n  }\n}",makeNativeString:"(name = '') => {\n  return utils.cache.nativeToStringStr.replace('toString', name || '')\n}",patchToString:"(obj, str = '') => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n      // `toString` targeted at our proxied Object detected\n      if (ctx === obj) {\n        // We either return the optional string verbatim or derive the most desired result automatically\n        return str || utils.makeNativeString(obj.name)\n      }\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",patchToStringNested:"(obj = {}) => {\n  return utils.execRecursively(obj, ['function'], utils.patchToString)\n}",redirectToString:"(proxyObj, originalObj) => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n\n      // `toString` targeted at our proxied Object detected\n      if (ctx === proxyObj) {\n        const fallback = () =>\n          originalObj && originalObj.name\n            ? utils.makeNativeString(originalObj.name)\n            : utils.makeNativeString(proxyObj.name)\n\n        // Return the toString representation of our original object if possible\n        return originalObj + '' || fallback()\n      }\n\n      if (typeof ctx === 'undefined' || ctx === null) {\n        return target.call(ctx)\n      }\n\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",replaceWithProxy:"(obj, propName, handler) => {\n  const originalObj = obj[propName]\n  const proxyObj = new Proxy(obj[propName], utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.redirectToString(proxyObj, originalObj)\n\n  return true\n}",replaceGetterWithProxy:"(obj, propName, handler) => {\n  const fn = Object.getOwnPropertyDescriptor(obj, propName).get\n  const fnStr = fn.toString() // special getter function string\n  const proxyObj = new Proxy(fn, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { get: proxyObj })\n  utils.patchToString(proxyObj, fnStr)\n\n  return true\n}",replaceGetterSetter:"(obj, propName, handlerGetterSetter) => {\n  const ownPropertyDescriptor = Object.getOwnPropertyDescriptor(obj, propName)\n  const handler = { ...ownPropertyDescriptor }\n\n  if (handlerGetterSetter.get !== undefined) {\n    const nativeFn = ownPropertyDescriptor.get\n    handler.get = function() {\n      return handlerGetterSetter.get.call(this, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.get, nativeFn)\n  }\n\n  if (handlerGetterSetter.set !== undefined) {\n    const nativeFn = ownPropertyDescriptor.set\n    handler.set = function(newValue) {\n      handlerGetterSetter.set.call(this, newValue, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.set, 
nativeFn)\n  }\n\n  Object.defineProperty(obj, propName, handler)\n}",mockWithProxy:"(obj, propName, pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.patchToString(proxyObj)\n\n  return true\n}",createProxy:"(pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n  utils.patchToString(proxyObj)\n\n  return proxyObj\n}",splitObjPath:"objPath => ({\n  // Remove last dot entry (property) ==> `HTMLMediaElement.prototype`\n  objName: objPath.split('.').slice(0, -1).join('.'),\n  // Extract last dot entry ==> `canPlayType`\n  propName: objPath.split('.').slice(-1)[0]\n})",replaceObjPathWithProxy:"(objPath, handler) => {\n  const { objName, propName } = utils.splitObjPath(objPath)\n  const obj = eval(objName) // eslint-disable-line no-eval\n  return utils.replaceWithProxy(obj, propName, handler)\n}",execRecursively:"(obj = {}, typeFilter = [], fn) => {\n  function recurse(obj) {\n    for (const key in obj) {\n      if (obj[key] === undefined) {\n        continue\n      }\n      if (obj[key] && typeof obj[key] === 'object') {\n        recurse(obj[key])\n      } else {\n        if (obj[key] && typeFilter.includes(typeof obj[key])) {\n          fn.call(this, obj[key])\n        }\n      }\n    }\n  }\n  recurse(obj)\n  return obj\n}",stringifyFns:"(fnObj = { hello: () => 'world' }) => {\n  // Object.fromEntries() ponyfill (in 6 lines) - supported only in Node v12+, modern browsers are fine\n  // https://github.com/feross/fromentries\n  function fromEntries(iterable) {\n    return [...iterable].reduce((obj, [key, val]) => {\n      obj[key] = val\n      return obj\n    }, {})\n  }\n  return (Object.fromEntries || fromEntries)(\n    Object.entries(fnObj)\n      .filter(([key, value]) => typeof value === 'function')\n      .map(([key, value]) => [key, value.toString()]) // eslint-disable-line 
no-eval\n  )\n}",materializeFns:"(fnStrObj = { hello: \"() => 'world'\" }) => {\n  return Object.fromEntries(\n    Object.entries(fnStrObj).map(([key, value]) => {\n      if (value.startsWith('function')) {\n        // some trickery is needed to make oldschool functions work :-)\n        return [key, eval(`() => ${value}`)()] // eslint-disable-line no-eval\n      } else {\n        // arrow functions just work\n        return [key, eval(value)] // eslint-disable-line no-eval\n      }\n    })\n  )\n}",makeHandler:"() => ({\n  // Used by simple `navigator` getter evasions\n  getterValue: value => ({\n    apply(target, ctx, args) {\n      // Let's fetch the value first, to trigger and escalate potential errors\n      // Illegal invocations like `navigator.__proto__.vendor` will throw here\n      utils.cache.Reflect.apply(...arguments)\n      return value\n    }\n  })\n})",arrayEquals:"(array1, array2) => {\n  if (array1.length !== array2.length) {\n    return false\n  }\n  for (let i = 0; i < array1.length; ++i) {\n    if (array1[i] !== array2[i]) {\n      return false\n    }\n  }\n  return true\n}",memoize:"fn => {\n  const cache = []\n  return function(...args) {\n    if (!cache.some(c => utils.arrayEquals(c.key, args))) {\n      cache.push({ key: args, value: fn.apply(this, args) })\n    }\n    return cache.find(c => utils.arrayEquals(c.key, args)).value\n  }\n}"},_mainFunction:"utils => {\n      /**\n       * Input might look funky, we need to normalize it so e.g. 
whitespace isn't an issue for our spoofing.\n       *\n       * @example\n       * video/webm; codecs=\"vp8, vorbis\"\n       * video/mp4; codecs=\"avc1.42E01E\"\n       * audio/x-m4a;\n       * audio/ogg; codecs=\"vorbis\"\n       * @param {String} arg\n       */\n      const parseInput = arg => {\n        const [mime, codecStr] = arg.trim().split(';')\n        let codecs = []\n        if (codecStr && codecStr.includes('codecs=\"')) {\n          codecs = codecStr\n            .trim()\n            .replace(`codecs=\"`, '')\n            .replace(`\"`, '')\n            .trim()\n            .split(',')\n            .filter(x => !!x)\n            .map(x => x.trim())\n        }\n        return {\n          mime,\n          codecStr,\n          codecs\n        }\n      }\n\n      const canPlayType = {\n        // Intercept certain requests\n        apply: function(target, ctx, args) {\n          if (!args || !args.length) {\n            return target.apply(ctx, args)\n          }\n          const { mime, codecs } = parseInput(args[0])\n          // This specific mp4 codec is missing in Chromium\n          if (mime === 'video/mp4') {\n            if (codecs.includes('avc1.42E01E')) {\n              return 'probably'\n            }\n          }\n          // This mimetype is only supported if no codecs are specified\n          if (mime === 'audio/x-m4a' && !codecs.length) {\n            return 'maybe'\n          }\n\n          // This mimetype is only supported if no codecs are specified\n          if (mime === 'audio/aac' && !codecs.length) {\n            return 'probably'\n          }\n          // Everything else as usual\n          return target.apply(ctx, args)\n        }\n      }\n\n      /* global HTMLMediaElement */\n      utils.replaceWithProxy(\n        HTMLMediaElement.prototype,\n        'canPlayType',\n        canPlayType\n      )\n    }",_args:[]}),(({_utilsFns:_utilsFns,_mainFunction:_mainFunction,_args:_args})=>{const 
utils=Object.fromEntries(Object.entries(_utilsFns).map((([key,value])=>[key,eval(value)])));utils.init(),eval(_mainFunction)(utils,..._args)})({_utilsFns:{init:"() => {\n  utils.preloadCache()\n}",stripProxyFromErrors:"(handler = {}) => {\n  const newHandler = {\n    setPrototypeOf: function (target, proto) {\n      if (proto === null)\n        throw new TypeError('Cannot convert object to primitive value')\n      if (Object.getPrototypeOf(target) === Object.getPrototypeOf(proto)) {\n        throw new TypeError('Cyclic __proto__ value')\n      }\n      return Reflect.setPrototypeOf(target, proto)\n    }\n  }\n  // We wrap each trap in the handler in a try/catch and modify the error stack if they throw\n  const traps = Object.getOwnPropertyNames(handler)\n  traps.forEach(trap => {\n    newHandler[trap] = function () {\n      try {\n        // Forward the call to the defined proxy handler\n        return handler[trap].apply(this, arguments || [])\n      } catch (err) {\n        // Stack traces differ per browser, we only support chromium based ones currently\n        if (!err || !err.stack || !err.stack.includes(`at `)) {\n          throw err\n        }\n\n        // When something throws within one of our traps the Proxy will show up in error stacks\n        // An earlier implementation of this code would simply strip lines with a blacklist,\n        // but it makes sense to be more surgical here and only remove lines related to our Proxy.\n        // We try to use a known \"anchor\" line for that and strip it with everything above it.\n        // If the anchor line cannot be found for some reason we fall back to our blacklist approach.\n\n        const stripWithBlacklist = (stack, stripFirstLine = true) => {\n          const blacklist = [\n            `at Reflect.${trap} `, // e.g. Reflect.get or Reflect.apply\n            `at Object.${trap} `, // e.g. 
Object.get or Object.apply\n            `at Object.newHandler.<computed> [as ${trap}] ` // caused by this very wrapper :-)\n          ]\n          return (\n            err.stack\n              .split('\\n')\n              // Always remove the first (file) line in the stack (guaranteed to be our proxy)\n              .filter((line, index) => !(index === 1 && stripFirstLine))\n              // Check if the line starts with one of our blacklisted strings\n              .filter(line => !blacklist.some(bl => line.trim().startsWith(bl)))\n              .join('\\n')\n          )\n        }\n\n        const stripWithAnchor = (stack, anchor) => {\n          const stackArr = stack.split('\\n')\n          anchor = anchor || `at Object.newHandler.<computed> [as ${trap}] ` // Known first Proxy line in chromium\n          const anchorIndex = stackArr.findIndex(line =>\n            line.trim().startsWith(anchor)\n          )\n          if (anchorIndex === -1) {\n            return false // 404, anchor not found\n          }\n          // Strip everything from the top until we reach the anchor line\n          // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. 
`TypeError`)\n          stackArr.splice(1, anchorIndex)\n          return stackArr.join('\\n')\n        }\n\n        // Special cases due to our nested toString proxies\n        err.stack = err.stack.replace(\n          'at Object.toString (',\n          'at Function.toString ('\n        )\n        if ((err.stack || '').includes('at Function.toString (')) {\n          err.stack = stripWithBlacklist(err.stack, false)\n          throw err\n        }\n\n        // Try using the anchor method, fallback to blacklist if necessary\n        err.stack = stripWithAnchor(err.stack) || stripWithBlacklist(err.stack)\n\n        throw err // Re-throw our now sanitized error\n      }\n    }\n  })\n  return newHandler\n}",stripErrorWithAnchor:"(err, anchor) => {\n  const stackArr = err.stack.split('\\n')\n  const anchorIndex = stackArr.findIndex(line => line.trim().startsWith(anchor))\n  if (anchorIndex === -1) {\n    return err // 404, anchor not found\n  }\n  // Strip everything from the top until we reach the anchor line (remove anchor line as well)\n  // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. `TypeError`)\n  stackArr.splice(1, anchorIndex)\n  err.stack = stackArr.join('\\n')\n  return err\n}",replaceProperty:"(obj, propName, descriptorOverrides = {}) => {\n  return Object.defineProperty(obj, propName, {\n    // Copy over the existing descriptors (writable, enumerable, configurable, etc)\n    ...(Object.getOwnPropertyDescriptor(obj, propName) || {}),\n    // Add our overrides (e.g. 
value, get())\n    ...descriptorOverrides\n  })\n}",preloadCache:"() => {\n  if (utils.cache) {\n    return\n  }\n  utils.cache = {\n    // Used in our proxies\n    Reflect: {\n      get: Reflect.get.bind(Reflect),\n      apply: Reflect.apply.bind(Reflect)\n    },\n    // Used in `makeNativeString`\n    nativeToStringStr: Function.toString + '' // => `function toString() { [native code] }`\n  }\n}",makeNativeString:"(name = '') => {\n  return utils.cache.nativeToStringStr.replace('toString', name || '')\n}",patchToString:"(obj, str = '') => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n      // `toString` targeted at our proxied Object detected\n      if (ctx === obj) {\n        // We either return the optional string verbatim or derive the most desired result automatically\n        return str || utils.makeNativeString(obj.name)\n      }\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",patchToStringNested:"(obj = {}) => {\n  return utils.execRecursively(obj, ['function'], utils.patchToString)\n}",redirectToString:"(proxyObj, originalObj) => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n\n      // `toString` targeted at our proxied Object detected\n      if (ctx === proxyObj) {\n        const fallback = () =>\n          originalObj && originalObj.name\n            ? utils.makeNativeString(originalObj.name)\n            : utils.makeNativeString(proxyObj.name)\n\n        // Return the toString representation of our original object if possible\n        return originalObj + '' || fallback()\n      }\n\n      if (typeof ctx === 'undefined' || ctx === null) {\n        return target.call(ctx)\n      }\n\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",replaceWithProxy:"(obj, propName, handler) => {\n  const originalObj = obj[propName]\n  const proxyObj = new Proxy(obj[propName], utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.redirectToString(proxyObj, originalObj)\n\n  return true\n}",replaceGetterWithProxy:"(obj, propName, handler) => {\n  const fn = Object.getOwnPropertyDescriptor(obj, propName).get\n  const fnStr = fn.toString() // special getter function string\n  const proxyObj = new Proxy(fn, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { get: proxyObj })\n  utils.patchToString(proxyObj, fnStr)\n\n  return true\n}",replaceGetterSetter:"(obj, propName, handlerGetterSetter) => {\n  const ownPropertyDescriptor = Object.getOwnPropertyDescriptor(obj, propName)\n  const handler = { ...ownPropertyDescriptor }\n\n  if (handlerGetterSetter.get !== undefined) {\n    const nativeFn = ownPropertyDescriptor.get\n    handler.get = function() {\n      return handlerGetterSetter.get.call(this, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.get, nativeFn)\n  }\n\n  if (handlerGetterSetter.set !== undefined) {\n    const nativeFn = ownPropertyDescriptor.set\n    handler.set = function(newValue) {\n      handlerGetterSetter.set.call(this, newValue, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.set, 
nativeFn)\n  }\n\n  Object.defineProperty(obj, propName, handler)\n}",mockWithProxy:"(obj, propName, pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.patchToString(proxyObj)\n\n  return true\n}",createProxy:"(pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n  utils.patchToString(proxyObj)\n\n  return proxyObj\n}",splitObjPath:"objPath => ({\n  // Remove last dot entry (property) ==> `HTMLMediaElement.prototype`\n  objName: objPath.split('.').slice(0, -1).join('.'),\n  // Extract last dot entry ==> `canPlayType`\n  propName: objPath.split('.').slice(-1)[0]\n})",replaceObjPathWithProxy:"(objPath, handler) => {\n  const { objName, propName } = utils.splitObjPath(objPath)\n  const obj = eval(objName) // eslint-disable-line no-eval\n  return utils.replaceWithProxy(obj, propName, handler)\n}",execRecursively:"(obj = {}, typeFilter = [], fn) => {\n  function recurse(obj) {\n    for (const key in obj) {\n      if (obj[key] === undefined) {\n        continue\n      }\n      if (obj[key] && typeof obj[key] === 'object') {\n        recurse(obj[key])\n      } else {\n        if (obj[key] && typeFilter.includes(typeof obj[key])) {\n          fn.call(this, obj[key])\n        }\n      }\n    }\n  }\n  recurse(obj)\n  return obj\n}",stringifyFns:"(fnObj = { hello: () => 'world' }) => {\n  // Object.fromEntries() ponyfill (in 6 lines) - supported only in Node v12+, modern browsers are fine\n  // https://github.com/feross/fromentries\n  function fromEntries(iterable) {\n    return [...iterable].reduce((obj, [key, val]) => {\n      obj[key] = val\n      return obj\n    }, {})\n  }\n  return (Object.fromEntries || fromEntries)(\n    Object.entries(fnObj)\n      .filter(([key, value]) => typeof value === 'function')\n      .map(([key, value]) => [key, value.toString()]) // eslint-disable-line 
no-eval\n  )\n}",materializeFns:"(fnStrObj = { hello: \"() => 'world'\" }) => {\n  return Object.fromEntries(\n    Object.entries(fnStrObj).map(([key, value]) => {\n      if (value.startsWith('function')) {\n        // some trickery is needed to make oldschool functions work :-)\n        return [key, eval(`() => ${value}`)()] // eslint-disable-line no-eval\n      } else {\n        // arrow functions just work\n        return [key, eval(value)] // eslint-disable-line no-eval\n      }\n    })\n  )\n}",makeHandler:"() => ({\n  // Used by simple `navigator` getter evasions\n  getterValue: value => ({\n    apply(target, ctx, args) {\n      // Let's fetch the value first, to trigger and escalate potential errors\n      // Illegal invocations like `navigator.__proto__.vendor` will throw here\n      utils.cache.Reflect.apply(...arguments)\n      return value\n    }\n  })\n})",arrayEquals:"(array1, array2) => {\n  if (array1.length !== array2.length) {\n    return false\n  }\n  for (let i = 0; i < array1.length; ++i) {\n    if (array1[i] !== array2[i]) {\n      return false\n    }\n  }\n  return true\n}",memoize:"fn => {\n  const cache = []\n  return function(...args) {\n    if (!cache.some(c => utils.arrayEquals(c.key, args))) {\n      cache.push({ key: args, value: fn.apply(this, args) })\n    }\n    return cache.find(c => utils.arrayEquals(c.key, args)).value\n  }\n}"},_mainFunction:"(utils, { opts }) => {\n        utils.replaceGetterWithProxy(\n          Object.getPrototypeOf(navigator),\n          'hardwareConcurrency',\n          utils.makeHandler().getterValue(opts.hardwareConcurrency)\n        )\n      }",_args:[{opts:{hardwareConcurrency:4}}]}),(({_utilsFns:_utilsFns,_mainFunction:_mainFunction,_args:_args})=>{const utils=Object.fromEntries(Object.entries(_utilsFns).map((([key,value])=>[key,eval(value)])));utils.init(),eval(_mainFunction)(utils,..._args)})({_utilsFns:{init:"() => {\n  utils.preloadCache()\n}",stripProxyFromErrors:"(handler = {}) => {\n  const 
newHandler = {\n    setPrototypeOf: function (target, proto) {\n      if (proto === null)\n        throw new TypeError('Cannot convert object to primitive value')\n      if (Object.getPrototypeOf(target) === Object.getPrototypeOf(proto)) {\n        throw new TypeError('Cyclic __proto__ value')\n      }\n      return Reflect.setPrototypeOf(target, proto)\n    }\n  }\n  // We wrap each trap in the handler in a try/catch and modify the error stack if they throw\n  const traps = Object.getOwnPropertyNames(handler)\n  traps.forEach(trap => {\n    newHandler[trap] = function () {\n      try {\n        // Forward the call to the defined proxy handler\n        return handler[trap].apply(this, arguments || [])\n      } catch (err) {\n        // Stack traces differ per browser, we only support chromium based ones currently\n        if (!err || !err.stack || !err.stack.includes(`at `)) {\n          throw err\n        }\n\n        // When something throws within one of our traps the Proxy will show up in error stacks\n        // An earlier implementation of this code would simply strip lines with a blacklist,\n        // but it makes sense to be more surgical here and only remove lines related to our Proxy.\n        // We try to use a known \"anchor\" line for that and strip it with everything above it.\n        // If the anchor line cannot be found for some reason we fall back to our blacklist approach.\n\n        const stripWithBlacklist = (stack, stripFirstLine = true) => {\n          const blacklist = [\n            `at Reflect.${trap} `, // e.g. Reflect.get or Reflect.apply\n            `at Object.${trap} `, // e.g. 
Object.get or Object.apply\n            `at Object.newHandler.<computed> [as ${trap}] ` // caused by this very wrapper :-)\n          ]\n          return (\n            err.stack\n              .split('\\n')\n              // Always remove the first (file) line in the stack (guaranteed to be our proxy)\n              .filter((line, index) => !(index === 1 && stripFirstLine))\n              // Check if the line starts with one of our blacklisted strings\n              .filter(line => !blacklist.some(bl => line.trim().startsWith(bl)))\n              .join('\\n')\n          )\n        }\n\n        const stripWithAnchor = (stack, anchor) => {\n          const stackArr = stack.split('\\n')\n          anchor = anchor || `at Object.newHandler.<computed> [as ${trap}] ` // Known first Proxy line in chromium\n          const anchorIndex = stackArr.findIndex(line =>\n            line.trim().startsWith(anchor)\n          )\n          if (anchorIndex === -1) {\n            return false // 404, anchor not found\n          }\n          // Strip everything from the top until we reach the anchor line\n          // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. 
`TypeError`)\n          stackArr.splice(1, anchorIndex)\n          return stackArr.join('\\n')\n        }\n\n        // Special cases due to our nested toString proxies\n        err.stack = err.stack.replace(\n          'at Object.toString (',\n          'at Function.toString ('\n        )\n        if ((err.stack || '').includes('at Function.toString (')) {\n          err.stack = stripWithBlacklist(err.stack, false)\n          throw err\n        }\n\n        // Try using the anchor method, fallback to blacklist if necessary\n        err.stack = stripWithAnchor(err.stack) || stripWithBlacklist(err.stack)\n\n        throw err // Re-throw our now sanitized error\n      }\n    }\n  })\n  return newHandler\n}",stripErrorWithAnchor:"(err, anchor) => {\n  const stackArr = err.stack.split('\\n')\n  const anchorIndex = stackArr.findIndex(line => line.trim().startsWith(anchor))\n  if (anchorIndex === -1) {\n    return err // 404, anchor not found\n  }\n  // Strip everything from the top until we reach the anchor line (remove anchor line as well)\n  // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. `TypeError`)\n  stackArr.splice(1, anchorIndex)\n  err.stack = stackArr.join('\\n')\n  return err\n}",replaceProperty:"(obj, propName, descriptorOverrides = {}) => {\n  return Object.defineProperty(obj, propName, {\n    // Copy over the existing descriptors (writable, enumerable, configurable, etc)\n    ...(Object.getOwnPropertyDescriptor(obj, propName) || {}),\n    // Add our overrides (e.g. 
value, get())\n    ...descriptorOverrides\n  })\n}",preloadCache:"() => {\n  if (utils.cache) {\n    return\n  }\n  utils.cache = {\n    // Used in our proxies\n    Reflect: {\n      get: Reflect.get.bind(Reflect),\n      apply: Reflect.apply.bind(Reflect)\n    },\n    // Used in `makeNativeString`\n    nativeToStringStr: Function.toString + '' // => `function toString() { [native code] }`\n  }\n}",makeNativeString:"(name = '') => {\n  return utils.cache.nativeToStringStr.replace('toString', name || '')\n}",patchToString:"(obj, str = '') => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n      // `toString` targeted at our proxied Object detected\n      if (ctx === obj) {\n        // We either return the optional string verbatim or derive the most desired result automatically\n        return str || utils.makeNativeString(obj.name)\n      }\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",patchToStringNested:"(obj = {}) => {\n  return utils.execRecursively(obj, ['function'], utils.patchToString)\n}",redirectToString:"(proxyObj, originalObj) => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n\n      // `toString` targeted at our proxied Object detected\n      if (ctx === proxyObj) {\n        const fallback = () =>\n          originalObj && originalObj.name\n            ? utils.makeNativeString(originalObj.name)\n            : utils.makeNativeString(proxyObj.name)\n\n        // Return the toString representation of our original object if possible\n        return originalObj + '' || fallback()\n      }\n\n      if (typeof ctx === 'undefined' || ctx === null) {\n        return target.call(ctx)\n      }\n\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",replaceWithProxy:"(obj, propName, handler) => {\n  const originalObj = obj[propName]\n  const proxyObj = new Proxy(obj[propName], utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.redirectToString(proxyObj, originalObj)\n\n  return true\n}",replaceGetterWithProxy:"(obj, propName, handler) => {\n  const fn = Object.getOwnPropertyDescriptor(obj, propName).get\n  const fnStr = fn.toString() // special getter function string\n  const proxyObj = new Proxy(fn, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { get: proxyObj })\n  utils.patchToString(proxyObj, fnStr)\n\n  return true\n}",replaceGetterSetter:"(obj, propName, handlerGetterSetter) => {\n  const ownPropertyDescriptor = Object.getOwnPropertyDescriptor(obj, propName)\n  const handler = { ...ownPropertyDescriptor }\n\n  if (handlerGetterSetter.get !== undefined) {\n    const nativeFn = ownPropertyDescriptor.get\n    handler.get = function() {\n      return handlerGetterSetter.get.call(this, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.get, nativeFn)\n  }\n\n  if (handlerGetterSetter.set !== undefined) {\n    const nativeFn = ownPropertyDescriptor.set\n    handler.set = function(newValue) {\n      handlerGetterSetter.set.call(this, newValue, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.set, 
nativeFn)\n  }\n\n  Object.defineProperty(obj, propName, handler)\n}",mockWithProxy:"(obj, propName, pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.patchToString(proxyObj)\n\n  return true\n}",createProxy:"(pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n  utils.patchToString(proxyObj)\n\n  return proxyObj\n}",splitObjPath:"objPath => ({\n  // Remove last dot entry (property) ==> `HTMLMediaElement.prototype`\n  objName: objPath.split('.').slice(0, -1).join('.'),\n  // Extract last dot entry ==> `canPlayType`\n  propName: objPath.split('.').slice(-1)[0]\n})",replaceObjPathWithProxy:"(objPath, handler) => {\n  const { objName, propName } = utils.splitObjPath(objPath)\n  const obj = eval(objName) // eslint-disable-line no-eval\n  return utils.replaceWithProxy(obj, propName, handler)\n}",execRecursively:"(obj = {}, typeFilter = [], fn) => {\n  function recurse(obj) {\n    for (const key in obj) {\n      if (obj[key] === undefined) {\n        continue\n      }\n      if (obj[key] && typeof obj[key] === 'object') {\n        recurse(obj[key])\n      } else {\n        if (obj[key] && typeFilter.includes(typeof obj[key])) {\n          fn.call(this, obj[key])\n        }\n      }\n    }\n  }\n  recurse(obj)\n  return obj\n}",stringifyFns:"(fnObj = { hello: () => 'world' }) => {\n  // Object.fromEntries() ponyfill (in 6 lines) - supported only in Node v12+, modern browsers are fine\n  // https://github.com/feross/fromentries\n  function fromEntries(iterable) {\n    return [...iterable].reduce((obj, [key, val]) => {\n      obj[key] = val\n      return obj\n    }, {})\n  }\n  return (Object.fromEntries || fromEntries)(\n    Object.entries(fnObj)\n      .filter(([key, value]) => typeof value === 'function')\n      .map(([key, value]) => [key, value.toString()]) // eslint-disable-line 
no-eval\n  )\n}",materializeFns:"(fnStrObj = { hello: \"() => 'world'\" }) => {\n  return Object.fromEntries(\n    Object.entries(fnStrObj).map(([key, value]) => {\n      if (value.startsWith('function')) {\n        // some trickery is needed to make oldschool functions work :-)\n        return [key, eval(`() => ${value}`)()] // eslint-disable-line no-eval\n      } else {\n        // arrow functions just work\n        return [key, eval(value)] // eslint-disable-line no-eval\n      }\n    })\n  )\n}",makeHandler:"() => ({\n  // Used by simple `navigator` getter evasions\n  getterValue: value => ({\n    apply(target, ctx, args) {\n      // Let's fetch the value first, to trigger and escalate potential errors\n      // Illegal invocations like `navigator.__proto__.vendor` will throw here\n      utils.cache.Reflect.apply(...arguments)\n      return value\n    }\n  })\n})",arrayEquals:"(array1, array2) => {\n  if (array1.length !== array2.length) {\n    return false\n  }\n  for (let i = 0; i < array1.length; ++i) {\n    if (array1[i] !== array2[i]) {\n      return false\n    }\n  }\n  return true\n}",memoize:"fn => {\n  const cache = []\n  return function(...args) {\n    if (!cache.some(c => utils.arrayEquals(c.key, args))) {\n      cache.push({ key: args, value: fn.apply(this, args) })\n    }\n    return cache.find(c => utils.arrayEquals(c.key, args)).value\n  }\n}"},_mainFunction:"(utils, { opts }) => {\n        const languages = opts.languages.length\n          ? 
opts.languages\n          : ['en-US', 'en']\n        utils.replaceGetterWithProxy(\n          Object.getPrototypeOf(navigator),\n          'languages',\n          utils.makeHandler().getterValue(Object.freeze([...languages]))\n        )\n      }",_args:[{opts:{languages:[]}}]}),(({_utilsFns:_utilsFns,_mainFunction:_mainFunction,_args:_args})=>{const utils=Object.fromEntries(Object.entries(_utilsFns).map((([key,value])=>[key,eval(value)])));utils.init(),eval(_mainFunction)(utils,..._args)})({_utilsFns:{init:"() => {\n  utils.preloadCache()\n}",stripProxyFromErrors:"(handler = {}) => {\n  const newHandler = {\n    setPrototypeOf: function (target, proto) {\n      if (proto === null)\n        throw new TypeError('Cannot convert object to primitive value')\n      if (Object.getPrototypeOf(target) === Object.getPrototypeOf(proto)) {\n        throw new TypeError('Cyclic __proto__ value')\n      }\n      return Reflect.setPrototypeOf(target, proto)\n    }\n  }\n  // We wrap each trap in the handler in a try/catch and modify the error stack if they throw\n  const traps = Object.getOwnPropertyNames(handler)\n  traps.forEach(trap => {\n    newHandler[trap] = function () {\n      try {\n        // Forward the call to the defined proxy handler\n        return handler[trap].apply(this, arguments || [])\n      } catch (err) {\n        // Stack traces differ per browser, we only support chromium based ones currently\n        if (!err || !err.stack || !err.stack.includes(`at `)) {\n          throw err\n        }\n\n        // When something throws within one of our traps the Proxy will show up in error stacks\n        // An earlier implementation of this code would simply strip lines with a blacklist,\n        // but it makes sense to be more surgical here and only remove lines related to our Proxy.\n        // We try to use a known \"anchor\" line for that and strip it with everything above it.\n        // If the anchor line cannot be found for some reason we fall back to our 
blacklist approach.\n\n        const stripWithBlacklist = (stack, stripFirstLine = true) => {\n          const blacklist = [\n            `at Reflect.${trap} `, // e.g. Reflect.get or Reflect.apply\n            `at Object.${trap} `, // e.g. Object.get or Object.apply\n            `at Object.newHandler.<computed> [as ${trap}] ` // caused by this very wrapper :-)\n          ]\n          return (\n            err.stack\n              .split('\\n')\n              // Always remove the first (file) line in the stack (guaranteed to be our proxy)\n              .filter((line, index) => !(index === 1 && stripFirstLine))\n              // Check if the line starts with one of our blacklisted strings\n              .filter(line => !blacklist.some(bl => line.trim().startsWith(bl)))\n              .join('\\n')\n          )\n        }\n\n        const stripWithAnchor = (stack, anchor) => {\n          const stackArr = stack.split('\\n')\n          anchor = anchor || `at Object.newHandler.<computed> [as ${trap}] ` // Known first Proxy line in chromium\n          const anchorIndex = stackArr.findIndex(line =>\n            line.trim().startsWith(anchor)\n          )\n          if (anchorIndex === -1) {\n            return false // 404, anchor not found\n          }\n          // Strip everything from the top until we reach the anchor line\n          // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. 
`TypeError`)\n          stackArr.splice(1, anchorIndex)\n          return stackArr.join('\\n')\n        }\n\n        // Special cases due to our nested toString proxies\n        err.stack = err.stack.replace(\n          'at Object.toString (',\n          'at Function.toString ('\n        )\n        if ((err.stack || '').includes('at Function.toString (')) {\n          err.stack = stripWithBlacklist(err.stack, false)\n          throw err\n        }\n\n        // Try using the anchor method, fallback to blacklist if necessary\n        err.stack = stripWithAnchor(err.stack) || stripWithBlacklist(err.stack)\n\n        throw err // Re-throw our now sanitized error\n      }\n    }\n  })\n  return newHandler\n}",stripErrorWithAnchor:"(err, anchor) => {\n  const stackArr = err.stack.split('\\n')\n  const anchorIndex = stackArr.findIndex(line => line.trim().startsWith(anchor))\n  if (anchorIndex === -1) {\n    return err // 404, anchor not found\n  }\n  // Strip everything from the top until we reach the anchor line (remove anchor line as well)\n  // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. `TypeError`)\n  stackArr.splice(1, anchorIndex)\n  err.stack = stackArr.join('\\n')\n  return err\n}",replaceProperty:"(obj, propName, descriptorOverrides = {}) => {\n  return Object.defineProperty(obj, propName, {\n    // Copy over the existing descriptors (writable, enumerable, configurable, etc)\n    ...(Object.getOwnPropertyDescriptor(obj, propName) || {}),\n    // Add our overrides (e.g. 
value, get())\n    ...descriptorOverrides\n  })\n}",preloadCache:"() => {\n  if (utils.cache) {\n    return\n  }\n  utils.cache = {\n    // Used in our proxies\n    Reflect: {\n      get: Reflect.get.bind(Reflect),\n      apply: Reflect.apply.bind(Reflect)\n    },\n    // Used in `makeNativeString`\n    nativeToStringStr: Function.toString + '' // => `function toString() { [native code] }`\n  }\n}",makeNativeString:"(name = '') => {\n  return utils.cache.nativeToStringStr.replace('toString', name || '')\n}",patchToString:"(obj, str = '') => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n      // `toString` targeted at our proxied Object detected\n      if (ctx === obj) {\n        // We either return the optional string verbatim or derive the most desired result automatically\n        return str || utils.makeNativeString(obj.name)\n      }\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",patchToStringNested:"(obj = {}) => {\n  return utils.execRecursively(obj, ['function'], utils.patchToString)\n}",redirectToString:"(proxyObj, originalObj) => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n\n      // `toString` targeted at our proxied Object detected\n      if (ctx === proxyObj) {\n        const fallback = () =>\n          originalObj && originalObj.name\n            ? utils.makeNativeString(originalObj.name)\n            : utils.makeNativeString(proxyObj.name)\n\n        // Return the toString representation of our original object if possible\n        return originalObj + '' || fallback()\n      }\n\n      if (typeof ctx === 'undefined' || ctx === null) {\n        return target.call(ctx)\n      }\n\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",replaceWithProxy:"(obj, propName, handler) => {\n  const originalObj = obj[propName]\n  const proxyObj = new Proxy(obj[propName], utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.redirectToString(proxyObj, originalObj)\n\n  return true\n}",replaceGetterWithProxy:"(obj, propName, handler) => {\n  const fn = Object.getOwnPropertyDescriptor(obj, propName).get\n  const fnStr = fn.toString() // special getter function string\n  const proxyObj = new Proxy(fn, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { get: proxyObj })\n  utils.patchToString(proxyObj, fnStr)\n\n  return true\n}",replaceGetterSetter:"(obj, propName, handlerGetterSetter) => {\n  const ownPropertyDescriptor = Object.getOwnPropertyDescriptor(obj, propName)\n  const handler = { ...ownPropertyDescriptor }\n\n  if (handlerGetterSetter.get !== undefined) {\n    const nativeFn = ownPropertyDescriptor.get\n    handler.get = function() {\n      return handlerGetterSetter.get.call(this, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.get, nativeFn)\n  }\n\n  if (handlerGetterSetter.set !== undefined) {\n    const nativeFn = ownPropertyDescriptor.set\n    handler.set = function(newValue) {\n      handlerGetterSetter.set.call(this, newValue, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.set, 
nativeFn)\n  }\n\n  Object.defineProperty(obj, propName, handler)\n}",mockWithProxy:"(obj, propName, pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.patchToString(proxyObj)\n\n  return true\n}",createProxy:"(pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n  utils.patchToString(proxyObj)\n\n  return proxyObj\n}",splitObjPath:"objPath => ({\n  // Remove last dot entry (property) ==> `HTMLMediaElement.prototype`\n  objName: objPath.split('.').slice(0, -1).join('.'),\n  // Extract last dot entry ==> `canPlayType`\n  propName: objPath.split('.').slice(-1)[0]\n})",replaceObjPathWithProxy:"(objPath, handler) => {\n  const { objName, propName } = utils.splitObjPath(objPath)\n  const obj = eval(objName) // eslint-disable-line no-eval\n  return utils.replaceWithProxy(obj, propName, handler)\n}",execRecursively:"(obj = {}, typeFilter = [], fn) => {\n  function recurse(obj) {\n    for (const key in obj) {\n      if (obj[key] === undefined) {\n        continue\n      }\n      if (obj[key] && typeof obj[key] === 'object') {\n        recurse(obj[key])\n      } else {\n        if (obj[key] && typeFilter.includes(typeof obj[key])) {\n          fn.call(this, obj[key])\n        }\n      }\n    }\n  }\n  recurse(obj)\n  return obj\n}",stringifyFns:"(fnObj = { hello: () => 'world' }) => {\n  // Object.fromEntries() ponyfill (in 6 lines) - supported only in Node v12+, modern browsers are fine\n  // https://github.com/feross/fromentries\n  function fromEntries(iterable) {\n    return [...iterable].reduce((obj, [key, val]) => {\n      obj[key] = val\n      return obj\n    }, {})\n  }\n  return (Object.fromEntries || fromEntries)(\n    Object.entries(fnObj)\n      .filter(([key, value]) => typeof value === 'function')\n      .map(([key, value]) => [key, value.toString()]) // eslint-disable-line 
no-eval\n  )\n}",materializeFns:"(fnStrObj = { hello: \"() => 'world'\" }) => {\n  return Object.fromEntries(\n    Object.entries(fnStrObj).map(([key, value]) => {\n      if (value.startsWith('function')) {\n        // some trickery is needed to make oldschool functions work :-)\n        return [key, eval(`() => ${value}`)()] // eslint-disable-line no-eval\n      } else {\n        // arrow functions just work\n        return [key, eval(value)] // eslint-disable-line no-eval\n      }\n    })\n  )\n}",makeHandler:"() => ({\n  // Used by simple `navigator` getter evasions\n  getterValue: value => ({\n    apply(target, ctx, args) {\n      // Let's fetch the value first, to trigger and escalate potential errors\n      // Illegal invocations like `navigator.__proto__.vendor` will throw here\n      utils.cache.Reflect.apply(...arguments)\n      return value\n    }\n  })\n})",arrayEquals:"(array1, array2) => {\n  if (array1.length !== array2.length) {\n    return false\n  }\n  for (let i = 0; i < array1.length; ++i) {\n    if (array1[i] !== array2[i]) {\n      return false\n    }\n  }\n  return true\n}",memoize:"fn => {\n  const cache = []\n  return function(...args) {\n    if (!cache.some(c => utils.arrayEquals(c.key, args))) {\n      cache.push({ key: args, value: fn.apply(this, args) })\n    }\n    return cache.find(c => utils.arrayEquals(c.key, args)).value\n  }\n}"},_mainFunction:"(utils, opts) => {\n      const isSecure = document.location.protocol.startsWith('https')\n\n      // In headful on secure origins the permission should be \"default\", not \"denied\"\n      if (isSecure) {\n        utils.replaceGetterWithProxy(Notification, 'permission', {\n          apply() {\n            return 'default'\n          }\n        })\n      }\n\n      // Another weird behavior:\n      // On insecure origins in headful the state is \"denied\",\n      // whereas in headless it's \"prompt\"\n      if (!isSecure) {\n        const handler = {\n          apply(target, ctx, args) {\n 
           const param = (args || [])[0]\n\n            const isNotifications =\n              param && param.name && param.name === 'notifications'\n            if (!isNotifications) {\n              return utils.cache.Reflect.apply(...arguments)\n            }\n\n            return Promise.resolve(\n              Object.setPrototypeOf(\n                {\n                  state: 'denied',\n                  onchange: null\n                },\n                PermissionStatus.prototype\n              )\n            )\n          }\n        }\n        // Note: Don't use `Object.getPrototypeOf` here\n        utils.replaceWithProxy(Permissions.prototype, 'query', handler)\n      }\n    }",_args:[{}]}),(({_utilsFns:_utilsFns,_mainFunction:_mainFunction,_args:_args})=>{const utils=Object.fromEntries(Object.entries(_utilsFns).map((([key,value])=>[key,eval(value)])));utils.init(),eval(_mainFunction)(utils,..._args)})({_utilsFns:{init:"() => {\n  utils.preloadCache()\n}",stripProxyFromErrors:"(handler = {}) => {\n  const newHandler = {\n    setPrototypeOf: function (target, proto) {\n      if (proto === null)\n        throw new TypeError('Cannot convert object to primitive value')\n      if (Object.getPrototypeOf(target) === Object.getPrototypeOf(proto)) {\n        throw new TypeError('Cyclic __proto__ value')\n      }\n      return Reflect.setPrototypeOf(target, proto)\n    }\n  }\n  // We wrap each trap in the handler in a try/catch and modify the error stack if they throw\n  const traps = Object.getOwnPropertyNames(handler)\n  traps.forEach(trap => {\n    newHandler[trap] = function () {\n      try {\n        // Forward the call to the defined proxy handler\n        return handler[trap].apply(this, arguments || [])\n      } catch (err) {\n        // Stack traces differ per browser, we only support chromium based ones currently\n        if (!err || !err.stack || !err.stack.includes(`at `)) {\n          throw err\n        }\n\n        // When something throws within one 
of our traps the Proxy will show up in error stacks\n        // An earlier implementation of this code would simply strip lines with a blacklist,\n        // but it makes sense to be more surgical here and only remove lines related to our Proxy.\n        // We try to use a known \"anchor\" line for that and strip it with everything above it.\n        // If the anchor line cannot be found for some reason we fall back to our blacklist approach.\n\n        const stripWithBlacklist = (stack, stripFirstLine = true) => {\n          const blacklist = [\n            `at Reflect.${trap} `, // e.g. Reflect.get or Reflect.apply\n            `at Object.${trap} `, // e.g. Object.get or Object.apply\n            `at Object.newHandler.<computed> [as ${trap}] ` // caused by this very wrapper :-)\n          ]\n          return (\n            err.stack\n              .split('\\n')\n              // Always remove the first (file) line in the stack (guaranteed to be our proxy)\n              .filter((line, index) => !(index === 1 && stripFirstLine))\n              // Check if the line starts with one of our blacklisted strings\n              .filter(line => !blacklist.some(bl => line.trim().startsWith(bl)))\n              .join('\\n')\n          )\n        }\n\n        const stripWithAnchor = (stack, anchor) => {\n          const stackArr = stack.split('\\n')\n          anchor = anchor || `at Object.newHandler.<computed> [as ${trap}] ` // Known first Proxy line in chromium\n          const anchorIndex = stackArr.findIndex(line =>\n            line.trim().startsWith(anchor)\n          )\n          if (anchorIndex === -1) {\n            return false // 404, anchor not found\n          }\n          // Strip everything from the top until we reach the anchor line\n          // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. 
`TypeError`)\n          stackArr.splice(1, anchorIndex)\n          return stackArr.join('\\n')\n        }\n\n        // Special cases due to our nested toString proxies\n        err.stack = err.stack.replace(\n          'at Object.toString (',\n          'at Function.toString ('\n        )\n        if ((err.stack || '').includes('at Function.toString (')) {\n          err.stack = stripWithBlacklist(err.stack, false)\n          throw err\n        }\n\n        // Try using the anchor method, fallback to blacklist if necessary\n        err.stack = stripWithAnchor(err.stack) || stripWithBlacklist(err.stack)\n\n        throw err // Re-throw our now sanitized error\n      }\n    }\n  })\n  return newHandler\n}",stripErrorWithAnchor:"(err, anchor) => {\n  const stackArr = err.stack.split('\\n')\n  const anchorIndex = stackArr.findIndex(line => line.trim().startsWith(anchor))\n  if (anchorIndex === -1) {\n    return err // 404, anchor not found\n  }\n  // Strip everything from the top until we reach the anchor line (remove anchor line as well)\n  // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. `TypeError`)\n  stackArr.splice(1, anchorIndex)\n  err.stack = stackArr.join('\\n')\n  return err\n}",replaceProperty:"(obj, propName, descriptorOverrides = {}) => {\n  return Object.defineProperty(obj, propName, {\n    // Copy over the existing descriptors (writable, enumerable, configurable, etc)\n    ...(Object.getOwnPropertyDescriptor(obj, propName) || {}),\n    // Add our overrides (e.g. 
value, get())\n    ...descriptorOverrides\n  })\n}",preloadCache:"() => {\n  if (utils.cache) {\n    return\n  }\n  utils.cache = {\n    // Used in our proxies\n    Reflect: {\n      get: Reflect.get.bind(Reflect),\n      apply: Reflect.apply.bind(Reflect)\n    },\n    // Used in `makeNativeString`\n    nativeToStringStr: Function.toString + '' // => `function toString() { [native code] }`\n  }\n}",makeNativeString:"(name = '') => {\n  return utils.cache.nativeToStringStr.replace('toString', name || '')\n}",patchToString:"(obj, str = '') => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n      // `toString` targeted at our proxied Object detected\n      if (ctx === obj) {\n        // We either return the optional string verbatim or derive the most desired result automatically\n        return str || utils.makeNativeString(obj.name)\n      }\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",patchToStringNested:"(obj = {}) => {\n  return utils.execRecursively(obj, ['function'], utils.patchToString)\n}",redirectToString:"(proxyObj, originalObj) => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n\n      // `toString` targeted at our proxied Object detected\n      if (ctx === proxyObj) {\n        const fallback = () =>\n          originalObj && originalObj.name\n            ? utils.makeNativeString(originalObj.name)\n            : utils.makeNativeString(proxyObj.name)\n\n        // Return the toString representation of our original object if possible\n        return originalObj + '' || fallback()\n      }\n\n      if (typeof ctx === 'undefined' || ctx === null) {\n        return target.call(ctx)\n      }\n\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",replaceWithProxy:"(obj, propName, handler) => {\n  const originalObj = obj[propName]\n  const proxyObj = new Proxy(obj[propName], utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.redirectToString(proxyObj, originalObj)\n\n  return true\n}",replaceGetterWithProxy:"(obj, propName, handler) => {\n  const fn = Object.getOwnPropertyDescriptor(obj, propName).get\n  const fnStr = fn.toString() // special getter function string\n  const proxyObj = new Proxy(fn, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { get: proxyObj })\n  utils.patchToString(proxyObj, fnStr)\n\n  return true\n}",replaceGetterSetter:"(obj, propName, handlerGetterSetter) => {\n  const ownPropertyDescriptor = Object.getOwnPropertyDescriptor(obj, propName)\n  const handler = { ...ownPropertyDescriptor }\n\n  if (handlerGetterSetter.get !== undefined) {\n    const nativeFn = ownPropertyDescriptor.get\n    handler.get = function() {\n      return handlerGetterSetter.get.call(this, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.get, nativeFn)\n  }\n\n  if (handlerGetterSetter.set !== undefined) {\n    const nativeFn = ownPropertyDescriptor.set\n    handler.set = function(newValue) {\n      handlerGetterSetter.set.call(this, newValue, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.set, 
nativeFn)\n  }\n\n  Object.defineProperty(obj, propName, handler)\n}",mockWithProxy:"(obj, propName, pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.patchToString(proxyObj)\n\n  return true\n}",createProxy:"(pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n  utils.patchToString(proxyObj)\n\n  return proxyObj\n}",splitObjPath:"objPath => ({\n  // Remove last dot entry (property) ==> `HTMLMediaElement.prototype`\n  objName: objPath.split('.').slice(0, -1).join('.'),\n  // Extract last dot entry ==> `canPlayType`\n  propName: objPath.split('.').slice(-1)[0]\n})",replaceObjPathWithProxy:"(objPath, handler) => {\n  const { objName, propName } = utils.splitObjPath(objPath)\n  const obj = eval(objName) // eslint-disable-line no-eval\n  return utils.replaceWithProxy(obj, propName, handler)\n}",execRecursively:"(obj = {}, typeFilter = [], fn) => {\n  function recurse(obj) {\n    for (const key in obj) {\n      if (obj[key] === undefined) {\n        continue\n      }\n      if (obj[key] && typeof obj[key] === 'object') {\n        recurse(obj[key])\n      } else {\n        if (obj[key] && typeFilter.includes(typeof obj[key])) {\n          fn.call(this, obj[key])\n        }\n      }\n    }\n  }\n  recurse(obj)\n  return obj\n}",stringifyFns:"(fnObj = { hello: () => 'world' }) => {\n  // Object.fromEntries() ponyfill (in 6 lines) - supported only in Node v12+, modern browsers are fine\n  // https://github.com/feross/fromentries\n  function fromEntries(iterable) {\n    return [...iterable].reduce((obj, [key, val]) => {\n      obj[key] = val\n      return obj\n    }, {})\n  }\n  return (Object.fromEntries || fromEntries)(\n    Object.entries(fnObj)\n      .filter(([key, value]) => typeof value === 'function')\n      .map(([key, value]) => [key, value.toString()]) // eslint-disable-line 
no-eval\n  )\n}",materializeFns:"(fnStrObj = { hello: \"() => 'world'\" }) => {\n  return Object.fromEntries(\n    Object.entries(fnStrObj).map(([key, value]) => {\n      if (value.startsWith('function')) {\n        // some trickery is needed to make oldschool functions work :-)\n        return [key, eval(`() => ${value}`)()] // eslint-disable-line no-eval\n      } else {\n        // arrow functions just work\n        return [key, eval(value)] // eslint-disable-line no-eval\n      }\n    })\n  )\n}",makeHandler:"() => ({\n  // Used by simple `navigator` getter evasions\n  getterValue: value => ({\n    apply(target, ctx, args) {\n      // Let's fetch the value first, to trigger and escalate potential errors\n      // Illegal invocations like `navigator.__proto__.vendor` will throw here\n      utils.cache.Reflect.apply(...arguments)\n      return value\n    }\n  })\n})",arrayEquals:"(array1, array2) => {\n  if (array1.length !== array2.length) {\n    return false\n  }\n  for (let i = 0; i < array1.length; ++i) {\n    if (array1[i] !== array2[i]) {\n      return false\n    }\n  }\n  return true\n}",memoize:"fn => {\n  const cache = []\n  return function(...args) {\n    if (!cache.some(c => utils.arrayEquals(c.key, args))) {\n      cache.push({ key: args, value: fn.apply(this, args) })\n    }\n    return cache.find(c => utils.arrayEquals(c.key, args)).value\n  }\n}"},_mainFunction:"(utils, { fns, data }) => {\n        fns = utils.materializeFns(fns)\n\n        // That means we're running headful\n        const hasPlugins = 'plugins' in navigator && navigator.plugins.length\n        if (hasPlugins) {\n          return // nothing to do here\n        }\n\n        const mimeTypes = fns.generateMimeTypeArray(utils, fns)(data.mimeTypes)\n        const plugins = fns.generatePluginArray(utils, fns)(data.plugins)\n\n        // Plugin and MimeType cross-reference each other, let's do that now\n        // Note: We're looping through `data.plugins` here, not the generated 
`plugins`\n        for (const pluginData of data.plugins) {\n          pluginData.__mimeTypes.forEach((type, index) => {\n            plugins[pluginData.name][index] = mimeTypes[type]\n\n            Object.defineProperty(plugins[pluginData.name], type, {\n              value: mimeTypes[type],\n              writable: false,\n              enumerable: false, // Not enumerable\n              configurable: true\n            })\n            Object.defineProperty(mimeTypes[type], 'enabledPlugin', {\n              value:\n                type === 'application/x-pnacl'\n                  ? mimeTypes['application/x-nacl'].enabledPlugin // these reference the same plugin, so we need to re-use the Proxy in order to avoid leaks\n                  : new Proxy(plugins[pluginData.name], {}), // Prevent circular references\n              writable: false,\n              enumerable: false, // Important: `JSON.stringify(navigator.plugins)`\n              configurable: true\n            })\n          })\n        }\n\n        const patchNavigator = (name, value) =>\n          utils.replaceProperty(Object.getPrototypeOf(navigator), name, {\n            get() {\n              return value\n            }\n          })\n\n        patchNavigator('mimeTypes', mimeTypes)\n        patchNavigator('plugins', plugins)\n\n        // All done\n      }",_args:[{fns:{generateMimeTypeArray:"(utils, fns) => mimeTypesData => {\n  return fns.generateMagicArray(utils, fns)(\n    mimeTypesData,\n    MimeTypeArray.prototype,\n    MimeType.prototype,\n    'type'\n  )\n}",generatePluginArray:"(utils, fns) => pluginsData => {\n  return fns.generateMagicArray(utils, fns)(\n    pluginsData,\n    PluginArray.prototype,\n    Plugin.prototype,\n    'name'\n  )\n}",generateMagicArray:"(utils, fns) =>\n  function(\n    dataArray = [],\n    proto = MimeTypeArray.prototype,\n    itemProto = MimeType.prototype,\n    itemMainProp = 'type'\n  ) {\n    // Quick helper to set props with the same descriptors vanilla is 
using\n    const defineProp = (obj, prop, value) =>\n      Object.defineProperty(obj, prop, {\n        value,\n        writable: false,\n        enumerable: false, // Important for mimeTypes & plugins: `JSON.stringify(navigator.mimeTypes)`\n        configurable: true\n      })\n\n    // Loop over our fake data and construct items\n    const makeItem = data => {\n      const item = {}\n      for (const prop of Object.keys(data)) {\n        if (prop.startsWith('__')) {\n          continue\n        }\n        defineProp(item, prop, data[prop])\n      }\n      return patchItem(item, data)\n    }\n\n    const patchItem = (item, data) => {\n      let descriptor = Object.getOwnPropertyDescriptors(item)\n\n      // Special case: Plugins have a magic length property which is not enumerable\n      // e.g. `navigator.plugins[i].length` should always be the length of the assigned mimeTypes\n      if (itemProto === Plugin.prototype) {\n        descriptor = {\n          ...descriptor,\n          length: {\n            value: data.__mimeTypes.length,\n            writable: false,\n            enumerable: false,\n            configurable: true // Important to be able to use the ownKeys trap in a Proxy to strip `length`\n          }\n        }\n      }\n\n      // We need to spoof a specific `MimeType` or `Plugin` object\n      const obj = Object.create(itemProto, descriptor)\n\n      // Virtually all property keys are not enumerable in vanilla\n      const blacklist = [...Object.keys(data), 'length', 'enabledPlugin']\n      return new Proxy(obj, {\n        ownKeys(target) {\n          return Reflect.ownKeys(target).filter(k => !blacklist.includes(k))\n        },\n        getOwnPropertyDescriptor(target, prop) {\n          if (blacklist.includes(prop)) {\n            return undefined\n          }\n          return Reflect.getOwnPropertyDescriptor(target, prop)\n        }\n      })\n    }\n\n    const magicArray = []\n\n    // Loop through our fake data and use that to create 
convincing entities\n    dataArray.forEach(data => {\n      magicArray.push(makeItem(data))\n    })\n\n    // Add direct property access  based on types (e.g. `obj['application/pdf']`) afterwards\n    magicArray.forEach(entry => {\n      defineProp(magicArray, entry[itemMainProp], entry)\n    })\n\n    // This is the best way to fake the type to make sure this is false: `Array.isArray(navigator.mimeTypes)`\n    const magicArrayObj = Object.create(proto, {\n      ...Object.getOwnPropertyDescriptors(magicArray),\n\n      // There's one ugly quirk we unfortunately need to take care of:\n      // The `MimeTypeArray` prototype has an enumerable `length` property,\n      // but headful Chrome will still skip it when running `Object.getOwnPropertyNames(navigator.mimeTypes)`.\n      // To strip it we need to make it first `configurable` and can then overlay a Proxy with an `ownKeys` trap.\n      length: {\n        value: magicArray.length,\n        writable: false,\n        enumerable: false,\n        configurable: true // Important to be able to use the ownKeys trap in a Proxy to strip `length`\n      }\n    })\n\n    // Generate our functional function mocks :-)\n    const functionMocks = fns.generateFunctionMocks(utils)(\n      proto,\n      itemMainProp,\n      magicArray\n    )\n\n    // We need to overlay our custom object with a JS Proxy\n    const magicArrayObjProxy = new Proxy(magicArrayObj, {\n      get(target, key = '') {\n        // Redirect function calls to our custom proxied versions mocking the vanilla behavior\n        if (key === 'item') {\n          return functionMocks.item\n        }\n        if (key === 'namedItem') {\n          return functionMocks.namedItem\n        }\n        if (proto === PluginArray.prototype && key === 'refresh') {\n          return functionMocks.refresh\n        }\n        // Everything else can pass through as normal\n        return utils.cache.Reflect.get(...arguments)\n      },\n      ownKeys(target) {\n        // There are 
a couple of quirks where the original property demonstrates \"magical\" behavior that makes no sense\n        // This can be witnessed when calling `Object.getOwnPropertyNames(navigator.mimeTypes)` and the absense of `length`\n        // My guess is that it has to do with the recent change of not allowing data enumeration and this being implemented weirdly\n        // For that reason we just completely fake the available property names based on our data to match what regular Chrome is doing\n        // Specific issues when not patching this: `length` property is available, direct `types` props (e.g. `obj['application/pdf']`) are missing\n        const keys = []\n        const typeProps = magicArray.map(mt => mt[itemMainProp])\n        typeProps.forEach((_, i) => keys.push(`${i}`))\n        typeProps.forEach(propName => keys.push(propName))\n        return keys\n      },\n      getOwnPropertyDescriptor(target, prop) {\n        if (prop === 'length') {\n          return undefined\n        }\n        return Reflect.getOwnPropertyDescriptor(target, prop)\n      }\n    })\n\n    return magicArrayObjProxy\n  }",generateFunctionMocks:"utils => (\n  proto,\n  itemMainProp,\n  dataArray\n) => ({\n  /** Returns the MimeType object with the specified index. */\n  item: utils.createProxy(proto.item, {\n    apply(target, ctx, args) {\n      if (!args.length) {\n        throw new TypeError(\n          `Failed to execute 'item' on '${\n            proto[Symbol.toStringTag]\n          }': 1 argument required, but only 0 present.`\n        )\n      }\n      // Special behavior alert:\n      // - Vanilla tries to cast strings to Numbers (only integers!) 
and use them as property index lookup\n      // - If anything else than an integer (including as string) is provided it will return the first entry\n      const isInteger = args[0] && Number.isInteger(Number(args[0])) // Cast potential string to number first, then check for integer\n      // Note: Vanilla never returns `undefined`\n      return (isInteger ? dataArray[Number(args[0])] : dataArray[0]) || null\n    }\n  }),\n  /** Returns the MimeType object with the specified name. */\n  namedItem: utils.createProxy(proto.namedItem, {\n    apply(target, ctx, args) {\n      if (!args.length) {\n        throw new TypeError(\n          `Failed to execute 'namedItem' on '${\n            proto[Symbol.toStringTag]\n          }': 1 argument required, but only 0 present.`\n        )\n      }\n      return dataArray.find(mt => mt[itemMainProp] === args[0]) || null // Not `undefined`!\n    }\n  }),\n  /** Does nothing and shall return nothing */\n  refresh: proto.refresh\n    ? utils.createProxy(proto.refresh, {\n        apply(target, ctx, args) {\n          return undefined\n        }\n      })\n    : undefined\n})"},data:{mimeTypes:[{type:"application/pdf",suffixes:"pdf",description:"",__pluginName:"Chrome PDF Viewer"},{type:"application/x-google-chrome-pdf",suffixes:"pdf",description:"Portable Document Format",__pluginName:"Chrome PDF Plugin"},{type:"application/x-nacl",suffixes:"",description:"Native Client Executable",__pluginName:"Native Client"},{type:"application/x-pnacl",suffixes:"",description:"Portable Native Client Executable",__pluginName:"Native Client"}],plugins:[{name:"Chrome PDF Plugin",filename:"internal-pdf-viewer",description:"Portable Document Format",__mimeTypes:["application/x-google-chrome-pdf"]},{name:"Chrome PDF Viewer",filename:"mhjfbmdgcfjbbpaeojofohoefgiehjai",description:"",__mimeTypes:["application/pdf"]},{name:"Native 
Client",filename:"internal-nacl-plugin",description:"",__mimeTypes:["application/x-nacl","application/x-pnacl"]}]}}]}),!1===navigator.webdriver||void 0===navigator.webdriver||delete Object.getPrototypeOf(navigator).webdriver,(({_utilsFns:_utilsFns,_mainFunction:_mainFunction,_args:_args})=>{const utils=Object.fromEntries(Object.entries(_utilsFns).map((([key,value])=>[key,eval(value)])));utils.init(),eval(_mainFunction)(utils,..._args)})({_utilsFns:{init:"() => {\n  utils.preloadCache()\n}",stripProxyFromErrors:"(handler = {}) => {\n  const newHandler = {\n    setPrototypeOf: function (target, proto) {\n      if (proto === null)\n        throw new TypeError('Cannot convert object to primitive value')\n      if (Object.getPrototypeOf(target) === Object.getPrototypeOf(proto)) {\n        throw new TypeError('Cyclic __proto__ value')\n      }\n      return Reflect.setPrototypeOf(target, proto)\n    }\n  }\n  // We wrap each trap in the handler in a try/catch and modify the error stack if they throw\n  const traps = Object.getOwnPropertyNames(handler)\n  traps.forEach(trap => {\n    newHandler[trap] = function () {\n      try {\n        // Forward the call to the defined proxy handler\n        return handler[trap].apply(this, arguments || [])\n      } catch (err) {\n        // Stack traces differ per browser, we only support chromium based ones currently\n        if (!err || !err.stack || !err.stack.includes(`at `)) {\n          throw err\n        }\n\n        // When something throws within one of our traps the Proxy will show up in error stacks\n        // An earlier implementation of this code would simply strip lines with a blacklist,\n        // but it makes sense to be more surgical here and only remove lines related to our Proxy.\n        // We try to use a known \"anchor\" line for that and strip it with everything above it.\n        // If the anchor line cannot be found for some reason we fall back to our blacklist approach.\n\n        const stripWithBlacklist = 
(stack, stripFirstLine = true) => {\n          const blacklist = [\n            `at Reflect.${trap} `, // e.g. Reflect.get or Reflect.apply\n            `at Object.${trap} `, // e.g. Object.get or Object.apply\n            `at Object.newHandler.<computed> [as ${trap}] ` // caused by this very wrapper :-)\n          ]\n          return (\n            err.stack\n              .split('\\n')\n              // Always remove the first (file) line in the stack (guaranteed to be our proxy)\n              .filter((line, index) => !(index === 1 && stripFirstLine))\n              // Check if the line starts with one of our blacklisted strings\n              .filter(line => !blacklist.some(bl => line.trim().startsWith(bl)))\n              .join('\\n')\n          )\n        }\n\n        const stripWithAnchor = (stack, anchor) => {\n          const stackArr = stack.split('\\n')\n          anchor = anchor || `at Object.newHandler.<computed> [as ${trap}] ` // Known first Proxy line in chromium\n          const anchorIndex = stackArr.findIndex(line =>\n            line.trim().startsWith(anchor)\n          )\n          if (anchorIndex === -1) {\n            return false // 404, anchor not found\n          }\n          // Strip everything from the top until we reach the anchor line\n          // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. 
`TypeError`)\n          stackArr.splice(1, anchorIndex)\n          return stackArr.join('\\n')\n        }\n\n        // Special cases due to our nested toString proxies\n        err.stack = err.stack.replace(\n          'at Object.toString (',\n          'at Function.toString ('\n        )\n        if ((err.stack || '').includes('at Function.toString (')) {\n          err.stack = stripWithBlacklist(err.stack, false)\n          throw err\n        }\n\n        // Try using the anchor method, fallback to blacklist if necessary\n        err.stack = stripWithAnchor(err.stack) || stripWithBlacklist(err.stack)\n\n        throw err // Re-throw our now sanitized error\n      }\n    }\n  })\n  return newHandler\n}",stripErrorWithAnchor:"(err, anchor) => {\n  const stackArr = err.stack.split('\\n')\n  const anchorIndex = stackArr.findIndex(line => line.trim().startsWith(anchor))\n  if (anchorIndex === -1) {\n    return err // 404, anchor not found\n  }\n  // Strip everything from the top until we reach the anchor line (remove anchor line as well)\n  // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. `TypeError`)\n  stackArr.splice(1, anchorIndex)\n  err.stack = stackArr.join('\\n')\n  return err\n}",replaceProperty:"(obj, propName, descriptorOverrides = {}) => {\n  return Object.defineProperty(obj, propName, {\n    // Copy over the existing descriptors (writable, enumerable, configurable, etc)\n    ...(Object.getOwnPropertyDescriptor(obj, propName) || {}),\n    // Add our overrides (e.g. 
value, get())\n    ...descriptorOverrides\n  })\n}",preloadCache:"() => {\n  if (utils.cache) {\n    return\n  }\n  utils.cache = {\n    // Used in our proxies\n    Reflect: {\n      get: Reflect.get.bind(Reflect),\n      apply: Reflect.apply.bind(Reflect)\n    },\n    // Used in `makeNativeString`\n    nativeToStringStr: Function.toString + '' // => `function toString() { [native code] }`\n  }\n}",makeNativeString:"(name = '') => {\n  return utils.cache.nativeToStringStr.replace('toString', name || '')\n}",patchToString:"(obj, str = '') => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n      // `toString` targeted at our proxied Object detected\n      if (ctx === obj) {\n        // We either return the optional string verbatim or derive the most desired result automatically\n        return str || utils.makeNativeString(obj.name)\n      }\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",patchToStringNested:"(obj = {}) => {\n  return utils.execRecursively(obj, ['function'], utils.patchToString)\n}",redirectToString:"(proxyObj, originalObj) => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n\n      // `toString` targeted at our proxied Object detected\n      if (ctx === proxyObj) {\n        const fallback = () =>\n          originalObj && originalObj.name\n            ? utils.makeNativeString(originalObj.name)\n            : utils.makeNativeString(proxyObj.name)\n\n        // Return the toString representation of our original object if possible\n        return originalObj + '' || fallback()\n      }\n\n      if (typeof ctx === 'undefined' || ctx === null) {\n        return target.call(ctx)\n      }\n\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",replaceWithProxy:"(obj, propName, handler) => {\n  const originalObj = obj[propName]\n  const proxyObj = new Proxy(obj[propName], utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.redirectToString(proxyObj, originalObj)\n\n  return true\n}",replaceGetterWithProxy:"(obj, propName, handler) => {\n  const fn = Object.getOwnPropertyDescriptor(obj, propName).get\n  const fnStr = fn.toString() // special getter function string\n  const proxyObj = new Proxy(fn, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { get: proxyObj })\n  utils.patchToString(proxyObj, fnStr)\n\n  return true\n}",replaceGetterSetter:"(obj, propName, handlerGetterSetter) => {\n  const ownPropertyDescriptor = Object.getOwnPropertyDescriptor(obj, propName)\n  const handler = { ...ownPropertyDescriptor }\n\n  if (handlerGetterSetter.get !== undefined) {\n    const nativeFn = ownPropertyDescriptor.get\n    handler.get = function() {\n      return handlerGetterSetter.get.call(this, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.get, nativeFn)\n  }\n\n  if (handlerGetterSetter.set !== undefined) {\n    const nativeFn = ownPropertyDescriptor.set\n    handler.set = function(newValue) {\n      handlerGetterSetter.set.call(this, newValue, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.set, 
nativeFn)\n  }\n\n  Object.defineProperty(obj, propName, handler)\n}",mockWithProxy:"(obj, propName, pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.patchToString(proxyObj)\n\n  return true\n}",createProxy:"(pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n  utils.patchToString(proxyObj)\n\n  return proxyObj\n}",splitObjPath:"objPath => ({\n  // Remove last dot entry (property) ==> `HTMLMediaElement.prototype`\n  objName: objPath.split('.').slice(0, -1).join('.'),\n  // Extract last dot entry ==> `canPlayType`\n  propName: objPath.split('.').slice(-1)[0]\n})",replaceObjPathWithProxy:"(objPath, handler) => {\n  const { objName, propName } = utils.splitObjPath(objPath)\n  const obj = eval(objName) // eslint-disable-line no-eval\n  return utils.replaceWithProxy(obj, propName, handler)\n}",execRecursively:"(obj = {}, typeFilter = [], fn) => {\n  function recurse(obj) {\n    for (const key in obj) {\n      if (obj[key] === undefined) {\n        continue\n      }\n      if (obj[key] && typeof obj[key] === 'object') {\n        recurse(obj[key])\n      } else {\n        if (obj[key] && typeFilter.includes(typeof obj[key])) {\n          fn.call(this, obj[key])\n        }\n      }\n    }\n  }\n  recurse(obj)\n  return obj\n}",stringifyFns:"(fnObj = { hello: () => 'world' }) => {\n  // Object.fromEntries() ponyfill (in 6 lines) - supported only in Node v12+, modern browsers are fine\n  // https://github.com/feross/fromentries\n  function fromEntries(iterable) {\n    return [...iterable].reduce((obj, [key, val]) => {\n      obj[key] = val\n      return obj\n    }, {})\n  }\n  return (Object.fromEntries || fromEntries)(\n    Object.entries(fnObj)\n      .filter(([key, value]) => typeof value === 'function')\n      .map(([key, value]) => [key, value.toString()]) // eslint-disable-line 
no-eval\n  )\n}",materializeFns:"(fnStrObj = { hello: \"() => 'world'\" }) => {\n  return Object.fromEntries(\n    Object.entries(fnStrObj).map(([key, value]) => {\n      if (value.startsWith('function')) {\n        // some trickery is needed to make oldschool functions work :-)\n        return [key, eval(`() => ${value}`)()] // eslint-disable-line no-eval\n      } else {\n        // arrow functions just work\n        return [key, eval(value)] // eslint-disable-line no-eval\n      }\n    })\n  )\n}",makeHandler:"() => ({\n  // Used by simple `navigator` getter evasions\n  getterValue: value => ({\n    apply(target, ctx, args) {\n      // Let's fetch the value first, to trigger and escalate potential errors\n      // Illegal invocations like `navigator.__proto__.vendor` will throw here\n      utils.cache.Reflect.apply(...arguments)\n      return value\n    }\n  })\n})",arrayEquals:"(array1, array2) => {\n  if (array1.length !== array2.length) {\n    return false\n  }\n  for (let i = 0; i < array1.length; ++i) {\n    if (array1[i] !== array2[i]) {\n      return false\n    }\n  }\n  return true\n}",memoize:"fn => {\n  const cache = []\n  return function(...args) {\n    if (!cache.some(c => utils.arrayEquals(c.key, args))) {\n      cache.push({ key: args, value: fn.apply(this, args) })\n    }\n    return cache.find(c => utils.arrayEquals(c.key, args)).value\n  }\n}"},_mainFunction:"(utils, opts) => {\n      const getParameterProxyHandler = {\n        apply: function(target, ctx, args) {\n          const param = (args || [])[0]\n          const result = utils.cache.Reflect.apply(target, ctx, args)\n          // UNMASKED_VENDOR_WEBGL\n          if (param === 37445) {\n            return opts.vendor || 'Intel Inc.' 
// default in headless: Google Inc.\n          }\n          // UNMASKED_RENDERER_WEBGL\n          if (param === 37446) {\n            return opts.renderer || 'Intel Iris OpenGL Engine' // default in headless: Google SwiftShader\n          }\n          return result\n        }\n      }\n\n      // There's more than one WebGL rendering context\n      // https://developer.mozilla.org/en-US/docs/Web/API/WebGL2RenderingContext#Browser_compatibility\n      // To find out the original values here: Object.getOwnPropertyDescriptors(WebGLRenderingContext.prototype.getParameter)\n      const addProxy = (obj, propName) => {\n        utils.replaceWithProxy(obj, propName, getParameterProxyHandler)\n      }\n      // For whatever weird reason loops don't play nice with Object.defineProperty, here's the next best thing:\n      addProxy(WebGLRenderingContext.prototype, 'getParameter')\n      addProxy(WebGL2RenderingContext.prototype, 'getParameter')\n    }",_args:[{}]}),(()=>{try{if(window.outerWidth&&window.outerHeight)return;const n=85;window.outerWidth=window.innerWidth,window.outerHeight=window.innerHeight+n}catch(n){}})(),(({_utilsFns:_utilsFns,_mainFunction:_mainFunction,_args:_args})=>{const utils=Object.fromEntries(Object.entries(_utilsFns).map((([key,value])=>[key,eval(value)])));utils.init(),eval(_mainFunction)(utils,..._args)})({_utilsFns:{init:"() => {\n  utils.preloadCache()\n}",stripProxyFromErrors:"(handler = {}) => {\n  const newHandler = {\n    setPrototypeOf: function (target, proto) {\n      if (proto === null)\n        throw new TypeError('Cannot convert object to primitive value')\n      if (Object.getPrototypeOf(target) === Object.getPrototypeOf(proto)) {\n        throw new TypeError('Cyclic __proto__ value')\n      }\n      return Reflect.setPrototypeOf(target, proto)\n    }\n  }\n  // We wrap each trap in the handler in a try/catch and modify the error stack if they throw\n  const traps = Object.getOwnPropertyNames(handler)\n  traps.forEach(trap => {\n    
newHandler[trap] = function () {\n      try {\n        // Forward the call to the defined proxy handler\n        return handler[trap].apply(this, arguments || [])\n      } catch (err) {\n        // Stack traces differ per browser, we only support chromium based ones currently\n        if (!err || !err.stack || !err.stack.includes(`at `)) {\n          throw err\n        }\n\n        // When something throws within one of our traps the Proxy will show up in error stacks\n        // An earlier implementation of this code would simply strip lines with a blacklist,\n        // but it makes sense to be more surgical here and only remove lines related to our Proxy.\n        // We try to use a known \"anchor\" line for that and strip it with everything above it.\n        // If the anchor line cannot be found for some reason we fall back to our blacklist approach.\n\n        const stripWithBlacklist = (stack, stripFirstLine = true) => {\n          const blacklist = [\n            `at Reflect.${trap} `, // e.g. Reflect.get or Reflect.apply\n            `at Object.${trap} `, // e.g. 
Object.get or Object.apply\n            `at Object.newHandler.<computed> [as ${trap}] ` // caused by this very wrapper :-)\n          ]\n          return (\n            err.stack\n              .split('\\n')\n              // Always remove the first (file) line in the stack (guaranteed to be our proxy)\n              .filter((line, index) => !(index === 1 && stripFirstLine))\n              // Check if the line starts with one of our blacklisted strings\n              .filter(line => !blacklist.some(bl => line.trim().startsWith(bl)))\n              .join('\\n')\n          )\n        }\n\n        const stripWithAnchor = (stack, anchor) => {\n          const stackArr = stack.split('\\n')\n          anchor = anchor || `at Object.newHandler.<computed> [as ${trap}] ` // Known first Proxy line in chromium\n          const anchorIndex = stackArr.findIndex(line =>\n            line.trim().startsWith(anchor)\n          )\n          if (anchorIndex === -1) {\n            return false // 404, anchor not found\n          }\n          // Strip everything from the top until we reach the anchor line\n          // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. 
`TypeError`)\n          stackArr.splice(1, anchorIndex)\n          return stackArr.join('\\n')\n        }\n\n        // Special cases due to our nested toString proxies\n        err.stack = err.stack.replace(\n          'at Object.toString (',\n          'at Function.toString ('\n        )\n        if ((err.stack || '').includes('at Function.toString (')) {\n          err.stack = stripWithBlacklist(err.stack, false)\n          throw err\n        }\n\n        // Try using the anchor method, fallback to blacklist if necessary\n        err.stack = stripWithAnchor(err.stack) || stripWithBlacklist(err.stack)\n\n        throw err // Re-throw our now sanitized error\n      }\n    }\n  })\n  return newHandler\n}",stripErrorWithAnchor:"(err, anchor) => {\n  const stackArr = err.stack.split('\\n')\n  const anchorIndex = stackArr.findIndex(line => line.trim().startsWith(anchor))\n  if (anchorIndex === -1) {\n    return err // 404, anchor not found\n  }\n  // Strip everything from the top until we reach the anchor line (remove anchor line as well)\n  // Note: We're keeping the 1st line (zero index) as it's unrelated (e.g. `TypeError`)\n  stackArr.splice(1, anchorIndex)\n  err.stack = stackArr.join('\\n')\n  return err\n}",replaceProperty:"(obj, propName, descriptorOverrides = {}) => {\n  return Object.defineProperty(obj, propName, {\n    // Copy over the existing descriptors (writable, enumerable, configurable, etc)\n    ...(Object.getOwnPropertyDescriptor(obj, propName) || {}),\n    // Add our overrides (e.g. 
value, get())\n    ...descriptorOverrides\n  })\n}",preloadCache:"() => {\n  if (utils.cache) {\n    return\n  }\n  utils.cache = {\n    // Used in our proxies\n    Reflect: {\n      get: Reflect.get.bind(Reflect),\n      apply: Reflect.apply.bind(Reflect)\n    },\n    // Used in `makeNativeString`\n    nativeToStringStr: Function.toString + '' // => `function toString() { [native code] }`\n  }\n}",makeNativeString:"(name = '') => {\n  return utils.cache.nativeToStringStr.replace('toString', name || '')\n}",patchToString:"(obj, str = '') => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n      // `toString` targeted at our proxied Object detected\n      if (ctx === obj) {\n        // We either return the optional string verbatim or derive the most desired result automatically\n        return str || utils.makeNativeString(obj.name)\n      }\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",patchToStringNested:"(obj = {}) => {\n  return utils.execRecursively(obj, ['function'], utils.patchToString)\n}",redirectToString:"(proxyObj, originalObj) => {\n  const handler = {\n    apply: function (target, ctx) {\n      // This fixes e.g. `HTMLMediaElement.prototype.canPlayType.toString + \"\"`\n      if (ctx === Function.prototype.toString) {\n        return utils.makeNativeString('toString')\n      }\n\n      // `toString` targeted at our proxied Object detected\n      if (ctx === proxyObj) {\n        const fallback = () =>\n          originalObj && originalObj.name\n            ? utils.makeNativeString(originalObj.name)\n            : utils.makeNativeString(proxyObj.name)\n\n        // Return the toString representation of our original object if possible\n        return originalObj + '' || fallback()\n      }\n\n      if (typeof ctx === 'undefined' || ctx === null) {\n        return target.call(ctx)\n      }\n\n      // Check if the toString protype of the context is the same as the global prototype,\n      // if not indicates that we are doing a check across different windows., e.g. 
the iframeWithdirect` test case\n      const hasSameProto = Object.getPrototypeOf(\n        Function.prototype.toString\n      ).isPrototypeOf(ctx.toString) // eslint-disable-line no-prototype-builtins\n      if (!hasSameProto) {\n        // Pass the call on to the local Function.prototype.toString instead\n        return ctx.toString()\n      }\n\n      return target.call(ctx)\n    }\n  }\n\n  const toStringProxy = new Proxy(\n    Function.prototype.toString,\n    utils.stripProxyFromErrors(handler)\n  )\n  utils.replaceProperty(Function.prototype, 'toString', {\n    value: toStringProxy\n  })\n}",replaceWithProxy:"(obj, propName, handler) => {\n  const originalObj = obj[propName]\n  const proxyObj = new Proxy(obj[propName], utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.redirectToString(proxyObj, originalObj)\n\n  return true\n}",replaceGetterWithProxy:"(obj, propName, handler) => {\n  const fn = Object.getOwnPropertyDescriptor(obj, propName).get\n  const fnStr = fn.toString() // special getter function string\n  const proxyObj = new Proxy(fn, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { get: proxyObj })\n  utils.patchToString(proxyObj, fnStr)\n\n  return true\n}",replaceGetterSetter:"(obj, propName, handlerGetterSetter) => {\n  const ownPropertyDescriptor = Object.getOwnPropertyDescriptor(obj, propName)\n  const handler = { ...ownPropertyDescriptor }\n\n  if (handlerGetterSetter.get !== undefined) {\n    const nativeFn = ownPropertyDescriptor.get\n    handler.get = function() {\n      return handlerGetterSetter.get.call(this, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.get, nativeFn)\n  }\n\n  if (handlerGetterSetter.set !== undefined) {\n    const nativeFn = ownPropertyDescriptor.set\n    handler.set = function(newValue) {\n      handlerGetterSetter.set.call(this, newValue, nativeFn.bind(this))\n    }\n    utils.redirectToString(handler.set, 
nativeFn)\n  }\n\n  Object.defineProperty(obj, propName, handler)\n}",mockWithProxy:"(obj, propName, pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n\n  utils.replaceProperty(obj, propName, { value: proxyObj })\n  utils.patchToString(proxyObj)\n\n  return true\n}",createProxy:"(pseudoTarget, handler) => {\n  const proxyObj = new Proxy(pseudoTarget, utils.stripProxyFromErrors(handler))\n  utils.patchToString(proxyObj)\n\n  return proxyObj\n}",splitObjPath:"objPath => ({\n  // Remove last dot entry (property) ==> `HTMLMediaElement.prototype`\n  objName: objPath.split('.').slice(0, -1).join('.'),\n  // Extract last dot entry ==> `canPlayType`\n  propName: objPath.split('.').slice(-1)[0]\n})",replaceObjPathWithProxy:"(objPath, handler) => {\n  const { objName, propName } = utils.splitObjPath(objPath)\n  const obj = eval(objName) // eslint-disable-line no-eval\n  return utils.replaceWithProxy(obj, propName, handler)\n}",execRecursively:"(obj = {}, typeFilter = [], fn) => {\n  function recurse(obj) {\n    for (const key in obj) {\n      if (obj[key] === undefined) {\n        continue\n      }\n      if (obj[key] && typeof obj[key] === 'object') {\n        recurse(obj[key])\n      } else {\n        if (obj[key] && typeFilter.includes(typeof obj[key])) {\n          fn.call(this, obj[key])\n        }\n      }\n    }\n  }\n  recurse(obj)\n  return obj\n}",stringifyFns:"(fnObj = { hello: () => 'world' }) => {\n  // Object.fromEntries() ponyfill (in 6 lines) - supported only in Node v12+, modern browsers are fine\n  // https://github.com/feross/fromentries\n  function fromEntries(iterable) {\n    return [...iterable].reduce((obj, [key, val]) => {\n      obj[key] = val\n      return obj\n    }, {})\n  }\n  return (Object.fromEntries || fromEntries)(\n    Object.entries(fnObj)\n      .filter(([key, value]) => typeof value === 'function')\n      .map(([key, value]) => [key, value.toString()]) // eslint-disable-line 
no-eval\n  )\n}",materializeFns:"(fnStrObj = { hello: \"() => 'world'\" }) => {\n  return Object.fromEntries(\n    Object.entries(fnStrObj).map(([key, value]) => {\n      if (value.startsWith('function')) {\n        // some trickery is needed to make oldschool functions work :-)\n        return [key, eval(`() => ${value}`)()] // eslint-disable-line no-eval\n      } else {\n        // arrow functions just work\n        return [key, eval(value)] // eslint-disable-line no-eval\n      }\n    })\n  )\n}",makeHandler:"() => ({\n  // Used by simple `navigator` getter evasions\n  getterValue: value => ({\n    apply(target, ctx, args) {\n      // Let's fetch the value first, to trigger and escalate potential errors\n      // Illegal invocations like `navigator.__proto__.vendor` will throw here\n      utils.cache.Reflect.apply(...arguments)\n      return value\n    }\n  })\n})",arrayEquals:"(array1, array2) => {\n  if (array1.length !== array2.length) {\n    return false\n  }\n  for (let i = 0; i < array1.length; ++i) {\n    if (array1[i] !== array2[i]) {\n      return false\n    }\n  }\n  return true\n}",memoize:"fn => {\n  const cache = []\n  return function(...args) {\n    if (!cache.some(c => utils.arrayEquals(c.key, args))) {\n      cache.push({ key: args, value: fn.apply(this, args) })\n    }\n    return cache.find(c => utils.arrayEquals(c.key, args)).value\n  }\n}"},_mainFunction:"(utils, opts) => {\n      try {\n        // Adds a contentWindow proxy to the provided iframe element\n        const addContentWindowProxy = iframe => {\n          const contentWindowProxy = {\n            get(target, key) {\n              // Now to the interesting part:\n              // We actually make this thing behave like a regular iframe window,\n              // by intercepting calls to e.g. `.self` and redirect it to the correct thing. 
:)\n              // That makes it possible for these assertions to be correct:\n              // iframe.contentWindow.self === window.top // must be false\n              if (key === 'self') {\n                return this\n              }\n              // iframe.contentWindow.frameElement === iframe // must be true\n              if (key === 'frameElement') {\n                return iframe\n              }\n              // Intercept iframe.contentWindow[0] to hide the property 0 added by the proxy.\n              if (key === '0') {\n                return undefined\n              }\n              return Reflect.get(target, key)\n            }\n          }\n\n          if (!iframe.contentWindow) {\n            const proxy = new Proxy(window, contentWindowProxy)\n            Object.defineProperty(iframe, 'contentWindow', {\n              get() {\n                return proxy\n              },\n              set(newValue) {\n                return newValue // contentWindow is immutable\n              },\n              enumerable: true,\n              configurable: false\n            })\n          }\n        }\n\n        // Handles iframe element creation, augments `srcdoc` property so we can intercept further\n        const handleIframeCreation = (target, thisArg, args) => {\n          const iframe = target.apply(thisArg, args)\n\n          // We need to keep the originals around\n          const _iframe = iframe\n          const _srcdoc = _iframe.srcdoc\n\n          // Add hook for the srcdoc property\n          // We need to be very surgical here to not break other iframes by accident\n          Object.defineProperty(iframe, 'srcdoc', {\n            configurable: true, // Important, so we can reset this later\n            get: function() {\n              return _srcdoc\n            },\n            set: function(newValue) {\n              addContentWindowProxy(this)\n              // Reset property, the hook is only needed once\n              
Object.defineProperty(iframe, 'srcdoc', {\n                configurable: false,\n                writable: false,\n                value: _srcdoc\n              })\n              _iframe.srcdoc = newValue\n            }\n          })\n          return iframe\n        }\n\n        // Adds a hook to intercept iframe creation events\n        const addIframeCreationSniffer = () => {\n          /* global document */\n          const createElementHandler = {\n            // Make toString() native\n            get(target, key) {\n              return Reflect.get(target, key)\n            },\n            apply: function(target, thisArg, args) {\n              const isIframe =\n                args && args.length && `${args[0]}`.toLowerCase() === 'iframe'\n              if (!isIframe) {\n                // Everything as usual\n                return target.apply(thisArg, args)\n              } else {\n                return handleIframeCreation(target, thisArg, args)\n              }\n            }\n          }\n          // All this just due to iframes with srcdoc bug\n          utils.replaceWithProxy(\n            document,\n            'createElement',\n            createElementHandler\n          )\n        }\n\n        // Let's go\n        addIframeCreationSniffer()\n      } catch (err) {\n        // console.warn(err)\n      }\n    }",_args:[]});
\ No newline at end of file
diff --git a/apps/api/pyproject.toml b/apps/api/pyproject.toml
index dc07911..578c0bd 100644
--- a/apps/api/pyproject.toml
+++ b/apps/api/pyproject.toml
@@ -25,6 +25,7 @@ dependencies = [
     "html-telegraph-poster-v2>=0.2.5",
     "firecrawl-py>=4.13.0",
     "zyte-api>=0.8.1",
+    "celery[redis]>=5.4.0",
 ]
 
 [build-system]
diff --git a/apps/api/src/config.py b/apps/api/src/config.py
index aa1e7de..e02c3af 100644
--- a/apps/api/src/config.py
+++ b/apps/api/src/config.py
@@ -37,13 +37,14 @@
 telegraph_token_list = env.get("TELEGRAPH_TOKEN_LIST", "")
 TELEGRAPH_TOKEN_LIST = telegraph_token_list.split(",") if telegraph_token_list else None
 
-# Youtube-dl environment variables
+# File exporter toggle (used by telegram bot to show/hide buttons)
 FILE_EXPORTER_ON = get_env_bool(env, "FILE_EXPORTER_ON", True)
-FILE_EXPORTER_HOST = env.get("FILE_EXPORTER_HOST", "fast-yt-downloader")
-FILE_EXPORTER_PORT = env.get("FILE_EXPORTER_PORT", "4000")
-FILE_EXPORTER_URL = f"http://{FILE_EXPORTER_HOST}:{FILE_EXPORTER_PORT}"
 DOWNLOAD_VIDEO_TIMEOUT = env.get("DOWNLOAD_VIDEO_TIMEOUT", 600)
 
+# Celery configuration
+CELERY_BROKER_URL = env.get("CELERY_BROKER_URL", "redis://localhost:6379/0")
+CELERY_RESULT_BACKEND = env.get("CELERY_RESULT_BACKEND", "redis://localhost:6379/1")
+
 # Services environment variables
 templates_directory = os.path.join(current_directory, "templates")
 JINJA2_ENV = Environment(
diff --git a/apps/api/src/services/celery_client.py b/apps/api/src/services/celery_client.py
new file mode 100644
index 0000000..49a94ec
--- /dev/null
+++ b/apps/api/src/services/celery_client.py
@@ -0,0 +1,8 @@
+from celery import Celery
+from src.config import CELERY_BROKER_URL, CELERY_RESULT_BACKEND
+
+celery_app = Celery(
+    "fastfetchbot_worker",  # name given to this Celery app
+    broker=CELERY_BROKER_URL,  # message broker URL (from src.config)
+    backend=CELERY_RESULT_BACKEND,  # result backend URL (from src.config)
+)
diff --git a/apps/api/src/services/file_export/audio_transcribe/__init__.py b/apps/api/src/services/file_export/audio_transcribe/__init__.py
index 5088ff7..2f811ca 100644
--- a/apps/api/src/services/file_export/audio_transcribe/__init__.py
+++ b/apps/api/src/services/file_export/audio_transcribe/__init__.py
@@ -1,11 +1,8 @@
-import httpx
+import asyncio
 
-from src.config import OPENAI_API_KEY, FILE_EXPORTER_URL, DOWNLOAD_VIDEO_TIMEOUT
+from src.config import DOWNLOAD_VIDEO_TIMEOUT
+from src.services.celery_client import celery_app
 from fastfetchbot_shared.utils.logger import logger
-from fastfetchbot_shared.utils.parse import wrap_text_into_html
-
-TRANSCRIBE_MODEL = "whisper-1"
-SEGMENT_LENGTH = 5 * 60
 
 
 class AudioTranscribe:
@@ -17,14 +14,16 @@ async def transcribe(self):
 
     @staticmethod
     async def _get_audio_text(audio_file: str):
-        async with httpx.AsyncClient() as client:
-            body = {
-                "audio_file": audio_file,
-                "openai_api_key": OPENAI_API_KEY,
-            }
-            request_url = FILE_EXPORTER_URL + "/transcribe"
-            response = await client.post(
-                url=request_url, json=body, timeout=DOWNLOAD_VIDEO_TIMEOUT
+        logger.info(f"submitting transcribe task: {audio_file}")
+        result = celery_app.send_task("file_export.transcribe", kwargs={
+            "audio_file": audio_file,
+        })
+        try:
+            response = await asyncio.to_thread(result.get, timeout=int(DOWNLOAD_VIDEO_TIMEOUT))
+            return response["transcript"]
+        except Exception:
+            logger.exception(
+                f"file_export.transcribe task failed: audio_file={audio_file}, "
+                f"timeout={DOWNLOAD_VIDEO_TIMEOUT}"
             )
-            transcript = response.json().get("transcript")
-            return transcript
+            raise
diff --git a/apps/api/src/services/file_export/document_export/__init__.py b/apps/api/src/services/file_export/document_export/__init__.py
index 282167d..eb3e41d 100644
--- a/apps/api/src/services/file_export/document_export/__init__.py
+++ b/apps/api/src/services/file_export/document_export/__init__.py
@@ -2,9 +2,13 @@
 
 
 class DocumentExport(object):
+    # Dispatches a document dict to a type-specific exporter (only "pdf" so far).
+    # TODO: implement an export interface for multiple types of documents.
+    # NOTE(review): "content" is passed as PdfExport's first arg (title) - confirm.
     def __init__(self, document):
         self.document = document
 
-    def export(self):
+    async def export(self):
         if self.document["type"] == "pdf":
-            return pdf_export.PdfExport(self.document["content"]).export()
+            return await pdf_export.PdfExport(self.document["content"]).export()  # export() is a coroutine
+        return None
diff --git a/apps/api/src/services/file_export/document_export/pdf_export.py b/apps/api/src/services/file_export/document_export/pdf_export.py
index 88fd0b5..111c3a4 100644
--- a/apps/api/src/services/file_export/document_export/pdf_export.py
+++ b/apps/api/src/services/file_export/document_export/pdf_export.py
@@ -1,24 +1,15 @@
 import asyncio
-import functools
-
-# import gc
-import os
 import uuid
 from pathlib import Path
 
-import aiofiles
 import aiofiles.os
-import httpx
 from bs4 import BeautifulSoup
 
-from src.config import DOWNLOAD_DIR, FILE_EXPORTER_URL, DOWNLOAD_VIDEO_TIMEOUT, TEMP_DIR, AWS_STORAGE_ON
+from src.config import DOWNLOAD_VIDEO_TIMEOUT, AWS_STORAGE_ON
+from src.services.celery_client import celery_app
 from src.services.amazon.s3 import upload as upload_to_s3
 from fastfetchbot_shared.utils.logger import logger
 
-current_directory = os.path.dirname(os.path.abspath(__file__))
-
-PDF_STYLESHEET = os.path.join(current_directory, "pdf_export.css")
-
 
 async def upload_file_to_s3(output_filename):
     return await upload_to_s3(
@@ -33,40 +24,26 @@ def __init__(self, title: str, html_string: str = None):
         self.title = title
         self.html_string = html_string
 
-    async def export(self, method: str = "file") -> str:
-        body = {
-            "method": method
-        }
+    async def export(self) -> str:
         html_string = self.wrap_html_string(self.html_string)
-        if method == "string":
-            body["html_string"] = html_string,
-            logger.debug(
-                f"""
-                    html_string: {html_string}
-                    """
-            )
-        elif method == "file":
-            filename = f"{self.title}-{uuid.uuid4()}.html"
-            filename = os.path.join(TEMP_DIR, filename)
-            async with aiofiles.open(
-                filename, "w", encoding="utf-8"
-            ) as f:
-                await f.write(html_string)
-                html_file = filename
-                logger.debug(html_file)
-            body["html_file"] = html_file
         output_filename = f"{self.title}-{uuid.uuid4()}.pdf"
-        body["output_filename"] = output_filename
 
-        async with httpx.AsyncClient() as client:
-            request_url = FILE_EXPORTER_URL + "/pdfExport"
-            logger.info(f"requesting pdf export from pdf server: {body}")
-            resp = await client.post(
-                request_url, json=body, timeout=DOWNLOAD_VIDEO_TIMEOUT
+        logger.info(f"submitting pdf export task: {output_filename}")
+        result = celery_app.send_task("file_export.pdf_export", kwargs={
+            "html_string": html_string,
+            "output_filename": output_filename,
+        })
+        try:
+            response = await asyncio.to_thread(result.get, timeout=int(DOWNLOAD_VIDEO_TIMEOUT))
+            output_filename = response["output_filename"]
+        except Exception:
+            logger.exception(
+                f"file_export.pdf_export task failed: output_filename={output_filename}, "
+                f"timeout={DOWNLOAD_VIDEO_TIMEOUT}"
             )
-        output_filename = resp.json().get("output_filename")
+            raise
         logger.info(f"pdf export success: {output_filename}")
-        await aiofiles.os.remove(html_file)
+
         if AWS_STORAGE_ON:
             local_filename = output_filename
             output_filename = await upload_file_to_s3(Path(output_filename))
diff --git a/apps/api/src/services/file_export/video_download/__init__.py b/apps/api/src/services/file_export/video_download/__init__.py
index 01f95b6..aebda54 100644
--- a/apps/api/src/services/file_export/video_download/__init__.py
+++ b/apps/api/src/services/file_export/video_download/__init__.py
@@ -1,3 +1,4 @@
+import asyncio
 from typing import Any, Optional
 
 import httpx
@@ -5,7 +6,8 @@
 
 from fastfetchbot_shared.models.metadata_item import MetadataItem, MessageType, MediaFile
 from src.services.file_export.audio_transcribe import AudioTranscribe
-from src.config import FILE_EXPORTER_URL, DOWNLOAD_VIDEO_TIMEOUT
+from src.services.celery_client import celery_app
+from src.config import DOWNLOAD_VIDEO_TIMEOUT
 from fastfetchbot_shared.utils.parse import unix_timestamp_to_utc, second_to_time, wrap_text_into_html
 from fastfetchbot_shared.utils.logger import logger
 from src.config import JINJA2_ENV
@@ -136,7 +138,7 @@ async def get_video_info(
             hd: bool = None,
     ) -> dict:
         """
-        make a request to youtube-dl server to get video info
+        Submit a Celery task to download/extract video info.
         :return: video info dict
         """
         if url is None:
@@ -149,30 +151,33 @@ async def get_video_info(
             audio_only = self.audio_only
         if hd is None:
             hd = self.hd
-        async with httpx.AsyncClient() as client:
-            body = {
-                "url": url,
-                "download": download,
-                "extractor": extractor,
-                "audio_only": audio_only,
-                "hd": hd,
-            }
-            request_url = FILE_EXPORTER_URL + "/videoDownload"
-            logger.info(f"requesting video info from youtube-dl server: {body}")
-            if download is True:
-                logger.info(f"video downloading... it may take a while")
-                if hd is True:
-                    logger.info(f"downloading HD video, it may take longer")
-                elif audio_only is True:
-                    logger.info(f"downloading audio only")
-            logger.debug(f"downloading video timeout: {DOWNLOAD_VIDEO_TIMEOUT}")
-            resp = await client.post(
-                request_url, json=body, timeout=DOWNLOAD_VIDEO_TIMEOUT
-            )
-            content_info = resp.json().get("content_info")
-            file_path = resp.json().get("file_path")
-            content_info["file_path"] = file_path
+        body = {
+            "url": url,
+            "download": download,
+            "extractor": extractor,
+            "audio_only": audio_only,
+            "hd": hd,
+        }
+        logger.info(f"submitting video download task: {body}")
+        if download is True:
+            logger.info("video downloading... it may take a while")
+            if hd is True:
+                logger.info("downloading HD video, it may take longer")
+            elif audio_only is True:
+                logger.info("downloading audio only")
+        logger.debug(f"downloading video timeout: {DOWNLOAD_VIDEO_TIMEOUT}")
+        result = celery_app.send_task("file_export.video_download", kwargs=body)
+        try:
+            response = await asyncio.to_thread(result.get, timeout=int(DOWNLOAD_VIDEO_TIMEOUT))
+            content_info = response["content_info"]
+            content_info["file_path"] = response["file_path"]
             return content_info
+        except Exception:
+            logger.exception(
+                f"file_export.video_download task failed: url={url}, extractor={extractor}, "
+                f"timeout={DOWNLOAD_VIDEO_TIMEOUT}"
+            )
+            raise
 
     def _video_info_formatting(self, meta_info: dict):
         self.title = meta_info["title"]
diff --git a/apps/api/src/services/scrapers/common.py b/apps/api/src/services/scrapers/common.py
index d7b83cf..0ea0d7a 100644
--- a/apps/api/src/services/scrapers/common.py
+++ b/apps/api/src/services/scrapers/common.py
@@ -97,7 +97,7 @@ async def process_item(self, metadata_item: dict) -> dict:
                 pdf_document = document_export.pdf_export.PdfExport(
                     title=metadata_item["title"], html_string=metadata_item["content"]
                 )
-                output_filename = await pdf_document.export(method="file")
+                output_filename = await pdf_document.export()
                 metadata_item["media_files"].append(
                     {
                         "media_type": "document",
diff --git a/apps/worker/Dockerfile b/apps/worker/Dockerfile
new file mode 100644
index 0000000..bf626b1
--- /dev/null
+++ b/apps/worker/Dockerfile
@@ -0,0 +1,76 @@
+
+# `python-base` sets up all our shared environment variables
+FROM python:3.12-slim AS python-base
+
+ENV PYTHONUNBUFFERED=1 \
+    PYTHONDONTWRITEBYTECODE=1 \
+    # uv settings
+    UV_PROJECT_ENVIRONMENT="/opt/pysetup/.venv" \
+    UV_COMPILE_BYTECODE=1 \
+    UV_LINK_MODE=copy \
+    # paths
+    PYSETUP_PATH="/opt/pysetup" \
+    VENV_PATH="/opt/pysetup/.venv"
+
+# prepend venv to path
+ENV PATH="$VENV_PATH/bin:$PATH"
+
+
+# `builder-base` stage is used to build deps + create our virtual environment
+FROM python-base AS builder-base
+
+# install uv from the official image
+COPY --from=ghcr.io/astral-sh/uv:0.10.4 /uv /usr/local/bin/uv
+
+# install system packages; the apt lists are removed in the same layer so they are not stored
+RUN apt-get update \
+    && apt-get install --no-install-recommends -y \
+        ffmpeg \
+        libpango-1.0-0 \
+        libpangoft2-1.0-0 \
+        libjpeg-dev \
+        libopenjp2-7-dev \
+        libffi-dev \
+        build-essential \
+        fonts-wqy-microhei \
+        fonts-wqy-zenhei \
+        fonts-noto-cjk \
+        fonts-noto-cjk-extra \
+    && rm -rf /var/lib/apt/lists/*
+
+# copy workspace files for dependency resolution
+WORKDIR $PYSETUP_PATH
+COPY pyproject.toml uv.lock ./
+COPY packages/ packages/
+COPY apps/worker/ apps/worker/
+
+# install runtime deps
+RUN uv sync --frozen --no-dev --no-install-project --package fastfetchbot-worker
+
+
+# `production` image used for runtime
+FROM python-base AS production
+# worker_core is imported from the source tree (uv sync above uses --no-install-project)
+# no stage in this file defines PYTHONPATH, so it is set outright rather than appended to an empty value
+ENV PYTHONPATH=/app/apps/worker
+# runtime system packages (the builder list minus build-essential); apt lists removed in the same layer
+RUN apt-get update \
+    && apt-get install --no-install-recommends -y \
+        ffmpeg \
+        libpango-1.0-0 \
+        libpangoft2-1.0-0 \
+        libjpeg-dev \
+        libopenjp2-7-dev \
+        libffi-dev \
+        fonts-wqy-microhei \
+        fonts-wqy-zenhei \
+        fonts-noto-cjk \
+        fonts-noto-cjk-extra \
+    && rm -rf /var/lib/apt/lists/*
+# bring over the virtual environment created in builder-base
+COPY --from=builder-base $PYSETUP_PATH $PYSETUP_PATH
+COPY packages/ /app/packages/
+COPY apps/worker/ /app/apps/worker/
+WORKDIR /app/apps/worker
+# start a Celery worker for worker_core.main:app with a concurrency of 2
+CMD ["celery", "-A", "worker_core.main:app", "worker", "--loglevel=info", "--concurrency=2"]
diff --git a/app/__init__.py b/apps/worker/celerybeat-schedule.db
similarity index 100%
rename from app/__init__.py
rename to apps/worker/celerybeat-schedule.db
diff --git a/apps/worker/pyproject.toml b/apps/worker/pyproject.toml
new file mode 100644
index 0000000..46376b2
--- /dev/null
+++ b/apps/worker/pyproject.toml
@@ -0,0 +1,23 @@
+[project]
+name = "fastfetchbot-worker"
+version = "0.1.0"
+requires-python = ">=3.12,<3.13"
+dependencies = [
+    "fastfetchbot-file-export",
+    "fastfetchbot-shared",
+    "celery[redis]>=5.4.0",
+]
+
+[build-system]
+requires = ["hatchling"]
+build-backend = "hatchling.build"
+
+[tool.hatch.build.targets.wheel]
+packages = ["worker_core"]
+
+[tool.uv]
+package = false
+
+[tool.uv.sources]
+fastfetchbot-file-export = { workspace = true }
+fastfetchbot-shared = { workspace = true }
diff --git a/app/services/__init__.py b/apps/worker/worker_core/__init__.py
similarity index 100%
rename from app/services/__init__.py
rename to apps/worker/worker_core/__init__.py
diff --git a/apps/worker/worker_core/config.py b/apps/worker/worker_core/config.py
new file mode 100644
index 0000000..cb4fdc1
--- /dev/null
+++ b/apps/worker/worker_core/config.py
@@ -0,0 +1,24 @@
+import os
+
+from fastfetchbot_shared.utils.parse import get_env_bool
+
+env = os.environ  # every setting below is read from the process environment
+
+current_directory = os.path.dirname(os.path.abspath(__file__))  # directory containing this module
+conf_dir = os.path.join(current_directory, "..", "conf")  # "conf" directory one level above this package
+
+CELERY_BROKER_URL = env.get("CELERY_BROKER_URL", "redis://localhost:6379/0")  # default: local Redis, db 0
+CELERY_RESULT_BACKEND = env.get("CELERY_RESULT_BACKEND", "redis://localhost:6379/1")  # default: local Redis, db 1
+
+# Conf directory: defaults to apps/worker/conf/ (same convention as API's apps/api/conf/)
+# In Docker, override via CONF_DIR env var to /app/conf (where the volume is mounted)
+CONF_DIR = env.get("CONF_DIR", conf_dir)
+
+# File export config
+DOWNLOAD_DIR = env.get("DOWNLOAD_DIR", "/tmp")  # directory handed to the export/download tasks
+COOKIE_FILE_PATH = env.get("COOKIE_FILE_PATH", os.path.join(CONF_DIR, "cookies.txt"))  # defaults to CONF_DIR/cookies.txt
+PROXY_MODE = get_env_bool(env, "PROXY_MODE", False)
+PROXY_URL = env.get("PROXY_URL", "")
+YOUTUBE_COOKIE = get_env_bool(env, "YOUTUBE_COOKIE", False)
+BILIBILI_COOKIE = get_env_bool(env, "BILIBILI_COOKIE", False)
+OPENAI_API_KEY = env.get("OPENAI_API_KEY", "")  # empty string when unset
diff --git a/apps/worker/worker_core/main.py b/apps/worker/worker_core/main.py
new file mode 100644
index 0000000..348cb66
--- /dev/null
+++ b/apps/worker/worker_core/main.py
@@ -0,0 +1,21 @@
+from celery import Celery
+from worker_core.config import CELERY_BROKER_URL, CELERY_RESULT_BACKEND
+
+app = Celery(
+    "fastfetchbot_worker",  # application name
+    broker=CELERY_BROKER_URL,
+    backend=CELERY_RESULT_BACKEND,
+)
+
+app.conf.update(
+    task_serializer="json",
+    result_serializer="json",
+    accept_content=["json"],  # JSON is the only accepted content type
+    task_track_started=True,
+    task_time_limit=660,  # hard limit slightly above download timeout
+    task_soft_time_limit=600,  # soft limit, 60 below the hard limit
+    result_expires=3600,  # NOTE(review): presumably seconds (one hour) - confirm against Celery docs
+)
+
+# Auto-discover tasks in the listed packages (the worker_core.tasks package imports each task module)
+app.autodiscover_tasks(["worker_core"])
diff --git a/apps/worker/worker_core/tasks/__init__.py b/apps/worker/worker_core/tasks/__init__.py
new file mode 100644
index 0000000..e9cf0ab
--- /dev/null
+++ b/apps/worker/worker_core/tasks/__init__.py
@@ -0,0 +1,2 @@
+# Explicitly import all task modules so @app.task decorators run on worker startup
+from . import video, pdf, transcribe
diff --git a/apps/worker/worker_core/tasks/pdf.py b/apps/worker/worker_core/tasks/pdf.py
new file mode 100644
index 0000000..8f47060
--- /dev/null
+++ b/apps/worker/worker_core/tasks/pdf.py
@@ -0,0 +1,23 @@
+from worker_core.main import app
+from worker_core.config import DOWNLOAD_DIR
+from fastfetchbot_file_export.pdf_export import export_pdf
+from fastfetchbot_shared.utils.logger import logger
+
+
+@app.task(name="file_export.pdf_export")
+def pdf_export_task(html_string: str, output_filename: str) -> dict:
+    """Celery task: render ``html_string`` to a PDF file inside DOWNLOAD_DIR.
+
+    Returns the path from ``export_pdf`` under "output_filename"; errors are logged and re-raised.
+    """
+    logger.info(
+        f"pdf_export_task started: output_filename={output_filename}, "
+        f"html_string length={len(html_string)}, DOWNLOAD_DIR={DOWNLOAD_DIR}"
+    )
+    try:
+        pdf_path = export_pdf(html_string=html_string, output_filename=output_filename, download_dir=DOWNLOAD_DIR)
+    except Exception:
+        logger.exception(f"pdf_export_task failed: output_filename={output_filename}")
+        raise
+    logger.info(f"pdf_export_task completed: output_path={pdf_path}")
+    return {"status": "success", "output_filename": pdf_path}
diff --git a/apps/worker/worker_core/tasks/transcribe.py b/apps/worker/worker_core/tasks/transcribe.py
new file mode 100644
index 0000000..82068d6
--- /dev/null
+++ b/apps/worker/worker_core/tasks/transcribe.py
@@ -0,0 +1,19 @@
+from worker_core.main import app
+from worker_core.config import OPENAI_API_KEY
+from fastfetchbot_file_export.transcribe import get_audio_text
+from fastfetchbot_shared.utils.logger import logger
+
+
+@app.task(name="file_export.transcribe")
+def transcribe_task(audio_file: str) -> dict:  # Celery task wrapping get_audio_text for one audio file path
+    logger.info(f"transcribe_task started: audio_file={audio_file}")
+    if not OPENAI_API_KEY:  # fail before touching the audio when no key is configured
+        logger.error("transcribe_task failed: OPENAI_API_KEY is not set")
+        raise ValueError("OPENAI_API_KEY is not configured in the worker environment")
+    try:
+        transcript = get_audio_text(audio_file, OPENAI_API_KEY)
+    except Exception:  # log with traceback, then let the original exception propagate
+        logger.exception(f"transcribe_task failed: audio_file={audio_file}")
+        raise
+    logger.info(f"transcribe_task completed: audio_file={audio_file}, transcript length={len(transcript)}")
+    return {"transcript": transcript, "message": "ok"}
diff --git a/apps/worker/worker_core/tasks/video.py b/apps/worker/worker_core/tasks/video.py
new file mode 100644
index 0000000..767a737
--- /dev/null
+++ b/apps/worker/worker_core/tasks/video.py
@@ -0,0 +1,72 @@
+from worker_core.main import app
+from worker_core.config import (
+    DOWNLOAD_DIR,
+    COOKIE_FILE_PATH,
+    PROXY_MODE,
+    PROXY_URL,
+    YOUTUBE_COOKIE,
+    BILIBILI_COOKIE,
+)
+from fastfetchbot_file_export.video_download import download_video
+from fastfetchbot_shared.utils.logger import logger
+
+# Union of fields used by _youtube_info_parse and _bilibili_info_parse
+_CONTENT_INFO_FIELDS = (
+    "id", "title", "uploader", "uploader_url", "uploader_id", "channel_url",
+    "description", "view_count", "comment_count", "like_count",
+    "thumbnail", "upload_date", "timestamp", "duration", "ext",
+)
+
+
+def _sanitize_content_info(content_info: dict) -> dict:
+    """Reduce a raw yt-dlp info dict to the fields the API consumer reads.
+
+    Keeps ``_CONTENT_INFO_FIELDS`` and at most one ``formats`` entry holding the first non-null ``aspect_ratio``.
+    """
+    slim = {field: content_info.get(field) for field in _CONTENT_INFO_FIELDS}
+    # First format exposing a usable aspect_ratio - mirrors get_video_orientation logic.
+    ratio = next(
+        (
+            fmt["aspect_ratio"]
+            for fmt in content_info.get("formats") or []
+            if "aspect_ratio" in fmt and fmt["aspect_ratio"] is not None
+        ),
+        None,
+    )
+    slim["formats"] = [] if ratio is None else [{"aspect_ratio": ratio}]
+    return slim
+
+
+@app.task(name="file_export.video_download")
+def video_download_task(
+    url: str,
+    download: bool = True,
+    hd: bool = False,
+    extractor: str = "youtube",
+    audio_only: bool = False,
+) -> dict:
+    """Celery task: run ``download_video`` with the worker's settings.
+
+    The worker always passes ``LOCAL_MODE=True``. On success the yt-dlp
+    ``content_info`` is trimmed by ``_sanitize_content_info`` before the result
+    is returned; failures are logged with a traceback and re-raised.
+    """
+    logger.info(f"video_download_task started: url={url}, extractor={extractor}, download={download}, hd={hd}, audio_only={audio_only}")
+    # Settings come from worker_core.config.
+    worker_settings = dict(
+        DOWNLOAD_DIR=DOWNLOAD_DIR, COOKIE_FILE_PATH=COOKIE_FILE_PATH,
+        PROXY_MODE=PROXY_MODE, PROXY_URL=PROXY_URL,
+        YOUTUBE_COOKIE=YOUTUBE_COOKIE, BILIBILI_COOKIE=BILIBILI_COOKIE,
+        LOCAL_MODE=True,
+    )
+    request = dict(url=url, download=download, hd=hd, extractor=extractor, audio_only=audio_only)
+    # Log and re-raise so the original exception reaches the caller.
+    try:
+        result = download_video(**request, config=worker_settings)
+    except Exception:
+        logger.exception(f"video_download_task failed: url={url}, extractor={extractor}")
+        raise
+    # Replace the full info dict with the reduced one before returning it.
+    result["content_info"] = _sanitize_content_info(result["content_info"])
+    logger.info(f"video_download_task completed: url={url}, file_path={result.get('file_path')}")
+    return result
diff --git a/docker-compose.template.yml b/docker-compose.template.yml
index 7380e5f..24aff9c 100644
--- a/docker-compose.template.yml
+++ b/docker-compose.template.yml
@@ -8,13 +8,17 @@ services:
     # restart: always
     volumes:
       - ./conf:/app/conf
-      - video_file:/tmp
+      - shared_files:/tmp
     env_file:
       - .env
+    environment:
+      - CELERY_BROKER_URL=redis://redis:6379/0
+      - CELERY_RESULT_BACKEND=redis://redis:6379/1
     ports:
       - 10450:10450
     depends_on:
       - telegram-bot-api
+      - redis
 
   telegram-bot:
     image: ghcr.io/aturret/fastfetchbot-telegram-bot:latest
@@ -50,20 +54,36 @@ services:
       - TELEGRAM_STAT=1
       - TELEBOT_API_SERVER_PORT=8081
 
-  fast-yt-downloader:
-    image: aturret/fast-yt-downloader:latest
-    container_name: fastytd
+  redis:
+    image: redis:7-alpine
+    container_name: fastfetchbot-redis
     restart: always
-    environment:
-      - PORT=4000
     volumes:
-      - video_file:${DOWNLOAD_DIR}
+      - redis_data:/data
     ports:
-      - 4000:4000
+      - '127.0.0.1:6379:6379'  # loopback only; api/worker reach Redis at redis:6379 on the compose network
+
+  worker:
+    image: ghcr.io/aturret/fastfetchbot-worker:latest
+    # build:
+    #   context: .
+    #   dockerfile: apps/worker/Dockerfile
+    container_name: fastfetchbot-worker
+    restart: always
+    env_file:
+      - .env
+    environment:
+      - CELERY_BROKER_URL=redis://redis:6379/0
+      - CELERY_RESULT_BACKEND=redis://redis:6379/1
+      - CONF_DIR=/app/conf
+    volumes:
+      - ./conf:/app/conf
+      - shared_files:/tmp
     depends_on:
-      - api
+      - redis
 
 
 volumes:
   telegram-bot-api-data-cache:
-  video_file:
+  redis_data:
+  shared_files:
diff --git a/packages/file-export/fastfetchbot_file_export/__init__.py b/packages/file-export/fastfetchbot_file_export/__init__.py
new file mode 100644
index 0000000..4ecdaf4
--- /dev/null
+++ b/packages/file-export/fastfetchbot_file_export/__init__.py
@@ -0,0 +1 @@
+"""FastFetchBot file export services: video download, PDF export, audio transcription."""
diff --git a/app/services/file_export/document_export/pdf_export.css b/packages/file-export/fastfetchbot_file_export/pdf_export.css
similarity index 100%
rename from app/services/file_export/document_export/pdf_export.css
rename to packages/file-export/fastfetchbot_file_export/pdf_export.css
diff --git a/packages/file-export/fastfetchbot_file_export/pdf_export.py b/packages/file-export/fastfetchbot_file_export/pdf_export.py
new file mode 100644
index 0000000..e9ec16c
--- /dev/null
+++ b/packages/file-export/fastfetchbot_file_export/pdf_export.py
@@ -0,0 +1,39 @@
+import os
+
+from weasyprint import HTML, CSS
+from weasyprint.text.fonts import FontConfiguration
+
+CSS_FILE = os.path.join(os.path.dirname(os.path.abspath(__file__)), "pdf_export.css")
+
+
+def convert_html_to_pdf(
+    output_filename: str,
+    html_string: str = None,
+    html_file: str = None,
+) -> None:
+    """Render HTML (``html_file`` wins over ``html_string``) to ``output_filename`` with the bundled CSS."""
+    fonts = FontConfiguration()
+    stylesheet = CSS(filename=CSS_FILE, font_config=fonts)
+    if not (html_file or html_string):
+        raise ValueError("Either html_string or html_file must be provided")
+    if html_file:
+        document = HTML(filename=html_file, encoding="utf-8")
+    else:
+        document = HTML(string=html_string)
+    document.write_pdf(output_filename, stylesheets=[stylesheet])
+
+
+def export_pdf(
+    html_string: str = None,
+    html_file: str = None,
+    output_filename: str = "output.pdf",
+    download_dir: str = "/tmp",
+) -> str:
+    """Write the PDF to ``download_dir/output_filename`` and return that path.
+
+    ``html_string`` / ``html_file`` are forwarded unchanged to
+    ``convert_html_to_pdf``, which raises ``ValueError`` if both are empty.
+    """
+    destination = os.path.join(download_dir, output_filename)
+    convert_html_to_pdf(destination, html_string=html_string, html_file=html_file)
+    return destination
diff --git a/packages/file-export/fastfetchbot_file_export/transcribe.py b/packages/file-export/fastfetchbot_file_export/transcribe.py
new file mode 100644
index 0000000..54c81f4
--- /dev/null
+++ b/packages/file-export/fastfetchbot_file_export/transcribe.py
@@ -0,0 +1,113 @@
+import os
+
+from pydub import AudioSegment
+from openai import OpenAI
+from loguru import logger
+
+TRANSCRIBE_MODEL = "whisper-1"
+SEGMENT_LENGTH = 5 * 60  # 5 minutes in seconds
+
+PUNCTUATION_SYSTEM_PROMPT = (
+    "You are a helpful assistant. Your job is to adds punctuation to text. "
+    "What you are going to do should follow the rules below: \n"
+    '1. You have received a text which is transcribed from an audio file which we call it "original text".\n'
+    "2. The response should be presented in the language of the original text.\n"
+    "3. I need you to convert the original text into a new context. During "
+    "this process, please preserve the original words of the given original text and only insert "
+    "necessary punctuation such as periods, commas, capitalization, symbols like dollar signs or "
+    "percentage signs, and formatting according to the language of the provided original text. And I "
+    "hope you to separate the original text into several paragraphs based on the meaning. Please "
+    "use only the provided original text. \n"
+)
+
+SUMMARY_SYSTEM_PROMPT = (
+    "You are a helpful assistant. Your job is to summarize text. "
+    "What you are going to do should follow the rules below: \n"
+    '1. You have received a text which we call it "original text".\n'
+    "2. The response should be presented in the language of the original text.\n"
+    "3. I need you to make a brief statement of the main points of the original text."
+    "Please use only the provided original text. \n"
+)
+
+
+def milliseconds_until_sound(sound, silence_threshold_in_decibels=-20.0, chunk_size=10):
+    """Return the offset in ms (a multiple of ``chunk_size``) of the first chunk at or above the threshold.
+
+    If every chunk is quieter than the threshold, the first multiple of ``chunk_size`` >= ``len(sound)`` is returned.
+    """
+    assert chunk_size > 0
+    offset = 0
+    while sound[offset : offset + chunk_size].dBFS < silence_threshold_in_decibels and offset < len(sound):
+        offset += chunk_size
+    return offset
+
+
+def punctuation_assistant(client: OpenAI, transcript: str) -> str:
+    """Ask the chat model to punctuate and paragraph the raw ``transcript``.
+
+    Sends ``PUNCTUATION_SYSTEM_PROMPT`` as the system message and returns the first choice's text.
+    """
+    conversation = [
+        {"role": "system", "content": PUNCTUATION_SYSTEM_PROMPT},
+        {"role": "user", "content": transcript},
+    ]
+    reply = client.chat.completions.create(model="gpt-3.5-turbo-16k", temperature=0, messages=conversation)
+    return reply.choices[0].message.content
+
+
+def summary_assistant(client: OpenAI, transcript: str) -> str:
+    """Ask the chat model for a brief summary of ``transcript``.
+
+    Sends ``SUMMARY_SYSTEM_PROMPT`` as the system message and returns the first choice's text.
+    """
+    conversation = [
+        {"role": "system", "content": SUMMARY_SYSTEM_PROMPT},
+        {"role": "user", "content": transcript},
+    ]
+    reply = client.chat.completions.create(model="gpt-3.5-turbo-16k", temperature=0, messages=conversation)
+    return reply.choices[0].message.content
+
+
+def get_audio_text(audio_file: str, openai_api_key: str) -> str:
+    """
+    Transcribe an audio file using OpenAI Whisper, then post-process with GPT.
+
+    The audio is trimmed of leading silence, split into SEGMENT_LENGTH-second
+    pieces that are transcribed one by one, then punctuated and summarized.
+    Segment files are always deleted; ``audio_file`` is deleted only on success.
+
+    Returns formatted string with summary and full transcript.
+    Raises ValueError when nothing audible remains after trimming.
+    """
+    client = OpenAI(api_key=openai_api_key)
+    transcript = ""
+    AudioSegment.converter = "ffmpeg"
+    audio_file_non_ext, audio_file_ext = os.path.splitext(audio_file)
+    audio_item = AudioSegment.from_file(audio_file, audio_file_ext.lstrip("."))
+    audio_item = audio_item[milliseconds_until_sound(audio_item):]
+    if len(audio_item) == 0:
+        raise ValueError(f"no audible content found in {audio_file}")
+
+    segment_ms = SEGMENT_LENGTH * 1000
+    # Bound the loop by the real length in ms: rounding the duration up to whole seconds
+    # yields an empty trailing segment when the audio is an exact multiple of the segment length.
+    for index, start_time in enumerate(range(0, len(audio_item), segment_ms)):
+        # pydub clamps slices that run past the end, so the last segment needs no special case.
+        audio_segment = audio_item[start_time : start_time + segment_ms]
+        segment_path = f"{audio_file_non_ext}-{index + 1}{audio_file_ext}"
+        try:
+            audio_segment.export(segment_path)
+            logger.info(f"audio_segment_path: {segment_path}")
+            with open(segment_path, "rb") as f:
+                result = client.audio.transcriptions.create(model=TRANSCRIBE_MODEL, file=f)
+            transcript += result.text
+        finally:
+            # Remove the temporary segment even when export/transcription fails.
+            if os.path.exists(segment_path):
+                os.remove(segment_path)
+
+    transcript = punctuation_assistant(client, transcript)
+    transcript = f"全文总结：\n{summary_assistant(client, transcript)}\n原文：\n{transcript}"
+    logger.info(f"transcript: {transcript}")
+    os.remove(audio_file)
+    return transcript
diff --git a/packages/file-export/fastfetchbot_file_export/video_download.py b/packages/file-export/fastfetchbot_file_export/video_download.py
new file mode 100644
index 0000000..e70cb73
--- /dev/null
+++ b/packages/file-export/fastfetchbot_file_export/video_download.py
@@ -0,0 +1,206 @@
+import os
+import traceback
+
+from loguru import logger
+from yt_dlp import YoutubeDL
+
+
+def get_video_orientation(content_info: dict, extractor: str) -> str:
+    """Classify a video as "vertical" or "horizontal" from its yt-dlp formats.
+
+    Only YouTube is inspected; any other extractor, missing formats, or formats
+    without an aspect ratio all yield "horizontal".
+    """
+    if extractor == "youtube":
+        # The first entry with a non-null aspect_ratio decides; audio-only entries have none.
+        ratios = (
+            entry["aspect_ratio"]
+            for entry in content_info.get("formats") or ()
+            if "aspect_ratio" in entry and entry["aspect_ratio"] is not None
+        )
+        return "vertical" if next(ratios, 1) < 1 else "horizontal"
+    return "horizontal"
+
+
+def get_format_for_orientation(
+    extractor: str, orientation: str, hd: bool, bilibili_cookie: bool = False
+) -> str:
+    """Pick the yt-dlp format selector for an extractor, orientation and quality.
+
+    Raises ValueError for extractors other than "youtube" and "bilibili".
+    """
+    if extractor == "youtube":
+        if orientation == "vertical":
+            return "bv[ext=mp4]+ba/b"
+        # Non-vertical: HD pins mp4 video plus specific audio format ids (258/256/140).
+        return "bv[ext=mp4]+(258/256/140)/best" if hd else "bv+ba/b"
+    if extractor == "bilibili":
+        # The HD selector needs both the hd flag and bilibili cookies; otherwise prefer <=480p.
+        if hd and bilibili_cookie:
+            return "bestvideo[ext=mp4]+bestaudio[ext=m4a]/best[ext=mp4]/best"
+        return "bv*[height<=480]+ba/b[height<=480] / wv*+ba/w"
+    raise ValueError("no available extractor found")
+
+
+def init_yt_downloader(
+    hd: bool = False,
+    audio_only: bool = False,
+    extractor: str = None,
+    no_proxy: bool = False,
+    extract_only: bool = False,
+    video_format: str = None,
+    download_dir: str = "/tmp",
+    cookie_file_path: str = None,
+    proxy_mode: bool = False,
+    proxy_url: str = "",
+    youtube_cookie: bool = False,
+    bilibili_cookie: bool = False,
+) -> YoutubeDL:
+    """Build a YoutubeDL configured for metadata extraction, audio-only download, or video download."""
+    base_opts = {"merge_output_format": "mp4"}  # shared by all three option profiles
+
+    if extract_only:  # metadata-only profile: skip_download is set, extract_only wins over audio_only
+        ydl_opts = {
+            **base_opts,
+            "ignore_no_formats_error": True,
+            "skip_download": True,
+            "quiet": True,
+            "no_warnings": True,
+            "extract_flat": False,
+            "allow_unplayable_formats": True,
+        }
+    elif audio_only:  # audio profile: prefer m4a and run the FFmpegExtractAudio post-processor
+        ydl_opts = {
+            **base_opts,
+            "paths": {"home": download_dir},
+            "format": "m4a/bestaudio/best",
+            "postprocessors": [
+                {"key": "FFmpegExtractAudio", "preferredcodec": "m4a"}
+            ],
+        }
+    else:  # regular video download profile
+        if video_format is None:  # no selector given: fall back to the horizontal one for this extractor
+            video_format = get_format_for_orientation(
+                extractor, "horizontal", hd, bilibili_cookie
+            )
+
+        ydl_opts = {
+            **base_opts,
+            "paths": {"home": download_dir},
+            "outtmpl": {"default": "%(title).10s-%(id)s.%(ext)s"},  # title cut to 10 chars, then the video id
+            "format": video_format,
+        }
+        if extractor == "bilibili":
+            ydl_opts["referer"] = "https://www.bilibili.com/"
+
+    # Cookies are attached only when enabled for the matching extractor and a cookie path is set.
+    if youtube_cookie and extractor == "youtube" and cookie_file_path:
+        logger.info("Using cookies for youtube")
+        ydl_opts["cookiefile"] = cookie_file_path
+
+    if bilibili_cookie and extractor == "bilibili" and cookie_file_path:
+        logger.info("Using cookies for bilibili")
+        ydl_opts["cookiefile"] = cookie_file_path
+
+    if proxy_mode and not no_proxy:  # no_proxy lets a caller bypass the configured proxy
+        logger.info("Using proxy")
+        ydl_opts["proxy"] = proxy_url
+
+    downloader = YoutubeDL(ydl_opts)
+    return downloader
+
+
+def download_video(
+    url: str,
+    download: bool = True,
+    hd: bool = False,
+    extractor: str = "youtube",
+    audio_only: bool = False,
+    config: dict = None,
+) -> dict:
+    """
+    Download or extract info for a video.
+
+    Runs in two phases: a metadata-only extraction (used to detect the
+    orientation), then, when ``download`` is true, the actual download with a
+    format chosen for that orientation (or the audio-only profile).
+
+    config keys: DOWNLOAD_DIR, COOKIE_FILE_PATH, PROXY_MODE, PROXY_URL,
+                 YOUTUBE_COOKIE, BILIBILI_COOKIE, LOCAL_MODE, BASE_URL
+
+    Returns a dict with ``message``, ``content_info`` (the phase-1 info dict),
+    ``orientation`` and ``file_path``. ``file_path`` is ``None`` when
+    ``download`` is false; with LOCAL_MODE false it is
+    BASE_URL + "/fileDownload" + <local path>.
+
+    Raises whatever yt-dlp or the helpers raise: the exception is logged with
+    its traceback and re-raised unchanged.
+    """
+    if config is None:
+        config = {}
+
+    # These two only affect how the resulting path is reported.
+    local_mode = config.get("LOCAL_MODE", True)
+    base_url = config.get("BASE_URL", "")
+    bilibili_cookie = config.get("BILIBILI_COOKIE", False)
+    # Options shared by every YoutubeDL instance created below.
+    common_opts = {
+        "extractor": extractor,
+        "download_dir": config.get("DOWNLOAD_DIR", "/tmp"),
+        "cookie_file_path": config.get("COOKIE_FILE_PATH", ""),
+        "proxy_mode": config.get("PROXY_MODE", False),
+        "proxy_url": config.get("PROXY_URL", ""),
+        "youtube_cookie": config.get("YOUTUBE_COOKIE", False),
+        "bilibili_cookie": bilibili_cookie,
+    }
+
+    file_path_output = None
+
+    try:
+        # Phase 1: Extract info only (no downloading)
+        with init_yt_downloader(extract_only=True, **common_opts) as extractor_dl:
+            content_info = extractor_dl.extract_info(url, download=False)
+
+        # Determine video orientation
+        orientation = get_video_orientation(content_info, extractor)
+        logger.info(f"Video orientation: {orientation}")
+
+        # Phase 2: Download with appropriate format based on orientation
+        if download:
+            if audio_only:
+                downloader = init_yt_downloader(audio_only=True, **common_opts)
+            else:
+                video_format = get_format_for_orientation(
+                    extractor, orientation, hd, bilibili_cookie
+                )
+                downloader = init_yt_downloader(video_format=video_format, **common_opts)
+
+            with downloader:
+                download_info = downloader.extract_info(url, download=True)
+                # yt-dlp records the final on-disk path (after merging and
+                # post-processing such as audio extraction) per download in
+                # ``requested_downloads``; prepare_filename() only rebuilds
+                # the name from the template and can carry a stale extension,
+                # so it is kept as the last fallback.
+                finished = download_info.get("requested_downloads") or []
+                file_path = (
+                    (finished[0].get("filepath") if finished else None)
+                    or download_info.get("filepath")
+                    or downloader.prepare_filename(download_info)
+                )
+                file_path_output = (
+                    file_path
+                    if local_mode
+                    else base_url + "/fileDownload" + file_path
+                )
+
+        return {
+            "message": "success",
+            "content_info": content_info,
+            "orientation": orientation,
+            "file_path": file_path_output,
+        }
+    except Exception:
+        # logger.exception already appends the active traceback, so it is not
+        # formatted into the message a second time.
+        logger.exception(f"download_video failed: url={url}")
+        raise
diff --git a/packages/file-export/pyproject.toml b/packages/file-export/pyproject.toml
new file mode 100644
index 0000000..96d59fe
--- /dev/null
+++ b/packages/file-export/pyproject.toml
@@ -0,0 +1,15 @@
+[project]
+name = "fastfetchbot-file-export"
+version = "0.1.0"
+requires-python = ">=3.12,<3.13"
+dependencies = [
+    "yt-dlp[default]>=2026.02.04",
+    "weasyprint>=65.1",
+    "pydub>=0.25.1",
+    "openai>=2.15.0",
+    "loguru>=0.7.2",
+]
+
+[build-system]
+requires = ["hatchling"]
+build-backend = "hatchling.build"
diff --git a/pyproject.toml b/pyproject.toml
index f3c357e..993e102 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -41,7 +41,9 @@ dependencies = [
     "html-telegraph-poster-v2>=0.2.5,<0.3.0",
     "firecrawl-py>=4.13.0,<5.0.0",
     "zyte-api>=0.8.1,<0.9.0",
+    "celery[redis]>=5.4.0,<6.0.0",
     "fastfetchbot-shared",
+    "fastfetchbot-file-export",
 ]
 
 [project.optional-dependencies]
@@ -52,6 +54,7 @@ dev = [
     "black>=25.1.0,<26.0.0",
     "pytest>=8.3.5,<9.0.0",
     "pytest-asyncio>=0.26.0,<0.27.0",
+    "celery-types>=0.24.0",
 ]
 
 [build-system]
@@ -63,9 +66,11 @@ package = false
 
 [tool.uv.workspace]
 members = ["packages/*", "apps/*"]
+exclude = ["packages/FastFileExporter"]
 
 [tool.uv.sources]
 fastfetchbot-shared = { workspace = true }
+fastfetchbot-file-export = { workspace = true }
 
 [tool.pytest.ini_options]
 asyncio_default_fixture_loop_scope = "module"
diff --git a/template.env b/template.env
index 29a0345..2cc7512 100644
--- a/template.env
+++ b/template.env
@@ -136,3 +136,10 @@ FIRECRAWL_WAIT_FOR=3000
 # Zyte API
 # The API key for Zyte. Default: `None`
 ZYTE_API_KEY=
+
+# Celery Worker
+# Redis URL for Celery message broker. Default: `redis://localhost:6379/0`
+CELERY_BROKER_URL=redis://redis:6379/0
+
+# Redis URL for Celery result backend. Default: `redis://localhost:6379/1`
+CELERY_RESULT_BACKEND=redis://redis:6379/1
diff --git a/app/services/amazon/__init__.py b/tests/cases/test_file_export/__init__.py
similarity index 100%
rename from app/services/amazon/__init__.py
rename to tests/cases/test_file_export/__init__.py
diff --git a/tests/cases/test_file_export/test_pdf_export.py b/tests/cases/test_file_export/test_pdf_export.py
new file mode 100644
index 0000000..7705fa6
--- /dev/null
+++ b/tests/cases/test_file_export/test_pdf_export.py
@@ -0,0 +1,22 @@
+import os
+import tempfile
+
+import pytest
+
+try:
+    from fastfetchbot_file_export.pdf_export import convert_html_to_pdf
+    HAS_WEASYPRINT = True
+except (OSError, ImportError):
+    HAS_WEASYPRINT = False
+
+
+@pytest.mark.skipif(not HAS_WEASYPRINT, reason="WeasyPrint requires native pango/gobject libraries")
+def test_convert_html_string_to_pdf():
+    with tempfile.TemporaryDirectory() as tmpdir:
+        output = os.path.join(tmpdir, "test.pdf")
+        convert_html_to_pdf(
+            output_filename=output,
+            html_string="<html><body><h1>Test</h1></body></html>",
+        )
+        assert os.path.exists(output)
+        assert os.path.getsize(output) > 0
diff --git a/tests/cases/test_file_export/test_transcribe.py b/tests/cases/test_file_export/test_transcribe.py
new file mode 100644
index 0000000..d0e63bd
--- /dev/null
+++ b/tests/cases/test_file_export/test_transcribe.py
@@ -0,0 +1,26 @@
+import pytest
+
+# transcribe.py imports pydub/openai at import time, so import it inside the guard as well
+try:
+    from pydub import AudioSegment
+    from pydub.generators import Sine
+    from fastfetchbot_file_export.transcribe import milliseconds_until_sound
+    HAS_FFMPEG = True
+except Exception:
+    HAS_FFMPEG = False
+
+
+@pytest.mark.skipif(not HAS_FFMPEG, reason="Requires ffmpeg for audio processing")
+def test_milliseconds_until_sound_no_silence():
+    tone = Sine(440).to_audio_segment(duration=1000)
+    result = milliseconds_until_sound(tone)
+    assert result == 0
+
+
+@pytest.mark.skipif(not HAS_FFMPEG, reason="Requires ffmpeg for audio processing")
+def test_milliseconds_until_sound_with_silence():
+    silence = AudioSegment.silent(duration=500)
+    tone = Sine(440).to_audio_segment(duration=500)
+    audio = silence + tone
+    result = milliseconds_until_sound(audio)
+    assert 450 <= result <= 510  # ~500ms of silence
diff --git a/tests/cases/test_file_export/test_video_download.py b/tests/cases/test_file_export/test_video_download.py
new file mode 100644
index 0000000..989597e
--- /dev/null
+++ b/tests/cases/test_file_export/test_video_download.py
@@ -0,0 +1,58 @@
+from fastfetchbot_file_export.video_download import get_video_orientation, get_format_for_orientation
+
+
+def test_get_video_orientation_vertical():
+    content_info = {"formats": [{"aspect_ratio": 0.5}]}
+    assert get_video_orientation(content_info, "youtube") == "vertical"
+
+
+def test_get_video_orientation_horizontal():
+    content_info = {"formats": [{"aspect_ratio": 1.78}]}
+    assert get_video_orientation(content_info, "youtube") == "horizontal"
+
+
+def test_get_video_orientation_non_youtube():
+    assert get_video_orientation({}, "bilibili") == "horizontal"
+
+
+def test_get_video_orientation_missing_formats():
+    """Empty or missing formats should default to horizontal, not vertical."""
+    assert get_video_orientation({"formats": []}, "youtube") == "horizontal"
+    assert get_video_orientation({}, "youtube") == "horizontal"
+
+
+def test_get_video_orientation_audio_only_first():
+    """Should skip audio-only formats (no aspect_ratio) and use the first video format."""
+    content_info = {
+        "formats": [
+            {"format_id": "140", "acodec": "mp4a", "vcodec": "none"},  # audio-only, no aspect_ratio
+            {"format_id": "137", "aspect_ratio": 0.5, "vcodec": "avc1"},  # vertical video
+        ]
+    }
+    assert get_video_orientation(content_info, "youtube") == "vertical"
+
+
+def test_get_video_orientation_no_video_formats():
+    """All formats are audio-only (no aspect_ratio) — should default to horizontal."""
+    content_info = {
+        "formats": [
+            {"format_id": "140", "acodec": "mp4a", "vcodec": "none"},
+            {"format_id": "251", "acodec": "opus", "vcodec": "none"},
+        ]
+    }
+    assert get_video_orientation(content_info, "youtube") == "horizontal"
+
+
+def test_get_format_youtube_horizontal_hd():
+    fmt = get_format_for_orientation("youtube", "horizontal", hd=True)
+    assert "258" in fmt or "256" in fmt
+
+
+def test_get_format_youtube_vertical():
+    fmt = get_format_for_orientation("youtube", "vertical", hd=False)
+    assert "bv" in fmt
+
+
+def test_get_format_bilibili_non_hd():
+    fmt = get_format_for_orientation("bilibili", "horizontal", hd=False)
+    assert "480" in fmt
diff --git a/uv.lock b/uv.lock
index d5f412f..1eec7af 100644
--- a/uv.lock
+++ b/uv.lock
@@ -6,8 +6,10 @@ requires-python = "==3.12.*"
 members = [
     "fastfetchbot",
     "fastfetchbot-api",
+    "fastfetchbot-file-export",
     "fastfetchbot-shared",
     "fastfetchbot-telegram-bot",
+    "fastfetchbot-worker",
 ]
 
 [[package]]
@@ -142,6 +144,18 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/a0/48/77c0092f716c4bf9460dca44f5120f70b8f71f14a12f40d22551a7152719/aiosqlite-0.17.0-py3-none-any.whl", hash = "sha256:6c49dc6d3405929b1d08eeccc72306d3677503cc5e5e43771efc1e00232e8231", size = 15433, upload-time = "2021-02-22T01:01:07.698Z" },
 ]
 
+[[package]]
+name = "amqp"
+version = "5.3.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "vine" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/79/fc/ec94a357dfc6683d8c86f8b4cfa5416a4c36b28052ec8260c77aca96a443/amqp-5.3.1.tar.gz", hash = "sha256:cddc00c725449522023bad949f70fff7b48f0b1ade74d170a6f10ab044739432", size = 129013, upload-time = "2024-11-12T19:55:44.051Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/26/99/fc813cd978842c26c82534010ea849eee9ab3a13ea2b74e95cb9c99e747b/amqp-5.3.1-py3-none-any.whl", hash = "sha256:43b3319e1b4e7d1251833a93d672b4af1e40f3d632d479b98661a95f117880a2", size = 50944, upload-time = "2024-11-12T19:55:41.782Z" },
+]
+
 [[package]]
 name = "annotated-types"
 version = "0.7.0"
@@ -277,6 +291,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/1a/39/47f9197bdd44df24d67ac8893641e16f386c984a0619ef2ee4c51fbbc019/beautifulsoup4-4.14.3-py3-none-any.whl", hash = "sha256:0918bfe44902e6ad8d57732ba310582e98da931428d231a5ecb9e7c703a735bb", size = 107721, upload-time = "2025-11-30T15:08:24.087Z" },
 ]
 
+[[package]]
+name = "billiard"
+version = "4.2.4"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/58/23/b12ac0bcdfb7360d664f40a00b1bda139cbbbced012c34e375506dbd0143/billiard-4.2.4.tar.gz", hash = "sha256:55f542c371209e03cd5862299b74e52e4fbcba8250ba611ad94276b369b6a85f", size = 156537, upload-time = "2025-11-30T13:28:48.52Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/cb/87/8bab77b323f16d67be364031220069f79159117dd5e43eeb4be2fef1ac9b/billiard-4.2.4-py3-none-any.whl", hash = "sha256:525b42bdec68d2b983347ac312f892db930858495db601b5836ac24e6477cde5", size = 87070, upload-time = "2025-11-30T13:28:47.016Z" },
+]
+
 [[package]]
 name = "black"
 version = "25.12.0"
@@ -345,6 +368,22 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/1c/4e/bc1dcac9498859d5e353c9b153627a3752868a9d5f05ce8dedd81a2354ab/brotli-1.2.0-cp312-cp312-win_amd64.whl", hash = "sha256:b35c13ce241abdd44cb8ca70683f20c0c079728a36a996297adb5334adfc1c44", size = 369115, upload-time = "2025-11-05T18:38:33.765Z" },
 ]
 
+[[package]]
+name = "brotlicffi"
+version = "1.2.0.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "cffi" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/84/85/57c314a6b35336efbbdc13e5fc9ae13f6b60a0647cfa7c1221178ac6d8ae/brotlicffi-1.2.0.0.tar.gz", hash = "sha256:34345d8d1f9d534fcac2249e57a4c3c8801a33c9942ff9f8574f67a175e17adb", size = 476682, upload-time = "2025-11-21T18:17:57.334Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/e4/df/a72b284d8c7bef0ed5756b41c2eb7d0219a1dd6ac6762f1c7bdbc31ef3af/brotlicffi-1.2.0.0-cp38-abi3-macosx_11_0_arm64.whl", hash = "sha256:9458d08a7ccde8e3c0afedbf2c70a8263227a68dea5ab13590593f4c0a4fd5f4", size = 432340, upload-time = "2025-11-21T18:17:42.277Z" },
+    { url = "https://files.pythonhosted.org/packages/74/2b/cc55a2d1d6fb4f5d458fba44a3d3f91fb4320aa14145799fd3a996af0686/brotlicffi-1.2.0.0-cp38-abi3-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:84e3d0020cf1bd8b8131f4a07819edee9f283721566fe044a20ec792ca8fd8b7", size = 1534002, upload-time = "2025-11-21T18:17:43.746Z" },
+    { url = "https://files.pythonhosted.org/packages/e4/9c/d51486bf366fc7d6735f0e46b5b96ca58dc005b250263525a1eea3cd5d21/brotlicffi-1.2.0.0-cp38-abi3-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:33cfb408d0cff64cd50bef268c0fed397c46fbb53944aa37264148614a62e990", size = 1536547, upload-time = "2025-11-21T18:17:45.729Z" },
+    { url = "https://files.pythonhosted.org/packages/1b/37/293a9a0a7caf17e6e657668bebb92dfe730305999fe8c0e2703b8888789c/brotlicffi-1.2.0.0-cp38-abi3-win32.whl", hash = "sha256:23e5c912fdc6fd37143203820230374d24babd078fc054e18070a647118158f6", size = 343085, upload-time = "2025-11-21T18:17:48.887Z" },
+    { url = "https://files.pythonhosted.org/packages/07/6b/6e92009df3b8b7272f85a0992b306b61c34b7ea1c4776643746e61c380ac/brotlicffi-1.2.0.0-cp38-abi3-win_amd64.whl", hash = "sha256:f139a7cdfe4ae7859513067b736eb44d19fae1186f9e99370092f6915216451b", size = 378586, upload-time = "2025-11-21T18:17:50.531Z" },
+]
+
 [[package]]
 name = "cachetools"
 version = "5.5.2"
@@ -354,6 +393,43 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/72/76/20fa66124dbe6be5cafeb312ece67de6b61dd91a0247d1ea13db4ebb33c2/cachetools-5.5.2-py3-none-any.whl", hash = "sha256:d26a22bcc62eb95c3beabd9f1ee5e820d3d2704fe2967cbe350e20c8ffcd3f0a", size = 10080, upload-time = "2025-02-20T21:01:16.647Z" },
 ]
 
+[[package]]
+name = "celery"
+version = "5.6.2"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "billiard" },
+    { name = "click" },
+    { name = "click-didyoumean" },
+    { name = "click-plugins" },
+    { name = "click-repl" },
+    { name = "kombu" },
+    { name = "python-dateutil" },
+    { name = "tzlocal" },
+    { name = "vine" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/8f/9d/3d13596519cfa7207a6f9834f4b082554845eb3cd2684b5f8535d50c7c44/celery-5.6.2.tar.gz", hash = "sha256:4a8921c3fcf2ad76317d3b29020772103581ed2454c4c042cc55dcc43585009b", size = 1718802, upload-time = "2026-01-04T12:35:58.012Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/dd/bd/9ecd619e456ae4ba73b6583cc313f26152afae13e9a82ac4fe7f8856bfd1/celery-5.6.2-py3-none-any.whl", hash = "sha256:3ffafacbe056951b629c7abcf9064c4a2366de0bdfc9fdba421b97ebb68619a5", size = 445502, upload-time = "2026-01-04T12:35:55.894Z" },
+]
+
+[package.optional-dependencies]
+redis = [
+    { name = "kombu", extra = ["redis"] },
+]
+
+[[package]]
+name = "celery-types"
+version = "0.24.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/72/25/2276a1f00f8ab9fc88128c939333933a24db7df1d75aa57ecc27b7dd3a22/celery_types-0.24.0.tar.gz", hash = "sha256:c93fbcd0b04a9e9c2f55d5540aca4aa1ea4cc06a870c0c8dee5062fdd59663fe", size = 33148, upload-time = "2025-12-23T17:16:30.847Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/3a/7e/3252cba5f5c9a65a3f52a69734d8e51e023db8981022b503e8183cf0225e/celery_types-0.24.0-py3-none-any.whl", hash = "sha256:a21e04681e68719a208335e556a79909da4be9c5e0d6d2fd0dd4c5615954b3fd", size = 60473, upload-time = "2025-12-23T17:16:29.89Z" },
+]
+
 [[package]]
 name = "certifi"
 version = "2026.1.4"
@@ -423,6 +499,43 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/98/78/01c019cdb5d6498122777c1a43056ebb3ebfeef2076d9d026bfe15583b2b/click-8.3.1-py3-none-any.whl", hash = "sha256:981153a64e25f12d547d3426c367a4857371575ee7ad18df2a6183ab0545b2a6", size = 108274, upload-time = "2025-11-15T20:45:41.139Z" },
 ]
 
+[[package]]
+name = "click-didyoumean"
+version = "0.3.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "click" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/30/ce/217289b77c590ea1e7c24242d9ddd6e249e52c795ff10fac2c50062c48cb/click_didyoumean-0.3.1.tar.gz", hash = "sha256:4f82fdff0dbe64ef8ab2279bd6aa3f6a99c3b28c05aa09cbfc07c9d7fbb5a463", size = 3089, upload-time = "2024-03-24T08:22:07.499Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/1b/5b/974430b5ffdb7a4f1941d13d83c64a0395114503cc357c6b9ae4ce5047ed/click_didyoumean-0.3.1-py3-none-any.whl", hash = "sha256:5c4bb6007cfea5f2fd6583a2fb6701a22a41eb98957e63d0fac41c10e7c3117c", size = 3631, upload-time = "2024-03-24T08:22:06.356Z" },
+]
+
+[[package]]
+name = "click-plugins"
+version = "1.1.1.2"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "click" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/c3/a4/34847b59150da33690a36da3681d6bbc2ec14ee9a846bc30a6746e5984e4/click_plugins-1.1.1.2.tar.gz", hash = "sha256:d7af3984a99d243c131aa1a828331e7630f4a88a9741fd05c927b204bcf92261", size = 8343, upload-time = "2025-06-25T00:47:37.555Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/3d/9a/2abecb28ae875e39c8cad711eb1186d8d14eab564705325e77e4e6ab9ae5/click_plugins-1.1.1.2-py2.py3-none-any.whl", hash = "sha256:008d65743833ffc1f5417bf0e78e8d2c23aab04d9745ba817bd3e71b0feb6aa6", size = 11051, upload-time = "2025-06-25T00:47:36.731Z" },
+]
+
+[[package]]
+name = "click-repl"
+version = "0.3.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "click" },
+    { name = "prompt-toolkit" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/cb/a2/57f4ac79838cfae6912f997b4d1a64a858fb0c86d7fcaae6f7b58d267fca/click-repl-0.3.0.tar.gz", hash = "sha256:17849c23dba3d667247dc4defe1757fff98694e90fe37474f3feebb69ced26a9", size = 10449, upload-time = "2023-06-15T12:43:51.141Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/52/40/9d857001228658f0d59e97ebd4c346fe73e138c6de1bce61dc568a57c7f8/click_repl-0.3.0-py3-none-any.whl", hash = "sha256:fb7e06deb8da8de86180a33a9da97ac316751c094c6899382da7feeeeb51b812", size = 10289, upload-time = "2023-06-15T12:43:48.626Z" },
+]
+
 [[package]]
 name = "colorama"
 version = "0.4.6"
@@ -533,8 +646,10 @@ dependencies = [
     { name = "babel" },
     { name = "beanie" },
     { name = "beautifulsoup4" },
+    { name = "celery", extra = ["redis"] },
     { name = "fake-useragent" },
     { name = "fastapi" },
+    { name = "fastfetchbot-file-export" },
     { name = "fastfetchbot-shared" },
     { name = "firecrawl-py" },
     { name = "gunicorn" },
@@ -567,6 +682,7 @@ windows = [
 [package.dev-dependencies]
 dev = [
     { name = "black" },
+    { name = "celery-types" },
     { name = "pytest" },
     { name = "pytest-asyncio" },
 ]
@@ -580,8 +696,10 @@ requires-dist = [
     { name = "babel", specifier = ">=2.17.0,<3.0.0" },
     { name = "beanie", specifier = ">=1.29.0,<2.0.0" },
     { name = "beautifulsoup4", specifier = ">=4.13.4,<5.0.0" },
+    { name = "celery", extras = ["redis"], specifier = ">=5.4.0,<6.0.0" },
     { name = "fake-useragent", specifier = ">=1.5.1,<2.0.0" },
     { name = "fastapi", specifier = ">=0.115.12,<0.116.0" },
+    { name = "fastfetchbot-file-export", editable = "packages/file-export" },
     { name = "fastfetchbot-shared", editable = "packages/shared" },
     { name = "firecrawl-py", specifier = ">=4.13.0,<5.0.0" },
     { name = "gunicorn", specifier = ">=23.0.0,<24.0.0" },
@@ -611,6 +729,7 @@ provides-extras = ["windows"]
 [package.metadata.requires-dev]
 dev = [
     { name = "black", specifier = ">=25.1.0,<26.0.0" },
+    { name = "celery-types", specifier = ">=0.24.0" },
     { name = "pytest", specifier = ">=8.3.5,<9.0.0" },
     { name = "pytest-asyncio", specifier = ">=0.26.0,<0.27.0" },
 ]
@@ -625,6 +744,7 @@ dependencies = [
     { name = "atproto" },
     { name = "babel" },
     { name = "beanie" },
+    { name = "celery", extra = ["redis"] },
     { name = "fastapi" },
     { name = "fastfetchbot-shared" },
     { name = "firecrawl-py" },
@@ -651,6 +771,7 @@ requires-dist = [
     { name = "atproto", specifier = ">=0.0.61" },
     { name = "babel", specifier = ">=2.17.0" },
     { name = "beanie", specifier = ">=1.29.0" },
+    { name = "celery", extras = ["redis"], specifier = ">=5.4.0" },
     { name = "fastapi", specifier = ">=0.115.12" },
     { name = "fastfetchbot-shared", editable = "packages/shared" },
     { name = "firecrawl-py", specifier = ">=4.13.0" },
@@ -670,6 +791,27 @@ requires-dist = [
     { name = "zyte-api", specifier = ">=0.8.1" },
 ]
 
+[[package]]
+name = "fastfetchbot-file-export"
+version = "0.1.0"
+source = { editable = "packages/file-export" }
+dependencies = [
+    { name = "loguru" },
+    { name = "openai" },
+    { name = "pydub" },
+    { name = "weasyprint" },
+    { name = "yt-dlp", extra = ["default"] },
+]
+
+[package.metadata]
+requires-dist = [
+    { name = "loguru", specifier = ">=0.7.2" },
+    { name = "openai", specifier = ">=2.15.0" },
+    { name = "pydub", specifier = ">=0.25.1" },
+    { name = "weasyprint", specifier = ">=65.1" },
+    { name = "yt-dlp", extras = ["default"], specifier = ">=2026.2.4" },
+]
+
 [[package]]
 name = "fastfetchbot-shared"
 version = "0.1.0"
@@ -728,6 +870,23 @@ requires-dist = [
     { name = "uvicorn", specifier = ">=0.34.2" },
 ]
 
+[[package]]
+name = "fastfetchbot-worker"
+version = "0.1.0"
+source = { virtual = "apps/worker" }
+dependencies = [
+    { name = "celery", extra = ["redis"] },
+    { name = "fastfetchbot-file-export" },
+    { name = "fastfetchbot-shared" },
+]
+
+[package.metadata]
+requires-dist = [
+    { name = "celery", extras = ["redis"], specifier = ">=5.4.0" },
+    { name = "fastfetchbot-file-export", editable = "packages/file-export" },
+    { name = "fastfetchbot-shared", editable = "packages/shared" },
+]
+
 [[package]]
 name = "firecrawl-py"
 version = "4.15.1"
@@ -746,6 +905,30 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/88/0e/6353b31ab25948308f8756c51e6c7f6298951a082778a667edaec519e11d/firecrawl_py-4.15.1-py3-none-any.whl", hash = "sha256:0ae69c6800c4c182e995ab2eb3a9a5cd947e16d2b447c06b7bb086862af7e43b", size = 210827, upload-time = "2026-02-17T16:11:07.391Z" },
 ]
 
+[[package]]
+name = "fonttools"
+version = "4.61.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/ec/ca/cf17b88a8df95691275a3d77dc0a5ad9907f328ae53acbe6795da1b2f5ed/fonttools-4.61.1.tar.gz", hash = "sha256:6675329885c44657f826ef01d9e4fb33b9158e9d93c537d84ad8399539bc6f69", size = 3565756, upload-time = "2025-12-12T17:31:24.246Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/6f/16/7decaa24a1bd3a70c607b2e29f0adc6159f36a7e40eaba59846414765fd4/fonttools-4.61.1-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:f3cb4a569029b9f291f88aafc927dd53683757e640081ca8c412781ea144565e", size = 2851593, upload-time = "2025-12-12T17:30:04.225Z" },
+    { url = "https://files.pythonhosted.org/packages/94/98/3c4cb97c64713a8cf499b3245c3bf9a2b8fd16a3e375feff2aed78f96259/fonttools-4.61.1-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:41a7170d042e8c0024703ed13b71893519a1a6d6e18e933e3ec7507a2c26a4b2", size = 2400231, upload-time = "2025-12-12T17:30:06.47Z" },
+    { url = "https://files.pythonhosted.org/packages/b7/37/82dbef0f6342eb01f54bca073ac1498433d6ce71e50c3c3282b655733b31/fonttools-4.61.1-cp312-cp312-manylinux1_x86_64.manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:10d88e55330e092940584774ee5e8a6971b01fc2f4d3466a1d6c158230880796", size = 4954103, upload-time = "2025-12-12T17:30:08.432Z" },
+    { url = "https://files.pythonhosted.org/packages/6c/44/f3aeac0fa98e7ad527f479e161aca6c3a1e47bb6996b053d45226fe37bf2/fonttools-4.61.1-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:15acc09befd16a0fb8a8f62bc147e1a82817542d72184acca9ce6e0aeda9fa6d", size = 5004295, upload-time = "2025-12-12T17:30:10.56Z" },
+    { url = "https://files.pythonhosted.org/packages/14/e8/7424ced75473983b964d09f6747fa09f054a6d656f60e9ac9324cf40c743/fonttools-4.61.1-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:e6bcdf33aec38d16508ce61fd81838f24c83c90a1d1b8c68982857038673d6b8", size = 4944109, upload-time = "2025-12-12T17:30:12.874Z" },
+    { url = "https://files.pythonhosted.org/packages/c8/8b/6391b257fa3d0b553d73e778f953a2f0154292a7a7a085e2374b111e5410/fonttools-4.61.1-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:5fade934607a523614726119164ff621e8c30e8fa1ffffbbd358662056ba69f0", size = 5093598, upload-time = "2025-12-12T17:30:15.79Z" },
+    { url = "https://files.pythonhosted.org/packages/d9/71/fd2ea96cdc512d92da5678a1c98c267ddd4d8c5130b76d0f7a80f9a9fde8/fonttools-4.61.1-cp312-cp312-win32.whl", hash = "sha256:75da8f28eff26defba42c52986de97b22106cb8f26515b7c22443ebc9c2d3261", size = 2269060, upload-time = "2025-12-12T17:30:18.058Z" },
+    { url = "https://files.pythonhosted.org/packages/80/3b/a3e81b71aed5a688e89dfe0e2694b26b78c7d7f39a5ffd8a7d75f54a12a8/fonttools-4.61.1-cp312-cp312-win_amd64.whl", hash = "sha256:497c31ce314219888c0e2fce5ad9178ca83fe5230b01a5006726cdf3ac9f24d9", size = 2319078, upload-time = "2025-12-12T17:30:22.862Z" },
+    { url = "https://files.pythonhosted.org/packages/c7/4e/ce75a57ff3aebf6fc1f4e9d508b8e5810618a33d900ad6c19eb30b290b97/fonttools-4.61.1-py3-none-any.whl", hash = "sha256:17d2bf5d541add43822bcf0c43d7d847b160c9bb01d15d5007d84e2217aaa371", size = 1148996, upload-time = "2025-12-12T17:31:21.03Z" },
+]
+
+[package.optional-dependencies]
+woff = [
+    { name = "brotli", marker = "platform_python_implementation == 'CPython'" },
+    { name = "brotlicffi", marker = "platform_python_implementation != 'CPython'" },
+    { name = "zopfli" },
+]
+
 [[package]]
 name = "frozenlist"
 version = "1.8.0"
@@ -932,6 +1115,26 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/14/2f/967ba146e6d58cf6a652da73885f52fc68001525b4197effc174321d70b4/jmespath-1.1.0-py3-none-any.whl", hash = "sha256:a5663118de4908c91729bea0acadca56526eb2698e83de10cd116ae0f4e97c64", size = 20419, upload-time = "2026-01-22T16:35:24.919Z" },
 ]
 
+[[package]]
+name = "kombu"
+version = "5.6.2"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "amqp" },
+    { name = "packaging" },
+    { name = "tzdata" },
+    { name = "vine" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/b6/a5/607e533ed6c83ae1a696969b8e1c137dfebd5759a2e9682e26ff1b97740b/kombu-5.6.2.tar.gz", hash = "sha256:8060497058066c6f5aed7c26d7cd0d3b574990b09de842a8c5aaed0b92cc5a55", size = 472594, upload-time = "2025-12-29T20:30:07.779Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/fb/0f/834427d8c03ff1d7e867d3db3d176470c64871753252b21b4f4897d1fa45/kombu-5.6.2-py3-none-any.whl", hash = "sha256:efcfc559da324d41d61ca311b0c64965ea35b4c55cc04ee36e55386145dace93", size = 214219, upload-time = "2025-12-29T20:30:05.74Z" },
+]
+
+[package.optional-dependencies]
+redis = [
+    { name = "redis" },
+]
+
 [[package]]
 name = "lazy-model"
 version = "0.2.0"
@@ -1096,6 +1299,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/81/08/7036c080d7117f28a4af526d794aab6a84463126db031b007717c1a6676e/multidict-6.7.1-py3-none-any.whl", hash = "sha256:55d97cc6dae627efa6a6e548885712d4864b81110ac76fa4e534c03819fa4a56", size = 12319, upload-time = "2026-01-26T02:46:44.004Z" },
 ]
 
+[[package]]
+name = "mutagen"
+version = "1.47.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/81/e6/64bc71b74eef4b68e61eb921dcf72dabd9e4ec4af1e11891bbd312ccbb77/mutagen-1.47.0.tar.gz", hash = "sha256:719fadef0a978c31b4cf3c956261b3c58b6948b32023078a2117b1de09f0fc99", size = 1274186, upload-time = "2023-09-03T16:33:33.411Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/b0/7a/620f945b96be1f6ee357d211d5bf74ab1b7fe72a9f1525aafbfe3aee6875/mutagen-1.47.0-py3-none-any.whl", hash = "sha256:edd96f50c5907a9539d8e5bba7245f62c9f520aef333d13392a79a4f70aca719", size = 194391, upload-time = "2023-09-03T16:33:29.955Z" },
+]
+
 [[package]]
 name = "mypy-extensions"
 version = "1.1.0"
@@ -1242,6 +1454,18 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/54/20/4d324d65cc6d9205fabedc306948156824eb9f0ee1633355a8f7ec5c66bf/pluggy-1.6.0-py3-none-any.whl", hash = "sha256:e920276dd6813095e9377c0bc5566d94c932c33b27a3e3945d8389c374dd4746", size = 20538, upload-time = "2025-05-15T12:30:06.134Z" },
 ]
 
+[[package]]
+name = "prompt-toolkit"
+version = "3.0.52"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "wcwidth" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/a1/96/06e01a7b38dce6fe1db213e061a4602dd6032a8a97ef6c1a862537732421/prompt_toolkit-3.0.52.tar.gz", hash = "sha256:28cde192929c8e7321de85de1ddbe736f1375148b02f2e17edd840042b1be855", size = 434198, upload-time = "2025-08-27T15:24:02.057Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/84/03/0d3ce49e2505ae70cf43bc5bb3033955d2fc9f932163e84dc0779cc47f48/prompt_toolkit-3.0.52-py3-none-any.whl", hash = "sha256:9aac639a3bbd33284347de5ad8d68ecc044b91a762dc39b7c21095fcd6a19955", size = 391431, upload-time = "2025-08-27T15:23:59.498Z" },
+]
+
 [[package]]
 name = "propcache"
 version = "0.4.1"
@@ -1275,6 +1499,25 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/0c/c3/44f3fbbfa403ea2a7c779186dc20772604442dde72947e7d01069cbe98e3/pycparser-3.0-py3-none-any.whl", hash = "sha256:b727414169a36b7d524c1c3e31839a521725078d7b2ff038656844266160a992", size = 48172, upload-time = "2026-01-21T14:26:50.693Z" },
 ]
 
+[[package]]
+name = "pycryptodomex"
+version = "3.23.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/c9/85/e24bf90972a30b0fcd16c73009add1d7d7cd9140c2498a68252028899e41/pycryptodomex-3.23.0.tar.gz", hash = "sha256:71909758f010c82bc99b0abf4ea12012c98962fbf0583c2164f8b84533c2e4da", size = 4922157, upload-time = "2025-05-17T17:23:41.434Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/dd/9c/1a8f35daa39784ed8adf93a694e7e5dc15c23c741bbda06e1d45f8979e9e/pycryptodomex-3.23.0-cp37-abi3-macosx_10_9_universal2.whl", hash = "sha256:06698f957fe1ab229a99ba2defeeae1c09af185baa909a31a5d1f9d42b1aaed6", size = 2499240, upload-time = "2025-05-17T17:22:46.953Z" },
+    { url = "https://files.pythonhosted.org/packages/7a/62/f5221a191a97157d240cf6643747558759126c76ee92f29a3f4aee3197a5/pycryptodomex-3.23.0-cp37-abi3-macosx_10_9_x86_64.whl", hash = "sha256:b2c2537863eccef2d41061e82a881dcabb04944c5c06c5aa7110b577cc487545", size = 1644042, upload-time = "2025-05-17T17:22:49.098Z" },
+    { url = "https://files.pythonhosted.org/packages/8c/fd/5a054543c8988d4ed7b612721d7e78a4b9bf36bc3c5ad45ef45c22d0060e/pycryptodomex-3.23.0-cp37-abi3-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:43c446e2ba8df8889e0e16f02211c25b4934898384c1ec1ec04d7889c0333587", size = 2186227, upload-time = "2025-05-17T17:22:51.139Z" },
+    { url = "https://files.pythonhosted.org/packages/c8/a9/8862616a85cf450d2822dbd4fff1fcaba90877907a6ff5bc2672cafe42f8/pycryptodomex-3.23.0-cp37-abi3-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:f489c4765093fb60e2edafdf223397bc716491b2b69fe74367b70d6999257a5c", size = 2272578, upload-time = "2025-05-17T17:22:53.676Z" },
+    { url = "https://files.pythonhosted.org/packages/46/9f/bda9c49a7c1842820de674ab36c79f4fbeeee03f8ff0e4f3546c3889076b/pycryptodomex-3.23.0-cp37-abi3-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:bdc69d0d3d989a1029df0eed67cc5e8e5d968f3724f4519bd03e0ec68df7543c", size = 2312166, upload-time = "2025-05-17T17:22:56.585Z" },
+    { url = "https://files.pythonhosted.org/packages/03/cc/870b9bf8ca92866ca0186534801cf8d20554ad2a76ca959538041b7a7cf4/pycryptodomex-3.23.0-cp37-abi3-musllinux_1_2_aarch64.whl", hash = "sha256:6bbcb1dd0f646484939e142462d9e532482bc74475cecf9c4903d4e1cd21f003", size = 2185467, upload-time = "2025-05-17T17:22:59.237Z" },
+    { url = "https://files.pythonhosted.org/packages/96/e3/ce9348236d8e669fea5dd82a90e86be48b9c341210f44e25443162aba187/pycryptodomex-3.23.0-cp37-abi3-musllinux_1_2_i686.whl", hash = "sha256:8a4fcd42ccb04c31268d1efeecfccfd1249612b4de6374205376b8f280321744", size = 2346104, upload-time = "2025-05-17T17:23:02.112Z" },
+    { url = "https://files.pythonhosted.org/packages/a5/e9/e869bcee87beb89040263c416a8a50204f7f7a83ac11897646c9e71e0daf/pycryptodomex-3.23.0-cp37-abi3-musllinux_1_2_x86_64.whl", hash = "sha256:55ccbe27f049743a4caf4f4221b166560d3438d0b1e5ab929e07ae1702a4d6fd", size = 2271038, upload-time = "2025-05-17T17:23:04.872Z" },
+    { url = "https://files.pythonhosted.org/packages/8d/67/09ee8500dd22614af5fbaa51a4aee6e342b5fa8aecf0a6cb9cbf52fa6d45/pycryptodomex-3.23.0-cp37-abi3-win32.whl", hash = "sha256:189afbc87f0b9f158386bf051f720e20fa6145975f1e76369303d0f31d1a8d7c", size = 1771969, upload-time = "2025-05-17T17:23:07.115Z" },
+    { url = "https://files.pythonhosted.org/packages/69/96/11f36f71a865dd6df03716d33bd07a67e9d20f6b8d39820470b766af323c/pycryptodomex-3.23.0-cp37-abi3-win_amd64.whl", hash = "sha256:52e5ca58c3a0b0bd5e100a9fbc8015059b05cffc6c66ce9d98b4b45e023443b9", size = 1803124, upload-time = "2025-05-17T17:23:09.267Z" },
+    { url = "https://files.pythonhosted.org/packages/f9/93/45c1cdcbeb182ccd2e144c693eaa097763b08b38cded279f0053ed53c553/pycryptodomex-3.23.0-cp37-abi3-win_arm64.whl", hash = "sha256:02d87b80778c171445d67e23d1caef279bf4b25c3597050ccd2e13970b57fd51", size = 1707161, upload-time = "2025-05-17T17:23:11.414Z" },
+]
+
 [[package]]
 name = "pydantic"
 version = "2.12.5"
@@ -1328,6 +1571,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/a6/53/d78dc063216e62fc55f6b2eebb447f6a4b0a59f55c8406376f76bf959b08/pydub-0.25.1-py2.py3-none-any.whl", hash = "sha256:65617e33033874b59d87db603aa1ed450633288aefead953b30bded59cb599a6", size = 32327, upload-time = "2021-03-10T02:09:53.503Z" },
 ]
 
+[[package]]
+name = "pydyf"
+version = "0.12.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/36/ee/fb410c5c854b6a081a49077912a9765aeffd8e07cbb0663cfda310b01fb4/pydyf-0.12.1.tar.gz", hash = "sha256:fbd7e759541ac725c29c506612003de393249b94310ea78ae44cb1d04b220095", size = 17716, upload-time = "2025-12-02T14:52:14.244Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/22/11/47efe2f66ba848a107adfd490b508f5c0cedc82127950553dca44d29e6c4/pydyf-0.12.1-py3-none-any.whl", hash = "sha256:ea25b4e1fe7911195cb57067560daaa266639184e8335365cc3ee5214e7eaadc", size = 8028, upload-time = "2025-12-02T14:52:12.938Z" },
+]
+
 [[package]]
 name = "pyee"
 version = "13.0.1"
@@ -1413,6 +1665,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/68/77/38bd7744bb9e06d465b0c23879e6d2c187d93a383f8fa485c862822bb8a3/pypdf-6.7.1-py3-none-any.whl", hash = "sha256:a02ccbb06463f7c334ce1612e91b3e68a8e827f3cee100b9941771e6066b094e", size = 331048, upload-time = "2026-02-17T17:00:46.991Z" },
 ]
 
+[[package]]
+name = "pyphen"
+version = "0.17.2"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/69/56/e4d7e1bd70d997713649c5ce530b2d15a5fc2245a74ca820fc2d51d89d4d/pyphen-0.17.2.tar.gz", hash = "sha256:f60647a9c9b30ec6c59910097af82bc5dd2d36576b918e44148d8b07ef3b4aa3", size = 2079470, upload-time = "2025-01-20T13:18:36.296Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/7b/1f/c2142d2edf833a90728e5cdeb10bdbdc094dde8dbac078cee0cf33f5e11b/pyphen-0.17.2-py3-none-any.whl", hash = "sha256:3a07fb017cb2341e1d9ff31b8634efb1ae4dc4b130468c7c39dd3d32e7c3affd", size = 2079358, upload-time = "2025-01-20T13:18:29.629Z" },
+]
+
 [[package]]
 name = "pytest"
 version = "8.4.2"
@@ -1555,6 +1816,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/1a/08/67bd04656199bbb51dbed1439b7f27601dfb576fb864099c7ef0c3e55531/pyyaml-6.0.3-cp312-cp312-win_arm64.whl", hash = "sha256:64386e5e707d03a7e172c0701abfb7e10f0fb753ee1d773128192742712a98fd", size = 140344, upload-time = "2025-09-25T21:32:22.617Z" },
 ]
 
+[[package]]
+name = "redis"
+version = "6.4.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/0d/d6/e8b92798a5bd67d659d51a18170e91c16ac3b59738d91894651ee255ed49/redis-6.4.0.tar.gz", hash = "sha256:b01bc7282b8444e28ec36b261df5375183bb47a07eb9c603f284e89cbc5ef010", size = 4647399, upload-time = "2025-08-07T08:10:11.441Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/e8/02/89e2ed7e85db6c93dfa9e8f691c5087df4e3551ab39081a4d7c6d1f90e05/redis-6.4.0-py3-none-any.whl", hash = "sha256:f0544fa9604264e9464cdf4814e7d4830f74b165d52f2a330a760a88dd248b7f", size = 279847, upload-time = "2025-08-07T08:10:09.84Z" },
+]
+
 [[package]]
 name = "reportlab"
 version = "4.4.10"
@@ -1703,6 +1973,18 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/60/45/c7b5c3168458db837e8ceab06dc77824e18202679d0463f0e8f002143a97/tinycss2-1.5.1-py3-none-any.whl", hash = "sha256:3415ba0f5839c062696996998176c4a3751d18b7edaaeeb658c9ce21ec150661", size = 28404, upload-time = "2025-11-23T10:29:08.676Z" },
 ]
 
+[[package]]
+name = "tinyhtml5"
+version = "2.0.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "webencodings" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/fd/03/6111ed99e9bf7dfa1c30baeef0e0fb7e0bd387bd07f8e5b270776fe1de3f/tinyhtml5-2.0.0.tar.gz", hash = "sha256:086f998833da24c300c414d9fe81d9b368fd04cb9d2596a008421cbc705fcfcc", size = 179507, upload-time = "2024-10-29T15:37:14.078Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/5c/de/27c57899297163a4a84104d5cec0af3b1ac5faf62f44667e506373c6b8ce/tinyhtml5-2.0.0-py3-none-any.whl", hash = "sha256:13683277c5b176d070f82d099d977194b7a1e26815b016114f581a74bbfbf47e", size = 39793, upload-time = "2024-10-29T15:37:11.743Z" },
+]
+
 [[package]]
 name = "tqdm"
 version = "4.67.3"
@@ -1833,6 +2115,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/99/39/6b3f7d234ba3964c428a6e40006340f53ba37993f46ed6e111c6e9141d18/uvloop-0.22.1-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:512fec6815e2dd45161054592441ef76c830eddaad55c8aa30952e6fe1ed07c0", size = 4296343, upload-time = "2025-10-16T22:16:35.149Z" },
 ]
 
+[[package]]
+name = "vine"
+version = "5.1.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/bd/e4/d07b5f29d283596b9727dd5275ccbceb63c44a1a82aa9e4bfd20426762ac/vine-5.1.0.tar.gz", hash = "sha256:8b62e981d35c41049211cf62a0a1242d8c1ee9bd15bb196ce38aefd6799e61e0", size = 48980, upload-time = "2023-11-05T08:46:53.857Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/03/ff/7c0c86c43b3cbb927e0ccc0255cb4057ceba4799cd44ae95174ce8e8b5b2/vine-5.1.0-py3-none-any.whl", hash = "sha256:40fdf3c48b2cfe1c38a49e9ae2da6fda88e4794c810050a728bd7413811fb1dc", size = 9636, upload-time = "2023-11-05T08:46:51.205Z" },
+]
+
 [[package]]
 name = "w3lib"
 version = "2.4.0"
@@ -1842,6 +2133,34 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/2e/f5/ce3ab627e0cb51591c9e3dc4b9b173f15d7f2bec1c0010420b15fc442940/w3lib-2.4.0-py3-none-any.whl", hash = "sha256:260b5a22aeb86ae73213857f69ed20829a45150f8d5b12050b1f02ada414db79", size = 21603, upload-time = "2026-01-29T07:05:05.841Z" },
 ]
 
+[[package]]
+name = "wcwidth"
+version = "0.6.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/35/a2/8e3becb46433538a38726c948d3399905a4c7cabd0df578ede5dc51f0ec2/wcwidth-0.6.0.tar.gz", hash = "sha256:cdc4e4262d6ef9a1a57e018384cbeb1208d8abbc64176027e2c2455c81313159", size = 159684, upload-time = "2026-02-06T19:19:40.919Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/68/5a/199c59e0a824a3db2b89c5d2dade7ab5f9624dbf6448dc291b46d5ec94d3/wcwidth-0.6.0-py3-none-any.whl", hash = "sha256:1a3a1e510b553315f8e146c54764f4fb6264ffad731b3d78088cdb1478ffbdad", size = 94189, upload-time = "2026-02-06T19:19:39.646Z" },
+]
+
+[[package]]
+name = "weasyprint"
+version = "68.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "cffi" },
+    { name = "cssselect2" },
+    { name = "fonttools", extra = ["woff"] },
+    { name = "pillow" },
+    { name = "pydyf" },
+    { name = "pyphen" },
+    { name = "tinycss2" },
+    { name = "tinyhtml5" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/db/3e/65c0f176e6fb5c2b0a1ac13185b366f727d9723541babfa7fa4309998169/weasyprint-68.1.tar.gz", hash = "sha256:d3b752049b453a5c95edb27ce78d69e9319af5a34f257fa0f4c738c701b4184e", size = 1542379, upload-time = "2026-02-06T15:04:11.203Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/dd/dd/14eb73cea481ad8162d3b18a4850d4a84d6e804a22840cca207648532265/weasyprint-68.1-py3-none-any.whl", hash = "sha256:4dc3ba63c68bbbce3e9617cb2226251c372f5ee90a8a484503b1c099da9cf5be", size = 319789, upload-time = "2026-02-06T15:04:09.189Z" },
+]
+
 [[package]]
 name = "webencodings"
 version = "0.5.1"
@@ -1949,6 +2268,52 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/73/ae/b48f95715333080afb75a4504487cbe142cae1268afc482d06692d605ae6/yarl-1.22.0-py3-none-any.whl", hash = "sha256:1380560bdba02b6b6c90de54133c81c9f2a453dee9912fe58c1dcced1edb7cff", size = 46814, upload-time = "2025-10-06T14:12:53.872Z" },
 ]
 
+[[package]]
+name = "yt-dlp"
+version = "2026.2.4"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/16/be/8e099f3f34bac6851490525fb1a8b62d525a95fcb5af082e8c52ba884fb5/yt_dlp-2026.2.4.tar.gz", hash = "sha256:24733ef081116f29d8ee6eae7a48127101e6c56eb7aa228dd604a60654760022", size = 3100305, upload-time = "2026-02-04T00:49:27.043Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/96/38/b17cbeaf6712a4c1b97f7f9ec3a55f3a8ddee678cc88742af47dca0315b7/yt_dlp-2026.2.4-py3-none-any.whl", hash = "sha256:d6ea83257e8127a0097b1d37ee36201f99a292067e4616b2e5d51ab153b3dbb9", size = 3299165, upload-time = "2026-02-04T00:49:25.31Z" },
+]
+
+[package.optional-dependencies]
+default = [
+    { name = "brotli", marker = "implementation_name == 'cpython'" },
+    { name = "brotlicffi", marker = "implementation_name != 'cpython'" },
+    { name = "certifi" },
+    { name = "mutagen" },
+    { name = "pycryptodomex" },
+    { name = "requests" },
+    { name = "urllib3" },
+    { name = "websockets" },
+    { name = "yt-dlp-ejs" },
+]
+
+[[package]]
+name = "yt-dlp-ejs"
+version = "0.4.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/e9/80/4b6c7f91b373e01cdc18080f41fa399592945abce7db74c2e6d0fb8468db/yt_dlp_ejs-0.4.0.tar.gz", hash = "sha256:3c67e0beb6f9f3603fbcb56f425eabaa37c52243d90d20ccbcce1dd941cfbd07", size = 96768, upload-time = "2026-01-29T16:25:59.964Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/a4/90/8911146822364666be47f184c4180cec20fcc537a268ef40d1ab077dd25b/yt_dlp_ejs-0.4.0-py3-none-any.whl", hash = "sha256:19278cff397b243074df46342bb7616c404296aeaff01986b62b4e21823b0b9c", size = 53600, upload-time = "2026-01-29T16:25:57.87Z" },
+]
+
+[[package]]
+name = "zopfli"
+version = "0.4.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/0a/4d/a8cc1768b2eda3c0c7470bf8059dcb94ef96d45dd91fc6edd29430d44072/zopfli-0.4.1.tar.gz", hash = "sha256:07a5cdc5d1aaa6c288c5d9f5a5383042ba743641abf8e2fd898dcad622d8a38e", size = 179001, upload-time = "2026-02-13T14:17:27.156Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/e1/2f/1a7082e9163ae3703b27d571720bf3c954a02a9cf1fdce47c51e70639256/zopfli-0.4.1-cp310-abi3-macosx_10_9_universal2.whl", hash = "sha256:4238d4d746d1095e29c9125490985e0c12ffd3654f54a24af551e2391e936d54", size = 291570, upload-time = "2026-02-13T14:17:12.556Z" },
+    { url = "https://files.pythonhosted.org/packages/dd/6f/4a1a88edf9fa0ce102703f38ab4dfb285b7cd2dde5389184264ec759e06e/zopfli-0.4.1-cp310-abi3-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:fdfb7ce9f5de37a5b2f75dd2642fd7717956ef2a72e0387302a36d382440db07", size = 829437, upload-time = "2026-02-13T14:17:14.431Z" },
+    { url = "https://files.pythonhosted.org/packages/e3/77/d231012ddcaac9d2e184bd7808e106a8a0048855912e2e1c902b3f383413/zopfli-0.4.1-cp310-abi3-manylinux_2_24_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:d7bcee1b189d64ec33d1e05cfa1b6a1268c29329c382f6ca1bd6245b04925c57", size = 818542, upload-time = "2026-02-13T14:17:16.353Z" },
+    { url = "https://files.pythonhosted.org/packages/0d/4e/9b23690c4ca14fbeae2a8f7f6b2006611bf4cd7d5bcb2d9e6c718bd4b0e9/zopfli-0.4.1-cp310-abi3-musllinux_1_2_aarch64.whl", hash = "sha256:27823dc1161a4031d1c25925fd45d9868ec0cbc7692341830a7dcfa25063662c", size = 1778034, upload-time = "2026-02-13T14:17:17.509Z" },
+    { url = "https://files.pythonhosted.org/packages/e3/1b/51f7c28d4cde639cac4f5d47ff615548c1d9809f43cbacdd66eba5cd679d/zopfli-0.4.1-cp310-abi3-musllinux_1_2_x86_64.whl", hash = "sha256:5a4c22b6161f47f5bd34637dbaee6735abd287cd64e0d1ce28ef1871bf625f4b", size = 1863957, upload-time = "2026-02-13T14:17:19.259Z" },
+    { url = "https://files.pythonhosted.org/packages/ae/4d/1ef17017d38eabe7ae28f18ef0f16d48966cc23a5657e4555fff61704539/zopfli-0.4.1-cp310-abi3-win32.whl", hash = "sha256:a899eca405662a23ae75054affa3517a060362eae1185d3d791c86a50153c4dd", size = 82314, upload-time = "2026-02-13T14:17:20.795Z" },
+    { url = "https://files.pythonhosted.org/packages/0f/94/806bc84b389c7d70051d7c9a0179cff52de8b9f8dc2fc25bcf0bca302986/zopfli-0.4.1-cp310-abi3-win_amd64.whl", hash = "sha256:84a31ba9edc921b1d3a4449929394a993888f32d70de3a3617800c428a947b9b", size = 102186, upload-time = "2026-02-13T14:17:21.622Z" },
+]
+
 [[package]]
 name = "zyte-api"
 version = "0.8.2"