# App Setup
# Comments are kept on their own lines: several dotenv parsers treat a
# trailing "# ..." (especially one with no space before the "#") as part of
# the value instead of as a comment.

# Set to 'development' or 'production' as required
NODE_ENV=production

# Replace with a secure JWT secret key
# NOTE(review): this value contains "$"; some env-file loaders interpolate
# "$name" in unquoted values - confirm your loader keeps it literal.
JWT_SECRET=a9Z$kLq7^f03GzNw!bP9dH4xV6sT2yXl3O8vR@uYq3

# Your PostgreSQL database name
DB_NAME=maxun
# PostgreSQL username
DB_USER=postgres
# PostgreSQL password
DB_PASSWORD=postgres
# Host for PostgreSQL in Docker
DB_HOST=postgres
# Port for PostgreSQL (default: 5432)
DB_PORT=5432

# Key for encrypting sensitive data (passwords and proxies)
ENCRYPTION_KEY=f4d5e6a7b8c9d0e1f23456789abcdef01234567890abcdef123456789abcdef0

# MinIO endpoint in Docker
MINIO_ENDPOINT=minio
# Port for MinIO (default: 9000)
MINIO_PORT=9000
# MinIO access key
MINIO_ACCESS_KEY=minio_access_key
# MinIO secret key
MINIO_SECRET_KEY=minio_secret_key

# Redis host in Docker
REDIS_HOST=redis
# Redis port (default: 6379)
REDIS_PORT=6379
# Backend URLs
# Comments sit above each variable so that no "# ..." text can end up inside
# the URL value.

# Internal URL for backend service
BACKEND_URL=http://192.168.0.197:5174
# URL used by frontend to connect to backend
VITE_BACKEND_URL=http://192.168.0.197:5174
# Optional Google OAuth settings for Google Sheet Integration
GOOGLE_CLIENT_ID=your_google_client_id
GOOGLE_CLIENT_SECRET=your_google_client_secret
GOOGLE_REDIRECT_URI=your_google_redirect_uri
# Telemetry Settings - Please keep it enabled. Keeping it enabled helps us
# understand how the product is used and assess the impact of any new changes.
MAXUN_TELEMETRY=true
# MinIO object-storage service.
minio:
  image: minio/minio
  container_name: maxun-minio
  environment:
    # Root credentials are substituted from the MINIO_* variables.
    MINIO_ROOT_USER: ${MINIO_ACCESS_KEY}
    MINIO_ROOT_PASSWORD: ${MINIO_SECRET_KEY}
  # ":9001" is quoted so the leading colon is passed through as one argument.
  command: server /data --console-address ":9001"
  # ports:
  #   - "9000:9000"  # API port
  #   - "9001:9001"  # WebUI port
  volumes:
    - ./mdata:/data
# Maxun backend service.
backend:
  image: getmaxun/maxun-backend:v0.0.2
  container_name: maxun-backend
  # ports:
  #   - "8750:8080"
  env_file: env.txt
  environment:
    # to ensure Playwright works in Docker
    PLAYWRIGHT_BROWSERS_PATH: /ms-playwright
    # Quoted so the value stays a string rather than a YAML integer.
    PLAYWRIGHT_SKIP_BROWSER_DOWNLOAD: "0"
    # DEBUG: pw:api
    # PWDEBUG: 1  # Enables debugging
    CHROMIUM_FLAGS: '--disable-gpu --no-sandbox --headless=new'
  security_opt:
    - seccomp=unconfined  # This might help with browser sandbox issues
  # Increase shared memory size for Chromium
  shm_size: '2gb'
  mem_limit: 2g  # Set a 2GB memory limit
  depends_on:
    - postgres
    - redis
    - minio
  volumes:
    - ./server:/app/server  # Mount server source code for hot reloading
    - ./maxun-core:/app/maxun-core  # Mount maxun-core for any shared code updates
    - /var/run/dbus:/var/run/dbus
# Maxun frontend service.
frontend:
  image: getmaxun/maxun-frontend:v0.0.1
  container_name: maxun-frontend
  # ports:
  #   - "5173:5173"
  env_file: env.txt
  volumes:
    - ./:/app  # Mount entire frontend app directory for hot reloading
    - /app/node_modules  # Anonymous volume to prevent overwriting node_modules
  depends_on:
    - backend
Playwright 是一个由 Microsoft 开发的用于浏览器测试和网页抓取的开源自动化库。它于 2020 年推出，功能类似于 Selenium、Pyppeteer 等，都可以驱动浏览器进行各种自动化操作。Playwright 提供了使用单个 API 在 Chromium、Firefox 和 WebKit 中自动执行浏览器任务的能力。
接下来可以在界面上选择元素，具体使用方法可以参考官方的视频。
参考文档
getmaxun/maxun: Free, open-source no-code web data extraction platform. Build custom robots to automate data scraping [In Beta] 地址：https://github.com/getmaxun/maxun