feat(*):增加了一些模型

2025-03-27 21:19:43 +08:00
parent a55bb3a448
commit a513dd8a91
62 changed files with 2420 additions and 109 deletions
--- a/.gitignore
+++ b/.gitignore
@@ -0,0 +1 @@
+open-webui/data
--- a/anythinllm/.version
+++ b/anythinllm/.version
@@ -1 +0,0 @@
-v25.03.17
--- a/chattts/.env
+++ b/chattts/.env
@@ -1 +0,0 @@
-CUDA_VISIBLE_DEVICES=0,1
--- a/chattts/.version
+++ b/chattts/.version
@@ -1 +0,0 @@
-v25.03.17
--- a/chattts/compose.yaml
+++ b/chattts/compose.yaml
@@ -1,11 +1,10 @@
 version: "3.8"
 services:
  lenml-chattts-forge:
-    image: docker.citory.tech/public/lenml-chattts-forge
+    image: docker.citory.tech/public/lenml-chattts-forge:latest
    container_name: lenml-chattts-forge
    ports:
      - 10583:7860
-    env_file: .env
    deploy:
      resources:
        reservations:
--- a/cloudflared/.env
+++ b/cloudflared/.env
--- a/cloudflared/compose.yaml
+++ b/cloudflared/compose.yaml
@@ -0,0 +1,8 @@
+version: '3.8'
+
+services:
+  cloudflared-tunnel:
+    image: docker.citory.tech/public/cloudflared:latest
+    container_name: cloudflared-tunnel
+    command: tunnel --no-autoupdate run --token eyJhIjoiYjZiYjdkZDFkYjA1NDExOGRjODNlMjJiYzJhNGIwZmYiLCJ0IjoiYTI0YTViYmYtYWU0MC00N2M4LWI0NTktYjRjMjlkMWVlMWFkIiwicyI6Ik1URmtabUprWWpBdE9UZzBZUzAwWm1FekxUZ3laVFF0TUdJM1pqSXhOVEUyTldGaCJ9
+    restart: unless-stopped
--- a/comfyui/.version
+++ b/comfyui/.version
@@ -1 +0,0 @@
-v25.03.17
--- a/deepgeek-os/.env
+++ b/deepgeek-os/.env
@@ -0,0 +1,16 @@
+# 数据库配置
+DATABASE_URL=postgresql://deepgeek:deepgeek@deepgeek-os-login-db:5432/deepgeek_db
+
+# JWT配置
+SECRET_KEY=RnlnkjsdyoIr8rlM2b8bkqyOhoyQ1DF2
+
+# 微信配置
+# 城室科技登录中心
+WECHAT_APP_ID=wx323cef66ee834caa
+WECHAT_APP_SECRET=bf106302b080a1533aaa760b632d2dc5
+# 激活码配置
+ACTIVATION_CODE_LENGTH=16 
+
+# API文档认证配置
+DOCS_USERNAME=deepgeek
+DOCS_SECRET=citorytech
--- a/deepgeek-os/compose.yaml
+++ b/deepgeek-os/compose.yaml
@@ -0,0 +1,59 @@
+services:
+  # 桌面系统主容器
+  deepgeek-os:
+    image: docker.citory.tech/public/deepgeek-os:latest
+    container_name: deepgeek-os
+    ports:
+      - 10500:4000
+    environment:
+      - NODE_ENV=production
+      - VITE_SSO_ENDPOINT=http://deepgeek-os-login:8000
+      - VITE_SYSINFO_ENDPOINT=http://host.docker.internal:1635
+      - VITE_LLM_ENDPOINT=http://host.docker.internal:10580
+      - VITE_GITEA_ENDPOINT=https://git.citory.tech/api/v1
+      - VITE_WECHAT_REDIRECT_URI=https%3A%2F%2Fdesktop.deepgeek.tech%2Fcallback
+      - VITE_WECHAT_APPID=wx323cef66ee834caa
+    networks:
+      - deepgeek_network
+    depends_on:
+      - deepgeek-os-login
+    extra_hosts:
+      - host.docker.internal:host-gateway
+    restart: unless-stopped
+  # 桌面系统登录容器
+  deepgeek-os-login:
+    image: docker.citory.tech/public/deepgeek-os-login:1.0.3
+    container_name: deepgeek-os-login
+    ports:
+      - 10520:8000
+    environment:
+      - DATABASE_URL=postgresql://deepgeek:deepgeek@deepgeek-os-login-db:5432/deepgeek_db
+      - SECRET_KEY=RnlnkjsdyoIr8rlM2b8bkqyOhoyQ1DF2
+      - WECHAT_APP_ID=wx323cef66ee834caa
+      - WECHAT_APP_SECRET=bf106302b080a1533aaa760b632d2dc5
+      - ACTIVATION_CODE_LENGTH=16
+      - DOCS_USERNAME=deepgeek
+      - DOCS_SECRET=citorytech
+    depends_on:
+      - deepgeek-os-login-db
+    networks:
+      - deepgeek_network
+    restart: unless-stopped
+  # 桌面系统登录数据库容器，用于存储桌面系统登录数据，生产环境不暴露端口
+  deepgeek-os-login-db:
+    image: docker.citory.tech/mirror/postgres:15-alpine
+    container_name: deepgeek-os-login-db
+    environment:
+      - POSTGRES_USER=deepgeek
+      - POSTGRES_PASSWORD=deepgeek
+      - POSTGRES_DB=deepgeek_db
+    volumes:
+      - /home/deepgeek/data/data_local/server/deepgeek-data/postgres-data:/var/lib/postgresql/data
+    ports:
+      - 8002:5432
+    networks:
+      - deepgeek_network
+    restart: unless-stopped
+networks:
+  deepgeek_network:
+    driver: bridge
--- a/dify/.env
+++ b/dify/.env
@@ -0,0 +1,994 @@
+# ------------------------------
+# Environment Variables for API service & worker
+# ------------------------------
+
+# ------------------------------
+# Common Variables
+# ------------------------------
+
+# The backend URL of the console API,
+# used to concatenate the authorization callback.
+# If empty, it is the same domain.
+# Example: https://api.console.dify.ai
+CONSOLE_API_URL=
+
+# The front-end URL of the console web,
+# used to concatenate some front-end addresses and for CORS configuration use.
+# If empty, it is the same domain.
+# Example: https://console.dify.ai
+CONSOLE_WEB_URL=
+
+# Service API Url,
+# used to display Service API Base Url to the front-end.
+# If empty, it is the same domain.
+# Example: https://api.dify.ai
+SERVICE_API_URL=
+
+# WebApp API backend Url,
+# used to declare the back-end URL for the front-end API.
+# If empty, it is the same domain.
+# Example: https://api.app.dify.ai
+APP_API_URL=
+
+# WebApp Url,
+# used to display WebAPP API Base Url to the front-end.
+# If empty, it is the same domain.
+# Example: https://app.dify.ai
+APP_WEB_URL=
+
+# File preview or download Url prefix.
+# used to display File preview or download Url to the front-end or as Multi-model inputs;
+# Url is signed and has expiration time.
+FILES_URL=
+
+# ------------------------------
+# Server Configuration
+# ------------------------------
+
+# The log level for the application.
+# Supported values are `DEBUG`, `INFO`, `WARNING`, `ERROR`, `CRITICAL`
+LOG_LEVEL=INFO
+# Log file path
+LOG_FILE=/app/logs/server.log
+# Log file max size, the unit is MB
+LOG_FILE_MAX_SIZE=20
+# Log file max backup count
+LOG_FILE_BACKUP_COUNT=5
+# Log dateformat
+LOG_DATEFORMAT=%Y-%m-%d %H:%M:%S
+# Log Timezone
+LOG_TZ=UTC
+
+# Debug mode, default is false.
+# It is recommended to turn on this configuration for local development
+# to prevent some problems caused by monkey patch.
+DEBUG=false
+
+# Flask debug mode, it can output trace information at the interface when turned on,
+# which is convenient for debugging.
+FLASK_DEBUG=false
+
+# A secretkey that is used for securely signing the session cookie
+# and encrypting sensitive information on the database.
+# You can generate a strong key using `openssl rand -base64 42`.
+SECRET_KEY=sk-9f73s3ljTXVcMT3Blb3ljTqtsKiGHXVcMT3BlbkFJLK7U
+
+# Password for admin user initialization.
+# If left unset, admin user will not be prompted for a password
+# when creating the initial admin account. 
+# The length of the password cannot exceed 30 charactors.
+INIT_PASSWORD=
+
+# Deployment environment.
+# Supported values are `PRODUCTION`, `TESTING`. Default is `PRODUCTION`.
+# Testing environment. There will be a distinct color label on the front-end page,
+# indicating that this environment is a testing environment.
+DEPLOY_ENV=PRODUCTION
+
+# Whether to enable the version check policy.
+# If set to empty, https://updates.dify.ai will be called for version check.
+CHECK_UPDATE_URL=https://updates.dify.ai
+
+# Used to change the OpenAI base address, default is https://api.openai.com/v1.
+# When OpenAI cannot be accessed in China, replace it with a domestic mirror address,
+# or when a local model provides OpenAI compatible API, it can be replaced.
+OPENAI_API_BASE=https://api.openai.com/v1
+
+# When enabled, migrations will be executed prior to application startup
+# and the application will start after the migrations have completed.
+MIGRATION_ENABLED=true
+
+# File Access Time specifies a time interval in seconds for the file to be accessed.
+# The default value is 300 seconds.
+FILES_ACCESS_TIMEOUT=300
+
+# Access token expiration time in minutes
+ACCESS_TOKEN_EXPIRE_MINUTES=60
+
+# Refresh token expiration time in days
+REFRESH_TOKEN_EXPIRE_DAYS=30
+
+# The maximum number of active requests for the application, where 0 means unlimited, should be a non-negative integer.
+APP_MAX_ACTIVE_REQUESTS=0
+APP_MAX_EXECUTION_TIME=1200
+
+# ------------------------------
+# Container Startup Related Configuration
+# Only effective when starting with docker image or docker-compose.
+# ------------------------------
+
+# API service binding address, default: 0.0.0.0, i.e., all addresses can be accessed.
+DIFY_BIND_ADDRESS=0.0.0.0
+
+# API service binding port number, default 5001.
+DIFY_PORT=5001
+
+# The number of API server workers, i.e., the number of workers.
+# Formula: number of cpu cores x 2 + 1 for sync, 1 for Gevent
+# Reference: https://docs.gunicorn.org/en/stable/design.html#how-many-workers
+SERVER_WORKER_AMOUNT=1
+
+# Defaults to gevent. If using windows, it can be switched to sync or solo.
+SERVER_WORKER_CLASS=gevent
+
+# Default number of worker connections, the default is 10.
+SERVER_WORKER_CONNECTIONS=10
+
+# Similar to SERVER_WORKER_CLASS.
+# If using windows, it can be switched to sync or solo.
+CELERY_WORKER_CLASS=
+
+# Request handling timeout. The default is 200,
+# it is recommended to set it to 360 to support a longer sse connection time.
+GUNICORN_TIMEOUT=360
+
+# The number of Celery workers. The default is 1, and can be set as needed.
+CELERY_WORKER_AMOUNT=
+
+# Flag indicating whether to enable autoscaling of Celery workers.
+#
+# Autoscaling is useful when tasks are CPU intensive and can be dynamically
+# allocated and deallocated based on the workload.
+#
+# When autoscaling is enabled, the maximum and minimum number of workers can
+# be specified. The autoscaling algorithm will dynamically adjust the number
+# of workers within the specified range.
+#
+# Default is false (i.e., autoscaling is disabled).
+#
+# Example:
+# CELERY_AUTO_SCALE=true
+CELERY_AUTO_SCALE=false
+
+# The maximum number of Celery workers that can be autoscaled.
+# This is optional and only used when autoscaling is enabled.
+# Default is not set.
+CELERY_MAX_WORKERS=
+
+# The minimum number of Celery workers that can be autoscaled.
+# This is optional and only used when autoscaling is enabled.
+# Default is not set.
+CELERY_MIN_WORKERS=
+
+# API Tool configuration
+API_TOOL_DEFAULT_CONNECT_TIMEOUT=10
+API_TOOL_DEFAULT_READ_TIMEOUT=60
+
+
+# ------------------------------
+# Database Configuration
+# The database uses PostgreSQL. Please use the public schema.
+# It is consistent with the configuration in the 'db' service below.
+# ------------------------------
+
+DB_USERNAME=postgres
+DB_PASSWORD=difyai123456
+DB_HOST=db
+DB_PORT=5432
+DB_DATABASE=dify
+# The size of the database connection pool.
+# The default is 30 connections, which can be appropriately increased.
+SQLALCHEMY_POOL_SIZE=30
+# Database connection pool recycling time, the default is 3600 seconds.
+SQLALCHEMY_POOL_RECYCLE=3600
+# Whether to print SQL, default is false.
+SQLALCHEMY_ECHO=false
+
+# Maximum number of connections to the database
+# Default is 100
+#
+# Reference: https://www.postgresql.org/docs/current/runtime-config-connection.html#GUC-MAX-CONNECTIONS
+POSTGRES_MAX_CONNECTIONS=100
+
+# Sets the amount of shared memory used for postgres's shared buffers.
+# Default is 128MB
+# Recommended value: 25% of available memory
+# Reference: https://www.postgresql.org/docs/current/runtime-config-resource.html#GUC-SHARED-BUFFERS
+POSTGRES_SHARED_BUFFERS=128MB
+
+# Sets the amount of memory used by each database worker for working space.
+# Default is 4MB
+#
+# Reference: https://www.postgresql.org/docs/current/runtime-config-resource.html#GUC-WORK-MEM
+POSTGRES_WORK_MEM=4MB
+
+# Sets the amount of memory reserved for maintenance activities.
+# Default is 64MB
+#
+# Reference: https://www.postgresql.org/docs/current/runtime-config-resource.html#GUC-MAINTENANCE-WORK-MEM
+POSTGRES_MAINTENANCE_WORK_MEM=64MB
+
+# Sets the planner's assumption about the effective cache size.
+# Default is 4096MB
+#
+# Reference: https://www.postgresql.org/docs/current/runtime-config-query.html#GUC-EFFECTIVE-CACHE-SIZE
+POSTGRES_EFFECTIVE_CACHE_SIZE=4096MB
+
+# ------------------------------
+# Redis Configuration
+# This Redis configuration is used for caching and for pub/sub during conversation.
+# ------------------------------
+
+REDIS_HOST=redis
+REDIS_PORT=6379
+REDIS_USERNAME=
+REDIS_PASSWORD=difyai123456
+REDIS_USE_SSL=false
+REDIS_DB=0
+
+# Whether to use Redis Sentinel mode.
+# If set to true, the application will automatically discover and connect to the master node through Sentinel.
+REDIS_USE_SENTINEL=false
+
+# List of Redis Sentinel nodes. If Sentinel mode is enabled, provide at least one Sentinel IP and port.
+# Format: `<sentinel1_ip>:<sentinel1_port>,<sentinel2_ip>:<sentinel2_port>,<sentinel3_ip>:<sentinel3_port>`
+REDIS_SENTINELS=
+REDIS_SENTINEL_SERVICE_NAME=
+REDIS_SENTINEL_USERNAME=
+REDIS_SENTINEL_PASSWORD=
+REDIS_SENTINEL_SOCKET_TIMEOUT=0.1
+
+# List of Redis Cluster nodes. If Cluster mode is enabled, provide at least one Cluster IP and port.
+# Format: `<Cluster1_ip>:<Cluster1_port>,<Cluster2_ip>:<Cluster2_port>,<Cluster3_ip>:<Cluster3_port>`
+REDIS_USE_CLUSTERS=false
+REDIS_CLUSTERS=
+REDIS_CLUSTERS_PASSWORD=
+
+# ------------------------------
+# Celery Configuration
+# ------------------------------
+
+# Use redis as the broker, and redis db 1 for celery broker.
+# Format as follows: `redis://<redis_username>:<redis_password>@<redis_host>:<redis_port>/<redis_database>`
+# Example: redis://:difyai123456@redis:6379/1
+# If use Redis Sentinel, format as follows: `sentinel://<sentinel_username>:<sentinel_password>@<sentinel_host>:<sentinel_port>/<redis_database>`
+# Example: sentinel://localhost:26379/1;sentinel://localhost:26380/1;sentinel://localhost:26381/1
+CELERY_BROKER_URL=redis://:difyai123456@redis:6379/1
+BROKER_USE_SSL=false
+
+# If you are using Redis Sentinel for high availability, configure the following settings.
+CELERY_USE_SENTINEL=false
+CELERY_SENTINEL_MASTER_NAME=
+CELERY_SENTINEL_SOCKET_TIMEOUT=0.1
+
+# ------------------------------
+# CORS Configuration
+# Used to set the front-end cross-domain access policy.
+# ------------------------------
+
+# Specifies the allowed origins for cross-origin requests to the Web API,
+# e.g. https://dify.app or * for all origins.
+WEB_API_CORS_ALLOW_ORIGINS=*
+
+# Specifies the allowed origins for cross-origin requests to the console API,
+# e.g. https://cloud.dify.ai or * for all origins.
+CONSOLE_CORS_ALLOW_ORIGINS=*
+
+# ------------------------------
+# File Storage Configuration
+# ------------------------------
+
+# The type of storage to use for storing user files.
+STORAGE_TYPE=opendal
+
+# Apache OpenDAL Configuration
+# The configuration for OpenDAL consists of the following format: OPENDAL_<SCHEME_NAME>_<CONFIG_NAME>.
+# You can find all the service configurations (CONFIG_NAME) in the repository at: https://github.com/apache/opendal/tree/main/core/src/services.
+# Dify will scan configurations starting with OPENDAL_<SCHEME_NAME> and automatically apply them.
+# The scheme name for the OpenDAL storage.
+OPENDAL_SCHEME=fs
+# Configurations for OpenDAL Local File System.
+OPENDAL_FS_ROOT=storage
+
+# S3 Configuration
+#
+S3_ENDPOINT=
+S3_REGION=us-east-1
+S3_BUCKET_NAME=difyai
+S3_ACCESS_KEY=
+S3_SECRET_KEY=
+# Whether to use AWS managed IAM roles for authenticating with the S3 service.
+# If set to false, the access key and secret key must be provided.
+S3_USE_AWS_MANAGED_IAM=false
+
+# Azure Blob Configuration
+#
+AZURE_BLOB_ACCOUNT_NAME=difyai
+AZURE_BLOB_ACCOUNT_KEY=difyai
+AZURE_BLOB_CONTAINER_NAME=difyai-container
+AZURE_BLOB_ACCOUNT_URL=https://<your_account_name>.blob.core.windows.net
+
+# Google Storage Configuration
+#
+GOOGLE_STORAGE_BUCKET_NAME=your-bucket-name
+GOOGLE_STORAGE_SERVICE_ACCOUNT_JSON_BASE64=
+
+# The Alibaba Cloud OSS configurations,
+#
+ALIYUN_OSS_BUCKET_NAME=your-bucket-name
+ALIYUN_OSS_ACCESS_KEY=your-access-key
+ALIYUN_OSS_SECRET_KEY=your-secret-key
+ALIYUN_OSS_ENDPOINT=https://oss-ap-southeast-1-internal.aliyuncs.com
+ALIYUN_OSS_REGION=ap-southeast-1
+ALIYUN_OSS_AUTH_VERSION=v4
+# Don't start with '/'. OSS doesn't support leading slash in object names.
+ALIYUN_OSS_PATH=your-path
+
+# Tencent COS Configuration
+#
+TENCENT_COS_BUCKET_NAME=your-bucket-name
+TENCENT_COS_SECRET_KEY=your-secret-key
+TENCENT_COS_SECRET_ID=your-secret-id
+TENCENT_COS_REGION=your-region
+TENCENT_COS_SCHEME=your-scheme
+
+# Oracle Storage Configuration
+#
+OCI_ENDPOINT=https://your-object-storage-namespace.compat.objectstorage.us-ashburn-1.oraclecloud.com
+OCI_BUCKET_NAME=your-bucket-name
+OCI_ACCESS_KEY=your-access-key
+OCI_SECRET_KEY=your-secret-key
+OCI_REGION=us-ashburn-1
+
+# Huawei OBS Configuration
+#
+HUAWEI_OBS_BUCKET_NAME=your-bucket-name
+HUAWEI_OBS_SECRET_KEY=your-secret-key
+HUAWEI_OBS_ACCESS_KEY=your-access-key
+HUAWEI_OBS_SERVER=your-server-url
+
+# Volcengine TOS Configuration
+#
+VOLCENGINE_TOS_BUCKET_NAME=your-bucket-name
+VOLCENGINE_TOS_SECRET_KEY=your-secret-key
+VOLCENGINE_TOS_ACCESS_KEY=your-access-key
+VOLCENGINE_TOS_ENDPOINT=your-server-url
+VOLCENGINE_TOS_REGION=your-region
+
+# Baidu OBS Storage Configuration
+#
+BAIDU_OBS_BUCKET_NAME=your-bucket-name
+BAIDU_OBS_SECRET_KEY=your-secret-key
+BAIDU_OBS_ACCESS_KEY=your-access-key
+BAIDU_OBS_ENDPOINT=your-server-url
+
+# Supabase Storage Configuration
+#
+SUPABASE_BUCKET_NAME=your-bucket-name
+SUPABASE_API_KEY=your-access-key
+SUPABASE_URL=your-server-url
+
+# ------------------------------
+# Vector Database Configuration
+# ------------------------------
+
+# The type of vector store to use.
+# Supported values are `weaviate`, `qdrant`, `milvus`, `myscale`, `relyt`, `pgvector`, `pgvecto-rs`, `chroma`, `opensearch`, `tidb_vector`, `oracle`, `tencent`, `elasticsearch`, `elasticsearch-ja`, `analyticdb`, `couchbase`, `vikingdb`, `oceanbase`, `opengauss`.
+VECTOR_STORE=weaviate
+
+# The Weaviate endpoint URL. Only available when VECTOR_STORE is `weaviate`.
+WEAVIATE_ENDPOINT=http://weaviate:8080
+WEAVIATE_API_KEY=WVF5YThaHlkYwhGUSmCRgsX3tD5ngdN8pkih
+
+# The Qdrant endpoint URL. Only available when VECTOR_STORE is `qdrant`.
+QDRANT_URL=http://qdrant:6333
+QDRANT_API_KEY=difyai123456
+QDRANT_CLIENT_TIMEOUT=20
+QDRANT_GRPC_ENABLED=false
+QDRANT_GRPC_PORT=6334
+
+# Milvus configuration. Only available when VECTOR_STORE is `milvus`.
+# The milvus uri.
+MILVUS_URI=http://host.docker.internal:19530
+MILVUS_TOKEN=
+MILVUS_USER=
+MILVUS_PASSWORD=
+MILVUS_ENABLE_HYBRID_SEARCH=False
+
+# MyScale configuration, only available when VECTOR_STORE is `myscale`
+# For multi-language support, please set MYSCALE_FTS_PARAMS with referring to:
+# https://myscale.com/docs/en/text-search/#understanding-fts-index-parameters
+MYSCALE_HOST=myscale
+MYSCALE_PORT=8123
+MYSCALE_USER=default
+MYSCALE_PASSWORD=
+MYSCALE_DATABASE=dify
+MYSCALE_FTS_PARAMS=
+
+# Couchbase configurations, only available when VECTOR_STORE is `couchbase`
+# The connection string must include hostname defined in the docker-compose file (couchbase-server in this case)
+COUCHBASE_CONNECTION_STRING=couchbase://couchbase-server
+COUCHBASE_USER=Administrator
+COUCHBASE_PASSWORD=password
+COUCHBASE_BUCKET_NAME=Embeddings
+COUCHBASE_SCOPE_NAME=_default
+
+# pgvector configurations, only available when VECTOR_STORE is `pgvector`
+PGVECTOR_HOST=pgvector
+PGVECTOR_PORT=5432
+PGVECTOR_USER=postgres
+PGVECTOR_PASSWORD=difyai123456
+PGVECTOR_DATABASE=dify
+PGVECTOR_MIN_CONNECTION=1
+PGVECTOR_MAX_CONNECTION=5
+PGVECTOR_PG_BIGM=false
+PGVECTOR_PG_BIGM_VERSION=1.2-20240606
+
+# pgvecto-rs configurations, only available when VECTOR_STORE is `pgvecto-rs`
+PGVECTO_RS_HOST=pgvecto-rs
+PGVECTO_RS_PORT=5432
+PGVECTO_RS_USER=postgres
+PGVECTO_RS_PASSWORD=difyai123456
+PGVECTO_RS_DATABASE=dify
+
+# analyticdb configurations, only available when VECTOR_STORE is `analyticdb`
+ANALYTICDB_KEY_ID=your-ak
+ANALYTICDB_KEY_SECRET=your-sk
+ANALYTICDB_REGION_ID=cn-hangzhou
+ANALYTICDB_INSTANCE_ID=gp-ab123456
+ANALYTICDB_ACCOUNT=testaccount
+ANALYTICDB_PASSWORD=testpassword
+ANALYTICDB_NAMESPACE=dify
+ANALYTICDB_NAMESPACE_PASSWORD=difypassword
+ANALYTICDB_HOST=gp-test.aliyuncs.com
+ANALYTICDB_PORT=5432
+ANALYTICDB_MIN_CONNECTION=1
+ANALYTICDB_MAX_CONNECTION=5
+
+# TiDB vector configurations, only available when VECTOR_STORE is `tidb`
+TIDB_VECTOR_HOST=tidb
+TIDB_VECTOR_PORT=4000
+TIDB_VECTOR_USER=
+TIDB_VECTOR_PASSWORD=
+TIDB_VECTOR_DATABASE=dify
+
+# Tidb on qdrant configuration, only available when VECTOR_STORE is `tidb_on_qdrant`
+TIDB_ON_QDRANT_URL=http://127.0.0.1
+TIDB_ON_QDRANT_API_KEY=dify
+TIDB_ON_QDRANT_CLIENT_TIMEOUT=20
+TIDB_ON_QDRANT_GRPC_ENABLED=false
+TIDB_ON_QDRANT_GRPC_PORT=6334
+TIDB_PUBLIC_KEY=dify
+TIDB_PRIVATE_KEY=dify
+TIDB_API_URL=http://127.0.0.1
+TIDB_IAM_API_URL=http://127.0.0.1
+TIDB_REGION=regions/aws-us-east-1
+TIDB_PROJECT_ID=dify
+TIDB_SPEND_LIMIT=100
+
+# Chroma configuration, only available when VECTOR_STORE is `chroma`
+CHROMA_HOST=127.0.0.1
+CHROMA_PORT=8000
+CHROMA_TENANT=default_tenant
+CHROMA_DATABASE=default_database
+CHROMA_AUTH_PROVIDER=chromadb.auth.token_authn.TokenAuthClientProvider
+CHROMA_AUTH_CREDENTIALS=
+
+# Oracle configuration, only available when VECTOR_STORE is `oracle`
+ORACLE_USER=dify
+ORACLE_PASSWORD=dify
+ORACLE_DSN=oracle:1521/FREEPDB1
+ORACLE_CONFIG_DIR=/app/api/storage/wallet
+ORACLE_WALLET_LOCATION=/app/api/storage/wallet
+ORACLE_WALLET_PASSWORD=dify
+ORACLE_IS_AUTONOMOUS=false
+
+# relyt configurations, only available when VECTOR_STORE is `relyt`
+RELYT_HOST=db
+RELYT_PORT=5432
+RELYT_USER=postgres
+RELYT_PASSWORD=difyai123456
+RELYT_DATABASE=postgres
+
+# open search configuration, only available when VECTOR_STORE is `opensearch`
+OPENSEARCH_HOST=opensearch
+OPENSEARCH_PORT=9200
+OPENSEARCH_USER=admin
+OPENSEARCH_PASSWORD=admin
+OPENSEARCH_SECURE=true
+
+# tencent vector configurations, only available when VECTOR_STORE is `tencent`
+TENCENT_VECTOR_DB_URL=http://127.0.0.1
+TENCENT_VECTOR_DB_API_KEY=dify
+TENCENT_VECTOR_DB_TIMEOUT=30
+TENCENT_VECTOR_DB_USERNAME=dify
+TENCENT_VECTOR_DB_DATABASE=dify
+TENCENT_VECTOR_DB_SHARD=1
+TENCENT_VECTOR_DB_REPLICAS=2
+
+# ElasticSearch configuration, only available when VECTOR_STORE is `elasticsearch`
+ELASTICSEARCH_HOST=0.0.0.0
+ELASTICSEARCH_PORT=9200
+ELASTICSEARCH_USERNAME=elastic
+ELASTICSEARCH_PASSWORD=elastic
+KIBANA_PORT=5601
+
+# baidu vector configurations, only available when VECTOR_STORE is `baidu`
+BAIDU_VECTOR_DB_ENDPOINT=http://127.0.0.1:5287
+BAIDU_VECTOR_DB_CONNECTION_TIMEOUT_MS=30000
+BAIDU_VECTOR_DB_ACCOUNT=root
+BAIDU_VECTOR_DB_API_KEY=dify
+BAIDU_VECTOR_DB_DATABASE=dify
+BAIDU_VECTOR_DB_SHARD=1
+BAIDU_VECTOR_DB_REPLICAS=3
+
+# VikingDB configurations, only available when VECTOR_STORE is `vikingdb`
+VIKINGDB_ACCESS_KEY=your-ak
+VIKINGDB_SECRET_KEY=your-sk
+VIKINGDB_REGION=cn-shanghai
+VIKINGDB_HOST=api-vikingdb.xxx.volces.com
+VIKINGDB_SCHEMA=http
+VIKINGDB_CONNECTION_TIMEOUT=30
+VIKINGDB_SOCKET_TIMEOUT=30
+
+# Lindorm configuration, only available when VECTOR_STORE is `lindorm`
+LINDORM_URL=http://lindorm:30070
+LINDORM_USERNAME=lindorm
+LINDORM_PASSWORD=lindorm
+
+# OceanBase Vector configuration, only available when VECTOR_STORE is `oceanbase`
+OCEANBASE_VECTOR_HOST=oceanbase
+OCEANBASE_VECTOR_PORT=2881
+OCEANBASE_VECTOR_USER=root@test
+OCEANBASE_VECTOR_PASSWORD=difyai123456
+OCEANBASE_VECTOR_DATABASE=test
+OCEANBASE_CLUSTER_NAME=difyai
+OCEANBASE_MEMORY_LIMIT=6G
+
+# opengauss configurations, only available when VECTOR_STORE is `opengauss`
+OPENGAUSS_HOST=opengauss
+OPENGAUSS_PORT=6600
+OPENGAUSS_USER=postgres
+OPENGAUSS_PASSWORD=Dify@123
+OPENGAUSS_DATABASE=dify
+OPENGAUSS_MIN_CONNECTION=1
+OPENGAUSS_MAX_CONNECTION=5
+
+# Upstash Vector configuration, only available when VECTOR_STORE is `upstash`
+UPSTASH_VECTOR_URL=https://xxx-vector.upstash.io
+UPSTASH_VECTOR_TOKEN=dify
+
+# ------------------------------
+# Knowledge Configuration
+# ------------------------------
+
+# Upload file size limit, default 15M.
+UPLOAD_FILE_SIZE_LIMIT=15
+
+# The maximum number of files that can be uploaded at a time, default 5.
+UPLOAD_FILE_BATCH_LIMIT=5
+
+# ETL type, support: `dify`, `Unstructured`
+# `dify` Dify's proprietary file extraction scheme
+# `Unstructured` Unstructured.io file extraction scheme
+ETL_TYPE=dify
+
+# Unstructured API path and API key, needs to be configured when ETL_TYPE is Unstructured
+# Or using Unstructured for document extractor node for pptx.
+# For example: http://unstructured:8000/general/v0/general
+UNSTRUCTURED_API_URL=
+UNSTRUCTURED_API_KEY=
+SCARF_NO_ANALYTICS=true
+
+# ------------------------------
+# Model Configuration
+# ------------------------------
+
+# The maximum number of tokens allowed for prompt generation.
+# This setting controls the upper limit of tokens that can be used by the LLM 
+# when generating a prompt in the prompt generation tool.
+# Default: 512 tokens.
+PROMPT_GENERATION_MAX_TOKENS=512
+
+# The maximum number of tokens allowed for code generation.
+# This setting controls the upper limit of tokens that can be used by the LLM 
+# when generating code in the code generation tool.
+# Default: 1024 tokens.
+CODE_GENERATION_MAX_TOKENS=1024
+
+# ------------------------------
+# Multi-modal Configuration
+# ------------------------------
+
+# The format of the image/video/audio/document sent when the multi-modal model is input,
+# the default is base64, optional url.
+# The delay of the call in url mode will be lower than that in base64 mode.
+# It is generally recommended to use the more compatible base64 mode.
+# If configured as url, you need to configure FILES_URL as an externally accessible address so that the multi-modal model can access the image/video/audio/document.
+MULTIMODAL_SEND_FORMAT=base64
+# Upload image file size limit, default 10M.
+UPLOAD_IMAGE_FILE_SIZE_LIMIT=10
+# Upload video file size limit, default 100M.
+UPLOAD_VIDEO_FILE_SIZE_LIMIT=100
+# Upload audio file size limit, default 50M.
+UPLOAD_AUDIO_FILE_SIZE_LIMIT=50
+
+# ------------------------------
+# Sentry Configuration
+# Used for application monitoring and error log tracking.
+# ------------------------------
+SENTRY_DSN=
+
+# API Service Sentry DSN address, default is empty, when empty,
+# all monitoring information is not reported to Sentry.
+# If not set, Sentry error reporting will be disabled.
+API_SENTRY_DSN=
+# API Service The reporting ratio of Sentry events, if it is 0.01, it is 1%.
+API_SENTRY_TRACES_SAMPLE_RATE=1.0
+# API Service The reporting ratio of Sentry profiles, if it is 0.01, it is 1%.
+API_SENTRY_PROFILES_SAMPLE_RATE=1.0
+
+# Web Service Sentry DSN address, default is empty, when empty,
+# all monitoring information is not reported to Sentry.
+# If not set, Sentry error reporting will be disabled.
+WEB_SENTRY_DSN=
+
+# ------------------------------
+# Notion Integration Configuration
+# Variables can be obtained by applying for Notion integration: https://www.notion.so/my-integrations
+# ------------------------------
+
+# Configure as "public" or "internal".
+# Since Notion's OAuth redirect URL only supports HTTPS,
+# if deploying locally, please use Notion's internal integration.
+NOTION_INTEGRATION_TYPE=public
+# Notion OAuth client secret (used for public integration type)
+NOTION_CLIENT_SECRET=
+# Notion OAuth client id (used for public integration type)
+NOTION_CLIENT_ID=
+# Notion internal integration secret.
+# If the value of NOTION_INTEGRATION_TYPE is "internal",
+# you need to configure this variable.
+NOTION_INTERNAL_SECRET=
+
+# ------------------------------
+# Mail related configuration
+# ------------------------------
+
+# Mail type, support: resend, smtp
+MAIL_TYPE=resend
+
+# Default send from email address, if not specified
+MAIL_DEFAULT_SEND_FROM=
+
+# API-Key for the Resend email provider, used when MAIL_TYPE is `resend`.
+RESEND_API_URL=https://api.resend.com
+RESEND_API_KEY=your-resend-api-key
+
+
+# SMTP server configuration, used when MAIL_TYPE is `smtp`
+SMTP_SERVER=
+SMTP_PORT=465
+SMTP_USERNAME=
+SMTP_PASSWORD=
+SMTP_USE_TLS=true
+SMTP_OPPORTUNISTIC_TLS=false
+
+# ------------------------------
+# Others Configuration
+# ------------------------------
+
+# Maximum length of segmentation tokens for indexing
+INDEXING_MAX_SEGMENTATION_TOKENS_LENGTH=4000
+
+# Member invitation link valid time (hours),
+# Default: 72.
+INVITE_EXPIRY_HOURS=72
+
+# Reset password token valid time (minutes),
+RESET_PASSWORD_TOKEN_EXPIRY_MINUTES=5
+
+# The sandbox service endpoint.
+CODE_EXECUTION_ENDPOINT=http://sandbox:8194
+CODE_EXECUTION_API_KEY=dify-sandbox
+CODE_MAX_NUMBER=9223372036854775807
+CODE_MIN_NUMBER=-9223372036854775808
+CODE_MAX_DEPTH=5
+CODE_MAX_PRECISION=20
+CODE_MAX_STRING_LENGTH=80000
+CODE_MAX_STRING_ARRAY_LENGTH=30
+CODE_MAX_OBJECT_ARRAY_LENGTH=30
+CODE_MAX_NUMBER_ARRAY_LENGTH=1000
+CODE_EXECUTION_CONNECT_TIMEOUT=10
+CODE_EXECUTION_READ_TIMEOUT=60
+CODE_EXECUTION_WRITE_TIMEOUT=10
+TEMPLATE_TRANSFORM_MAX_LENGTH=80000
+
+# Workflow runtime configuration
+WORKFLOW_MAX_EXECUTION_STEPS=500
+WORKFLOW_MAX_EXECUTION_TIME=1200
+WORKFLOW_CALL_MAX_DEPTH=5
+MAX_VARIABLE_SIZE=204800
+WORKFLOW_PARALLEL_DEPTH_LIMIT=3
+WORKFLOW_FILE_UPLOAD_LIMIT=10
+
+# HTTP request node in workflow configuration
+HTTP_REQUEST_NODE_MAX_BINARY_SIZE=10485760
+HTTP_REQUEST_NODE_MAX_TEXT_SIZE=1048576
+HTTP_REQUEST_NODE_SSL_VERIFY=True
+
+# SSRF Proxy server HTTP URL
+SSRF_PROXY_HTTP_URL=http://ssrf_proxy:3128
+# SSRF Proxy server HTTPS URL
+SSRF_PROXY_HTTPS_URL=http://ssrf_proxy:3128
+
+# Maximum loop count in the workflow
+LOOP_NODE_MAX_COUNT=100
+
+# The maximum number of tools that can be used in the agent.
+MAX_TOOLS_NUM=10
+
+# Maximum number of Parallelism branches in the workflow
+MAX_PARALLEL_LIMIT=10
+
+# ------------------------------
+# Environment Variables for web Service
+# ------------------------------
+
+# The timeout for the text generation in millisecond
+TEXT_GENERATION_TIMEOUT_MS=60000
+
+# ------------------------------
+# Environment Variables for db Service
+# ------------------------------
+
+PGUSER=${DB_USERNAME}
+# The password for the default postgres user.
+POSTGRES_PASSWORD=${DB_PASSWORD}
+# The name of the default postgres database.
+POSTGRES_DB=${DB_DATABASE}
+# postgres data directory
+PGDATA=/var/lib/postgresql/data/pgdata
+
+# ------------------------------
+# Environment Variables for sandbox Service
+# ------------------------------
+
+# The API key for the sandbox service
+SANDBOX_API_KEY=dify-sandbox
+# The mode in which the Gin framework runs
+SANDBOX_GIN_MODE=release
+# The timeout for the worker in seconds
+SANDBOX_WORKER_TIMEOUT=15
+# Enable network for the sandbox service
+SANDBOX_ENABLE_NETWORK=true
+# HTTP proxy URL for SSRF protection
+SANDBOX_HTTP_PROXY=http://ssrf_proxy:3128
+# HTTPS proxy URL for SSRF protection
+SANDBOX_HTTPS_PROXY=http://ssrf_proxy:3128
+# The port on which the sandbox service runs
+SANDBOX_PORT=8194
+
+# ------------------------------
+# Environment Variables for weaviate Service
+# (only used when VECTOR_STORE is weaviate)
+# ------------------------------
+WEAVIATE_PERSISTENCE_DATA_PATH=/var/lib/weaviate
+WEAVIATE_QUERY_DEFAULTS_LIMIT=25
+WEAVIATE_AUTHENTICATION_ANONYMOUS_ACCESS_ENABLED=true
+WEAVIATE_DEFAULT_VECTORIZER_MODULE=none
+WEAVIATE_CLUSTER_HOSTNAME=node1
+WEAVIATE_AUTHENTICATION_APIKEY_ENABLED=true
+WEAVIATE_AUTHENTICATION_APIKEY_ALLOWED_KEYS=WVF5YThaHlkYwhGUSmCRgsX3tD5ngdN8pkih
+WEAVIATE_AUTHENTICATION_APIKEY_USERS=hello@dify.ai
+WEAVIATE_AUTHORIZATION_ADMINLIST_ENABLED=true
+WEAVIATE_AUTHORIZATION_ADMINLIST_USERS=hello@dify.ai
+
+# ------------------------------
+# Environment Variables for Chroma
+# (only used when VECTOR_STORE is chroma)
+# ------------------------------
+
+# Authentication credentials for Chroma server
+CHROMA_SERVER_AUTHN_CREDENTIALS=difyai123456
+# Authentication provider for Chroma server
+CHROMA_SERVER_AUTHN_PROVIDER=chromadb.auth.token_authn.TokenAuthenticationServerProvider
+# Persistence setting for Chroma server
+CHROMA_IS_PERSISTENT=TRUE
+
+# ------------------------------
+# Environment Variables for Oracle Service
+# (only used when VECTOR_STORE is Oracle)
+# ------------------------------
+ORACLE_PWD=Dify123456
+ORACLE_CHARACTERSET=AL32UTF8
+
+# ------------------------------
+# Environment Variables for milvus Service
+# (only used when VECTOR_STORE is milvus)
+# ------------------------------
+# ETCD configuration for auto compaction mode
+ETCD_AUTO_COMPACTION_MODE=revision
+# ETCD configuration for auto compaction retention in terms of number of revisions
+ETCD_AUTO_COMPACTION_RETENTION=1000
+# ETCD configuration for backend quota in bytes
+ETCD_QUOTA_BACKEND_BYTES=4294967296
+# ETCD configuration for the number of changes before triggering a snapshot
+ETCD_SNAPSHOT_COUNT=50000
+# MinIO access key for authentication
+MINIO_ACCESS_KEY=minioadmin
+# MinIO secret key for authentication
+MINIO_SECRET_KEY=minioadmin
+# ETCD service endpoints
+ETCD_ENDPOINTS=etcd:2379
+# MinIO service address
+MINIO_ADDRESS=minio:9000
+# Enable or disable security authorization
+MILVUS_AUTHORIZATION_ENABLED=true
+
+# ------------------------------
+# Environment Variables for pgvector / pgvector-rs Service
+# (only used when VECTOR_STORE is pgvector / pgvector-rs)
+# ------------------------------
+PGVECTOR_PGUSER=postgres
+# The password for the default postgres user.
+PGVECTOR_POSTGRES_PASSWORD=difyai123456
+# The name of the default postgres database.
+PGVECTOR_POSTGRES_DB=dify
+# postgres data directory
+PGVECTOR_PGDATA=/var/lib/postgresql/data/pgdata
+
+# ------------------------------
+# Environment Variables for opensearch
+# (only used when VECTOR_STORE is opensearch)
+# ------------------------------
+OPENSEARCH_DISCOVERY_TYPE=single-node
+OPENSEARCH_BOOTSTRAP_MEMORY_LOCK=true
+OPENSEARCH_JAVA_OPTS_MIN=512m
+OPENSEARCH_JAVA_OPTS_MAX=1024m
+OPENSEARCH_INITIAL_ADMIN_PASSWORD=Qazwsxedc!@#123
+OPENSEARCH_MEMLOCK_SOFT=-1
+OPENSEARCH_MEMLOCK_HARD=-1
+OPENSEARCH_NOFILE_SOFT=65536
+OPENSEARCH_NOFILE_HARD=65536
+
+# ------------------------------
+# Environment Variables for Nginx reverse proxy
+# ------------------------------
+NGINX_SERVER_NAME=_
+NGINX_HTTPS_ENABLED=false
+# HTTP port
+NGINX_PORT=80
+# SSL settings are only applied when HTTPS_ENABLED is true
+NGINX_SSL_PORT=443
+# if HTTPS_ENABLED is true, you're required to add your own SSL certificates/keys to the `./nginx/ssl` directory
+# and modify the env vars below accordingly.
+NGINX_SSL_CERT_FILENAME=dify.crt
+NGINX_SSL_CERT_KEY_FILENAME=dify.key
+NGINX_SSL_PROTOCOLS=TLSv1.1 TLSv1.2 TLSv1.3
+
+# Nginx performance tuning
+NGINX_WORKER_PROCESSES=auto
+NGINX_CLIENT_MAX_BODY_SIZE=15M
+NGINX_KEEPALIVE_TIMEOUT=65
+
+# Proxy settings
+NGINX_PROXY_READ_TIMEOUT=3600s
+NGINX_PROXY_SEND_TIMEOUT=3600s
+
+# Set true to accept requests for /.well-known/acme-challenge/
+NGINX_ENABLE_CERTBOT_CHALLENGE=false
+
+# ------------------------------
+# Certbot Configuration
+# ------------------------------
+
+# Email address (required to get certificates from Let's Encrypt)
+CERTBOT_EMAIL=your_email@example.com
+
+# Domain name
+CERTBOT_DOMAIN=your_domain.com
+
+# certbot command options
+# i.e: --force-renewal --dry-run --test-cert --debug
+CERTBOT_OPTIONS=
+
+# ------------------------------
+# Environment Variables for SSRF Proxy
+# ------------------------------
+SSRF_HTTP_PORT=3128
+SSRF_COREDUMP_DIR=/var/spool/squid
+SSRF_REVERSE_PROXY_PORT=8194
+SSRF_SANDBOX_HOST=sandbox
+SSRF_DEFAULT_TIME_OUT=5
+SSRF_DEFAULT_CONNECT_TIME_OUT=5
+SSRF_DEFAULT_READ_TIME_OUT=5
+SSRF_DEFAULT_WRITE_TIME_OUT=5
+
+# ------------------------------
+# docker env var for specifying vector db type at startup
+# (based on the vector db type, the corresponding docker
+# compose profile will be used)
+# if you want to use unstructured, add ',unstructured' to the end
+# ------------------------------
+COMPOSE_PROFILES=${VECTOR_STORE:-weaviate}
+
+# ------------------------------
+# Docker Compose Service Expose Host Port Configurations
+# ------------------------------
+EXPOSE_NGINX_PORT=10505
+EXPOSE_NGINX_SSL_PORT=443
+
+# ----------------------------------------------------------------------------
+# ModelProvider & Tool Position Configuration
+# Used to specify the model providers and tools that can be used in the app.
+# ----------------------------------------------------------------------------
+
+# Pin, include, and exclude tools
+# Use comma-separated values with no spaces between items.
+# Example: POSITION_TOOL_PINS=bing,google
+POSITION_TOOL_PINS=
+POSITION_TOOL_INCLUDES=
+POSITION_TOOL_EXCLUDES=
+
+# Pin, include, and exclude model providers
+# Use comma-separated values with no spaces between items.
+# Example: POSITION_PROVIDER_PINS=openai,openllm
+POSITION_PROVIDER_PINS=
+POSITION_PROVIDER_INCLUDES=
+POSITION_PROVIDER_EXCLUDES=
+
+# CSP https://developer.mozilla.org/en-US/docs/Web/HTTP/CSP
+CSP_WHITELIST=
+
+# Enable or disable create tidb service job
+CREATE_TIDB_SERVICE_JOB_ENABLED=false
+
+# Maximum number of submitted thread count in a ThreadPool for parallel node execution
+MAX_SUBMIT_COUNT=100
+
+# The maximum number of top-k value for RAG.
+TOP_K_MAX_VALUE=10
+
+# ------------------------------
+# Plugin Daemon Configuration
+# ------------------------------
+
+DB_PLUGIN_DATABASE=dify_plugin
+EXPOSE_PLUGIN_DAEMON_PORT=5002
+PLUGIN_DAEMON_PORT=5002
+PLUGIN_DAEMON_KEY=lYkiYYT6owG+71oLerGzA7GXCgOT++6ovaezWAjpCjf+Sjc3ZtU+qUEi
+PLUGIN_DAEMON_URL=http://plugin_daemon:5002
+PLUGIN_MAX_PACKAGE_SIZE=52428800
+PLUGIN_PPROF_ENABLED=false
+
+PLUGIN_DEBUGGING_HOST=0.0.0.0
+PLUGIN_DEBUGGING_PORT=5003
+EXPOSE_PLUGIN_DEBUGGING_HOST=localhost
+EXPOSE_PLUGIN_DEBUGGING_PORT=5003
+
+# If this key is changed, DIFY_INNER_API_KEY in plugin_daemon service must also be updated or agent node will fail.
+PLUGIN_DIFY_INNER_API_KEY=QaHbTe77CtuXmsfyhR7+vRjI/+XbV1AaFy691iy+kGDv2Jvy0/eAh8Y1
+PLUGIN_DIFY_INNER_API_URL=http://api:5001
+
+ENDPOINT_URL_TEMPLATE=http://localhost/e/{hook_id}
+
+MARKETPLACE_ENABLED=true
+MARKETPLACE_API_URL=https://marketplace.dify.ai
+
+FORCE_VERIFYING_SIGNATURE=true
+
+PLUGIN_PYTHON_ENV_INIT_TIMEOUT=120
+PLUGIN_MAX_EXECUTION_TIMEOUT=600
+# PIP_MIRROR_URL=https://pypi.tuna.tsinghua.edu.cn/simple
+PIP_MIRROR_URL=
--- a/dify/compose.yaml
+++ b/dify/compose.yaml
--- a/gpustat-web/.version
+++ b/gpustat-web/.version
@@ -1 +0,0 @@
-v25.03.17
--- a/gpustat-web/compose.yaml
+++ b/gpustat-web/compose.yaml
@@ -1,13 +0,0 @@
-version: "3.8"
-services:
-  gpustat-web:
-    image: docker.citory.tech/public/gpustat-web:10599
-    container_name: gpustat-web
-    ports:
-      - 10509:80
-    extra_hosts:
-      - host.docker.internal:host-gateway
-    restart: always
-x-dockge:
-  urls:
-    - http://local.citory.tech:10509
--- a/kodbox/.version
+++ b/kodbox/.version
@@ -1 +0,0 @@
-v25.03.17
--- a/ktransformers/.env
+++ b/ktransformers/.env
@@ -0,0 +1,3 @@
+TRANSFORMERS_OFFLINE=0
+HF_HUB_OFFLINE=0
+TORCH_CUDA_ARCH_LIST=8.9
--- a/ktransformers/compose.yaml
+++ b/ktransformers/compose.yaml
@@ -0,0 +1,47 @@
+version: "3.8"
+services:
+  ktransformers:
+    image: docker.citory.tech/public/ktransformers:0.2.2rc1
+    container_name: ktransformers
+    runtime: nvidia
+    tty: true
+    stdin_open: true
+    ports:
+      - 10580:10580
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: 2
+              capabilities:
+                - gpu
+    ipc: host
+    volumes:
+      - /home/deepgeek/data/data_local/server/ktransformers/models:/workspace/models
+      - /home/deepgeek/data/data_local/server/ktransformers/ktransformers/website:/workspace/ktransformers/ktransformers/website
+    env_file:
+      - .env
+    restart: unless-stopped
+    entrypoint: [
+      "python3", "/workspace/ktransformers/ktransformers/server/main.py",
+      "--gguf_path", "/workspace/models/DeepSeek-R1-GGUF/DeepSeek-R1-UD-Q2_K_XL",
+      "--model_path", "/workspace/models/DeepSeek-R1",
+      "--model_name", "deepseek-r1:671b",
+      "--cpu_infer", "94",
+      "--optimize_config_path", "/workspace/ktransformers/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu.yaml",
+      "--max_new_tokens", "8192",
+      "--cache_lens", "32768",
+      "--total_context", "32768",
+      "--cache_q4", "true",
+      "--temperature", "0.6",
+      "--top_p", "0.95",
+      "--force_think",
+      "--no-use_cuda_graph",
+      "--host", "0.0.0.0",
+      "--port", "10580"
+    ]
+x-dockge:
+  urls:
+    - http://local.citory.tech:10580
+networks: {}
--- a/nlp/.version
+++ b/nlp/.version
@@ -1 +0,0 @@
-v25.03.17
--- a/ollama/.version
+++ b/ollama/.version
@@ -1 +0,0 @@
-v25.03.17
--- a/ollama/compose.yaml
+++ b/ollama/compose.yaml
@@ -4,19 +4,23 @@ services:
    image: docker.citory.tech/mirror/ollama/ollama:latest
    container_name: ollama
    ports:
-      - 10581:11434
-    runtime: nvidia
-    volumes:
-      - /home/deepgeek/data/data_local/server/ollama:/root/.ollama
-    environment:
-      NVIDIA_VISIBLE_DEVICES: all
+      - 10580:11434
+    tty: true
    deploy:
      resources:
        reservations:
          devices:
-            - capabilities:
+            - driver: nvidia
+              count: 2
+              capabilities:
                - gpu
+    ipc: host
+    runtime: nvidia
+    volumes:
+      - /home/deepgeek/data/data_base/ollama:/root/.ollama
+    restart: always
+    command: ollama run gemma3:27b
 x-dockge:
  urls:
-    - http://local.citory.tech:10581
+    - http://local.citory.tech:10580
 networks: {}
--- a/open-webui/.version
+++ b/open-webui/.version
@@ -1 +0,0 @@
-v25.03.17
--- a/open-webui/compose.yaml
+++ b/open-webui/compose.yaml
@@ -1,17 +1,24 @@
 version: "3.8"
 services:
  open-webui:
-    image: docker.citory.tech/mirror/backplane/open-webui:0
+    image: docker.citory.tech/mirror/backplane/open-webui:0.5.20
    container_name: open-webui
    ports:
      - 10503:8080
    environment:
+      - OPENAI_API_KEY='' # 替换为您的 OpenAI API 密钥
+      - OPENAI_API_BASE_URL=http://host.docker.internal:10580/v1 # 替换为您的 VLLM IP 和端口
+      - WHISPER_MODEL=large
+      - ENABLE_OLLAMA_API=true
+      - OLLAMA_BASE_URL=http://host.docker.internal:10580
+      - SCARF_NO_ANALYTICS=true
+      - ANONYMIZED_TELEMETRY=false
+      - DO_NOT_TRACK=true
+      - ENABLE_SIGNUP=false
+      - WEBUI_AUTH=false
      - ENABLE_RAG_WEB_SEARCH=true
      - RAG_WEB_SEARCH_ENGINE=duckduckgo
-      - ENABLE_OLLAMA_API=false
-      - OPENAI_API_KEY=1ZfFN6nICGfMAUhPKwRbpmbwnd9aYkwT8RbluK32ASpPZgglPhdmLv4zDHh7BebQ # 替换为您的 OpenAI API 密钥
-      - WHISPER_MODEL=large
-      - OPENAI_API_BASE_URL=http://host.docker.internal:10580/v1 # 替换为您的 VLLM IP 和端口
+      - RAG_EMBEDDING_MODEL_AUTO_UPDATE=true
    volumes:
      - ./data/:/app/backend/data
    extra_hosts:
--- a/owlsam/.version
+++ b/owlsam/.version
@@ -1 +0,0 @@
-v25.03.17
--- a/portainer/.version
+++ b/portainer/.version
@@ -1 +0,0 @@
-v25.03.17
--- a/stable-diffusion-webui/.version
+++ b/stable-diffusion-webui/.version
@@ -1 +0,0 @@
-v25.03.17
--- a/sun-panel/.version
+++ b/sun-panel/.version
@@ -1 +0,0 @@
-v25.03.17
--- a/sun-panel/compose.yaml
+++ b/sun-panel/compose.yaml
@@ -1,18 +0,0 @@
-version: "3.8"
-services:
-  sun-panel:
-    image: docker.citory.tech/mirror/hslr/sun-panel:latest
-    container_name: sun-panel
-    volumes:
-      - ./conf:/app/conf
-      - /var/run/docker.sock:/var/run/docker.sock # 挂载docker.sock
-      - ./runtime:/app/runtime # 挂载日志目录
-      - /mnt/data_base:/os # 硬盘挂载点（根据自己需求修改）
-      - /:/system # 硬盘挂载点（根据自己需求修改）
-    ports:
-      - 10500:3002
-    restart: always
-networks: {}
-x-dockge:
-  urls:
-    - http://local.citory.tech:10500
--- a/sun-panel/conf/custom/favicon.ico
+++ b/sun-panel/conf/custom/favicon.ico
--- a/sun-panel/conf/custom/index.css
+++ b/sun-panel/conf/custom/index.css
--- a/sun-panel/conf/custom/index.js
+++ b/sun-panel/conf/custom/index.js
--- a/sun-panel/conf/uploads/2025/3/16/10df03379d5c47d63ecebeaa41968c32.png
+++ b/sun-panel/conf/uploads/2025/3/16/10df03379d5c47d63ecebeaa41968c32.png
--- a/sun-panel/conf/uploads/2025/3/16/2e20b93fbf3a346375f847c468ef3035.jpeg
+++ b/sun-panel/conf/uploads/2025/3/16/2e20b93fbf3a346375f847c468ef3035.jpeg
--- a/sun-panel/conf/uploads/2025/3/16/41d76155bd23bd4fdb194675e797dbcf.png
+++ b/sun-panel/conf/uploads/2025/3/16/41d76155bd23bd4fdb194675e797dbcf.png
--- a/sun-panel/conf/uploads/2025/3/16/46c41a6f2049ea26e483ccf6542947f4.svg
+++ b/sun-panel/conf/uploads/2025/3/16/46c41a6f2049ea26e483ccf6542947f4.svg
@@ -1 +0,0 @@
-<svg height="1em" style="flex:none;line-height:1" viewBox="0 0 24 24" width="1em" xmlns="http://www.w3.org/2000/svg"><title>vLLM</title><path d="M0 4.973h9.324V23L0 4.973z" fill="#FDB515"></path><path d="M13.986 4.351L22.378 0l-6.216 23H9.324l4.662-18.649z" fill="#30A2FF"></path></svg>
--- a/sun-panel/conf/uploads/2025/3/16/47e55c2485bb3a79fe74f774c7c28b0f.png
+++ b/sun-panel/conf/uploads/2025/3/16/47e55c2485bb3a79fe74f774c7c28b0f.png
--- a/sun-panel/conf/uploads/2025/3/16/4d9c54fc716689d490b6f7d486b0005f.png
+++ b/sun-panel/conf/uploads/2025/3/16/4d9c54fc716689d490b6f7d486b0005f.png
--- a/sun-panel/conf/uploads/2025/3/16/5b918100963a1305b232eae785a2d3a5.jpg
+++ b/sun-panel/conf/uploads/2025/3/16/5b918100963a1305b232eae785a2d3a5.jpg
--- a/sun-panel/conf/uploads/2025/3/16/5d3bac9a4753399641c4d5c0ee278db1.png
+++ b/sun-panel/conf/uploads/2025/3/16/5d3bac9a4753399641c4d5c0ee278db1.png
--- a/sun-panel/conf/uploads/2025/3/16/605fc080b590bc0f42c2a1bdab20aa57.png
+++ b/sun-panel/conf/uploads/2025/3/16/605fc080b590bc0f42c2a1bdab20aa57.png
--- a/sun-panel/conf/uploads/2025/3/16/7e9970e7aa0c31f2e71f416bcfc0b281.svg
+++ b/sun-panel/conf/uploads/2025/3/16/7e9970e7aa0c31f2e71f416bcfc0b281.svg
@@ -1,14 +0,0 @@
-<?xml version="1.0" encoding="UTF-8" standalone="no" ?>
-<!DOCTYPE svg PUBLIC "-//W3C//DTD SVG 1.1//EN" "http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd">
-<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" version="1.1" width="640" height="640" viewBox="0 0 640 640" xml:space="preserve">
-<desc>Created with Fabric.js 5.3.0</desc>
-<defs>
-</defs>
-<g transform="matrix(0.9544918218 0 0 0.9544918218 320 325.5657767239)" id="0UAuLmXgnot4bJxVEVJCQ"  >
-<linearGradient id="SVGID_136_0" gradientUnits="userSpaceOnUse" gradientTransform="matrix(1 0 0 1 -236.6470440833 -213.9441386034)"  x1="259.78" y1="261.15" x2="463.85" y2="456.49">
-<stop offset="0%" style="stop-color:#74C2FF;stop-opacity: 1"/>
-<stop offset="100%" style="stop-color:rgb(134,230,169);stop-opacity: 1"/>
-</linearGradient>
-<path style="stroke: rgb(242,242,242); stroke-opacity: 0.51; stroke-width: 190; stroke-dasharray: none; stroke-linecap: butt; stroke-dashoffset: 0; stroke-linejoin: miter; stroke-miterlimit: 4; fill: url(#SVGID_136_0); fill-rule: nonzero; opacity: 1;"  transform=" translate(0, 0)" d="M 131.8665 -139.04883 C 159.01022 -111.20969000000001 170.12421 -99.45396000000001 203.11849999999998 -51.72057000000001 C 236.1128 -3.9871800000000093 264.44147999999996 83.98416999999998 187.33995 144.05073 C 177.72728999999998 151.53955 166.73827 158.81189999999998 154.65932999999998 165.65812999999997 C 69.85514999999998 213.72433999999998 -68.67309000000003 240.78578 -161.79279 174.28328999999997 C -268.17583 98.30862999999997 -260.10282 -68.66557000000003 -144.35093 -170.50579000000005 C -28.599040000000002 -272.34602000000007 104.72278 -166.88797000000005 131.86649999999997 -139.04883000000004 z" stroke-linecap="round" />
-</g>
-</svg>
--- a/sun-panel/conf/uploads/2025/3/16/97376d7cf0c2d90fa0f9c5e14da2a89f.ico
+++ b/sun-panel/conf/uploads/2025/3/16/97376d7cf0c2d90fa0f9c5e14da2a89f.ico
--- a/sun-panel/conf/uploads/2025/3/16/9d135876afb73c0ef637a24b9ad93945.ico
+++ b/sun-panel/conf/uploads/2025/3/16/9d135876afb73c0ef637a24b9ad93945.ico
--- a/sun-panel/conf/uploads/2025/3/16/d4bdc7ed4011fe08d1057fed05190f23.png
+++ b/sun-panel/conf/uploads/2025/3/16/d4bdc7ed4011fe08d1057fed05190f23.png
--- a/sun-panel/conf/uploads/2025/3/16/db44ee8e8563ba14fcb7622c6b606d31.png
+++ b/sun-panel/conf/uploads/2025/3/16/db44ee8e8563ba14fcb7622c6b606d31.png
--- a/sun-panel/conf/uploads/2025/3/16/de41043b7c03d4a2fe94c9f954f9e14c.png
+++ b/sun-panel/conf/uploads/2025/3/16/de41043b7c03d4a2fe94c9f954f9e14c.png
--- a/sun-panel/conf/uploads/2025/3/16/f47a87c35f4780def333db0ac8659636.png
+++ b/sun-panel/conf/uploads/2025/3/16/f47a87c35f4780def333db0ac8659636.png
--- a/toolbox-ocr/.version
+++ b/toolbox-ocr/.version
@@ -1 +0,0 @@
-v25.03.17
--- a/vllm-deepseek-r1-32b/.env
+++ b/vllm-deepseek-r1-32b/.env
--- a/vllm-deepseek-r1-32b/compose.yaml
+++ b/vllm-deepseek-r1-32b/compose.yaml
@@ -0,0 +1,30 @@
+services:
+  vllm-deepseek-r1-32b:
+    image: docker.citory.tech/mirror/vllm/vllm-openai:latest
+    container_name: vllm-deepseek-r1-32b
+    ports:
+      - 10580:8080
+    tty: true
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: 2
+              capabilities:
+                - gpu
+    ipc: host
+    runtime: nvidia
+    volumes:
+      - /home/deepgeek/data/data_local/server/vllm/models:/models
+    restart: always
+    command: --served-model-name deepseek-r1:32b越狱 --model
+      /models/huihui-ai/DeepSeek-R1-Distill-Qwen-32B-abliterated
+      --trust-remote-code --host 0.0.0.0 --port 8080 --max-model-len 8192
+      --tensor-parallel-size 2 --gpu_memory_utilization 0.9 --enforce-eager
+      --dtype auto --swap-space 8 --enable-auto-tool-choice
+      --tool-call-parser pythonic
+x-dockge:
+  urls:
+    - http://local.citory.tech:10580
+networks: {}
--- a/vllm-deepseek-r1-70b/.env
+++ b/vllm-deepseek-r1-70b/.env
--- a/vllm-deepseek-r1-70b/compose.yaml
+++ b/vllm-deepseek-r1-70b/compose.yaml
@@ -0,0 +1,30 @@
+version: "3.9"
+services:
+  vllm-deepseek-r1-70b:
+    image: docker.citory.tech/mirror/vllm/vllm-openai:latest
+    container_name: vllm-deepseek-r1-70b
+    ports:
+      - 10580:8080
+    tty: true
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: 2
+              capabilities:
+                - gpu
+    ipc: host
+    runtime: nvidia
+    volumes:
+      - /home/deepgeek/data/data_local/server/vllm/models:/models
+    restart: always
+    command: --served-model-name deepseek-r1:70b越狱 --model
+      /models/Fasiany/DeepSeek-R1-Distill-Llama-70B-abliterated-GPTQ-int4
+      --trust-remote-code --host 0.0.0.0 --port 8080 --enable-auto-tool-choice --tool-call-parser pythonic --max-model-len 8192
+      --tensor-parallel-size 2 --gpu_memory_utilization 0.9 --enforce-eager
+      --dtype auto --swap-space 8 
+x-dockge:
+  urls:
+    - http://local.citory.tech:10580
+networks: {}
--- a/vllm-qwen25-72b-instruct-awq/.env
+++ b/vllm-qwen25-72b-instruct-awq/.env
@@ -0,0 +1 @@
+# VARIABLE=value #comment
--- a/vllm-qwen25-72b-instruct-awq/compose.yaml
+++ b/vllm-qwen25-72b-instruct-awq/compose.yaml
@@ -0,0 +1,30 @@
+version: "3.9"
+services:
+  vllm-Qwen2.5-72B-Instruct-AWQ:
+    image: docker.citory.tech/mirror/vllm/vllm-openai:latest
+    container_name: vllm-Qwen2.5-72B-Instruct-AWQ
+    ports:
+      - 10580:8080
+    tty: true
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: 2
+              capabilities:
+                - gpu
+    ipc: host
+    runtime: nvidia
+    volumes:
+      - /home/deepgeek/data/data_local/server/vllm/models:/models
+    restart: always
+    command: --served-model-name Qwen2.5-72B-Instruct-AWQ --model /models/Qwen/Qwen2.5-72B-Instruct-AWQ
+      --trust-remote-code --host 0.0.0.0 --port 8080 --max-model-len 8192
+      --tensor-parallel-size 2 --gpu_memory_utilization 0.9 --enforce-eager
+      --dtype auto --swap-space 8 --enable-auto-tool-choice --tool-call-parser
+      llama3_json
+x-dockge:
+  urls:
+    - http://local.citory.tech:10580
+networks: {}
--- a/vllm-qwen25-coder-32b-instruct/.env
+++ b/vllm-qwen25-coder-32b-instruct/.env
@@ -0,0 +1 @@
+# VARIABLE=value #comment
--- a/vllm-qwen25-coder-32b-instruct/compose.yaml
+++ b/vllm-qwen25-coder-32b-instruct/compose.yaml
@@ -0,0 +1,30 @@
+version: "3.9"
+services:
+  vllm-Qwen2.5-Coder-32B-Instruct:
+    image: docker.citory.tech/mirror/vllm/vllm-openai:latest
+    container_name: vllm-Qwen2.5-Coder-32B-Instruct
+    ports:
+      - 10580:8080
+    tty: true
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: 2
+              capabilities:
+                - gpu
+    ipc: host
+    runtime: nvidia
+    volumes:
+      - /home/deepgeek/data/data_local/server/vllm/models:/models
+    restart: always
+    command: --served-model-name Qwen2.5-Coder-32B-Instruct --model
+      /models/Qwen/Qwen2.5-Coder-32B-Instruct --trust-remote-code --host 0.0.0.0
+      --port 8080 --max-model-len 8192 --tensor-parallel-size 2
+      --gpu_memory_utilization 0.9 --enforce-eager --dtype auto --swap-space 8
+      --enable-auto-tool-choice --tool-call-parser llama3_json
+x-dockge:
+  urls:
+    - http://local.citory.tech:10580
+networks: {}
--- a/vllm-qwen25-vl-32b-instruct/.env
+++ b/vllm-qwen25-vl-32b-instruct/.env
@@ -0,0 +1 @@
+# VARIABLE=value #comment
--- a/vllm-qwen25-vl-32b-instruct/compose.yaml
+++ b/vllm-qwen25-vl-32b-instruct/compose.yaml
@@ -0,0 +1,30 @@
+version: "3.9"
+services:
+  vllm-Qwen2.5-VL-32B-Instruct:
+    image: docker.citory.tech/mirror/vllm/vllm-openai:latest
+    container_name: vllm-Qwen2.5-VL-32B-Instruct
+    ports:
+      - 10580:8080
+    tty: true
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: 2
+              capabilities:
+                - gpu
+    ipc: host
+    runtime: nvidia
+    volumes:
+      - /home/deepgeek/data/data_local/server/vllm/models:/models
+    restart: always
+    command: --served-model-name Qwen2.5-VL-32B-Instruct --model
+      /models/Qwen/Qwen2.5-VL-32B-Instruct --trust-remote-code --host 0.0.0.0
+      --port 8080 --max-model-len 8192 --tensor-parallel-size 2
+      --gpu_memory_utilization 0.9 --enforce-eager --dtype auto --swap-space 8
+      --enable-auto-tool-choice --tool-call-parser llama3_json
+x-dockge:
+  urls:
+    - http://local.citory.tech:10580
+networks: {}
--- a/vllm-qwq-32b/.env
+++ b/vllm-qwq-32b/.env
@@ -0,0 +1 @@
+# VARIABLE=value #comment
--- a/vllm-qwq-32b/compose.yaml
+++ b/vllm-qwq-32b/compose.yaml
@@ -0,0 +1,30 @@
+version: "3.9"
+services:
+  vllm-QwQ-32B:
+    image: docker.citory.tech/mirror/vllm/vllm-openai:latest
+    container_name: vllm-QwQ-32B
+    ports:
+      - 10580:8080
+    tty: true
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: 2
+              capabilities:
+                - gpu
+    ipc: host
+    runtime: nvidia
+    volumes:
+      - /home/deepgeek/data/data_local/server/vllm/models:/models
+    restart: always
+    command: --served-model-name QwQ-32B --model /models/Qwen/QwQ-32B
+      --trust-remote-code --host 0.0.0.0 --port 8080 --max-model-len 8192
+      --tensor-parallel-size 2 --gpu_memory_utilization 0.9 --enforce-eager
+      --dtype auto --swap-space 8 --enable-auto-tool-choice
+      --tool-call-parser llama3_json
+x-dockge:
+  urls:
+    - http://local.citory.tech:10580
+networks: {}
--- a/vllm/.version
+++ b/vllm/.version
@@ -1 +0,0 @@
-v25.03.17
--- a/vllm/compose.yaml
+++ b/vllm/compose.yaml
@@ -1,32 +0,0 @@
-version: "3.8"
-services:
-  vllm:
-    image: docker.citory.tech/mirror/vllm/vllm-openai:latest
-    container_name: vllm
-    ports:
-      - 10580:8080
-    tty: true
-    environment:
-      - CUDA_VISIBLE_DEVICES=0,1
-    deploy:
-      resources:
-        reservations:
-          devices:
-            - driver: nvidia
-              count: 2
-              capabilities:
-                - gpu
-    ipc: host
-    runtime: nvidia
-    volumes:
-      - /home/deepgeek/data/data_local/server/vllm/models:/models
-    restart: always
-    command: --served-model-name DeepSeek-R1-Distill-Llama-70B-AWQ --model
-      /models/Valdemardi/DeepSeek-R1-Distill-Llama-70B-AWQ --trust-remote-code
-      --host 0.0.0.0 --port 8080 --max-model-len 8192 --tensor-parallel-size 2
-      --gpu_memory_utilization 0.96 --enforce-eager --dtype auto --swap-space 8
-      --api-key
-      "O8Is3NSYnp5fICWFbhkbwpLWgvMLkdCSuXR5ZggLmgwTKNPEWsjx1NqUxkyU7wLX"
-x-dockge:
-  urls:
-    - http://local.citory.tech:10580
--- a/watchtower/.version
+++ b/watchtower/.version
@@ -1 +0,0 @@
-v25.03.17
				`@@ -1 +0,0 @@`
				`<svg height="1em" style="flex:none;line-height:1" viewBox="0 0 24 24" width="1em" xmlns="http://www.w3.org/2000/svg"><title>vLLM</title><path d="M0 4.973h9.324V23L0 4.973z" fill="#FDB515"></path><path d="M13.986 4.351L22.378 0l-6.216 23H9.324l4.662-18.649z" fill="#30A2FF"></path></svg>`