diff --git a/services/nvidia_sidecar/README.md b/services/nvidia_sidecar/README.md
index 6f62657..98a8862 100644
--- a/services/nvidia_sidecar/README.md
+++ b/services/nvidia_sidecar/README.md
@@ -24,7 +24,7 @@ nvidia-sidecar
 | `SIDECAR_API_KEY` | — | NVIDIA API Key(必填) |
 | `SIDECAR_RATE_RPM` | `40` | 每分钟请求数限制 |
 | `SIDECAR_BUCKET_CAPACITY` | `40` | 令牌桶容量 |
-| `SIDECAR_TIMEOUT` | `6000` | 上游请求超时(秒) |
+| `SIDECAR_TIMEOUT` | `60` | 上游请求超时(秒,上限截断 300s) |
 | `SIDECAR_QUEUE_MAX` | `500` | 队列最大长度 |
 | `SIDECAR_LOW_TIMEOUT` | `2.0` | 低优先级令牌等待超时(秒) |
 | `SIDECAR_FALLBACK_PASSTHROUGH` | `true` | 队列满时是否直通上游 |
diff --git a/services/nvidia_sidecar/rate_limiter.py b/services/nvidia_sidecar/rate_limiter.py
index d87fa28..e687b5d 100644
--- a/services/nvidia_sidecar/rate_limiter.py
+++ b/services/nvidia_sidecar/rate_limiter.py
@@ -30,10 +30,15 @@ class Priority(IntEnum):
 # ---------------------------------------------------------------------------
 
 NVIDIA_GATEWAY_ALIASES: set[str] = {
+    # OpenClaw 配置中全部的 NVIDIA provider 名称
+    # 同步自 openclaw.json models.providers 中的 NVIDIA 条目
     "nvidia",
     "nvidia-gateway",
+    "nvidia98053",
+    "nvidialiuweicheng84",
     "nvidiavx",
     "nvidiavx18088980513",
+    "nvidiavx64391942",
 }
 
 