0894a86af8
v2.1 changes from 2nd-round review: + Emergency channel RPM: max(1, max_rpm * 0.1) + Queue 503: add Retry-After: 30 header + sidecar_backup_success Prometheus metric + Startup crypto.py key validation on boot + SQLite size limits: 100MB practical, 500MB WAL + RPM flow: per-request counting, not token-based + SSE streaming: TTFT for avg_latency_ms + Merge proxy/retry.py into core/cooldown.py Added sidecar-v2-nvidia-providers.yaml (11 keys) Co-authored-by: multica-agent <github@multica.ai>
121 lines
3.7 KiB
YAML
121 lines
3.7 KiB
YAML
# NVIDIA Provider Keys Reference for Sidecar V2
# =============================================
# ⚠️ SECURITY: This file contains sensitive API key material.
# In Sidecar V2 production deployment, API keys are stored as
# AES-256-GCM ciphertext in SQLite (providers.api_key column).
# The plaintext keys below are for V2 initial provisioning only.
#
# Usage: Import into Sidecar V2 via WebUI Admin or POST /api/v2/providers
# After import, this file should be stored in a secure location
# (Bitwarden / password manager) and NOT kept in plaintext on disk.
#
# Created: 2026-06-25 | By: 梁思筑 (architect)
# Total providers: 11 | Pool: main | RPM each: 40 | Total RPM capacity: 440

# Provider inventory: one entry per NVIDIA account in the pool.
#
# SECURITY: the api_key values are intentionally NOT stored in this file.
# Every entry carries the placeholder "REDACTED"; the real key must be
# pulled from the password manager and supplied at import time.
# Any key that was ever committed here in plaintext should be treated as
# compromised and rotated in the NVIDIA console before use.
#
# Fields per entry:
#   account       - short account identifier (all-digit IDs are quoted so
#                   they stay strings)
#   email         - login e-mail of the NVIDIA account
#   api_key       - placeholder only; see the security note above
#   endpoint_url  - API base URL used for this provider
#   model_prefix  - prefix associated with this provider's models
#   pool          - pool the provider belongs to
#   rpm_limit     - requests-per-minute limit for this key
#   notes         - free-form remark (may be empty)
providers:
  - account: bizwings
    email: vincent@bizwingsinc.com
    api_key: "REDACTED"
    endpoint_url: https://integrate.api.nvidia.com/v1
    model_prefix: "nvidia/"
    pool: main
    rpm_limit: 40
    notes: "主账号"

  - account: "98053"
    email: 98053@qq.com
    api_key: "REDACTED"
    endpoint_url: https://integrate.api.nvidia.com/v1
    model_prefix: "nvidia/"
    pool: main
    rpm_limit: 40
    notes: ""

  - account: liuweicheng84
    email: liuweicheng84@gmail.com
    api_key: "REDACTED"
    endpoint_url: https://integrate.api.nvidia.com/v1
    model_prefix: "nvidia/"
    pool: main
    rpm_limit: 40
    notes: ""

  - account: vx18088980513
    email: vx18088980513@qq.com
    api_key: "REDACTED"
    endpoint_url: https://integrate.api.nvidia.com/v1
    model_prefix: "nvidia/"
    pool: main
    rpm_limit: 40
    notes: ""

  - account: "64391942"
    email: 64391942@qq.com
    api_key: "REDACTED"
    endpoint_url: https://integrate.api.nvidia.com/v1
    model_prefix: "nvidia/"
    pool: main
    rpm_limit: 40
    notes: ""

  - account: cgtest1
    email: cgtest1@bizwingsinc.com
    api_key: "REDACTED"
    endpoint_url: https://integrate.api.nvidia.com/v1
    model_prefix: "nvidia/"
    pool: main
    rpm_limit: 40
    notes: "测试账号1"

  - account: cgtest2
    email: cgtest2@bizwingsinc.com
    api_key: "REDACTED"
    endpoint_url: https://integrate.api.nvidia.com/v1
    model_prefix: "nvidia/"
    pool: main
    rpm_limit: 40
    notes: "测试账号2"

  - account: "15876517651"
    email: 1248106918@qq.com
    api_key: "REDACTED"
    endpoint_url: https://integrate.api.nvidia.com/v1
    model_prefix: "nvidia/"
    pool: main
    rpm_limit: 40
    notes: ""

  - account: "19584586741"
    email: 414133763@qq.com
    api_key: "REDACTED"
    endpoint_url: https://integrate.api.nvidia.com/v1
    model_prefix: "nvidia/"
    pool: main
    rpm_limit: 40
    notes: ""

  - account: "18874954146"
    email: 350894172@qq.com
    api_key: "REDACTED"
    endpoint_url: https://integrate.api.nvidia.com/v1
    model_prefix: "nvidia/"
    pool: main
    rpm_limit: 40
    notes: ""

  - account: "2405483110"
    email: 2405483110@qq.com
    api_key: "REDACTED"
    endpoint_url: https://integrate.api.nvidia.com/v1
    model_prefix: "nvidia/"
    pool: main
    rpm_limit: 40
    notes: ""

# Aggregated stats for the provider list in this file.
# total_rpm_capacity equals total_providers x the per-key rpm_limit
# (11 x 40 = 440). Keep these figures in sync by hand when providers are
# added or removed.
# NOTE(review): the original indentation was lost; `pools` is assumed to
# nest under `summary` - confirm against the consumer's schema.
summary:
  total_providers: 11
  total_rpm_capacity: 440
  # Number of providers assigned to each pool.
  pools:
    main: 11
    fallback: 0