We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 3605cad, commit 88f57af. Copy full SHA for 88f57af
infra/modal/webserver.py
@@ -56,7 +56,7 @@ def download_models():
56
# Run a web server on port 7997 and expose the Infinity embedding server
57
@app.function(
58
# cap the number of requests that may be pending on a single container
59
- allow_concurrent_inputs=16,
+ allow_concurrent_inputs=8,
60
# boots take around 30 seconds, so keep idle containers alive several times longer than that
61
container_idle_timeout=3 * MINUTES,
62
# max 5 container instances
0 commit comments