Compare commits

...

3 Commits

Author SHA1 Message Date
Mikhail Yevchenko 40db98915f Add devcontainer configuration for Vast.ai serverless Ollama template 2026-05-18 20:38:26 +00:00
Mikhail Yevchenko 94926b74b6 Add log message for server listening status 2026-05-18 19:42:40 +00:00
Mikhail Yevchenko d0347b0755 Update log file path and enhance load log messages 2026-05-18 18:41:14 +00:00
2 changed files with 41 additions and 1 deletions
+37
View File
@@ -0,0 +1,37 @@
// .devcontainer/devcontainer.json
// Dev container for the Vast.ai serverless Ollama template.
// Includes Docker-in-Docker so you can build and test images from inside the container.
{
  "name": "vast.ai-serverless-ollama",
  "image": "mcr.microsoft.com/devcontainers/base:trixie",
  "features": {
    // Python toolchain; postCreateCommand below installs the project requirements into it.
    "ghcr.io/devcontainers/features/python:1": {
      "installTools": true,
      "version": "3.12"
    },
    // Nested Docker engine with Buildx and Compose v2.
    // "moby": false selects Docker CE packages instead of the Moby builds.
    "ghcr.io/devcontainers/features/docker-in-docker:3.0.0": {
      "moby": false,
      "version": "latest",
      "installDockerBuildx": true,
      "dockerDashComposeVersion": "v2"
    }
  },
  // The nested Docker daemon needs a privileged container to start.
  "runArgs": ["--privileged"],
  "containerEnv": {
    "DOCKER_BUILDKIT": "1"
  },
  // Runs once after the container is created: upgrade pip, then install the
  // project requirements plus pyyaml into the user site-packages.
  "postCreateCommand": "python3 -m pip install --user --upgrade pip && python3 -m pip install --user -r requirements.txt pyyaml",
  "customizations": {
    "vscode": {
      "extensions": [
        "ms-python.python",
        "ms-azuretools.vscode-docker"
      ],
      "settings": {
        // Point VS Code at the interpreter installed by the python feature
        // (the same one `python3` resolves to in postCreateCommand), not the
        // OS interpreter under /usr/bin, which does not have the packages
        // installed above and may be a different version or missing.
        "python.defaultInterpreterPath": "/usr/local/python/current/bin/python",
        "terminal.integrated.defaultProfile.linux": "bash",
        "docker.showStartPage": false
      }
    }
  }
}
+4 -1
View File
@@ -7,12 +7,15 @@ from vastai import Worker, WorkerConfig, HandlerConfig, LogActionConfig, Benchma
# vLLM model configuration # vLLM model configuration
MODEL_SERVER_URL = 'http://127.0.0.1' MODEL_SERVER_URL = 'http://127.0.0.1'
MODEL_SERVER_PORT = 18000 MODEL_SERVER_PORT = 18000
MODEL_LOG_FILE = '/var/log/portal/vllm.log' MODEL_LOG_FILE = '/var/log/onstart.log'
MODEL_HEALTHCHECK_ENDPOINT = "/health" MODEL_HEALTHCHECK_ENDPOINT = "/health"
# vLLM-specific log messages # vLLM-specific log messages
MODEL_LOAD_LOG_MSG = [ MODEL_LOAD_LOG_MSG = [
"Application startup complete.", "Application startup complete.",
"llama runner started in",
"Server listening on",
"msg=\"Listening on",
] ]
MODEL_ERROR_LOG_MSGS = [ MODEL_ERROR_LOG_MSGS = [