We have a GPU service that we would like to stop automatically when no internal requests are coming in.
We use the service.internal
address to make requests to this service; it is stopped automatically, but it is not started again.
# Mount the `gpu_data` volume at `/data`.
[mounts]
destination = "/data"
source = "gpu_data"
# TCP service for the app listening on internal port 8000.
[[services]]
protocol = "tcp"
internal_port = 8000
# Machines may be stopped when idle and started again on demand; with
# min_machines_running = 0 no machine is required to stay up.
# NOTE(review): auto start/stop is carried out by the Fly Proxy, so it
# presumably only reacts to traffic that passes through the proxy. Requests
# sent to the `.internal` address appear to reach the Machine directly and
# would not wake a stopped Machine -- confirm against the Fly.io docs and
# consider a Flycast (`<app>.flycast`) address for private traffic.
auto_start_machines = true
auto_stop_machines = true
min_machines_running = 0

# Port 80: plain HTTP.
[[services.ports]]
port = 80
handlers = ["http"]

# Port 443: TLS, then HTTP.
[[services.ports]]
port = 443
handlers = ["tls", "http"]

# Concurrency limits, counted in connections.
[services.concurrency]
type = "connections"
soft_limit = 4000
hard_limit = 5000
# TCP health check for the preceding [[services]] entry. It is placed before
# [[vm]] so the check sits next to the service it belongs to instead of
# trailing an unrelated table (out-of-order sub-tables are valid TOML but
# discouraged by the spec).
[[services.tcp_checks]]
interval = "15s"
timeout = "2s"
# NOTE(review): a 1s grace period may be too short for a service that needs
# time to become ready after a cold start -- confirm against real startup time.
grace_period = "1s"
restart_limit = 0

# Machine sizing: `l40s` size with 8 performance CPUs and 32gb of memory.
[[vm]]
size = "l40s"
cpu_kind = "performance"
cpus = 8
memory = "32gb"