# compute_tpl_8_cpu_autoscaling.yaml
#
# Cluster compute template: one m5.2xlarge head node plus an autoscaling pool
# of m5.2xlarge workers (5 minimum, 130 maximum), all on-demand, in us-west-2.
#
# The cloud_id value is a template placeholder that is filled in from the
# ANYSCALE_CLOUD_ID environment variable before this file is parsed as YAML.
# It is single-quoted so that the file is valid YAML both before and after
# rendering, and so that an empty expansion stays a string instead of null.
cloud_id: '{{env["ANYSCALE_CLOUD_ID"]}}'
region: us-west-2

# Cluster-wide worker cap, sized for 1k max replicas:
# 1000 replicas / 8 CPUs per node = 125 nodes needed; 130 leaves headroom.
max_workers: 130

head_node_type:
  name: head_node
  # 8 CPUs, x86, 32G mem, 10Gb NIC, $0.384/hr on demand
  instance_type: m5.2xlarge

worker_node_types:
  - name: worker_node
    # 8 CPUs, x86, 32G mem, 10Gb NIC, $0.384/hr on demand
    instance_type: m5.2xlarge
    # A smaller min_workers makes head-node CPU usage very high and crashes
    # the head node.
    # Issue: https://github.com/ray-project/ray/issues/18908
    min_workers: 5
    # 1k max replicas; kept equal to the cluster-wide max_workers above.
    max_workers: 130
    use_spot: false

# NOTE(review): `aws` is assumed to be a top-level key (provider-specific
# launch options); the nesting was lost in the flattened source -- confirm.
aws:
  TagSpecifications:
    - ResourceType: "instance"
      Tags:
        # Tag values must be strings, hence the quoted number.
        - Key: ttl-hours
          Value: '24'