← console

job 885ab28b-c0a9-45d0-a158-c9382a888f8d

State: FAILED
Quota: servitor-demo
Manifest: adabffc64cc3874a33dd5b5290dd808bc43e29b652e811e86e9eb96d3700d50b
Entry override: tirefireind.us/flowmetal-servitor/reinstall-host/reinstall
Worker: worker-cb363943-e8d5-4544-959e-0acbf94251c1
Inbox HWM: 0
Error:
Traceback (most recent call last):
  File <builtin>, in <module>
* main.star:119, in _reinstall_impl
    fail("escalated host %s to RDS for repair" % hostname)
error: escalated host host-a38df12a to RDS for repair
   --> main.star:119:5
    |
119 |     fail("escalated host %s to RDS for repair" % hostname)
    |     ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
    |

Log

#0 print >>> [noc] pulling next host record off laskey…
#2 req 1 connector:http
{
  "method": "GET",
  "url": "http://laskey.flowmetal.svc.cluster.local:8080/hosts/next"
}
#3 req 1 ok
{
  "body": {
    "config": {
      "disk_layout": "single-nvme",
      "os": "ubuntu-24.04",
      "profile": "batch-worker",
      "rack": "rack-b1"
    },
    "hostname": "host-a38df12a"
  },
  "headers": {
    "content-length": "129",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:54:00 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#4 print >>> [noc] target host host-a38df12a (ubuntu-24.04 / batch-worker / single-nvme) — handing off to wilson.
#6 print >>> [noc] attempt 1/4: kicking off reinstall of host-a38df12a.
#8 req 4 connector:http
{
  "body_json": {
    "config": {
      "disk_layout": "single-nvme",
      "os": "ubuntu-24.04",
      "profile": "batch-worker",
      "rack": "rack-b1"
    },
    "hostname": "host-a38df12a"
  },
  "method": "POST",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall"
}
#9 req 4 ok
{
  "body": {
    "hostname": "host-a38df12a",
    "reinstall_id": "ri_25c62a394091"
  },
  "headers": {
    "content-length": "61",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:54:08 GMT",
    "server": "uvicorn"
  },
  "status": 202.0
}
#10 req 5 sleep deadline=1776765254.088334076 duration=2s
#11 req 5 ok
null
#12 req 6 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_25c62a394091"
}
#13 req 6 ok
{
  "body": {
    "eta_seconds": 7.85,
    "hostname": "host-a38df12a",
    "reinstall_id": "ri_25c62a394091",
    "status": "pending"
  },
  "headers": {
    "content-length": "99",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:54:14 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#14 req 7 sleep deadline=1776765267.036021626 duration=2s
#15 req 7 ok
null
#16 req 8 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_25c62a394091"
}
#17 req 8 ok
{
  "body": {
    "error_kind": "reinstall_broken",
    "hostname": "host-a38df12a",
    "message": "reinstall broke partway through",
    "reinstall_id": "ri_25c62a394091",
    "retryable": true,
    "status": "failed"
  },
  "headers": {
    "content-length": "172",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:54:27 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#18 print >>> [noc] attempt 1 failed (reinstall_broken); looping back to wilson.
#20 print >>> [noc] attempt 2/4: kicking off reinstall of host-a38df12a.
#22 req 11 connector:http
{
  "body_json": {
    "config": {
      "disk_layout": "single-nvme",
      "os": "ubuntu-24.04",
      "profile": "batch-worker",
      "rack": "rack-b1"
    },
    "hostname": "host-a38df12a"
  },
  "method": "POST",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall"
}
#23 req 11 ok
{
  "body": {
    "hostname": "host-a38df12a",
    "reinstall_id": "ri_ed350a18e81b"
  },
  "headers": {
    "content-length": "61",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:54:37 GMT",
    "server": "uvicorn"
  },
  "status": 202.0
}
#24 req 12 sleep deadline=1776765287.074012964 duration=2s
#25 req 12 ok
null
#26 req 13 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_ed350a18e81b"
}
#27 req 13 ok
{
  "body": {
    "eta_seconds": 2.24,
    "hostname": "host-a38df12a",
    "reinstall_id": "ri_ed350a18e81b",
    "status": "pending"
  },
  "headers": {
    "content-length": "99",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:54:46 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#28 req 14 sleep deadline=1776765298.017600777 duration=2s
#29 req 14 ok
null
#30 req 15 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_ed350a18e81b"
}
#31 req 15 ok
{
  "body": {
    "error_kind": "reinstall_broken",
    "hostname": "host-a38df12a",
    "message": "reinstall broke partway through",
    "reinstall_id": "ri_ed350a18e81b",
    "retryable": true,
    "status": "failed"
  },
  "headers": {
    "content-length": "172",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:54:58 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#32 print >>> [noc] attempt 2 failed (reinstall_broken); looping back to wilson.
#34 print >>> [noc] attempt 3/4: kicking off reinstall of host-a38df12a.
#36 req 18 connector:http
{
  "body_json": {
    "config": {
      "disk_layout": "single-nvme",
      "os": "ubuntu-24.04",
      "profile": "batch-worker",
      "rack": "rack-b1"
    },
    "hostname": "host-a38df12a"
  },
  "method": "POST",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall"
}
#37 req 18 ok
{
  "body": {
    "hostname": "host-a38df12a",
    "reinstall_id": "ri_3fdd90720503"
  },
  "headers": {
    "content-length": "61",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:54:59 GMT",
    "server": "uvicorn"
  },
  "status": 202.0
}
#38 req 19 sleep deadline=1776765303.088982352 duration=2s
#39 req 19 ok
null
#40 req 20 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_3fdd90720503"
}
#41 req 20 ok
{
  "body": {
    "eta_seconds": 5.25,
    "hostname": "host-a38df12a",
    "reinstall_id": "ri_3fdd90720503",
    "status": "pending"
  },
  "headers": {
    "content-length": "99",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:55:02 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#42 req 21 sleep deadline=1776765312.008663763 duration=2s
#43 req 21 ok
null
#44 req 22 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_3fdd90720503"
}
#45 req 22 ok
{
  "body": {
    "error_kind": "reinstall_broken",
    "hostname": "host-a38df12a",
    "message": "reinstall broke partway through",
    "reinstall_id": "ri_3fdd90720503",
    "retryable": true,
    "status": "failed"
  },
  "headers": {
    "content-length": "172",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:55:13 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#46 print >>> [noc] attempt 3 failed (reinstall_broken); looping back to wilson.
#48 print >>> [noc] attempt 4/4: kicking off reinstall of host-a38df12a.
#50 req 25 connector:http
{
  "body_json": {
    "config": {
      "disk_layout": "single-nvme",
      "os": "ubuntu-24.04",
      "profile": "batch-worker",
      "rack": "rack-b1"
    },
    "hostname": "host-a38df12a"
  },
  "method": "POST",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall"
}
#51 req 25 ok
{
  "body": {
    "hostname": "host-a38df12a",
    "reinstall_id": "ri_831321daae38"
  },
  "headers": {
    "content-length": "61",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:55:20 GMT",
    "server": "uvicorn"
  },
  "status": 202.0
}
#52 req 26 sleep deadline=1776765328.011737022 duration=2s
#53 req 26 ok
null
#54 req 27 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_831321daae38"
}
#55 req 27 ok
{
  "body": {
    "eta_seconds": 3.28,
    "hostname": "host-a38df12a",
    "reinstall_id": "ri_831321daae38",
    "status": "pending"
  },
  "headers": {
    "content-length": "99",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:55:29 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#56 req 28 sleep deadline=1776765338.946246543 duration=2s
#57 req 28 ok
null
#58 req 29 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_831321daae38"
}
#59 req 29 ok
{
  "body": {
    "error_kind": "reinstall_broken",
    "hostname": "host-a38df12a",
    "message": "reinstall broke partway through",
    "reinstall_id": "ri_831321daae38",
    "retryable": true,
    "status": "failed"
  },
  "headers": {
    "content-length": "172",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:55:39 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#60 print >>> [noc] attempt 4 failed (reinstall_broken); looping back to wilson.
#62 print >>> [noc] escalating host-a38df12a to RDS: wilson exhausted 4 attempts.
#64 req 32 connector:http
{
  "body_json": {
    "hostname": "host-a38df12a",
    "reason": "wilson exhausted 4 attempts"
  },
  "method": "POST",
  "url": "http://rds.flowmetal.svc.cluster.local:8080/tickets"
}
#65 req 32 ok
{
  "body": {
    "created_at": 1776765345.0,
    "hostname": "host-a38df12a",
    "reason": "wilson exhausted 4 attempts",
    "ticket_id": "rds_abcb46ab7a66"
  },
  "headers": {
    "content-length": "122",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:55:44 GMT",
    "server": "uvicorn"
  },
  "status": 201.0
}
#66 print >>> [noc] RDS ticket rds_abcb46ab7a66 filed for host-a38df12a — paging humans.
#68 FAILED worker=worker-cb363943-e8d5-4544-959e-0acbf94251c1