← console

job fad3944b-3143-492c-936c-1b207ef6e865

StateFAILED
Quotaservitor-demo
Manifestadabffc64cc3874a33dd5b5290dd808bc43e29b652e811e86e9eb96d3700d50b
Entry overridetirefireind.us/flowmetal-servitor/reinstall-host/reinstall
Workerworker-cb363943-e8d5-4544-959e-0acbf94251c1
Inbox HWM0
ErrorTraceback (most recent call last): File <builtin>, in <module> * main.star:119, in _reinstall_impl fail("escalated host %s to RDS for repair" % hostname) error: escalated host host-632a20b0 to RDS for repair --> main.star:119:5 | 119 | fail("escalated host %s to RDS for repair" % hostname) | ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ |

Log

#0 print >>> [noc] pulling next host record off laskey…
#2 req 1 connector:http
{
  "method": "GET",
  "url": "http://laskey.flowmetal.svc.cluster.local:8080/hosts/next"
}
#3 req 1 ok
{
  "body": {
    "config": {
      "disk_layout": "md-raid10",
      "os": "flatcar-stable",
      "profile": "api-worker",
      "rack": "rack-b1"
    },
    "hostname": "host-632a20b0"
  },
  "headers": {
    "content-length": "127",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:44:00 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#4 print >>> [noc] target host host-632a20b0 (flatcar-stable / api-worker / md-raid10) — handing off to wilson.
#6 print >>> [noc] attempt 1/4: kicking off reinstall of host-632a20b0.
#8 req 4 connector:http
{
  "body_json": {
    "config": {
      "disk_layout": "md-raid10",
      "os": "flatcar-stable",
      "profile": "api-worker",
      "rack": "rack-b1"
    },
    "hostname": "host-632a20b0"
  },
  "method": "POST",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall"
}
#9 req 4 ok
{
  "body": {
    "hostname": "host-632a20b0",
    "reinstall_id": "ri_2496f0f9292e"
  },
  "headers": {
    "content-length": "61",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:44:10 GMT",
    "server": "uvicorn"
  },
  "status": 202.0
}
#10 req 5 sleep deadline=1776764663.277071638 duration=2s
#11 req 5 ok
null
#12 req 6 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_2496f0f9292e"
}
#13 req 6 ok
{
  "body": {
    "error_kind": "wilson_forgot",
    "hostname": "host-632a20b0",
    "message": "wilson forgot this reinstall ever happened",
    "reinstall_id": "ri_2496f0f9292e",
    "retryable": true,
    "status": "forgotten"
  },
  "headers": {
    "content-length": "183",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:44:23 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#14 print >>> [noc] attempt 1: wilson claims it never heard of ri_2496f0f9292e. classic.
#16 print >>> [noc] attempt 2/4: kicking off reinstall of host-632a20b0.
#18 req 9 connector:http
{
  "body_json": {
    "config": {
      "disk_layout": "md-raid10",
      "os": "flatcar-stable",
      "profile": "api-worker",
      "rack": "rack-b1"
    },
    "hostname": "host-632a20b0"
  },
  "method": "POST",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall"
}
#19 req 9 ok
{
  "body": {
    "hostname": "host-632a20b0",
    "reinstall_id": "ri_b26b0d4cdbc5"
  },
  "headers": {
    "content-length": "61",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:44:33 GMT",
    "server": "uvicorn"
  },
  "status": 202.0
}
#20 req 10 sleep deadline=1776764683.013600678 duration=2s
#21 req 10 ok
null
#22 req 11 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_b26b0d4cdbc5"
}
#23 req 11 ok
{
  "body": {
    "error_kind": "wilson_forgot",
    "hostname": "host-632a20b0",
    "message": "wilson forgot this reinstall ever happened",
    "reinstall_id": "ri_b26b0d4cdbc5",
    "retryable": true,
    "status": "forgotten"
  },
  "headers": {
    "content-length": "183",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:44:43 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#24 print >>> [noc] attempt 2: wilson claims it never heard of ri_b26b0d4cdbc5. classic.
#26 print >>> [noc] attempt 3/4: kicking off reinstall of host-632a20b0.
#28 req 14 connector:http
{
  "body_json": {
    "config": {
      "disk_layout": "md-raid10",
      "os": "flatcar-stable",
      "profile": "api-worker",
      "rack": "rack-b1"
    },
    "hostname": "host-632a20b0"
  },
  "method": "POST",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall"
}
#29 req 14 ok
{
  "body": {
    "hostname": "host-632a20b0",
    "reinstall_id": "ri_34502a4bfb57"
  },
  "headers": {
    "content-length": "61",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:44:51 GMT",
    "server": "uvicorn"
  },
  "status": 202.0
}
#30 req 15 sleep deadline=1776764701.056203549 duration=2s
#31 req 15 ok
null
#32 req 16 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_34502a4bfb57"
}
#33 req 16 ok
{
  "body": {
    "eta_seconds": 5.02,
    "hostname": "host-632a20b0",
    "reinstall_id": "ri_34502a4bfb57",
    "status": "pending"
  },
  "headers": {
    "content-length": "99",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:45:01 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#34 req 17 sleep deadline=1776764704.940776671 duration=2s
#35 req 17 ok
null
#36 req 18 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_34502a4bfb57"
}
#37 req 18 ok
{
  "body": {
    "eta_seconds": 0.97,
    "hostname": "host-632a20b0",
    "reinstall_id": "ri_34502a4bfb57",
    "status": "pending"
  },
  "headers": {
    "content-length": "99",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:45:05 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#38 req 19 sleep deadline=1776764714.173990257 duration=2s
#39 req 19 ok
null
#40 req 20 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_34502a4bfb57"
}
#41 req 20 ok
{
  "body": {
    "error_kind": "reinstall_broken",
    "hostname": "host-632a20b0",
    "message": "reinstall broke partway through",
    "reinstall_id": "ri_34502a4bfb57",
    "retryable": true,
    "status": "failed"
  },
  "headers": {
    "content-length": "172",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:45:14 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#42 print >>> [noc] attempt 3 failed (reinstall_broken); looping back to wilson.
#44 print >>> [noc] attempt 4/4: kicking off reinstall of host-632a20b0.
#46 req 23 connector:http
{
  "body_json": {
    "config": {
      "disk_layout": "md-raid10",
      "os": "flatcar-stable",
      "profile": "api-worker",
      "rack": "rack-b1"
    },
    "hostname": "host-632a20b0"
  },
  "method": "POST",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall"
}
#47 req 23 ok
{
  "body": {
    "hostname": "host-632a20b0",
    "reinstall_id": "ri_aeced82f3f51"
  },
  "headers": {
    "content-length": "61",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:45:16 GMT",
    "server": "uvicorn"
  },
  "status": 202.0
}
#48 req 24 sleep deadline=1776764722.930637834 duration=2s
#49 req 24 ok
null
#50 req 25 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_aeced82f3f51"
}
#51 req 25 ok
{
  "body": {
    "eta_seconds": 3.0,
    "hostname": "host-632a20b0",
    "reinstall_id": "ri_aeced82f3f51",
    "status": "pending"
  },
  "headers": {
    "content-length": "98",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:45:23 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#52 req 26 sleep deadline=1776764734.147652974 duration=2s
#53 req 26 ok
null
#54 req 27 connector:http
{
  "method": "GET",
  "url": "http://wilson.flowmetal.svc.cluster.local:8080/reinstall/ri_aeced82f3f51"
}
#55 req 27 ok
{
  "body": {
    "error_kind": "wilson_forgot",
    "hostname": "host-632a20b0",
    "message": "wilson forgot this reinstall ever happened",
    "reinstall_id": "ri_aeced82f3f51",
    "retryable": true,
    "status": "forgotten"
  },
  "headers": {
    "content-length": "183",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:45:34 GMT",
    "server": "uvicorn"
  },
  "status": 200.0
}
#56 print >>> [noc] attempt 4: wilson claims it never heard of ri_aeced82f3f51. classic.
#58 print >>> [noc] escalating host-632a20b0 to RDS: wilson exhausted 4 attempts.
#60 req 30 connector:http
{
  "body_json": {
    "hostname": "host-632a20b0",
    "reason": "wilson exhausted 4 attempts"
  },
  "method": "POST",
  "url": "http://rds.flowmetal.svc.cluster.local:8080/tickets"
}
#61 req 30 ok
{
  "body": {
    "created_at": 1776764750.0,
    "hostname": "host-632a20b0",
    "reason": "wilson exhausted 4 attempts",
    "ticket_id": "rds_17e6ad02d3e8"
  },
  "headers": {
    "content-length": "122",
    "content-type": "application/json",
    "date": "Tue, 21 Apr 2026 09:45:49 GMT",
    "server": "uvicorn"
  },
  "status": 201.0
}
#62 print >>> [noc] RDS ticket rds_17e6ad02d3e8 filed for host-632a20b0 — paging humans.
#64 FAILED worker=worker-cb363943-e8d5-4544-959e-0acbf94251c1