Begin: Running /scripts/init-premount ... done.
...
Begin: Will now check root file system ... fsck from util-linux 2.40.2
[/usr/sbin/fsck.ext4 (1) -- /dev/nvme0n1p1] fsck.ext4 -a -C0 /dev/nvme0n1p1
cloudimg-rootfs: recovering journal
cloudimg-rootfs: Clearing orphaned inode 86387 (uid=0, gid=0, mode=0100644, size=113)
cloudimg-rootfs: clean, 119390/878080 files, 801009/1806587 blocks
done.
[ 2.746978] EXT4-fs (nvme0n1p1): orphan cleanup on readonly fs
[ 2.749154] EXT4-fs error (device nvme0n1p1): ext4_orphan_get:1422: comm mount: bad orphan inode 86387
[ 2.752630] ext4_test_bit(bit=7986, block=278) = 0
[ 2.754377] EXT4-fs (nvme0n1p1): recovery complete
[ 2.756155] EXT4-fs error (device nvme0n1p1): ext4_mark_recovery_complete:6236: comm mount: Orphan file not empty on read-only fs.
[ 2.759987] EXT4-fs (nvme0n1p1): mount failed
mount: mounting /dev/nvme0n1p1 on /root failed: Structure needs cleaning
done.
Begin: Running /scripts/local-bottom ... done.
Begin: Running /scripts/init-bottom ... mount: mounting /dev on /root/dev failed: No such file or directory
mount: mounting /dev on /root/dev failed: No such file or directory
done.
Searching for the disk regions on their corresponding sleds, we see a repair job on BRM42220015 on Aug 18 18:50. There were no obvious errors with this job.
# pilot host exec -c 'grep -h 4ed7e67a-7fa5-46eb-b312-67c647489808 $(/opt/oxide/oxlog/oxlog logs oxz_nexus* nexus --current --archived -A 2025-08-18 -B 2025-08-19) | looker' 8 14 20
INFO 1cfdb5b6-e568-436a-a85f-7fecf1b8eef2 (ServerContext): saga create
dag = {"end_node":9,"graph":{"edge_property":"directed","edges":[[0,1,null],[1,2,null],[2,3,null],[3,4,null],[4,5,null],[5,6,null],[6,7,null],[8,0,null],[7,9,null]],"node_holes":[],"nodes":[{"Action":{"action_name":"common.uuid_generate","label":"GenerateSagaId","name":"saga_id"}},{"Action":{"action_name":"common.uuid_generate","label":"GenerateJobId","name":"job_id"}},{"Action":{"action_name":"region_replacement_drive.set_saga_id","label":"SetSagaId","name":"unused_1"}},{"Action":{"action_name":"region_replacement_drive.drive_region_replacement_check","label":"DriveRegionReplacementCheck","name":"check"}},{"Action":{"action_name":"region_replacement_drive.drive_region_replacement_prepare","label":"DriveRegionReplacementPrepare","name":"prepare"}},{"Action":{"action_name":"region_replacement_drive.drive_region_replacement_execute","label":"DriveRegionReplacementExecute","name":"execute"}},{"Action":{"action_name":"region_replacement_drive.drive_region_replacement_commit","label":"DriveRegionReplacementCommit","name":"commit"}},{"Action":{"action_name":"region_replacement_drive.finish_saga","label":"FinishSaga","name":"unused_2"}},{"Start":{"params":{"request":{"id":"4342f5e1-0690-4cac-bb30-f7b98a857856","new_region_id":"4ed7e67a-7fa5-46eb-b312-67c647489808","old_region_id":"54462a44-99ea-44e2-8743-ee4a369405e6","old_region_volume_id":"be11ed6d-b780-492f-afda-2bd00a1e219b","operating_saga_id":null,"replacement_state":"Running","request_time":"2025-08-18T18:46:01.776498Z","volume_id":"b5e92f40-390e-4d00-a9a4-b25709152250"},"serialized_authn":{"kind":{"Authenticated":[{"actor":{"UserBuiltin":{"user_builtin_id":"001de000-05e4-4000-8000-000000000002"}}},null]}}}}},"End"]},"saga_name":"region-replacement-drive","start_node":8}
file = /home/build/.cargo/registry/src/index.crates.io-1949cf8c6b5b557f/steno-0.4.1/src/sec.rs:1146
saga_id = 00bd8bcd-fcfc-4054-9acf-2e3e68799c73
saga_name = region-replacement-drive
sec_id = 1cfdb5b6-e568-436a-a85f-7fecf1b8eef2
18:50:04.994Z INFO 1cfdb5b6-e568-436a-a85f-7fecf1b8eef2 (ServerContext): saga create
dag = {"end_node":15,"graph":{"edge_property":"directed","edges":[[0,1,null],[1,2,null],[2,3,null],[4,5,null],[4,6,null],[6,7,null],[5,7,null],[7,8,null],[8,9,null],[9,10,null],[10,11,null],[3,4,null],[11,12,null],[12,13,null],[14,0,null],[13,15,null]],"node_holes":[],"nodes":[{"Action":{"action_name":"common.uuid_generate","label":"GenerateSagaId","name":"saga_id"}},{"Action":{"action_name":"region_replacement_finish.set_saga_id","label":"SetSagaId","name":"unused_1"}},{"Constant":{"name":"params_for_volume_delete_subsaga","value":{"serialized_authn":{"kind":{"Authenticated":[{"actor":{"UserBuiltin":{"user_builtin_id":"001de000-05e4-4000-8000-000000000002"}}},null]}},"volume_id":"be11ed6d-b780-492f-afda-2bd00a1e219b"}}},{"SubsagaStart":{"params_node_name":"params_for_volume_delete_subsaga","saga_name":"volume-delete"}},{"Action":{"action_name":"volume_delete.decrease_crucible_resource_count","label":"DecreaseCrucibleResourceCount","name":"crucible_resources_to_delete"}},{"Action":{"action_name":"volume_delete.delete_crucible_regions","label":"DeleteCrucibleRegions","name":"no_result_1"}},{"Action":{"action_name":"volume_delete.delete_crucible_running_snapshots","label":"DeleteCrucibleRunningSnapshots","name":"no_result_2"}},{"Action":{"action_name":"volume_delete.delete_crucible_snapshots","label":"DeleteCrucibleSnapshots","name":"no_result_3"}},{"Action":{"action_name":"volume_delete.delete_crucible_snapshot_records","label":"DeleteCrucibleSnapshotRecords","name":"no_result_4"}},{"Action":{"action_name":"volume_delete.find_freed_crucible_regions","label":"FindFreedCrucibleRegions","name":"freed_crucible_regions"}},{"Action":{"action_name":"volume_delete.delete_freed_crucible_regions","label":"DeleteFreedCrucibleRegions","name":"no_result_5"}},{"Action":{"action_name":"volume_delete.hard_delete_volume_record","label":"HardDeleteVolumeRecord","name":"volume_hard_deleted"}},{"SubsagaEnd":{"name":"volume_delete_subsaga_no_result"}},{"Action":{"action_name":"region_rep
lacement_finish.update_request_record","label":"UpdateRequestRecord","name":"unused_2"}},{"Start":{"params":{"region_volume_id":"be11ed6d-b780-492f-afda-2bd00a1e219b","request":{"id":"4342f5e1-0690-4cac-bb30-f7b98a857856","new_region_id":"4ed7e67a-7fa5-46eb-b312-67c647489808","old_region_id":"54462a44-99ea-44e2-8743-ee4a369405e6","old_region_volume_id":"be11ed6d-b780-492f-afda-2bd00a1e219b","operating_saga_id":null,"replacement_state":"ReplacementDone","request_time":"2025-08-18T18:46:01.776498Z","volume_id":"b5e92f40-390e-4d00-a9a4-b25709152250"},"serialized_authn":{"kind":{"Authenticated":[{"actor":{"UserBuiltin":{"user_builtin_id":"001de000-05e4-4000-8000-000000000002"}}},null]}}}}},"End"]},"saga_name":"region-replacement-finish","start_node":14}
file = /home/build/.cargo/registry/src/index.crates.io-1949cf8c6b5b557f/steno-0.4.1/src/sec.rs:1146
saga_id = dc873936-3647-4d72-a780-bd1677c3008b
saga_name = region-replacement-finish
sec_id = 1cfdb5b6-e568-436a-a85f-7fecf1b8eef2
Checking for outstanding replacements, we don't see any that appear to be associated with this disk:
Expanded saga details
Saga DAG:
{
"end_node": 9,
"graph": {
"edge_property": "directed",
"edges": [
[
0,
1,
null
],
[
1,
2,
null
],
[
2,
3,
null
],
[
3,
4,
null
],
[
4,
5,
null
],
[
5,
6,
null
],
[
6,
7,
null
],
[
8,
0,
null
],
[
7,
9,
null
]
],
"node_holes": [],
"nodes": [
{
"Action": {
"action_name": "common.uuid_generate",
"label": "GenerateSagaId",
"name": "saga_id"
}
},
{
"Action": {
"action_name": "common.uuid_generate",
"label": "GenerateJobId",
"name": "job_id"
}
},
{
"Action": {
"action_name": "region_replacement_drive.set_saga_id",
"label": "SetSagaId",
"name": "unused_1"
}
},
{
"Action": {
"action_name": "region_replacement_drive.drive_region_replacement_check",
"label": "DriveRegionReplacementCheck",
"name": "check"
}
},
{
"Action": {
"action_name": "region_replacement_drive.drive_region_replacement_prepare",
"label": "DriveRegionReplacementPrepare",
"name": "prepare"
}
},
{
"Action": {
"action_name": "region_replacement_drive.drive_region_replacement_execute",
"label": "DriveRegionReplacementExecute",
"name": "execute"
}
},
{
"Action": {
"action_name": "region_replacement_drive.drive_region_replacement_commit",
"label": "DriveRegionReplacementCommit",
"name": "commit"
}
},
{
"Action": {
"action_name": "region_replacement_drive.finish_saga",
"label": "FinishSaga",
"name": "unused_2"
}
},
{
"Start": {
"params": {
"request": {
"id": "4342f5e1-0690-4cac-bb30-f7b98a857856",
"new_region_id": "4ed7e67a-7fa5-46eb-b312-67c647489808",
"old_region_id": "54462a44-99ea-44e2-8743-ee4a369405e6",
"old_region_volume_id": "be11ed6d-b780-492f-afda-2bd00a1e219b",
"operating_saga_id": null,
"replacement_state": "Running",
"request_time": "2025-08-18T18:46:01.776498Z",
"volume_id": "b5e92f40-390e-4d00-a9a4-b25709152250"
},
"serialized_authn": {
"kind": {
"Authenticated": [
{
"actor": {
"UserBuiltin": {
"user_builtin_id": "001de000-05e4-4000-8000-000000000002"
}
}
},
null
]
}
}
}
}
},
"End"
]
},
"saga_name": "region-replacement-drive",
"start_node": 8
}
Saga finish DAG:
{
"end_node": 15,
"graph": {
"edge_property": "directed",
"edges": [
[
0,
1,
null
],
[
1,
2,
null
],
[
2,
3,
null
],
[
4,
5,
null
],
[
4,
6,
null
],
[
6,
7,
null
],
[
5,
7,
null
],
[
7,
8,
null
],
[
8,
9,
null
],
[
9,
10,
null
],
[
10,
11,
null
],
[
3,
4,
null
],
[
11,
12,
null
],
[
12,
13,
null
],
[
14,
0,
null
],
[
13,
15,
null
]
],
"node_holes": [],
"nodes": [
{
"Action": {
"action_name": "common.uuid_generate",
"label": "GenerateSagaId",
"name": "saga_id"
}
},
{
"Action": {
"action_name": "region_replacement_finish.set_saga_id",
"label": "SetSagaId",
"name": "unused_1"
}
},
{
"Constant": {
"name": "params_for_volume_delete_subsaga",
"value": {
"serialized_authn": {
"kind": {
"Authenticated": [
{
"actor": {
"UserBuiltin": {
"user_builtin_id": "001de000-05e4-4000-8000-000000000002"
}
}
},
null
]
}
},
"volume_id": "be11ed6d-b780-492f-afda-2bd00a1e219b"
}
}
},
{
"SubsagaStart": {
"params_node_name": "params_for_volume_delete_subsaga",
"saga_name": "volume-delete"
}
},
{
"Action": {
"action_name": "volume_delete.decrease_crucible_resource_count",
"label": "DecreaseCrucibleResourceCount",
"name": "crucible_resources_to_delete"
}
},
{
"Action": {
"action_name": "volume_delete.delete_crucible_regions",
"label": "DeleteCrucibleRegions",
"name": "no_result_1"
}
},
{
"Action": {
"action_name": "volume_delete.delete_crucible_running_snapshots",
"label": "DeleteCrucibleRunningSnapshots",
"name": "no_result_2"
}
},
{
"Action": {
"action_name": "volume_delete.delete_crucible_snapshots",
"label": "DeleteCrucibleSnapshots",
"name": "no_result_3"
}
},
{
"Action": {
"action_name": "volume_delete.delete_crucible_snapshot_records",
"label": "DeleteCrucibleSnapshotRecords",
"name": "no_result_4"
}
},
{
"Action": {
"action_name": "volume_delete.find_freed_crucible_regions",
"label": "FindFreedCrucibleRegions",
"name": "freed_crucible_regions"
}
},
{
"Action": {
"action_name": "volume_delete.delete_freed_crucible_regions",
"label": "DeleteFreedCrucibleRegions",
"name": "no_result_5"
}
},
{
"Action": {
"action_name": "volume_delete.hard_delete_volume_record",
"label": "HardDeleteVolumeRecord",
"name": "volume_hard_deleted"
}
},
{
"SubsagaEnd": {
"name": "volume_delete_subsaga_no_result"
}
},
{
"Action": {
"action_name": "region_replacement_finish.update_request_record",
"label": "UpdateRequestRecord",
"name": "unused_2"
}
},
{
"Start": {
"params": {
"region_volume_id": "be11ed6d-b780-492f-afda-2bd00a1e219b",
"request": {
"id": "4342f5e1-0690-4cac-bb30-f7b98a857856",
"new_region_id": "4ed7e67a-7fa5-46eb-b312-67c647489808",
"old_region_id": "54462a44-99ea-44e2-8743-ee4a369405e6",
"old_region_volume_id": "be11ed6d-b780-492f-afda-2bd00a1e219b",
"operating_saga_id": null,
"replacement_state": "ReplacementDone",
"request_time": "2025-08-18T18:46:01.776498Z",
"volume_id": "b5e92f40-390e-4d00-a9a4-b25709152250"
},
"serialized_authn": {
"kind": {
"Authenticated": [
{
"actor": {
"UserBuiltin": {
"user_builtin_id": "001de000-05e4-4000-8000-000000000002"
}
}
},
null
]
}
}
}
}
},
"End"
]
},
"saga_name": "region-replacement-finish",
"start_node": 14
}
A preview-silo user on colo reported that instance 5d62dadc-09a6-427b-8a4b-c7f1d4585a2a became corrupted at some point between 2025-08-12 and 2025-08-20 while the instance was idle. This appears to have been caused by a region replacement that occurred on 2025-08-18 when two sleds were expunged from the rack.

The instance spontaneously rebooted and reported a failed fsck:

Instance details:
Disk details:
Searching for the disk regions on their corresponding sleds, we see a repair job on BRM42220015 on Aug 18 18:50. There were no obvious errors with this job.
From /pool/ext/7e67cb32-0c00-4090-9647-eb7bae75deeb/crypt/debug/oxz_crucible_b990911b-805a-4f9d-bd83-e977f5b19a35/oxide-crucible-downstairs:downstairs-4ed7e67a-7fa5-46eb-b312-67c647489808.log.1755543004:

One of the downstairs for this disk appears to have been hosted on BRM42220001 or BRM44220002, which were expunged from the colo rack on 2025-08-18.

We see a corresponding saga in the Nexus logs:
Both sagas succeeded:
Checking for outstanding replacements, we don't see any that appear to be associated with this disk:
Nor do we see any incomplete region replacements:
Expanded saga details
Saga DAG:
{ "end_node": 9, "graph": { "edge_property": "directed", "edges": [ [ 0, 1, null ], [ 1, 2, null ], [ 2, 3, null ], [ 3, 4, null ], [ 4, 5, null ], [ 5, 6, null ], [ 6, 7, null ], [ 8, 0, null ], [ 7, 9, null ] ], "node_holes": [], "nodes": [ { "Action": { "action_name": "common.uuid_generate", "label": "GenerateSagaId", "name": "saga_id" } }, { "Action": { "action_name": "common.uuid_generate", "label": "GenerateJobId", "name": "job_id" } }, { "Action": { "action_name": "region_replacement_drive.set_saga_id", "label": "SetSagaId", "name": "unused_1" } }, { "Action": { "action_name": "region_replacement_drive.drive_region_replacement_check", "label": "DriveRegionReplacementCheck", "name": "check" } }, { "Action": { "action_name": "region_replacement_drive.drive_region_replacement_prepare", "label": "DriveRegionReplacementPrepare", "name": "prepare" } }, { "Action": { "action_name": "region_replacement_drive.drive_region_replacement_execute", "label": "DriveRegionReplacementExecute", "name": "execute" } }, { "Action": { "action_name": "region_replacement_drive.drive_region_replacement_commit", "label": "DriveRegionReplacementCommit", "name": "commit" } }, { "Action": { "action_name": "region_replacement_drive.finish_saga", "label": "FinishSaga", "name": "unused_2" } }, { "Start": { "params": { "request": { "id": "4342f5e1-0690-4cac-bb30-f7b98a857856", "new_region_id": "4ed7e67a-7fa5-46eb-b312-67c647489808", "old_region_id": "54462a44-99ea-44e2-8743-ee4a369405e6", "old_region_volume_id": "be11ed6d-b780-492f-afda-2bd00a1e219b", "operating_saga_id": null, "replacement_state": "Running", "request_time": "2025-08-18T18:46:01.776498Z", "volume_id": "b5e92f40-390e-4d00-a9a4-b25709152250" }, "serialized_authn": { "kind": { "Authenticated": [ { "actor": { "UserBuiltin": { "user_builtin_id": "001de000-05e4-4000-8000-000000000002" } } }, null ] } } } } }, "End" ] }, "saga_name": "region-replacement-drive", "start_node": 8 }
Saga finish DAG:
{ "end_node": 15, "graph": { "edge_property": "directed", "edges": [ [ 0, 1, null ], [ 1, 2, null ], [ 2, 3, null ], [ 4, 5, null ], [ 4, 6, null ], [ 6, 7, null ], [ 5, 7, null ], [ 7, 8, null ], [ 8, 9, null ], [ 9, 10, null ], [ 10, 11, null ], [ 3, 4, null ], [ 11, 12, null ], [ 12, 13, null ], [ 14, 0, null ], [ 13, 15, null ] ], "node_holes": [], "nodes": [ { "Action": { "action_name": "common.uuid_generate", "label": "GenerateSagaId", "name": "saga_id" } }, { "Action": { "action_name": "region_replacement_finish.set_saga_id", "label": "SetSagaId", "name": "unused_1" } }, { "Constant": { "name": "params_for_volume_delete_subsaga", "value": { "serialized_authn": { "kind": { "Authenticated": [ { "actor": { "UserBuiltin": { "user_builtin_id": "001de000-05e4-4000-8000-000000000002" } } }, null ] } }, "volume_id": "be11ed6d-b780-492f-afda-2bd00a1e219b" } } }, { "SubsagaStart": { "params_node_name": "params_for_volume_delete_subsaga", "saga_name": "volume-delete" } }, { "Action": { "action_name": "volume_delete.decrease_crucible_resource_count", "label": "DecreaseCrucibleResourceCount", "name": "crucible_resources_to_delete" } }, { "Action": { "action_name": "volume_delete.delete_crucible_regions", "label": "DeleteCrucibleRegions", "name": "no_result_1" } }, { "Action": { "action_name": "volume_delete.delete_crucible_running_snapshots", "label": "DeleteCrucibleRunningSnapshots", "name": "no_result_2" } }, { "Action": { "action_name": "volume_delete.delete_crucible_snapshots", "label": "DeleteCrucibleSnapshots", "name": "no_result_3" } }, { "Action": { "action_name": "volume_delete.delete_crucible_snapshot_records", "label": "DeleteCrucibleSnapshotRecords", "name": "no_result_4" } }, { "Action": { "action_name": "volume_delete.find_freed_crucible_regions", "label": "FindFreedCrucibleRegions", "name": "freed_crucible_regions" } }, { "Action": { "action_name": "volume_delete.delete_freed_crucible_regions", "label": "DeleteFreedCrucibleRegions", "name": "no_result_5" } 
}, { "Action": { "action_name": "volume_delete.hard_delete_volume_record", "label": "HardDeleteVolumeRecord", "name": "volume_hard_deleted" } }, { "SubsagaEnd": { "name": "volume_delete_subsaga_no_result" } }, { "Action": { "action_name": "region_replacement_finish.update_request_record", "label": "UpdateRequestRecord", "name": "unused_2" } }, { "Start": { "params": { "region_volume_id": "be11ed6d-b780-492f-afda-2bd00a1e219b", "request": { "id": "4342f5e1-0690-4cac-bb30-f7b98a857856", "new_region_id": "4ed7e67a-7fa5-46eb-b312-67c647489808", "old_region_id": "54462a44-99ea-44e2-8743-ee4a369405e6", "old_region_volume_id": "be11ed6d-b780-492f-afda-2bd00a1e219b", "operating_saga_id": null, "replacement_state": "ReplacementDone", "request_time": "2025-08-18T18:46:01.776498Z", "volume_id": "b5e92f40-390e-4d00-a9a4-b25709152250" }, "serialized_authn": { "kind": { "Authenticated": [ { "actor": { "UserBuiltin": { "user_builtin_id": "001de000-05e4-4000-8000-000000000002" } } }, null ] } } } } }, "End" ] }, "saga_name": "region-replacement-finish", "start_node": 14 }