Open
Description
Intentionally plugged some very bad SAS hard drives in a 24-bay enclosure.
Noticed some discrepancy regarding smartctl_device_smartctl_exit_status
, which is an important indicator of drive failure:
# smartctl -a -T permissive /dev/sdc -d scsi; echo $?
4
smartctl -a -T permissive /dev/sdd -d scsi; echo $?
0
smartctl -a -T permissive /dev/sde -d scsi; echo $?
0
# smartctl -a -T permissive /dev/sdk -d scsi; echo $?
128
# smartctl -a -T permissive /dev/sdp -d scsi; echo $?
8
# smartctl -a -T permissive /dev/sdq -d scsi; echo $?
8
however:
smartctl_device_smartctl_exit_status{device="sdc"} 0
smartctl_device_smartctl_exit_status{device="sdd"} 0
smartctl_device_smartctl_exit_status{device="sde"} 0
smartctl_device_smartctl_exit_status{device="sdk"} 0
smartctl_device_smartctl_exit_status{device="sdp"} 8
smartctl_device_smartctl_exit_status{device="sdq"} 8
JSON data for/dev/sdc
(drive defect: takes around 60s to respond)
{
"json_format_version": [
1,
0
],
"smartctl": {
"version": [
7,
3
],
"svn_revision": "5338",
"platform_info": "x86_64-linux-6.8.12-4-pve",
"build_info": "(local build)",
"argv": [
"smartctl",
"-a",
"-T",
"permissive",
"-d",
"scsi",
"/dev/sdc",
"--json"
],
"exit_status": 4
},
"local_time": {
"time_t": 1737324399,
"asctime": "Sun Jan 19 19:06:39 2025 -03"
},
"device": {
"name": "/dev/sdc",
"info_name": "/dev/sdc",
"type": "scsi",
"protocol": "SCSI"
},
"scsi_vendor": "SEAGATE",
"scsi_product": "ST3600057SS",
"scsi_model_name": "SEAGATE ST3600057SS",
"scsi_revision": "EN03",
"scsi_version": "SPC-3",
"rotation_rate": 15000,
"form_factor": {
"scsi_value": 2,
"name": "3.5 inches"
},
"logical_unit_id": "0x5000c50053c26987",
"serial_number": "6SL458D5",
"device_type": {
"scsi_terminology": "Peripheral Device Type [PDT]",
"scsi_value": 0,
"name": "disk"
},
"scsi_transport_protocol": {
"name": "SAS (SPL-4)",
"value": 6
},
"smart_support": {
"available": false
},
"temperature": {
"current": 0
},
"scsi_temperature": {
"drive_trip": 0
}
}
JSON data for /dev/sdk
(drive defect: several bad blocks, DST failing)
{
"json_format_version": [
1,
0
],
"smartctl": {
"version": [
7,
3
],
"svn_revision": "5338",
"platform_info": "x86_64-linux-6.8.12-4-pve",
"build_info": "(local build)",
"argv": [
"smartctl",
"-a",
"-T",
"permissive",
"-d",
"scsi",
"/dev/sdk",
"--json"
],
"exit_status": 128
},
"local_time": {
"time_t": 1737324706,
"asctime": "Sun Jan 19 19:11:46 2025 -03"
},
"device": {
"name": "/dev/sdk",
"info_name": "/dev/sdk",
"type": "scsi",
"protocol": "SCSI"
},
"scsi_vendor": "IBM-SSG",
"scsi_product": "S7AQ3P0",
"scsi_model_name": "IBM-SSG S7AQ3P0",
"scsi_revision": "A058",
"scsi_version": "SPC-4",
"user_capacity": {
"blocks": 5860533168,
"bytes": 3000592982016
},
"logical_block_size": 512,
"rotation_rate": 7200,
"form_factor": {
"scsi_value": 2,
"name": "3.5 inches"
},
"logical_unit_id": "0x5000c500349f40f7",
"serial_number": "Z290Q54400009145WCJ4",
"device_type": {
"scsi_terminology": "Peripheral Device Type [PDT]",
"scsi_value": 0,
"name": "disk"
},
"scsi_transport_protocol": {
"name": "SAS (SPL-4)",
"value": 6
},
"smart_support": {
"available": true,
"enabled": true
},
"temperature_warning": {
"enabled": true
},
"smart_status": {
"passed": true
},
"temperature": {
"current": 39,
"drive_trip": 65
},
"power_on_time": {
"hours": 51871,
"minutes": 57
},
"scsi_grown_defect_list": 1239,
"scsi_error_counter_log": {
"read": {
"errors_corrected_by_eccfast": 2545895999,
"errors_corrected_by_eccdelayed": 0,
"errors_corrected_by_rereads_rewrites": 0,
"total_errors_corrected": 2545895999,
"correction_algorithm_invocations": 1,
"gigabytes_processed": "529664.798",
"total_uncorrected_errors": 1
},
"write": {
"errors_corrected_by_eccfast": 0,
"errors_corrected_by_eccdelayed": 0,
"errors_corrected_by_rereads_rewrites": 0,
"total_errors_corrected": 0,
"correction_algorithm_invocations": 0,
"gigabytes_processed": "104245.228",
"total_uncorrected_errors": 0
},
"verify": {
"errors_corrected_by_eccfast": 836386951,
"errors_corrected_by_eccdelayed": 1,
"errors_corrected_by_rereads_rewrites": 0,
"total_errors_corrected": 836386952,
"correction_algorithm_invocations": 1,
"gigabytes_processed": "4497341.609",
"total_uncorrected_errors": 0
}
},
"scsi_self_test_0": {
"code": {
"value": 2,
"string": "Background long"
},
"result": {
"value": 7,
"string": "Failed in segment"
},
"power_on_time": {
"hours": 51543,
"aka": "accumulated_power_on_hours"
},
"lba_first_failure": {
"value": 5165202415,
"aka": "address_of_first_failure"
},
"sense_key": {
"value": 3,
"string": "Medium Error"
},
"asc": 17,
"ascq": 0,
"vendor_specific": 129
},
"scsi_self_test_1": {
"code": {
"value": 2,
"string": "Background long"
},
"result": {
"value": 7,
"string": "Failed in segment"
},
"power_on_time": {
"hours": 51288,
"aka": "accumulated_power_on_hours"
},
"lba_first_failure": {
"value": 5165202415,
"aka": "address_of_first_failure"
},
"sense_key": {
"value": 3,
"string": "Medium Error"
},
"asc": 17,
"ascq": 0,
"vendor_specific": 129
},
"scsi_self_test_2": {
"code": {
"value": 2,
"string": "Background long"
},
"result": {
"value": 2,
"string": "Aborted (device reset ?)"
},
"power_on_time": {
"hours": 50516,
"aka": "accumulated_power_on_hours"
}
},
"scsi_extended_self_test_seconds": 27600
}
JSON data for /dev/sdp
(drive defect: I don't know, available spare sectors depletion maybe?)
{
"json_format_version": [
1,
0
],
"smartctl": {
"version": [
7,
3
],
"svn_revision": "5338",
"platform_info": "x86_64-linux-6.8.12-4-pve",
"build_info": "(local build)",
"argv": [
"smartctl",
"-a",
"-T",
"permissive",
"-d",
"scsi",
"/dev/sdp",
"--json"
],
"exit_status": 8
},
"local_time": {
"time_t": 1737324877,
"asctime": "Sun Jan 19 19:14:37 2025 -03"
},
"device": {
"name": "/dev/sdp",
"info_name": "/dev/sdp",
"type": "scsi",
"protocol": "SCSI"
},
"scsi_vendor": "IBM-SSG",
"scsi_product": "H0YH600",
"scsi_model_name": "IBM-SSG H0YH600",
"scsi_revision": "CF08",
"scsi_version": "SPC-4",
"user_capacity": {
"blocks": 1172123568,
"bytes": 600127266816
},
"logical_block_size": 512,
"scsi_lb_provisioning": {
"name": "fully provisioned",
"value": 0,
"management_enabled": {
"name": "LBPME",
"value": 0
},
"read_zeros": {
"name": "LBPRZ",
"value": 0
}
},
"rotation_rate": 10000,
"form_factor": {
"scsi_value": 3,
"name": "2.5 inches"
},
"logical_unit_id": "0x5000cca07d4e1980",
"serial_number": "0BHBYHXH",
"device_type": {
"scsi_terminology": "Peripheral Device Type [PDT]",
"scsi_value": 0,
"name": "disk"
},
"scsi_transport_protocol": {
"name": "SAS (SPL-4)",
"value": 6
},
"smart_support": {
"available": true,
"enabled": true
},
"temperature_warning": {
"enabled": true
},
"smart_status": {
"passed": false,
"scsi": {
"asc": 93,
"ascq": 100,
"ie_string": "FIRMWARE IMPENDING FAILURE TOO MANY BLOCK REASSIGNS"
}
},
"temperature": {
"current": 32,
"drive_trip": 65
},
"power_on_time": {
"hours": 21975,
"minutes": 22
},
"scsi_start_stop_cycle_counter": {
"year_of_manufacture": "2018",
"week_of_manufacture": "09",
"specified_cycle_count_over_device_lifetime": 50000,
"accumulated_start_stop_cycles": 88,
"specified_load_unload_count_over_device_lifetime": 600000,
"accumulated_load_unload_cycles": 998
},
"scsi_grown_defect_list": 0,
"scsi_error_counter_log": {
"read": {
"errors_corrected_by_eccfast": 0,
"errors_corrected_by_eccdelayed": 221387,
"errors_corrected_by_rereads_rewrites": 0,
"total_errors_corrected": 221387,
"correction_algorithm_invocations": 32499236,
"gigabytes_processed": "5575.751",
"total_uncorrected_errors": 40
},
"write": {
"errors_corrected_by_eccfast": 0,
"errors_corrected_by_eccdelayed": 0,
"errors_corrected_by_rereads_rewrites": 0,
"total_errors_corrected": 0,
"correction_algorithm_invocations": 87410,
"gigabytes_processed": "19893.007",
"total_uncorrected_errors": 0
},
"verify": {
"errors_corrected_by_eccfast": 0,
"errors_corrected_by_eccdelayed": 3795,
"errors_corrected_by_rereads_rewrites": 0,
"total_errors_corrected": 3795,
"correction_algorithm_invocations": 389822872,
"gigabytes_processed": "115152.801",
"total_uncorrected_errors": 0
}
}
}
Metadata
Metadata
Assignees
Labels
No labels