On 2019-01-30 16:00:18, Martín Ferrari wrote: > Hi Antoine, > > On 29/01/2019 17:50, Antoine Beaupre wrote: > >> I started seeing this in my logs on buster recently: >> >> jan 29 12:48:02 curie prometheus-node-exporter[940]: >> time="2019-01-29T12:48:02-05:00" level=error msg="Error parsing >> \"/var/lib/prometheus/node-exporter/smartmon.prom\": text format parsing >> error in line 54: unknown metric type \"type is not sat, scsi or megaraid >> but usbsunplus gauge\"" source="textfile.go:211" > >> It's strange because "line 54" of that file is: >> >> smartmon_end_to_end_error_threshold{disk="/dev/sdb",type="sat",smart_id="184"} >> 0 >> >> and type *is* "sat, scsi or megaraid" (it's "sat") and most definitely >> not "usbsunplus". What's going on here? > > > That's weird... But I'd bet the error refers to another line in that > file. After all, node-exporter has no idea of sat, scsi, or megaraid. I > think that must be some text in the file. Could you send the contents of it?
Sure, attached. -- La dictature c'est ferme ta gueule. La démocratie c'est cause toujours! - Jean-Louis Barrault
# HELP smartmon_smartctl_version SMART metric smartctl_version # TYPE smartmon_smartctl_version gauge smartmon_smartctl_version{version="6.6"} 1 # HELP smartmon_command_timeout_raw_value SMART metric command_timeout_raw_value # TYPE smartmon_command_timeout_raw_value gauge smartmon_command_timeout_raw_value{disk="/dev/sdb",type="sat",smart_id="188"} 0.000000e+00 # HELP smartmon_command_timeout_threshold SMART metric command_timeout_threshold # TYPE smartmon_command_timeout_threshold gauge smartmon_command_timeout_threshold{disk="/dev/sdb",type="sat",smart_id="188"} 0 # HELP smartmon_command_timeout_value SMART metric command_timeout_value # TYPE smartmon_command_timeout_value gauge smartmon_command_timeout_value{disk="/dev/sdb",type="sat",smart_id="188"} 100 # HELP smartmon_command_timeout_worst SMART metric command_timeout_worst # TYPE smartmon_command_timeout_worst gauge smartmon_command_timeout_worst{disk="/dev/sdb",type="sat",smart_id="188"} 100 # HELP smartmon_current_pending_sector_raw_value SMART metric current_pending_sector_raw_value # TYPE smartmon_current_pending_sector_raw_value gauge smartmon_current_pending_sector_raw_value{disk="/dev/sda",type="sat",smart_id="197"} 0.000000e+00 # HELP smartmon_current_pending_sector_threshold SMART metric current_pending_sector_threshold # TYPE smartmon_current_pending_sector_threshold gauge smartmon_current_pending_sector_threshold{disk="/dev/sda",type="sat",smart_id="197"} 0 # HELP smartmon_current_pending_sector_value SMART metric current_pending_sector_value # TYPE smartmon_current_pending_sector_value gauge smartmon_current_pending_sector_value{disk="/dev/sda",type="sat",smart_id="197"} 100 # HELP smartmon_current_pending_sector_worst SMART metric current_pending_sector_worst # TYPE smartmon_current_pending_sector_worst gauge smartmon_current_pending_sector_worst{disk="/dev/sda",type="sat",smart_id="197"} 100 # HELP smartmon_device_active SMART metric device_active # TYPE smartmon_device_active gauge 
smartmon_device_active{disk="/dev/sda",type="sat"} 1 smartmon_device_active{disk="/dev/sdb",type="sat"} 1 # HELP smartmon_device_info SMART metric device_info # TYPE smartmon_device_info gauge smartmon_device_info{disk="/dev/sda",type="sat",vendor="",product="",revision="",lun_id="",model_family="Western Digital Black Mobile",device_model="WDC WD10JPLX-00MBPT0",serial_number="[REDACTED]",firmware_version="01.01H01"} 1 smartmon_device_info{disk="/dev/sdb",type="sat",vendor="",product="",revision="",lun_id="",model_family="WD Blue PC SSD",device_model="WDC WDS500G1B0B-00AS40",serial_number="[REDACTED]",firmware_version="X41000WD"} 1 # HELP smartmon_device_smart_available SMART metric device_smart_available # TYPE smartmon_device_smart_available gauge smartmon_device_smart_available{disk="/dev/sda",type="sat"} 1 smartmon_device_smart_available{disk="/dev/sdb",type="sat"} 1 # HELP smartmon_device_smart_enabled SMART metric device_smart_enabled # TYPE smartmon_device_smart_enabled gauge smartmon_device_smart_enabled{disk="/dev/sda",type="sat"} 1 smartmon_device_smart_enabled{disk="/dev/sdb",type="sat"} 1 # HELP smartmon_device_smart_healthy SMART metric device_smart_healthy # TYPE smartmon_device_smart_healthy gauge smartmon_device_smart_healthy{disk="/dev/sda",type="sat"} 1 smartmon_device_smart_healthy{disk="/dev/sdb",type="sat"} 1 # HELP smartmon_end_to_end_error_raw_value SMART metric end_to_end_error_raw_value # TYPE smartmon_end_to_end_error_raw_value gauge smartmon_end_to_end_error_raw_value{disk="/dev/sdb",type="sat",smart_id="184"} 0.000000e+00 # HELP smartmon_end_to_end_error_threshold SMART metric end_to_end_error_threshold # TYPE smartmon_end_to_end_error_threshold gauge smartmon_end_to_end_error_threshold{disk="/dev/sdb",type="sat",smart_id="184"} 0 # HELP smartmon_end_to_end_error_value SMART metric end_to_end_error_value # TYPE smartmon_end_to_end_error_value gauge smartmon_end_to_end_error_value{disk="/dev/sdb",type="sat",smart_id="184"} 100 # HELP 
smartmon_end_to_end_error_worst SMART metric end_to_end_error_worst # TYPE smartmon_end_to_end_error_worst gauge smartmon_end_to_end_error_worst{disk="/dev/sdb",type="sat",smart_id="184"} 100 # HELP smartmon_erase_fail_count_raw_value SMART metric erase_fail_count_raw_value # TYPE smartmon_erase_fail_count_raw_value gauge smartmon_erase_fail_count_raw_value{disk="/dev/sdb",type="sat",smart_id="172"} 0.000000e+00 # HELP smartmon_erase_fail_count_threshold SMART metric erase_fail_count_threshold # TYPE smartmon_erase_fail_count_threshold gauge smartmon_erase_fail_count_threshold{disk="/dev/sdb",type="sat",smart_id="172"} 0 # HELP smartmon_erase_fail_count_value SMART metric erase_fail_count_value # TYPE smartmon_erase_fail_count_value gauge smartmon_erase_fail_count_value{disk="/dev/sdb",type="sat",smart_id="172"} 100 # HELP smartmon_erase_fail_count_worst SMART metric erase_fail_count_worst # TYPE smartmon_erase_fail_count_worst gauge smartmon_erase_fail_count_worst{disk="/dev/sdb",type="sat",smart_id="172"} 100 # HELP smartmon_g_sense_error_rate_raw_value SMART metric g_sense_error_rate_raw_value # TYPE smartmon_g_sense_error_rate_raw_value gauge smartmon_g_sense_error_rate_raw_value{disk="/dev/sda",type="sat",smart_id="191"} 0.000000e+00 # HELP smartmon_g_sense_error_rate_threshold SMART metric g_sense_error_rate_threshold # TYPE smartmon_g_sense_error_rate_threshold gauge smartmon_g_sense_error_rate_threshold{disk="/dev/sda",type="sat",smart_id="191"} 0 # HELP smartmon_g_sense_error_rate_value SMART metric g_sense_error_rate_value # TYPE smartmon_g_sense_error_rate_value gauge smartmon_g_sense_error_rate_value{disk="/dev/sda",type="sat",smart_id="191"} 100 # HELP smartmon_g_sense_error_rate_worst SMART metric g_sense_error_rate_worst # TYPE smartmon_g_sense_error_rate_worst gauge smartmon_g_sense_error_rate_worst{disk="/dev/sda",type="sat",smart_id="191"} 100 # HELP smartmon_load_cycle_count_raw_value SMART metric load_cycle_count_raw_value # TYPE 
smartmon_load_cycle_count_raw_value gauge smartmon_load_cycle_count_raw_value{disk="/dev/sda",type="sat",smart_id="193"} 7.670000e+02 # HELP smartmon_load_cycle_count_threshold SMART metric load_cycle_count_threshold # TYPE smartmon_load_cycle_count_threshold gauge smartmon_load_cycle_count_threshold{disk="/dev/sda",type="sat",smart_id="193"} 0 # HELP smartmon_load_cycle_count_value SMART metric load_cycle_count_value # TYPE smartmon_load_cycle_count_value gauge smartmon_load_cycle_count_value{disk="/dev/sda",type="sat",smart_id="193"} 100 # HELP smartmon_load_cycle_count_worst SMART metric load_cycle_count_worst # TYPE smartmon_load_cycle_count_worst gauge smartmon_load_cycle_count_worst{disk="/dev/sda",type="sat",smart_id="193"} 100 # HELP smartmon_media_wearout_indicator_raw_value SMART metric media_wearout_indicator_raw_value # TYPE smartmon_media_wearout_indicator_raw_value gauge smartmon_media_wearout_indicator_raw_value{disk="/dev/sdb",type="sat",smart_id="230"} 0.000000e+00 # HELP smartmon_media_wearout_indicator_threshold SMART metric media_wearout_indicator_threshold # TYPE smartmon_media_wearout_indicator_threshold gauge smartmon_media_wearout_indicator_threshold{disk="/dev/sdb",type="sat",smart_id="230"} 0 # HELP smartmon_media_wearout_indicator_value SMART metric media_wearout_indicator_value # TYPE smartmon_media_wearout_indicator_value gauge smartmon_media_wearout_indicator_value{disk="/dev/sdb",type="sat",smart_id="230"} 100 # HELP smartmon_media_wearout_indicator_worst SMART metric media_wearout_indicator_worst # TYPE smartmon_media_wearout_indicator_worst gauge smartmon_media_wearout_indicator_worst{disk="/dev/sdb",type="sat",smart_id="230"} 100 # HELP smartmon_offline_uncorrectable_raw_value SMART metric offline_uncorrectable_raw_value # TYPE smartmon_offline_uncorrectable_raw_value gauge smartmon_offline_uncorrectable_raw_value{disk="/dev/sda",type="sat",smart_id="198"} 0.000000e+00 # HELP smartmon_offline_uncorrectable_threshold SMART metric 
offline_uncorrectable_threshold # TYPE smartmon_offline_uncorrectable_threshold gauge smartmon_offline_uncorrectable_threshold{disk="/dev/sda",type="sat",smart_id="198"} 0 # HELP smartmon_offline_uncorrectable_value SMART metric offline_uncorrectable_value # TYPE smartmon_offline_uncorrectable_value gauge smartmon_offline_uncorrectable_value{disk="/dev/sda",type="sat",smart_id="198"} 100 # HELP smartmon_offline_uncorrectable_worst SMART metric offline_uncorrectable_worst # TYPE smartmon_offline_uncorrectable_worst gauge smartmon_offline_uncorrectable_worst{disk="/dev/sda",type="sat",smart_id="198"} 100 # HELP smartmon_power_cycle_count_raw_value SMART metric power_cycle_count_raw_value # TYPE smartmon_power_cycle_count_raw_value gauge smartmon_power_cycle_count_raw_value{disk="/dev/sda",type="sat",smart_id="12"} 2.170000e+02 smartmon_power_cycle_count_raw_value{disk="/dev/sdb",type="sat",smart_id="12"} 3.240000e+02 # HELP smartmon_power_cycle_count_threshold SMART metric power_cycle_count_threshold # TYPE smartmon_power_cycle_count_threshold gauge smartmon_power_cycle_count_threshold{disk="/dev/sda",type="sat",smart_id="12"} 0 smartmon_power_cycle_count_threshold{disk="/dev/sdb",type="sat",smart_id="12"} 0 # HELP smartmon_power_cycle_count_value SMART metric power_cycle_count_value # TYPE smartmon_power_cycle_count_value gauge smartmon_power_cycle_count_value{disk="/dev/sda",type="sat",smart_id="12"} 100 smartmon_power_cycle_count_value{disk="/dev/sdb",type="sat",smart_id="12"} 100 # HELP smartmon_power_cycle_count_worst SMART metric power_cycle_count_worst # TYPE smartmon_power_cycle_count_worst gauge smartmon_power_cycle_count_worst{disk="/dev/sda",type="sat",smart_id="12"} 100 smartmon_power_cycle_count_worst{disk="/dev/sdb",type="sat",smart_id="12"} 100 # HELP smartmon_power_on_hours_raw_value SMART metric power_on_hours_raw_value # TYPE smartmon_power_on_hours_raw_value gauge smartmon_power_on_hours_raw_value{disk="/dev/sda",type="sat",smart_id="9"} 
5.280000e+03 smartmon_power_on_hours_raw_value{disk="/dev/sdb",type="sat",smart_id="9"} 1.419400e+04 # HELP smartmon_power_on_hours_threshold SMART metric power_on_hours_threshold # TYPE smartmon_power_on_hours_threshold gauge smartmon_power_on_hours_threshold{disk="/dev/sda",type="sat",smart_id="9"} 0 smartmon_power_on_hours_threshold{disk="/dev/sdb",type="sat",smart_id="9"} 0 # HELP smartmon_power_on_hours_value SMART metric power_on_hours_value # TYPE smartmon_power_on_hours_value gauge smartmon_power_on_hours_value{disk="/dev/sda",type="sat",smart_id="9"} 88 smartmon_power_on_hours_value{disk="/dev/sdb",type="sat",smart_id="9"} 100 # HELP smartmon_power_on_hours_worst SMART metric power_on_hours_worst # TYPE smartmon_power_on_hours_worst gauge smartmon_power_on_hours_worst{disk="/dev/sda",type="sat",smart_id="9"} 88 smartmon_power_on_hours_worst{disk="/dev/sdb",type="sat",smart_id="9"} 100 # HELP smartmon_program_fail_count_raw_value SMART metric program_fail_count_raw_value # TYPE smartmon_program_fail_count_raw_value gauge smartmon_program_fail_count_raw_value{disk="/dev/sdb",type="sat",smart_id="171"} 0.000000e+00 # HELP smartmon_program_fail_count_threshold SMART metric program_fail_count_threshold # TYPE smartmon_program_fail_count_threshold gauge smartmon_program_fail_count_threshold{disk="/dev/sdb",type="sat",smart_id="171"} 0 # HELP smartmon_program_fail_count_value SMART metric program_fail_count_value # TYPE smartmon_program_fail_count_value gauge smartmon_program_fail_count_value{disk="/dev/sdb",type="sat",smart_id="171"} 100 # HELP smartmon_program_fail_count_worst SMART metric program_fail_count_worst # TYPE smartmon_program_fail_count_worst gauge smartmon_program_fail_count_worst{disk="/dev/sdb",type="sat",smart_id="171"} 100 # HELP smartmon_raw_read_error_rate_raw_value SMART metric raw_read_error_rate_raw_value # TYPE smartmon_raw_read_error_rate_raw_value gauge smartmon_raw_read_error_rate_raw_value{disk="/dev/sda",type="sat",smart_id="1"} 
0.000000e+00 # HELP smartmon_raw_read_error_rate_threshold SMART metric raw_read_error_rate_threshold # TYPE smartmon_raw_read_error_rate_threshold gauge smartmon_raw_read_error_rate_threshold{disk="/dev/sda",type="sat",smart_id="1"} 62 # HELP smartmon_raw_read_error_rate_value SMART metric raw_read_error_rate_value # TYPE smartmon_raw_read_error_rate_value gauge smartmon_raw_read_error_rate_value{disk="/dev/sda",type="sat",smart_id="1"} 100 # HELP smartmon_raw_read_error_rate_worst SMART metric raw_read_error_rate_worst # TYPE smartmon_raw_read_error_rate_worst gauge smartmon_raw_read_error_rate_worst{disk="/dev/sda",type="sat",smart_id="1"} 100 # HELP smartmon_reallocated_sector_ct_raw_value SMART metric reallocated_sector_ct_raw_value # TYPE smartmon_reallocated_sector_ct_raw_value gauge smartmon_reallocated_sector_ct_raw_value{disk="/dev/sda",type="sat",smart_id="5"} 0.000000e+00 smartmon_reallocated_sector_ct_raw_value{disk="/dev/sdb",type="sat",smart_id="5"} 0.000000e+00 # HELP smartmon_reallocated_sector_ct_threshold SMART metric reallocated_sector_ct_threshold # TYPE smartmon_reallocated_sector_ct_threshold gauge smartmon_reallocated_sector_ct_threshold{disk="/dev/sda",type="sat",smart_id="5"} 5 smartmon_reallocated_sector_ct_threshold{disk="/dev/sdb",type="sat",smart_id="5"} 0 # HELP smartmon_reallocated_sector_ct_value SMART metric reallocated_sector_ct_value # TYPE smartmon_reallocated_sector_ct_value gauge smartmon_reallocated_sector_ct_value{disk="/dev/sda",type="sat",smart_id="5"} 100 smartmon_reallocated_sector_ct_value{disk="/dev/sdb",type="sat",smart_id="5"} 100 # HELP smartmon_reallocated_sector_ct_worst SMART metric reallocated_sector_ct_worst # TYPE smartmon_reallocated_sector_ct_worst gauge smartmon_reallocated_sector_ct_worst{disk="/dev/sda",type="sat",smart_id="5"} 100 smartmon_reallocated_sector_ct_worst{disk="/dev/sdb",type="sat",smart_id="5"} 100 # HELP smartmon_reported_uncorrect_raw_value SMART metric reported_uncorrect_raw_value # TYPE 
smartmon_reported_uncorrect_raw_value gauge smartmon_reported_uncorrect_raw_value{disk="/dev/sdb",type="sat",smart_id="187"} 0.000000e+00 # HELP smartmon_reported_uncorrect_threshold SMART metric reported_uncorrect_threshold # TYPE smartmon_reported_uncorrect_threshold gauge smartmon_reported_uncorrect_threshold{disk="/dev/sdb",type="sat",smart_id="187"} 0 # HELP smartmon_reported_uncorrect_value SMART metric reported_uncorrect_value # TYPE smartmon_reported_uncorrect_value gauge smartmon_reported_uncorrect_value{disk="/dev/sdb",type="sat",smart_id="187"} 100 # HELP smartmon_reported_uncorrect_worst SMART metric reported_uncorrect_worst # TYPE smartmon_reported_uncorrect_worst gauge smartmon_reported_uncorrect_worst{disk="/dev/sdb",type="sat",smart_id="187"} 100 # HELP smartmon_smartctl_run SMART metric smartctl_run # TYPE smartmon_smartctl_run gauge smartmon_smartctl_run{disk="/dev/sda",type="sat"} 1548863732 smartmon_smartctl_run{disk="/dev/sdb",type="sat"} 1548863733 # HELP smartmon_spin_retry_count_raw_value SMART metric spin_retry_count_raw_value # TYPE smartmon_spin_retry_count_raw_value gauge smartmon_spin_retry_count_raw_value{disk="/dev/sda",type="sat",smart_id="10"} 0.000000e+00 # HELP smartmon_spin_retry_count_threshold SMART metric spin_retry_count_threshold # TYPE smartmon_spin_retry_count_threshold gauge smartmon_spin_retry_count_threshold{disk="/dev/sda",type="sat",smart_id="10"} 60 # HELP smartmon_spin_retry_count_value SMART metric spin_retry_count_value # TYPE smartmon_spin_retry_count_value gauge smartmon_spin_retry_count_value{disk="/dev/sda",type="sat",smart_id="10"} 100 # HELP smartmon_spin_retry_count_worst SMART metric spin_retry_count_worst # TYPE smartmon_spin_retry_count_worst gauge smartmon_spin_retry_count_worst{disk="/dev/sda",type="sat",smart_id="10"} 100 # HELP smartmon_spin_up_time_raw_value SMART metric spin_up_time_raw_value # TYPE smartmon_spin_up_time_raw_value gauge 
smartmon_spin_up_time_raw_value{disk="/dev/sda",type="sat",smart_id="3"} 2.000000e+00 # HELP smartmon_spin_up_time_threshold SMART metric spin_up_time_threshold # TYPE smartmon_spin_up_time_threshold gauge smartmon_spin_up_time_threshold{disk="/dev/sda",type="sat",smart_id="3"} 33 # HELP smartmon_spin_up_time_value SMART metric spin_up_time_value # TYPE smartmon_spin_up_time_value gauge smartmon_spin_up_time_value{disk="/dev/sda",type="sat",smart_id="3"} 119 # HELP smartmon_spin_up_time_worst SMART metric spin_up_time_worst # TYPE smartmon_spin_up_time_worst gauge smartmon_spin_up_time_worst{disk="/dev/sda",type="sat",smart_id="3"} 119 # HELP smartmon_start_stop_count_raw_value SMART metric start_stop_count_raw_value # TYPE smartmon_start_stop_count_raw_value gauge smartmon_start_stop_count_raw_value{disk="/dev/sda",type="sat",smart_id="4"} 2.600000e+02 # HELP smartmon_start_stop_count_threshold SMART metric start_stop_count_threshold # TYPE smartmon_start_stop_count_threshold gauge smartmon_start_stop_count_threshold{disk="/dev/sda",type="sat",smart_id="4"} 0 # HELP smartmon_start_stop_count_value SMART metric start_stop_count_value # TYPE smartmon_start_stop_count_value gauge smartmon_start_stop_count_value{disk="/dev/sda",type="sat",smart_id="4"} 100 # HELP smartmon_start_stop_count_worst SMART metric start_stop_count_worst # TYPE smartmon_start_stop_count_worst gauge smartmon_start_stop_count_worst{disk="/dev/sda",type="sat",smart_id="4"} 100 # HELP smartmon_temperature_celsius_raw_value SMART metric temperature_celsius_raw_value # TYPE smartmon_temperature_celsius_raw_value gauge smartmon_temperature_celsius_raw_value{disk="/dev/sda",type="sat",smart_id="194"} 3.700000e+01 smartmon_temperature_celsius_raw_value{disk="/dev/sdb",type="sat",smart_id="194"} 4.200000e+01 # HELP smartmon_temperature_celsius_threshold SMART metric temperature_celsius_threshold # TYPE smartmon_temperature_celsius_threshold gauge 
smartmon_temperature_celsius_threshold{disk="/dev/sda",type="sat",smart_id="194"} 0 smartmon_temperature_celsius_threshold{disk="/dev/sdb",type="sat",smart_id="194"} 0 # HELP smartmon_temperature_celsius_value SMART metric temperature_celsius_value # TYPE smartmon_temperature_celsius_value gauge smartmon_temperature_celsius_value{disk="/dev/sda",type="sat",smart_id="194"} 162 smartmon_temperature_celsius_value{disk="/dev/sdb",type="sat",smart_id="194"} 58 # HELP smartmon_temperature_celsius_worst SMART metric temperature_celsius_worst # TYPE smartmon_temperature_celsius_worst gauge smartmon_temperature_celsius_worst{disk="/dev/sda",type="sat",smart_id="194"} 162 smartmon_temperature_celsius_worst{disk="/dev/sdb",type="sat",smart_id="194"} 65 # HELP smartmon_udma_crc_error_count_raw_value SMART metric udma_crc_error_count_raw_value # TYPE smartmon_udma_crc_error_count_raw_value gauge smartmon_udma_crc_error_count_raw_value{disk="/dev/sda",type="sat",smart_id="199"} 0.000000e+00 smartmon_udma_crc_error_count_raw_value{disk="/dev/sdb",type="sat",smart_id="199"} 0.000000e+00 # HELP smartmon_udma_crc_error_count_threshold SMART metric udma_crc_error_count_threshold # TYPE smartmon_udma_crc_error_count_threshold gauge smartmon_udma_crc_error_count_threshold{disk="/dev/sda",type="sat",smart_id="199"} 0 smartmon_udma_crc_error_count_threshold{disk="/dev/sdb",type="sat",smart_id="199"} 0 # HELP smartmon_udma_crc_error_count_value SMART metric udma_crc_error_count_value # TYPE smartmon_udma_crc_error_count_value gauge smartmon_udma_crc_error_count_value{disk="/dev/sda",type="sat",smart_id="199"} 200 smartmon_udma_crc_error_count_value{disk="/dev/sdb",type="sat",smart_id="199"} 100 # HELP smartmon_udma_crc_error_count_worst SMART metric udma_crc_error_count_worst # TYPE smartmon_udma_crc_error_count_worst gauge smartmon_udma_crc_error_count_worst{disk="/dev/sda",type="sat",smart_id="199"} 200 smartmon_udma_crc_error_count_worst{disk="/dev/sdb",type="sat",smart_id="199"} 100