a91fbc1088
The mdcheck service currently cannot be run successfully. We need to put mdcheck into the right place (/usr/share/mdadm/mdcheck), and it needs to drop the dependency on mdadm_env.sh, which is fixed in patch 76c224c6c. There is also a historical problem: KillMode=none was needed before, so the upstream patch 52c67fcdd was removed. That problem has now been fixed, so the backport can be done more easily and we no longer need to remove the upstream patch here. Resolves: bz#2175540 Signed-off-by: Xiao Ni <xni@redhat.com>
407 lines
14 KiB
Diff
407 lines
14 KiB
Diff
From cc3df167c599d2ee0c132149c86fc0ad70d9f14e Mon Sep 17 00:00:00 2001
|
|
From: Mateusz Grzonka <mateusz.grzonka@intel.com>
|
|
Date: Thu, 2 Feb 2023 12:27:01 +0100
|
|
Subject: [PATCH 089/120] Mdmonitor: Add helper functions
|
|
|
|
Add functions:
|
|
- is_email_event(),
|
|
- get_syslog_event_priority(),
|
|
- sprint_event_message(),
|
|
with kernel style comments containing more detailed descriptions.
|
|
|
|
Also update event syslog priorities to be consistent with the man page. The MoveSpare event was described in the man page as priority info, but was implemented as warning. Move event data into a struct, so that it can be passed between different functions if needed.
|
|
Sort function declarations alphabetically and remove redundant alert() declaration.
|
|
|
|
Signed-off-by: Mateusz Grzonka <mateusz.grzonka@intel.com>
|
|
Acked-by: Coly Li <colyli@suse.de>
|
|
Signed-off-by: Jes Sorensen <jes@trained-monkey.org>
|
|
---
|
|
Monitor.c | 228 +++++++++++++++++++++++++++++++++++++-----------------
|
|
1 file changed, 158 insertions(+), 70 deletions(-)
|
|
|
|
diff --git a/Monitor.c b/Monitor.c
|
|
index 029e9efd..39598ba0 100644
|
|
--- a/Monitor.c
|
|
+++ b/Monitor.c
|
|
@@ -73,10 +73,12 @@ enum event {
|
|
EVENT_NEW_ARRAY,
|
|
EVENT_MOVE_SPARE,
|
|
EVENT_TEST_MESSAGE,
|
|
+ __SYSLOG_PRIORITY_WARNING,
|
|
EVENT_REBUILD_STARTED,
|
|
EVENT_REBUILD,
|
|
EVENT_REBUILD_FINISHED,
|
|
EVENT_SPARES_MISSING,
|
|
+ __SYSLOG_PRIORITY_CRITICAL,
|
|
EVENT_DEVICE_DISAPPEARED,
|
|
EVENT_FAIL,
|
|
EVENT_FAIL_SPARE,
|
|
@@ -100,18 +102,31 @@ mapping_t events_map[] = {
|
|
{NULL, EVENT_UNKNOWN}
|
|
};
|
|
|
|
-static int make_daemon(char *pidfile);
|
|
-static int check_one_sharer(int scan);
|
|
-static void write_autorebuild_pid(void);
|
|
-static void alert(const enum event event_enum, const unsigned int progress, const char *dev, const char *disc);
|
|
-static int check_array(struct state *st, struct mdstat_ent *mdstat, int increments, char *prefer);
|
|
+struct event_data {
|
|
+ enum event event_enum;
|
|
+ /*
|
|
+ * @event_name: Rebuild event name must be in form "RebuildXX", where XX is rebuild progress.
|
|
+ */
|
|
+ char event_name[EVENT_NAME_MAX];
|
|
+ char message[BUFSIZ];
|
|
+ const char *description;
|
|
+ const char *dev;
|
|
+ const char *disc;
|
|
+};
|
|
+
|
|
static int add_new_arrays(struct mdstat_ent *mdstat, struct state **statelist);
|
|
static void try_spare_migration(struct state *statelist);
|
|
static void link_containers_with_subarrays(struct state *list);
|
|
static void free_statelist(struct state *statelist);
|
|
+static int check_array(struct state *st, struct mdstat_ent *mdstat, int increments, char *prefer);
|
|
+static int check_one_sharer(int scan);
|
|
#ifndef NO_LIBUDEV
|
|
static int check_udev_activity(void);
|
|
#endif
|
|
+static void link_containers_with_subarrays(struct state *list);
|
|
+static int make_daemon(char *pidfile);
|
|
+static void try_spare_migration(struct state *statelist);
|
|
+static void write_autorebuild_pid(void);
|
|
|
|
int Monitor(struct mddev_dev *devlist,
|
|
char *mailaddr, char *alert_cmd,
|
|
@@ -450,7 +465,80 @@ static void write_autorebuild_pid()
|
|
}
|
|
}
|
|
|
|
-static void execute_alert_cmd(const char *event_name, const char *dev, const char *disc)
|
|
+#define BASE_MESSAGE "%s event detected on md device %s"
|
|
+#define COMPONENT_DEVICE_MESSAGE ", component device %s"
|
|
+#define DESCRIPTION_MESSAGE ": %s"
|
|
+/*
|
|
+ * sprint_event_message() - Writes basic message about detected event to destination ptr.
|
|
+ * @dest: message destination, should be at least the size of BUFSIZ
|
|
+ * @data: event data
|
|
+ *
|
|
+ * Return: 0 on success, 1 on error
|
|
+ */
|
|
+static int sprint_event_message(char *dest, const struct event_data *data)
|
|
+{
|
|
+ if (!dest || !data)
|
|
+ return 1;
|
|
+
|
|
+ if (data->disc && data->description)
|
|
+ snprintf(dest, BUFSIZ, BASE_MESSAGE COMPONENT_DEVICE_MESSAGE DESCRIPTION_MESSAGE,
|
|
+ data->event_name, data->dev, data->disc, data->description);
|
|
+ else if (data->disc)
|
|
+ snprintf(dest, BUFSIZ, BASE_MESSAGE COMPONENT_DEVICE_MESSAGE,
|
|
+ data->event_name, data->dev, data->disc);
|
|
+ else if (data->description)
|
|
+ snprintf(dest, BUFSIZ, BASE_MESSAGE DESCRIPTION_MESSAGE,
|
|
+ data->event_name, data->dev, data->description);
|
|
+ else
|
|
+ snprintf(dest, BUFSIZ, BASE_MESSAGE, data->event_name, data->dev);
|
|
+
|
|
+ return 0;
|
|
+}
|
|
+
|
|
+/*
|
|
+ * get_syslog_event_priority() - Determines event priority.
|
|
+ * @event_enum: event to be checked
|
|
+ *
|
|
+ * Return: LOG_CRIT, LOG_WARNING or LOG_INFO
|
|
+ */
|
|
+static int get_syslog_event_priority(const enum event event_enum)
|
|
+{
|
|
+ if (event_enum > __SYSLOG_PRIORITY_CRITICAL)
|
|
+ return LOG_CRIT;
|
|
+ if (event_enum > __SYSLOG_PRIORITY_WARNING)
|
|
+ return LOG_WARNING;
|
|
+ return LOG_INFO;
|
|
+}
|
|
+
|
|
+/*
|
|
+ * is_email_event() - Determines whether email for event should be sent or not.
|
|
+ * @event_enum: event to be checked
|
|
+ *
|
|
+ * Return: true if email should be sent, false otherwise
|
|
+ */
|
|
+static bool is_email_event(const enum event event_enum)
|
|
+{
|
|
+ static const enum event email_events[] = {
|
|
+ EVENT_FAIL,
|
|
+ EVENT_FAIL_SPARE,
|
|
+ EVENT_DEGRADED_ARRAY,
|
|
+ EVENT_SPARES_MISSING,
|
|
+ EVENT_TEST_MESSAGE
|
|
+ };
|
|
+ unsigned int i;
|
|
+
|
|
+ for (i = 0; i < ARRAY_SIZE(email_events); ++i) {
|
|
+ if (event_enum == email_events[i])
|
|
+ return true;
|
|
+ }
|
|
+ return false;
|
|
+}
|
|
+
|
|
+/*
|
|
+ * execute_alert_cmd() - Forks and executes command provided as alert_cmd.
|
|
+ * @data: event data
|
|
+ */
|
|
+static void execute_alert_cmd(const struct event_data *data)
|
|
{
|
|
int pid = fork();
|
|
|
|
@@ -462,12 +550,16 @@ static void execute_alert_cmd(const char *event_name, const char *dev, const cha
|
|
pr_err("Cannot fork to execute alert command");
|
|
break;
|
|
case 0:
|
|
- execl(info.alert_cmd, info.alert_cmd, event_name, dev, disc, NULL);
|
|
+ execl(info.alert_cmd, info.alert_cmd, data->event_name, data->dev, data->disc, NULL);
|
|
exit(2);
|
|
}
|
|
}
|
|
|
|
-static void send_event_email(const char *event_name, const char *dev, const char *disc)
|
|
+/*
|
|
+ * send_event_email() - Sends an email about event detected by monitor.
|
|
+ * @data: event data
|
|
+ */
|
|
+static void send_event_email(const struct event_data *data)
|
|
{
|
|
FILE *mp, *mdstat;
|
|
char buf[BUFSIZ];
|
|
@@ -485,15 +577,9 @@ static void send_event_email(const char *event_name, const char *dev, const char
|
|
else
|
|
fprintf(mp, "From: %s monitoring <root>\n", Name);
|
|
fprintf(mp, "To: %s\n", info.mailaddr);
|
|
- fprintf(mp, "Subject: %s event on %s:%s\n\n", event_name, dev, info.hostname);
|
|
- fprintf(mp, "This is an automatically generated mail message. \n");
|
|
- fprintf(mp, "A %s event had been detected on md device %s.\n\n", event_name, dev);
|
|
-
|
|
- if (disc && disc[0] != ' ')
|
|
- fprintf(mp,
|
|
- "It could be related to component device %s.\n\n", disc);
|
|
- if (disc && disc[0] == ' ')
|
|
- fprintf(mp, "Extra information:%s.\n\n", disc);
|
|
+ fprintf(mp, "Subject: %s event on %s:%s\n\n", data->event_name, data->dev, info.hostname);
|
|
+ fprintf(mp, "This is an automatically generated mail message.\n");
|
|
+ fprintf(mp, "%s\n", data->message);
|
|
|
|
mdstat = fopen("/proc/mdstat", "r");
|
|
if (!mdstat) {
|
|
@@ -509,58 +595,60 @@ static void send_event_email(const char *event_name, const char *dev, const char
|
|
pclose(mp);
|
|
}
|
|
|
|
-static void log_event_to_syslog(const enum event event_enum, const char *event_name, const char *dev, const char *disc)
|
|
+/*
|
|
+ * log_event_to_syslog() - Logs an event into syslog.
|
|
+ * @data: event data
|
|
+ */
|
|
+static void log_event_to_syslog(const struct event_data *data)
|
|
{
|
|
int priority;
|
|
- /* Log at a different severity depending on the event.
|
|
- *
|
|
- * These are the critical events: */
|
|
- if (event_enum == EVENT_FAIL ||
|
|
- event_enum == EVENT_DEGRADED_ARRAY ||
|
|
- event_enum == EVENT_DEVICE_DISAPPEARED)
|
|
- priority = LOG_CRIT;
|
|
- /* Good to know about, but are not failures: */
|
|
- else if (event_enum == EVENT_REBUILD ||
|
|
- event_enum == EVENT_MOVE_SPARE ||
|
|
- event_enum == EVENT_SPARES_MISSING)
|
|
- priority = LOG_WARNING;
|
|
- /* Everything else: */
|
|
- else
|
|
- priority = LOG_INFO;
|
|
-
|
|
- if (disc && disc[0] != ' ')
|
|
- syslog(priority,
|
|
- "%s event detected on md device %s, component device %s",
|
|
- event_name, dev, disc);
|
|
- else if (disc)
|
|
- syslog(priority, "%s event detected on md device %s: %s", event_name, dev, disc);
|
|
- else
|
|
- syslog(priority, "%s event detected on md device %s", event_name, dev);
|
|
+
|
|
+ priority = get_syslog_event_priority(data->event_enum);
|
|
+
|
|
+ syslog(priority, "%s\n", data->message);
|
|
}
|
|
|
|
-static void alert(const enum event event_enum, const unsigned int progress, const char *dev, const char *disc)
|
|
+/*
|
|
+ * alert() - Alerts about the monitor event.
|
|
+ * @event_enum: event to be sent
|
|
+ * @description: event description
|
|
+ * @progress: rebuild progress
|
|
+ * @dev: md device name
|
|
+ * @disc: component device
|
|
+ *
|
|
+ * If needed function executes alert command, sends an email or logs event to syslog.
|
|
+ */
|
|
+static void alert(const enum event event_enum, const char *description, const uint8_t progress,
|
|
+ const char *dev, const char *disc)
|
|
{
|
|
- char event_name[EVENT_NAME_MAX];
|
|
+ struct event_data data = {.dev = dev, .disc = disc, .description = description};
|
|
+
|
|
+ if (!dev)
|
|
+ return;
|
|
|
|
if (event_enum == EVENT_REBUILD) {
|
|
- snprintf(event_name, sizeof(event_name), "%s%02d",
|
|
+ snprintf(data.event_name, sizeof(data.event_name), "%s%02d",
|
|
map_num_s(events_map, EVENT_REBUILD), progress);
|
|
} else {
|
|
- snprintf(event_name, sizeof(event_name), "%s", map_num_s(events_map, event_enum));
|
|
+ snprintf(data.event_name, sizeof(data.event_name), "%s", map_num_s(events_map, event_enum));
|
|
}
|
|
|
|
- if (info.alert_cmd)
|
|
- execute_alert_cmd(event_name, dev, disc);
|
|
+ data.event_enum = event_enum;
|
|
|
|
- if (info.mailaddr && (event_enum == EVENT_FAIL ||
|
|
- event_enum == EVENT_TEST_MESSAGE ||
|
|
- event_enum == EVENT_SPARES_MISSING ||
|
|
- event_enum == EVENT_DEGRADED_ARRAY)) {
|
|
- send_event_email(event_name, dev, disc);
|
|
+ if (sprint_event_message(data.message, &data) != 0) {
|
|
+ pr_err("Cannot create event message.\n");
|
|
+ return;
|
|
}
|
|
+ pr_err("%s\n", data.message);
|
|
+
|
|
+ if (info.alert_cmd)
|
|
+ execute_alert_cmd(&data);
|
|
+
|
|
+ if (info.mailaddr && is_email_event(event_enum))
|
|
+ send_event_email(&data);
|
|
|
|
if (info.dosyslog)
|
|
- log_event_to_syslog(event_enum, event_name, dev, disc);
|
|
+ log_event_to_syslog(&data);
|
|
}
|
|
|
|
static int check_array(struct state *st, struct mdstat_ent *mdstat,
|
|
@@ -585,7 +673,7 @@ static int check_array(struct state *st, struct mdstat_ent *mdstat,
|
|
unsigned long redundancy_only_flags = 0;
|
|
|
|
if (info.test)
|
|
- alert(EVENT_TEST_MESSAGE, 0, dev, NULL);
|
|
+ alert(EVENT_TEST_MESSAGE, NULL, 0, dev, NULL);
|
|
|
|
retval = 0;
|
|
|
|
@@ -634,7 +722,7 @@ static int check_array(struct state *st, struct mdstat_ent *mdstat,
|
|
*/
|
|
if (sra->array.level == 0 || sra->array.level == -1) {
|
|
if (!st->err && !st->from_config)
|
|
- alert(EVENT_DEVICE_DISAPPEARED, 0, dev, " Wrong-Level");
|
|
+ alert(EVENT_DEVICE_DISAPPEARED, "Wrong-Level", 0, dev, NULL);
|
|
st->err++;
|
|
goto out;
|
|
}
|
|
@@ -651,7 +739,7 @@ static int check_array(struct state *st, struct mdstat_ent *mdstat,
|
|
st->percent = RESYNC_NONE;
|
|
new_array = 1;
|
|
if (!is_container)
|
|
- alert(EVENT_NEW_ARRAY, 0, st->devname, NULL);
|
|
+ alert(EVENT_NEW_ARRAY, NULL, 0, st->devname, NULL);
|
|
}
|
|
|
|
if (st->utime == array.utime && st->failed == sra->array.failed_disks &&
|
|
@@ -664,20 +752,20 @@ static int check_array(struct state *st, struct mdstat_ent *mdstat,
|
|
}
|
|
if (st->utime == 0 && /* new array */
|
|
mse->pattern && strchr(mse->pattern, '_') /* degraded */)
|
|
- alert(EVENT_DEGRADED_ARRAY, 0, dev, NULL);
|
|
+ alert(EVENT_DEGRADED_ARRAY, NULL, 0, dev, NULL);
|
|
|
|
if (st->utime == 0 && /* new array */ st->expected_spares > 0 &&
|
|
sra->array.spare_disks < st->expected_spares)
|
|
- alert(EVENT_SPARES_MISSING, 0, dev, NULL);
|
|
+ alert(EVENT_SPARES_MISSING, NULL, 0, dev, NULL);
|
|
if (st->percent < 0 && st->percent != RESYNC_UNKNOWN &&
|
|
mse->percent >= 0)
|
|
- alert(EVENT_REBUILD_STARTED, 0, dev, NULL);
|
|
+ alert(EVENT_REBUILD_STARTED, NULL, 0, dev, NULL);
|
|
if (st->percent >= 0 && mse->percent >= 0 &&
|
|
(mse->percent / increments) > (st->percent / increments)) {
|
|
if((mse->percent / increments) == 0)
|
|
- alert(EVENT_REBUILD_STARTED, 0, dev, NULL);
|
|
+ alert(EVENT_REBUILD_STARTED, NULL, 0, dev, NULL);
|
|
else
|
|
- alert(EVENT_REBUILD, mse->percent, dev, NULL);
|
|
+ alert(EVENT_REBUILD, NULL, mse->percent, dev, NULL);
|
|
}
|
|
|
|
if (mse->percent == RESYNC_NONE && st->percent >= 0) {
|
|
@@ -690,9 +778,9 @@ static int check_array(struct state *st, struct mdstat_ent *mdstat,
|
|
snprintf(cnt, sizeof(cnt),
|
|
" mismatches found: %d (on raid level %d)",
|
|
sra->mismatch_cnt, sra->array.level);
|
|
- alert(EVENT_REBUILD_FINISHED, 0, dev, cnt);
|
|
+ alert(EVENT_REBUILD_FINISHED, NULL, 0, dev, cnt);
|
|
} else
|
|
- alert(EVENT_REBUILD_FINISHED, 0, dev, NULL);
|
|
+ alert(EVENT_REBUILD_FINISHED, NULL, 0, dev, NULL);
|
|
}
|
|
st->percent = mse->percent;
|
|
|
|
@@ -746,14 +834,14 @@ static int check_array(struct state *st, struct mdstat_ent *mdstat,
|
|
change = newstate ^ st->devstate[i];
|
|
if (st->utime && change && !st->err && !new_array) {
|
|
if ((st->devstate[i]&change) & (1 << MD_DISK_SYNC))
|
|
- alert(EVENT_FAIL, 0, dev, dv);
|
|
+ alert(EVENT_FAIL, NULL, 0, dev, dv);
|
|
else if ((newstate & (1 << MD_DISK_FAULTY)) &&
|
|
(disc.major || disc.minor) &&
|
|
st->devid[i] == makedev(disc.major,
|
|
disc.minor))
|
|
- alert(EVENT_FAIL_SPARE, 0, dev, dv);
|
|
+ alert(EVENT_FAIL_SPARE, NULL, 0, dev, dv);
|
|
else if ((newstate&change) & (1 << MD_DISK_SYNC))
|
|
- alert(EVENT_SPARE_ACTIVE, 0, dev, dv);
|
|
+ alert(EVENT_SPARE_ACTIVE, NULL, 0, dev, dv);
|
|
}
|
|
st->devstate[i] = newstate;
|
|
st->devid[i] = makedev(disc.major, disc.minor);
|
|
@@ -777,7 +865,7 @@ static int check_array(struct state *st, struct mdstat_ent *mdstat,
|
|
|
|
disappeared:
|
|
if (!st->err && !is_container)
|
|
- alert(EVENT_DEVICE_DISAPPEARED, 0, dev, NULL);
|
|
+ alert(EVENT_DEVICE_DISAPPEARED, NULL, 0, dev, NULL);
|
|
st->err++;
|
|
goto out;
|
|
}
|
|
@@ -836,7 +924,7 @@ static int add_new_arrays(struct mdstat_ent *mdstat, struct state **statelist)
|
|
st->parent_devnm[0] = 0;
|
|
*statelist = st;
|
|
if (info.test)
|
|
- alert(EVENT_TEST_MESSAGE, 0, st->devname, NULL);
|
|
+ alert(EVENT_TEST_MESSAGE, NULL, 0, st->devname, NULL);
|
|
new_found = 1;
|
|
}
|
|
return new_found;
|
|
@@ -1059,7 +1147,7 @@ static void try_spare_migration(struct state *statelist)
|
|
if (devid > 0 &&
|
|
move_spare(from->devname, to->devname,
|
|
devid)) {
|
|
- alert(EVENT_MOVE_SPARE, 0, to->devname, from->devname);
|
|
+ alert(EVENT_MOVE_SPARE, NULL, 0, to->devname, from->devname);
|
|
break;
|
|
}
|
|
}
|
|
--
|
|
2.38.1
|
|
|