[<prev] [next>] [<thread-prev] [day] [month] [year] [list]
Message-ID: <20251008155407.GZ8757@google.com>
Date: Wed, 8 Oct 2025 16:54:07 +0100
From: Lee Jones <lee@...nel.org>
To: Heiko Stuebner <heiko@...ech.de>
Cc: linux-kernel@...r.kernel.org
Subject: Re: [PATCH 4/4] mfd: qnap-mcu: Add proper error handling for command
errors
On Tue, 23 Sep 2025, Heiko Stuebner wrote:
> Further investigation revealed that the MCU in QNAP devices may return
> two error states. One "@8" for a checksum error in the submitted command
> and one "@9" for any generic (and sadly unspecified) error.
>
> These error codes with 2 data character can of course also be shorter
> then the expected reply length for the submitted command, so we'll
> need to check the received data for error codes and exit the receive
> portion early in that case.
>
> Signed-off-by: Heiko Stuebner <heiko@...ech.de>
> ---
> drivers/mfd/qnap-mcu.c | 44 +++++++++++++++++++++++++++++++++++++++++-
> 1 file changed, 43 insertions(+), 1 deletion(-)
I can't help but think that there is a bunch of avoidable duplication in
here.
> diff --git a/drivers/mfd/qnap-mcu.c b/drivers/mfd/qnap-mcu.c
> index cd836bdd44a8..fb78609a8433 100644
> --- a/drivers/mfd/qnap-mcu.c
> +++ b/drivers/mfd/qnap-mcu.c
> @@ -19,6 +19,7 @@
> /* The longest command found so far is 5 bytes long */
> #define QNAP_MCU_MAX_CMD_SIZE 5
> #define QNAP_MCU_MAX_DATA_SIZE 36
> +#define QNAP_MCU_ERROR_SIZE 2
> #define QNAP_MCU_CHECKSUM_SIZE 1
>
> #define QNAP_MCU_RX_BUFFER_SIZE \
> @@ -103,6 +104,24 @@ static int qnap_mcu_write(struct qnap_mcu *mcu, const u8 *data, u8 data_size)
> return serdev_device_write(mcu->serdev, tx, length, HZ);
> }
>
> +static bool qnap_mcu_reply_is_generic_error(unsigned char *buf, size_t size)
> +{
> + return (size == QNAP_MCU_ERROR_SIZE + QNAP_MCU_CHECKSUM_SIZE &&
I'd place this check into a separate, concisely named function, then
call it at the start of qnap_mcu_reply_is_generic_error() and
qnap_mcu_reply_is_checksum_error(). Perhaps something like:
static bool qnap_mcu_is_error_msg(size) {
return (size == QNAP_MCU_ERROR_SIZE + QNAP_MCU_CHECKSUM_SIZE);
}
Then at the start of both functions have:
if (!qnap_mcu_is_error_msg(size))
return false;
if (buf[0] == '@' && buf[1] == '9')(
return true;
return false;
> + buf[0] == '@' && buf[1] == '9');
> +}
> +
> +static bool qnap_mcu_reply_is_checksum_error(unsigned char *buf, size_t size)
> +{
> + return (size == QNAP_MCU_ERROR_SIZE + QNAP_MCU_CHECKSUM_SIZE &&
> + buf[0] == '@' && buf[1] == '8');
> +}
> +
> +static bool qnap_mcu_reply_is_any_error(unsigned char *buf, size_t size)
> +{
Then this should simply call each of the functions above:
if (qnap_mcu_reply_is_generic_error(buf, size)) {
dev_err(&mcu->serdev->dev, "Controller received invalid Checksum\n");
return true;
}
if (qnap_mcu_reply_is_checksum_error(buf, size)) {
dev_err(&mcu->serdev->dev, "Controller received invalid Checksum\n");
return true;
}
return false;
Note: all of this is just hand-written psudo-code that was knocked-up in
about 2-mins. None of it has even vaguely been checked or tested.
> + return (size == QNAP_MCU_ERROR_SIZE + QNAP_MCU_CHECKSUM_SIZE &&
> + buf[0] == '@' && (buf[1] == '8' || buf[1] == '9'));
> +}
> +
> static size_t qnap_mcu_receive_buf(struct serdev_device *serdev, const u8 *buf, size_t size)
> {
> struct device *dev = &serdev->dev;
> @@ -136,6 +155,19 @@ static size_t qnap_mcu_receive_buf(struct serdev_device *serdev, const u8 *buf,
> }
> }
>
> + /*
> + * We received everything the uart had to offer for now.
> + * Check for a possible error reply in the received data.
> + */
> + if (reply->received == QNAP_MCU_ERROR_SIZE + QNAP_MCU_CHECKSUM_SIZE &&
If qnap_mcu_verify_checksum() needs this, it too should be inserted into
the function itself.
> + qnap_mcu_verify_checksum(reply->data, reply->received) &&
> + qnap_mcu_reply_is_any_error(reply->data, reply->received)) {
> + /* The reply was an error code, we're done */
> + reply->length = 0;
> +
> + complete(&reply->done);
> + }
> +
> /*
> * The only way to get out of the above loop and end up here
> * is through consuming all of the supplied data, so here we
> @@ -182,10 +214,20 @@ int qnap_mcu_exec(struct qnap_mcu *mcu,
> }
>
> if (!qnap_mcu_verify_checksum(rx, reply->received)) {
> - dev_err(&mcu->serdev->dev, "Invalid Checksum received\n");
> + dev_err(&mcu->serdev->dev, "Invalid Checksum received from controller\n");
As you can see above, I moved the messages into the checking functions too.
> + return -EPROTO;
> + }
> +
> + if (qnap_mcu_reply_is_checksum_error(rx, reply->received)) {
> + dev_err(&mcu->serdev->dev, "Controller received invalid Checksum\n");
> return -EPROTO;
> }
>
> + if (qnap_mcu_reply_is_generic_error(rx, reply->received)) {
> + dev_err(&mcu->serdev->dev, "Generic error received from controller\n");
> + return -EIO;
> + }
> +
> memcpy(reply_data, rx, reply_data_size);
>
> return 0;
> --
> 2.47.2
>
--
Lee Jones [李琼斯]
Powered by blists - more mailing lists