[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <77129f40-2da6-4463-b06f-4c6d38135fed@roeck-us.net>
Date: Sun, 2 Nov 2025 09:53:53 -0800
From: Guenter Roeck <linux@...ck-us.net>
To: "Usyskin, Alexander" <alexander.usyskin@...el.com>
Cc: Marek Marczykowski-Górecki
 <marmarek@...isiblethingslab.com>,
 Greg Kroah-Hartman <gregkh@...uxfoundation.org>,
 "Abliyev, Reuven" <reuven.abliyev@...el.com>,
 "linux-kernel@...r.kernel.org" <linux-kernel@...r.kernel.org>
Subject: Re: [char-misc-next] mei: hook mei_device on class device
On 11/2/25 07:37, Guenter Roeck wrote:
> On Sun, Nov 2, 2025 at 7:00 AM Usyskin, Alexander <linux@...ck-us.net> wrote:
That got messed up. Sorry for that. Really sending to Alexander this time.
Guenter
> ...
>>
>> Seems I've missed the error flow in probe (my test machines always have an ME in a good state...).
>>
>> Below patch should fix the problem, can you confirm?
>>
> Yes, it does. With this patch applied, the log output is:
> 
> ...
> [   16.406790] mtdoops: mtd device (mtddev=name/number) must be supplied
> [   18.380400] mei mei0: wait hw ready failed
> [   18.384594] mei mei0: hw_start failed ret = -62 fw status =
> 00070355 002F0006 00000000 00000000 00000000 00000000
> [   20.428395] mei mei0: wait hw ready failed
> [   20.432542] mei mei0: hw_start failed ret = -62 fw status =
> 00070355 002F0006 00000000 00000000 00000000 00000000
> [   22.476390] mei mei0: wait hw ready failed
> [   22.480533] mei mei0: hw_start failed ret = -62 fw status =
> 00070355 002F0006 00000000 00000000 00000000 00000000
> [   22.490847] mei mei0: reset: reached maximal consecutive resets:
> disabling the device
> [   22.498718] mei mei0: reset failed ret = -19
> [   22.503012] mei mei0: link layer initialization failed.
> [   22.508261] mei_me 0000:00:16.0: init hw failure.
> [   22.513662] mei_me 0000:00:16.0: initialization failed.
> initramfs(out): Mounting system filesystems for initramfs init.d
> ...
> 
> Official Tested-by: tag below. Note that it is from my Google address
> since this is where I tested the fix.
> 
>   Thanks a lot for the quick turnaround!
> 
> Guenter
> 
>>  From c58f311df60f26df2efe1e0f9fc523bfa4b93936 Mon Sep 17 00:00:00 2001
>> From: Alexander Usyskin <alexander.usyskin@...el.com>
>> Date: Sun, 2 Nov 2025 10:57:22 +0200
>> Subject: [PATCH] mei: fix error flow in probe
>> MIME-Version: 1.0
>> Content-Type: text/plain; charset=UTF-8
>> Content-Transfer-Encoding: 8bit
>>
>> Dismantle class device last in probe error flow to avoid accessing freed memory like:
>>
>> [   87.926774] WARNING: CPU: 9 PID: 518 at kernel/workqueue.c:4234
>> __flush_work+0x340/0x390
>> ...
>> [   87.926912] Workqueue: async async_run_entry_fn
>> [   87.926918] RIP: e030:__flush_work+0x340/0x390
>> [   87.926923] Code: 26 9d 05 00 65 48 8b 15 26 3c ca 02 48 85 db 48 8b
>> 04 24 48 89 54 24 58 0f 85 de fe ff ff e9 f6 fd ff ff 0f 0b e9 77 ff ff
>> ff <0f> 0b e9 70 ff ff ff 0f 0b e9 19 ff ff ff e8 7d 8b 0e 01 48 89 de
>> [   87.926931] RSP: e02b:ffffc900412ebc00 EFLAGS: 00010246
>> [   87.926936] RAX: 0000000000000000 RBX: ffff888103e55090 RCX: 0000000000000000
>> [   87.926941] RDX: 000fffffffe00000 RSI: 0000000000000001 RDI: ffffc900412ebc60
>> [   87.926945] RBP: ffff888103e55090 R08: ffffffffc1266ec8 R09: ffff8881109076e8
>> [   87.926949] R10: 0000000080040003 R11: 0000000000000000 R12: ffff888103e54000
>> [   87.926953] R13: ffffc900412ebc18 R14: 0000000000000001 R15: 0000000000000000
>> [   87.926962] FS:  0000000000000000(0000) GS:ffff888233238000(0000) knlGS:0000000000000000
>> [   87.926967] CS:  e030 DS: 0000 ES: 0000 CR0: 0000000080050033
>> [   87.926971] CR2: 00007e7923b32708 CR3: 00000001088df000 CR4: 0000000000050660
>> [   87.926977] Call Trace:
>> [   87.926981]  <TASK>
>> [   87.926987]  ? __call_rcu_common.constprop.0+0x11e/0x310
>> [   87.926993]  cancel_work_sync+0x5e/0x80
>> [   87.926999]  mei_cancel_work+0x19/0x40 [mei]
>> [   87.927051]  mei_me_probe+0x273/0x2b0 [mei_me]
>> [   87.927060]  local_pci_probe+0x45/0x90
>> [   87.927066]  pci_call_probe+0x5b/0x180
>> [   87.927070]  pci_device_probe+0x95/0x140
>> [   87.927074]  ? driver_sysfs_add+0x57/0xc0
>> [   87.927079]  really_probe+0xde/0x340
>> [   87.927083]  ? pm_runtime_barrier+0x54/0x90
>> [   87.927087]  __driver_probe_device+0x78/0x110
>> [   87.927092]  driver_probe_device+0x1f/0xa0
>> [   87.927095]  __driver_attach_async_helper+0x5e/0xe0
>> [   87.927100]  async_run_entry_fn+0x34/0x130
>> [   87.927104]  process_one_work+0x18d/0x340
>> [   87.927108]  worker_thread+0x256/0x3a0
>> [   87.927111]  ? __pfx_worker_thread+0x10/0x10
>> [   87.927115]  kthread+0xfc/0x240
>> [   87.927120]  ? __pfx_kthread+0x10/0x10
>> [   87.927124]  ? __pfx_kthread+0x10/0x10
>> [   87.927127]  ret_from_fork+0xf5/0x110
>> [   87.927132]  ? __pfx_kthread+0x10/0x10
>> [   87.927136]  ret_from_fork_asm+0x1a/0x30
>> [   87.927141]  </TASK>
>>
>> Reported-by: Marek Marczykowski-Górecki <marmarek@...isiblethingslab.com>
>> Reported-by: Guenter Roeck <linux@...ck-us.net>
>> Fixes: 7704e6be4ed2 ("mei: hook mei_device on class device")
>> Signed-off-by: Alexander Usyskin <alexander.usyskin@...el.com>
> 
> Tested-by: Guenter Roeck <groeck@...gle.com>
> 
>>
>> ---
>>   drivers/misc/mei/pci-me.c       | 13 ++++++-------
>>   drivers/misc/mei/pci-txe.c      | 13 ++++++-------
>>   drivers/misc/mei/platform-vsc.c | 11 +++++------
>>   3 files changed, 17 insertions(+), 20 deletions(-)
>>
>> diff --git a/drivers/misc/mei/pci-me.c b/drivers/misc/mei/pci-me.c
>> index b017ff29dbd1..73cad914be9f 100644
>> --- a/drivers/misc/mei/pci-me.c
>> +++ b/drivers/misc/mei/pci-me.c
>> @@ -223,6 +223,10 @@ static int mei_me_probe(struct pci_dev *pdev, const struct pci_device_id *ent)
>>          hw->mem_addr = pcim_iomap_table(pdev)[0];
>>          hw->read_fws = mei_me_read_fws;
>>
>> +       err = mei_register(dev, &pdev->dev);
>> +       if (err)
>> +               goto end;
>> +
>>          pci_enable_msi(pdev);
>>
>>          hw->irq = pdev->irq;
>> @@ -237,13 +241,9 @@ static int mei_me_probe(struct pci_dev *pdev, const struct pci_device_id *ent)
>>          if (err) {
>>                  dev_err(&pdev->dev, "request_threaded_irq failure. irq = %d\n",
>>                         pdev->irq);
>> -               goto end;
>> +               goto deregister;
>>          }
>>
>> -       err = mei_register(dev, &pdev->dev);
>> -       if (err)
>> -               goto release_irq;
>> -
>>          if (mei_start(dev)) {
>>                  dev_err(&pdev->dev, "init hw failure.\n");
>>                  err = -ENODEV;
>> @@ -283,11 +283,10 @@ static int mei_me_probe(struct pci_dev *pdev, const struct pci_device_id *ent)
>>          return 0;
>>
>>   deregister:
>> -       mei_deregister(dev);
>> -release_irq:
>>          mei_cancel_work(dev);
>>          mei_disable_interrupts(dev);
>>          free_irq(pdev->irq, dev);
>> +       mei_deregister(dev);
>>   end:
>>          dev_err(&pdev->dev, "initialization failed.\n");
>>          return err;
>> diff --git a/drivers/misc/mei/pci-txe.c b/drivers/misc/mei/pci-txe.c
>> index 06b55a891c6b..98d1bc2c7f4b 100644
>> --- a/drivers/misc/mei/pci-txe.c
>> +++ b/drivers/misc/mei/pci-txe.c
>> @@ -87,6 +87,10 @@ static int mei_txe_probe(struct pci_dev *pdev, const struct pci_device_id *ent)
>>          hw = to_txe_hw(dev);
>>          hw->mem_addr = pcim_iomap_table(pdev);
>>
>> +       err = mei_register(dev, &pdev->dev);
>> +       if (err)
>> +               goto end;
>> +
>>          pci_enable_msi(pdev);
>>
>>          /* clear spurious interrupts */
>> @@ -106,13 +110,9 @@ static int mei_txe_probe(struct pci_dev *pdev, const struct pci_device_id *ent)
>>          if (err) {
>>                  dev_err(&pdev->dev, "mei: request_threaded_irq failure. irq = %d\n",
>>                          pdev->irq);
>> -               goto end;
>> +               goto deregister;
>>          }
>>
>> -       err = mei_register(dev, &pdev->dev);
>> -       if (err)
>> -               goto release_irq;
>> -
>>          if (mei_start(dev)) {
>>                  dev_err(&pdev->dev, "init hw failure.\n");
>>                  err = -ENODEV;
>> @@ -145,11 +145,10 @@ static int mei_txe_probe(struct pci_dev *pdev, const struct pci_device_id *ent)
>>          return 0;
>>
>>   deregister:
>> -       mei_deregister(dev);
>> -release_irq:
>>          mei_cancel_work(dev);
>>          mei_disable_interrupts(dev);
>>          free_irq(pdev->irq, dev);
>> +       mei_deregister(dev);
>>   end:
>>          dev_err(&pdev->dev, "initialization failed.\n");
>>          return err;
>> diff --git a/drivers/misc/mei/platform-vsc.c b/drivers/misc/mei/platform-vsc.c
>> index 288e7b72e942..9787b9cee71c 100644
>> --- a/drivers/misc/mei/platform-vsc.c
>> +++ b/drivers/misc/mei/platform-vsc.c
>> @@ -362,28 +362,27 @@ static int mei_vsc_probe(struct platform_device *pdev)
>>
>>          ret = mei_register(mei_dev, dev);
>>          if (ret)
>> -               goto err_dereg;
>> +               goto err;
>>
>>          ret = mei_start(mei_dev);
>>          if (ret) {
>>                  dev_err_probe(dev, ret, "init hw failed\n");
>> -               goto err_cancel;
>> +               goto err;
>>          }
>>
>>          pm_runtime_enable(mei_dev->parent);
>>
>>          return 0;
>>
>> -err_dereg:
>> -       mei_deregister(mei_dev);
>> -
>> -err_cancel:
>> +err:
>>          mei_cancel_work(mei_dev);
>>
>>          vsc_tp_register_event_cb(tp, NULL, NULL);
>>
>>          mei_disable_interrupts(mei_dev);
>>
>> +       mei_deregister(mei_dev);
>> +
>>          return ret;
>>   }
>>
>> --
>> 2.43.0
>>
>>
>>
>>
Powered by blists - more mailing lists