Skip to content

Commit 00452ba

Browse files
jwrdegoede authored and KAGA-KOKO committed
x86/platform/intel/iosf_mbi Rewrite locking
There are 2 problems with the old iosf PMIC I2C bus arbitration code which need to be addressed: 1. The lockdep code complains about a possible deadlock in the iosf_mbi_[un]block_punit_i2c_access code: [ 6.712662] ====================================================== [ 6.712673] WARNING: possible circular locking dependency detected [ 6.712685] 5.3.0-rc2+ #79 Not tainted [ 6.712692] ------------------------------------------------------ [ 6.712702] kworker/0:1/7 is trying to acquire lock: [ 6.712712] 00000000df1c5681 (iosf_mbi_block_punit_i2c_access_count_mutex){+.+.}, at: iosf_mbi_unblock_punit_i2c_access+0x13/0x90 [ 6.712739] but task is already holding lock: [ 6.712749] 0000000067cb23e7 (iosf_mbi_punit_mutex){+.+.}, at: iosf_mbi_block_punit_i2c_access+0x97/0x186 [ 6.712768] which lock already depends on the new lock. [ 6.712780] the existing dependency chain (in reverse order) is: [ 6.712792] -> #1 (iosf_mbi_punit_mutex){+.+.}: [ 6.712808] __mutex_lock+0xa8/0x9a0 [ 6.712818] iosf_mbi_block_punit_i2c_access+0x97/0x186 [ 6.712831] i2c_dw_acquire_lock+0x20/0x30 [ 6.712841] i2c_dw_set_reg_access+0x15/0xb0 [ 6.712851] i2c_dw_probe+0x57/0x473 [ 6.712861] dw_i2c_plat_probe+0x33e/0x640 [ 6.712874] platform_drv_probe+0x38/0x80 [ 6.712884] really_probe+0xf3/0x380 [ 6.712894] driver_probe_device+0x59/0xd0 [ 6.712905] bus_for_each_drv+0x84/0xd0 [ 6.712915] __device_attach+0xe4/0x170 [ 6.712925] bus_probe_device+0x9f/0xb0 [ 6.712935] deferred_probe_work_func+0x79/0xd0 [ 6.712946] process_one_work+0x234/0x560 [ 6.712957] worker_thread+0x50/0x3b0 [ 6.712967] kthread+0x10a/0x140 [ 6.712977] ret_from_fork+0x3a/0x50 [ 6.712986] -> #0 (iosf_mbi_block_punit_i2c_access_count_mutex){+.+.}: [ 6.713004] __lock_acquire+0xe07/0x1930 [ 6.713015] lock_acquire+0x9d/0x1a0 [ 6.713025] __mutex_lock+0xa8/0x9a0 [ 6.713035] iosf_mbi_unblock_punit_i2c_access+0x13/0x90 [ 6.713047] i2c_dw_set_reg_access+0x4d/0xb0 [ 6.713058] i2c_dw_probe+0x57/0x473 [ 6.713068] dw_i2c_plat_probe+0x33e/0x640 [ 
6.713079] platform_drv_probe+0x38/0x80 [ 6.713089] really_probe+0xf3/0x380 [ 6.713099] driver_probe_device+0x59/0xd0 [ 6.713109] bus_for_each_drv+0x84/0xd0 [ 6.713119] __device_attach+0xe4/0x170 [ 6.713129] bus_probe_device+0x9f/0xb0 [ 6.713140] deferred_probe_work_func+0x79/0xd0 [ 6.713150] process_one_work+0x234/0x560 [ 6.713160] worker_thread+0x50/0x3b0 [ 6.713170] kthread+0x10a/0x140 [ 6.713180] ret_from_fork+0x3a/0x50 [ 6.713189] other info that might help us debug this: [ 6.713202] Possible unsafe locking scenario: [ 6.713212] CPU0 CPU1 [ 6.713221] ---- ---- [ 6.713229] lock(iosf_mbi_punit_mutex); [ 6.713239] lock(iosf_mbi_block_punit_i2c_access_count_mutex); [ 6.713253] lock(iosf_mbi_punit_mutex); [ 6.713265] lock(iosf_mbi_block_punit_i2c_access_count_mutex); [ 6.713276] *** DEADLOCK *** In practice can never happen because only the first caller which increments iosf_mbi_block_punit_i2c_access_count will also take iosf_mbi_punit_mutex, that is the whole purpose of the counter, which itself is protected by iosf_mbi_block_punit_i2c_access_count_mutex. But there is no way to tell the lockdep code about this and we really want to be able to run a kernel with lockdep enabled without these warnings being triggered. 2. The lockdep warning also points out another real problem, if 2 threads both are in a block of code protected by iosf_mbi_block_punit_i2c_access and the first thread to acquire the block exits before the second thread then the second thread will call mutex_unlock on iosf_mbi_punit_mutex, but it is not the thread which took the mutex and unlocking by another thread is not allowed. Fix this by getting rid of the notion of holding a mutex for the entire duration of the PMIC accesses, be it either from the PUnit side, or from an in kernel I2C driver. In general holding a mutex after exiting a function is a bad idea and the above problems show this case is no different. 
Instead 2 counters are now used, one for PMIC accesses from the PUnit and one for accesses from in kernel I2C code. When access is requested now the code will wait (using a waitqueue) for the counter of the other type of access to reach 0 and on release, if the counter reaches 0 the waitqueue is woken. Note that the counter approach is necessary to allow nested calls. The main reason for this is so that a series of i2c transfers can be done with the punit blocked from accessing the bus the whole time. This is necessary to be able to safely read/modify/write a PMIC register without racing with the PUNIT doing the same thing. Allowing nested iosf_mbi_block_punit_i2c_access() calls also is desirable from a performance pov since the whole dance necessary to block the PUnit from accessing the PMIC I2C bus is somewhat expensive. Signed-off-by: Hans de Goede <[email protected]> Signed-off-by: Thomas Gleixner <[email protected]> Reviewed-by: Andy Shevchenko <[email protected]> Link: https://lkml.kernel.org/r/[email protected]
1 parent d1abaeb commit 00452ba

File tree

1 file changed

+62
-38
lines changed

1 file changed

+62
-38
lines changed

arch/x86/platform/intel/iosf_mbi.c

Lines changed: 62 additions & 38 deletions
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,7 @@
1717
#include <linux/debugfs.h>
1818
#include <linux/capability.h>
1919
#include <linux/pm_qos.h>
20+
#include <linux/wait.h>
2021

2122
#include <asm/iosf_mbi.h>
2223

@@ -201,23 +202,45 @@ EXPORT_SYMBOL(iosf_mbi_available);
201202
#define PUNIT_SEMAPHORE_BIT BIT(0)
202203
#define PUNIT_SEMAPHORE_ACQUIRE BIT(1)
203204

204-
static DEFINE_MUTEX(iosf_mbi_punit_mutex);
205-
static DEFINE_MUTEX(iosf_mbi_block_punit_i2c_access_count_mutex);
205+
static DEFINE_MUTEX(iosf_mbi_pmic_access_mutex);
206206
static BLOCKING_NOTIFIER_HEAD(iosf_mbi_pmic_bus_access_notifier);
207-
static u32 iosf_mbi_block_punit_i2c_access_count;
207+
static DECLARE_WAIT_QUEUE_HEAD(iosf_mbi_pmic_access_waitq);
208+
static u32 iosf_mbi_pmic_punit_access_count;
209+
static u32 iosf_mbi_pmic_i2c_access_count;
208210
static u32 iosf_mbi_sem_address;
209211
static unsigned long iosf_mbi_sem_acquired;
210212
static struct pm_qos_request iosf_mbi_pm_qos;
211213

212214
void iosf_mbi_punit_acquire(void)
213215
{
214-
mutex_lock(&iosf_mbi_punit_mutex);
216+
/* Wait for any I2C PMIC accesses from in kernel drivers to finish. */
217+
mutex_lock(&iosf_mbi_pmic_access_mutex);
218+
while (iosf_mbi_pmic_i2c_access_count != 0) {
219+
mutex_unlock(&iosf_mbi_pmic_access_mutex);
220+
wait_event(iosf_mbi_pmic_access_waitq,
221+
iosf_mbi_pmic_i2c_access_count == 0);
222+
mutex_lock(&iosf_mbi_pmic_access_mutex);
223+
}
224+
/*
225+
* We do not need to do anything to allow the PUNIT to safely access
226+
* the PMIC, other than block in kernel accesses to the PMIC.
227+
*/
228+
iosf_mbi_pmic_punit_access_count++;
229+
mutex_unlock(&iosf_mbi_pmic_access_mutex);
215230
}
216231
EXPORT_SYMBOL(iosf_mbi_punit_acquire);
217232

218233
void iosf_mbi_punit_release(void)
219234
{
220-
mutex_unlock(&iosf_mbi_punit_mutex);
235+
bool do_wakeup;
236+
237+
mutex_lock(&iosf_mbi_pmic_access_mutex);
238+
iosf_mbi_pmic_punit_access_count--;
239+
do_wakeup = iosf_mbi_pmic_punit_access_count == 0;
240+
mutex_unlock(&iosf_mbi_pmic_access_mutex);
241+
242+
if (do_wakeup)
243+
wake_up(&iosf_mbi_pmic_access_waitq);
221244
}
222245
EXPORT_SYMBOL(iosf_mbi_punit_release);
223246

@@ -256,34 +279,32 @@ static void iosf_mbi_reset_semaphore(void)
256279
* already blocked P-Unit accesses because it wants them blocked over multiple
257280
* i2c-transfers, for e.g. read-modify-write of an I2C client register.
258281
*
259-
* The P-Unit accesses already being blocked is tracked through the
260-
* iosf_mbi_block_punit_i2c_access_count variable which is protected by the
261-
* iosf_mbi_block_punit_i2c_access_count_mutex this mutex is hold for the
262-
* entire duration of the function.
263-
*
264-
* If access is not blocked yet, this function takes the following steps:
282+
* To allow safe PMIC i2c bus accesses this function takes the following steps:
265283
*
266284
* 1) Some code sends request to the P-Unit which make it access the PMIC
267285
* I2C bus. Testing has shown that the P-Unit does not check its internal
268286
* PMIC bus semaphore for these requests. Callers of these requests call
269287
* iosf_mbi_punit_acquire()/_release() around their P-Unit accesses, these
270-
* functions lock/unlock the iosf_mbi_punit_mutex.
271-
* As the first step we lock the iosf_mbi_punit_mutex, to wait for any in
272-
* flight requests to finish and to block any new requests.
288+
* functions increase/decrease iosf_mbi_pmic_punit_access_count, so first
289+
* we wait for iosf_mbi_pmic_punit_access_count to become 0.
290+
*
291+
* 2) Check iosf_mbi_pmic_i2c_access_count, if access has already
292+
* been blocked by another caller, we only need to increment
293+
* iosf_mbi_pmic_i2c_access_count and we can skip the other steps.
273294
*
274-
* 2) Some code makes such P-Unit requests from atomic contexts where it
295+
* 3) Some code makes such P-Unit requests from atomic contexts where it
275296
* cannot call iosf_mbi_punit_acquire() as that may sleep.
276297
* As the third step we call a notifier chain which allows any code
277298
* needing P-Unit resources from atomic context to acquire them before
278299
* we take control over the PMIC I2C bus.
279300
*
280-
* 3) When CPU cores enter C6 or C7 the P-Unit needs to talk to the PMIC
301+
* 4) When CPU cores enter C6 or C7 the P-Unit needs to talk to the PMIC
281302
* if this happens while the kernel itself is accessing the PMIC I2C bus
282303
* the SoC hangs.
283304
* As the fourth step we call pm_qos_update_request() to disallow the CPU
284305
* to enter C6 or C7.
285306
*
286-
* 4) The P-Unit has a PMIC bus semaphore which we can request to stop
307+
* 5) The P-Unit has a PMIC bus semaphore which we can request to stop
287308
* autonomous P-Unit tasks from accessing the PMIC I2C bus while we hold it.
288309
* As the fifth and final step we request this semaphore and wait for our
289310
* request to be acknowledged.
@@ -297,12 +318,18 @@ int iosf_mbi_block_punit_i2c_access(void)
297318
if (WARN_ON(!mbi_pdev || !iosf_mbi_sem_address))
298319
return -ENXIO;
299320

300-
mutex_lock(&iosf_mbi_block_punit_i2c_access_count_mutex);
321+
mutex_lock(&iosf_mbi_pmic_access_mutex);
301322

302-
if (iosf_mbi_block_punit_i2c_access_count > 0)
323+
while (iosf_mbi_pmic_punit_access_count != 0) {
324+
mutex_unlock(&iosf_mbi_pmic_access_mutex);
325+
wait_event(iosf_mbi_pmic_access_waitq,
326+
iosf_mbi_pmic_punit_access_count == 0);
327+
mutex_lock(&iosf_mbi_pmic_access_mutex);
328+
}
329+
330+
if (iosf_mbi_pmic_i2c_access_count > 0)
303331
goto success;
304332

305-
mutex_lock(&iosf_mbi_punit_mutex);
306333
blocking_notifier_call_chain(&iosf_mbi_pmic_bus_access_notifier,
307334
MBI_PMIC_BUS_ACCESS_BEGIN, NULL);
308335

@@ -330,10 +357,6 @@ int iosf_mbi_block_punit_i2c_access(void)
330357
iosf_mbi_sem_acquired = jiffies;
331358
dev_dbg(&mbi_pdev->dev, "P-Unit semaphore acquired after %ums\n",
332359
jiffies_to_msecs(jiffies - start));
333-
/*
334-
* Success, keep iosf_mbi_punit_mutex locked till
335-
* iosf_mbi_unblock_punit_i2c_access() gets called.
336-
*/
337360
goto success;
338361
}
339362

@@ -344,33 +367,34 @@ int iosf_mbi_block_punit_i2c_access(void)
344367
dev_err(&mbi_pdev->dev, "Error P-Unit semaphore timed out, resetting\n");
345368
error:
346369
iosf_mbi_reset_semaphore();
347-
mutex_unlock(&iosf_mbi_punit_mutex);
348-
349370
if (!iosf_mbi_get_sem(&sem))
350371
dev_err(&mbi_pdev->dev, "P-Unit semaphore: %d\n", sem);
351372
success:
352373
if (!WARN_ON(ret))
353-
iosf_mbi_block_punit_i2c_access_count++;
374+
iosf_mbi_pmic_i2c_access_count++;
354375

355-
mutex_unlock(&iosf_mbi_block_punit_i2c_access_count_mutex);
376+
mutex_unlock(&iosf_mbi_pmic_access_mutex);
356377

357378
return ret;
358379
}
359380
EXPORT_SYMBOL(iosf_mbi_block_punit_i2c_access);
360381

361382
void iosf_mbi_unblock_punit_i2c_access(void)
362383
{
363-
mutex_lock(&iosf_mbi_block_punit_i2c_access_count_mutex);
384+
bool do_wakeup = false;
364385

365-
iosf_mbi_block_punit_i2c_access_count--;
366-
if (iosf_mbi_block_punit_i2c_access_count == 0) {
386+
mutex_lock(&iosf_mbi_pmic_access_mutex);
387+
iosf_mbi_pmic_i2c_access_count--;
388+
if (iosf_mbi_pmic_i2c_access_count == 0) {
367389
iosf_mbi_reset_semaphore();
368-
mutex_unlock(&iosf_mbi_punit_mutex);
369390
dev_dbg(&mbi_pdev->dev, "punit semaphore held for %ums\n",
370391
jiffies_to_msecs(jiffies - iosf_mbi_sem_acquired));
392+
do_wakeup = true;
371393
}
394+
mutex_unlock(&iosf_mbi_pmic_access_mutex);
372395

373-
mutex_unlock(&iosf_mbi_block_punit_i2c_access_count_mutex);
396+
if (do_wakeup)
397+
wake_up(&iosf_mbi_pmic_access_waitq);
374398
}
375399
EXPORT_SYMBOL(iosf_mbi_unblock_punit_i2c_access);
376400

@@ -379,10 +403,10 @@ int iosf_mbi_register_pmic_bus_access_notifier(struct notifier_block *nb)
379403
int ret;
380404

381405
/* Wait for the bus to go inactive before registering */
382-
mutex_lock(&iosf_mbi_punit_mutex);
406+
iosf_mbi_punit_acquire();
383407
ret = blocking_notifier_chain_register(
384408
&iosf_mbi_pmic_bus_access_notifier, nb);
385-
mutex_unlock(&iosf_mbi_punit_mutex);
409+
iosf_mbi_punit_release();
386410

387411
return ret;
388412
}
@@ -403,17 +427,17 @@ int iosf_mbi_unregister_pmic_bus_access_notifier(struct notifier_block *nb)
403427
int ret;
404428

405429
/* Wait for the bus to go inactive before unregistering */
406-
mutex_lock(&iosf_mbi_punit_mutex);
430+
iosf_mbi_punit_acquire();
407431
ret = iosf_mbi_unregister_pmic_bus_access_notifier_unlocked(nb);
408-
mutex_unlock(&iosf_mbi_punit_mutex);
432+
iosf_mbi_punit_release();
409433

410434
return ret;
411435
}
412436
EXPORT_SYMBOL(iosf_mbi_unregister_pmic_bus_access_notifier);
413437

414438
void iosf_mbi_assert_punit_acquired(void)
415439
{
416-
WARN_ON(!mutex_is_locked(&iosf_mbi_punit_mutex));
440+
WARN_ON(iosf_mbi_pmic_punit_access_count == 0);
417441
}
418442
EXPORT_SYMBOL(iosf_mbi_assert_punit_acquired);
419443

0 commit comments

Comments
 (0)