Re: [PATCH v2 04/10] EDAC/ghes: Make SMBIOS handle private data to ghes

From: Borislav Petkov
Date: Fri Apr 24 2020 - 12:22:40 EST


On Wed, Apr 22, 2020 at 01:58:08PM +0200, Robert Richter wrote:
> diff --git a/drivers/edac/ghes_edac.c b/drivers/edac/ghes_edac.c
> index 39efce0df881..23adb7674f9b 100644
> --- a/drivers/edac/ghes_edac.c
> +++ b/drivers/edac/ghes_edac.c
> @@ -15,6 +15,12 @@
> #include "edac_module.h"
> #include <ras/ras_event.h>
>
> +struct ghes_dimm {

Simply call it "struct dimm".

> + struct list_head entry;
> + struct dimm_info *dimm;
> + u16 handle;
> +};
> +
> struct ghes_mci {
> struct mem_ctl_info *mci;
>
> @@ -42,6 +48,16 @@ static DEFINE_MUTEX(ghes_reg_mutex);
> */
> static DEFINE_SPINLOCK(ghes_lock);
>
> +/*
> + * Locking:
> + *
> + * dimms, ghes_dimm_pool: ghes_reg_mutex
> + * ghes_dimm_list: ghes_lock
> + */
> +static struct ghes_dimm *dimms;
> +static LIST_HEAD(ghes_dimm_list);
> +static LIST_HEAD(ghes_dimm_pool);

Those are static lists, no need to prefix them with "ghes_". There's too
much "ghes" in that code. :)

> +
> /* "ghes_edac.force_load=1" skips the platform check */
> static bool __read_mostly force_load;
> module_param(force_load, bool, 0);
> @@ -72,11 +88,63 @@ struct memdev_dmi_entry {
> u16 conf_mem_clk_speed;
> } __attribute__((__packed__));
>
> -struct ghes_edac_dimm_fill {
> +struct dimm_fill {
> + struct list_head dimms;
> struct mem_ctl_info *mci;
> unsigned int count;
> };
>
> +static int ghes_dimm_pool_create(int num_dimm)

Yeah, drop "ghes_" here too. I'm not going to comment on this in the
rest of the patchset but for the next version, please drop the "ghes_"
prefix from static functions and members - it unnecessarily gets in the
way when reading the code.

> +{
> + struct ghes_dimm *ghes_dimm;
> +
> + if (!num_dimm)
> + return 0;
> +
> + lockdep_assert_held(ghes_reg_mutex);
> +
> + dimms = kcalloc(num_dimm, sizeof(*dimms), GFP_KERNEL);
> + if (!dimms)
> + return -ENOMEM;
> +
> + for (ghes_dimm = dimms; ghes_dimm < dimms + num_dimm; ghes_dimm++)

And with the above shortening of names, this loop becomes:

	for (d = dimms; d < dimms + num_dimms; d++)
		list_add(&d->entry, &dimm_pool);

Simple.

> +
> + return 0;
> +}
> +
> +static void ghes_dimm_pool_destroy(void)
> +{
> + lockdep_assert_held(ghes_reg_mutex);
> + INIT_LIST_HEAD(&ghes_dimm_pool);
> + kfree(dimms);
> +}
> +
> +static struct ghes_dimm *ghes_dimm_alloc(struct dimm_info *dimm, u16 handle)
> +{
> + struct ghes_dimm *ghes_dimm;
> +
> + lockdep_assert_held(ghes_reg_mutex);

The 0day bot caught it already - lockdep_assert_held() needs to be passed
a pointer, i.e. &ghes_reg_mutex. Please test with PROVE_LOCKING enabled
before sending next time.

> +
> + ghes_dimm = list_first_entry_or_null(&ghes_dimm_pool,
> + struct ghes_dimm, entry);

Let that line stick out instead of breaking it.

> +
> + /* should be always non-zero */
> + if (!WARN_ON_ONCE(!ghes_dimm)) {
> + ghes_dimm->dimm = dimm;
> + ghes_dimm->handle = handle;
> + list_del(&ghes_dimm->entry);
> + }
> +
> + return ghes_dimm;
> +}
> +
> +static void ghes_dimm_release(struct list_head *dimms)
> +{
> + lockdep_assert_held(ghes_reg_mutex);
> + list_splice(dimms, &ghes_dimm_pool);
> +}
> +
> static void ghes_edac_count_dimms(const struct dmi_header *dh, void *arg)
> {
> int *num_dimm = arg;

...

> @@ -547,12 +626,18 @@ int ghes_edac_register(struct ghes *ghes, struct device *dev)
>
> spin_lock_irqsave(&ghes_lock, flags);
> ghes_pvt = pvt;
> + list_splice_tail(&dimm_fill.dimms, &ghes_dimm_list);
> spin_unlock_irqrestore(&ghes_lock, flags);
>
> /* only set on success */
> refcount_set(&ghes_refcount, 1);
>
> unlock:
> + if (rc < 0) {
> + ghes_dimm_pool_destroy();
> + pr_err("Can't register at EDAC core: %d\n", rc);

"Can't register with the EDAC core: %d\n"

> + }
> +
> mutex_unlock(&ghes_reg_mutex);
>
> return rc;
> @@ -562,6 +647,7 @@ void ghes_edac_unregister(struct ghes *ghes)
> {
> struct mem_ctl_info *mci;
> unsigned long flags;
> + LIST_HEAD(dimm_list);
>
> mutex_lock(&ghes_reg_mutex);
>
> @@ -574,14 +660,19 @@ void ghes_edac_unregister(struct ghes *ghes)
> spin_lock_irqsave(&ghes_lock, flags);
> mci = ghes_pvt ? ghes_pvt->mci : NULL;
> ghes_pvt = NULL;
> + list_splice_init(&ghes_dimm_list, &dimm_list);

Why do you need to do this?

Can't you simply do:

ghes_dimm_release(&ghes_dimm_list);

here?

Btw, please add an explanation above ghes_dimm_list and ghes_dimm_pool
of what those are and what the rules are: which list stuff gets added to
on register, which list it gets freed from on unreg, etc., so that it is
clear at a quick glance.

Thx.

--
Regards/Gruss,
Boris.

https://people.kernel.org/tglx/notes-about-netiquette