Re: Maple tree implementation for irq descriptor management

From: Mukesh Ojha
Date: Fri Dec 15 2023 - 09:20:02 EST


Hi @Liam,

On 12/14/2023 1:05 AM, Liam R. Howlett wrote:
* Mukesh Ojha <quic_mojha@xxxxxxxxxxx> [231213 10:46]:
Hi All,

We are facing an issue in the maple tree implementation for irq descriptors:
while allocating a new descriptor in irq_create_mapping(index=300), it
gets interrupted and gets stuck in an infinite loop inside
mtree_lookup_walk()=>ma_dead_node(index=287) due to a dead node
(0xFFFFFF8819DECF00), and it is the same node where the descriptor from
the earlier call is about to be added.

What kernel version?

6.5


There was an issue with the tree a while back which could result in this
happening [1], although I was never successful in causing it or seeing
it before now.

Looking through the dump below, it appears that you do not have the
patches in [1], as they should prevent the node from being marked dead
until the new node exists in the tree. Note that this occurs in your
case in the splitting of the node, which should be fixed in the last patch
of the series.

[1] https://lore.kernel.org/all/20230804165951.2661157-3-Liam.Howlett@xxxxxxxxxx/T/#u

Thanks for the prompt response. Yes, these patches are missing.
Let me apply them and try.

-Mukesh

Thanks,
Liam



(struct maple_node *)0xFFFFFF8819DECF00 = 0xFFFFFF8819DECF00 -> (
parent = 0xFFFFFF8819DECF00,
slot = (0x0, 0x011E, 0x011F, 0x0120, 0x0121, 0x0122, 0x0123, 0x0124,
0x0125, 0x0126, 0x0127, 0x0128, 0x0129, 0x012A, 0x012B, 0xFFFFFF8813125600,
0xFFFFFF8828BC6E00, 0xFFFFFF8821A4C800, 0x
pad = 0xFFFFFF8819DECF00,
rcu = (next = 0x0, func = 0x011E),
piv_parent = 0x011F,
parent_slot = 32,
type = maple_dense = 0,
slot_len = 33,
ma_flags = 0,
mr64 = (
parent = 0xFFFFFF8819DECF00,
pivot = (0, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296,
297, 298, 299),
slot = (0xFFFFFF8813125600, 0xFFFFFF8828BC6E00, 0xFFFFFF8821A4C800,
0xFFFFFF8815595A00, 0xFFFFFF8815594400, 0xFFFFFF8815596800,
0xFFFFFF8815597E00, 0xFFFFFF88155B7C00, 0xFFFFFF881559400
pad = (0xFFFFFF8813125600, 0xFFFFFF8828BC6E00, 0xFFFFFF8821A4C800,
0xFFFFFF8815595A00, 0xFFFFFF8815594400, 0xFFFFFF8815596800,
0xFFFFFF8815597E00, 0xFFFFFF88155B7C00, 0xFFFFFF8815594000
meta = (end = 0, gap = 0)),
ma64 = (
parent = 0xFFFFFF8819DECF00,
pivot = (0, 286, 287, 288, 289, 290, 291, 292, 293),
slot = (0x0126, 0x0127, 0x0128, 0x0129, 0x012A, 0x012B,
0xFFFFFF8813125600, 0xFFFFFF8828BC6E00, 0xFFFFFF8821A4C800,
0xFFFFFF8815595A00),
gap = (18446743558671647744, 18446743558671656960,
18446743558671662592, 18446743558671793152, 18446743558671646720,
18446743558671650304, 18446743558800159744, 18446743558759686144, 18
meta = (end = 0, gap = 118)),
alloc = (total = 18446743558747508480, node_count = 0, request_count =
0, slot = (0x011E, 0x011F, 0x0120, 0x0121, 0x0122, 0x0123, 0x0124, 0x0125,
0x0126, 0x0127, 0x0128, 0x0129, 0x012A, 0

Backtrace:

-000|mtree_lookup_walk(inline)
| max = 18446744073709551615
| next = 0xFFFFFF881B197C1C
| offset = 2
| node = 0xFFFFFF881B197C00
| type = maple_arange_64
-000|mtree_load(mt = ?, index = 287)
| index = 287
| mas = (tree = 0xFFFFFFC081EB3EC0, index = 287, last = 287, node =
0xFFFFFF881B197C1C, min = 0, max = 18446744073709551615, alloc = 0x0, depth
= 1, offset = 0, mas_flags = 0)
| entry = 0x0
-001|irq_to_desc(inline)
-001|generic_handle_irq(irq = ?)
| irq = ?
-002|NSX:0x0::0xFFFFFFC07A0E0500(asm)
-003|__handle_irq_event_percpu(:desc = 0xFFFFFF8807D18600)
| desc = 0xFFFFFF8807D18600
| __already_done = FALSE
| irq = 17
| retval = IRQ_NONE
| res = IRQ_NONE
-004|handle_irq_event_percpu(inline)
| desc = 0xFFFFFF8807D18600
| retval = IRQ_NONE
-004|handle_irq_event(:desc = 0xFFFFFF8807D18600)
| desc = 0xFFFFFF8807D18600
| ret = IRQ_NONE
-005|handle_fasteoi_irq(desc = 0xFFFFFF8807D18600)
| desc = 0xFFFFFF8807D18600
| chip = 0xFFFFFFC081F21288
-006|generic_handle_irq_desc(inline)
-006|handle_irq_desc(inline)
-006|generic_handle_domain_irq(domain = ?, :hwirq = 261)
| domain = ?
| hwirq = 261
-007|__gic_handle_irq(inline)
| irqnr = 261
-007|__gic_handle_irq_from_irqson(inline)
| is_nmi = FALSE
| irqnr = 261
-007|gic_handle_irq()
-008|call_on_irq_stack(asm)
-009|do_interrupt_handler(inline)
| regs = 0xFFFFFFC082142DB0
| old_regs = 0x0
-009|__el1_irq(inline)
| regs = 0xFFFFFFC082142DB0
-009|el1_interrupt(regs = 0xFFFFFFC082142DB0, handler = 0xFFFFFFC0800100F8)
| regs = 0xFFFFFFC082142DB0
| handler = 0xFFFFFFC0800100F8
-010|el1h_64_irq_handler(regs = ?)
| regs = ?
-011|el1h_64_irq(asm)
-->|exception
-012|__memcpy(asm)
-013|mas_mab_cp(:mas = 0xFFFFFFC0821434A8, :mas_start = 80, mas_end = ?,
b_node = 0xFFFFFFC082143108, :mab_start = 80)
| mas = 0xFFFFFFC0821434A8
| mas_start = 0
| b_node = 0xFFFFFFC082143108
| mab_start = 0
| gaps = 0x0
| node = 0xFFFFFF88118A8900
| mt = maple_arange_64
| __fortify_size = 32
| __p_size = 18446744073709551615
| __p_size_field = 18446744073709551615
| __q_size = 0
-014|mast_fill_bnode(:mast = 0xFFFFFFC0821430C8, :mas = 0xFFFFFFC0821434A8,
:skip = 1)
| mast = 0xFFFFFFC0821430C8 -> (
| orig_l = 0xFFFFFFC082143000,
| orig_r = 0xFFFFFFC082142FC0,
| l = 0xFFFFFFC082143080 -> (
| tree = 0xFFFFFFC081EB3EC0,
| index = 300,
| last = 300,
| node = 0xFFFFFF881409570C,
| min = 285,
| max = 293,
| alloc = 0xFFFFFF8814094600,
| depth = 3,
| offset = 4,
| mas_flags = 0),
| m = 0x0,
| r = 0xFFFFFFC082143040 -> (
| tree = 0xFFFFFFC081EB3EC0,
| index = 300,
| last = 300,
| node = 0xFFFFFF881409510C,
| min = 294,
| max = 18446744073709551615,
| alloc = 0xFFFFFF8814094600,
| depth = 3,
| offset = 15,
| mas_flags = 0),
| free = 0xFFFFFFC082142FA8,
| destroy = 0x0,
| bn = 0xFFFFFFC082143108)
| mas = 0xFFFFFFC0821434A8
| skip = 1
| split = 0
| old = 0x0
-015|mas_split(inline)
| mas = 0xFFFFFFC0821434A8
| mast = (orig_l = 0xFFFFFFC082143000, orig_r = 0xFFFFFFC082142FC0, l =
0xFFFFFFC082143080, m = 0x0, r = 0xFFFFFFC082143040, free =
0xFFFFFFC082142FA8, destroy = 0x0, bn = 0xFFFFFFC082143108)
| l_mas = (tree = 0xFFFFFFC081EB3EC0, index = 300, last = 300, node =
0xFFFFFF881409570C, min = 285, max = 293, alloc = 0xFFFFFF8814094600, depth
= 3, offset = 4, mas_flags = 0)
| r_mas = (tree = 0xFFFFFFC081EB3EC0, index = 300, last = 300, node =
0xFFFFFF881409510C, min = 294, max = 18446744073709551615, alloc =
0xFFFFFF8814094600, depth = 3, offset = 15, mas_flags = 0)
| prev_l_mas = (tree = 0xFFFFFFC081EB3EC0, index = 300, last = 300,
node = 0x1, min = 0, max = 18446744073709551615, alloc = 0x0, depth = 0,
offset = 0, mas_flags = 0)
| prev_r_mas = (tree = 0xFFFFFFC081EB3EC0, index = 300, last = 300,
node = 0x1, min = 0, max = 18446744073709551615, alloc = 0x0, depth = 0,
offset = 0, mas_flags = 0)
| mat = (head = 0xFFFFFF8819DECF0C, tail = 0xFFFFFF8819DECF0C, mtree =
0xFFFFFFC081EB3EC0)
| mid_split = 0
-015|mas_commit_b_node(inline)
| b_type = maple_leaf_64
| node = 0x0
-015|mas_wr_bnode(inline)
| b_node = (
| parent = 0x0,
| pivot = (239, 254, 269, 284, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0),
| slot = (0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0,
0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0,
0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0),
| padding = (0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0),
| gap = (0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0),
| b_end = 4,
| type = maple_leaf_64)
-015|mas_wr_modify(:wr_mas = 0xFFFFFFC082143408)
-016|mas_wr_store_entry(:wr_mas = 0xFFFFFFC082143408)
| wr_mas = 0xFFFFFFC082143408 -> (
| mas = 0xFFFFFFC0821434A8 -> (
| tree = 0xFFFFFFC081EB3EC0,
| index = 300,
| last = 300,
| node = 0xFFFFFF88118A891C,
| min = 225,
| max = 18446744073709551615,
| alloc = 0xFFFFFF8814094600,
| depth = 3,
| offset = 2,
| mas_flags = 0),
| node = 0xFFFFFF8819DECF00,
| r_min = 300,
| r_max = 0xFFFFFFFFFFFFFFFF,
| type = maple_leaf_64,
| offset_end = 15,
| node_end = 15,
| pivots = 0xFFFFFF8819DECF08 -> 0,
| end_piv = 0xFFFFFFFFFFFFFFFF,
| slots = 0xFFFFFF8819DECF80 -> 0xFFFFFF8813125600 -> ,
| entry = 0xFFFFFF8848A27A00,
| content = 0x0)
| mas = 0x0
-017|mas_store_gfp(:mas = 0xFFFFFFC0821434A8, :entry = 0xFFFFFF8848A27A00,
:gfp = 3264)
| mas = 0xFFFFFFC0821434A8
| entry = 0xFFFFFF8848A27A00
| gfp = 3264
| wr_mas = (mas = 0xFFFFFFC0821434A8, node = 0xFFFFFF8819DECF00, r_min
= 300, r_max = 18446744073709551615, type = maple_leaf_64, offset_end = 15,
node_end = 15, pivots = 0xFFFFFF8819DECF08, end_piv = 18446744073709551615,
slots = 0xFFFFFF8819DECF80, entry = 0xFFFFFF8848A27A00, content = 0x0)
-018|irq_insert_desc(inline)
| desc = 0xFFFFFF8848A27A00
| mas = (tree = 0xFFFFFFC081EB3EC0, index = 300, last = 300, node =
0xFFFFFF88118A891C, min = 225, max = 18446744073709551615, alloc =
0xFFFFFF8814094600, depth = 3, offset = 2, mas_flags = 0)
-018|alloc_descs(inline)
| start = 300
| node = -1
| affinity = 0x0
| owner = 0x0
| desc = 0xFFFFFF8848A27A00
-018|__irq_alloc_descs(irq = ?, from = ?, :cnt = 1, node = ?, owner = 0x0,
:affinity = 0x0)
| cnt = 1
| owner = 0x0
| start = 300
-019|irq_domain_alloc_descs(inline)
| virq = -1
| cnt = 1
| hwirq = 0
| node = -1
| affinity = 0x0
-019|irq_create_mapping_affinity_locked(inline)
| domain = 0xFFFFFF885BFF6840
| hwirq = 0
| affinity = 0x0
| virq = 0
-019|irq_create_mapping_affinity(domain = 0xFFFFFF885BFF6840, hwirq = 0,
affinity = 0x0)
| domain = 0xFFFFFF885BFF6840
| hwirq = 0
| affinity = 0x0
-020|NSX:0x0::0xFFFFFFC07AE32720(asm)
-021|NSX:0x0::0xFFFFFFC07AC9AB38(asm)
-022|NSX:0x0::0xFFFFFFC07B3E49F4(asm)
-023|call_driver_probe(inline)
| dev = 0xFFFFFF8848951848
| drv = 0xFFFFFFC07AFD90C0
| ret = 0
-023|really_probe(:dev = 0xFFFFFF8848951848, :drv = 0xFFFFFFC07AFD90C0)
| dev = 0xFFFFFF8848951848
| drv = 0xFFFFFFC07AFD90C0
| link_ret = 0
| test_remove = FALSE
-024|__driver_probe_device(drv = 0xFFFFFFC07AFD90C0, :dev =
0xFFFFFF8848951848)
| drv = 0xFFFFFFC07AFD90C0
| dev = 0xFFFFFF8848951848
| ret = 0
-025|driver_probe_device(drv = 0xFFFFFFC07AFD90C0, :dev =
0xFFFFFF8848951848)
| drv = 0xFFFFFFC07AFD90C0
| dev = 0xFFFFFF8848951848
| trigger_count = 783
| ret = 0
-026|__device_attach_driver(drv = 0xFFFFFFC07AFD90C0, :_data =
0xFFFFFFC0821437E8)
| drv = 0xFFFFFFC07AFD90C0
| _data = 0xFFFFFFC0821437E8
| data = 0xFFFFFFC0821437E8
| dev = 0xFFFFFF8848951848
| ret = ???
-027|bus_for_each_drv(bus = ?, :start = 0xFFFFFFC0821437E0, :data =
0xFFFFFFC0821437E8, fn = 0xFFFFFFC08089C798)
| data = 0xFFFFFFC0821437E8
| fn = 0xFFFFFFC08089C798
| i = (i_klist = 0xFFFFFF881ED5C6C8, i_cur = 0xFFFFFF8823649968)
| sp = 0xFFFFFF881ED5C600
| error = 0
-028|__device_attach(dev = 0xFFFFFF8848951848)
| dev = 0xFFFFFF8848951848
| async = FALSE
| ret = 0
| data = (dev = 0xFFFFFF8848951848, check_async = TRUE, want_async =
FALSE, have_async = FALSE)
-029|device_initial_probe(dev = 0xFFFFFF8848951848)
| dev = 0xFFFFFF8848951848
-030|bus_probe_device(:dev = 0xFFFFFF8848951848)
| dev = 0xFFFFFF8848951848
| sp = 0xFFFFFF881ED5C600
| sif = 0x0
-031|device_add(:dev = 0xFFFFFF8848951848)
| dev = 0xFFFFFF8848951848
| sp = 0x0
| parent = 0xFFFFFF8851B70080
| class_intf = 0x0
| error = 0
| glue_dir = 0x0
-032|device_register(dev = 0xFFFFFF8848951848)
| dev = 0xFFFFFF8848951848
-033|NSX:0x0::0xFFFFFFC07B3E3944(asm)
-034|NSX:0x0::0xFFFFFFC07B3E3C20(asm)
-035|NSX:0x0::0xFFFFFFC07B6B5148(asm)
-036|platform_probe(:_dev = 0xFFFFFF8848956010)
| _dev = 0xFFFFFF8848956010
| drv = 0xFFFFFFC07B299648
| ret = 0
-037|call_driver_probe(inline)
| dev = 0xFFFFFF8848956010
| drv = 0xFFFFFFC07B299678
| ret = 0
-037|really_probe(:dev = 0xFFFFFF8848956010, :drv = 0xFFFFFFC07B299678)
| dev = 0xFFFFFF8848956010
| drv = 0xFFFFFFC07B299678
| link_ret = 0
| test_remove = FALSE
-038|__driver_probe_device(drv = 0xFFFFFFC07B299678, :dev =
0xFFFFFF8848956010)
| drv = 0xFFFFFFC07B299678
| dev = 0xFFFFFF8848956010
| ret = 0
-039|driver_probe_device(drv = 0xFFFFFFC07B299678, :dev =
0xFFFFFF8848956010)
| drv = 0xFFFFFFC07B299678
| dev = 0xFFFFFF8848956010
| trigger_count = 781
| ret = 0
-040|__device_attach_driver(drv = 0xFFFFFFC07B299678, :_data =
0xFFFFFFC082143BA8)
| drv = 0xFFFFFFC07B299678
| _data = 0xFFFFFFC082143BA8
| data = 0xFFFFFFC082143BA8
| dev = 0xFFFFFF8848956010
| ret = ???
-041|bus_for_each_drv(bus = ?, :start = 0xFFFFFFC082143BA0, :data =
0xFFFFFFC082143BA8, fn = 0xFFFFFFC08089C798)
| data = 0xFFFFFFC082143BA8
| fn = 0xFFFFFFC08089C798
| i = (i_klist = 0xFFFFFF8804034AC8, i_cur = 0xFFFFFF8821B45068)
| sp = 0xFFFFFF8804034A00
| error = 0
-042|__device_attach(dev = 0xFFFFFF8848956010)
| dev = 0xFFFFFF8848956010
| async = FALSE
| ret = 0
| data = (dev = 0xFFFFFF8848956010, check_async = TRUE, want_async =
FALSE, have_async = FALSE)
-043|device_initial_probe(dev = 0xFFFFFF8848956010)
| dev = 0xFFFFFF8848956010
-044|bus_probe_device(:dev = 0xFFFFFF8848956010)
| dev = 0xFFFFFF8848956010
| sp = 0xFFFFFF8804034A00
| sif = 0x0
-045|device_add(:dev = 0xFFFFFF8848956010)
| dev = 0xFFFFFF8848956010
| sp = 0x0
| parent = 0xFFFFFF8851BCE410
| class_intf = 0x0
| error = 0
| glue_dir = 0x0
-046|platform_device_add(pdev = 0xFFFFFF8848956000)
| pdev = 0xFFFFFF8848956000
-047|NSX:0x0::0xFFFFFFC07B73DD48(asm)
-048|process_one_work(:worker = 0xFFFFFF880300AF00, work =
0xFFFFFF8833434930)
| worker = 0xFFFFFF880300AF00
| work = 0xFFFFFF8833434930
| pool = 0xFFFFFF8B7DCAA180
| pwq = 0xFFFFFF8B7DCAE600
| collision = 0x0
| work_data = 18446743573308827141
-049|worker_thread(:__worker = 0xFFFFFF880300AF00)
| __worker = 0xFFFFFF880300AF00
| worker = 0x0
| pool = 0xFFFFFF8B7DCAA180
-050|kthread(_create = 0xFFFFFF8803290240)
| _create = 0xFFFFFF8803290240
| param = (sched_priority = 0)
| create = 0x0
| data = 0xFFFFFF880300AF00
| threadfn = 0x0
| ret = ???
| self = 0xFFFFFF88030D8180
| done = 0xFFFFFFC082133CB8
-051|ret_from_fork(asm)
---|end of frame

-Mukesh