Maple tree implementation for irq descriptor management

Mukesh Ojha quic_mojha at quicinc.com
Fri Dec 15 06:18:50 PST 2023


Hi @Liam,

On 12/14/2023 1:05 AM, Liam R. Howlett wrote:
> * Mukesh Ojha <quic_mojha at quicinc.com> [231213 10:46]:
>> Hi All,
>>
>> We are facing an issue in the maple tree implementation for irq descriptors
>> where, while allocating a new descriptor in irq_create_mapping(index=300), it
>> gets interrupted and gets stuck in an infinite loop inside
>> mtree_lookup_walk()=>ma_dead_node(index=287) due to a dead node
>> (0xFFFFFF8819DECF00), and it is the same node where the earlier call
>> for creating the descriptor is about to add it.
> 
> What kernel version?

6.5

> 
> There was an issue with the tree a while back which could result in this
> happening [1], although I was never successful in causing it or seeing
> it before now.
> 
> Looking through the dump below, it appears that you do not have the
> patches in [1] as they should prevent the node from being marked dead
> until the new node exists in the tree.  Note that this occurs in your
> case in splitting of the node which should be fixed in the last patch of
> the series.
> 
> [1] https://lore.kernel.org/all/20230804165951.2661157-3-Liam.Howlett@oracle.com/T/#u

Thanks for the prompt response. Yes, these patches are missing.
Let me apply them and try.

-Mukesh
> 
> Thanks,
> Liam
> 
>>
>>
>>    (struct maple_node *)0xFFFFFF8819DECF00 = 0xFFFFFF8819DECF00 -> (
>>      parent = 0xFFFFFF8819DECF00,
>>      slot = (0x0, 0x011E, 0x011F, 0x0120, 0x0121, 0x0122, 0x0123, 0x0124,
>> 0x0125, 0x0126, 0x0127, 0x0128, 0x0129, 0x012A, 0x012B, 0xFFFFFF8813125600,
>> 0xFFFFFF8828BC6E00, 0xFFFFFF8821A4C800, 0x
>>      pad = 0xFFFFFF8819DECF00,
>>      rcu = (next = 0x0, func = 0x011E),
>>      piv_parent = 0x011F,
>>      parent_slot = 32,
>>      type = maple_dense = 0,
>>      slot_len = 33,
>>      ma_flags = 0,
>>      mr64 = (
>>        parent = 0xFFFFFF8819DECF00,
>>        pivot = (0, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296,
>> 297, 298, 299),
>>        slot = (0xFFFFFF8813125600, 0xFFFFFF8828BC6E00, 0xFFFFFF8821A4C800,
>> 0xFFFFFF8815595A00, 0xFFFFFF8815594400, 0xFFFFFF8815596800,
>> 0xFFFFFF8815597E00, 0xFFFFFF88155B7C00, 0xFFFFFF881559400
>>        pad = (0xFFFFFF8813125600, 0xFFFFFF8828BC6E00, 0xFFFFFF8821A4C800,
>> 0xFFFFFF8815595A00, 0xFFFFFF8815594400, 0xFFFFFF8815596800,
>> 0xFFFFFF8815597E00, 0xFFFFFF88155B7C00, 0xFFFFFF8815594000
>>        meta = (end = 0, gap = 0)),
>>      ma64 = (
>>        parent = 0xFFFFFF8819DECF00,
>>        pivot = (0, 286, 287, 288, 289, 290, 291, 292, 293),
>>        slot = (0x0126, 0x0127, 0x0128, 0x0129, 0x012A, 0x012B,
>> 0xFFFFFF8813125600, 0xFFFFFF8828BC6E00, 0xFFFFFF8821A4C800,
>> 0xFFFFFF8815595A00),
>>        gap = (18446743558671647744, 18446743558671656960,
>> 18446743558671662592, 18446743558671793152, 18446743558671646720,
>> 18446743558671650304, 18446743558800159744, 18446743558759686144, 18
>>        meta = (end = 0, gap = 118)),
>>      alloc = (total = 18446743558747508480, node_count = 0, request_count =
>> 0, slot = (0x011E, 0x011F, 0x0120, 0x0121, 0x0122, 0x0123, 0x0124, 0x0125,
>> 0x0126, 0x0127, 0x0128, 0x0129, 0x012A, 0
>>
>> Backtrace:
>>
>> -000|mtree_lookup_walk(inline)
>>      |  max = 18446744073709551615
>>      |  next = 0xFFFFFF881B197C1C
>>      |  offset = 2
>>      |  node = 0xFFFFFF881B197C00
>>      |  type = maple_arange_64
>> -000|mtree_load(mt = ?, index = 287)
>>      |  index = 287
>>      |  mas = (tree = 0xFFFFFFC081EB3EC0, index = 287, last = 287, node =
>> 0xFFFFFF881B197C1C, min = 0, max = 18446744073709551615, alloc = 0x0, depth
>> = 1, offset = 0, mas_flags = 0)
>>      |  entry = 0x0
>> -001|irq_to_desc(inline)
>> -001|generic_handle_irq(irq = ?)
>>      |  irq = ?
>> -002|NSX:0x0::0xFFFFFFC07A0E0500(asm)
>> -003|__handle_irq_event_percpu(:desc = 0xFFFFFF8807D18600)
>>      |  desc = 0xFFFFFF8807D18600
>>      |  __already_done = FALSE
>>      |  irq = 17
>>      |  retval = IRQ_NONE
>>      |  res = IRQ_NONE
>> -004|handle_irq_event_percpu(inline)
>>      |  desc = 0xFFFFFF8807D18600
>>      |  retval = IRQ_NONE
>> -004|handle_irq_event(:desc = 0xFFFFFF8807D18600)
>>      |  desc = 0xFFFFFF8807D18600
>>      |  ret = IRQ_NONE
>> -005|handle_fasteoi_irq(desc = 0xFFFFFF8807D18600)
>>      |  desc = 0xFFFFFF8807D18600
>>      |  chip = 0xFFFFFFC081F21288
>> -006|generic_handle_irq_desc(inline)
>> -006|handle_irq_desc(inline)
>> -006|generic_handle_domain_irq(domain = ?, :hwirq = 261)
>>      |  domain = ?
>>      |  hwirq = 261
>> -007|__gic_handle_irq(inline)
>>      |  irqnr = 261
>> -007|__gic_handle_irq_from_irqson(inline)
>>      |  is_nmi = FALSE
>>      |  irqnr = 261
>> -007|gic_handle_irq()
>> -008|call_on_irq_stack(asm)
>> -009|do_interrupt_handler(inline)
>>      |  regs = 0xFFFFFFC082142DB0
>>      |  old_regs = 0x0
>> -009|__el1_irq(inline)
>>      |  regs = 0xFFFFFFC082142DB0
>> -009|el1_interrupt(regs = 0xFFFFFFC082142DB0, handler = 0xFFFFFFC0800100F8)
>>      |  regs = 0xFFFFFFC082142DB0
>>      |  handler = 0xFFFFFFC0800100F8
>> -010|el1h_64_irq_handler(regs = ?)
>>      |  regs = ?
>> -011|el1h_64_irq(asm)
>>   -->|exception
>> -012|__memcpy(asm)
>> -013|mas_mab_cp(:mas = 0xFFFFFFC0821434A8, :mas_start = 80, mas_end = ?,
>> b_node = 0xFFFFFFC082143108, :mab_start = 80)
>>      |  mas = 0xFFFFFFC0821434A8
>>      |  mas_start = 0
>>      |  b_node = 0xFFFFFFC082143108
>>      |  mab_start = 0
>>      |  gaps = 0x0
>>      |  node = 0xFFFFFF88118A8900
>>      |  mt = maple_arange_64
>>      |  __fortify_size = 32
>>      |  __p_size = 18446744073709551615
>>      |  __p_size_field = 18446744073709551615
>>      |  __q_size = 0
>> -014|mast_fill_bnode(:mast = 0xFFFFFFC0821430C8, :mas = 0xFFFFFFC0821434A8,
>> :skip = 1)
>>      |  mast = 0xFFFFFFC0821430C8 -> (
>>      |    orig_l = 0xFFFFFFC082143000,
>>      |    orig_r = 0xFFFFFFC082142FC0,
>>      |    l = 0xFFFFFFC082143080 -> (
>>      |      tree = 0xFFFFFFC081EB3EC0,
>>      |      index = 300,
>>      |      last = 300,
>>      |      node = 0xFFFFFF881409570C,
>>      |      min = 285,
>>      |      max = 293,
>>      |      alloc = 0xFFFFFF8814094600,
>>      |      depth = 3,
>>      |      offset = 4,
>>      |      mas_flags = 0),
>>      |    m = 0x0,
>>      |    r = 0xFFFFFFC082143040 -> (
>>      |      tree = 0xFFFFFFC081EB3EC0,
>>      |      index = 300,
>>      |      last = 300,
>>      |      node = 0xFFFFFF881409510C,
>>      |      min = 294,
>>      |      max = 18446744073709551615,
>>      |      alloc = 0xFFFFFF8814094600,
>>      |      depth = 3,
>>      |      offset = 15,
>>      |      mas_flags = 0),
>>      |    free = 0xFFFFFFC082142FA8,
>>      |    destroy = 0x0,
>>      |    bn = 0xFFFFFFC082143108)
>>      |  mas = 0xFFFFFFC0821434A8
>>      |  skip = 1
>>      |  split = 0
>>      |  old = 0x0
>> -015|mas_split(inline)
>>      |  mas = 0xFFFFFFC0821434A8
>>      |  mast = (orig_l = 0xFFFFFFC082143000, orig_r = 0xFFFFFFC082142FC0, l =
>> 0xFFFFFFC082143080, m = 0x0, r = 0xFFFFFFC082143040, free =
>> 0xFFFFFFC082142FA8, destroy = 0x0, bn = 0xFFFFFFC082143108)
>>      |  l_mas = (tree = 0xFFFFFFC081EB3EC0, index = 300, last = 300, node =
>> 0xFFFFFF881409570C, min = 285, max = 293, alloc = 0xFFFFFF8814094600, depth
>> = 3, offset = 4, mas_flags = 0)
>>      |  r_mas = (tree = 0xFFFFFFC081EB3EC0, index = 300, last = 300, node =
>> 0xFFFFFF881409510C, min = 294, max = 18446744073709551615, alloc =
>> 0xFFFFFF8814094600, depth = 3, offset = 15, mas_flags = 0)
>>      |  prev_l_mas = (tree = 0xFFFFFFC081EB3EC0, index = 300, last = 300,
>> node = 0x1, min = 0, max = 18446744073709551615, alloc = 0x0, depth = 0,
>> offset = 0, mas_flags = 0)
>>      |  prev_r_mas = (tree = 0xFFFFFFC081EB3EC0, index = 300, last = 300,
>> node = 0x1, min = 0, max = 18446744073709551615, alloc = 0x0, depth = 0,
>> offset = 0, mas_flags = 0)
>>      |  mat = (head = 0xFFFFFF8819DECF0C, tail = 0xFFFFFF8819DECF0C, mtree =
>> 0xFFFFFFC081EB3EC0)
>>      |  mid_split = 0
>> -015|mas_commit_b_node(inline)
>>      |  b_type = maple_leaf_64
>>      |  node = 0x0
>> -015|mas_wr_bnode(inline)
>>      |  b_node = (
>>      |    parent = 0x0,
>>      |    pivot = (239, 254, 269, 284, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
>> 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0),
>>      |    slot = (0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0,
>> 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0,
>> 0x0, 0x0, 0x0, 0x0, 0x0, 0x0, 0x0),
>>      |    padding = (0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
>> 0, 0),
>>      |    gap = (0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
>> 0),
>>      |    b_end = 4,
>>      |    type = maple_leaf_64)
>> -015|mas_wr_modify(:wr_mas = 0xFFFFFFC082143408)
>> -016|mas_wr_store_entry(:wr_mas = 0xFFFFFFC082143408)
>>      |  wr_mas = 0xFFFFFFC082143408 -> (
>>      |    mas = 0xFFFFFFC0821434A8 -> (
>>      |      tree = 0xFFFFFFC081EB3EC0,
>>      |      index = 300,
>>      |      last = 300,
>>      |      node = 0xFFFFFF88118A891C,
>>      |      min = 225,
>>      |      max = 18446744073709551615,
>>      |      alloc = 0xFFFFFF8814094600,
>>      |      depth = 3,
>>      |      offset = 2,
>>      |      mas_flags = 0),
>>      |    node = 0xFFFFFF8819DECF00,
>>      |    r_min = 300,
>>      |    r_max = 0xFFFFFFFFFFFFFFFF,
>>      |    type = maple_leaf_64,
>>      |    offset_end = 15,
>>      |    node_end = 15,
>>      |    pivots = 0xFFFFFF8819DECF08 -> 0,
>>      |    end_piv = 0xFFFFFFFFFFFFFFFF,
>>      |    slots = 0xFFFFFF8819DECF80 -> 0xFFFFFF8813125600 -> ,
>>      |    entry = 0xFFFFFF8848A27A00,
>>      |    content = 0x0)
>>      |  mas = 0x0
>> -017|mas_store_gfp(:mas = 0xFFFFFFC0821434A8, :entry = 0xFFFFFF8848A27A00,
>> :gfp = 3264)
>>      |  mas = 0xFFFFFFC0821434A8
>>      |  entry = 0xFFFFFF8848A27A00
>>      |  gfp = 3264
>>      |  wr_mas = (mas = 0xFFFFFFC0821434A8, node = 0xFFFFFF8819DECF00, r_min
>> = 300, r_max = 18446744073709551615, type = maple_leaf_64, offset_end = 15,
>> node_end = 15, pivots = 0xFFFFFF8819DECF08, end_piv = 18446744073709551615,
>> slots = 0xFFFFFF8819DECF80, entry = 0xFFFFFF8848A27A00, content = 0x0)
>> -018|irq_insert_desc(inline)
>>      |  desc = 0xFFFFFF8848A27A00
>>      |  mas = (tree = 0xFFFFFFC081EB3EC0, index = 300, last = 300, node =
>> 0xFFFFFF88118A891C, min = 225, max = 18446744073709551615, alloc =
>> 0xFFFFFF8814094600, depth = 3, offset = 2, mas_flags = 0)
>> -018|alloc_descs(inline)
>>      |  start = 300
>>      |  node = -1
>>      |  affinity = 0x0
>>      |  owner = 0x0
>>      |  desc = 0xFFFFFF8848A27A00
>> -018|__irq_alloc_descs(irq = ?, from = ?, :cnt = 1, node = ?, owner = 0x0,
>> :affinity = 0x0)
>>      |  cnt = 1
>>      |  owner = 0x0
>>      |  start = 300
>> -019|irq_domain_alloc_descs(inline)
>>      |  virq = -1
>>      |  cnt = 1
>>      |  hwirq = 0
>>      |  node = -1
>>      |  affinity = 0x0
>> -019|irq_create_mapping_affinity_locked(inline)
>>      |  domain = 0xFFFFFF885BFF6840
>>      |  hwirq = 0
>>      |  affinity = 0x0
>>      |  virq = 0
>> -019|irq_create_mapping_affinity(domain = 0xFFFFFF885BFF6840, hwirq = 0,
>> affinity = 0x0)
>>      |  domain = 0xFFFFFF885BFF6840
>>      |  hwirq = 0
>>      |  affinity = 0x0
>> -020|NSX:0x0::0xFFFFFFC07AE32720(asm)
>> -021|NSX:0x0::0xFFFFFFC07AC9AB38(asm)
>> -022|NSX:0x0::0xFFFFFFC07B3E49F4(asm)
>> -023|call_driver_probe(inline)
>>      |  dev = 0xFFFFFF8848951848
>>      |  drv = 0xFFFFFFC07AFD90C0
>>      |  ret = 0
>> -023|really_probe(:dev = 0xFFFFFF8848951848, :drv = 0xFFFFFFC07AFD90C0)
>>      |  dev = 0xFFFFFF8848951848
>>      |  drv = 0xFFFFFFC07AFD90C0
>>      |  link_ret = 0
>>      |  test_remove = FALSE
>> -024|__driver_probe_device(drv = 0xFFFFFFC07AFD90C0, :dev =
>> 0xFFFFFF8848951848)
>>      |  drv = 0xFFFFFFC07AFD90C0
>>      |  dev = 0xFFFFFF8848951848
>>      |  ret = 0
>> -025|driver_probe_device(drv = 0xFFFFFFC07AFD90C0, :dev =
>> 0xFFFFFF8848951848)
>>      |  drv = 0xFFFFFFC07AFD90C0
>>      |  dev = 0xFFFFFF8848951848
>>      |  trigger_count = 783
>>      |  ret = 0
>> -026|__device_attach_driver(drv = 0xFFFFFFC07AFD90C0, :_data =
>> 0xFFFFFFC0821437E8)
>>      |  drv = 0xFFFFFFC07AFD90C0
>>      |  _data = 0xFFFFFFC0821437E8
>>      |  data = 0xFFFFFFC0821437E8
>>      |  dev = 0xFFFFFF8848951848
>>      |  ret = ???
>> -027|bus_for_each_drv(bus = ?, :start = 0xFFFFFFC0821437E0, :data =
>> 0xFFFFFFC0821437E8, fn = 0xFFFFFFC08089C798)
>>      |  data = 0xFFFFFFC0821437E8
>>      |  fn = 0xFFFFFFC08089C798
>>      |  i = (i_klist = 0xFFFFFF881ED5C6C8, i_cur = 0xFFFFFF8823649968)
>>      |  sp = 0xFFFFFF881ED5C600
>>      |  error = 0
>> -028|__device_attach(dev = 0xFFFFFF8848951848)
>>      |  dev = 0xFFFFFF8848951848
>>      |  async = FALSE
>>      |  ret = 0
>>      |  data = (dev = 0xFFFFFF8848951848, check_async = TRUE, want_async =
>> FALSE, have_async = FALSE)
>> -029|device_initial_probe(dev = 0xFFFFFF8848951848)
>>      |  dev = 0xFFFFFF8848951848
>> -030|bus_probe_device(:dev = 0xFFFFFF8848951848)
>>      |  dev = 0xFFFFFF8848951848
>>      |  sp = 0xFFFFFF881ED5C600
>>      |  sif = 0x0
>> -031|device_add(:dev = 0xFFFFFF8848951848)
>>      |  dev = 0xFFFFFF8848951848
>>      |  sp = 0x0
>>      |  parent = 0xFFFFFF8851B70080
>>      |  class_intf = 0x0
>>      |  error = 0
>>      |  glue_dir = 0x0
>> -032|device_register(dev = 0xFFFFFF8848951848)
>>      |  dev = 0xFFFFFF8848951848
>> -033|NSX:0x0::0xFFFFFFC07B3E3944(asm)
>> -034|NSX:0x0::0xFFFFFFC07B3E3C20(asm)
>> -035|NSX:0x0::0xFFFFFFC07B6B5148(asm)
>> -036|platform_probe(:_dev = 0xFFFFFF8848956010)
>>      |  _dev = 0xFFFFFF8848956010
>>      |  drv = 0xFFFFFFC07B299648
>>      |  ret = 0
>> -037|call_driver_probe(inline)
>>      |  dev = 0xFFFFFF8848956010
>>      |  drv = 0xFFFFFFC07B299678
>>      |  ret = 0
>> -037|really_probe(:dev = 0xFFFFFF8848956010, :drv = 0xFFFFFFC07B299678)
>>      |  dev = 0xFFFFFF8848956010
>>      |  drv = 0xFFFFFFC07B299678
>>      |  link_ret = 0
>>      |  test_remove = FALSE
>> -038|__driver_probe_device(drv = 0xFFFFFFC07B299678, :dev =
>> 0xFFFFFF8848956010)
>>      |  drv = 0xFFFFFFC07B299678
>>      |  dev = 0xFFFFFF8848956010
>>      |  ret = 0
>> -039|driver_probe_device(drv = 0xFFFFFFC07B299678, :dev =
>> 0xFFFFFF8848956010)
>>      |  drv = 0xFFFFFFC07B299678
>>      |  dev = 0xFFFFFF8848956010
>>      |  trigger_count = 781
>>      |  ret = 0
>> -040|__device_attach_driver(drv = 0xFFFFFFC07B299678, :_data =
>> 0xFFFFFFC082143BA8)
>>      |  drv = 0xFFFFFFC07B299678
>>      |  _data = 0xFFFFFFC082143BA8
>>      |  data = 0xFFFFFFC082143BA8
>>      |  dev = 0xFFFFFF8848956010
>>      |  ret = ???
>> -041|bus_for_each_drv(bus = ?, :start = 0xFFFFFFC082143BA0, :data =
>> 0xFFFFFFC082143BA8, fn = 0xFFFFFFC08089C798)
>>      |  data = 0xFFFFFFC082143BA8
>>      |  fn = 0xFFFFFFC08089C798
>>      |  i = (i_klist = 0xFFFFFF8804034AC8, i_cur = 0xFFFFFF8821B45068)
>>      |  sp = 0xFFFFFF8804034A00
>>      |  error = 0
>> -042|__device_attach(dev = 0xFFFFFF8848956010)
>>      |  dev = 0xFFFFFF8848956010
>>      |  async = FALSE
>>      |  ret = 0
>>      |  data = (dev = 0xFFFFFF8848956010, check_async = TRUE, want_async =
>> FALSE, have_async = FALSE)
>> -043|device_initial_probe(dev = 0xFFFFFF8848956010)
>>      |  dev = 0xFFFFFF8848956010
>> -044|bus_probe_device(:dev = 0xFFFFFF8848956010)
>>      |  dev = 0xFFFFFF8848956010
>>      |  sp = 0xFFFFFF8804034A00
>>      |  sif = 0x0
>> -045|device_add(:dev = 0xFFFFFF8848956010)
>>      |  dev = 0xFFFFFF8848956010
>>      |  sp = 0x0
>>      |  parent = 0xFFFFFF8851BCE410
>>      |  class_intf = 0x0
>>      |  error = 0
>>      |  glue_dir = 0x0
>> -046|platform_device_add(pdev = 0xFFFFFF8848956000)
>>      |  pdev = 0xFFFFFF8848956000
>> -047|NSX:0x0::0xFFFFFFC07B73DD48(asm)
>> -048|process_one_work(:worker = 0xFFFFFF880300AF00, work =
>> 0xFFFFFF8833434930)
>>      |  worker = 0xFFFFFF880300AF00
>>      |  work = 0xFFFFFF8833434930
>>      |  pool = 0xFFFFFF8B7DCAA180
>>      |  pwq = 0xFFFFFF8B7DCAE600
>>      |  collision = 0x0
>>      |  work_data = 18446743573308827141
>> -049|worker_thread(:__worker = 0xFFFFFF880300AF00)
>>      |  __worker = 0xFFFFFF880300AF00
>>      |  worker = 0x0
>>      |  pool = 0xFFFFFF8B7DCAA180
>> -050|kthread(_create = 0xFFFFFF8803290240)
>>      |  _create = 0xFFFFFF8803290240
>>      |  param = (sched_priority = 0)
>>      |  create = 0x0
>>      |  data = 0xFFFFFF880300AF00
>>      |  threadfn = 0x0
>>      |  ret = ???
>>      |  self = 0xFFFFFF88030D8180
>>      |  done = 0xFFFFFFC082133CB8
>> -051|ret_from_fork(asm)
>>   ---|end of frame
>>
>> -Mukesh



More information about the maple-tree mailing list