struct multicall_entry entries[MC_BATCH];
 #if MC_DEBUG
        struct multicall_entry debug[MC_BATCH];
+       void *caller[MC_BATCH];
 #endif
        unsigned char args[MC_ARGS];
        struct callback {
                               ret, smp_processor_id());
                        dump_stack();
                        for (i = 0; i < b->mcidx; i++) {
-                               printk(KERN_DEBUG "  call %2d/%d: op=%lu arg=[%lx] result=%ld\n",
+                               printk(KERN_DEBUG "  call %2d/%d: op=%lu arg=[%lx] result=%ld\t%pF\n",
                                       i+1, b->mcidx,
                                       b->debug[i].op,
                                       b->debug[i].args[0],
-                                      b->entries[i].result);
+                                      b->entries[i].result,
+                                      b->caller[i]);
                        }
                }
 #endif
        }
 
        ret.mc = &b->entries[b->mcidx];
+#if MC_DEBUG	/* same test as the #if guarding caller[]; #ifdef is true even when MC_DEBUG is 0 */
+       b->caller[b->mcidx] = __builtin_return_address(0);
+#endif
        b->mcidx++;
        ret.args = &b->args[argidx];
        b->argidx = argidx + args;