Add kmalloc failover to vmalloc

[lttng-modules.git] / lib / ringbuffer / ring_buffer_frontend.c
diff --git a/lib/ringbuffer/ring_buffer_frontend.c b/lib/ringbuffer/ring_buffer_frontend.c

index 5d4be3b3dcf4ddc60920377c3d1f160ceb629261..1e439803735ae28814216ee0a4ca132c0c1caf33 100644 (file)
--- a/lib/ringbuffer/ring_buffer_frontend.c
+++ b/lib/ringbuffer/ring_buffer_frontend.c
@@ -54,6 +54,7 @@
  #include <linux/delay.h>
  #include <linux/module.h>
  #include <linux/percpu.h>
+#include <asm/cacheflush.h>
  
  #include <wrapper/ringbuffer/config.h>
  #include <wrapper/ringbuffer/backend.h>
@@ -64,6 +65,7 @@
  #include <wrapper/kref.h>
  #include <wrapper/percpu-defs.h>
  #include <wrapper/timer.h>
+#include <wrapper/vmalloc.h>
  
  /*
   * Internal structure representing offsets to use at a sub-buffer switch.
@@ -146,8 +148,8 @@ void lib_ring_buffer_free(struct lib_ring_buffer *buf)
         struct channel *chan = buf->backend.chan;
  
         lib_ring_buffer_print_errors(chan, buf, buf->backend.cpu);
-       kfree(buf->commit_hot);
-       kfree(buf->commit_cold);
+       lttng_kvfree(buf->commit_hot);
+       lttng_kvfree(buf->commit_cold);
  
         lib_ring_buffer_backend_free(&buf->backend);
  }
@@ -244,7 +246,7 @@ int lib_ring_buffer_create(struct lib_ring_buffer *buf,
                 return ret;
  
         buf->commit_hot =
-               kzalloc_node(ALIGN(sizeof(*buf->commit_hot)
+               lttng_kvzalloc_node(ALIGN(sizeof(*buf->commit_hot)
                                    * chan->backend.num_subbuf,
                                    1 << INTERNODE_CACHE_SHIFT),
                         GFP_KERNEL | __GFP_NOWARN,
@@ -255,7 +257,7 @@ int lib_ring_buffer_create(struct lib_ring_buffer *buf,
         }
  
         buf->commit_cold =
-               kzalloc_node(ALIGN(sizeof(*buf->commit_cold)
+               lttng_kvzalloc_node(ALIGN(sizeof(*buf->commit_cold)
                                    * chan->backend.num_subbuf,
                                    1 << INTERNODE_CACHE_SHIFT),
                         GFP_KERNEL | __GFP_NOWARN,
@@ -304,9 +306,9 @@ int lib_ring_buffer_create(struct lib_ring_buffer *buf,
  
         /* Error handling */
  free_init:
-       kfree(buf->commit_cold);
+       lttng_kvfree(buf->commit_cold);
  free_commit:
-       kfree(buf->commit_hot);
+       lttng_kvfree(buf->commit_hot);
  free_chanbuf:
         lib_ring_buffer_backend_free(&buf->backend);
         return ret;
@@ -451,7 +453,81 @@ static void lib_ring_buffer_stop_read_timer(struct lib_ring_buffer *buf)
         buf->read_timer_enabled = 0;
  }
  
+#if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,10,0))
+
+enum cpuhp_state lttng_rb_hp_prepare;
+enum cpuhp_state lttng_rb_hp_online;
+
+void lttng_rb_set_hp_prepare(enum cpuhp_state val)
+{
+       lttng_rb_hp_prepare = val;
+}
+EXPORT_SYMBOL_GPL(lttng_rb_set_hp_prepare);
+
+void lttng_rb_set_hp_online(enum cpuhp_state val)
+{
+       lttng_rb_hp_online = val;
+}
+EXPORT_SYMBOL_GPL(lttng_rb_set_hp_online);
+
+int lttng_cpuhp_rb_frontend_dead(unsigned int cpu,
+               struct lttng_cpuhp_node *node)
+{
+       struct channel *chan = container_of(node, struct channel,
+                                           cpuhp_prepare);
+       struct lib_ring_buffer *buf = per_cpu_ptr(chan->backend.buf, cpu);
+       const struct lib_ring_buffer_config *config = &chan->backend.config;
+
+       CHAN_WARN_ON(chan, config->alloc == RING_BUFFER_ALLOC_GLOBAL);
+
+       /*
+        * Performing a buffer switch on a remote CPU. Performed by
+        * the CPU responsible for doing the hotunplug after the target
+        * CPU stopped running completely. Ensures that all data
+        * from that remote CPU is flushed.
+        */
+       lib_ring_buffer_switch_slow(buf, SWITCH_ACTIVE);
+       return 0;
+}
+EXPORT_SYMBOL_GPL(lttng_cpuhp_rb_frontend_dead);
+
+int lttng_cpuhp_rb_frontend_online(unsigned int cpu,
+               struct lttng_cpuhp_node *node)
+{
+       struct channel *chan = container_of(node, struct channel,
+                                           cpuhp_online);
+       struct lib_ring_buffer *buf = per_cpu_ptr(chan->backend.buf, cpu);
+       const struct lib_ring_buffer_config *config = &chan->backend.config;
+
+       CHAN_WARN_ON(chan, config->alloc == RING_BUFFER_ALLOC_GLOBAL);
+
+       wake_up_interruptible(&chan->hp_wait);
+       lib_ring_buffer_start_switch_timer(buf);
+       lib_ring_buffer_start_read_timer(buf);
+       return 0;
+}
+EXPORT_SYMBOL_GPL(lttng_cpuhp_rb_frontend_online);
+
+int lttng_cpuhp_rb_frontend_offline(unsigned int cpu,
+               struct lttng_cpuhp_node *node)
+{
+       struct channel *chan = container_of(node, struct channel,
+                                           cpuhp_online);
+       struct lib_ring_buffer *buf = per_cpu_ptr(chan->backend.buf, cpu);
+       const struct lib_ring_buffer_config *config = &chan->backend.config;
+
+       CHAN_WARN_ON(chan, config->alloc == RING_BUFFER_ALLOC_GLOBAL);
+
+       lib_ring_buffer_stop_switch_timer(buf);
+       lib_ring_buffer_stop_read_timer(buf);
+       return 0;
+}
+EXPORT_SYMBOL_GPL(lttng_cpuhp_rb_frontend_offline);
+
+#else /* #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,10,0)) */
+
  #ifdef CONFIG_HOTPLUG_CPU
+
  /**
   *     lib_ring_buffer_cpu_hp_callback - CPU hotplug callback
   *     @nb: notifier block
@@ -507,8 +583,11 @@ int lib_ring_buffer_cpu_hp_callback(struct notifier_block *nb,
                 return NOTIFY_DONE;
         }
  }
+
  #endif
  
+#endif /* #else #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,10,0)) */
+
  #if defined(CONFIG_NO_HZ) && defined(CONFIG_LIB_RING_BUFFER)
  /*
   * For per-cpu buffers, call the reader wakeups before switching the buffer, so
@@ -597,7 +676,6 @@ void notrace lib_ring_buffer_tick_nohz_restart(void)
  static void channel_unregister_notifiers(struct channel *chan)
  {
         const struct lib_ring_buffer_config *config = &chan->backend.config;
-       int cpu;
  
         channel_iterator_unregister_notifiers(chan);
         if (config->alloc == RING_BUFFER_ALLOC_PER_CPU) {
@@ -614,25 +692,42 @@ static void channel_unregister_notifiers(struct channel *chan)
                  * concurrency.
                  */
  #endif /* CONFIG_NO_HZ */
-#ifdef CONFIG_HOTPLUG_CPU
-               get_online_cpus();
-               chan->cpu_hp_enable = 0;
-               for_each_online_cpu(cpu) {
-                       struct lib_ring_buffer *buf = per_cpu_ptr(chan->backend.buf,
-                                                             cpu);
-                       lib_ring_buffer_stop_switch_timer(buf);
-                       lib_ring_buffer_stop_read_timer(buf);
+#if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,10,0))
+               {
+                       int ret;
+
+                       ret = cpuhp_state_remove_instance(lttng_rb_hp_online,
+                               &chan->cpuhp_online.node);
+                       WARN_ON(ret);
+                       ret = cpuhp_state_remove_instance_nocalls(lttng_rb_hp_prepare,
+                               &chan->cpuhp_prepare.node);
+                       WARN_ON(ret);
                 }
-               put_online_cpus();
-               unregister_cpu_notifier(&chan->cpu_hp_notifier);
+#else /* #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,10,0)) */
+               {
+                       int cpu;
+
+#ifdef CONFIG_HOTPLUG_CPU
+                       get_online_cpus();
+                       chan->cpu_hp_enable = 0;
+                       for_each_online_cpu(cpu) {
+                               struct lib_ring_buffer *buf = per_cpu_ptr(chan->backend.buf,
+                                                                     cpu);
+                               lib_ring_buffer_stop_switch_timer(buf);
+                               lib_ring_buffer_stop_read_timer(buf);
+                       }
+                       put_online_cpus();
+                       unregister_cpu_notifier(&chan->cpu_hp_notifier);
  #else
-               for_each_possible_cpu(cpu) {
-                       struct lib_ring_buffer *buf = per_cpu_ptr(chan->backend.buf,
-                                                             cpu);
-                       lib_ring_buffer_stop_switch_timer(buf);
-                       lib_ring_buffer_stop_read_timer(buf);
-               }
+                       for_each_possible_cpu(cpu) {
+                               struct lib_ring_buffer *buf = per_cpu_ptr(chan->backend.buf,
+                                                                     cpu);
+                               lib_ring_buffer_stop_switch_timer(buf);
+                               lib_ring_buffer_stop_read_timer(buf);
+                       }
  #endif
+               }
+#endif /* #else #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,10,0)) */
         } else {
                 struct lib_ring_buffer *buf = chan->backend.buf;
  
@@ -733,7 +828,7 @@ struct channel *channel_create(const struct lib_ring_buffer_config *config,
                    size_t num_subbuf, unsigned int switch_timer_interval,
                    unsigned int read_timer_interval)
  {
-       int ret, cpu;
+       int ret;
         struct channel *chan;
  
         if (lib_ring_buffer_check_config(config, switch_timer_interval,
@@ -761,6 +856,56 @@ struct channel *channel_create(const struct lib_ring_buffer_config *config,
         init_waitqueue_head(&chan->hp_wait);
  
         if (config->alloc == RING_BUFFER_ALLOC_PER_CPU) {
+#if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,10,0))
+               chan->cpuhp_prepare.component = LTTNG_RING_BUFFER_FRONTEND;
+               ret = cpuhp_state_add_instance_nocalls(lttng_rb_hp_prepare,
+                       &chan->cpuhp_prepare.node);
+               if (ret)
+                       goto cpuhp_prepare_error;
+
+               chan->cpuhp_online.component = LTTNG_RING_BUFFER_FRONTEND;
+               ret = cpuhp_state_add_instance(lttng_rb_hp_online,
+                       &chan->cpuhp_online.node);
+               if (ret)
+                       goto cpuhp_online_error;
+#else /* #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,10,0)) */
+               {
+                       int cpu;
+                       /*
+                        * In case of non-hotplug cpu, if the ring-buffer is allocated
+                        * in early initcall, it will not be notified of secondary cpus.
+                        * In that off case, we need to allocate for all possible cpus.
+                        */
+#ifdef CONFIG_HOTPLUG_CPU
+                       chan->cpu_hp_notifier.notifier_call =
+                                       lib_ring_buffer_cpu_hp_callback;
+                       chan->cpu_hp_notifier.priority = 6;
+                       register_cpu_notifier(&chan->cpu_hp_notifier);
+
+                       get_online_cpus();
+                       for_each_online_cpu(cpu) {
+                               struct lib_ring_buffer *buf = per_cpu_ptr(chan->backend.buf,
+                                                                      cpu);
+                               spin_lock(&per_cpu(ring_buffer_nohz_lock, cpu));
+                               lib_ring_buffer_start_switch_timer(buf);
+                               lib_ring_buffer_start_read_timer(buf);
+                               spin_unlock(&per_cpu(ring_buffer_nohz_lock, cpu));
+                       }
+                       chan->cpu_hp_enable = 1;
+                       put_online_cpus();
+#else
+                       for_each_possible_cpu(cpu) {
+                               struct lib_ring_buffer *buf = per_cpu_ptr(chan->backend.buf,
+                                                                     cpu);
+                               spin_lock(&per_cpu(ring_buffer_nohz_lock, cpu));
+                               lib_ring_buffer_start_switch_timer(buf);
+                               lib_ring_buffer_start_read_timer(buf);
+                               spin_unlock(&per_cpu(ring_buffer_nohz_lock, cpu));
+                       }
+#endif
+               }
+#endif /* #else #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,10,0)) */
+
  #if defined(CONFIG_NO_HZ) && defined(CONFIG_LIB_RING_BUFFER)
                 /* Only benefit from NO_HZ idle with per-cpu buffers for now. */
                 chan->tick_nohz_notifier.notifier_call =
@@ -770,38 +915,6 @@ struct channel *channel_create(const struct lib_ring_buffer_config *config,
                                        &chan->tick_nohz_notifier);
  #endif /* defined(CONFIG_NO_HZ) && defined(CONFIG_LIB_RING_BUFFER) */
  
-               /*
-                * In case of non-hotplug cpu, if the ring-buffer is allocated
-                * in early initcall, it will not be notified of secondary cpus.
-                * In that off case, we need to allocate for all possible cpus.
-                */
-#ifdef CONFIG_HOTPLUG_CPU
-               chan->cpu_hp_notifier.notifier_call =
-                               lib_ring_buffer_cpu_hp_callback;
-               chan->cpu_hp_notifier.priority = 6;
-               register_cpu_notifier(&chan->cpu_hp_notifier);
-
-               get_online_cpus();
-               for_each_online_cpu(cpu) {
-                       struct lib_ring_buffer *buf = per_cpu_ptr(chan->backend.buf,
-                                                              cpu);
-                       spin_lock(&per_cpu(ring_buffer_nohz_lock, cpu));
-                       lib_ring_buffer_start_switch_timer(buf);
-                       lib_ring_buffer_start_read_timer(buf);
-                       spin_unlock(&per_cpu(ring_buffer_nohz_lock, cpu));
-               }
-               chan->cpu_hp_enable = 1;
-               put_online_cpus();
-#else
-               for_each_possible_cpu(cpu) {
-                       struct lib_ring_buffer *buf = per_cpu_ptr(chan->backend.buf,
-                                                             cpu);
-                       spin_lock(&per_cpu(ring_buffer_nohz_lock, cpu));
-                       lib_ring_buffer_start_switch_timer(buf);
-                       lib_ring_buffer_start_read_timer(buf);
-                       spin_unlock(&per_cpu(ring_buffer_nohz_lock, cpu));
-               }
-#endif
         } else {
                 struct lib_ring_buffer *buf = chan->backend.buf;
  
@@ -811,6 +924,13 @@ struct channel *channel_create(const struct lib_ring_buffer_config *config,
  
         return chan;
  
+#if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,10,0))
+cpuhp_online_error:
+       ret = cpuhp_state_remove_instance_nocalls(lttng_rb_hp_prepare,
+                       &chan->cpuhp_prepare.node);
+       WARN_ON(ret);
+cpuhp_prepare_error:
+#endif /* #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,10,0)) */
  error_free_backend:
         channel_backend_free(&chan->backend);
  error:
@@ -1031,6 +1151,47 @@ void lib_ring_buffer_move_consumer(struct lib_ring_buffer *buf,
  }
  EXPORT_SYMBOL_GPL(lib_ring_buffer_move_consumer);
  
+#if ARCH_IMPLEMENTS_FLUSH_DCACHE_PAGE
+static void lib_ring_buffer_flush_read_subbuf_dcache(
+               const struct lib_ring_buffer_config *config,
+               struct channel *chan,
+               struct lib_ring_buffer *buf)
+{
+       struct lib_ring_buffer_backend_pages *pages;
+       unsigned long sb_bindex, id, i, nr_pages;
+
+       if (config->output != RING_BUFFER_MMAP)
+               return;
+
+       /*
+        * Architectures with caches aliased on virtual addresses may
+        * use different cache lines for the linear mapping vs
+        * user-space memory mapping. Given that the ring buffer is
+        * based on the kernel linear mapping, aligning it with the
+        * user-space mapping is not straightforward, and would require
+        * extra TLB entries. Therefore, simply flush the dcache for the
+        * entire sub-buffer before reading it.
+        */
+       id = buf->backend.buf_rsb.id;
+       sb_bindex = subbuffer_id_get_index(config, id);
+       pages = buf->backend.array[sb_bindex];
+       nr_pages = buf->backend.num_pages_per_subbuf;
+       for (i = 0; i < nr_pages; i++) {
+               struct lib_ring_buffer_backend_page *backend_page;
+
+               backend_page = &pages->p[i];
+               flush_dcache_page(pfn_to_page(backend_page->pfn));
+       }
+}
+#else
+static void lib_ring_buffer_flush_read_subbuf_dcache(
+               const struct lib_ring_buffer_config *config,
+               struct channel *chan,
+               struct lib_ring_buffer *buf)
+{
+}
+#endif
+
  /**
   * lib_ring_buffer_get_subbuf - get exclusive access to subbuffer for reading
   * @buf: ring buffer
@@ -1173,6 +1334,8 @@ retry:
         buf->get_subbuf_consumed = consumed;
         buf->get_subbuf = 1;
  
+       lib_ring_buffer_flush_read_subbuf_dcache(config, chan, buf);
+
         return 0;
  
  nodata:
@@ -1346,8 +1509,7 @@ void lib_ring_buffer_print_errors(struct channel *chan,
  /*
   * lib_ring_buffer_switch_old_start: Populate old subbuffer header.
   *
- * Only executed by SWITCH_FLUSH, which can be issued while tracing is active
- * or at buffer finalization (destroy).
+ * Only executed when the buffer is finalized, in SWITCH_FLUSH.
   */
  static
  void lib_ring_buffer_switch_old_start(struct lib_ring_buffer *buf,
@@ -1543,14 +1705,12 @@ int lib_ring_buffer_try_switch_slow(enum switch_mode mode,
                 unsigned long sb_index, commit_count;
  
                 /*
-                * We are performing a SWITCH_FLUSH. There may be concurrent
-                * writes into the buffer if e.g. invoked while performing a
-                * snapshot on an active trace.
+                * We are performing a SWITCH_FLUSH. At this stage, there are no
+                * concurrent writes into the buffer.
                  *
-                * If the client does not save any header information (sub-buffer
-                * header size == 0), don't switch empty subbuffer on finalize,
-                * because it is invalid to deliver a completely empty
-                * subbuffer.
+                * The client does not save any header information.  Don't
+                * switch empty subbuffer on finalize, because it is invalid to
+                * deliver a completely empty subbuffer.
                  */
                 if (!config->cb.subbuffer_header_size())
                         return -1;
@@ -1715,6 +1875,7 @@ static void _lib_ring_buffer_switch_remote(struct lib_ring_buffer *buf,
         put_online_cpus();
  }
  
+/* Switch sub-buffer if current sub-buffer is non-empty. */
  void lib_ring_buffer_switch_remote(struct lib_ring_buffer *buf)
  {
         _lib_ring_buffer_switch_remote(buf, SWITCH_ACTIVE);