[PATCH 1/6] perf_counter: more elaborate write API

From: Peter Zijlstra
Date: Wed Mar 25 2009 - 07:39:20 EST


Provide a begin, copy, end interface to the output buffer.

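begin() reserves the space in the buffer and, on success, returns with
the RCU read lock held;
copy() copies the data over, splitting the copy at page boundaries;
end() finalizes the event, does the wakeup if the reservation crossed a
page boundary, and drops the RCU read lock.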

Signed-off-by: Peter Zijlstra <a.p.zijlstra@xxxxxxxxx>
---
kernel/perf_counter.c | 96 +++++++++++++++++++++++++++++++++-----------------
1 file changed, 65 insertions(+), 31 deletions(-)

Index: linux-2.6/kernel/perf_counter.c
===================================================================
--- linux-2.6.orig/kernel/perf_counter.c
+++ linux-2.6/kernel/perf_counter.c
@@ -1411,16 +1411,20 @@ static const struct file_operations perf
* Output
*/

-static int perf_output_write(struct perf_counter *counter, int nmi,
- void *buf, ssize_t size)
+struct perf_output_handle {
+ struct perf_counter *counter;
+ struct perf_mmap_data *data;
+ unsigned int offset;
+ int wakeup;
+};
+
+static int perf_output_begin(struct perf_output_handle *handle,
+ struct perf_counter *counter, unsigned int size)
{
struct perf_mmap_data *data;
- unsigned int offset, head, nr;
- unsigned int len;
- int ret, wakeup;
+ unsigned int offset, head;

rcu_read_lock();
- ret = -ENOSPC;
data = rcu_dereference(counter->data);
if (!data)
goto out;
@@ -1428,45 +1432,75 @@ static int perf_output_write(struct perf
if (!data->nr_pages)
goto out;

- ret = -EINVAL;
- if (size > PAGE_SIZE)
- goto out;
-
do {
offset = head = atomic_read(&data->head);
head += size;
} while (atomic_cmpxchg(&data->head, offset, head) != offset);

- wakeup = (offset >> PAGE_SHIFT) != (head >> PAGE_SHIFT);
+ handle->counter = counter;
+ handle->data = data;
+ handle->offset = offset;
+ handle->wakeup = (offset >> PAGE_SHIFT) != (head >> PAGE_SHIFT);

- nr = (offset >> PAGE_SHIFT) & (data->nr_pages - 1);
- offset &= PAGE_SIZE - 1;
+ return 0;

- len = min_t(unsigned int, PAGE_SIZE - offset, size);
- memcpy(data->data_pages[nr] + offset, buf, len);
- size -= len;
-
- if (size) {
- nr = (nr + 1) & (data->nr_pages - 1);
- memcpy(data->data_pages[nr], buf + len, size);
- }
+out:
+ rcu_read_unlock();
+ return -ENOSPC;
+}

- /*
- * generate a poll() wakeup for every page boundary crossed
- */
- if (wakeup) {
- atomic_xchg(&data->wakeup, POLL_IN);
- __perf_counter_update_userpage(counter, data);
+static void perf_output_copy(struct perf_output_handle *handle,
+ void *buf, unsigned int len)
+{
+ unsigned int offset = handle->offset;
+ unsigned int pages_mask = handle->data->nr_pages - 1;
+ unsigned int size;
+ void **pages = handle->data->data_pages;
+
+ do {
+ unsigned int page_offset;
+ int nr;
+
+ nr = (offset >> PAGE_SHIFT) & pages_mask;
+ page_offset = offset & (PAGE_SIZE - 1);
+ size = min_t(unsigned int, PAGE_SIZE - page_offset, len);
+ memcpy(pages[nr] + page_offset, buf, size);
+ len -= size;
+ buf += size;
+ offset += size;
+ } while (len);
+
+ handle->offset = offset;
+}
+
+static void perf_output_end(struct perf_output_handle *handle, int nmi)
+{
+ if (handle->wakeup) {
+ (void)atomic_xchg(&handle->data->wakeup, POLL_IN);
+ __perf_counter_update_userpage(handle->counter, handle->data);
if (nmi) {
- counter->wakeup_pending = 1;
+ handle->counter->wakeup_pending = 1;
set_perf_counter_pending();
} else
- wake_up(&counter->waitq);
+ wake_up(&handle->counter->waitq);
}
- ret = 0;
-out:
rcu_read_unlock();
+}
+
+static int perf_output_write(struct perf_counter *counter, int nmi,
+ void *buf, ssize_t size)
+{
+ struct perf_output_handle handle;
+ int ret;
+
+ ret = perf_output_begin(&handle, counter, size);
+ if (ret)
+ goto out;

+ perf_output_copy(&handle, buf, size);
+ perf_output_end(&handle, nmi);
+
+out:
return ret;
}


--

--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at http://vger.kernel.org/majordomo-info.html
Please read the FAQ at http://www.tux.org/lkml/