Add the rt linux 4.1.3-rt3 as base
[kvmfornfv.git] / kernel / kernel / trace / trace_events_filter.c
diff --git a/kernel/kernel/trace/trace_events_filter.c b/kernel/kernel/trace/trace_events_filter.c
new file mode 100644 (file)
index 0000000..7f2e97c
--- /dev/null
@@ -0,0 +1,2432 @@
+/*
+ * trace_events_filter - generic event filtering
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 2 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
+ *
+ * Copyright (C) 2009 Tom Zanussi <tzanussi@gmail.com>
+ */
+
+#include <linux/module.h>
+#include <linux/ctype.h>
+#include <linux/mutex.h>
+#include <linux/perf_event.h>
+#include <linux/slab.h>
+
+#include "trace.h"
+#include "trace_output.h"
+
+#define DEFAULT_SYS_FILTER_MESSAGE                                     \
+       "### global filter ###\n"                                       \
+       "# Use this to set filters for multiple events.\n"              \
+       "# Only events with the given fields will be affected.\n"       \
+       "# If no events are modified, an error message will be displayed here"
+
+enum filter_op_ids
+{
+       OP_OR,
+       OP_AND,
+       OP_GLOB,
+       OP_NE,
+       OP_EQ,
+       OP_LT,
+       OP_LE,
+       OP_GT,
+       OP_GE,
+       OP_BAND,
+       OP_NOT,
+       OP_NONE,
+       OP_OPEN_PAREN,
+};
+
+struct filter_op {
+       int id;
+       char *string;
+       int precedence;
+};
+
+/* Order must be the same as enum filter_op_ids above */
+static struct filter_op filter_ops[] = {
+       { OP_OR,        "||",           1 },
+       { OP_AND,       "&&",           2 },
+       { OP_GLOB,      "~",            4 },
+       { OP_NE,        "!=",           4 },
+       { OP_EQ,        "==",           4 },
+       { OP_LT,        "<",            5 },
+       { OP_LE,        "<=",           5 },
+       { OP_GT,        ">",            5 },
+       { OP_GE,        ">=",           5 },
+       { OP_BAND,      "&",            6 },
+       { OP_NOT,       "!",            6 },
+       { OP_NONE,      "OP_NONE",      0 },
+       { OP_OPEN_PAREN, "(",           0 },
+};
+
+enum {
+       FILT_ERR_NONE,
+       FILT_ERR_INVALID_OP,
+       FILT_ERR_UNBALANCED_PAREN,
+       FILT_ERR_TOO_MANY_OPERANDS,
+       FILT_ERR_OPERAND_TOO_LONG,
+       FILT_ERR_FIELD_NOT_FOUND,
+       FILT_ERR_ILLEGAL_FIELD_OP,
+       FILT_ERR_ILLEGAL_INTVAL,
+       FILT_ERR_BAD_SUBSYS_FILTER,
+       FILT_ERR_TOO_MANY_PREDS,
+       FILT_ERR_MISSING_FIELD,
+       FILT_ERR_INVALID_FILTER,
+       FILT_ERR_IP_FIELD_ONLY,
+       FILT_ERR_ILLEGAL_NOT_OP,
+};
+
+static char *err_text[] = {
+       "No error",
+       "Invalid operator",
+       "Unbalanced parens",
+       "Too many operands",
+       "Operand too long",
+       "Field not found",
+       "Illegal operation for field type",
+       "Illegal integer value",
+       "Couldn't find or set field in one of a subsystem's events",
+       "Too many terms in predicate expression",
+       "Missing field name and/or value",
+       "Meaningless filter expression",
+       "Only 'ip' field is supported for function trace",
+       "Illegal use of '!'",
+};
+
+struct opstack_op {
+       int op;
+       struct list_head list;
+};
+
+struct postfix_elt {
+       int op;
+       char *operand;
+       struct list_head list;
+};
+
+struct filter_parse_state {
+       struct filter_op *ops;
+       struct list_head opstack;
+       struct list_head postfix;
+       int lasterr;
+       int lasterr_pos;
+
+       struct {
+               char *string;
+               unsigned int cnt;
+               unsigned int tail;
+       } infix;
+
+       struct {
+               char string[MAX_FILTER_STR_VAL];
+               int pos;
+               unsigned int tail;
+       } operand;
+};
+
+struct pred_stack {
+       struct filter_pred      **preds;
+       int                     index;
+};
+
+/* If not of not match is equal to not of not, then it is a match */
+#define DEFINE_COMPARISON_PRED(type)                                   \
+static int filter_pred_##type(struct filter_pred *pred, void *event)   \
+{                                                                      \
+       type *addr = (type *)(event + pred->offset);                    \
+       type val = (type)pred->val;                                     \
+       int match = 0;                                                  \
+                                                                       \
+       switch (pred->op) {                                             \
+       case OP_LT:                                                     \
+               match = (*addr < val);                                  \
+               break;                                                  \
+       case OP_LE:                                                     \
+               match = (*addr <= val);                                 \
+               break;                                                  \
+       case OP_GT:                                                     \
+               match = (*addr > val);                                  \
+               break;                                                  \
+       case OP_GE:                                                     \
+               match = (*addr >= val);                                 \
+               break;                                                  \
+       case OP_BAND:                                                   \
+               match = (*addr & val);                                  \
+               break;                                                  \
+       default:                                                        \
+               break;                                                  \
+       }                                                               \
+                                                                       \
+       return !!match == !pred->not;                                   \
+}
+
+#define DEFINE_EQUALITY_PRED(size)                                     \
+static int filter_pred_##size(struct filter_pred *pred, void *event)   \
+{                                                                      \
+       u##size *addr = (u##size *)(event + pred->offset);              \
+       u##size val = (u##size)pred->val;                               \
+       int match;                                                      \
+                                                                       \
+       match = (val == *addr) ^ pred->not;                             \
+                                                                       \
+       return match;                                                   \
+}
+
+DEFINE_COMPARISON_PRED(s64);
+DEFINE_COMPARISON_PRED(u64);
+DEFINE_COMPARISON_PRED(s32);
+DEFINE_COMPARISON_PRED(u32);
+DEFINE_COMPARISON_PRED(s16);
+DEFINE_COMPARISON_PRED(u16);
+DEFINE_COMPARISON_PRED(s8);
+DEFINE_COMPARISON_PRED(u8);
+
+DEFINE_EQUALITY_PRED(64);
+DEFINE_EQUALITY_PRED(32);
+DEFINE_EQUALITY_PRED(16);
+DEFINE_EQUALITY_PRED(8);
+
+/* Filter predicate for fixed sized arrays of characters */
+static int filter_pred_string(struct filter_pred *pred, void *event)
+{
+       char *addr = (char *)(event + pred->offset);
+       int cmp, match;
+
+       cmp = pred->regex.match(addr, &pred->regex, pred->regex.field_len);
+
+       match = cmp ^ pred->not;
+
+       return match;
+}
+
+/* Filter predicate for char * pointers */
+static int filter_pred_pchar(struct filter_pred *pred, void *event)
+{
+       char **addr = (char **)(event + pred->offset);
+       int cmp, match;
+       int len = strlen(*addr) + 1;    /* including tailing '\0' */
+
+       cmp = pred->regex.match(*addr, &pred->regex, len);
+
+       match = cmp ^ pred->not;
+
+       return match;
+}
+
+/*
+ * Filter predicate for dynamic sized arrays of characters.
+ * These are implemented through a list of strings at the end
+ * of the entry.
+ * Also each of these strings have a field in the entry which
+ * contains its offset from the beginning of the entry.
+ * We have then first to get this field, dereference it
+ * and add it to the address of the entry, and at last we have
+ * the address of the string.
+ */
+static int filter_pred_strloc(struct filter_pred *pred, void *event)
+{
+       u32 str_item = *(u32 *)(event + pred->offset);
+       int str_loc = str_item & 0xffff;
+       int str_len = str_item >> 16;
+       char *addr = (char *)(event + str_loc);
+       int cmp, match;
+
+       cmp = pred->regex.match(addr, &pred->regex, str_len);
+
+       match = cmp ^ pred->not;
+
+       return match;
+}
+
+static int filter_pred_none(struct filter_pred *pred, void *event)
+{
+       return 0;
+}
+
+/*
+ * regex_match_foo - Basic regex callbacks
+ *
+ * @str: the string to be searched
+ * @r:   the regex structure containing the pattern string
+ * @len: the length of the string to be searched (including '\0')
+ *
+ * Note:
+ * - @str might not be NULL-terminated if it's of type DYN_STRING
+ *   or STATIC_STRING
+ */
+
+static int regex_match_full(char *str, struct regex *r, int len)
+{
+       if (strncmp(str, r->pattern, len) == 0)
+               return 1;
+       return 0;
+}
+
+static int regex_match_front(char *str, struct regex *r, int len)
+{
+       if (strncmp(str, r->pattern, r->len) == 0)
+               return 1;
+       return 0;
+}
+
+static int regex_match_middle(char *str, struct regex *r, int len)
+{
+       if (strnstr(str, r->pattern, len))
+               return 1;
+       return 0;
+}
+
+static int regex_match_end(char *str, struct regex *r, int len)
+{
+       int strlen = len - 1;
+
+       if (strlen >= r->len &&
+           memcmp(str + strlen - r->len, r->pattern, r->len) == 0)
+               return 1;
+       return 0;
+}
+
+/**
+ * filter_parse_regex - parse a basic regex
+ * @buff:   the raw regex
+ * @len:    length of the regex
+ * @search: will point to the beginning of the string to compare
+ * @not:    tell whether the match will have to be inverted
+ *
+ * This passes in a buffer containing a regex and this function will
+ * set search to point to the search part of the buffer and
+ * return the type of search it is (see enum above).
+ * This does modify buff.
+ *
+ * Returns enum type.
+ *  search returns the pointer to use for comparison.
+ *  not returns 1 if buff started with a '!'
+ *     0 otherwise.
+ */
+enum regex_type filter_parse_regex(char *buff, int len, char **search, int *not)
+{
+       int type = MATCH_FULL;
+       int i;
+
+       if (buff[0] == '!') {
+               *not = 1;
+               buff++;
+               len--;
+       } else
+               *not = 0;
+
+       *search = buff;
+
+       for (i = 0; i < len; i++) {
+               if (buff[i] == '*') {
+                       if (!i) {
+                               *search = buff + 1;
+                               type = MATCH_END_ONLY;
+                       } else {
+                               if (type == MATCH_END_ONLY)
+                                       type = MATCH_MIDDLE_ONLY;
+                               else
+                                       type = MATCH_FRONT_ONLY;
+                               buff[i] = 0;
+                               break;
+                       }
+               }
+       }
+
+       return type;
+}
+
+static void filter_build_regex(struct filter_pred *pred)
+{
+       struct regex *r = &pred->regex;
+       char *search;
+       enum regex_type type = MATCH_FULL;
+       int not = 0;
+
+       if (pred->op == OP_GLOB) {
+               type = filter_parse_regex(r->pattern, r->len, &search, &not);
+               r->len = strlen(search);
+               memmove(r->pattern, search, r->len+1);
+       }
+
+       switch (type) {
+       case MATCH_FULL:
+               r->match = regex_match_full;
+               break;
+       case MATCH_FRONT_ONLY:
+               r->match = regex_match_front;
+               break;
+       case MATCH_MIDDLE_ONLY:
+               r->match = regex_match_middle;
+               break;
+       case MATCH_END_ONLY:
+               r->match = regex_match_end;
+               break;
+       }
+
+       pred->not ^= not;
+}
+
+enum move_type {
+       MOVE_DOWN,
+       MOVE_UP_FROM_LEFT,
+       MOVE_UP_FROM_RIGHT
+};
+
+static struct filter_pred *
+get_pred_parent(struct filter_pred *pred, struct filter_pred *preds,
+               int index, enum move_type *move)
+{
+       if (pred->parent & FILTER_PRED_IS_RIGHT)
+               *move = MOVE_UP_FROM_RIGHT;
+       else
+               *move = MOVE_UP_FROM_LEFT;
+       pred = &preds[pred->parent & ~FILTER_PRED_IS_RIGHT];
+
+       return pred;
+}
+
+enum walk_return {
+       WALK_PRED_ABORT,
+       WALK_PRED_PARENT,
+       WALK_PRED_DEFAULT,
+};
+
+typedef int (*filter_pred_walkcb_t) (enum move_type move,
+                                    struct filter_pred *pred,
+                                    int *err, void *data);
+
+static int walk_pred_tree(struct filter_pred *preds,
+                         struct filter_pred *root,
+                         filter_pred_walkcb_t cb, void *data)
+{
+       struct filter_pred *pred = root;
+       enum move_type move = MOVE_DOWN;
+       int done = 0;
+
+       if  (!preds)
+               return -EINVAL;
+
+       do {
+               int err = 0, ret;
+
+               ret = cb(move, pred, &err, data);
+               if (ret == WALK_PRED_ABORT)
+                       return err;
+               if (ret == WALK_PRED_PARENT)
+                       goto get_parent;
+
+               switch (move) {
+               case MOVE_DOWN:
+                       if (pred->left != FILTER_PRED_INVALID) {
+                               pred = &preds[pred->left];
+                               continue;
+                       }
+                       goto get_parent;
+               case MOVE_UP_FROM_LEFT:
+                       pred = &preds[pred->right];
+                       move = MOVE_DOWN;
+                       continue;
+               case MOVE_UP_FROM_RIGHT:
+ get_parent:
+                       if (pred == root)
+                               break;
+                       pred = get_pred_parent(pred, preds,
+                                              pred->parent,
+                                              &move);
+                       continue;
+               }
+               done = 1;
+       } while (!done);
+
+       /* We are fine. */
+       return 0;
+}
+
+/*
+ * A series of AND or ORs where found together. Instead of
+ * climbing up and down the tree branches, an array of the
+ * ops were made in order of checks. We can just move across
+ * the array and short circuit if needed.
+ */
+static int process_ops(struct filter_pred *preds,
+                      struct filter_pred *op, void *rec)
+{
+       struct filter_pred *pred;
+       int match = 0;
+       int type;
+       int i;
+
+       /*
+        * Micro-optimization: We set type to true if op
+        * is an OR and false otherwise (AND). Then we
+        * just need to test if the match is equal to
+        * the type, and if it is, we can short circuit the
+        * rest of the checks:
+        *
+        * if ((match && op->op == OP_OR) ||
+        *     (!match && op->op == OP_AND))
+        *        return match;
+        */
+       type = op->op == OP_OR;
+
+       for (i = 0; i < op->val; i++) {
+               pred = &preds[op->ops[i]];
+               if (!WARN_ON_ONCE(!pred->fn))
+                       match = pred->fn(pred, rec);
+               if (!!match == type)
+                       break;
+       }
+       /* If not of not match is equal to not of not, then it is a match */
+       return !!match == !op->not;
+}
+
+struct filter_match_preds_data {
+       struct filter_pred *preds;
+       int match;
+       void *rec;
+};
+
+static int filter_match_preds_cb(enum move_type move, struct filter_pred *pred,
+                                int *err, void *data)
+{
+       struct filter_match_preds_data *d = data;
+
+       *err = 0;
+       switch (move) {
+       case MOVE_DOWN:
+               /* only AND and OR have children */
+               if (pred->left != FILTER_PRED_INVALID) {
+                       /* If ops is set, then it was folded. */
+                       if (!pred->ops)
+                               return WALK_PRED_DEFAULT;
+                       /* We can treat folded ops as a leaf node */
+                       d->match = process_ops(d->preds, pred, d->rec);
+               } else {
+                       if (!WARN_ON_ONCE(!pred->fn))
+                               d->match = pred->fn(pred, d->rec);
+               }
+
+               return WALK_PRED_PARENT;
+       case MOVE_UP_FROM_LEFT:
+               /*
+                * Check for short circuits.
+                *
+                * Optimization: !!match == (pred->op == OP_OR)
+                *   is the same as:
+                * if ((match && pred->op == OP_OR) ||
+                *     (!match && pred->op == OP_AND))
+                */
+               if (!!d->match == (pred->op == OP_OR))
+                       return WALK_PRED_PARENT;
+               break;
+       case MOVE_UP_FROM_RIGHT:
+               break;
+       }
+
+       return WALK_PRED_DEFAULT;
+}
+
+/* return 1 if event matches, 0 otherwise (discard) */
+int filter_match_preds(struct event_filter *filter, void *rec)
+{
+       struct filter_pred *preds;
+       struct filter_pred *root;
+       struct filter_match_preds_data data = {
+               /* match is currently meaningless */
+               .match = -1,
+               .rec   = rec,
+       };
+       int n_preds, ret;
+
+       /* no filter is considered a match */
+       if (!filter)
+               return 1;
+
+       n_preds = filter->n_preds;
+       if (!n_preds)
+               return 1;
+
+       /*
+        * n_preds, root and filter->preds are protect with preemption disabled.
+        */
+       root = rcu_dereference_sched(filter->root);
+       if (!root)
+               return 1;
+
+       data.preds = preds = rcu_dereference_sched(filter->preds);
+       ret = walk_pred_tree(preds, root, filter_match_preds_cb, &data);
+       WARN_ON(ret);
+       return data.match;
+}
+EXPORT_SYMBOL_GPL(filter_match_preds);
+
+static void parse_error(struct filter_parse_state *ps, int err, int pos)
+{
+       ps->lasterr = err;
+       ps->lasterr_pos = pos;
+}
+
+static void remove_filter_string(struct event_filter *filter)
+{
+       if (!filter)
+               return;
+
+       kfree(filter->filter_string);
+       filter->filter_string = NULL;
+}
+
+static int replace_filter_string(struct event_filter *filter,
+                                char *filter_string)
+{
+       kfree(filter->filter_string);
+       filter->filter_string = kstrdup(filter_string, GFP_KERNEL);
+       if (!filter->filter_string)
+               return -ENOMEM;
+
+       return 0;
+}
+
+static int append_filter_string(struct event_filter *filter,
+                               char *string)
+{
+       int newlen;
+       char *new_filter_string;
+
+       BUG_ON(!filter->filter_string);
+       newlen = strlen(filter->filter_string) + strlen(string) + 1;
+       new_filter_string = kmalloc(newlen, GFP_KERNEL);
+       if (!new_filter_string)
+               return -ENOMEM;
+
+       strcpy(new_filter_string, filter->filter_string);
+       strcat(new_filter_string, string);
+       kfree(filter->filter_string);
+       filter->filter_string = new_filter_string;
+
+       return 0;
+}
+
+static void append_filter_err(struct filter_parse_state *ps,
+                             struct event_filter *filter)
+{
+       int pos = ps->lasterr_pos;
+       char *buf, *pbuf;
+
+       buf = (char *)__get_free_page(GFP_TEMPORARY);
+       if (!buf)
+               return;
+
+       append_filter_string(filter, "\n");
+       memset(buf, ' ', PAGE_SIZE);
+       if (pos > PAGE_SIZE - 128)
+               pos = 0;
+       buf[pos] = '^';
+       pbuf = &buf[pos] + 1;
+
+       sprintf(pbuf, "\nparse_error: %s\n", err_text[ps->lasterr]);
+       append_filter_string(filter, buf);
+       free_page((unsigned long) buf);
+}
+
+static inline struct event_filter *event_filter(struct ftrace_event_file *file)
+{
+       if (file->event_call->flags & TRACE_EVENT_FL_USE_CALL_FILTER)
+               return file->event_call->filter;
+       else
+               return file->filter;
+}
+
+/* caller must hold event_mutex */
+void print_event_filter(struct ftrace_event_file *file, struct trace_seq *s)
+{
+       struct event_filter *filter = event_filter(file);
+
+       if (filter && filter->filter_string)
+               trace_seq_printf(s, "%s\n", filter->filter_string);
+       else
+               trace_seq_puts(s, "none\n");
+}
+
+void print_subsystem_event_filter(struct event_subsystem *system,
+                                 struct trace_seq *s)
+{
+       struct event_filter *filter;
+
+       mutex_lock(&event_mutex);
+       filter = system->filter;
+       if (filter && filter->filter_string)
+               trace_seq_printf(s, "%s\n", filter->filter_string);
+       else
+               trace_seq_puts(s, DEFAULT_SYS_FILTER_MESSAGE "\n");
+       mutex_unlock(&event_mutex);
+}
+
+static int __alloc_pred_stack(struct pred_stack *stack, int n_preds)
+{
+       stack->preds = kcalloc(n_preds + 1, sizeof(*stack->preds), GFP_KERNEL);
+       if (!stack->preds)
+               return -ENOMEM;
+       stack->index = n_preds;
+       return 0;
+}
+
+static void __free_pred_stack(struct pred_stack *stack)
+{
+       kfree(stack->preds);
+       stack->index = 0;
+}
+
+static int __push_pred_stack(struct pred_stack *stack,
+                            struct filter_pred *pred)
+{
+       int index = stack->index;
+
+       if (WARN_ON(index == 0))
+               return -ENOSPC;
+
+       stack->preds[--index] = pred;
+       stack->index = index;
+       return 0;
+}
+
+static struct filter_pred *
+__pop_pred_stack(struct pred_stack *stack)
+{
+       struct filter_pred *pred;
+       int index = stack->index;
+
+       pred = stack->preds[index++];
+       if (!pred)
+               return NULL;
+
+       stack->index = index;
+       return pred;
+}
+
+static int filter_set_pred(struct event_filter *filter,
+                          int idx,
+                          struct pred_stack *stack,
+                          struct filter_pred *src)
+{
+       struct filter_pred *dest = &filter->preds[idx];
+       struct filter_pred *left;
+       struct filter_pred *right;
+
+       *dest = *src;
+       dest->index = idx;
+
+       if (dest->op == OP_OR || dest->op == OP_AND) {
+               right = __pop_pred_stack(stack);
+               left = __pop_pred_stack(stack);
+               if (!left || !right)
+                       return -EINVAL;
+               /*
+                * If both children can be folded
+                * and they are the same op as this op or a leaf,
+                * then this op can be folded.
+                */
+               if (left->index & FILTER_PRED_FOLD &&
+                   ((left->op == dest->op && !left->not) ||
+                    left->left == FILTER_PRED_INVALID) &&
+                   right->index & FILTER_PRED_FOLD &&
+                   ((right->op == dest->op && !right->not) ||
+                    right->left == FILTER_PRED_INVALID))
+                       dest->index |= FILTER_PRED_FOLD;
+
+               dest->left = left->index & ~FILTER_PRED_FOLD;
+               dest->right = right->index & ~FILTER_PRED_FOLD;
+               left->parent = dest->index & ~FILTER_PRED_FOLD;
+               right->parent = dest->index | FILTER_PRED_IS_RIGHT;
+       } else {
+               /*
+                * Make dest->left invalid to be used as a quick
+                * way to know this is a leaf node.
+                */
+               dest->left = FILTER_PRED_INVALID;
+
+               /* All leafs allow folding the parent ops. */
+               dest->index |= FILTER_PRED_FOLD;
+       }
+
+       return __push_pred_stack(stack, dest);
+}
+
+static void __free_preds(struct event_filter *filter)
+{
+       int i;
+
+       if (filter->preds) {
+               for (i = 0; i < filter->n_preds; i++)
+                       kfree(filter->preds[i].ops);
+               kfree(filter->preds);
+               filter->preds = NULL;
+       }
+       filter->a_preds = 0;
+       filter->n_preds = 0;
+}
+
+static void filter_disable(struct ftrace_event_file *file)
+{
+       struct ftrace_event_call *call = file->event_call;
+
+       if (call->flags & TRACE_EVENT_FL_USE_CALL_FILTER)
+               call->flags &= ~TRACE_EVENT_FL_FILTERED;
+       else
+               file->flags &= ~FTRACE_EVENT_FL_FILTERED;
+}
+
+static void __free_filter(struct event_filter *filter)
+{
+       if (!filter)
+               return;
+
+       __free_preds(filter);
+       kfree(filter->filter_string);
+       kfree(filter);
+}
+
+void free_event_filter(struct event_filter *filter)
+{
+       __free_filter(filter);
+}
+
+static struct event_filter *__alloc_filter(void)
+{
+       struct event_filter *filter;
+
+       filter = kzalloc(sizeof(*filter), GFP_KERNEL);
+       return filter;
+}
+
+static int __alloc_preds(struct event_filter *filter, int n_preds)
+{
+       struct filter_pred *pred;
+       int i;
+
+       if (filter->preds)
+               __free_preds(filter);
+
+       filter->preds = kcalloc(n_preds, sizeof(*filter->preds), GFP_KERNEL);
+
+       if (!filter->preds)
+               return -ENOMEM;
+
+       filter->a_preds = n_preds;
+       filter->n_preds = 0;
+
+       for (i = 0; i < n_preds; i++) {
+               pred = &filter->preds[i];
+               pred->fn = filter_pred_none;
+       }
+
+       return 0;
+}
+
+static inline void __remove_filter(struct ftrace_event_file *file)
+{
+       struct ftrace_event_call *call = file->event_call;
+
+       filter_disable(file);
+       if (call->flags & TRACE_EVENT_FL_USE_CALL_FILTER)
+               remove_filter_string(call->filter);
+       else
+               remove_filter_string(file->filter);
+}
+
+static void filter_free_subsystem_preds(struct ftrace_subsystem_dir *dir,
+                                       struct trace_array *tr)
+{
+       struct ftrace_event_file *file;
+
+       list_for_each_entry(file, &tr->events, list) {
+               if (file->system != dir)
+                       continue;
+               __remove_filter(file);
+       }
+}
+
+static inline void __free_subsystem_filter(struct ftrace_event_file *file)
+{
+       struct ftrace_event_call *call = file->event_call;
+
+       if (call->flags & TRACE_EVENT_FL_USE_CALL_FILTER) {
+               __free_filter(call->filter);
+               call->filter = NULL;
+       } else {
+               __free_filter(file->filter);
+               file->filter = NULL;
+       }
+}
+
+static void filter_free_subsystem_filters(struct ftrace_subsystem_dir *dir,
+                                         struct trace_array *tr)
+{
+       struct ftrace_event_file *file;
+
+       list_for_each_entry(file, &tr->events, list) {
+               if (file->system != dir)
+                       continue;
+               __free_subsystem_filter(file);
+       }
+}
+
+static int filter_add_pred(struct filter_parse_state *ps,
+                          struct event_filter *filter,
+                          struct filter_pred *pred,
+                          struct pred_stack *stack)
+{
+       int err;
+
+       if (WARN_ON(filter->n_preds == filter->a_preds)) {
+               parse_error(ps, FILT_ERR_TOO_MANY_PREDS, 0);
+               return -ENOSPC;
+       }
+
+       err = filter_set_pred(filter, filter->n_preds, stack, pred);
+       if (err)
+               return err;
+
+       filter->n_preds++;
+
+       return 0;
+}
+
+int filter_assign_type(const char *type)
+{
+       if (strstr(type, "__data_loc") && strstr(type, "char"))
+               return FILTER_DYN_STRING;
+
+       if (strchr(type, '[') && strstr(type, "char"))
+               return FILTER_STATIC_STRING;
+
+       return FILTER_OTHER;
+}
+
+static bool is_function_field(struct ftrace_event_field *field)
+{
+       return field->filter_type == FILTER_TRACE_FN;
+}
+
+static bool is_string_field(struct ftrace_event_field *field)
+{
+       return field->filter_type == FILTER_DYN_STRING ||
+              field->filter_type == FILTER_STATIC_STRING ||
+              field->filter_type == FILTER_PTR_STRING;
+}
+
+static int is_legal_op(struct ftrace_event_field *field, int op)
+{
+       if (is_string_field(field) &&
+           (op != OP_EQ && op != OP_NE && op != OP_GLOB))
+               return 0;
+       if (!is_string_field(field) && op == OP_GLOB)
+               return 0;
+
+       return 1;
+}
+
+static filter_pred_fn_t select_comparison_fn(int op, int field_size,
+                                            int field_is_signed)
+{
+       filter_pred_fn_t fn = NULL;
+
+       switch (field_size) {
+       case 8:
+               if (op == OP_EQ || op == OP_NE)
+                       fn = filter_pred_64;
+               else if (field_is_signed)
+                       fn = filter_pred_s64;
+               else
+                       fn = filter_pred_u64;
+               break;
+       case 4:
+               if (op == OP_EQ || op == OP_NE)
+                       fn = filter_pred_32;
+               else if (field_is_signed)
+                       fn = filter_pred_s32;
+               else
+                       fn = filter_pred_u32;
+               break;
+       case 2:
+               if (op == OP_EQ || op == OP_NE)
+                       fn = filter_pred_16;
+               else if (field_is_signed)
+                       fn = filter_pred_s16;
+               else
+                       fn = filter_pred_u16;
+               break;
+       case 1:
+               if (op == OP_EQ || op == OP_NE)
+                       fn = filter_pred_8;
+               else if (field_is_signed)
+                       fn = filter_pred_s8;
+               else
+                       fn = filter_pred_u8;
+               break;
+       }
+
+       return fn;
+}
+
+static int init_pred(struct filter_parse_state *ps,
+                    struct ftrace_event_field *field,
+                    struct filter_pred *pred)
+
+{
+       filter_pred_fn_t fn = filter_pred_none;
+       unsigned long long val;
+       int ret;
+
+       pred->offset = field->offset;
+
+       if (!is_legal_op(field, pred->op)) {
+               parse_error(ps, FILT_ERR_ILLEGAL_FIELD_OP, 0);
+               return -EINVAL;
+       }
+
+       if (is_string_field(field)) {
+               filter_build_regex(pred);
+
+               if (field->filter_type == FILTER_STATIC_STRING) {
+                       fn = filter_pred_string;
+                       pred->regex.field_len = field->size;
+               } else if (field->filter_type == FILTER_DYN_STRING)
+                       fn = filter_pred_strloc;
+               else
+                       fn = filter_pred_pchar;
+       } else if (is_function_field(field)) {
+               if (strcmp(field->name, "ip")) {
+                       parse_error(ps, FILT_ERR_IP_FIELD_ONLY, 0);
+                       return -EINVAL;
+               }
+       } else {
+               if (field->is_signed)
+                       ret = kstrtoll(pred->regex.pattern, 0, &val);
+               else
+                       ret = kstrtoull(pred->regex.pattern, 0, &val);
+               if (ret) {
+                       parse_error(ps, FILT_ERR_ILLEGAL_INTVAL, 0);
+                       return -EINVAL;
+               }
+               pred->val = val;
+
+               fn = select_comparison_fn(pred->op, field->size,
+                                         field->is_signed);
+               if (!fn) {
+                       parse_error(ps, FILT_ERR_INVALID_OP, 0);
+                       return -EINVAL;
+               }
+       }
+
+       if (pred->op == OP_NE)
+               pred->not ^= 1;
+
+       pred->fn = fn;
+       return 0;
+}
+
+static void parse_init(struct filter_parse_state *ps,
+                      struct filter_op *ops,
+                      char *infix_string)
+{
+       memset(ps, '\0', sizeof(*ps));
+
+       ps->infix.string = infix_string;
+       ps->infix.cnt = strlen(infix_string);
+       ps->ops = ops;
+
+       INIT_LIST_HEAD(&ps->opstack);
+       INIT_LIST_HEAD(&ps->postfix);
+}
+
+static char infix_next(struct filter_parse_state *ps)
+{
+       ps->infix.cnt--;
+
+       return ps->infix.string[ps->infix.tail++];
+}
+
+static char infix_peek(struct filter_parse_state *ps)
+{
+       if (ps->infix.tail == strlen(ps->infix.string))
+               return 0;
+
+       return ps->infix.string[ps->infix.tail];
+}
+
+static void infix_advance(struct filter_parse_state *ps)
+{
+       ps->infix.cnt--;
+       ps->infix.tail++;
+}
+
+static inline int is_precedence_lower(struct filter_parse_state *ps,
+                                     int a, int b)
+{
+       return ps->ops[a].precedence < ps->ops[b].precedence;
+}
+
+static inline int is_op_char(struct filter_parse_state *ps, char c)
+{
+       int i;
+
+       for (i = 0; strcmp(ps->ops[i].string, "OP_NONE"); i++) {
+               if (ps->ops[i].string[0] == c)
+                       return 1;
+       }
+
+       return 0;
+}
+
+static int infix_get_op(struct filter_parse_state *ps, char firstc)
+{
+       char nextc = infix_peek(ps);
+       char opstr[3];
+       int i;
+
+       opstr[0] = firstc;
+       opstr[1] = nextc;
+       opstr[2] = '\0';
+
+       for (i = 0; strcmp(ps->ops[i].string, "OP_NONE"); i++) {
+               if (!strcmp(opstr, ps->ops[i].string)) {
+                       infix_advance(ps);
+                       return ps->ops[i].id;
+               }
+       }
+
+       opstr[1] = '\0';
+
+       for (i = 0; strcmp(ps->ops[i].string, "OP_NONE"); i++) {
+               if (!strcmp(opstr, ps->ops[i].string))
+                       return ps->ops[i].id;
+       }
+
+       return OP_NONE;
+}
+
+static inline void clear_operand_string(struct filter_parse_state *ps)
+{
+       memset(ps->operand.string, '\0', MAX_FILTER_STR_VAL);
+       ps->operand.tail = 0;
+}
+
+static inline int append_operand_char(struct filter_parse_state *ps, char c)
+{
+       if (ps->operand.tail == MAX_FILTER_STR_VAL - 1)
+               return -EINVAL;
+
+       ps->operand.string[ps->operand.tail++] = c;
+
+       return 0;
+}
+
+static int filter_opstack_push(struct filter_parse_state *ps, int op)
+{
+       struct opstack_op *opstack_op;
+
+       opstack_op = kmalloc(sizeof(*opstack_op), GFP_KERNEL);
+       if (!opstack_op)
+               return -ENOMEM;
+
+       opstack_op->op = op;
+       list_add(&opstack_op->list, &ps->opstack);
+
+       return 0;
+}
+
+static int filter_opstack_empty(struct filter_parse_state *ps)
+{
+       return list_empty(&ps->opstack);
+}
+
+static int filter_opstack_top(struct filter_parse_state *ps)
+{
+       struct opstack_op *opstack_op;
+
+       if (filter_opstack_empty(ps))
+               return OP_NONE;
+
+       opstack_op = list_first_entry(&ps->opstack, struct opstack_op, list);
+
+       return opstack_op->op;
+}
+
+static int filter_opstack_pop(struct filter_parse_state *ps)
+{
+       struct opstack_op *opstack_op;
+       int op;
+
+       if (filter_opstack_empty(ps))
+               return OP_NONE;
+
+       opstack_op = list_first_entry(&ps->opstack, struct opstack_op, list);
+       op = opstack_op->op;
+       list_del(&opstack_op->list);
+
+       kfree(opstack_op);
+
+       return op;
+}
+
+static void filter_opstack_clear(struct filter_parse_state *ps)
+{
+       while (!filter_opstack_empty(ps))
+               filter_opstack_pop(ps);
+}
+
+static char *curr_operand(struct filter_parse_state *ps)
+{
+       return ps->operand.string;
+}
+
+static int postfix_append_operand(struct filter_parse_state *ps, char *operand)
+{
+       struct postfix_elt *elt;
+
+       elt = kmalloc(sizeof(*elt), GFP_KERNEL);
+       if (!elt)
+               return -ENOMEM;
+
+       elt->op = OP_NONE;
+       elt->operand = kstrdup(operand, GFP_KERNEL);
+       if (!elt->operand) {
+               kfree(elt);
+               return -ENOMEM;
+       }
+
+       list_add_tail(&elt->list, &ps->postfix);
+
+       return 0;
+}
+
+static int postfix_append_op(struct filter_parse_state *ps, int op)
+{
+       struct postfix_elt *elt;
+
+       elt = kmalloc(sizeof(*elt), GFP_KERNEL);
+       if (!elt)
+               return -ENOMEM;
+
+       elt->op = op;
+       elt->operand = NULL;
+
+       list_add_tail(&elt->list, &ps->postfix);
+
+       return 0;
+}
+
+static void postfix_clear(struct filter_parse_state *ps)
+{
+       struct postfix_elt *elt;
+
+       while (!list_empty(&ps->postfix)) {
+               elt = list_first_entry(&ps->postfix, struct postfix_elt, list);
+               list_del(&elt->list);
+               kfree(elt->operand);
+               kfree(elt);
+       }
+}
+
+static int filter_parse(struct filter_parse_state *ps)
+{
+       int in_string = 0;
+       int op, top_op;
+       char ch;
+
+       while ((ch = infix_next(ps))) {
+               if (ch == '"') {
+                       in_string ^= 1;
+                       continue;
+               }
+
+               if (in_string)
+                       goto parse_operand;
+
+               if (isspace(ch))
+                       continue;
+
+               if (is_op_char(ps, ch)) {
+                       op = infix_get_op(ps, ch);
+                       if (op == OP_NONE) {
+                               parse_error(ps, FILT_ERR_INVALID_OP, 0);
+                               return -EINVAL;
+                       }
+
+                       if (strlen(curr_operand(ps))) {
+                               postfix_append_operand(ps, curr_operand(ps));
+                               clear_operand_string(ps);
+                       }
+
+                       while (!filter_opstack_empty(ps)) {
+                               top_op = filter_opstack_top(ps);
+                               if (!is_precedence_lower(ps, top_op, op)) {
+                                       top_op = filter_opstack_pop(ps);
+                                       postfix_append_op(ps, top_op);
+                                       continue;
+                               }
+                               break;
+                       }
+
+                       filter_opstack_push(ps, op);
+                       continue;
+               }
+
+               if (ch == '(') {
+                       filter_opstack_push(ps, OP_OPEN_PAREN);
+                       continue;
+               }
+
+               if (ch == ')') {
+                       if (strlen(curr_operand(ps))) {
+                               postfix_append_operand(ps, curr_operand(ps));
+                               clear_operand_string(ps);
+                       }
+
+                       top_op = filter_opstack_pop(ps);
+                       while (top_op != OP_NONE) {
+                               if (top_op == OP_OPEN_PAREN)
+                                       break;
+                               postfix_append_op(ps, top_op);
+                               top_op = filter_opstack_pop(ps);
+                       }
+                       if (top_op == OP_NONE) {
+                               parse_error(ps, FILT_ERR_UNBALANCED_PAREN, 0);
+                               return -EINVAL;
+                       }
+                       continue;
+               }
+parse_operand:
+               if (append_operand_char(ps, ch)) {
+                       parse_error(ps, FILT_ERR_OPERAND_TOO_LONG, 0);
+                       return -EINVAL;
+               }
+       }
+
+       if (strlen(curr_operand(ps)))
+               postfix_append_operand(ps, curr_operand(ps));
+
+       while (!filter_opstack_empty(ps)) {
+               top_op = filter_opstack_pop(ps);
+               if (top_op == OP_NONE)
+                       break;
+               if (top_op == OP_OPEN_PAREN) {
+                       parse_error(ps, FILT_ERR_UNBALANCED_PAREN, 0);
+                       return -EINVAL;
+               }
+               postfix_append_op(ps, top_op);
+       }
+
+       return 0;
+}
+
+static struct filter_pred *create_pred(struct filter_parse_state *ps,
+                                      struct ftrace_event_call *call,
+                                      int op, char *operand1, char *operand2)
+{
+       struct ftrace_event_field *field;
+       static struct filter_pred pred;
+
+       memset(&pred, 0, sizeof(pred));
+       pred.op = op;
+
+       if (op == OP_AND || op == OP_OR)
+               return &pred;
+
+       if (!operand1 || !operand2) {
+               parse_error(ps, FILT_ERR_MISSING_FIELD, 0);
+               return NULL;
+       }
+
+       field = trace_find_event_field(call, operand1);
+       if (!field) {
+               parse_error(ps, FILT_ERR_FIELD_NOT_FOUND, 0);
+               return NULL;
+       }
+
+       strcpy(pred.regex.pattern, operand2);
+       pred.regex.len = strlen(pred.regex.pattern);
+       pred.field = field;
+       return init_pred(ps, field, &pred) ? NULL : &pred;
+}
+
+static int check_preds(struct filter_parse_state *ps)
+{
+       int n_normal_preds = 0, n_logical_preds = 0;
+       struct postfix_elt *elt;
+       int cnt = 0;
+
+       list_for_each_entry(elt, &ps->postfix, list) {
+               if (elt->op == OP_NONE) {
+                       cnt++;
+                       continue;
+               }
+
+               if (elt->op == OP_AND || elt->op == OP_OR) {
+                       n_logical_preds++;
+                       cnt--;
+                       continue;
+               }
+               if (elt->op != OP_NOT)
+                       cnt--;
+               n_normal_preds++;
+               WARN_ON_ONCE(cnt < 0);
+       }
+
+       if (cnt != 1 || !n_normal_preds || n_logical_preds >= n_normal_preds) {
+               parse_error(ps, FILT_ERR_INVALID_FILTER, 0);
+               return -EINVAL;
+       }
+
+       return 0;
+}
+
+static int count_preds(struct filter_parse_state *ps)
+{
+       struct postfix_elt *elt;
+       int n_preds = 0;
+
+       list_for_each_entry(elt, &ps->postfix, list) {
+               if (elt->op == OP_NONE)
+                       continue;
+               n_preds++;
+       }
+
+       return n_preds;
+}
+
+struct check_pred_data {
+       int count;
+       int max;
+};
+
+static int check_pred_tree_cb(enum move_type move, struct filter_pred *pred,
+                             int *err, void *data)
+{
+       struct check_pred_data *d = data;
+
+       if (WARN_ON(d->count++ > d->max)) {
+               *err = -EINVAL;
+               return WALK_PRED_ABORT;
+       }
+       return WALK_PRED_DEFAULT;
+}
+
+/*
+ * The tree is walked at filtering of an event. If the tree is not correctly
+ * built, it may cause an infinite loop. Check here that the tree does
+ * indeed terminate.
+ */
+static int check_pred_tree(struct event_filter *filter,
+                          struct filter_pred *root)
+{
+       struct check_pred_data data = {
+               /*
+                * The max that we can hit a node is three times.
+                * Once going down, once coming up from left, and
+                * once coming up from right. This is more than enough
+                * since leafs are only hit a single time.
+                */
+               .max   = 3 * filter->n_preds,
+               .count = 0,
+       };
+
+       return walk_pred_tree(filter->preds, root,
+                             check_pred_tree_cb, &data);
+}
+
+static int count_leafs_cb(enum move_type move, struct filter_pred *pred,
+                         int *err, void *data)
+{
+       int *count = data;
+
+       if ((move == MOVE_DOWN) &&
+           (pred->left == FILTER_PRED_INVALID))
+               (*count)++;
+
+       return WALK_PRED_DEFAULT;
+}
+
+static int count_leafs(struct filter_pred *preds, struct filter_pred *root)
+{
+       int count = 0, ret;
+
+       ret = walk_pred_tree(preds, root, count_leafs_cb, &count);
+       WARN_ON(ret);
+       return count;
+}
+
+struct fold_pred_data {
+       struct filter_pred *root;
+       int count;
+       int children;
+};
+
+static int fold_pred_cb(enum move_type move, struct filter_pred *pred,
+                       int *err, void *data)
+{
+       struct fold_pred_data *d = data;
+       struct filter_pred *root = d->root;
+
+       if (move != MOVE_DOWN)
+               return WALK_PRED_DEFAULT;
+       if (pred->left != FILTER_PRED_INVALID)
+               return WALK_PRED_DEFAULT;
+
+       if (WARN_ON(d->count == d->children)) {
+               *err = -EINVAL;
+               return WALK_PRED_ABORT;
+       }
+
+       pred->index &= ~FILTER_PRED_FOLD;
+       root->ops[d->count++] = pred->index;
+       return WALK_PRED_DEFAULT;
+}
+
+static int fold_pred(struct filter_pred *preds, struct filter_pred *root)
+{
+       struct fold_pred_data data = {
+               .root  = root,
+               .count = 0,
+       };
+       int children;
+
+       /* No need to keep the fold flag */
+       root->index &= ~FILTER_PRED_FOLD;
+
+       /* If the root is a leaf then do nothing */
+       if (root->left == FILTER_PRED_INVALID)
+               return 0;
+
+       /* count the children */
+       children = count_leafs(preds, &preds[root->left]);
+       children += count_leafs(preds, &preds[root->right]);
+
+       root->ops = kcalloc(children, sizeof(*root->ops), GFP_KERNEL);
+       if (!root->ops)
+               return -ENOMEM;
+
+       root->val = children;
+       data.children = children;
+       return walk_pred_tree(preds, root, fold_pred_cb, &data);
+}
+
+static int fold_pred_tree_cb(enum move_type move, struct filter_pred *pred,
+                            int *err, void *data)
+{
+       struct filter_pred *preds = data;
+
+       if (move != MOVE_DOWN)
+               return WALK_PRED_DEFAULT;
+       if (!(pred->index & FILTER_PRED_FOLD))
+               return WALK_PRED_DEFAULT;
+
+       *err = fold_pred(preds, pred);
+       if (*err)
+               return WALK_PRED_ABORT;
+
+       /* eveyrhing below is folded, continue with parent */
+       return WALK_PRED_PARENT;
+}
+
+/*
+ * To optimize the processing of the ops, if we have several "ors" or
+ * "ands" together, we can put them in an array and process them all
+ * together speeding up the filter logic.
+ */
+static int fold_pred_tree(struct event_filter *filter,
+                          struct filter_pred *root)
+{
+       return walk_pred_tree(filter->preds, root, fold_pred_tree_cb,
+                             filter->preds);
+}
+
+static int replace_preds(struct ftrace_event_call *call,
+                        struct event_filter *filter,
+                        struct filter_parse_state *ps,
+                        bool dry_run)
+{
+       char *operand1 = NULL, *operand2 = NULL;
+       struct filter_pred *pred;
+       struct filter_pred *root;
+       struct postfix_elt *elt;
+       struct pred_stack stack = { }; /* init to NULL */
+       int err;
+       int n_preds = 0;
+
+       n_preds = count_preds(ps);
+       if (n_preds >= MAX_FILTER_PRED) {
+               parse_error(ps, FILT_ERR_TOO_MANY_PREDS, 0);
+               return -ENOSPC;
+       }
+
+       err = check_preds(ps);
+       if (err)
+               return err;
+
+       if (!dry_run) {
+               err = __alloc_pred_stack(&stack, n_preds);
+               if (err)
+                       return err;
+               err = __alloc_preds(filter, n_preds);
+               if (err)
+                       goto fail;
+       }
+
+       n_preds = 0;
+       list_for_each_entry(elt, &ps->postfix, list) {
+               if (elt->op == OP_NONE) {
+                       if (!operand1)
+                               operand1 = elt->operand;
+                       else if (!operand2)
+                               operand2 = elt->operand;
+                       else {
+                               parse_error(ps, FILT_ERR_TOO_MANY_OPERANDS, 0);
+                               err = -EINVAL;
+                               goto fail;
+                       }
+                       continue;
+               }
+
+               if (elt->op == OP_NOT) {
+                       if (!n_preds || operand1 || operand2) {
+                               parse_error(ps, FILT_ERR_ILLEGAL_NOT_OP, 0);
+                               err = -EINVAL;
+                               goto fail;
+                       }
+                       if (!dry_run)
+                               filter->preds[n_preds - 1].not ^= 1;
+                       continue;
+               }
+
+               if (WARN_ON(n_preds++ == MAX_FILTER_PRED)) {
+                       parse_error(ps, FILT_ERR_TOO_MANY_PREDS, 0);
+                       err = -ENOSPC;
+                       goto fail;
+               }
+
+               pred = create_pred(ps, call, elt->op, operand1, operand2);
+               if (!pred) {
+                       err = -EINVAL;
+                       goto fail;
+               }
+
+               if (!dry_run) {
+                       err = filter_add_pred(ps, filter, pred, &stack);
+                       if (err)
+                               goto fail;
+               }
+
+               operand1 = operand2 = NULL;
+       }
+
+       if (!dry_run) {
+               /* We should have one item left on the stack */
+               pred = __pop_pred_stack(&stack);
+               if (!pred)
+                       return -EINVAL;
+               /* This item is where we start from in matching */
+               root = pred;
+               /* Make sure the stack is empty */
+               pred = __pop_pred_stack(&stack);
+               if (WARN_ON(pred)) {
+                       err = -EINVAL;
+                       filter->root = NULL;
+                       goto fail;
+               }
+               err = check_pred_tree(filter, root);
+               if (err)
+                       goto fail;
+
+               /* Optimize the tree */
+               err = fold_pred_tree(filter, root);
+               if (err)
+                       goto fail;
+
+               /* We don't set root until we know it works */
+               barrier();
+               filter->root = root;
+       }
+
+       err = 0;
+fail:
+       __free_pred_stack(&stack);
+       return err;
+}
+
+static inline void event_set_filtered_flag(struct ftrace_event_file *file)
+{
+       struct ftrace_event_call *call = file->event_call;
+
+       if (call->flags & TRACE_EVENT_FL_USE_CALL_FILTER)
+               call->flags |= TRACE_EVENT_FL_FILTERED;
+       else
+               file->flags |= FTRACE_EVENT_FL_FILTERED;
+}
+
+static inline void event_set_filter(struct ftrace_event_file *file,
+                                   struct event_filter *filter)
+{
+       struct ftrace_event_call *call = file->event_call;
+
+       if (call->flags & TRACE_EVENT_FL_USE_CALL_FILTER)
+               rcu_assign_pointer(call->filter, filter);
+       else
+               rcu_assign_pointer(file->filter, filter);
+}
+
+static inline void event_clear_filter(struct ftrace_event_file *file)
+{
+       struct ftrace_event_call *call = file->event_call;
+
+       if (call->flags & TRACE_EVENT_FL_USE_CALL_FILTER)
+               RCU_INIT_POINTER(call->filter, NULL);
+       else
+               RCU_INIT_POINTER(file->filter, NULL);
+}
+
+static inline void
+event_set_no_set_filter_flag(struct ftrace_event_file *file)
+{
+       struct ftrace_event_call *call = file->event_call;
+
+       if (call->flags & TRACE_EVENT_FL_USE_CALL_FILTER)
+               call->flags |= TRACE_EVENT_FL_NO_SET_FILTER;
+       else
+               file->flags |= FTRACE_EVENT_FL_NO_SET_FILTER;
+}
+
+static inline void
+event_clear_no_set_filter_flag(struct ftrace_event_file *file)
+{
+       struct ftrace_event_call *call = file->event_call;
+
+       if (call->flags & TRACE_EVENT_FL_USE_CALL_FILTER)
+               call->flags &= ~TRACE_EVENT_FL_NO_SET_FILTER;
+       else
+               file->flags &= ~FTRACE_EVENT_FL_NO_SET_FILTER;
+}
+
+static inline bool
+event_no_set_filter_flag(struct ftrace_event_file *file)
+{
+       struct ftrace_event_call *call = file->event_call;
+
+       if (file->flags & FTRACE_EVENT_FL_NO_SET_FILTER)
+               return true;
+
+       if ((call->flags & TRACE_EVENT_FL_USE_CALL_FILTER) &&
+           (call->flags & TRACE_EVENT_FL_NO_SET_FILTER))
+               return true;
+
+       return false;
+}
+
+struct filter_list {
+       struct list_head        list;
+       struct event_filter     *filter;
+};
+
+static int replace_system_preds(struct ftrace_subsystem_dir *dir,
+                               struct trace_array *tr,
+                               struct filter_parse_state *ps,
+                               char *filter_string)
+{
+       struct ftrace_event_file *file;
+       struct filter_list *filter_item;
+       struct filter_list *tmp;
+       LIST_HEAD(filter_list);
+       bool fail = true;
+       int err;
+
+       list_for_each_entry(file, &tr->events, list) {
+               if (file->system != dir)
+                       continue;
+
+               /*
+                * Try to see if the filter can be applied
+                *  (filter arg is ignored on dry_run)
+                */
+               err = replace_preds(file->event_call, NULL, ps, true);
+               if (err)
+                       event_set_no_set_filter_flag(file);
+               else
+                       event_clear_no_set_filter_flag(file);
+       }
+
+       list_for_each_entry(file, &tr->events, list) {
+               struct event_filter *filter;
+
+               if (file->system != dir)
+                       continue;
+
+               if (event_no_set_filter_flag(file))
+                       continue;
+
+               filter_item = kzalloc(sizeof(*filter_item), GFP_KERNEL);
+               if (!filter_item)
+                       goto fail_mem;
+
+               list_add_tail(&filter_item->list, &filter_list);
+
+               filter_item->filter = __alloc_filter();
+               if (!filter_item->filter)
+                       goto fail_mem;
+               filter = filter_item->filter;
+
+               /* Can only fail on no memory */
+               err = replace_filter_string(filter, filter_string);
+               if (err)
+                       goto fail_mem;
+
+               err = replace_preds(file->event_call, filter, ps, false);
+               if (err) {
+                       filter_disable(file);
+                       parse_error(ps, FILT_ERR_BAD_SUBSYS_FILTER, 0);
+                       append_filter_err(ps, filter);
+               } else
+                       event_set_filtered_flag(file);
+               /*
+                * Regardless of if this returned an error, we still
+                * replace the filter for the call.
+                */
+               filter = event_filter(file);
+               event_set_filter(file, filter_item->filter);
+               filter_item->filter = filter;
+
+               fail = false;
+       }
+
+       if (fail)
+               goto fail;
+
+       /*
+        * The calls can still be using the old filters.
+        * Do a synchronize_sched() to ensure all calls are
+        * done with them before we free them.
+        */
+       synchronize_sched();
+       list_for_each_entry_safe(filter_item, tmp, &filter_list, list) {
+               __free_filter(filter_item->filter);
+               list_del(&filter_item->list);
+               kfree(filter_item);
+       }
+       return 0;
+ fail:
+       /* No call succeeded */
+       list_for_each_entry_safe(filter_item, tmp, &filter_list, list) {
+               list_del(&filter_item->list);
+               kfree(filter_item);
+       }
+       parse_error(ps, FILT_ERR_BAD_SUBSYS_FILTER, 0);
+       return -EINVAL;
+ fail_mem:
+       /* If any call succeeded, we still need to sync */
+       if (!fail)
+               synchronize_sched();
+       list_for_each_entry_safe(filter_item, tmp, &filter_list, list) {
+               __free_filter(filter_item->filter);
+               list_del(&filter_item->list);
+               kfree(filter_item);
+       }
+       return -ENOMEM;
+}
+
+static int create_filter_start(char *filter_str, bool set_str,
+                              struct filter_parse_state **psp,
+                              struct event_filter **filterp)
+{
+       struct event_filter *filter;
+       struct filter_parse_state *ps = NULL;
+       int err = 0;
+
+       WARN_ON_ONCE(*psp || *filterp);
+
+       /* allocate everything, and if any fails, free all and fail */
+       filter = __alloc_filter();
+       if (filter && set_str)
+               err = replace_filter_string(filter, filter_str);
+
+       ps = kzalloc(sizeof(*ps), GFP_KERNEL);
+
+       if (!filter || !ps || err) {
+               kfree(ps);
+               __free_filter(filter);
+               return -ENOMEM;
+       }
+
+       /* we're committed to creating a new filter */
+       *filterp = filter;
+       *psp = ps;
+
+       parse_init(ps, filter_ops, filter_str);
+       err = filter_parse(ps);
+       if (err && set_str)
+               append_filter_err(ps, filter);
+       return err;
+}
+
+static void create_filter_finish(struct filter_parse_state *ps)
+{
+       if (ps) {
+               filter_opstack_clear(ps);
+               postfix_clear(ps);
+               kfree(ps);
+       }
+}
+
+/**
+ * create_filter - create a filter for a ftrace_event_call
+ * @call: ftrace_event_call to create a filter for
+ * @filter_str: filter string
+ * @set_str: remember @filter_str and enable detailed error in filter
+ * @filterp: out param for created filter (always updated on return)
+ *
+ * Creates a filter for @call with @filter_str.  If @set_str is %true,
+ * @filter_str is copied and recorded in the new filter.
+ *
+ * On success, returns 0 and *@filterp points to the new filter.  On
+ * failure, returns -errno and *@filterp may point to %NULL or to a new
+ * filter.  In the latter case, the returned filter contains error
+ * information if @set_str is %true and the caller is responsible for
+ * freeing it.
+ */
+static int create_filter(struct ftrace_event_call *call,
+                        char *filter_str, bool set_str,
+                        struct event_filter **filterp)
+{
+       struct event_filter *filter = NULL;
+       struct filter_parse_state *ps = NULL;
+       int err;
+
+       err = create_filter_start(filter_str, set_str, &ps, &filter);
+       if (!err) {
+               err = replace_preds(call, filter, ps, false);
+               if (err && set_str)
+                       append_filter_err(ps, filter);
+       }
+       create_filter_finish(ps);
+
+       *filterp = filter;
+       return err;
+}
+
+int create_event_filter(struct ftrace_event_call *call,
+                       char *filter_str, bool set_str,
+                       struct event_filter **filterp)
+{
+       return create_filter(call, filter_str, set_str, filterp);
+}
+
+/**
+ * create_system_filter - create a filter for an event_subsystem
+ * @system: event_subsystem to create a filter for
+ * @filter_str: filter string
+ * @filterp: out param for created filter (always updated on return)
+ *
+ * Identical to create_filter() except that it creates a subsystem filter
+ * and always remembers @filter_str.
+ */
+static int create_system_filter(struct ftrace_subsystem_dir *dir,
+                               struct trace_array *tr,
+                               char *filter_str, struct event_filter **filterp)
+{
+       struct event_filter *filter = NULL;
+       struct filter_parse_state *ps = NULL;
+       int err;
+
+       err = create_filter_start(filter_str, true, &ps, &filter);
+       if (!err) {
+               err = replace_system_preds(dir, tr, ps, filter_str);
+               if (!err) {
+                       /* System filters just show a default message */
+                       kfree(filter->filter_string);
+                       filter->filter_string = NULL;
+               } else {
+                       append_filter_err(ps, filter);
+               }
+       }
+       create_filter_finish(ps);
+
+       *filterp = filter;
+       return err;
+}
+
+/* caller must hold event_mutex */
+int apply_event_filter(struct ftrace_event_file *file, char *filter_string)
+{
+       struct ftrace_event_call *call = file->event_call;
+       struct event_filter *filter;
+       int err;
+
+       if (!strcmp(strstrip(filter_string), "0")) {
+               filter_disable(file);
+               filter = event_filter(file);
+
+               if (!filter)
+                       return 0;
+
+               event_clear_filter(file);
+
+               /* Make sure the filter is not being used */
+               synchronize_sched();
+               __free_filter(filter);
+
+               return 0;
+       }
+
+       err = create_filter(call, filter_string, true, &filter);
+
+       /*
+        * Always swap the call filter with the new filter
+        * even if there was an error. If there was an error
+        * in the filter, we disable the filter and show the error
+        * string
+        */
+       if (filter) {
+               struct event_filter *tmp;
+
+               tmp = event_filter(file);
+               if (!err)
+                       event_set_filtered_flag(file);
+               else
+                       filter_disable(file);
+
+               event_set_filter(file, filter);
+
+               if (tmp) {
+                       /* Make sure the call is done with the filter */
+                       synchronize_sched();
+                       __free_filter(tmp);
+               }
+       }
+
+       return err;
+}
+
+int apply_subsystem_event_filter(struct ftrace_subsystem_dir *dir,
+                                char *filter_string)
+{
+       struct event_subsystem *system = dir->subsystem;
+       struct trace_array *tr = dir->tr;
+       struct event_filter *filter;
+       int err = 0;
+
+       mutex_lock(&event_mutex);
+
+       /* Make sure the system still has events */
+       if (!dir->nr_events) {
+               err = -ENODEV;
+               goto out_unlock;
+       }
+
+       if (!strcmp(strstrip(filter_string), "0")) {
+               filter_free_subsystem_preds(dir, tr);
+               remove_filter_string(system->filter);
+               filter = system->filter;
+               system->filter = NULL;
+               /* Ensure all filters are no longer used */
+               synchronize_sched();
+               filter_free_subsystem_filters(dir, tr);
+               __free_filter(filter);
+               goto out_unlock;
+       }
+
+       err = create_system_filter(dir, tr, filter_string, &filter);
+       if (filter) {
+               /*
+                * No event actually uses the system filter
+                * we can free it without synchronize_sched().
+                */
+               __free_filter(system->filter);
+               system->filter = filter;
+       }
+out_unlock:
+       mutex_unlock(&event_mutex);
+
+       return err;
+}
+
+#ifdef CONFIG_PERF_EVENTS
+
+void ftrace_profile_free_filter(struct perf_event *event)
+{
+       struct event_filter *filter = event->filter;
+
+       event->filter = NULL;
+       __free_filter(filter);
+}
+
+struct function_filter_data {
+       struct ftrace_ops *ops;
+       int first_filter;
+       int first_notrace;
+};
+
+#ifdef CONFIG_FUNCTION_TRACER
+static char **
+ftrace_function_filter_re(char *buf, int len, int *count)
+{
+       char *str, *sep, **re;
+
+       str = kstrndup(buf, len, GFP_KERNEL);
+       if (!str)
+               return NULL;
+
+       /*
+        * The argv_split function takes white space
+        * as a separator, so convert ',' into spaces.
+        */
+       while ((sep = strchr(str, ',')))
+               *sep = ' ';
+
+       re = argv_split(GFP_KERNEL, str, count);
+       kfree(str);
+       return re;
+}
+
+static int ftrace_function_set_regexp(struct ftrace_ops *ops, int filter,
+                                     int reset, char *re, int len)
+{
+       int ret;
+
+       if (filter)
+               ret = ftrace_set_filter(ops, re, len, reset);
+       else
+               ret = ftrace_set_notrace(ops, re, len, reset);
+
+       return ret;
+}
+
+static int __ftrace_function_set_filter(int filter, char *buf, int len,
+                                       struct function_filter_data *data)
+{
+       int i, re_cnt, ret = -EINVAL;
+       int *reset;
+       char **re;
+
+       reset = filter ? &data->first_filter : &data->first_notrace;
+
+       /*
+        * The 'ip' field could have multiple filters set, separated
+        * either by space or comma. We first cut the filter and apply
+        * all pieces separatelly.
+        */
+       re = ftrace_function_filter_re(buf, len, &re_cnt);
+       if (!re)
+               return -EINVAL;
+
+       for (i = 0; i < re_cnt; i++) {
+               ret = ftrace_function_set_regexp(data->ops, filter, *reset,
+                                                re[i], strlen(re[i]));
+               if (ret)
+                       break;
+
+               if (*reset)
+                       *reset = 0;
+       }
+
+       argv_free(re);
+       return ret;
+}
+
+static int ftrace_function_check_pred(struct filter_pred *pred, int leaf)
+{
+       struct ftrace_event_field *field = pred->field;
+
+       if (leaf) {
+               /*
+                * Check the leaf predicate for function trace, verify:
+                *  - only '==' and '!=' is used
+                *  - the 'ip' field is used
+                */
+               if ((pred->op != OP_EQ) && (pred->op != OP_NE))
+                       return -EINVAL;
+
+               if (strcmp(field->name, "ip"))
+                       return -EINVAL;
+       } else {
+               /*
+                * Check the non leaf predicate for function trace, verify:
+                *  - only '||' is used
+               */
+               if (pred->op != OP_OR)
+                       return -EINVAL;
+       }
+
+       return 0;
+}
+
+static int ftrace_function_set_filter_cb(enum move_type move,
+                                        struct filter_pred *pred,
+                                        int *err, void *data)
+{
+       /* Checking the node is valid for function trace. */
+       if ((move != MOVE_DOWN) ||
+           (pred->left != FILTER_PRED_INVALID)) {
+               *err = ftrace_function_check_pred(pred, 0);
+       } else {
+               *err = ftrace_function_check_pred(pred, 1);
+               if (*err)
+                       return WALK_PRED_ABORT;
+
+               *err = __ftrace_function_set_filter(pred->op == OP_EQ,
+                                                   pred->regex.pattern,
+                                                   pred->regex.len,
+                                                   data);
+       }
+
+       return (*err) ? WALK_PRED_ABORT : WALK_PRED_DEFAULT;
+}
+
+static int ftrace_function_set_filter(struct perf_event *event,
+                                     struct event_filter *filter)
+{
+       struct function_filter_data data = {
+               .first_filter  = 1,
+               .first_notrace = 1,
+               .ops           = &event->ftrace_ops,
+       };
+
+       return walk_pred_tree(filter->preds, filter->root,
+                             ftrace_function_set_filter_cb, &data);
+}
+#else
+static int ftrace_function_set_filter(struct perf_event *event,
+                                     struct event_filter *filter)
+{
+       return -ENODEV;
+}
+#endif /* CONFIG_FUNCTION_TRACER */
+
+int ftrace_profile_set_filter(struct perf_event *event, int event_id,
+                             char *filter_str)
+{
+       int err;
+       struct event_filter *filter;
+       struct ftrace_event_call *call;
+
+       mutex_lock(&event_mutex);
+
+       call = event->tp_event;
+
+       err = -EINVAL;
+       if (!call)
+               goto out_unlock;
+
+       err = -EEXIST;
+       if (event->filter)
+               goto out_unlock;
+
+       err = create_filter(call, filter_str, false, &filter);
+       if (err)
+               goto free_filter;
+
+       if (ftrace_event_is_function(call))
+               err = ftrace_function_set_filter(event, filter);
+       else
+               event->filter = filter;
+
+free_filter:
+       if (err || ftrace_event_is_function(call))
+               __free_filter(filter);
+
+out_unlock:
+       mutex_unlock(&event_mutex);
+
+       return err;
+}
+
+#endif /* CONFIG_PERF_EVENTS */
+
+#ifdef CONFIG_FTRACE_STARTUP_TEST
+
+#include <linux/types.h>
+#include <linux/tracepoint.h>
+
+#define CREATE_TRACE_POINTS
+#include "trace_events_filter_test.h"
+
+#define DATA_REC(m, va, vb, vc, vd, ve, vf, vg, vh, nvisit) \
+{ \
+       .filter = FILTER, \
+       .rec    = { .a = va, .b = vb, .c = vc, .d = vd, \
+                   .e = ve, .f = vf, .g = vg, .h = vh }, \
+       .match  = m, \
+       .not_visited = nvisit, \
+}
+#define YES 1
+#define NO  0
+
+static struct test_filter_data_t {
+       char *filter;
+       struct ftrace_raw_ftrace_test_filter rec;
+       int match;
+       char *not_visited;
+} test_filter_data[] = {
+#define FILTER "a == 1 && b == 1 && c == 1 && d == 1 && " \
+              "e == 1 && f == 1 && g == 1 && h == 1"
+       DATA_REC(YES, 1, 1, 1, 1, 1, 1, 1, 1, ""),
+       DATA_REC(NO,  0, 1, 1, 1, 1, 1, 1, 1, "bcdefgh"),
+       DATA_REC(NO,  1, 1, 1, 1, 1, 1, 1, 0, ""),
+#undef FILTER
+#define FILTER "a == 1 || b == 1 || c == 1 || d == 1 || " \
+              "e == 1 || f == 1 || g == 1 || h == 1"
+       DATA_REC(NO,  0, 0, 0, 0, 0, 0, 0, 0, ""),
+       DATA_REC(YES, 0, 0, 0, 0, 0, 0, 0, 1, ""),
+       DATA_REC(YES, 1, 0, 0, 0, 0, 0, 0, 0, "bcdefgh"),
+#undef FILTER
+#define FILTER "(a == 1 || b == 1) && (c == 1 || d == 1) && " \
+              "(e == 1 || f == 1) && (g == 1 || h == 1)"
+       DATA_REC(NO,  0, 0, 1, 1, 1, 1, 1, 1, "dfh"),
+       DATA_REC(YES, 0, 1, 0, 1, 0, 1, 0, 1, ""),
+       DATA_REC(YES, 1, 0, 1, 0, 0, 1, 0, 1, "bd"),
+       DATA_REC(NO,  1, 0, 1, 0, 0, 1, 0, 0, "bd"),
+#undef FILTER
+#define FILTER "(a == 1 && b == 1) || (c == 1 && d == 1) || " \
+              "(e == 1 && f == 1) || (g == 1 && h == 1)"
+       DATA_REC(YES, 1, 0, 1, 1, 1, 1, 1, 1, "efgh"),
+       DATA_REC(YES, 0, 0, 0, 0, 0, 0, 1, 1, ""),
+       DATA_REC(NO,  0, 0, 0, 0, 0, 0, 0, 1, ""),
+#undef FILTER
+#define FILTER "(a == 1 && b == 1) && (c == 1 && d == 1) && " \
+              "(e == 1 && f == 1) || (g == 1 && h == 1)"
+       DATA_REC(YES, 1, 1, 1, 1, 1, 1, 0, 0, "gh"),
+       DATA_REC(NO,  0, 0, 0, 0, 0, 0, 0, 1, ""),
+       DATA_REC(YES, 1, 1, 1, 1, 1, 0, 1, 1, ""),
+#undef FILTER
+#define FILTER "((a == 1 || b == 1) || (c == 1 || d == 1) || " \
+              "(e == 1 || f == 1)) && (g == 1 || h == 1)"
+       DATA_REC(YES, 1, 1, 1, 1, 1, 1, 0, 1, "bcdef"),
+       DATA_REC(NO,  0, 0, 0, 0, 0, 0, 0, 0, ""),
+       DATA_REC(YES, 1, 1, 1, 1, 1, 0, 1, 1, "h"),
+#undef FILTER
+#define FILTER "((((((((a == 1) && (b == 1)) || (c == 1)) && (d == 1)) || " \
+              "(e == 1)) && (f == 1)) || (g == 1)) && (h == 1))"
+       DATA_REC(YES, 1, 1, 1, 1, 1, 1, 1, 1, "ceg"),
+       DATA_REC(NO,  0, 1, 0, 1, 0, 1, 0, 1, ""),
+       DATA_REC(NO,  1, 0, 1, 0, 1, 0, 1, 0, ""),
+#undef FILTER
+#define FILTER "((((((((a == 1) || (b == 1)) && (c == 1)) || (d == 1)) && " \
+              "(e == 1)) || (f == 1)) && (g == 1)) || (h == 1))"
+       DATA_REC(YES, 1, 1, 1, 1, 1, 1, 1, 1, "bdfh"),
+       DATA_REC(YES, 0, 1, 0, 1, 0, 1, 0, 1, ""),
+       DATA_REC(YES, 1, 0, 1, 0, 1, 0, 1, 0, "bdfh"),
+};
+
+#undef DATA_REC
+#undef FILTER
+#undef YES
+#undef NO
+
+#define DATA_CNT (sizeof(test_filter_data)/sizeof(struct test_filter_data_t))
+
+static int test_pred_visited;
+
+static int test_pred_visited_fn(struct filter_pred *pred, void *event)
+{
+       struct ftrace_event_field *field = pred->field;
+
+       test_pred_visited = 1;
+       printk(KERN_INFO "\npred visited %s\n", field->name);
+       return 1;
+}
+
+static int test_walk_pred_cb(enum move_type move, struct filter_pred *pred,
+                            int *err, void *data)
+{
+       char *fields = data;
+
+       if ((move == MOVE_DOWN) &&
+           (pred->left == FILTER_PRED_INVALID)) {
+               struct ftrace_event_field *field = pred->field;
+
+               if (!field) {
+                       WARN(1, "all leafs should have field defined");
+                       return WALK_PRED_DEFAULT;
+               }
+               if (!strchr(fields, *field->name))
+                       return WALK_PRED_DEFAULT;
+
+               WARN_ON(!pred->fn);
+               pred->fn = test_pred_visited_fn;
+       }
+       return WALK_PRED_DEFAULT;
+}
+
+static __init int ftrace_test_event_filter(void)
+{
+       int i;
+
+       printk(KERN_INFO "Testing ftrace filter: ");
+
+       for (i = 0; i < DATA_CNT; i++) {
+               struct event_filter *filter = NULL;
+               struct test_filter_data_t *d = &test_filter_data[i];
+               int err;
+
+               err = create_filter(&event_ftrace_test_filter, d->filter,
+                                   false, &filter);
+               if (err) {
+                       printk(KERN_INFO
+                              "Failed to get filter for '%s', err %d\n",
+                              d->filter, err);
+                       __free_filter(filter);
+                       break;
+               }
+
+               /*
+                * The preemption disabling is not really needed for self
+                * tests, but the rcu dereference will complain without it.
+                */
+               preempt_disable();
+               if (*d->not_visited)
+                       walk_pred_tree(filter->preds, filter->root,
+                                      test_walk_pred_cb,
+                                      d->not_visited);
+
+               test_pred_visited = 0;
+               err = filter_match_preds(filter, &d->rec);
+               preempt_enable();
+
+               __free_filter(filter);
+
+               if (test_pred_visited) {
+                       printk(KERN_INFO
+                              "Failed, unwanted pred visited for filter %s\n",
+                              d->filter);
+                       break;
+               }
+
+               if (err != d->match) {
+                       printk(KERN_INFO
+                              "Failed to match filter '%s', expected %d\n",
+                              d->filter, d->match);
+                       break;
+               }
+       }
+
+       if (i == DATA_CNT)
+               printk(KERN_CONT "OK\n");
+
+       return 0;
+}
+
+late_initcall(ftrace_test_event_filter);
+
+#endif /* CONFIG_FTRACE_STARTUP_TEST */