|  | /* | 
|  | * Copyright (C) 2007 Mathieu Desnoyers | 
|  | * | 
|  | * This program is free software; you can redistribute it and/or modify | 
|  | * it under the terms of the GNU General Public License as published by | 
|  | * the Free Software Foundation; either version 2 of the License, or | 
|  | * (at your option) any later version. | 
|  | * | 
|  | * This program is distributed in the hope that it will be useful, | 
|  | * but WITHOUT ANY WARRANTY; without even the implied warranty of | 
|  | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the | 
|  | * GNU General Public License for more details. | 
|  | * | 
|  | * You should have received a copy of the GNU General Public License | 
|  | * along with this program; if not, write to the Free Software | 
|  | * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. | 
|  | */ | 
|  | #include <linux/module.h> | 
|  | #include <linux/mutex.h> | 
|  | #include <linux/types.h> | 
|  | #include <linux/jhash.h> | 
|  | #include <linux/list.h> | 
|  | #include <linux/rcupdate.h> | 
|  | #include <linux/marker.h> | 
|  | #include <linux/err.h> | 
|  |  | 
/*
 * Bounds of the core kernel marker array: marker_update_probes() walks the
 * half-open range [__start___markers, __stop___markers).
 * NOTE(review): presumably emitted by the linker script for the markers
 * section -- confirm against the architecture linker scripts.
 */
extern struct marker __start___markers[];
extern struct marker __stop___markers[];
|  |  | 
/*
 * markers_mutex nests inside module_mutex. Markers mutex protects the builtin
 * and module markers, the hash table and deferred_sync.
 *
 * It is taken by the register/unregister/arm/disarm entry points and by
 * marker_update_probe_range(); the static hash table helpers expect the
 * caller to already hold it.
 */
static DEFINE_MUTEX(markers_mutex);
|  |  | 
/*
 * Marker deferred synchronization.
 * Upon marker probe_unregister, we delay call to synchronize_sched() to
 * accelerate mass unregistration (only when there is no more reference to a
 * given module do we call synchronize_sched()). However, we need to make sure
 * every critical region has ended before we re-arm a marker that has been
 * unregistered and then registered back with a different probe data.
 *
 * Set to 1 by the unregister paths once an entry has been removed; reset to 0
 * right after a synchronize_sched() in marker_probe_register() and in
 * marker_update_probes().
 */
static int deferred_sync;
|  |  | 
/*
 * Marker hash table, containing the active markers.
 * Protected by markers_mutex.
 *
 * MARKER_HASH_BITS is the number of hash bits used to select a bucket;
 * MARKER_TABLE_SIZE is the resulting bucket count (1 << 6 = 64).
 */
#define MARKER_HASH_BITS 6
#define MARKER_TABLE_SIZE (1 << MARKER_HASH_BITS)
|  |  | 
/*
 * One registered probe, keyed by marker name. The entry is allocated with
 * extra room after the structure: the name string, followed (when a format
 * is known) by the format string.
 */
struct marker_entry {
	struct hlist_node hlist;	/* Link in a marker_table bucket chain */
	char *format;	/* Points into name[] past the name's '\0', or NULL */
	marker_probe_func *probe;	/* Probe handler installed on arming */
	void *private;	/* Opaque data supplied at registration */
	int refcount;	/* Number of times armed. 0 if disarmed. */
	char name[0];	/* Contains name'\0'format'\0' */
};
|  |  | 
/*
 * Buckets of struct marker_entry chained through their hlist member. The
 * bucket index is jhash() of the marker name masked to MARKER_HASH_BITS bits.
 */
static struct hlist_head marker_table[MARKER_TABLE_SIZE];
|  |  | 
/**
 * __mark_empty_function - Empty probe callback
 * @mdata: pointer of type const struct marker
 * @private: probe private data (ignored)
 * @fmt: format string
 * @...: variable argument list
 *
 * Empty callback provided as a probe to the markers. By providing this to a
 * disabled marker, we make sure the execution flow is always valid even
 * though the function pointer change and the marker enabling are two distinct
 * operations that modify the execution flow of preemptible code.
 */
void __mark_empty_function(const struct marker *mdata, void *private,
	const char *fmt, ...)
{
}
EXPORT_SYMBOL_GPL(__mark_empty_function);
|  |  | 
|  | /* | 
|  | * Get marker if the marker is present in the marker hash table. | 
|  | * Must be called with markers_mutex held. | 
|  | * Returns NULL if not present. | 
|  | */ | 
|  | static struct marker_entry *get_marker(const char *name) | 
|  | { | 
|  | struct hlist_head *head; | 
|  | struct hlist_node *node; | 
|  | struct marker_entry *e; | 
|  | u32 hash = jhash(name, strlen(name), 0); | 
|  |  | 
|  | head = &marker_table[hash & ((1 << MARKER_HASH_BITS)-1)]; | 
|  | hlist_for_each_entry(e, node, head, hlist) { | 
|  | if (!strcmp(name, e->name)) | 
|  | return e; | 
|  | } | 
|  | return NULL; | 
|  | } | 
|  |  | 
|  | /* | 
|  | * Add the marker to the marker hash table. Must be called with markers_mutex | 
|  | * held. | 
|  | */ | 
|  | static int add_marker(const char *name, const char *format, | 
|  | marker_probe_func *probe, void *private) | 
|  | { | 
|  | struct hlist_head *head; | 
|  | struct hlist_node *node; | 
|  | struct marker_entry *e; | 
|  | size_t name_len = strlen(name) + 1; | 
|  | size_t format_len = 0; | 
|  | u32 hash = jhash(name, name_len-1, 0); | 
|  |  | 
|  | if (format) | 
|  | format_len = strlen(format) + 1; | 
|  | head = &marker_table[hash & ((1 << MARKER_HASH_BITS)-1)]; | 
|  | hlist_for_each_entry(e, node, head, hlist) { | 
|  | if (!strcmp(name, e->name)) { | 
|  | printk(KERN_NOTICE | 
|  | "Marker %s busy, probe %p already installed\n", | 
|  | name, e->probe); | 
|  | return -EBUSY;	/* Already there */ | 
|  | } | 
|  | } | 
|  | /* | 
|  | * Using kmalloc here to allocate a variable length element. Could | 
|  | * cause some memory fragmentation if overused. | 
|  | */ | 
|  | e = kmalloc(sizeof(struct marker_entry) + name_len + format_len, | 
|  | GFP_KERNEL); | 
|  | if (!e) | 
|  | return -ENOMEM; | 
|  | memcpy(&e->name[0], name, name_len); | 
|  | if (format) { | 
|  | e->format = &e->name[name_len]; | 
|  | memcpy(e->format, format, format_len); | 
|  | trace_mark(core_marker_format, "name %s format %s", | 
|  | e->name, e->format); | 
|  | } else | 
|  | e->format = NULL; | 
|  | e->probe = probe; | 
|  | e->private = private; | 
|  | e->refcount = 0; | 
|  | hlist_add_head(&e->hlist, head); | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | /* | 
|  | * Remove the marker from the marker hash table. Must be called with mutex_lock | 
|  | * held. | 
|  | */ | 
|  | static void *remove_marker(const char *name) | 
|  | { | 
|  | struct hlist_head *head; | 
|  | struct hlist_node *node; | 
|  | struct marker_entry *e; | 
|  | int found = 0; | 
|  | size_t len = strlen(name) + 1; | 
|  | void *private = NULL; | 
|  | u32 hash = jhash(name, len-1, 0); | 
|  |  | 
|  | head = &marker_table[hash & ((1 << MARKER_HASH_BITS)-1)]; | 
|  | hlist_for_each_entry(e, node, head, hlist) { | 
|  | if (!strcmp(name, e->name)) { | 
|  | found = 1; | 
|  | break; | 
|  | } | 
|  | } | 
|  | if (found) { | 
|  | private = e->private; | 
|  | hlist_del(&e->hlist); | 
|  | kfree(e); | 
|  | } | 
|  | return private; | 
|  | } | 
|  |  | 
|  | /* | 
|  | * Set the mark_entry format to the format found in the element. | 
|  | */ | 
|  | static int marker_set_format(struct marker_entry **entry, const char *format) | 
|  | { | 
|  | struct marker_entry *e; | 
|  | size_t name_len = strlen((*entry)->name) + 1; | 
|  | size_t format_len = strlen(format) + 1; | 
|  |  | 
|  | e = kmalloc(sizeof(struct marker_entry) + name_len + format_len, | 
|  | GFP_KERNEL); | 
|  | if (!e) | 
|  | return -ENOMEM; | 
|  | memcpy(&e->name[0], (*entry)->name, name_len); | 
|  | e->format = &e->name[name_len]; | 
|  | memcpy(e->format, format, format_len); | 
|  | e->probe = (*entry)->probe; | 
|  | e->private = (*entry)->private; | 
|  | e->refcount = (*entry)->refcount; | 
|  | hlist_add_before(&e->hlist, &(*entry)->hlist); | 
|  | hlist_del(&(*entry)->hlist); | 
|  | kfree(*entry); | 
|  | *entry = e; | 
|  | trace_mark(core_marker_format, "name %s format %s", | 
|  | e->name, e->format); | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | /* | 
|  | * Sets the probe callback corresponding to one marker. | 
|  | */ | 
|  | static int set_marker(struct marker_entry **entry, struct marker *elem) | 
|  | { | 
|  | int ret; | 
|  | WARN_ON(strcmp((*entry)->name, elem->name) != 0); | 
|  |  | 
|  | if ((*entry)->format) { | 
|  | if (strcmp((*entry)->format, elem->format) != 0) { | 
|  | printk(KERN_NOTICE | 
|  | "Format mismatch for probe %s " | 
|  | "(%s), marker (%s)\n", | 
|  | (*entry)->name, | 
|  | (*entry)->format, | 
|  | elem->format); | 
|  | return -EPERM; | 
|  | } | 
|  | } else { | 
|  | ret = marker_set_format(entry, elem->format); | 
|  | if (ret) | 
|  | return ret; | 
|  | } | 
|  | elem->call = (*entry)->probe; | 
|  | elem->private = (*entry)->private; | 
|  | elem->state = 1; | 
|  | return 0; | 
|  | } | 
|  |  | 
/*
 * Disable a marker and its probe callback.
 * Note: only a synchronize_sched() issued after setting elem->call to the
 * empty function ensures that the original callback is not used anymore.
 * This is ensured by preemption disabling around the call site.
 */
static void disable_marker(struct marker *elem)
{
	/* Flag the site inactive first, then swap in the no-op callback. */
	elem->state = 0;
	elem->call = __mark_empty_function;
	/*
	 * Leave the private data and id there, because removal is racy and
	 * should be done only after a synchronize_sched(). These are never used
	 * until the next initialization anyway.
	 */
}
|  |  | 
|  | /** | 
|  | * marker_update_probe_range - Update a probe range | 
|  | * @begin: beginning of the range | 
|  | * @end: end of the range | 
|  | * @probe_module: module address of the probe being updated | 
|  | * @refcount: number of references left to the given probe_module (out) | 
|  | * | 
|  | * Updates the probe callback corresponding to a range of markers. | 
|  | */ | 
|  | void marker_update_probe_range(struct marker *begin, | 
|  | struct marker *end, struct module *probe_module, | 
|  | int *refcount) | 
|  | { | 
|  | struct marker *iter; | 
|  | struct marker_entry *mark_entry; | 
|  |  | 
|  | mutex_lock(&markers_mutex); | 
|  | for (iter = begin; iter < end; iter++) { | 
|  | mark_entry = get_marker(iter->name); | 
|  | if (mark_entry && mark_entry->refcount) { | 
|  | set_marker(&mark_entry, iter); | 
|  | /* | 
|  | * ignore error, continue | 
|  | */ | 
|  | if (probe_module) | 
|  | if (probe_module == | 
|  | __module_text_address((unsigned long)mark_entry->probe)) | 
|  | (*refcount)++; | 
|  | } else { | 
|  | disable_marker(iter); | 
|  | } | 
|  | } | 
|  | mutex_unlock(&markers_mutex); | 
|  | } | 
|  |  | 
|  | /* | 
|  | * Update probes, removing the faulty probes. | 
|  | * Issues a synchronize_sched() when no reference to the module passed | 
|  | * as parameter is found in the probes so the probe module can be | 
|  | * safely unloaded from now on. | 
|  | */ | 
|  | static void marker_update_probes(struct module *probe_module) | 
|  | { | 
|  | int refcount = 0; | 
|  |  | 
|  | /* Core kernel markers */ | 
|  | marker_update_probe_range(__start___markers, | 
|  | __stop___markers, probe_module, &refcount); | 
|  | /* Markers in modules. */ | 
|  | module_update_markers(probe_module, &refcount); | 
|  | if (probe_module && refcount == 0) { | 
|  | synchronize_sched(); | 
|  | deferred_sync = 0; | 
|  | } | 
|  | } | 
|  |  | 
|  | /** | 
|  | * marker_probe_register -  Connect a probe to a marker | 
|  | * @name: marker name | 
|  | * @format: format string | 
|  | * @probe: probe handler | 
|  | * @private: probe private data | 
|  | * | 
|  | * private data must be a valid allocated memory address, or NULL. | 
|  | * Returns 0 if ok, error value on error. | 
|  | */ | 
|  | int marker_probe_register(const char *name, const char *format, | 
|  | marker_probe_func *probe, void *private) | 
|  | { | 
|  | struct marker_entry *entry; | 
|  | int ret = 0; | 
|  |  | 
|  | mutex_lock(&markers_mutex); | 
|  | entry = get_marker(name); | 
|  | if (entry && entry->refcount) { | 
|  | ret = -EBUSY; | 
|  | goto end; | 
|  | } | 
|  | if (deferred_sync) { | 
|  | synchronize_sched(); | 
|  | deferred_sync = 0; | 
|  | } | 
|  | ret = add_marker(name, format, probe, private); | 
|  | if (ret) | 
|  | goto end; | 
|  | mutex_unlock(&markers_mutex); | 
|  | marker_update_probes(NULL); | 
|  | return ret; | 
|  | end: | 
|  | mutex_unlock(&markers_mutex); | 
|  | return ret; | 
|  | } | 
|  | EXPORT_SYMBOL_GPL(marker_probe_register); | 
|  |  | 
|  | /** | 
|  | * marker_probe_unregister -  Disconnect a probe from a marker | 
|  | * @name: marker name | 
|  | * | 
|  | * Returns the private data given to marker_probe_register, or an ERR_PTR(). | 
|  | */ | 
|  | void *marker_probe_unregister(const char *name) | 
|  | { | 
|  | struct module *probe_module; | 
|  | struct marker_entry *entry; | 
|  | void *private; | 
|  |  | 
|  | mutex_lock(&markers_mutex); | 
|  | entry = get_marker(name); | 
|  | if (!entry) { | 
|  | private = ERR_PTR(-ENOENT); | 
|  | goto end; | 
|  | } | 
|  | entry->refcount = 0; | 
|  | /* In what module is the probe handler ? */ | 
|  | probe_module = __module_text_address((unsigned long)entry->probe); | 
|  | private = remove_marker(name); | 
|  | deferred_sync = 1; | 
|  | mutex_unlock(&markers_mutex); | 
|  | marker_update_probes(probe_module); | 
|  | return private; | 
|  | end: | 
|  | mutex_unlock(&markers_mutex); | 
|  | return private; | 
|  | } | 
|  | EXPORT_SYMBOL_GPL(marker_probe_unregister); | 
|  |  | 
|  | /** | 
|  | * marker_probe_unregister_private_data -  Disconnect a probe from a marker | 
|  | * @private: probe private data | 
|  | * | 
|  | * Unregister a marker by providing the registered private data. | 
|  | * Returns the private data given to marker_probe_register, or an ERR_PTR(). | 
|  | */ | 
|  | void *marker_probe_unregister_private_data(void *private) | 
|  | { | 
|  | struct module *probe_module; | 
|  | struct hlist_head *head; | 
|  | struct hlist_node *node; | 
|  | struct marker_entry *entry; | 
|  | int found = 0; | 
|  | unsigned int i; | 
|  |  | 
|  | mutex_lock(&markers_mutex); | 
|  | for (i = 0; i < MARKER_TABLE_SIZE; i++) { | 
|  | head = &marker_table[i]; | 
|  | hlist_for_each_entry(entry, node, head, hlist) { | 
|  | if (entry->private == private) { | 
|  | found = 1; | 
|  | goto iter_end; | 
|  | } | 
|  | } | 
|  | } | 
|  | iter_end: | 
|  | if (!found) { | 
|  | private = ERR_PTR(-ENOENT); | 
|  | goto end; | 
|  | } | 
|  | entry->refcount = 0; | 
|  | /* In what module is the probe handler ? */ | 
|  | probe_module = __module_text_address((unsigned long)entry->probe); | 
|  | private = remove_marker(entry->name); | 
|  | deferred_sync = 1; | 
|  | mutex_unlock(&markers_mutex); | 
|  | marker_update_probes(probe_module); | 
|  | return private; | 
|  | end: | 
|  | mutex_unlock(&markers_mutex); | 
|  | return private; | 
|  | } | 
|  | EXPORT_SYMBOL_GPL(marker_probe_unregister_private_data); | 
|  |  | 
|  | /** | 
|  | * marker_arm - Arm a marker | 
|  | * @name: marker name | 
|  | * | 
|  | * Activate a marker. It keeps a reference count of the number of | 
|  | * arming/disarming done. | 
|  | * Returns 0 if ok, error value on error. | 
|  | */ | 
|  | int marker_arm(const char *name) | 
|  | { | 
|  | struct marker_entry *entry; | 
|  | int ret = 0; | 
|  |  | 
|  | mutex_lock(&markers_mutex); | 
|  | entry = get_marker(name); | 
|  | if (!entry) { | 
|  | ret = -ENOENT; | 
|  | goto end; | 
|  | } | 
|  | /* | 
|  | * Only need to update probes when refcount passes from 0 to 1. | 
|  | */ | 
|  | if (entry->refcount++) | 
|  | goto end; | 
|  | end: | 
|  | mutex_unlock(&markers_mutex); | 
|  | marker_update_probes(NULL); | 
|  | return ret; | 
|  | } | 
|  | EXPORT_SYMBOL_GPL(marker_arm); | 
|  |  | 
|  | /** | 
|  | * marker_disarm - Disarm a marker | 
|  | * @name: marker name | 
|  | * | 
|  | * Disarm a marker. It keeps a reference count of the number of arming/disarming | 
|  | * done. | 
|  | * Returns 0 if ok, error value on error. | 
|  | */ | 
|  | int marker_disarm(const char *name) | 
|  | { | 
|  | struct marker_entry *entry; | 
|  | int ret = 0; | 
|  |  | 
|  | mutex_lock(&markers_mutex); | 
|  | entry = get_marker(name); | 
|  | if (!entry) { | 
|  | ret = -ENOENT; | 
|  | goto end; | 
|  | } | 
|  | /* | 
|  | * Only permit decrement refcount if higher than 0. | 
|  | * Do probe update only on 1 -> 0 transition. | 
|  | */ | 
|  | if (entry->refcount) { | 
|  | if (--entry->refcount) | 
|  | goto end; | 
|  | } else { | 
|  | ret = -EPERM; | 
|  | goto end; | 
|  | } | 
|  | end: | 
|  | mutex_unlock(&markers_mutex); | 
|  | marker_update_probes(NULL); | 
|  | return ret; | 
|  | } | 
|  | EXPORT_SYMBOL_GPL(marker_disarm); | 
|  |  | 
|  | /** | 
|  | * marker_get_private_data - Get a marker's probe private data | 
|  | * @name: marker name | 
|  | * | 
|  | * Returns the private data pointer, or an ERR_PTR. | 
|  | * The private data pointer should _only_ be dereferenced if the caller is the | 
|  | * owner of the data, or its content could vanish. This is mostly used to | 
|  | * confirm that a caller is the owner of a registered probe. | 
|  | */ | 
|  | void *marker_get_private_data(const char *name) | 
|  | { | 
|  | struct hlist_head *head; | 
|  | struct hlist_node *node; | 
|  | struct marker_entry *e; | 
|  | size_t name_len = strlen(name) + 1; | 
|  | u32 hash = jhash(name, name_len-1, 0); | 
|  | int found = 0; | 
|  |  | 
|  | head = &marker_table[hash & ((1 << MARKER_HASH_BITS)-1)]; | 
|  | hlist_for_each_entry(e, node, head, hlist) { | 
|  | if (!strcmp(name, e->name)) { | 
|  | found = 1; | 
|  | return e->private; | 
|  | } | 
|  | } | 
|  | return ERR_PTR(-ENOENT); | 
|  | } | 
|  | EXPORT_SYMBOL_GPL(marker_get_private_data); |