/* auditsc.c -- System-call auditing support * Handles all system-call specific auditing features. * * Copyright 2003-2004 Red Hat Inc., Durham, North Carolina. * All Rights Reserved. * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA * * Written by Rickard E. (Rik) Faith <faith@redhat.com> * * Many of the ideas implemented here are from Stephen C. Tweedie, * especially the idea of avoiding a copy by using getname. * * The method for actual interception of syscall entry and exit (not in * this file -- see entry.S) is based on a GPL'd patch written by * okir@suse.de and Copyright 2003 SuSE Linux AG. * */ #include <linux/init.h> #include <asm/types.h> #include <asm/atomic.h> #include <linux/mm.h> #include <linux/module.h> #include <linux/mount.h> #include <linux/socket.h> #include <linux/audit.h> #include <linux/personality.h> #include <linux/time.h> #include <linux/kthread.h> #include <linux/netlink.h> #include <linux/compiler.h> #include <asm/unistd.h> /* 0 = no checking 1 = put_count checking 2 = verbose put_count checking */ #define AUDIT_DEBUG 0 /* No syscall auditing will take place unless audit_enabled != 0. */ extern int audit_enabled; /* AUDIT_NAMES is the number of slots we reserve in the audit_context * for saving names from getname(). 
*/
#define AUDIT_NAMES 20

/* AUDIT_NAMES_RESERVED is the number of slots we reserve in the
 * audit_context from being used for nameless inodes from
 * path_lookup.  audit_inode() stops adding nameless entries once
 * name_count reaches AUDIT_NAMES - AUDIT_NAMES_RESERVED. */
#define AUDIT_NAMES_RESERVED 7

/* At task start time, the audit_state is set in the audit_context using
   a per-task filter.  At syscall entry, the audit_state is augmented by
   the syscall filter. */
enum audit_state {
	AUDIT_DISABLED,		/* Do not create per-task audit_context.
				 * No syscall-specific audit records can
				 * be generated. */
	AUDIT_SETUP_CONTEXT,	/* Create the per-task audit_context,
				 * but don't necessarily fill it in at
				 * syscall entry time (i.e., filter
				 * instead). */
	AUDIT_BUILD_CONTEXT,	/* Create the per-task audit_context,
				 * and always fill it in at syscall
				 * entry time.  This makes a full
				 * syscall record available if some
				 * other part of the kernel decides it
				 * should be recorded. */
	AUDIT_RECORD_CONTEXT	/* Create the per-task audit_context,
				 * always fill it in at syscall entry
				 * time, and always write out the audit
				 * record at syscall exit time.  */
};

/* When fs/namei.c:getname() is called, we store the pointer in name and
 * we don't let putname() free it (instead we free all of the saved
 * pointers at syscall exit time).
 *
 * Further, in fs/namei.c:path_lookup() we store the inode and device.
 *
 * One entry describes one path/inode touched during the current syscall.
 * name may be NULL for an inode recorded without an associated name, and
 * ino is set to (unsigned long)-1 by audit_getname() until audit_inode()
 * fills in the inode details. */
struct audit_names {
	const char *name;	/* saved getname() pointer, or NULL */
	unsigned long ino;	/* inode number, (unsigned long)-1 if unknown */
	dev_t dev;		/* device of the inode's superblock */
	umode_t mode;		/* inode mode */
	uid_t uid;		/* inode owner uid */
	gid_t gid;		/* inode owner gid */
	dev_t rdev;		/* inode i_rdev */
	unsigned flags;		/* flags passed to audit_inode() */
};

/* Common header of every auxiliary record hung off audit_context.aux.
 * Records form a singly linked list through next; type selects how the
 * record is logged and freed. */
struct audit_aux_data {
	struct audit_aux_data *next;
	int type;
};

#define AUDIT_AUX_IPCPERM 0

/* Auxiliary record filled in by audit_ipc_perms() (type AUDIT_IPC).
 * NOTE(review): the p member is never written or read in this file. */
struct audit_aux_data_ipcctl {
	struct audit_aux_data d;
	struct ipc_perm p;
	unsigned long qbytes;
	uid_t uid;
	gid_t gid;
	mode_t mode;
};

/* Auxiliary record filled in by audit_socketcall() (type
 * AUDIT_SOCKETCALL); args holds nargs trailing values allocated together
 * with the structure. */
struct audit_aux_data_socketcall {
	struct audit_aux_data d;
	int nargs;
	unsigned long args[0];
};

/* Auxiliary record filled in by audit_sockaddr() (type AUDIT_SOCKADDR);
 * a holds len trailing bytes allocated together with the structure. */
struct audit_aux_data_sockaddr {
	struct audit_aux_data d;
	int len;
	char a[0];
};

/* Auxiliary record filled in by audit_avc_path() (type AUDIT_AVC_PATH).
 * Holds references on dentry and mnt that audit_free_aux() drops. */
struct audit_aux_data_path {
	struct audit_aux_data d;
	struct dentry *dentry;
	struct vfsmount *mnt;
};

/* The per-task audit context.
*/
struct audit_context {
	int in_syscall;		/* 1 if task is in a syscall */
	enum audit_state state;	/* state chosen by the filters for this context */
	unsigned int serial;	/* serial number for record */
	struct timespec ctime;	/* time of syscall entry */
	uid_t loginuid;		/* login uid (identity) */
	int major;		/* syscall number */
	unsigned long argv[4];	/* syscall arguments */
	int return_valid;	/* return code is valid */
	long return_code;/* syscall return code */
	int auditable;		/* 1 if record should be written */
	int name_count;		/* number of used entries in names[] */
	struct audit_names names[AUDIT_NAMES];
	struct dentry * pwd;	/* cwd dentry captured by audit_getname() */
	struct vfsmount * pwdmnt; /* cwd mount captured by audit_getname() */
	struct audit_context *previous; /* For nested syscalls */
	struct audit_aux_data *aux; /* list of auxiliary records */

	/* Save things to print about task_struct */
	pid_t pid;
	uid_t uid, euid, suid, fsuid;
	gid_t gid, egid, sgid, fsgid;
	unsigned long personality;
	int arch;

#if AUDIT_DEBUG
	int put_count;		/* putname calls seen during the syscall */
	int ino_count;		/* nameless inode entries added */
#endif
};

/* Public API */

/* There is one list of rules per filter, AUDIT_NR_FILTERS (5) in total.
 * The lists consulted in this file are the ones indexed by
 * AUDIT_FILTER_TASK (searched at task creation time),
 * AUDIT_FILTER_ENTRY (syscall entry time), AUDIT_FILTER_EXIT (syscall
 * exit time) and AUDIT_FILTER_USER (user-originated messages). */
static struct list_head audit_filter_list[AUDIT_NR_FILTERS] = {
	LIST_HEAD_INIT(audit_filter_list[0]),
	LIST_HEAD_INIT(audit_filter_list[1]),
	LIST_HEAD_INIT(audit_filter_list[2]),
	LIST_HEAD_INIT(audit_filter_list[3]),
	LIST_HEAD_INIT(audit_filter_list[4]),
#if AUDIT_NR_FILTERS != 5
#error Fix audit_filter_list initialiser
#endif
};

/* One installed rule: list links it into an audit_filter_list[] entry,
 * rcu is used to defer freeing after removal (see audit_del_rule). */
struct audit_entry {
	struct list_head list;
	struct rcu_head rcu;
	struct audit_rule rule;
};

extern int audit_pid;

/* Copy rule from user-space to kernel-space.  Called from
 * audit_add_rule during AUDIT_ADD.
*/ static inline int audit_copy_rule(struct audit_rule *d, struct audit_rule *s) { int i; if (s->action != AUDIT_NEVER && s->action != AUDIT_POSSIBLE && s->action != AUDIT_ALWAYS) return -1; if (s->field_count < 0 || s->field_count > AUDIT_MAX_FIELDS) return -1; if ((s->flags & ~AUDIT_FILTER_PREPEND) >= AUDIT_NR_FILTERS) return -1; d->flags = s->flags; d->action = s->action; d->field_count = s->field_count; for (i = 0; i < d->field_count; i++) { d->fields[i] = s->fields[i]; d->values[i] = s->values[i]; } for (i = 0; i < AUDIT_BITMASK_SIZE; i++) d->mask[i] = s->mask[i]; return 0; } /* Check to see if two rules are identical. It is called from * audit_add_rule during AUDIT_ADD and * audit_del_rule during AUDIT_DEL. */ static inline int audit_compare_rule(struct audit_rule *a, struct audit_rule *b) { int i; if (a->flags != b->flags) return 1; if (a->action != b->action) return 1; if (a->field_count != b->field_count) return 1; for (i = 0; i < a->field_count; i++) { if (a->fields[i] != b->fields[i] || a->values[i] != b->values[i]) return 1; } for (i = 0; i < AUDIT_BITMASK_SIZE; i++) if (a->mask[i] != b->mask[i]) return 1; return 0; } /* Note that audit_add_rule and audit_del_rule are called via * audit_receive() in audit.c, and are protected by * audit_netlink_sem. */ static inline int audit_add_rule(struct audit_rule *rule, struct list_head *list) { struct audit_entry *entry; /* Do not use the _rcu iterator here, since this is the only * addition routine. 
*/ list_for_each_entry(entry, list, list) { if (!audit_compare_rule(rule, &entry->rule)) { return -EEXIST; } } if (!(entry = kmalloc(sizeof(*entry), GFP_KERNEL))) return -ENOMEM; if (audit_copy_rule(&entry->rule, rule)) { kfree(entry); return -EINVAL; } if (entry->rule.flags & AUDIT_FILTER_PREPEND) { entry->rule.flags &= ~AUDIT_FILTER_PREPEND; list_add_rcu(&entry->list, list); } else { list_add_tail_rcu(&entry->list, list); } return 0; } static inline void audit_free_rule(struct rcu_head *head) { struct audit_entry *e = container_of(head, struct audit_entry, rcu); kfree(e); } /* Note that audit_add_rule and audit_del_rule are called via * audit_receive() in audit.c, and are protected by * audit_netlink_sem. */ static inline int audit_del_rule(struct audit_rule *rule, struct list_head *list) { struct audit_entry *e; /* Do not use the _rcu iterator here, since this is the only * deletion routine. */ list_for_each_entry(e, list, list) { if (!audit_compare_rule(rule, &e->rule)) { list_del_rcu(&e->list); call_rcu(&e->rcu, audit_free_rule); return 0; } } return -ENOENT; /* No matching rule */ } static int audit_list_rules(void *_dest) { int pid, seq; int *dest = _dest; struct audit_entry *entry; int i; pid = dest[0]; seq = dest[1]; kfree(dest); down(&audit_netlink_sem); /* The *_rcu iterators not needed here because we are always called with audit_netlink_sem held. */ for (i=0; i<AUDIT_NR_FILTERS; i++) { list_for_each_entry(entry, &audit_filter_list[i], list) audit_send_reply(pid, seq, AUDIT_LIST, 0, 1, &entry->rule, sizeof(entry->rule)); } audit_send_reply(pid, seq, AUDIT_LIST, 1, 1, NULL, 0); up(&audit_netlink_sem); return 0; } int audit_receive_filter(int type, int pid, int uid, int seq, void *data, uid_t loginuid) { struct task_struct *tsk; int *dest; int err = 0; unsigned listnr; switch (type) { case AUDIT_LIST: /* We can't just spew out the rules here because we might fill * the available socket buffer space and deadlock waiting for * auditctl to read from it... 
which isn't ever going to * happen if we're actually running in the context of auditctl * trying to _send_ the stuff */ dest = kmalloc(2 * sizeof(int), GFP_KERNEL); if (!dest) return -ENOMEM; dest[0] = pid; dest[1] = seq; tsk = kthread_run(audit_list_rules, dest, "audit_list_rules"); if (IS_ERR(tsk)) { kfree(dest); err = PTR_ERR(tsk); } break; case AUDIT_ADD: listnr =((struct audit_rule *)data)->flags & ~AUDIT_FILTER_PREPEND; if (listnr >= AUDIT_NR_FILTERS) return -EINVAL; err = audit_add_rule(data, &audit_filter_list[listnr]); if (!err) audit_log(NULL, GFP_KERNEL, AUDIT_CONFIG_CHANGE, "auid=%u added an audit rule\n", loginuid); break; case AUDIT_DEL: listnr =((struct audit_rule *)data)->flags & ~AUDIT_FILTER_PREPEND; if (listnr >= AUDIT_NR_FILTERS) return -EINVAL; err = audit_del_rule(data, &audit_filter_list[listnr]); if (!err) audit_log(NULL, GFP_KERNEL, AUDIT_CONFIG_CHANGE, "auid=%u removed an audit rule\n", loginuid); break; default: return -EINVAL; } return err; } /* Compare a task_struct with an audit_rule. Return 1 on match, 0 * otherwise. 
*/ static int audit_filter_rules(struct task_struct *tsk, struct audit_rule *rule, struct audit_context *ctx, enum audit_state *state) { int i, j; for (i = 0; i < rule->field_count; i++) { u32 field = rule->fields[i] & ~AUDIT_NEGATE; u32 value = rule->values[i]; int result = 0; switch (field) { case AUDIT_PID: result = (tsk->pid == value); break; case AUDIT_UID: result = (tsk->uid == value); break; case AUDIT_EUID: result = (tsk->euid == value); break; case AUDIT_SUID: result = (tsk->suid == value); break; case AUDIT_FSUID: result = (tsk->fsuid == value); break; case AUDIT_GID: result = (tsk->gid == value); break; case AUDIT_EGID: result = (tsk->egid == value); break; case AUDIT_SGID: result = (tsk->sgid == value); break; case AUDIT_FSGID: result = (tsk->fsgid == value); break; case AUDIT_PERS: result = (tsk->personality == value); break; case AUDIT_ARCH: if (ctx) result = (ctx->arch == value); break; case AUDIT_EXIT: if (ctx && ctx->return_valid) result = (ctx->return_code == value); break; case AUDIT_SUCCESS: if (ctx && ctx->return_valid) { if (value) result = (ctx->return_valid == AUDITSC_SUCCESS); else result = (ctx->return_valid == AUDITSC_FAILURE); } break; case AUDIT_DEVMAJOR: if (ctx) { for (j = 0; j < ctx->name_count; j++) { if (MAJOR(ctx->names[j].dev)==value) { ++result; break; } } } break; case AUDIT_DEVMINOR: if (ctx) { for (j = 0; j < ctx->name_count; j++) { if (MINOR(ctx->names[j].dev)==value) { ++result; break; } } } break; case AUDIT_INODE: if (ctx) { for (j = 0; j < ctx->name_count; j++) { if (ctx->names[j].ino == value) { ++result; break; } } } break; case AUDIT_LOGINUID: result = 0; if (ctx) result = (ctx->loginuid == value); break; case AUDIT_ARG0: case AUDIT_ARG1: case AUDIT_ARG2: case AUDIT_ARG3: if (ctx) result = (ctx->argv[field-AUDIT_ARG0]==value); break; } if (rule->fields[i] & AUDIT_NEGATE) result = !result; if (!result) return 0; } switch (rule->action) { case AUDIT_NEVER: *state = AUDIT_DISABLED; break; case AUDIT_POSSIBLE: *state = 
AUDIT_BUILD_CONTEXT; break; case AUDIT_ALWAYS: *state = AUDIT_RECORD_CONTEXT; break; } return 1; } /* At process creation time, we can determine if system-call auditing is * completely disabled for this task. Since we only have the task * structure at this point, we can only check uid and gid. */ static enum audit_state audit_filter_task(struct task_struct *tsk) { struct audit_entry *e; enum audit_state state; rcu_read_lock(); list_for_each_entry_rcu(e, &audit_filter_list[AUDIT_FILTER_TASK], list) { if (audit_filter_rules(tsk, &e->rule, NULL, &state)) { rcu_read_unlock(); return state; } } rcu_read_unlock(); return AUDIT_BUILD_CONTEXT; } /* At syscall entry and exit time, this filter is called if the * audit_state is not low enough that auditing cannot take place, but is * also not high enough that we already know we have to write an audit * record (i.e., the state is AUDIT_SETUP_CONTEXT or AUDIT_BUILD_CONTEXT). */ static enum audit_state audit_filter_syscall(struct task_struct *tsk, struct audit_context *ctx, struct list_head *list) { struct audit_entry *e; enum audit_state state; if (audit_pid && tsk->tgid == audit_pid) return AUDIT_DISABLED; rcu_read_lock(); if (!list_empty(list)) { int word = AUDIT_WORD(ctx->major); int bit = AUDIT_BIT(ctx->major); list_for_each_entry_rcu(e, list, list) { if ((e->rule.mask[word] & bit) == bit && audit_filter_rules(tsk, &e->rule, ctx, &state)) { rcu_read_unlock(); return state; } } } rcu_read_unlock(); return AUDIT_BUILD_CONTEXT; } static int audit_filter_user_rules(struct netlink_skb_parms *cb, struct audit_rule *rule, enum audit_state *state) { int i; for (i = 0; i < rule->field_count; i++) { u32 field = rule->fields[i] & ~AUDIT_NEGATE; u32 value = rule->values[i]; int result = 0; switch (field) { case AUDIT_PID: result = (cb->creds.pid == value); break; case AUDIT_UID: result = (cb->creds.uid == value); break; case AUDIT_GID: result = (cb->creds.gid == value); break; case AUDIT_LOGINUID: result = (cb->loginuid == value); 
break; } if (rule->fields[i] & AUDIT_NEGATE) result = !result; if (!result) return 0; } switch (rule->action) { case AUDIT_NEVER: *state = AUDIT_DISABLED; break; case AUDIT_POSSIBLE: *state = AUDIT_BUILD_CONTEXT; break; case AUDIT_ALWAYS: *state = AUDIT_RECORD_CONTEXT; break; } return 1; } int audit_filter_user(struct netlink_skb_parms *cb, int type) { struct audit_entry *e; enum audit_state state; int ret = 1; rcu_read_lock(); list_for_each_entry_rcu(e, &audit_filter_list[AUDIT_FILTER_USER], list) { if (audit_filter_user_rules(cb, &e->rule, &state)) { if (state == AUDIT_DISABLED) ret = 0; break; } } rcu_read_unlock(); return ret; /* Audit by default */ } /* This should be called with task_lock() held. */ static inline struct audit_context *audit_get_context(struct task_struct *tsk, int return_valid, int return_code) { struct audit_context *context = tsk->audit_context; if (likely(!context)) return NULL; context->return_valid = return_valid; context->return_code = return_code; if (context->in_syscall && !context->auditable) { enum audit_state state; state = audit_filter_syscall(tsk, context, &audit_filter_list[AUDIT_FILTER_EXIT]); if (state == AUDIT_RECORD_CONTEXT) context->auditable = 1; } context->pid = tsk->pid; context->uid = tsk->uid; context->gid = tsk->gid; context->euid = tsk->euid; context->suid = tsk->suid; context->fsuid = tsk->fsuid; context->egid = tsk->egid; context->sgid = tsk->sgid; context->fsgid = tsk->fsgid; context->personality = tsk->personality; tsk->audit_context = NULL; return context; } static inline void audit_free_names(struct audit_context *context) { int i; #if AUDIT_DEBUG == 2 if (context->auditable ||context->put_count + context->ino_count != context->name_count) { printk(KERN_ERR "audit.c:%d(:%d): major=%d in_syscall=%d" " name_count=%d put_count=%d" " ino_count=%d [NOT freeing]\n", __LINE__, context->serial, context->major, context->in_syscall, context->name_count, context->put_count, context->ino_count); for (i = 0; i < 
context->name_count; i++) printk(KERN_ERR "names[%d] = %p = %s\n", i, context->names[i].name, context->names[i].name); dump_stack(); return; } #endif #if AUDIT_DEBUG context->put_count = 0; context->ino_count = 0; #endif for (i = 0; i < context->name_count; i++) if (context->names[i].name) __putname(context->names[i].name); context->name_count = 0; if (context->pwd) dput(context->pwd); if (context->pwdmnt) mntput(context->pwdmnt); context->pwd = NULL; context->pwdmnt = NULL; } static inline void audit_free_aux(struct audit_context *context) { struct audit_aux_data *aux; while ((aux = context->aux)) { if (aux->type == AUDIT_AVC_PATH) { struct audit_aux_data_path *axi = (void *)aux; dput(axi->dentry); mntput(axi->mnt); } context->aux = aux->next; kfree(aux); } } static inline void audit_zero_context(struct audit_context *context, enum audit_state state) { uid_t loginuid = context->loginuid; memset(context, 0, sizeof(*context)); context->state = state; context->loginuid = loginuid; } static inline struct audit_context *audit_alloc_context(enum audit_state state) { struct audit_context *context; if (!(context = kmalloc(sizeof(*context), GFP_KERNEL))) return NULL; audit_zero_context(context, state); return context; } /* Filter on the task information and allocate a per-task audit context * if necessary. Doing so turns on system call auditing for the * specified task. This is called from copy_process, so no lock is * needed. */ int audit_alloc(struct task_struct *tsk) { struct audit_context *context; enum audit_state state; if (likely(!audit_enabled)) return 0; /* Return if not auditing. 
*/ state = audit_filter_task(tsk); if (likely(state == AUDIT_DISABLED)) return 0; if (!(context = audit_alloc_context(state))) { audit_log_lost("out of memory in audit_alloc"); return -ENOMEM; } /* Preserve login uid */ context->loginuid = -1; if (current->audit_context) context->loginuid = current->audit_context->loginuid; tsk->audit_context = context; set_tsk_thread_flag(tsk, TIF_SYSCALL_AUDIT); return 0; } static inline void audit_free_context(struct audit_context *context) { struct audit_context *previous; int count = 0; do { previous = context->previous; if (previous || (count && count < 10)) { ++count; printk(KERN_ERR "audit(:%d): major=%d name_count=%d:" " freeing multiple contexts (%d)\n", context->serial, context->major, context->name_count, count); } audit_free_names(context); audit_free_aux(context); kfree(context); context = previous; } while (context); if (count >= 10) printk(KERN_ERR "audit: freed %d contexts\n", count); } static void audit_log_task_info(struct audit_buffer *ab) { char name[sizeof(current->comm)]; struct mm_struct *mm = current->mm; struct vm_area_struct *vma; get_task_comm(name, current); audit_log_format(ab, " comm="); audit_log_untrustedstring(ab, name); if (!mm) return; down_read(&mm->mmap_sem); vma = mm->mmap; while (vma) { if ((vma->vm_flags & VM_EXECUTABLE) && vma->vm_file) { audit_log_d_path(ab, "exe=", vma->vm_file->f_dentry, vma->vm_file->f_vfsmnt); break; } vma = vma->vm_next; } up_read(&mm->mmap_sem); } static void audit_log_exit(struct audit_context *context, gfp_t gfp_mask) { int i; struct audit_buffer *ab; struct audit_aux_data *aux; ab = audit_log_start(context, gfp_mask, AUDIT_SYSCALL); if (!ab) return; /* audit_panic has been called */ audit_log_format(ab, "arch=%x syscall=%d", context->arch, context->major); if (context->personality != PER_LINUX) audit_log_format(ab, " per=%lx", context->personality); if (context->return_valid) audit_log_format(ab, " success=%s exit=%ld", 
(context->return_valid==AUDITSC_SUCCESS)?"yes":"no", context->return_code); audit_log_format(ab, " a0=%lx a1=%lx a2=%lx a3=%lx items=%d" " pid=%d auid=%u uid=%u gid=%u" " euid=%u suid=%u fsuid=%u" " egid=%u sgid=%u fsgid=%u", context->argv[0], context->argv[1], context->argv[2], context->argv[3], context->name_count, context->pid, context->loginuid, context->uid, context->gid, context->euid, context->suid, context->fsuid, context->egid, context->sgid, context->fsgid); audit_log_task_info(ab); audit_log_end(ab); for (aux = context->aux; aux; aux = aux->next) { ab = audit_log_start(context, GFP_KERNEL, aux->type); if (!ab) continue; /* audit_panic has been called */ switch (aux->type) { case AUDIT_IPC: { struct audit_aux_data_ipcctl *axi = (void *)aux; audit_log_format(ab, " qbytes=%lx iuid=%u igid=%u mode=%x", axi->qbytes, axi->uid, axi->gid, axi->mode); break; } case AUDIT_SOCKETCALL: { int i; struct audit_aux_data_socketcall *axs = (void *)aux; audit_log_format(ab, "nargs=%d", axs->nargs); for (i=0; i<axs->nargs; i++) audit_log_format(ab, " a%d=%lx", i, axs->args[i]); break; } case AUDIT_SOCKADDR: { struct audit_aux_data_sockaddr *axs = (void *)aux; audit_log_format(ab, "saddr="); audit_log_hex(ab, axs->a, axs->len); break; } case AUDIT_AVC_PATH: { struct audit_aux_data_path *axi = (void *)aux; audit_log_d_path(ab, "path=", axi->dentry, axi->mnt); break; } } audit_log_end(ab); } if (context->pwd && context->pwdmnt) { ab = audit_log_start(context, GFP_KERNEL, AUDIT_CWD); if (ab) { audit_log_d_path(ab, "cwd=", context->pwd, context->pwdmnt); audit_log_end(ab); } } for (i = 0; i < context->name_count; i++) { ab = audit_log_start(context, GFP_KERNEL, AUDIT_PATH); if (!ab) continue; /* audit_panic has been called */ audit_log_format(ab, "item=%d", i); if (context->names[i].name) { audit_log_format(ab, " name="); audit_log_untrustedstring(ab, context->names[i].name); } audit_log_format(ab, " flags=%x\n", context->names[i].flags); if (context->names[i].ino != (unsigned 
long)-1) audit_log_format(ab, " inode=%lu dev=%02x:%02x mode=%#o" " ouid=%u ogid=%u rdev=%02x:%02x", context->names[i].ino, MAJOR(context->names[i].dev), MINOR(context->names[i].dev), context->names[i].mode, context->names[i].uid, context->names[i].gid, MAJOR(context->names[i].rdev), MINOR(context->names[i].rdev)); audit_log_end(ab); } } /* Free a per-task audit context. Called from copy_process and * __put_task_struct. */ void audit_free(struct task_struct *tsk) { struct audit_context *context; task_lock(tsk); context = audit_get_context(tsk, 0, 0); task_unlock(tsk); if (likely(!context)) return; /* Check for system calls that do not go through the exit * function (e.g., exit_group), then free context block. * We use GFP_ATOMIC here because we might be doing this * in the context of the idle thread */ if (context->in_syscall && context->auditable) audit_log_exit(context, GFP_ATOMIC); audit_free_context(context); } /* Fill in audit context at syscall entry. This only happens if the * audit context was created when the task was created and the state or * filters demand the audit context be built. If the state from the * per-task filter or from the per-syscall filter is AUDIT_RECORD_CONTEXT, * then the record will be written at syscall exit time (otherwise, it * will only be written if another part of the kernel requests that it * be written). */ void audit_syscall_entry(struct task_struct *tsk, int arch, int major, unsigned long a1, unsigned long a2, unsigned long a3, unsigned long a4) { struct audit_context *context = tsk->audit_context; enum audit_state state; BUG_ON(!context); /* This happens only on certain architectures that make system * calls in kernel_thread via the entry.S interface, instead of * with direct calls. (If you are porting to a new * architecture, hitting this condition can indicate that you * got the _exit/_leave calls backward in entry.S.) 
* * i386 no * x86_64 no * ppc64 yes (see arch/ppc64/kernel/misc.S) * * This also happens with vm86 emulation in a non-nested manner * (entries without exits), so this case must be caught. */ if (context->in_syscall) { struct audit_context *newctx; #if defined(__NR_vm86) && defined(__NR_vm86old) /* vm86 mode should only be entered once */ if (major == __NR_vm86 || major == __NR_vm86old) return; #endif #if AUDIT_DEBUG printk(KERN_ERR "audit(:%d) pid=%d in syscall=%d;" " entering syscall=%d\n", context->serial, tsk->pid, context->major, major); #endif newctx = audit_alloc_context(context->state); if (newctx) { newctx->previous = context; context = newctx; tsk->audit_context = newctx; } else { /* If we can't alloc a new context, the best we * can do is to leak memory (any pending putname * will be lost). The only other alternative is * to abandon auditing. */ audit_zero_context(context, context->state); } } BUG_ON(context->in_syscall || context->name_count); if (!audit_enabled) return; context->arch = arch; context->major = major; context->argv[0] = a1; context->argv[1] = a2; context->argv[2] = a3; context->argv[3] = a4; state = context->state; if (state == AUDIT_SETUP_CONTEXT || state == AUDIT_BUILD_CONTEXT) state = audit_filter_syscall(tsk, context, &audit_filter_list[AUDIT_FILTER_ENTRY]); if (likely(state == AUDIT_DISABLED)) return; context->serial = 0; context->ctime = CURRENT_TIME; context->in_syscall = 1; context->auditable = !!(state == AUDIT_RECORD_CONTEXT); } /* Tear down after system call. If the audit context has been marked as * auditable (either because of the AUDIT_RECORD_CONTEXT state from * filtering, or because some other part of the kernel write an audit * message), then write out the syscall information. In call cases, * free the names stored from getname(). 
*/ void audit_syscall_exit(struct task_struct *tsk, int valid, long return_code) { struct audit_context *context; get_task_struct(tsk); task_lock(tsk); context = audit_get_context(tsk, valid, return_code); task_unlock(tsk); /* Not having a context here is ok, since the parent may have * called __put_task_struct. */ if (likely(!context)) goto out; if (context->in_syscall && context->auditable) audit_log_exit(context, GFP_KERNEL); context->in_syscall = 0; context->auditable = 0; if (context->previous) { struct audit_context *new_context = context->previous; context->previous = NULL; audit_free_context(context); tsk->audit_context = new_context; } else { audit_free_names(context); audit_free_aux(context); tsk->audit_context = context; } out: put_task_struct(tsk); } /* Add a name to the list. Called from fs/namei.c:getname(). */ void audit_getname(const char *name) { struct audit_context *context = current->audit_context; if (!context || IS_ERR(name) || !name) return; if (!context->in_syscall) { #if AUDIT_DEBUG == 2 printk(KERN_ERR "%s:%d(:%d): ignoring getname(%p)\n", __FILE__, __LINE__, context->serial, name); dump_stack(); #endif return; } BUG_ON(context->name_count >= AUDIT_NAMES); context->names[context->name_count].name = name; context->names[context->name_count].ino = (unsigned long)-1; ++context->name_count; if (!context->pwd) { read_lock(¤t->fs->lock); context->pwd = dget(current->fs->pwd); context->pwdmnt = mntget(current->fs->pwdmnt); read_unlock(¤t->fs->lock); } } /* Intercept a putname request. Called from * include/linux/fs.h:putname(). If we have stored the name from * getname in the audit context, then we delay the putname until syscall * exit. 
*/ void audit_putname(const char *name) { struct audit_context *context = current->audit_context; BUG_ON(!context); if (!context->in_syscall) { #if AUDIT_DEBUG == 2 printk(KERN_ERR "%s:%d(:%d): __putname(%p)\n", __FILE__, __LINE__, context->serial, name); if (context->name_count) { int i; for (i = 0; i < context->name_count; i++) printk(KERN_ERR "name[%d] = %p = %s\n", i, context->names[i].name, context->names[i].name); } #endif __putname(name); } #if AUDIT_DEBUG else { ++context->put_count; if (context->put_count > context->name_count) { printk(KERN_ERR "%s:%d(:%d): major=%d" " in_syscall=%d putname(%p) name_count=%d" " put_count=%d\n", __FILE__, __LINE__, context->serial, context->major, context->in_syscall, name, context->name_count, context->put_count); dump_stack(); } } #endif } /* Store the inode and device from a lookup. Called from * fs/namei.c:path_lookup(). */ void audit_inode(const char *name, const struct inode *inode, unsigned flags) { int idx; struct audit_context *context = current->audit_context; if (!context->in_syscall) return; if (context->name_count && context->names[context->name_count-1].name && context->names[context->name_count-1].name == name) idx = context->name_count - 1; else if (context->name_count > 1 && context->names[context->name_count-2].name && context->names[context->name_count-2].name == name) idx = context->name_count - 2; else { /* FIXME: how much do we care about inodes that have no * associated name? 
*/ if (context->name_count >= AUDIT_NAMES - AUDIT_NAMES_RESERVED) return; idx = context->name_count++; context->names[idx].name = NULL; #if AUDIT_DEBUG ++context->ino_count; #endif } context->names[idx].flags = flags; context->names[idx].ino = inode->i_ino; context->names[idx].dev = inode->i_sb->s_dev; context->names[idx].mode = inode->i_mode; context->names[idx].uid = inode->i_uid; context->names[idx].gid = inode->i_gid; context->names[idx].rdev = inode->i_rdev; } void auditsc_get_stamp(struct audit_context *ctx, struct timespec *t, unsigned int *serial) { if (!ctx->serial) ctx->serial = audit_serial(); t->tv_sec = ctx->ctime.tv_sec; t->tv_nsec = ctx->ctime.tv_nsec; *serial = ctx->serial; ctx->auditable = 1; } int audit_set_loginuid(struct task_struct *task, uid_t loginuid) { if (task->audit_context) { struct audit_buffer *ab; ab = audit_log_start(NULL, GFP_KERNEL, AUDIT_LOGIN); if (ab) { audit_log_format(ab, "login pid=%d uid=%u " "old auid=%u new auid=%u", task->pid, task->uid, task->audit_context->loginuid, loginuid); audit_log_end(ab); } task->audit_context->loginuid = loginuid; } return 0; } uid_t audit_get_loginuid(struct audit_context *ctx) { return ctx ? 
ctx->loginuid : -1; } int audit_ipc_perms(unsigned long qbytes, uid_t uid, gid_t gid, mode_t mode) { struct audit_aux_data_ipcctl *ax; struct audit_context *context = current->audit_context; if (likely(!context)) return 0; ax = kmalloc(sizeof(*ax), GFP_KERNEL); if (!ax) return -ENOMEM; ax->qbytes = qbytes; ax->uid = uid; ax->gid = gid; ax->mode = mode; ax->d.type = AUDIT_IPC; ax->d.next = context->aux; context->aux = (void *)ax; return 0; } int audit_socketcall(int nargs, unsigned long *args) { struct audit_aux_data_socketcall *ax; struct audit_context *context = current->audit_context; if (likely(!context)) return 0; ax = kmalloc(sizeof(*ax) + nargs * sizeof(unsigned long), GFP_KERNEL); if (!ax) return -ENOMEM; ax->nargs = nargs; memcpy(ax->args, args, nargs * sizeof(unsigned long)); ax->d.type = AUDIT_SOCKETCALL; ax->d.next = context->aux; context->aux = (void *)ax; return 0; } int audit_sockaddr(int len, void *a) { struct audit_aux_data_sockaddr *ax; struct audit_context *context = current->audit_context; if (likely(!context)) return 0; ax = kmalloc(sizeof(*ax) + len, GFP_KERNEL); if (!ax) return -ENOMEM; ax->len = len; memcpy(ax->a, a, len); ax->d.type = AUDIT_SOCKADDR; ax->d.next = context->aux; context->aux = (void *)ax; return 0; } int audit_avc_path(struct dentry *dentry, struct vfsmount *mnt) { struct audit_aux_data_path *ax; struct audit_context *context = current->audit_context; if (likely(!context)) return 0; ax = kmalloc(sizeof(*ax), GFP_ATOMIC); if (!ax) return -ENOMEM; ax->dentry = dget(dentry); ax->mnt = mntget(mnt); ax->d.type = AUDIT_AVC_PATH; ax->d.next = context->aux; context->aux = (void *)ax; return 0; } void audit_signal_info(int sig, struct task_struct *t) { extern pid_t audit_sig_pid; extern uid_t audit_sig_uid; if (unlikely(audit_pid && t->tgid == audit_pid)) { if (sig == SIGTERM || sig == SIGHUP) { struct audit_context *ctx = current->audit_context; audit_sig_pid = current->pid; if (ctx) audit_sig_uid = ctx->loginuid; else audit_sig_uid = 
current->uid; } } }