1299 lines
33 KiB
C
1299 lines
33 KiB
C
/* auditsc.c -- System-call auditing support
|
|
* Handles all system-call specific auditing features.
|
|
*
|
|
* Copyright 2003-2004 Red Hat Inc., Durham, North Carolina.
|
|
* All Rights Reserved.
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software
|
|
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
*
|
|
* Written by Rickard E. (Rik) Faith <faith@redhat.com>
|
|
*
|
|
* Many of the ideas implemented here are from Stephen C. Tweedie,
|
|
* especially the idea of avoiding a copy by using getname.
|
|
*
|
|
* The method for actual interception of syscall entry and exit (not in
|
|
* this file -- see entry.S) is based on a GPL'd patch written by
|
|
* okir@suse.de and Copyright 2003 SuSE Linux AG.
|
|
*
|
|
*/
|
|
|
|
#include <linux/init.h>
|
|
#include <asm/atomic.h>
|
|
#include <asm/types.h>
|
|
#include <linux/mm.h>
|
|
#include <linux/module.h>
|
|
#include <linux/mount.h>
|
|
#include <linux/socket.h>
|
|
#include <linux/audit.h>
|
|
#include <linux/personality.h>
|
|
#include <linux/time.h>
|
|
#include <linux/kthread.h>
|
|
#include <linux/netlink.h>
|
|
#include <linux/compiler.h>
|
|
#include <asm/unistd.h>
|
|
|
|
/* 0 = no checking
|
|
1 = put_count checking
|
|
2 = verbose put_count checking
|
|
*/
|
|
#define AUDIT_DEBUG 0
|
|
|
|
/* No syscall auditing will take place unless audit_enabled != 0. */
|
|
extern int audit_enabled;
|
|
|
|
/* AUDIT_NAMES is the number of slots we reserve in the audit_context
|
|
* for saving names from getname(). */
|
|
#define AUDIT_NAMES 20
|
|
|
|
/* AUDIT_NAMES_RESERVED is the number of slots we reserve in the
|
|
* audit_context from being used for nameless inodes from
|
|
* path_lookup. */
|
|
#define AUDIT_NAMES_RESERVED 7
|
|
|
|
/* At task start time, the audit_state is set in the audit_context using
|
|
a per-task filter. At syscall entry, the audit_state is augmented by
|
|
the syscall filter. */
|
|
enum audit_state {
|
|
AUDIT_DISABLED, /* Do not create per-task audit_context.
|
|
* No syscall-specific audit records can
|
|
* be generated. */
|
|
AUDIT_SETUP_CONTEXT, /* Create the per-task audit_context,
|
|
* but don't necessarily fill it in at
|
|
* syscall entry time (i.e., filter
|
|
* instead). */
|
|
AUDIT_BUILD_CONTEXT, /* Create the per-task audit_context,
|
|
* and always fill it in at syscall
|
|
* entry time. This makes a full
|
|
* syscall record available if some
|
|
* other part of the kernel decides it
|
|
* should be recorded. */
|
|
AUDIT_RECORD_CONTEXT /* Create the per-task audit_context,
|
|
* always fill it in at syscall entry
|
|
* time, and always write out the audit
|
|
* record at syscall exit time. */
|
|
};
|
|
|
|
/* When fs/namei.c:getname() is called, we store the pointer in name and
|
|
* we don't let putname() free it (instead we free all of the saved
|
|
* pointers at syscall exit time).
|
|
*
|
|
* Further, in fs/namei.c:path_lookup() we store the inode and device. */
|
|
struct audit_names {
|
|
const char *name;
|
|
unsigned long ino;
|
|
dev_t dev;
|
|
umode_t mode;
|
|
uid_t uid;
|
|
gid_t gid;
|
|
dev_t rdev;
|
|
unsigned flags;
|
|
};
|
|
|
|
struct audit_aux_data {
|
|
struct audit_aux_data *next;
|
|
int type;
|
|
};
|
|
|
|
#define AUDIT_AUX_IPCPERM 0
|
|
|
|
struct audit_aux_data_ipcctl {
|
|
struct audit_aux_data d;
|
|
struct ipc_perm p;
|
|
unsigned long qbytes;
|
|
uid_t uid;
|
|
gid_t gid;
|
|
mode_t mode;
|
|
};
|
|
|
|
struct audit_aux_data_socketcall {
|
|
struct audit_aux_data d;
|
|
int nargs;
|
|
unsigned long args[0];
|
|
};
|
|
|
|
struct audit_aux_data_sockaddr {
|
|
struct audit_aux_data d;
|
|
int len;
|
|
char a[0];
|
|
};
|
|
|
|
struct audit_aux_data_path {
|
|
struct audit_aux_data d;
|
|
struct dentry *dentry;
|
|
struct vfsmount *mnt;
|
|
};
|
|
|
|
/* The per-task audit context. */
|
|
struct audit_context {
|
|
int in_syscall; /* 1 if task is in a syscall */
|
|
enum audit_state state;
|
|
unsigned int serial; /* serial number for record */
|
|
struct timespec ctime; /* time of syscall entry */
|
|
uid_t loginuid; /* login uid (identity) */
|
|
int major; /* syscall number */
|
|
unsigned long argv[4]; /* syscall arguments */
|
|
int return_valid; /* return code is valid */
|
|
long return_code;/* syscall return code */
|
|
int auditable; /* 1 if record should be written */
|
|
int name_count;
|
|
struct audit_names names[AUDIT_NAMES];
|
|
struct dentry * pwd;
|
|
struct vfsmount * pwdmnt;
|
|
struct audit_context *previous; /* For nested syscalls */
|
|
struct audit_aux_data *aux;
|
|
|
|
/* Save things to print about task_struct */
|
|
pid_t pid;
|
|
uid_t uid, euid, suid, fsuid;
|
|
gid_t gid, egid, sgid, fsgid;
|
|
unsigned long personality;
|
|
int arch;
|
|
|
|
#if AUDIT_DEBUG
|
|
int put_count;
|
|
int ino_count;
|
|
#endif
|
|
};
|
|
|
|
/* Public API */
|
|
/* There are three lists of rules -- one to search at task creation
|
|
* time, one to search at syscall entry time, and another to search at
|
|
* syscall exit time. */
|
|
static struct list_head audit_filter_list[AUDIT_NR_FILTERS] = {
|
|
LIST_HEAD_INIT(audit_filter_list[0]),
|
|
LIST_HEAD_INIT(audit_filter_list[1]),
|
|
LIST_HEAD_INIT(audit_filter_list[2]),
|
|
LIST_HEAD_INIT(audit_filter_list[3]),
|
|
LIST_HEAD_INIT(audit_filter_list[4]),
|
|
#if AUDIT_NR_FILTERS != 5
|
|
#error Fix audit_filter_list initialiser
|
|
#endif
|
|
};
|
|
|
|
struct audit_entry {
|
|
struct list_head list;
|
|
struct rcu_head rcu;
|
|
struct audit_rule rule;
|
|
};
|
|
|
|
extern int audit_pid;
|
|
|
|
/* Copy rule from user-space to kernel-space. Called from
|
|
* audit_add_rule during AUDIT_ADD. */
|
|
static inline int audit_copy_rule(struct audit_rule *d, struct audit_rule *s)
|
|
{
|
|
int i;
|
|
|
|
if (s->action != AUDIT_NEVER
|
|
&& s->action != AUDIT_POSSIBLE
|
|
&& s->action != AUDIT_ALWAYS)
|
|
return -1;
|
|
if (s->field_count < 0 || s->field_count > AUDIT_MAX_FIELDS)
|
|
return -1;
|
|
if ((s->flags & ~AUDIT_FILTER_PREPEND) >= AUDIT_NR_FILTERS)
|
|
return -1;
|
|
|
|
d->flags = s->flags;
|
|
d->action = s->action;
|
|
d->field_count = s->field_count;
|
|
for (i = 0; i < d->field_count; i++) {
|
|
d->fields[i] = s->fields[i];
|
|
d->values[i] = s->values[i];
|
|
}
|
|
for (i = 0; i < AUDIT_BITMASK_SIZE; i++) d->mask[i] = s->mask[i];
|
|
return 0;
|
|
}
|
|
|
|
/* Check to see if two rules are identical. It is called from
|
|
* audit_add_rule during AUDIT_ADD and
|
|
* audit_del_rule during AUDIT_DEL. */
|
|
static inline int audit_compare_rule(struct audit_rule *a, struct audit_rule *b)
|
|
{
|
|
int i;
|
|
|
|
if (a->flags != b->flags)
|
|
return 1;
|
|
|
|
if (a->action != b->action)
|
|
return 1;
|
|
|
|
if (a->field_count != b->field_count)
|
|
return 1;
|
|
|
|
for (i = 0; i < a->field_count; i++) {
|
|
if (a->fields[i] != b->fields[i]
|
|
|| a->values[i] != b->values[i])
|
|
return 1;
|
|
}
|
|
|
|
for (i = 0; i < AUDIT_BITMASK_SIZE; i++)
|
|
if (a->mask[i] != b->mask[i])
|
|
return 1;
|
|
|
|
return 0;
|
|
}
|
|
|
|
/* Note that audit_add_rule and audit_del_rule are called via
|
|
* audit_receive() in audit.c, and are protected by
|
|
* audit_netlink_sem. */
|
|
static inline int audit_add_rule(struct audit_rule *rule,
|
|
struct list_head *list)
|
|
{
|
|
struct audit_entry *entry;
|
|
|
|
/* Do not use the _rcu iterator here, since this is the only
|
|
* addition routine. */
|
|
list_for_each_entry(entry, list, list) {
|
|
if (!audit_compare_rule(rule, &entry->rule)) {
|
|
return -EEXIST;
|
|
}
|
|
}
|
|
|
|
if (!(entry = kmalloc(sizeof(*entry), GFP_KERNEL)))
|
|
return -ENOMEM;
|
|
if (audit_copy_rule(&entry->rule, rule)) {
|
|
kfree(entry);
|
|
return -EINVAL;
|
|
}
|
|
|
|
if (entry->rule.flags & AUDIT_FILTER_PREPEND) {
|
|
entry->rule.flags &= ~AUDIT_FILTER_PREPEND;
|
|
list_add_rcu(&entry->list, list);
|
|
} else {
|
|
list_add_tail_rcu(&entry->list, list);
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static inline void audit_free_rule(struct rcu_head *head)
|
|
{
|
|
struct audit_entry *e = container_of(head, struct audit_entry, rcu);
|
|
kfree(e);
|
|
}
|
|
|
|
/* Note that audit_add_rule and audit_del_rule are called via
|
|
* audit_receive() in audit.c, and are protected by
|
|
* audit_netlink_sem. */
|
|
static inline int audit_del_rule(struct audit_rule *rule,
|
|
struct list_head *list)
|
|
{
|
|
struct audit_entry *e;
|
|
|
|
/* Do not use the _rcu iterator here, since this is the only
|
|
* deletion routine. */
|
|
list_for_each_entry(e, list, list) {
|
|
if (!audit_compare_rule(rule, &e->rule)) {
|
|
list_del_rcu(&e->list);
|
|
call_rcu(&e->rcu, audit_free_rule);
|
|
return 0;
|
|
}
|
|
}
|
|
return -ENOENT; /* No matching rule */
|
|
}
|
|
|
|
static int audit_list_rules(void *_dest)
|
|
{
|
|
int pid, seq;
|
|
int *dest = _dest;
|
|
struct audit_entry *entry;
|
|
int i;
|
|
|
|
pid = dest[0];
|
|
seq = dest[1];
|
|
kfree(dest);
|
|
|
|
down(&audit_netlink_sem);
|
|
|
|
/* The *_rcu iterators not needed here because we are
|
|
always called with audit_netlink_sem held. */
|
|
for (i=0; i<AUDIT_NR_FILTERS; i++) {
|
|
list_for_each_entry(entry, &audit_filter_list[i], list)
|
|
audit_send_reply(pid, seq, AUDIT_LIST, 0, 1,
|
|
&entry->rule, sizeof(entry->rule));
|
|
}
|
|
audit_send_reply(pid, seq, AUDIT_LIST, 1, 1, NULL, 0);
|
|
|
|
up(&audit_netlink_sem);
|
|
return 0;
|
|
}
|
|
|
|
int audit_receive_filter(int type, int pid, int uid, int seq, void *data,
|
|
uid_t loginuid)
|
|
{
|
|
struct task_struct *tsk;
|
|
int *dest;
|
|
int err = 0;
|
|
unsigned listnr;
|
|
|
|
switch (type) {
|
|
case AUDIT_LIST:
|
|
/* We can't just spew out the rules here because we might fill
|
|
* the available socket buffer space and deadlock waiting for
|
|
* auditctl to read from it... which isn't ever going to
|
|
* happen if we're actually running in the context of auditctl
|
|
* trying to _send_ the stuff */
|
|
|
|
dest = kmalloc(2 * sizeof(int), GFP_KERNEL);
|
|
if (!dest)
|
|
return -ENOMEM;
|
|
dest[0] = pid;
|
|
dest[1] = seq;
|
|
|
|
tsk = kthread_run(audit_list_rules, dest, "audit_list_rules");
|
|
if (IS_ERR(tsk)) {
|
|
kfree(dest);
|
|
err = PTR_ERR(tsk);
|
|
}
|
|
break;
|
|
case AUDIT_ADD:
|
|
listnr =((struct audit_rule *)data)->flags & ~AUDIT_FILTER_PREPEND;
|
|
if (listnr >= AUDIT_NR_FILTERS)
|
|
return -EINVAL;
|
|
|
|
err = audit_add_rule(data, &audit_filter_list[listnr]);
|
|
if (!err)
|
|
audit_log(NULL, GFP_KERNEL, AUDIT_CONFIG_CHANGE,
|
|
"auid=%u added an audit rule\n", loginuid);
|
|
break;
|
|
case AUDIT_DEL:
|
|
listnr =((struct audit_rule *)data)->flags & ~AUDIT_FILTER_PREPEND;
|
|
if (listnr >= AUDIT_NR_FILTERS)
|
|
return -EINVAL;
|
|
|
|
err = audit_del_rule(data, &audit_filter_list[listnr]);
|
|
if (!err)
|
|
audit_log(NULL, GFP_KERNEL, AUDIT_CONFIG_CHANGE,
|
|
"auid=%u removed an audit rule\n", loginuid);
|
|
break;
|
|
default:
|
|
return -EINVAL;
|
|
}
|
|
|
|
return err;
|
|
}
|
|
|
|
/* Compare a task_struct with an audit_rule. Return 1 on match, 0
|
|
* otherwise. */
|
|
static int audit_filter_rules(struct task_struct *tsk,
|
|
struct audit_rule *rule,
|
|
struct audit_context *ctx,
|
|
enum audit_state *state)
|
|
{
|
|
int i, j;
|
|
|
|
for (i = 0; i < rule->field_count; i++) {
|
|
u32 field = rule->fields[i] & ~AUDIT_NEGATE;
|
|
u32 value = rule->values[i];
|
|
int result = 0;
|
|
|
|
switch (field) {
|
|
case AUDIT_PID:
|
|
result = (tsk->pid == value);
|
|
break;
|
|
case AUDIT_UID:
|
|
result = (tsk->uid == value);
|
|
break;
|
|
case AUDIT_EUID:
|
|
result = (tsk->euid == value);
|
|
break;
|
|
case AUDIT_SUID:
|
|
result = (tsk->suid == value);
|
|
break;
|
|
case AUDIT_FSUID:
|
|
result = (tsk->fsuid == value);
|
|
break;
|
|
case AUDIT_GID:
|
|
result = (tsk->gid == value);
|
|
break;
|
|
case AUDIT_EGID:
|
|
result = (tsk->egid == value);
|
|
break;
|
|
case AUDIT_SGID:
|
|
result = (tsk->sgid == value);
|
|
break;
|
|
case AUDIT_FSGID:
|
|
result = (tsk->fsgid == value);
|
|
break;
|
|
case AUDIT_PERS:
|
|
result = (tsk->personality == value);
|
|
break;
|
|
case AUDIT_ARCH:
|
|
if (ctx)
|
|
result = (ctx->arch == value);
|
|
break;
|
|
|
|
case AUDIT_EXIT:
|
|
if (ctx && ctx->return_valid)
|
|
result = (ctx->return_code == value);
|
|
break;
|
|
case AUDIT_SUCCESS:
|
|
if (ctx && ctx->return_valid) {
|
|
if (value)
|
|
result = (ctx->return_valid == AUDITSC_SUCCESS);
|
|
else
|
|
result = (ctx->return_valid == AUDITSC_FAILURE);
|
|
}
|
|
break;
|
|
case AUDIT_DEVMAJOR:
|
|
if (ctx) {
|
|
for (j = 0; j < ctx->name_count; j++) {
|
|
if (MAJOR(ctx->names[j].dev)==value) {
|
|
++result;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
break;
|
|
case AUDIT_DEVMINOR:
|
|
if (ctx) {
|
|
for (j = 0; j < ctx->name_count; j++) {
|
|
if (MINOR(ctx->names[j].dev)==value) {
|
|
++result;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
break;
|
|
case AUDIT_INODE:
|
|
if (ctx) {
|
|
for (j = 0; j < ctx->name_count; j++) {
|
|
if (ctx->names[j].ino == value) {
|
|
++result;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
break;
|
|
case AUDIT_LOGINUID:
|
|
result = 0;
|
|
if (ctx)
|
|
result = (ctx->loginuid == value);
|
|
break;
|
|
case AUDIT_ARG0:
|
|
case AUDIT_ARG1:
|
|
case AUDIT_ARG2:
|
|
case AUDIT_ARG3:
|
|
if (ctx)
|
|
result = (ctx->argv[field-AUDIT_ARG0]==value);
|
|
break;
|
|
}
|
|
|
|
if (rule->fields[i] & AUDIT_NEGATE)
|
|
result = !result;
|
|
if (!result)
|
|
return 0;
|
|
}
|
|
switch (rule->action) {
|
|
case AUDIT_NEVER: *state = AUDIT_DISABLED; break;
|
|
case AUDIT_POSSIBLE: *state = AUDIT_BUILD_CONTEXT; break;
|
|
case AUDIT_ALWAYS: *state = AUDIT_RECORD_CONTEXT; break;
|
|
}
|
|
return 1;
|
|
}
|
|
|
|
/* At process creation time, we can determine if system-call auditing is
|
|
* completely disabled for this task. Since we only have the task
|
|
* structure at this point, we can only check uid and gid.
|
|
*/
|
|
static enum audit_state audit_filter_task(struct task_struct *tsk)
|
|
{
|
|
struct audit_entry *e;
|
|
enum audit_state state;
|
|
|
|
rcu_read_lock();
|
|
list_for_each_entry_rcu(e, &audit_filter_list[AUDIT_FILTER_TASK], list) {
|
|
if (audit_filter_rules(tsk, &e->rule, NULL, &state)) {
|
|
rcu_read_unlock();
|
|
return state;
|
|
}
|
|
}
|
|
rcu_read_unlock();
|
|
return AUDIT_BUILD_CONTEXT;
|
|
}
|
|
|
|
/* At syscall entry and exit time, this filter is called if the
|
|
* audit_state is not low enough that auditing cannot take place, but is
|
|
* also not high enough that we already know we have to write an audit
|
|
* record (i.e., the state is AUDIT_SETUP_CONTEXT or AUDIT_BUILD_CONTEXT).
|
|
*/
|
|
static enum audit_state audit_filter_syscall(struct task_struct *tsk,
|
|
struct audit_context *ctx,
|
|
struct list_head *list)
|
|
{
|
|
struct audit_entry *e;
|
|
enum audit_state state;
|
|
|
|
if (audit_pid && tsk->tgid == audit_pid)
|
|
return AUDIT_DISABLED;
|
|
|
|
rcu_read_lock();
|
|
if (!list_empty(list)) {
|
|
int word = AUDIT_WORD(ctx->major);
|
|
int bit = AUDIT_BIT(ctx->major);
|
|
|
|
list_for_each_entry_rcu(e, list, list) {
|
|
if ((e->rule.mask[word] & bit) == bit
|
|
&& audit_filter_rules(tsk, &e->rule, ctx, &state)) {
|
|
rcu_read_unlock();
|
|
return state;
|
|
}
|
|
}
|
|
}
|
|
rcu_read_unlock();
|
|
return AUDIT_BUILD_CONTEXT;
|
|
}
|
|
|
|
static int audit_filter_user_rules(struct netlink_skb_parms *cb,
|
|
struct audit_rule *rule,
|
|
enum audit_state *state)
|
|
{
|
|
int i;
|
|
|
|
for (i = 0; i < rule->field_count; i++) {
|
|
u32 field = rule->fields[i] & ~AUDIT_NEGATE;
|
|
u32 value = rule->values[i];
|
|
int result = 0;
|
|
|
|
switch (field) {
|
|
case AUDIT_PID:
|
|
result = (cb->creds.pid == value);
|
|
break;
|
|
case AUDIT_UID:
|
|
result = (cb->creds.uid == value);
|
|
break;
|
|
case AUDIT_GID:
|
|
result = (cb->creds.gid == value);
|
|
break;
|
|
case AUDIT_LOGINUID:
|
|
result = (cb->loginuid == value);
|
|
break;
|
|
}
|
|
|
|
if (rule->fields[i] & AUDIT_NEGATE)
|
|
result = !result;
|
|
if (!result)
|
|
return 0;
|
|
}
|
|
switch (rule->action) {
|
|
case AUDIT_NEVER: *state = AUDIT_DISABLED; break;
|
|
case AUDIT_POSSIBLE: *state = AUDIT_BUILD_CONTEXT; break;
|
|
case AUDIT_ALWAYS: *state = AUDIT_RECORD_CONTEXT; break;
|
|
}
|
|
return 1;
|
|
}
|
|
|
|
int audit_filter_user(struct netlink_skb_parms *cb, int type)
|
|
{
|
|
struct audit_entry *e;
|
|
enum audit_state state;
|
|
int ret = 1;
|
|
|
|
rcu_read_lock();
|
|
list_for_each_entry_rcu(e, &audit_filter_list[AUDIT_FILTER_USER], list) {
|
|
if (audit_filter_user_rules(cb, &e->rule, &state)) {
|
|
if (state == AUDIT_DISABLED)
|
|
ret = 0;
|
|
break;
|
|
}
|
|
}
|
|
rcu_read_unlock();
|
|
|
|
return ret; /* Audit by default */
|
|
}
|
|
|
|
/* This should be called with task_lock() held. */
|
|
static inline struct audit_context *audit_get_context(struct task_struct *tsk,
|
|
int return_valid,
|
|
int return_code)
|
|
{
|
|
struct audit_context *context = tsk->audit_context;
|
|
|
|
if (likely(!context))
|
|
return NULL;
|
|
context->return_valid = return_valid;
|
|
context->return_code = return_code;
|
|
|
|
if (context->in_syscall && !context->auditable) {
|
|
enum audit_state state;
|
|
state = audit_filter_syscall(tsk, context, &audit_filter_list[AUDIT_FILTER_EXIT]);
|
|
if (state == AUDIT_RECORD_CONTEXT)
|
|
context->auditable = 1;
|
|
}
|
|
|
|
context->pid = tsk->pid;
|
|
context->uid = tsk->uid;
|
|
context->gid = tsk->gid;
|
|
context->euid = tsk->euid;
|
|
context->suid = tsk->suid;
|
|
context->fsuid = tsk->fsuid;
|
|
context->egid = tsk->egid;
|
|
context->sgid = tsk->sgid;
|
|
context->fsgid = tsk->fsgid;
|
|
context->personality = tsk->personality;
|
|
tsk->audit_context = NULL;
|
|
return context;
|
|
}
|
|
|
|
static inline void audit_free_names(struct audit_context *context)
|
|
{
|
|
int i;
|
|
|
|
#if AUDIT_DEBUG == 2
|
|
if (context->auditable
|
|
||context->put_count + context->ino_count != context->name_count) {
|
|
printk(KERN_ERR "audit.c:%d(:%d): major=%d in_syscall=%d"
|
|
" name_count=%d put_count=%d"
|
|
" ino_count=%d [NOT freeing]\n",
|
|
__LINE__,
|
|
context->serial, context->major, context->in_syscall,
|
|
context->name_count, context->put_count,
|
|
context->ino_count);
|
|
for (i = 0; i < context->name_count; i++)
|
|
printk(KERN_ERR "names[%d] = %p = %s\n", i,
|
|
context->names[i].name,
|
|
context->names[i].name);
|
|
dump_stack();
|
|
return;
|
|
}
|
|
#endif
|
|
#if AUDIT_DEBUG
|
|
context->put_count = 0;
|
|
context->ino_count = 0;
|
|
#endif
|
|
|
|
for (i = 0; i < context->name_count; i++)
|
|
if (context->names[i].name)
|
|
__putname(context->names[i].name);
|
|
context->name_count = 0;
|
|
if (context->pwd)
|
|
dput(context->pwd);
|
|
if (context->pwdmnt)
|
|
mntput(context->pwdmnt);
|
|
context->pwd = NULL;
|
|
context->pwdmnt = NULL;
|
|
}
|
|
|
|
static inline void audit_free_aux(struct audit_context *context)
|
|
{
|
|
struct audit_aux_data *aux;
|
|
|
|
while ((aux = context->aux)) {
|
|
if (aux->type == AUDIT_AVC_PATH) {
|
|
struct audit_aux_data_path *axi = (void *)aux;
|
|
dput(axi->dentry);
|
|
mntput(axi->mnt);
|
|
}
|
|
context->aux = aux->next;
|
|
kfree(aux);
|
|
}
|
|
}
|
|
|
|
static inline void audit_zero_context(struct audit_context *context,
|
|
enum audit_state state)
|
|
{
|
|
uid_t loginuid = context->loginuid;
|
|
|
|
memset(context, 0, sizeof(*context));
|
|
context->state = state;
|
|
context->loginuid = loginuid;
|
|
}
|
|
|
|
static inline struct audit_context *audit_alloc_context(enum audit_state state)
|
|
{
|
|
struct audit_context *context;
|
|
|
|
if (!(context = kmalloc(sizeof(*context), GFP_KERNEL)))
|
|
return NULL;
|
|
audit_zero_context(context, state);
|
|
return context;
|
|
}
|
|
|
|
/* Filter on the task information and allocate a per-task audit context
|
|
* if necessary. Doing so turns on system call auditing for the
|
|
* specified task. This is called from copy_process, so no lock is
|
|
* needed. */
|
|
int audit_alloc(struct task_struct *tsk)
|
|
{
|
|
struct audit_context *context;
|
|
enum audit_state state;
|
|
|
|
if (likely(!audit_enabled))
|
|
return 0; /* Return if not auditing. */
|
|
|
|
state = audit_filter_task(tsk);
|
|
if (likely(state == AUDIT_DISABLED))
|
|
return 0;
|
|
|
|
if (!(context = audit_alloc_context(state))) {
|
|
audit_log_lost("out of memory in audit_alloc");
|
|
return -ENOMEM;
|
|
}
|
|
|
|
/* Preserve login uid */
|
|
context->loginuid = -1;
|
|
if (current->audit_context)
|
|
context->loginuid = current->audit_context->loginuid;
|
|
|
|
tsk->audit_context = context;
|
|
set_tsk_thread_flag(tsk, TIF_SYSCALL_AUDIT);
|
|
return 0;
|
|
}
|
|
|
|
static inline void audit_free_context(struct audit_context *context)
|
|
{
|
|
struct audit_context *previous;
|
|
int count = 0;
|
|
|
|
do {
|
|
previous = context->previous;
|
|
if (previous || (count && count < 10)) {
|
|
++count;
|
|
printk(KERN_ERR "audit(:%d): major=%d name_count=%d:"
|
|
" freeing multiple contexts (%d)\n",
|
|
context->serial, context->major,
|
|
context->name_count, count);
|
|
}
|
|
audit_free_names(context);
|
|
audit_free_aux(context);
|
|
kfree(context);
|
|
context = previous;
|
|
} while (context);
|
|
if (count >= 10)
|
|
printk(KERN_ERR "audit: freed %d contexts\n", count);
|
|
}
|
|
|
|
static void audit_log_task_info(struct audit_buffer *ab)
|
|
{
|
|
char name[sizeof(current->comm)];
|
|
struct mm_struct *mm = current->mm;
|
|
struct vm_area_struct *vma;
|
|
|
|
get_task_comm(name, current);
|
|
audit_log_format(ab, " comm=");
|
|
audit_log_untrustedstring(ab, name);
|
|
|
|
if (!mm)
|
|
return;
|
|
|
|
down_read(&mm->mmap_sem);
|
|
vma = mm->mmap;
|
|
while (vma) {
|
|
if ((vma->vm_flags & VM_EXECUTABLE) &&
|
|
vma->vm_file) {
|
|
audit_log_d_path(ab, "exe=",
|
|
vma->vm_file->f_dentry,
|
|
vma->vm_file->f_vfsmnt);
|
|
break;
|
|
}
|
|
vma = vma->vm_next;
|
|
}
|
|
up_read(&mm->mmap_sem);
|
|
}
|
|
|
|
static void audit_log_exit(struct audit_context *context, gfp_t gfp_mask)
|
|
{
|
|
int i;
|
|
struct audit_buffer *ab;
|
|
struct audit_aux_data *aux;
|
|
|
|
ab = audit_log_start(context, gfp_mask, AUDIT_SYSCALL);
|
|
if (!ab)
|
|
return; /* audit_panic has been called */
|
|
audit_log_format(ab, "arch=%x syscall=%d",
|
|
context->arch, context->major);
|
|
if (context->personality != PER_LINUX)
|
|
audit_log_format(ab, " per=%lx", context->personality);
|
|
if (context->return_valid)
|
|
audit_log_format(ab, " success=%s exit=%ld",
|
|
(context->return_valid==AUDITSC_SUCCESS)?"yes":"no",
|
|
context->return_code);
|
|
audit_log_format(ab,
|
|
" a0=%lx a1=%lx a2=%lx a3=%lx items=%d"
|
|
" pid=%d auid=%u uid=%u gid=%u"
|
|
" euid=%u suid=%u fsuid=%u"
|
|
" egid=%u sgid=%u fsgid=%u",
|
|
context->argv[0],
|
|
context->argv[1],
|
|
context->argv[2],
|
|
context->argv[3],
|
|
context->name_count,
|
|
context->pid,
|
|
context->loginuid,
|
|
context->uid,
|
|
context->gid,
|
|
context->euid, context->suid, context->fsuid,
|
|
context->egid, context->sgid, context->fsgid);
|
|
audit_log_task_info(ab);
|
|
audit_log_end(ab);
|
|
|
|
for (aux = context->aux; aux; aux = aux->next) {
|
|
|
|
ab = audit_log_start(context, GFP_KERNEL, aux->type);
|
|
if (!ab)
|
|
continue; /* audit_panic has been called */
|
|
|
|
switch (aux->type) {
|
|
case AUDIT_IPC: {
|
|
struct audit_aux_data_ipcctl *axi = (void *)aux;
|
|
audit_log_format(ab,
|
|
" qbytes=%lx iuid=%u igid=%u mode=%x",
|
|
axi->qbytes, axi->uid, axi->gid, axi->mode);
|
|
break; }
|
|
|
|
case AUDIT_SOCKETCALL: {
|
|
int i;
|
|
struct audit_aux_data_socketcall *axs = (void *)aux;
|
|
audit_log_format(ab, "nargs=%d", axs->nargs);
|
|
for (i=0; i<axs->nargs; i++)
|
|
audit_log_format(ab, " a%d=%lx", i, axs->args[i]);
|
|
break; }
|
|
|
|
case AUDIT_SOCKADDR: {
|
|
struct audit_aux_data_sockaddr *axs = (void *)aux;
|
|
|
|
audit_log_format(ab, "saddr=");
|
|
audit_log_hex(ab, axs->a, axs->len);
|
|
break; }
|
|
|
|
case AUDIT_AVC_PATH: {
|
|
struct audit_aux_data_path *axi = (void *)aux;
|
|
audit_log_d_path(ab, "path=", axi->dentry, axi->mnt);
|
|
break; }
|
|
|
|
}
|
|
audit_log_end(ab);
|
|
}
|
|
|
|
if (context->pwd && context->pwdmnt) {
|
|
ab = audit_log_start(context, GFP_KERNEL, AUDIT_CWD);
|
|
if (ab) {
|
|
audit_log_d_path(ab, "cwd=", context->pwd, context->pwdmnt);
|
|
audit_log_end(ab);
|
|
}
|
|
}
|
|
for (i = 0; i < context->name_count; i++) {
|
|
ab = audit_log_start(context, GFP_KERNEL, AUDIT_PATH);
|
|
if (!ab)
|
|
continue; /* audit_panic has been called */
|
|
|
|
audit_log_format(ab, "item=%d", i);
|
|
if (context->names[i].name) {
|
|
audit_log_format(ab, " name=");
|
|
audit_log_untrustedstring(ab, context->names[i].name);
|
|
}
|
|
audit_log_format(ab, " flags=%x\n", context->names[i].flags);
|
|
|
|
if (context->names[i].ino != (unsigned long)-1)
|
|
audit_log_format(ab, " inode=%lu dev=%02x:%02x mode=%#o"
|
|
" ouid=%u ogid=%u rdev=%02x:%02x",
|
|
context->names[i].ino,
|
|
MAJOR(context->names[i].dev),
|
|
MINOR(context->names[i].dev),
|
|
context->names[i].mode,
|
|
context->names[i].uid,
|
|
context->names[i].gid,
|
|
MAJOR(context->names[i].rdev),
|
|
MINOR(context->names[i].rdev));
|
|
audit_log_end(ab);
|
|
}
|
|
}
|
|
|
|
/* Free a per-task audit context. Called from copy_process and
|
|
* __put_task_struct. */
|
|
void audit_free(struct task_struct *tsk)
|
|
{
|
|
struct audit_context *context;
|
|
|
|
task_lock(tsk);
|
|
context = audit_get_context(tsk, 0, 0);
|
|
task_unlock(tsk);
|
|
|
|
if (likely(!context))
|
|
return;
|
|
|
|
/* Check for system calls that do not go through the exit
|
|
* function (e.g., exit_group), then free context block.
|
|
* We use GFP_ATOMIC here because we might be doing this
|
|
* in the context of the idle thread */
|
|
if (context->in_syscall && context->auditable)
|
|
audit_log_exit(context, GFP_ATOMIC);
|
|
|
|
audit_free_context(context);
|
|
}
|
|
|
|
/* Fill in audit context at syscall entry. This only happens if the
|
|
* audit context was created when the task was created and the state or
|
|
* filters demand the audit context be built. If the state from the
|
|
* per-task filter or from the per-syscall filter is AUDIT_RECORD_CONTEXT,
|
|
* then the record will be written at syscall exit time (otherwise, it
|
|
* will only be written if another part of the kernel requests that it
|
|
* be written). */
|
|
void audit_syscall_entry(struct task_struct *tsk, int arch, int major,
|
|
unsigned long a1, unsigned long a2,
|
|
unsigned long a3, unsigned long a4)
|
|
{
|
|
struct audit_context *context = tsk->audit_context;
|
|
enum audit_state state;
|
|
|
|
BUG_ON(!context);
|
|
|
|
/* This happens only on certain architectures that make system
|
|
* calls in kernel_thread via the entry.S interface, instead of
|
|
* with direct calls. (If you are porting to a new
|
|
* architecture, hitting this condition can indicate that you
|
|
* got the _exit/_leave calls backward in entry.S.)
|
|
*
|
|
* i386 no
|
|
* x86_64 no
|
|
* ppc64 yes (see arch/ppc64/kernel/misc.S)
|
|
*
|
|
* This also happens with vm86 emulation in a non-nested manner
|
|
* (entries without exits), so this case must be caught.
|
|
*/
|
|
if (context->in_syscall) {
|
|
struct audit_context *newctx;
|
|
|
|
#if defined(__NR_vm86) && defined(__NR_vm86old)
|
|
/* vm86 mode should only be entered once */
|
|
if (major == __NR_vm86 || major == __NR_vm86old)
|
|
return;
|
|
#endif
|
|
#if AUDIT_DEBUG
|
|
printk(KERN_ERR
|
|
"audit(:%d) pid=%d in syscall=%d;"
|
|
" entering syscall=%d\n",
|
|
context->serial, tsk->pid, context->major, major);
|
|
#endif
|
|
newctx = audit_alloc_context(context->state);
|
|
if (newctx) {
|
|
newctx->previous = context;
|
|
context = newctx;
|
|
tsk->audit_context = newctx;
|
|
} else {
|
|
/* If we can't alloc a new context, the best we
|
|
* can do is to leak memory (any pending putname
|
|
* will be lost). The only other alternative is
|
|
* to abandon auditing. */
|
|
audit_zero_context(context, context->state);
|
|
}
|
|
}
|
|
BUG_ON(context->in_syscall || context->name_count);
|
|
|
|
if (!audit_enabled)
|
|
return;
|
|
|
|
context->arch = arch;
|
|
context->major = major;
|
|
context->argv[0] = a1;
|
|
context->argv[1] = a2;
|
|
context->argv[2] = a3;
|
|
context->argv[3] = a4;
|
|
|
|
state = context->state;
|
|
if (state == AUDIT_SETUP_CONTEXT || state == AUDIT_BUILD_CONTEXT)
|
|
state = audit_filter_syscall(tsk, context, &audit_filter_list[AUDIT_FILTER_ENTRY]);
|
|
if (likely(state == AUDIT_DISABLED))
|
|
return;
|
|
|
|
context->serial = 0;
|
|
context->ctime = CURRENT_TIME;
|
|
context->in_syscall = 1;
|
|
context->auditable = !!(state == AUDIT_RECORD_CONTEXT);
|
|
}
|
|
|
|
/* Tear down after system call. If the audit context has been marked as
|
|
* auditable (either because of the AUDIT_RECORD_CONTEXT state from
|
|
* filtering, or because some other part of the kernel write an audit
|
|
* message), then write out the syscall information. In call cases,
|
|
* free the names stored from getname(). */
|
|
void audit_syscall_exit(struct task_struct *tsk, int valid, long return_code)
|
|
{
|
|
struct audit_context *context;
|
|
|
|
get_task_struct(tsk);
|
|
task_lock(tsk);
|
|
context = audit_get_context(tsk, valid, return_code);
|
|
task_unlock(tsk);
|
|
|
|
/* Not having a context here is ok, since the parent may have
|
|
* called __put_task_struct. */
|
|
if (likely(!context))
|
|
goto out;
|
|
|
|
if (context->in_syscall && context->auditable)
|
|
audit_log_exit(context, GFP_KERNEL);
|
|
|
|
context->in_syscall = 0;
|
|
context->auditable = 0;
|
|
|
|
if (context->previous) {
|
|
struct audit_context *new_context = context->previous;
|
|
context->previous = NULL;
|
|
audit_free_context(context);
|
|
tsk->audit_context = new_context;
|
|
} else {
|
|
audit_free_names(context);
|
|
audit_free_aux(context);
|
|
tsk->audit_context = context;
|
|
}
|
|
out:
|
|
put_task_struct(tsk);
|
|
}
|
|
|
|
/* Add a name to the list. Called from fs/namei.c:getname(). */
|
|
void audit_getname(const char *name)
|
|
{
|
|
struct audit_context *context = current->audit_context;
|
|
|
|
if (!context || IS_ERR(name) || !name)
|
|
return;
|
|
|
|
if (!context->in_syscall) {
|
|
#if AUDIT_DEBUG == 2
|
|
printk(KERN_ERR "%s:%d(:%d): ignoring getname(%p)\n",
|
|
__FILE__, __LINE__, context->serial, name);
|
|
dump_stack();
|
|
#endif
|
|
return;
|
|
}
|
|
BUG_ON(context->name_count >= AUDIT_NAMES);
|
|
context->names[context->name_count].name = name;
|
|
context->names[context->name_count].ino = (unsigned long)-1;
|
|
++context->name_count;
|
|
if (!context->pwd) {
|
|
read_lock(¤t->fs->lock);
|
|
context->pwd = dget(current->fs->pwd);
|
|
context->pwdmnt = mntget(current->fs->pwdmnt);
|
|
read_unlock(¤t->fs->lock);
|
|
}
|
|
|
|
}
|
|
|
|
/* Intercept a putname request. Called from
|
|
* include/linux/fs.h:putname(). If we have stored the name from
|
|
* getname in the audit context, then we delay the putname until syscall
|
|
* exit. */
|
|
void audit_putname(const char *name)
|
|
{
|
|
struct audit_context *context = current->audit_context;
|
|
|
|
BUG_ON(!context);
|
|
if (!context->in_syscall) {
|
|
#if AUDIT_DEBUG == 2
|
|
printk(KERN_ERR "%s:%d(:%d): __putname(%p)\n",
|
|
__FILE__, __LINE__, context->serial, name);
|
|
if (context->name_count) {
|
|
int i;
|
|
for (i = 0; i < context->name_count; i++)
|
|
printk(KERN_ERR "name[%d] = %p = %s\n", i,
|
|
context->names[i].name,
|
|
context->names[i].name);
|
|
}
|
|
#endif
|
|
__putname(name);
|
|
}
|
|
#if AUDIT_DEBUG
|
|
else {
|
|
++context->put_count;
|
|
if (context->put_count > context->name_count) {
|
|
printk(KERN_ERR "%s:%d(:%d): major=%d"
|
|
" in_syscall=%d putname(%p) name_count=%d"
|
|
" put_count=%d\n",
|
|
__FILE__, __LINE__,
|
|
context->serial, context->major,
|
|
context->in_syscall, name, context->name_count,
|
|
context->put_count);
|
|
dump_stack();
|
|
}
|
|
}
|
|
#endif
|
|
}
|
|
|
|
/* Store the inode and device from a lookup. Called from
|
|
* fs/namei.c:path_lookup(). */
|
|
void audit_inode(const char *name, const struct inode *inode, unsigned flags)
|
|
{
|
|
int idx;
|
|
struct audit_context *context = current->audit_context;
|
|
|
|
if (!context->in_syscall)
|
|
return;
|
|
if (context->name_count
|
|
&& context->names[context->name_count-1].name
|
|
&& context->names[context->name_count-1].name == name)
|
|
idx = context->name_count - 1;
|
|
else if (context->name_count > 1
|
|
&& context->names[context->name_count-2].name
|
|
&& context->names[context->name_count-2].name == name)
|
|
idx = context->name_count - 2;
|
|
else {
|
|
/* FIXME: how much do we care about inodes that have no
|
|
* associated name? */
|
|
if (context->name_count >= AUDIT_NAMES - AUDIT_NAMES_RESERVED)
|
|
return;
|
|
idx = context->name_count++;
|
|
context->names[idx].name = NULL;
|
|
#if AUDIT_DEBUG
|
|
++context->ino_count;
|
|
#endif
|
|
}
|
|
context->names[idx].flags = flags;
|
|
context->names[idx].ino = inode->i_ino;
|
|
context->names[idx].dev = inode->i_sb->s_dev;
|
|
context->names[idx].mode = inode->i_mode;
|
|
context->names[idx].uid = inode->i_uid;
|
|
context->names[idx].gid = inode->i_gid;
|
|
context->names[idx].rdev = inode->i_rdev;
|
|
}
|
|
|
|
void auditsc_get_stamp(struct audit_context *ctx,
|
|
struct timespec *t, unsigned int *serial)
|
|
{
|
|
if (!ctx->serial)
|
|
ctx->serial = audit_serial();
|
|
t->tv_sec = ctx->ctime.tv_sec;
|
|
t->tv_nsec = ctx->ctime.tv_nsec;
|
|
*serial = ctx->serial;
|
|
ctx->auditable = 1;
|
|
}
|
|
|
|
int audit_set_loginuid(struct task_struct *task, uid_t loginuid)
|
|
{
|
|
if (task->audit_context) {
|
|
struct audit_buffer *ab;
|
|
|
|
ab = audit_log_start(NULL, GFP_KERNEL, AUDIT_LOGIN);
|
|
if (ab) {
|
|
audit_log_format(ab, "login pid=%d uid=%u "
|
|
"old auid=%u new auid=%u",
|
|
task->pid, task->uid,
|
|
task->audit_context->loginuid, loginuid);
|
|
audit_log_end(ab);
|
|
}
|
|
task->audit_context->loginuid = loginuid;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
uid_t audit_get_loginuid(struct audit_context *ctx)
|
|
{
|
|
return ctx ? ctx->loginuid : -1;
|
|
}
|
|
|
|
int audit_ipc_perms(unsigned long qbytes, uid_t uid, gid_t gid, mode_t mode)
|
|
{
|
|
struct audit_aux_data_ipcctl *ax;
|
|
struct audit_context *context = current->audit_context;
|
|
|
|
if (likely(!context))
|
|
return 0;
|
|
|
|
ax = kmalloc(sizeof(*ax), GFP_KERNEL);
|
|
if (!ax)
|
|
return -ENOMEM;
|
|
|
|
ax->qbytes = qbytes;
|
|
ax->uid = uid;
|
|
ax->gid = gid;
|
|
ax->mode = mode;
|
|
|
|
ax->d.type = AUDIT_IPC;
|
|
ax->d.next = context->aux;
|
|
context->aux = (void *)ax;
|
|
return 0;
|
|
}
|
|
|
|
int audit_socketcall(int nargs, unsigned long *args)
|
|
{
|
|
struct audit_aux_data_socketcall *ax;
|
|
struct audit_context *context = current->audit_context;
|
|
|
|
if (likely(!context))
|
|
return 0;
|
|
|
|
ax = kmalloc(sizeof(*ax) + nargs * sizeof(unsigned long), GFP_KERNEL);
|
|
if (!ax)
|
|
return -ENOMEM;
|
|
|
|
ax->nargs = nargs;
|
|
memcpy(ax->args, args, nargs * sizeof(unsigned long));
|
|
|
|
ax->d.type = AUDIT_SOCKETCALL;
|
|
ax->d.next = context->aux;
|
|
context->aux = (void *)ax;
|
|
return 0;
|
|
}
|
|
|
|
int audit_sockaddr(int len, void *a)
|
|
{
|
|
struct audit_aux_data_sockaddr *ax;
|
|
struct audit_context *context = current->audit_context;
|
|
|
|
if (likely(!context))
|
|
return 0;
|
|
|
|
ax = kmalloc(sizeof(*ax) + len, GFP_KERNEL);
|
|
if (!ax)
|
|
return -ENOMEM;
|
|
|
|
ax->len = len;
|
|
memcpy(ax->a, a, len);
|
|
|
|
ax->d.type = AUDIT_SOCKADDR;
|
|
ax->d.next = context->aux;
|
|
context->aux = (void *)ax;
|
|
return 0;
|
|
}
|
|
|
|
int audit_avc_path(struct dentry *dentry, struct vfsmount *mnt)
|
|
{
|
|
struct audit_aux_data_path *ax;
|
|
struct audit_context *context = current->audit_context;
|
|
|
|
if (likely(!context))
|
|
return 0;
|
|
|
|
ax = kmalloc(sizeof(*ax), GFP_ATOMIC);
|
|
if (!ax)
|
|
return -ENOMEM;
|
|
|
|
ax->dentry = dget(dentry);
|
|
ax->mnt = mntget(mnt);
|
|
|
|
ax->d.type = AUDIT_AVC_PATH;
|
|
ax->d.next = context->aux;
|
|
context->aux = (void *)ax;
|
|
return 0;
|
|
}
|
|
|
|
void audit_signal_info(int sig, struct task_struct *t)
|
|
{
|
|
extern pid_t audit_sig_pid;
|
|
extern uid_t audit_sig_uid;
|
|
|
|
if (unlikely(audit_pid && t->tgid == audit_pid)) {
|
|
if (sig == SIGTERM || sig == SIGHUP) {
|
|
struct audit_context *ctx = current->audit_context;
|
|
audit_sig_pid = current->pid;
|
|
if (ctx)
|
|
audit_sig_uid = ctx->loginuid;
|
|
else
|
|
audit_sig_uid = current->uid;
|
|
}
|
|
}
|
|
}
|
|
|