linux/kernel/exit.c

/*
 *  linux/kernel/exit.c
 *
 *  Copyright (C) 1991, 1992  Linus Torvalds
 */

#undef DEBUG_PROC_TREE

#include <linux/wait.h>
#include <linux/errno.h>
#include <linux/signal.h>
#include <linux/sched.h>
#include <linux/kernel.h>
#include <linux/resource.h>
#include <linux/mm.h>
#include <linux/tty.h>
#include <linux/malloc.h>
#include <linux/interrupt.h>

#include <asm/segment.h>
#include <asm/pgtable.h>

extern void sem_exit (void);
extern void acct_process (long exitcode);
extern void kerneld_exit(void);

int getrusage(struct task_struct *, int, struct rusage *);

static inline void generate(unsigned long sig, struct task_struct * p)
{
        unsigned long mask = 1 << (sig-1);
        struct sigaction * sa = sig + p->sig->action - 1;

        if (!(mask & p->blocked) && !(p->flags & PF_PTRACED)) {
                /* don't bother with ignored signals (but SIGCHLD is special) */
                if (sa->sa_handler == SIG_IGN && sig != SIGCHLD)
                        return;
                /* some signals are ignored by default.. (but SIGCONT already did its deed) */
                if ((sa->sa_handler == SIG_DFL) &&
                    (sig == SIGCONT || sig == SIGCHLD || sig == SIGWINCH || sig == SIGURG))
                        return;
        }
        p->signal |= mask;
        if (p->state == TASK_INTERRUPTIBLE && (p->signal & ~p->blocked))
                wake_up_process(p);
}

void force_sig(unsigned long sig, struct task_struct * p)
{
        sig--;
        if (p->sig) {
                unsigned long mask = 1UL << sig;
                struct sigaction *sa = p->sig->action + sig;
                p->signal |= mask;
                p->blocked &= ~mask;
                if (sa->sa_handler == SIG_IGN)
                        sa->sa_handler = SIG_DFL;
                if (p->state == TASK_INTERRUPTIBLE)
                        wake_up_process(p);
        }
}


int send_sig(unsigned long sig,struct task_struct * p,int priv)
{
        if (!p || sig > 32)
                return -EINVAL;
        if (!priv && ((sig != SIGCONT) || (current->session != p->session)) &&
            (current->euid ^ p->suid) && (current->euid ^ p->uid) &&
            (current->uid ^ p->suid) && (current->uid ^ p->uid) &&
            !suser())
                return -EPERM;
        if (!sig)
                return 0;
        if (!p->sig)
                return 0;
        if ((sig == SIGKILL) || (sig == SIGCONT)) {
                if (p->state == TASK_STOPPED)
                        wake_up_process(p);
                p->exit_code = 0;
                p->signal &= ~( (1<<(SIGSTOP-1)) | (1<<(SIGTSTP-1)) |
                                (1<<(SIGTTIN-1)) | (1<<(SIGTTOU-1)) );
        }
        if (sig == SIGSTOP || sig == SIGTSTP || sig == SIGTTIN || sig == SIGTTOU)
                p->signal &= ~(1<<(SIGCONT-1));
        /* Actually generate the signal */
        generate(sig,p);
        return 0;
}

void notify_parent(struct task_struct * tsk)
{
        if (tsk->p_pptr == task[smp_num_cpus])          /* Init */
                tsk->exit_signal = SIGCHLD;
        send_sig(tsk->exit_signal, tsk->p_pptr, 1);
        wake_up_interruptible(&tsk->p_pptr->wait_chldexit);
}

void release(struct task_struct * p)
{
        int i;

        if (!p)
                return;
        if (p == current) {
                printk("task releasing itself\n");
                return;
        }
        for (i=1 ; i<NR_TASKS ; i++)
                if (task[i] == p) {
                        nr_tasks--;
                        task[i] = NULL;
                        REMOVE_LINKS(p);
                        release_thread(p);
                        if (STACK_MAGIC != *(unsigned long *)p->kernel_stack_page)
                                printk(KERN_ALERT "release: %s kernel stack corruption. Aiee\n", p->comm);
                        free_kernel_stack(p->kernel_stack_page);
                        current->cmin_flt += p->min_flt + p->cmin_flt;
                        current->cmaj_flt += p->maj_flt + p->cmaj_flt;
                        current->cnswap += p->nswap + p->cnswap;
                        kfree(p);
                        return;
                }
        panic("trying to release non-existent task");
}

#ifdef DEBUG_PROC_TREE

int bad_task_ptr(struct task_struct *p)
{
        int     i;

        if (!p)
                return 0;
        for (i=0 ; i<NR_TASKS ; i++)
                if (task[i] == p)
                        return 0;
        return 1;
}

void audit_ptree(void)
{
        int     i;

        for (i=1 ; i<NR_TASKS ; i++) {
                if (!task[i])
                        continue;
                if (bad_task_ptr(task[i]->p_pptr))
                        printk("Warning, pid %d's parent link is bad\n",
                                task[i]->pid);
                if (bad_task_ptr(task[i]->p_cptr))
                        printk("Warning, pid %d's child link is bad\n",
                                task[i]->pid);
                if (bad_task_ptr(task[i]->p_ysptr))
                        printk("Warning, pid %d's ys link is bad\n",
                                task[i]->pid);
                if (bad_task_ptr(task[i]->p_osptr))
                        printk("Warning, pid %d's os link is bad\n",
                                task[i]->pid);
                if (task[i]->p_pptr == task[i])
                        printk("Warning, pid %d parent link points to self\n",
                                task[i]->pid);
                if (task[i]->p_cptr == task[i])
                        printk("Warning, pid %d child link points to self\n",
                                task[i]->pid);
                if (task[i]->p_ysptr == task[i])
                        printk("Warning, pid %d ys link points to self\n",
                                task[i]->pid);
                if (task[i]->p_osptr == task[i])
                        printk("Warning, pid %d os link points to self\n",
                                task[i]->pid);
                if (task[i]->p_osptr) {
                        if (task[i]->p_pptr != task[i]->p_osptr->p_pptr)
                                printk(
                        "Warning, pid %d older sibling %d parent is %d\n",
                                task[i]->pid, task[i]->p_osptr->pid,
                                task[i]->p_osptr->p_pptr->pid);
                        if (task[i]->p_osptr->p_ysptr != task[i])
                                printk(
                "Warning, pid %d older sibling %d has mismatched ys link\n",
                                task[i]->pid, task[i]->p_osptr->pid);
                }
                if (task[i]->p_ysptr) {
                        if (task[i]->p_pptr != task[i]->p_ysptr->p_pptr)
                                printk(
                        "Warning, pid %d younger sibling %d parent is %d\n",
                                task[i]->pid, task[i]->p_osptr->pid,
                                task[i]->p_osptr->p_pptr->pid);
                        if (task[i]->p_ysptr->p_osptr != task[i])
                                printk(
                "Warning, pid %d younger sibling %d has mismatched os link\n",
                                task[i]->pid, task[i]->p_ysptr->pid);
                }
                if (task[i]->p_cptr) {
                        if (task[i]->p_cptr->p_pptr != task[i])
                                printk(
                        "Warning, pid %d youngest child %d has mismatched parent link\n",
                                task[i]->pid, task[i]->p_cptr->pid);
                        if (task[i]->p_cptr->p_ysptr)
                                printk(
                        "Warning, pid %d youngest child %d has non-NULL ys link\n",
                                task[i]->pid, task[i]->p_cptr->pid);
                }
        }
}
#endif /* DEBUG_PROC_TREE */

int session_of_pgrp(int pgrp)
{
        struct task_struct *p;
        int fallback;

        fallback = -1;
        for_each_task(p) {
                if (p->session <= 0)
                        continue;
                if (p->pgrp == pgrp)
                        return p->session;
                if (p->pid == pgrp)
                        fallback = p->session;
        }
        return fallback;
}

int kill_pg(int pgrp, int sig, int priv)
{
        struct task_struct *p;
        int err,retval = -ESRCH;
        int found = 0;

        if (sig<0 || sig>32 || pgrp<=0)
                return -EINVAL;
        for_each_task(p) {
                if (p->pgrp == pgrp) {
                        if ((err = send_sig(sig,p,priv)) != 0)
                                retval = err;
                        else
                                found++;
                }
        }
        return(found ? 0 : retval);
}

int kill_sl(int sess, int sig, int priv)
{
        struct task_struct *p;
        int err,retval = -ESRCH;
        int found = 0;

        if (sig<0 || sig>32 || sess<=0)
                return -EINVAL;
        for_each_task(p) {
                if (p->session == sess && p->leader) {
                        if ((err = send_sig(sig,p,priv)) != 0)
                                retval = err;
                        else
                                found++;
                }
        }
        return(found ? 0 : retval);
}

int kill_proc(int pid, int sig, int priv)
{
        struct task_struct *p;

        if (sig<0 || sig>32)
                return -EINVAL;
        for_each_task(p) {
                if (p && p->pid == pid)
                        return send_sig(sig,p,priv);
        }
        return(-ESRCH);
}

asmlinkage int sys_kill(int pid,int sig)
{
        int err, retval = 0, count = 0;

        if (!pid)
                return(kill_pg(current->pgrp,sig,0));
        if (pid == -1) {
                struct task_struct * p;
                for_each_task(p) {
                        if (p->pid > 1 && p != current) {
                                ++count;
                                if ((err = send_sig(sig,p,0)) != -EPERM)
                                        retval = err;
                        }
                }
                return(count ? retval : -ESRCH);
        }
        if (pid < 0)
                return(kill_pg(-pid,sig,0));
        /* Normal kill */
        return(kill_proc(pid,sig,0));
}

static int will_become_orphaned_pgrp(int pgrp, struct task_struct * ignored_task)
{
        struct task_struct *p;

        for_each_task(p) {
                if ((p == ignored_task) || (p->pgrp != pgrp) ||
                    (p->state == TASK_ZOMBIE) ||
                    (p->p_pptr->pid == 1))
                        continue;
                if ((p->p_pptr->pgrp != pgrp) &&
                    (p->p_pptr->session == p->session))
                        return 0;
        }
        return(1);
}

int is_orphaned_pgrp(int pgrp)
{
        return will_become_orphaned_pgrp(pgrp, 0);
}

static inline int has_stopped_jobs(int pgrp)
{
        struct task_struct * p;

        for_each_task(p) {
                if (p->pgrp != pgrp)
                        continue;
                if (p->state == TASK_STOPPED)
                        return(1);
        }
        return(0);
}

static inline void forget_original_parent(struct task_struct * father)
{
        struct task_struct * p;

        for_each_task(p) {
                if (p->p_opptr == father)
                        if (task[smp_num_cpus]) /* init */
                                p->p_opptr = task[smp_num_cpus];
                        else
                                p->p_opptr = task[0];
        }
}

static inline void close_files(struct files_struct * files)
{
        int i, j;

        j = 0;
        for (;;) {
                unsigned long set = files->open_fds.fds_bits[j];
                i = j * __NFDBITS;
                j++;
                if (i >= NR_OPEN)
                        break;
                while (set) {
                        if (set & 1)
                                close_fp(files->fd[i]);
                        i++;
                        set >>= 1;
                }
        }
}

static inline void __exit_files(struct task_struct *tsk)
{
        struct files_struct * files = tsk->files;

        if (files) {
                tsk->files = NULL;
                if (!--files->count) {
                        close_files(files);
                        kfree(files);
                }
        }
}

void exit_files(struct task_struct *tsk)
{
  __exit_files(tsk);
}

static inline void __exit_fs(struct task_struct *tsk)
{
        struct fs_struct * fs = tsk->fs;

        if (fs) {
                tsk->fs = NULL;
                if (!--fs->count) {
                        iput(fs->root);
                        iput(fs->pwd);
                        kfree(fs);
                }
        }
}

void exit_fs(struct task_struct *tsk)
{
  __exit_fs(tsk);
}

static inline void __exit_sighand(struct task_struct *tsk)
{
        struct signal_struct * sig = tsk->sig;

        if (sig) {
                tsk->sig = NULL;
                if (!--sig->count) {
                        kfree(sig);
                }
        }
}

void exit_sighand(struct task_struct *tsk)
{
        __exit_sighand(tsk);
}

static inline void __exit_mm(struct task_struct * tsk)
{
        struct mm_struct * mm = tsk->mm;

        if (mm != &init_mm) {
                flush_cache_mm(mm);
                flush_tlb_mm(mm);
                tsk->mm = &init_mm;
                tsk->swappable = 0;
                SET_PAGE_DIR(tsk, swapper_pg_dir);

                /* free the old state - not used any more */
                if (!--mm->count) {
                        exit_mmap(mm);
                        free_page_tables(mm);
                        kfree(mm);
                }
        }
}

void exit_mm(struct task_struct *tsk)
{
        __exit_mm(tsk);
}

static void exit_notify(void)
{
        struct task_struct * p;

        forget_original_parent(current);

        if ((current->p_pptr->pgrp != current->pgrp) &&
            (current->p_pptr->session == current->session) &&
            will_become_orphaned_pgrp(current->pgrp, current) &&
            has_stopped_jobs(current->pgrp)) {
                kill_pg(current->pgrp,SIGHUP,1);
                kill_pg(current->pgrp,SIGCONT,1);
        }
        notify_parent(current);

        while ((p = current->p_cptr) != NULL) {
                current->p_cptr = p->p_osptr;
                p->p_ysptr = NULL;
                p->flags &= ~(PF_PTRACED|PF_TRACESYS);
                if (task[smp_num_cpus] && task[smp_num_cpus] != current) /* init */
                        p->p_pptr = task[smp_num_cpus];
                else
                        p->p_pptr = task[0];
                p->p_osptr = p->p_pptr->p_cptr;
                p->p_osptr->p_ysptr = p;
                p->p_pptr->p_cptr = p;
                if (p->state == TASK_ZOMBIE)
                        notify_parent(p);
                if ((p->pgrp != current->pgrp) &&
                    (p->session == current->session) &&
                    is_orphaned_pgrp(p->pgrp) &&
                    has_stopped_jobs(p->pgrp)) {
                        kill_pg(p->pgrp,SIGHUP,1);
                        kill_pg(p->pgrp,SIGCONT,1);
                }
        }
        if (current->leader)
                disassociate_ctty(1);
}

NORET_TYPE void do_exit(long code)
{
        if (intr_count) {
                printk("Aiee, killing interrupt handler\n");
                intr_count = 0;
        }
fake_volatile:
        acct_process(code);
        current->flags |= PF_EXITING;
        del_timer(¤t->real_timer);
        sem_exit();
        kerneld_exit();
        __exit_mm(current);
        __exit_files(current);
        __exit_fs(current);
        __exit_sighand(current);
        exit_thread();
        current->state = TASK_ZOMBIE;
        current->exit_code = code;
        exit_notify();
#ifdef DEBUG_PROC_TREE
        audit_ptree();
#endif
        if (current->exec_domain && current->exec_domain->use_count)
                (*current->exec_domain->use_count)--;
        if (current->binfmt && current->binfmt->use_count)
                (*current->binfmt->use_count)--;
        schedule();
        goto fake_volatile;
}

asmlinkage int sys_exit(int error_code)
{
        do_exit((error_code&0xff)<<8);
}

asmlinkage int sys_wait4(pid_t pid,unsigned int * stat_addr, int options, struct rusage * ru)
{
        int flag, retval;
        struct wait_queue wait = { current, NULL };
        struct task_struct *p;

        if (stat_addr) {
                flag = verify_area(VERIFY_WRITE, stat_addr, sizeof(*stat_addr));
                if (flag)
                        return flag;
        }
        if (ru) {
                flag = verify_area(VERIFY_WRITE, ru, sizeof(*ru));
                if (flag)
                        return flag;
        }
        if (options & ~(WNOHANG|WUNTRACED|__WCLONE))
            return -EINVAL;

        add_wait_queue(¤t->wait_chldexit,&wait);
repeat:
        flag=0;
        for (p = current->p_cptr ; p ; p = p->p_osptr) {
                if (pid>0) {
                        if (p->pid != pid)
                                continue;
                } else if (!pid) {
                        if (p->pgrp != current->pgrp)
                                continue;
                } else if (pid != -1) {
                        if (p->pgrp != -pid)
                                continue;
                }
                /* wait for cloned processes iff the __WCLONE flag is set */
                if ((p->exit_signal != SIGCHLD) ^ ((options & __WCLONE) != 0))
                        continue;
                flag = 1;
                switch (p->state) {
                        case TASK_STOPPED:
                                if (!p->exit_code)
                                        continue;
                                if (!(options & WUNTRACED) && !(p->flags & PF_PTRACED))
                                        continue;
                                if (ru != NULL)
                                        getrusage(p, RUSAGE_BOTH, ru);
                                if (stat_addr)
                                        put_user((p->exit_code << 8) | 0x7f,
                                                stat_addr);
                                p->exit_code = 0;
                                retval = p->pid;
                                goto end_wait4;
                        case TASK_ZOMBIE:
                                current->cutime += p->utime + p->cutime;
                                current->cstime += p->stime + p->cstime;
                                if (ru != NULL)
                                        getrusage(p, RUSAGE_BOTH, ru);
                                if (stat_addr)
                                        put_user(p->exit_code, stat_addr);
                                retval = p->pid;
                                if (p->p_opptr != p->p_pptr) {
                                        REMOVE_LINKS(p);
                                        p->p_pptr = p->p_opptr;
                                        SET_LINKS(p);
                                        notify_parent(p);
                                } else
                                        release(p);
#ifdef DEBUG_PROC_TREE
                                audit_ptree();
#endif
                                goto end_wait4;
                        default:
                                continue;
                }
        }
        if (flag) {
                retval = 0;
                if (options & WNOHANG)
                        goto end_wait4;
                retval = -ERESTARTSYS;
                if (current->signal & ~current->blocked)
                        goto end_wait4;
                current->state=TASK_INTERRUPTIBLE;
                schedule();
                goto repeat;
        }
        retval = -ECHILD;
end_wait4:
        remove_wait_queue(¤t->wait_chldexit,&wait);
        return retval;
}

#ifndef __alpha__

asmlinkage int sys_waitpid(pid_t pid,unsigned int * stat_addr, int options)
{
        return sys_wait4(pid, stat_addr, options, NULL);
}

#endif