kernel/ptrace.c

时间:2023-02-17 21:48:09

/* ptrace.c */
/* By Ross Biro 1/23/92 */
/* edited by Linus Torvalds */

#include <linux/head.h>
#include <linux/kernel.h>
#include <linux/sched.h>
#include <linux/mm.h>
#include <linux/errno.h>
#include <linux/ptrace.h>
#include <linux/user.h>

#include <asm/segment.h>
#include <asm/system.h>
#include <linux/debugreg.h>

/*
 * Does not yet catch the signals sent (in exit.c or in signal.c)
 * when the child dies.
 */
/* determines which flags the user has access to. */
/* 1 = access 0 = no access */
#define FLAG_MASK 0x00044dd5

/* sets the trap flag. */
#define TRAP_FLAG 0x100

/*
 * This is the number to subtract from the top of the stack to find
 * the local frame.
 */
#define MAGICNUMBER 68

/* change a pid into a task struct. */
//获取指定pid的任务
static inline struct task_struct * get_task(int pid)
{
    int i;
    //遍历所有任务进程,查找指定进程号的进程
    for (i = 1; i < NR_TASKS; i++) {
        if (task[i] != NULL && (task[i]->pid == pid))
            return task[i];
    }
    return NULL;
}

/*
 * Fetch one word from a task's privileged stack.
 *
 * task:   task whose stack is read.
 * offset: byte distance from the base address stored in the TSS
 *         (task->tss.esp0); may be negative.
 *
 * Returns the int found at that location.  This assumes that every
 * privileged stack lives in our data space, so the address can be
 * dereferenced directly.
 */
static inline int get_stack_long(struct task_struct *task, int offset)
{
    unsigned char *base = (unsigned char *)task->tss.esp0;
    int *slot = (int *)(base + offset);

    return *slot;
}

/*
 * Store one word on a task's privileged stack.
 *
 * task:   task whose stack is written.
 * offset: byte distance from the base address stored in the TSS
 *         (task->tss.esp0); may be negative.
 * data:   value to store.
 *
 * Always returns 0.  This assumes that every privileged stack lives in
 * our data space, so the address can be written directly.
 */
static inline int put_stack_long(struct task_struct *task, int offset,
    unsigned long data)
{
    unsigned char *base = (unsigned char *) task->tss.esp0;
    unsigned long *slot = (unsigned long *) (base + offset);

    *slot = data;
    return 0;
}

/*
 * Read one long from any process space by following the page tables.
 *
 * tsk:  task whose page directory (tsk->tss.cr3) is walked.
 * addr: address of the long inside that task's address space.
 *
 * NOTE! The caller must make sure that the long does not sit on a page
 * boundary and that it lies in the task area: nothing is checked here.
 *
 * NOTE2! "tsk->tss.cr3" is used even though it is currently known to be
 * always zero, so that this routine need not change when a better mm
 * arrives.
 *
 * Returns the long read, or 0 when the page-table entry is at or above
 * high_memory.
 */
static unsigned long get_long(struct task_struct * tsk,
    unsigned long addr)
{
    unsigned long entry;

    for (;;) {
        /* start from the page-directory entry covering addr */
        entry = *PAGE_DIR_OFFSET(tsk->tss.cr3,addr);
        if (entry & PAGE_PRESENT) {
            /* directory entry is valid: fetch the page-table entry */
            entry &= PAGE_MASK;
            entry += PAGE_PTR(addr);
            entry = *((unsigned long *) entry);
        }
        if (entry & PAGE_PRESENT)
            break;
        /* directory or table entry not present: hand it to do_no_page() and walk again */
        do_no_page(0,addr,tsk,0);
    }

    /* this is a hack for non-kernel-mapped video buffers and similar */
    if (entry >= high_memory)
        return 0;

    /* page frame address plus the offset of addr within its page */
    entry &= PAGE_MASK;
    entry += addr & ~PAGE_MASK;
    return *(unsigned long *) entry;
}

/*
 * Write one long into any process space by following the page tables.
 *
 * tsk:  task whose page directory (tsk->tss.cr3) is walked.
 * addr: address of the long inside that task's address space.
 * data: value to store.
 *
 * NOTE! The caller must make sure that the long does not sit on a page
 * boundary and that it lies in the task area: this routine does no
 * checking.
 *
 * Keeps the R/W state of the page so that a text page stays readonly
 * even if a debugger scribbles breakpoints into it.  -M.U-
 */
static void put_long(struct task_struct * tsk, unsigned long addr,
    unsigned long data)
{
    /* pte holds the address of the page-table entry so its flag bits can be edited below */
    unsigned long page, pte = 0;
    /* set when the page was found without PAGE_RW and without PAGE_COW */
    int readonly = 0;

repeat:
    /* start from the page-directory entry covering addr */
    page = *PAGE_DIR_OFFSET(tsk->tss.cr3,addr);
    if (page & PAGE_PRESENT) {
        page &= PAGE_MASK;
        page += PAGE_PTR(addr);
        pte = page;
        page = *((unsigned long *) page);
    }
    /* directory or table entry not present: hand it to do_no_page() and walk again */
    if (!(page & PAGE_PRESENT)) {
        do_no_page(0 /* PAGE_RW */ ,addr,tsk,0);
        goto repeat;
    }
    /* page is not writable: remember whether it was plain read-only, then let do_wp_page() deal with it and walk again */
    if (!(page & PAGE_RW)) {
        if(!(page & PAGE_COW))
            readonly = 1;
        do_wp_page(PAGE_RW | PAGE_PRESENT,addr,tsk,0);
        goto repeat;
    }
/* this is a hack for non-kernel-mapped video buffers and similar */
    if (page >= high_memory)
        return;
/* we're bypassing pagetables, so we have to set the dirty bit ourselves */
    *(unsigned long *) pte |= (PAGE_DIRTY|PAGE_COW);
    /* page frame address plus the offset of addr within its page */
    page &= PAGE_MASK;
    page += addr & ~PAGE_MASK;
    *(unsigned long *) page = data;
    /* put a formerly read-only page back: drop PAGE_RW and PAGE_COW from its entry, then invalidate() */
    if(readonly) {
        *(unsigned long *) pte &=~ (PAGE_RW|PAGE_COW);
        invalidate();
    }
}

/*
 * Checked read of one long from a task's address space.
 *
 * tsk:    task to read from.
 * addr:   address of the long; it may be unaligned.
 * result: receives the value read.
 *
 * Returns -EIO when addr is above TASK_SIZE-sizeof(long), 0 otherwise.
 * A long that fits inside one page is read with a single get_long().
 * One that crosses a page boundary is assembled from the two aligned
 * longs on either side of the boundary.
 */
static int read_long(struct task_struct * tsk, unsigned long addr,
    unsigned long * result)
{
    unsigned long first, second;

    if (addr > TASK_SIZE-sizeof(long))
        return -EIO;

    /* common case: the whole long lies within one page */
    if ((addr & ~PAGE_MASK) <= PAGE_SIZE-sizeof(long)) {
        *result = get_long(tsk,addr);
        return 0;
    }

    /* straddles a page boundary: fetch the aligned long on each side */
    first = get_long(tsk,addr & ~(sizeof(long)-1));
    second = get_long(tsk,(addr+sizeof(long)) & ~(sizeof(long)-1));

    /* drop the bytes below addr from `first`, fill the top from `second` */
    switch (addr & (sizeof(long)-1)) {
        case 1:
            first = (first >> 8) | (second << 24);
            break;
        case 2:
            first = (first >> 16) | (second << 16);
            break;
        case 3:
            first = (first >> 24) | (second << 8);
            break;
    }
    *result = first;
    return 0;
}

/*
 * Checked write of one long into a task's address space.
 *
 * tsk:  task to write to.
 * addr: address of the long; it may be unaligned.
 * data: value to store.
 *
 * Returns -EIO when addr is above TASK_SIZE-sizeof(long), 0 otherwise.
 * A long that fits inside one page is written with a single put_long().
 * One that crosses a page boundary is written by reading the two
 * aligned longs on either side, merging the new bytes in, and writing
 * both back.
 */
static int write_long(struct task_struct * tsk, unsigned long addr,
    unsigned long data)
{
    unsigned long head, tail;

    if (addr > TASK_SIZE-sizeof(long))
        return -EIO;

    /* common case: the whole long lies within one page */
    if ((addr & ~PAGE_MASK) <= PAGE_SIZE-sizeof(long)) {
        put_long(tsk,addr,data);
        return 0;
    }

    /* straddles a page boundary: read-modify-write both aligned longs */
    head = get_long(tsk,addr & ~(sizeof(long)-1));
    tail = get_long(tsk,(addr+sizeof(long)) & ~(sizeof(long)-1));

    /* keep the bytes of `head` below addr and the bytes of `tail` past the end */
    switch (addr & (sizeof(long)-1)) {
        case 0: /* shouldn't happen, but safety first */
            head = data;
            break;
        case 1:
            head = (head & 0x000000ff) | (data << 8);
            tail = (tail & ~0xff) | (data >> 24);
            break;
        case 2:
            head = (head & 0x0000ffff) | (data << 16);
            tail = (tail & ~0xffff) | (data >> 16);
            break;
        case 3:
            head = (head & 0x00ffffff) | (data << 24);
            tail = (tail & ~0xffffff) | (data >> 8);
            break;
    }
    put_long(tsk,addr & ~(sizeof(long)-1),head);
    put_long(tsk,(addr+sizeof(long)) & ~(sizeof(long)-1),tail);
    return 0;
}

asmlinkage int sys_ptrace(long request, long pid, long addr, long data)
{
    struct task_struct *child;
    struct user * dummy;
    int i;

dummy = NULL;

if (request == PTRACE_TRACEME) {
        /* are we already being traced? */
        if (current->flags & PF_PTRACED)
            return -EPERM;
        /* set the ptrace bit in the proccess flags. */
        current->flags |= PF_PTRACED;
        return 0;
    }
    if (pid == 1)        /* you may not mess with init */
        return -EPERM;
    if (!(child = get_task(pid)))
        return -ESRCH;
    if (request == PTRACE_ATTACH) {
        if (child == current)
            return -EPERM;
        if ((!child->dumpable || (current->uid != child->euid) ||
             (current->gid != child->egid)) && !suser())
            return -EPERM;
        /* the same process cannot be attached many times */
        if (child->flags & PF_PTRACED)
            return -EPERM;
        child->flags |= PF_PTRACED;
        if (child->p_pptr != current) {
            REMOVE_LINKS(child);
            child->p_pptr = current;
            SET_LINKS(child);
        }
        send_sig(SIGSTOP, child, 1);
        return 0;
    }
    if (!(child->flags & PF_PTRACED))
        return -ESRCH;
    if (child->state != TASK_STOPPED) {
        if (request != PTRACE_KILL)
            return -ESRCH;
    }
    if (child->p_pptr != current)
        return -ESRCH;

switch (request) {
    /* when I and D space are seperate, these will need to be fixed. */
        case PTRACE_PEEKTEXT: /* read word at location addr. */
        case PTRACE_PEEKDATA: {
            unsigned long tmp;
            int res;

res = read_long(child, addr, &tmp);
            if (res < 0)
                return res;
            res = verify_area(VERIFY_WRITE, (void *) data, sizeof(long));
            if (!res)
                put_fs_long(tmp,(unsigned long *) data);
            return res;
        }

/* read the word at location addr in the USER area. */
        case PTRACE_PEEKUSR: {
            unsigned long tmp;
            int res;

if ((addr & 3) || addr < 0 ||
                addr > sizeof(struct user) - 3)
                return -EIO;

res = verify_area(VERIFY_WRITE, (void *) data, sizeof(long));
            if (res)
                return res;
            tmp = 0;  /* Default return condition */
            if(addr < 17*sizeof(long)) {
              addr = addr >> 2; /* temporary hack. */

tmp = get_stack_long(child, sizeof(long)*addr - MAGICNUMBER);
              if (addr == DS || addr == ES ||
                  addr == FS || addr == GS ||
                  addr == CS || addr == SS)
                tmp &= 0xffff;
            };
            if(addr >= (long) &dummy->u_debugreg[0] &&
               addr <= (long) &dummy->u_debugreg[7]){
                addr -= (long) &dummy->u_debugreg[0];
                addr = addr >> 2;
                tmp = child->debugreg[addr];
            };
            put_fs_long(tmp,(unsigned long *) data);
            return 0;
        }

/* when I and D space are seperate, this will have to be fixed. */
        case PTRACE_POKETEXT: /* write the word at location addr. */
        case PTRACE_POKEDATA:
            return write_long(child,addr,data);

case PTRACE_POKEUSR: /* write the word at location addr in the USER area */
            if ((addr & 3) || addr < 0 ||
                addr > sizeof(struct user) - 3)
                return -EIO;

addr = addr >> 2; /* temproary hack. */

if (addr == ORIG_EAX)
                return -EIO;
            if (addr == DS || addr == ES ||
                addr == FS || addr == GS ||
                addr == CS || addr == SS) {
                    data &= 0xffff;
                    if (data && (data & 3) != 3)
                    return -EIO;
            }
            if (addr == EFL) {   /* flags. */
                data &= FLAG_MASK;
                data |= get_stack_long(child, EFL*sizeof(long)-MAGICNUMBER)  & ~FLAG_MASK;
            }
          /* Do not allow the user to set the debug register for kernel
             address space */
          if(addr < 17){
              if (put_stack_long(child, sizeof(long)*addr-MAGICNUMBER, data))
                return -EIO;
            return 0;
            };

/* We need to be very careful here.  We implicitly
             want to modify a portion of the task_struct, and we
             have to be selective about what portions we allow someone
             to modify. */

addr = addr << 2;  /* Convert back again */
          if(addr >= (long) &dummy->u_debugreg[0] &&
             addr <= (long) &dummy->u_debugreg[7]){

if(addr == (long) &dummy->u_debugreg[4]) return -EIO;
              if(addr == (long) &dummy->u_debugreg[5]) return -EIO;
              if(addr < (long) &dummy->u_debugreg[4] &&
                 ((unsigned long) data) >= 0xbffffffd) return -EIO;
              
              if(addr == (long) &dummy->u_debugreg[7]) {
                  data &= ~DR_CONTROL_RESERVED;
                  for(i=0; i<4; i++)
                      if ((0x5f54 >> ((data >> (16 + 4*i)) & 0xf)) & 1)
                          return -EIO;
              };

addr -= (long) &dummy->u_debugreg;
              addr = addr >> 2;
              child->debugreg[addr] = data;
              return 0;
          };
          return -EIO;

case PTRACE_SYSCALL: /* continue and stop at next (return from) syscall */
        case PTRACE_CONT: { /* restart after signal. */
            long tmp;

if ((unsigned long) data > NSIG)
                return -EIO;
            if (request == PTRACE_SYSCALL)
                child->flags |= PF_TRACESYS;
            else
                child->flags &= ~PF_TRACESYS;
            child->exit_code = data;
            child->state = TASK_RUNNING;
    /* make sure the single step bit is not set. */
            tmp = get_stack_long(child, sizeof(long)*EFL-MAGICNUMBER) & ~TRAP_FLAG;
            put_stack_long(child, sizeof(long)*EFL-MAGICNUMBER,tmp);
            return 0;
        }

/*
 * make the child exit.  Best I can do is send it a sigkill.
 * perhaps it should be put in the status that it want's to
 * exit.
 */
        case PTRACE_KILL: {
            long tmp;

child->state = TASK_RUNNING;
            child->exit_code = SIGKILL;
    /* make sure the single step bit is not set. */
            tmp = get_stack_long(child, sizeof(long)*EFL-MAGICNUMBER) & ~TRAP_FLAG;
            put_stack_long(child, sizeof(long)*EFL-MAGICNUMBER,tmp);
            return 0;
        }

case PTRACE_SINGLESTEP: {  /* set the trap flag. */
            long tmp;

if ((unsigned long) data > NSIG)
                return -EIO;
            child->flags &= ~PF_TRACESYS;
            tmp = get_stack_long(child, sizeof(long)*EFL-MAGICNUMBER) | TRAP_FLAG;
            put_stack_long(child, sizeof(long)*EFL-MAGICNUMBER,tmp);
            child->state = TASK_RUNNING;
            child->exit_code = data;
    /* give it a chance to run. */
            return 0;
        }

case PTRACE_DETACH: { /* detach a process that was attached. */
            long tmp;

if ((unsigned long) data > NSIG)
                return -EIO;
            child->flags &= ~(PF_PTRACED|PF_TRACESYS);
            child->state = TASK_RUNNING;
            child->exit_code = data;
            REMOVE_LINKS(child);
            child->p_pptr = child->p_opptr;
            SET_LINKS(child);
            /* make sure the single step bit is not set. */
            tmp = get_stack_long(child, sizeof(long)*EFL-MAGICNUMBER) & ~TRAP_FLAG;
            put_stack_long(child, sizeof(long)*EFL-MAGICNUMBER,tmp);
            return 0;
        }

default:
            return -EIO;
    }
}

/*
 * System-call trace hook.
 *
 * Does nothing unless the current task has both PF_PTRACED and
 * PF_TRACESYS set.  Otherwise it stops the task with exit_code SIGTRAP,
 * notifies the parent and calls schedule().  Once execution continues,
 * a non-zero exit_code is taken as a signal number and added to the
 * task's pending signals, and exit_code is cleared.
 */
asmlinkage void syscall_trace(void)
{
    if ((current->flags & (PF_PTRACED|PF_TRACESYS))
            != (PF_PTRACED|PF_TRACESYS))
        return;
    current->exit_code = SIGTRAP;
    current->state = TASK_STOPPED;
    notify_parent(current);
    schedule();
    /*
     * this isn't the same as continuing with a signal, but it will do
     * for normal use.  strace only continues with a signal if the
     * stopping signal is not SIGTRAP.  -brl
     */
    /*
     * sys_ptrace() accepts resume signals up to and including NSIG, so
     * the shift count can reach NSIG-1.  Shift an unsigned long one so
     * the highest signal never shifts into the sign bit of an int.
     */
    if (current->exit_code)
        current->signal |= (1UL << (current->exit_code - 1));
    current->exit_code = 0;
}

kernel/ptrace.c的更多相关文章

  1. Playing with ptrace, Part II

    Playing with ptrace, Part II Issue From Issue # December Dec , By Pradeep Padala inSysAdmin In Part ...

  2. linux下 玩转ptrace

    译者序:在开发Hust Online Judge的过程中,查阅了不少资料,关于调试器技术的资料在网上是很少,即便是UNIX编程巨著<UNIX环境高级编程>中,相关内容也不多,直到我在 ht ...

  3. 玩转ptrace(转)

    下面是转帖的内容,写的很详细.但是不同的linux发行版中头文件的路径和名称并不相同.如在某些发行版中<linux/user.h>就不存在,其中定义的变量出现在<asm/ptrace ...

  4. 由于ptrace.h文件导致的内核编译出错的解决方法

    arch/x86/kernel/ptrace.c:1472:17: error: conflicting types for 'syscall_trace_enter'  In file includ ...

  5. CVE-2019-13272 Linux kernel 权限许可和访问控制问题漏洞

    漏洞简介: Linuxkernel是美国Linux基金会发布的开源操作系统Linux所使用的内核. Linuxkernel5.1.17之前版本中存在安全漏洞,该漏洞源于kernel/ptrace.c文 ...

  6. ptrace函数深入分析

    ptrace函数:进程跟踪. 形式:#include<sys/ptrace.h> Int ptrace(int request,int pid,int addr,int data); 概述 ...

  7. LInux_System_Call_INT_80h

    Int 80h Website (Copy from Linux-System-Call) List of Linux/i386 system calls Copyright (C) 1999-200 ...

  8. Process Kill Technology && Process Protection Against In Linux

    目录 . 引言 . Kill Process By Kill Command && SIGNAL . Kill Process By Resource Limits . Kill Pr ...

  9. systemtap 列出所有linux 内核模块与相关函数0

    diskiohttp://blog.163.com/digoal%40126/blog/static/16387704020131015105532435/ [root@localhost linux ...

随机推荐

  1. 一个URL链接到一个页面发生了什么?

    最开始觉得这是一个很难理解的东西,后来看了很多人写的发现并没有那么难理解,本人只是一个学渣有什么说的不对的地方希望大家能够指出来! 一个URL从我们输入的那一刻起,到返回页面到底发生了什么呢? URL ...

  2. Symfony2学习笔记之表单

    对于一个Web开发者来说,处理HTML表单是一个最为普通又具挑战的任务.Symfony2集成了一个Form组件,让处理表单变的容易起来.在这一节里,我们将从基础开始创建一个复杂的表单,学习表单类库中最 ...

  3. iOS_SN_深浅拷贝( 百度的)_转载

    文章原地址:http://www.cnblogs.com/5ishare/p/4362459.html 深浅拷贝前提是:是实现NSCopying或者NSMutableCopying协议. 浅拷贝只是复 ...

  4. 使用资源监控工具 glances

    http://www.ibm.com/developerworks/cn/linux/1304_caoyq_glances/ glances 可以为 Unix 和 Linux 性能专家提供监视和分析性 ...

  5. 【Android Developers Training】 51. 序言:打印内容

    注:本文翻译自Google官方的Android Developers Training文档,译者技术一般,由于喜爱安卓而产生了翻译的念头,纯属个人兴趣爱好. 原文链接:http://developer ...

  6. python可用ORM之Pony

    Pony是Python的一种ORM,它允许使用生成器表达式来构造查询,通过将生成器表达式的抽象语法树解析成SQL语句.它也有在线ER图编辑器可以帮助你创建Model. 示例分析 Pony语句: sel ...

  7. OO前三次作业总结

    一.第一次作业 1.程序设计分析 ![img](s1.ax1x.com/2018/04/02/CSgoSU.png) 图1 第一次作业类图 ![name](https://images2018.cnb ...

  8. git diff 结果分析

    git diff 的5个使用场景: 1.staging area和working area的文件 (无其他参数时) git diff   2.master分支和working area的文件 (用ma ...

  9. 2018.10.27 bzoj3209: 花神的数论题(数位dp)

    传送门 数位dpdpdp经典题. 题面已经暗示了我们按照二进制位来数位dpdpdp. 直接dpdpdp多少个数有111个111,222个111,333个111-, 然后快速幂算就行了. 于是我们枚举前 ...

  10. Visual Studio无法导航到插入点下面的符号

    Visual Studio2017编辑器按F12无法跳转到变量所属的类定义,弹窗提示[无法导航到插入点下面的符号],如下图: 解决办法: 方法一: 清理解决方案,重新生成. 方法二: 如果以上办法不行 ...