Question

我是CS专业，我的班级有一个实验室来创建链接列表保存内存信息（位置，大小等）以模拟C中的简单垃圾收集器。我们需要做的一件事就是找到我们系统的基本指针。问题在于，我们几乎没有人能够做到这一点，教授暗示这些概念将在决赛中出现。

实验室结束了，所以不要担心这个等级或其他任何东西，我正在努力抓住这个想法，所以我已经为我的决赛做好了准备。

我不确定“root”是否是一个常用术语，但我们的想法是我们保存main函数的基数的位置，然后当我们调出root函数时，我们立即保存该函数的位置函数，迭代两者之间的所有内存，寻找指向链表的指针。这些指针被认为是“根”。

这是我实验室的代码。也许只是看它而不是尝试解释它会更容易。我意识到它可能不是很好的代码，并且它并不真正做任何东西，但我只是做他们告诉我的事情。

*我的问题是我的链接列表中的“开始”和“完成”范围从未指向当我遍历堆栈时，所以我相信我的指针一定是做错了。 my＆amp; start和＆amp; fin总是非常接近迭代器，但从不重叠，我不明白为什么。

将两个文件保存为.c文件进行编译时，应该像gcc -g * .c一样简单

#include <stdio.h>
#include <stdlib.h>
#include <ctype.h>
#include <string.h>
#include <stdbool.h>
//#include "gc_lib.h"

typedef struct hnode{

    bool used;
    long size;
    void* loc;
    struct hnode* next;
    struct hnode* prev;
}hnode;

//Globals
long HEAP_SIZE = 0;
bool AUTO_FREE = false;
void* MAIN_BASE = NULL;
void* MY_HEAP = NULL;
hnode* head = 0;


bool gc_init( long heapsize, void* main_base, bool autofree ){

    if( heapsize <= 0 )
        return false;

    HEAP_SIZE = heapsize;
    AUTO_FREE = autofree;
    MAIN_BASE = main_base;

    if( ( MY_HEAP = malloc( HEAP_SIZE ) ) == NULL )
        return false;

    return true;    
}


void* gc_malloc( unsigned long size ){

    if( size <= 0 )
        return NULL;

    //first malloc
    if( !head ){

        head = malloc( sizeof( hnode ) );
        head -> size = size;
        head -> loc = MY_HEAP;
        head -> used = true;        
        head -> prev = 0;

        hnode* hMem = malloc( sizeof( hnode ) );
        hMem -> size = HEAP_SIZE - size;
        hMem -> loc = (void*)((char*)(MY_HEAP) + size);
        hMem -> used = false;
        hMem -> next = 0;
        hMem -> prev = head;

        head -> next = hMem;

        return head -> loc;
    }

    hnode* findSpot = head;
    void* tempLoc = MY_HEAP;    
    int tempS = 0;

    while( findSpot ){

        //Used node
        if( findSpot -> used == true ){

            tempS += findSpot -> size;
            tempLoc = (void*)((char*)(MY_HEAP) + tempS);
            findSpot = findSpot -> next;
        }
        //Empty node; fits perfectly
        else if( ( findSpot -> used == false ) && ( findSpot -> size == size ) ){

            findSpot -> used = true;
            return findSpot -> loc;
        }
        //Empty node; fits imperfectly
        else if( ( findSpot -> used == false ) && ( findSpot -> size > size ) ){

            int splitSize = ( findSpot -> size ) - size;

            findSpot -> used = true;
            findSpot -> size = size; 

            hnode* newNode = malloc ( sizeof( hnode ) );
            newNode -> prev = findSpot;
            newNode -> next = findSpot -> next;
            newNode -> size = splitSize;
            newNode -> used = false;

            if( findSpot -> next )
                findSpot -> next -> prev = newNode;

            findSpot -> next = newNode;
            tempS += findSpot -> size;
            tempLoc = (void*)((char*)(MY_HEAP) + tempS);

            newNode -> loc = tempLoc;
            return findSpot -> loc;
        }
        //Empty node; too small
        else if( ( findSpot -> used == false ) && ( findSpot -> size < size ) ){

            tempS += findSpot -> size;
            tempLoc = (void*)((char*)(MY_HEAP) + tempS);
            findSpot = findSpot -> next;
        }
    }

    return NULL;
}


void print_roots( void ){

    register void* base asm("ebp");

    void* iter = base;
    printf( "Roots:\n" );

    if( head ){

        void* mBase = MAIN_BASE;
        hnode* nTemp = head;
        void* start = 0;
        void* fin = 0;

        while( iter != mBase ){

            if( nTemp )
                start = nTemp -> loc;

            while( nTemp && nTemp -> used)                
                nTemp = nTemp -> next;

            fin = nTemp -> loc + nTemp -> size;


            if( iter >= start && iter <= fin )
                fprintf( stdout, ">>>>%p\n", iter );

            printf("iter: %p\n", (iter)++ );
        }

        printf("MAIN_BASE: %p\n", MAIN_BASE );
        printf("base: %p\n", base );
        printf("\tstart: %p\n", &start );
        printf("\tfin: %p\n", &fin );
    }
}

以下是我们提供的测试文件：

#include <stdio.h>
#include <stdbool.h>
#include <assert.h>

#include "gc_lib.h"



int main(int argc, char** argv){
    register void* base asm("ebp");
    gc_init(100, base, false);

    void* x1 = gc_malloc(8);
    assert(x1 != NULL);
    void* x2 = gc_malloc(8);
    assert(x2 != NULL);
    assert((x2 == x1 + 8) || (x2 == x1 - 8));

    printf("%p\n", x1);
    printf("%p\n", x2);

    print_roots();

    return 0;
}

Answer 1

如果我是正确的，你想知道为什么永远不满足以下条件，并且相应的printf永远不会执行：

 if( iter >= start && iter <= fin )
            fprintf( stdout, ">>>>%p\n", iter );

据我所知，代码register void* base asm("ebp");将base变量放在EBP寄存器中。虽然，似乎只是建议编译器将其放在那里，因此可以忽略 - 来自gcc docs：

此选项不保证GCC始终在您指定的寄存器中生成具有此变量的代码。

因此，无法保证获得EBP值。

但这似乎并非如此。 iter从base值开始，这是指向void print_roots( void )被调用的地方的指针（我可能在这里错了，但它并不重要 - 它指向某个地方在堆栈中）。它通过增加它的值来迭代，直到它等于MAIN_BASE，它指向一个堆栈，其中int main(int argc, char** argv)函数存储关于它自身的东西。在这两个值之间，期望找到main函数的局部变量（x1和x2），这些变量指向堆中的某个位置（其中一些hnode->loc点到）。

以下代码定义start和fin变量的值：

nTemp = head;
if( nTemp )
    start = nTemp -> loc;

while( nTemp && nTemp -> used)                
    nTemp = nTemp -> next;

fin = nTemp -> loc + nTemp -> size;

因此，start和fin指向堆（因为列表中的任何hnode是指向堆的指针），而iter指向堆栈。这就是条件iter >= start && iter <= fin永远不会满足的原因。

在堆栈上查找函数的根

1 个答案: