类的数据结构

时间:2012-10-11 17:27:15

标签: c++ assembly data-structures computer-science

C ++类的数据结构是什么? 它在汇编级别如何工作?

IF语句是代码行的compare +条件跳转。

数组和字符串是数据的链接。

1 个答案:

答案 0 :(得分:3)

编译器为所有成员分配偏移量,并在成员的所有加载/存储操作中包含这些偏移量:

struct foo {
    uint32_t bar;
    uint32_t baz;

    uint32_t get_baz() { return baz; }
};

uint32_t get_baz_from_foo(foo *f) { return f->baz; }

变为(用于简化的ARM汇编代码):

foo__get_baz:
    ; calling convention: this pointer in r3
    ; load 32 bit value from r3 + 4 bytes into r0
    ldr r0, [r3, #4];
    ; calling convention: return value in r0
    ; return from subroutine
    b lr

get_baz_from_foo:
    ; calling convention: first parameter in r0
    ; load 32 bit value from r0 + 4 bytes into r0
    ldr r0, [r0, #4]
    ; calling convention: return value in r0
    ; return from subroutine
    b lr

由于struct各自的class布局在编译后没有改变,所以4在这里被硬编码到指令流中。

通过分配内存并将指针从分配函数传递给期望指向结构的指针的每个人来创建实例:

new__foo:
    ; two 32 bit integers need 8 bytes
    ; calling convention: first parameter in r0
    mov r0, #8
    ; call allocator, which will then return to the function invoking new
    bra malloc

如果有构造函数

struct foo2 {
    foo2() : bar(5), baz(7) { }
    uint32_t bar;
    uint32_t baz;
    uint32_t get_baz() { return baz; }
};

我们最终会采用一种稍微复杂的方式来创建对象(您应该能够在没有注释的情况下找到它):

new__foo2:
    strdb lr, ![sp]
    mov r0, #8
    bl malloc
    mov r1, #5
    str r1, [r0]
    mov r1, #7
    str r1, [r0, #4]
    ldaia lr, ![sp]
    b lr

get_baz实现与foo类相同。

现在,如果我构造这样的对象并获得baz值:

    bl new__foo2
    ; remember: the this pointer goes to r3
    mov r3, r0
    bl foo2__get_baz

我最终得到的r0包含值7

对于virtual方法,创建了一个隐藏数据成员,它是一个指向函数表的指针:

struct base {
    virtual uint32_t get_baz() = 0;
};

struct derived : base {
    derived() : baz(5) { }
    virtual uint32_t get_baz();
    uint32_t bar;
    uint32_t baz;
};

变为

new__derived:
    strdb lr, ![sp]
    mov r0, #12
    bl malloc
    mov r1, #5
    str r1, [r0, #8]
    ; get the address of the vtable
    ldr r1, =vtable__derived
    ; vtable typically goes to the end of the class defining it
    ; as this is the base class, it goes before derived's data members
    str r1, [r0]
    ldria lr, ![sp]
    b lr

vtable__derived:
    ; pointer to function
    dw derived__get_baz

derived__get_baz:
    ldr r0, [r3, #8]
    b lr

间接完成此功能的调用:

    ; construct normally
    bl new__derived
    ; here, we forget that this is a "derived" object
    ; this pointer to r3
    mov r3, r0
    ; get vtable ptr
    ldr r0, [r3]
    ; get function ptr from vtable
    ldr r0, [r0]
    ; call function
    bl r0

在这里,r0现在是5,因为那是构造函数存储在那里的。