如果一个函数有20个指针参数(示例中只使用了4个),并且所有参数的默认值都是NULL,那是否意味着每次调用此函数时,运行时都要把这些NULL值逐个PUSH到栈上?
此类函数的示例可能如下所示:
function test(val1=NULL, val2=NULL, .... val20=NULL)
我的目标是最大限度地提高速度,并减少函数调用过程中消耗的时钟周期数。
// ArgsListTest.cpp
// @author Mathew Kurian
#include "stdafx.h"
#include <iostream>
#include <time.h>
using namespace std;
// Look at the difference in pseudo-assembly code.
// I know little about compilers, but I can see that
// there are unnecessary cycles being wasted for this part.
// **** With array (this example) *****
// LOAD Reg, memAddressOfArray
// WRITETOMEM Reg, ptrToVar1
// INCREMENT sp
// WRITETOMEM Reg, ptrToVar2
// DECREMENT sp
// PUSH ptrToArray
// JUMP test
// ***** IDEALLY SUPPOSED TO LOOK LIKE THIS *****
// PUSH ptrToVar2
// PUSH ptrToVar1
// JUMP test
// Base class for the "arguments packed into an array" calling convention:
// the caller passes a single pointer to an array of untyped argument pointers
// instead of passing each argument separately.
class Base
{
public:
    // Objects of derived classes are handled through Base* in this file, so the
    // destructor is virtual to keep deletion through a base pointer well-defined.
    virtual ~Base() {}

    // Prints a banner line followed by the int that arguments[0] points to.
    //
    // arguments: array of untyped pointers; only element 0 is read, and it is
    //            dereferenced as an int, so it must point to a valid int.
    // Returns:   always 6 (the result of the dummy arithmetic below).
    //
    // NOTE: the banner claims "there is no virtual", but this method is declared
    // virtual. The text is runtime output and is intentionally left unchanged.
    virtual int test(void* arguments[])
    {
        std::cout << "Base function being called. VTable lookup ignored since there is no virtual." << std::endl;
        std::cout << *static_cast<int*>(arguments[0]) << std::endl; // Parameter 1 (only one parameter is assumed here)
        int x = 5; x += 1; // Dummy arithmetic the author hoped would discourage optimization.
        return x;
    }
};
// Derived override used by the "array of arguments" benchmark run.
// The incoming array is not read; the body only performs dummy arithmetic.
class Derived : public Base
{
public:
    // arguments: array of untyped argument pointers (ignored by this override).
    // Returns:   always 6.
    virtual int test(void* arguments[])
    {
        // Debug output, left disabled:
        // cout << "Derived function being called. VTable lookup during runtime. Slight overhead here!" << endl;
        // cout << *static_cast<string*>(arguments[0]) << endl; // Parameter 1
        // cout << *static_cast<int*>(arguments[1]) << endl; // Parameter 2
        int result = 5;
        result = result + 1;
        return result;
    }
};
// Class for the "default parameters" and "no parameters" benchmark runs.
class Base2
{
public:
    // The class has virtual functions, so it gets a virtual destructor to keep
    // deletion through a base pointer well-defined if it is ever derived from.
    virtual ~Base2() {}

    // Accepts up to four untyped pointers, each defaulting to NULL.
    // None of the arguments is read; the body only performs dummy arithmetic.
    //
    // NOTE: default arguments on a virtual function are taken from the static
    // type at the call site, not from the overrider that ends up running.
    //
    // Returns: always 6.
    virtual int test(void* arg1 = NULL, void* arg2 = NULL, void* arg3 = NULL, void* arg4 = NULL)
    {
        // Debug output, left disabled:
        // cout << "Base2 function being called. VTable lookup ignored since there is no virtual." << endl;
        // cout << *static_cast<string*>(arg1) << endl; // Parameter 1
        // cout << *static_cast<int*>(arg2) << endl; // Parameter 2
        int x = 5; x += 1;
        return x;
    }

    // Parameterless counterpart of test(); performs the same dummy arithmetic.
    //
    // Returns: always 6.
    virtual int test2()
    {
        int x = 5; x += 1;
        return x;
    }
};
int _tmain(int argc, _TCHAR* argv[])
{
Base * base = new Derived;
Base2 * base2 = new Base2;
int r = 0;
string * str = new string("sunny");
int * vale = new int(20);
int iterations = 1000000000;
//================================================================================
printf("Using No-Parameters [%d iterations]\n", iterations);
clock_t tStart = clock();
for (int x = 0; x < iterations; x++)
{
r = base2->test2();
}
printf("Time taken: %.9fs\n", (double)(clock() - tStart) / CLOCKS_PER_SEC);
//================================================================================
printf("Using Array [%d iterations]\n", iterations);
tStart = clock();
for (int x = 0; x < iterations; x++)
{
void * arguments[] = { str, vale };
r = base->test(arguments);
}
printf("Time taken: %.9fs\n", (double)(clock() - tStart) / CLOCKS_PER_SEC);
//================================================================================
printf("Using Default-Parameters [%d iterations]\n", iterations);
tStart = clock();
for (int x = 0; x < iterations; x++)
{
r = base2->test(str, vale);
}
printf("Time taken: %.9fs\n", (double)(clock() - tStart) / CLOCKS_PER_SEC);
//================================================================================
// cout << "NOTE: Derived class has no extra methods although the parameter counts are different.\n Parent class doesn't even realize parameter 1 exists!" << endl;
std::getchar();
return 0;
}
PUSH NULL 更快?
答案 0 :(得分:2)
虚函数可能会影响您的测量结果。我把您的方法复制为全局作用域中的普通函数(即下面的 testA、testB、testC),测得的性能排序有所不同。
Using No-Parameters [1000000000 iterations]
Time taken: 24.831000000s
Using Array [1000000000 iterations]
Time taken: 24.730000000s
Using Default-Parameters [1000000000 iterations]
Time taken: 25.241000000s
Using No-Parameters [1000000000 iterations] on int testA()
Time taken: 21.664000000s
Using Array [1000000000 iterations] on int testB(void* arguments[])
Time taken: 22.384000000s
Using Default-Parameters [1000000000 iterations] int testC(void* arg1 = NULL, ...)
Time taken: 22.329000000s
编辑:
同样的测试,但把testB中的数组赋值移到了for循环之外:
Using No-Parameters [1000000000 iterations]
Time taken: 24.713000000s
Using Array [1000000000 iterations]
Time taken: 24.686000000s
Using Default-Parameters [1000000000 iterations]
Time taken: 25.225000000s
Using No-Parameters [1000000000 iterations] on int testA()
Time taken: 21.653000000s
Using Array [1000000000 iterations] on int testB(void* arguments[])
Time taken: 21.896000000s
Using Default-Parameters [1000000000 iterations] int testC(void* arg1 = NULL, ...)
Time taken: 22.353000000s
答案 1 :(得分:0)
也许。另一个简单的解决方案是拥有多个入口点:
# Pseudocode
PUSH nullptr # Default argument 20
PUSH nullptr # Default argument 19
PUSH nullptr # Default argument 18
...
ENTRYPOINT(test)
如果调用时有N个参数使用默认值,就跳转到常规入口点之前N条指令处的地址。好处:压入这些默认参数的代码现在可以由所有调用者共享。不过,这需要链接器具备一点智能。