C++:是否有比 boost::object_pool 更快的堆分配/释放机制可用?
本周我发现了 boost::object_pool,并惊讶地发现它比普通的 new 和 delete 快 20-30%。(标签:c++, boost)
为了测试,我编写了一个小型 C++ 应用程序,它使用 boost::chrono 为不同的堆分配/释放方式(shared_ptr 等)计时。每个函数本身只是一个简单的循环,使用 “new” 和 “delete” 迭代 6000 万次。代码如下:
#include <iostream>
#include <memory>
using std::shared_ptr;
#include <boost/smart_ptr.hpp>
#include <boost/chrono.hpp>
#include <boost/chrono/chrono_io.hpp>
#include <boost/pool/object_pool.hpp>
#include <SSVUtils/SSVUtils.h>
#include "TestClass.h"
// Iteration count used by every benchmark loop in this file (60 million).
const long lTestRecursion = 60000000L;
void WithSmartPtrs()
{
boost::chrono::system_clock::time_point startTime = boost::chrono::system_clock::now();
std::cout << "Start time: " << startTime << std::endl;
for (long i=0; i < lTestRecursion; ++i)
{
boost::shared_ptr<TestClass> spTC = boost::make_shared<TestClass>("Test input data!");
}
boost::chrono::system_clock::time_point endTime = boost::chrono::system_clock::now();
std::cout << "End time: " << endTime << std::endl;
boost::chrono::duration<double> d = endTime - startTime;
std::cout << "Duration: " << d << std::endl;
}
void WithSTDSmartPtrs()
{
boost::chrono::system_clock::time_point startTime = boost::chrono::system_clock::now();
std::cout << "Start time: " << startTime << std::endl;
for (long i=0; i < lTestRecursion; ++i)
{
std::shared_ptr<TestClass> spTC = std::make_shared<TestClass>("Test input data!");
}
boost::chrono::system_clock::time_point endTime = boost::chrono::system_clock::now();
std::cout << "End time: " << endTime << std::endl;
boost::chrono::duration<double> d = endTime - startTime;
std::cout << "Duration: " << d << std::endl;
}
// Function object that releases a T by applying `delete` to the pointer it is
// given. Intended as the deleter argument of a smart pointer.
template <class T>
struct Deleter
{
    // Destroys and frees the object `object` points to.
    void operator()(T* object)
    {
        delete object;
    }
};
void WithSmartPtrsUnique()
{
boost::chrono::system_clock::time_point startTime = boost::chrono::system_clock::now();
std::cout << "Start time: " << startTime << std::endl;
for (long i=0; i < lTestRecursion; ++i)
{
boost::unique_ptr<TestClass, Deleter<TestClass> > spTC = boost::unique_ptr<TestClass, Deleter<TestClass> >(new TestClass("Test input data!"));
}
boost::chrono::system_clock::time_point endTime = boost::chrono::system_clock::now();
std::cout << "End time: " << endTime << std::endl;
boost::chrono::duration<double> d = endTime - startTime;
std::cout << "Duration: " << d << std::endl;
}
void WithSmartPtrsNoMakeShared()
{
boost::chrono::system_clock::time_point startTime = boost::chrono::system_clock::now();
std::cout << "Start time: " << startTime << std::endl;
for (long i=0; i < lTestRecursion; ++i)
{
boost::shared_ptr<TestClass> spTC = boost::shared_ptr<TestClass>( new TestClass("Test input data!"));
}
boost::chrono::system_clock::time_point endTime = boost::chrono::system_clock::now();
std::cout << "End time: " << endTime << std::endl;
boost::chrono::duration<double> d = endTime - startTime;
std::cout << "Duration: " << d << std::endl;
}
void WithoutSmartPtrs()
{
boost::chrono::system_clock::time_point startTime = boost::chrono::system_clock::now();
std::cout << "Start time: " << startTime << std::endl;
for (long i=0; i < lTestRecursion; ++i)
{
TestClass* pTC = new TestClass("Test input data!");
delete pTC;
}
boost::chrono::system_clock::time_point endTime = boost::chrono::system_clock::now();
std::cout << "End time: " << endTime << std::endl;
boost::chrono::duration<double> d = endTime - startTime;
std::cout << "Duration: " << d << std::endl;
}
void WithObjectPool()
{
boost::chrono::system_clock::time_point startTime = boost::chrono::system_clock::now();
std::cout << "Start time: " << startTime << std::endl;
{
boost::object_pool<TestClass> pool;
for (long i=0; i < lTestRecursion; ++i)
{
TestClass* pTC = pool.construct("Test input data!");
pool.destroy(pTC);
}
}
boost::chrono::system_clock::time_point endTime = boost::chrono::system_clock::now();
std::cout << "End time: " << endTime << std::endl;
boost::chrono::duration<double> d = endTime - startTime;
std::cout << "Duration: " << d << std::endl;
}
void WithObjectPoolNoDestroy()
{
boost::chrono::system_clock::time_point startTime = boost::chrono::system_clock::now();
std::cout << "Start time: " << startTime << std::endl;
//{
boost::object_pool<TestClass> pool;
for (long i=0; i < lTestRecursion; ++i)
{
TestClass* pTC = pool.construct("Test input data!");
//pool.destroy(pTC);
}
//}
boost::chrono::system_clock::time_point endTime = boost::chrono::system_clock::now();
std::cout << "End time: " << endTime << std::endl;
boost::chrono::duration<double> d = endTime - startTime;
std::cout << "Duration: " << d << std::endl;
}
void WithSSVUtilsPreAllocDyn()
{
boost::chrono::system_clock::time_point startTime = boost::chrono::system_clock::now();
std::cout << "Start time: " << startTime << std::endl;
{
ssvu::PreAlloc::PreAllocDyn preAllocatorDyn(1024*1024);
for (long i=0; i < lTestRecursion; ++i)
{
TestClass* pTC = preAllocatorDyn.create<TestClass>("Test input data!");
preAllocatorDyn.destroy(pTC);
}
}
boost::chrono::system_clock::time_point endTime = boost::chrono::system_clock::now();
std::cout << "End time: " << endTime << std::endl;
boost::chrono::duration<double> d = endTime - startTime;
std::cout << "Duration: " << d << std::endl;
}
void WithSSVUtilsPreAllocStatic()
{
boost::chrono::system_clock::time_point startTime = boost::chrono::system_clock::now();
std::cout << "Start time: " << startTime << std::endl;
{
ssvu::PreAlloc::PreAllocStatic<TestClass> preAllocatorStat(10);
for (long i=0; i < lTestRecursion; ++i)
{
TestClass* pTC = preAllocatorStat.create<TestClass>("Test input data!");
preAllocatorStat.destroy(pTC);
}
}
boost::chrono::system_clock::time_point endTime = boost::chrono::system_clock::now();
std::cout << "End time: " << endTime << std::endl;
boost::chrono::duration<double> d = endTime - startTime;
std::cout << "Duration: " << d << std::endl;
}
// Entry point: runs every benchmark in a fixed order, printing a banner line
// before each one and a blank separator line between consecutive benchmarks.
// WithSmartPtrsUnique is not part of the run. Always returns 0.
int main()
{
    // One benchmark: the banner printed before it and the function to call.
    struct Scenario
    {
        const char* banner;
        void (*run)();
    };

    const Scenario scenarios[] = {
        { " With OUT smartptrs (new and delete): ", &WithoutSmartPtrs },
        { " With smartptrs (boost::shared_ptr withOUT make_shared): ", &WithSmartPtrsNoMakeShared },
        { " With smartptrs (boost::shared_ptr with make_shared): ", &WithSmartPtrs },
        { " With STD smart_ptr (std::shared_ptr with make_shared): ", &WithSTDSmartPtrs },
        { " With Object Pool (boost::object_pool<>): ", &WithObjectPool },
        { " With Object Pool (boost::object_pool<>) but without destroy called!: ", &WithObjectPoolNoDestroy },
        { " With SSVUtils PreAllocDyn(1024*1024)!: ", &WithSSVUtilsPreAllocDyn },
        { " With SSVUtils PreAllocStatic(10)!: ", &WithSSVUtilsPreAllocStatic }
    };

    bool isFirst = true;
    for (const Scenario& scenario : scenarios)
    {
        // Every banner except the first is preceded by an empty line.
        if (!isFirst)
        {
            std::cout << std::endl;
        }
        isFirst = false;

        std::cout << scenario.banner << std::endl;
        scenario.run();
    }

    return 0;
}
结果包括我的MacBook Pro上的SSVUtils PreAllocDyn:
编译时使用:
g++-mp-4.8 -I$BOOSTHOME/include -I$SSVUTILSHOME/include -std=c++11 -O2 -L$BOOSTHOME/lib -lboost_system -lboost_chrono -o smartptrtest smartptr.cpp
With OUT smartptrs (new and delete):
Start time: 1381596718412786000 nanoseconds since Jan 1, 1970
End time: 1381596731642044000 nanoseconds since Jan 1, 1970
Duration: 13.2293 seconds
With smartptrs (boost::shared_ptr withOUT make_shared):
Start time: 1381596731642108000 nanoseconds since Jan 1, 1970
End time: 1381596753651561000 nanoseconds since Jan 1, 1970
Duration: 22.0095 seconds
With smartptrs (boost::shared_ptr with make_shared):
Start time: 1381596753651611000 nanoseconds since Jan 1, 1970
End time: 1381596768909452000 nanoseconds since Jan 1, 1970
Duration: 15.2578 seconds
With STD smart_ptr (std::shared_ptr with make_shared):
Start time: 1381596768909496000 nanoseconds since Jan 1, 1970
End time: 1381596785500599000 nanoseconds since Jan 1, 1970
Duration: 16.5911 seconds
With Object Pool (boost::object_pool<>):
Start time: 1381596785500638000 nanoseconds since Jan 1, 1970
End time: 1381596793484515000 nanoseconds since Jan 1, 1970
Duration: 7.98388 seconds
With Object Pool (boost::object_pool<>) but without destroy called!:
Start time: 1381596793484551000 nanoseconds since Jan 1, 1970
End time: 1381596805774318000 nanoseconds since Jan 1, 1970
Duration: 12.2898 seconds
With SSVUtils PreAllocDyn(1024*1024)!:
Start time: 1381596815742696000 nanoseconds since Jan 1, 1970
End time: 1381596824173405000 nanoseconds since Jan 1, 1970
Duration: 8.43071 seconds
With SSVUtils PreAllocStatic(10)!:
Start time: 1381596824173448000 nanoseconds since Jan 1, 1970
End time: 1381596832034965000 nanoseconds since Jan 1, 1970
Duration: 7.86152 seconds
g++-mp-4.8 -I$BOOSTHOME/include -I$SSVUTILSHOME/include -std=c++11 -O2 -L$BOOSTHOME/lib -lboost_system -lboost_chrono -o smartptrtest smartptr.cpp
不带SmartPTR(新建和删除):
开始时间:自1970年1月1日起1381596718412786000纳秒
结束时间:自1970年1月1日起1381596731642044000纳秒
持续时间:13.2293秒
使用SmartPTR(boost::shared_ptr而不使用make_shared):
开始时间:自1970年1月1日起1381596731642108000纳秒
结束时间:自1970年1月1日起1381596753651561000纳秒
持续时间:22.0095秒
使用smartptrs(boost::shared_ptr和make_shared):
开始时间:自1970年1月1日起1381596753651611000纳秒
结束时间:自1970年1月1日起1381596768909452000纳秒
持续时间:15.2578秒
使用STD smart_ptr(std::shared_ptr和make_shared):
开始时间:自1970年1月1日起1381596768909496000纳秒
结束时间:自1970年1月1日起1381596785500599000纳秒
持续时间:16.5911秒
使用对象池(boost::object_pool<>):
开始时间:自1970年1月1日起1381596785500638000纳秒
结束时间:自1970年1月1日起1381596793484515000纳秒
持续时间:7.98388秒
使用对象池(boost::object_pool<>),但不调用destroy!:
开始时间:自1970年1月1日起1381596793484551000纳秒
结束时间:自1970年1月1日起1381596805774318000纳秒
持续时间:12.2898秒
带SSVUtils PreAllocDyn(1024*1024)!:
开始时间:自1970年1月1日起1381596815742696000纳秒
结束时间:自1970年1月1日起1381596824173405000纳秒
持续时间:8.43071秒
带SSVUtils PreAllocStatic(10)!:
开始时间:自1970年1月1日起1381596824173448000纳秒
结束时间:自1970年1月1日起1381596832034965000纳秒
持续时间:7.86152秒
我的问题:
除了shared_ptr/unique_ptr/boost::object_pool之外,是否还有更多堆/分配机制可用于大型对象集的快速堆分配/解除分配
注意:我在其他机器和操作系统上也有更多的结果
编辑1:添加SSVUtils预分配结果
编辑4:添加了我的编译器命令行选项,并使用SSVUtils PreAllocStatic(10)重新测试
谢谢当我需要一个快速的新/删除机制时,我自己写的。我不得不妥协于“通用动态分配内存”的要求。这种改进使我能够准确地编写所需的代码。 简而言之-
- 在数组中不需要
- 预分配是必须的(但与任何堆一样)
- 预先分配所需对象大小的向量
分配/解除分配。例如:
MyType preMyType[1000]
- 将预分配对象的地址推送到堆栈中
- new 时:从堆栈中弹出一个地址
- 删除时-将返回的地址推回堆栈
如果您愿意,我可以详细说明,包括代码示例。我曾经有一个古怪的想法,用整数替换可用插槽数组。在这里查看:
我已经创建了一些未记录的池。您可能正在寻找
PreAllocStatic
,如果您可以避免单个项目的销毁,它可能会变得更快。竞技场分配的一种常见模式是:分配竞技场,在竞技场内分配个人,取消分配竞技场。但是,形式上不调用对象的析构函数是未定义的行为。如果您将new/delete与boosts池分配器进行比较,您是否检查了它们是否是线程安全的?new/delete必须是线程安全的,但是分配器没有,boost文档也没有说明。线程安全增加了开销。@VittorioRomeo感谢您的SSVUtils引用,我在上面的结果中添加了它。@John5342感谢您的提醒。目前线程安全还不是问题。但是,如果我们进行并行处理,它在将来可能会成为一个问题。p.s使其运行速度比常规的new/delete快2-4倍。基准也是一个问题……如果分配了异构对象,您是否处理对齐?这不是很乏味吗?@C.R同一堆栈中没有异构对象。每个类都有自己的运算符new()和运算符delete()。每种类型我都有一个堆栈。
g++-mp-4.8 -I$BOOSTHOME/include -I$SSVUTILSHOME/include -std=c++11 -O2 -L$BOOSTHOME/lib -lboost_system -lboost_chrono -o smartptrtest smartptr.cpp
With OUT smartptrs (new and delete):
Start time: 1381596718412786000 nanoseconds since Jan 1, 1970
End time: 1381596731642044000 nanoseconds since Jan 1, 1970
Duration: 13.2293 seconds
With smartptrs (boost::shared_ptr withOUT make_shared):
Start time: 1381596731642108000 nanoseconds since Jan 1, 1970
End time: 1381596753651561000 nanoseconds since Jan 1, 1970
Duration: 22.0095 seconds
With smartptrs (boost::shared_ptr with make_shared):
Start time: 1381596753651611000 nanoseconds since Jan 1, 1970
End time: 1381596768909452000 nanoseconds since Jan 1, 1970
Duration: 15.2578 seconds
With STD smart_ptr (std::shared_ptr with make_shared):
Start time: 1381596768909496000 nanoseconds since Jan 1, 1970
End time: 1381596785500599000 nanoseconds since Jan 1, 1970
Duration: 16.5911 seconds
With Object Pool (boost::object_pool<>):
Start time: 1381596785500638000 nanoseconds since Jan 1, 1970
End time: 1381596793484515000 nanoseconds since Jan 1, 1970
Duration: 7.98388 seconds
With Object Pool (boost::object_pool<>) but without destroy called!:
Start time: 1381596793484551000 nanoseconds since Jan 1, 1970
End time: 1381596805774318000 nanoseconds since Jan 1, 1970
Duration: 12.2898 seconds
With SSVUtils PreAllocDyn(1024*1024)!:
Start time: 1381596815742696000 nanoseconds since Jan 1, 1970
End time: 1381596824173405000 nanoseconds since Jan 1, 1970
Duration: 8.43071 seconds
With SSVUtils PreAllocStatic(10)!:
Start time: 1381596824173448000 nanoseconds since Jan 1, 1970
End time: 1381596832034965000 nanoseconds since Jan 1, 1970
Duration: 7.86152 seconds