四叉树图书馆

Question

我需要在四叉树中存储10亿个空间多边形（使用其最小边界矩形指定）。为此，我编写了以下代码。然而，事实证明，对于10亿个点，代码运行速度非常慢。有没有什么方法可以改进代码，以便它可以运行得更快。如果是，那么有人可以帮助相同的

//---------------------------------------------------------------------------
struct MBR
{
    double xRight, xLeft, yBottom, yTop;
    MBR *zero,*first,*second,*third;
    unsigned level=0;
    vector<unsigned> result; //contains the resulting intersecting spatial ids
};
bool intersects(MBR& spatialId,MBR& mbr) 
{
    if (mbr.yBottom > spatialId.yTop || mbr.yTop < spatialId.yBottom) return false;
    if (mbr.xLeft > spatialId.xRight || mbr.xRight < spatialId.xLeft) return false;        
    return true;    
}
//---------------------------------------------------------------------------
bool contains(MBR& spatialId,MBR& mbr) 
{
    if (mbr.yBottom > spatialId.yBottom || mbr.yTop < spatialId.yTop) return false;
    if (mbr.xLeft > spatialId.xLeft || mbr.xRight < spatialId.xRight) return false;
    return true;    
}
//---------------------------------------------------------------------------
bool touches(MBR& spatialId,MBR& mbr) 
{
    if (    (mbr.yBottom >= spatialId.yBottom + std::numeric_limits<double>::epsilon() && 
            mbr.yBottom <= spatialId.yBottom - std::numeric_limits<double>::epsilon()) ||
            (mbr.yTop >= spatialId.yTop + std::numeric_limits<double>::epsilon() &&
            mbr.yTop <= spatialId.yTop - std::numeric_limits<double>::epsilon()))
            return true;
    if (    (mbr.xLeft >= spatialId.xLeft + std::numeric_limits<double>::epsilon() &&
            mbr.xLeft <= spatialId.xLeft - std::numeric_limits<double>::epsilon()) ||
            (mbr.xRight >= spatialId.xRight + std::numeric_limits<double>::epsilon() &&
            mbr.xRight <= spatialId.xRight - std::numeric_limits<double>::epsilon()))
            return true;    
    return false;    
}
//---------------------------------------------------------------------------
MBR MBR1,MBR2,MBR3,MBR4;
vector<unsigned> spatialIds; //contain 1 billion spatial identifiers which are intersected with MBR1, MBR2, MBR3, MBR4
//MBR1, MBR2, MBR3, MBR4 are again specified using their Minimum Bounding Rectangles    
stack<MBR**> stackQuadTree;
MBR *root=new MBR();
(*root).yBottom=-90; (*root).yTop=90;
(*root).xLeft=-180; (*root).xRight=180;
(*root).level=0;
stackQuadTree.push(&root);

while(!stackQuadTree.empty())
{
    MBR** node=&(*stackQuadTree.front());
    if((*node)->level==50)
        break;

    (*node)->zero=new MBR(); (*node)->first=new MBR(); (*node)->second=new MBR(); (*node)->third=new MBR();
    (*node)->zero->yBottom=(*node)->yBottom; (*node)->zero->yTop=((*node)->yBottom+(*node)->yTop)/2;
    (*node)->zero->xLeft=(*node)->xLeft; (*node)->zero->xRight=((*node)->xLeft+(*node)->xRight)/2;                        
    (*node)->zero->level=(*node)->level+1;

    (*node)->first->yBottom=((*node)->yBottom+(*node)->yTop)/2; (*node)->first->yTop=(*node)->yTop; 
    (*node)->first->xLeft=(*node)->xLeft; (*node)->first->xRight=((*node)->xLeft+(*node)->xRight)/2;          
    (*node)->first->level=(*node)->level+1;

    (*node)->second->yBottom=(*node)->yBottom; (*node)->second->yTop=((*node)->yBottom+(*node)->yTop)/2;
    (*node)->second->xLeft=((*node)->xLeft+(*node)->xRight)/2; (*node)->second->xRight=(*node)->xRight;        
    (*node)->second->level=(*node)->level+1;

    (*node)->third->yBottom=((*node)->yBottom+(*node)->yTop)/2; (*node)->third->yTop=(*node)->yTop;
    (*node)->third->xLeft=((*node)->xLeft+(*node)->xRight)/2; (*node)->third->xRight=(*node)->xRight;                        
    (*node)->third->level=(*node)->level+1;

    MBR* node=*stackQuadTree.top();
    stackQuadTree.pop();        
    for(vector<MBR>::iterator itSpatialId=spatialIds.begin(),lSpatialId=spatialIds.end();itSpatialId!=lSpatialId;++itSpatialId)
    {
        if(intersects((*itSpatialId),&(*node)->zero)||contains((*itSpatialId),&(*node)->zero)||touches((*itSpatialId),&(*node)->zero))
        {
            (*node)->zero->result.push_back((*itSpatialId));
            stackQuadTree.push(*(*node)->zero);
        }

        if(intersects((*itSpatialId),&(*node)->first)||contains((*itSpatialId),&(*node)->first)||touches((*itSpatialId),&(*node)->first))
        {
            (*node)->first->result.push_back((*itSpatialId));
            stackQuadTree.push(*(*node)->first);
        }                    

        if(intersects((*itSpatialId),&(*node)->second)||contains((*itSpatialId),&(*node)->second)||touches((*itSpatialId),&(*node)->second))
        {
            (*node)->second->result.push_back((*itSpatialId));
            stackQuadTree.push(*(*node)->second);
        }   

        if(intersects((*itSpatialId),&(*node)->third)||contains((*itSpatialId),&(*node)->third)||touches((*itSpatialId),&(*node)->third))
        {
            (*node)->third->result.push_back((*itSpatialId));
            stackQuadTree.push(*(*node)->third);
        }   
    }
}

Answer 1

由于要求是处理10个⁹记录，即使使用最紧凑的表示，每个记录都是16字节（4 * sizeof(float)），我们需要16 GiB才能保留这些记录记忆。由于我们希望使用多边形的边界框进行索引，因此每个边界框可能属于多个象限。如果存在大量相对较大的多边形或多个重叠，则整个四叉树的内存需求可能会显着增加。这表明了构建四叉树的迭代方法，我们使用文件来存储与每个节点匹配的边界框列表，以及整个树的节点信息。

四叉树图书馆

矩形表示

我们使用矩形来表示两件事：

多边形的边界框（即我们的输入数据）。
象限的边界框（四叉树中的节点）。

我们还需要对矩形执行一些操作，例如将它们细分为象限，或者找出一对矩形是否相交。让我们写一个简单的类来封装它。

<强> rectangle.hpp

#pragma once

#include <cstdint>

template<typename T = float>
struct rectangle_t
{
    typedef typename T value_type;

    rectangle_t() : left(0.0f), top(0.0f), right(0.0f), bottom(0.0f) {}
    rectangle_t(value_type x1, value_type y1, value_type x2, value_type y2)
        : left(x1), top(y1), right(x2), bottom(y2)
    {
    }

    bool intersects(rectangle_t<T> const& other) const;
    bool contains(rectangle_t<T> const& other) const;
    bool touches(rectangle_t<T> const& other) const;
    rectangle_t<T> quadrant(uint32_t n) const;

    value_type left, top, right, bottom;
};

template<typename T>
inline bool rectangle_t<T>::intersects(rectangle_t<T> const& other) const
{
    return !((left > other.right)
        || (right < other.left)
        || (top > other.bottom)
        || (bottom < other.top));
}

template<typename T>
inline bool rectangle_t<T>::contains(rectangle_t<T> const& other) const
{
    return !((left >= other.left)
        || (right <= other.right)
        || (top >= other.top)
        || (bottom <= other.bottom));
}

template<typename T>
inline bool rectangle_t<T>::touches(rectangle_t<T> const& other) const
{
    return ((left == other.right)
        || (right == other.left)
        || (top == other.bottom)
        || (bottom == other.top));
}

template<typename T>
inline rectangle_t<T> rectangle_t<T>::quadrant(uint32_t n) const
{
    value_type const center_x((left + right) / 2);
    value_type const center_y((top + bottom) / 2);
    switch (n & 0x03) {
    case 0: return rectangle_t<T>(left, top, center_x, center_y);
    case 1: return rectangle_t<T>(center_x, top, right, center_y);
    case 2: return rectangle_t<T>(left, center_y, center_x, bottom);
    case 3: return rectangle_t<T>(center_x, center_y, right, bottom);
    }
    return *this; // Can't happen since we mask n
}

typedef rectangle_t<float> rectangle;

注意：虽然我们还提供方法contains()和touches()，但我们并不真正需要它们 - 如果矩形A包含矩形B，那么两者也相交。类似地，如果两个矩形具有重叠的一对边，则它们也被认为是相交的。

矩形序列化

下一步是开发一种将矩形存储在文件中的简单方法。我们可以使用简单的二进制文件，其布局与对象在内存中的表示方式相对应。

该文件包含单个对象序列，没有标题或其他任何内容。

由于我们希望以块的形式处理数据，因此我们实现了提供此功能的简单 reader 和 writer 类。

<强> rectangle_file.hpp

#pragma once

#include "rectangle.hpp"
#include "config.hpp"

#include <fstream>
#include <string>
#include <vector>

typedef std::vector<rectangle> rectangle_vec;

class rectangle_writer
{
public:
    rectangle_writer(std::string const& file_name);
    rectangle_writer(rectangle_writer const&) = delete;

    void write_block(rectangle_vec const& block);

    uint64_t count() const { return count_; }

private:
    std::ofstream f_;
    uint64_t count_;
};

class rectangle_reader
{
public:
    rectangle_reader(std::string const& file_name);
    rectangle_reader(rectangle_reader const&) = delete;

    void read_block(rectangle_vec& block, uint64_t n = BLOCK_SIZE);

    uint64_t count() const { return count_; }
    uint64_t total_count() const { return total_count_; }
    uint64_t remaining_count() const { return total_count_ - count_; }

private:
    std::ifstream f_;
    uint64_t count_;
    uint64_t total_count_;
};

<强> rectangle_file.cpp

#include "rectangle_file.hpp"

#include <algorithm>

rectangle_writer::rectangle_writer(std::string const& file_name)
    : f_(file_name, std::ios_base::binary)
    , count_(0)
{
    if (!f_) {
        throw std::runtime_error("Unable to open index file.");
    }
}

void rectangle_writer::write_block(rectangle_vec const& block)
{
    f_.write(reinterpret_cast<char const*>(&block[0])
        , block.size() * sizeof(rectangle));
    count_ += static_cast<uint32_t>(block.size());
    if (!f_) {
        throw std::runtime_error("Read error.");
    }
}

rectangle_reader::rectangle_reader(std::string const& file_name)
    : f_(file_name, std::ios_base::binary)
    , count_(0)
{
    f_.seekg(0, std::ios::end);
    total_count_ = static_cast<uint32_t>(f_.tellg() / sizeof(rectangle));
    f_.seekg(0, std::ios::beg);
}

void rectangle_reader::read_block(rectangle_vec& block, uint64_t n)
{
    uint64_t to_read(std::min(remaining_count(), n));
    block.resize(to_read);
    if (to_read) {
        f_.read(reinterpret_cast<char*>(&block[0])
            , to_read * sizeof(rectangle));
        count_ += to_read;
        if (!f_) {
            throw std::runtime_error("Write error.");
        }
    }
}

四叉树代表

由于我们可能使用大量节点，我们将所有节点保留在一个数组中，而不是指针使用节点索引来表示层次结构。节点的索引由它在数组中的位置决定，因此我们不需要明确地存储它。

我们使用紧凑结构（node_info）来表示相关的节点信息：

定义象限边界框的矩形。
子节点的4个索引的数组。（我们使用32位索引，将我们限制在约40亿个节点）

每个节点的匹配矩形列表存储在一个数据文件中，该文件根据节点索引（node_XXXXXXXX.dat）命名。

Node Flyweight

为了封装四叉树的表示，并公开一个熟悉的界面来操作它，我们创建一个flyweight类node，持有对quadtree的引用，节点的索引，和树中的当前级别（16字节）。此类提供构建和使用四叉树所需的所有功能：

读取和书写边界框。
读取和编写匹配矩形列表。
访问子节点，节点索引，当前级别......
添加子节点

<强> quadtree.hpp

#pragma once

#include "rectangle.hpp"
#include "rectangle_file.hpp"

#include <string>
#include <vector>

class quadtree
{
public:
    class node
    {
    public:
        rectangle& bounds();
        rectangle const& bounds() const;

        node child(uint32_t i) const;

        rectangle_reader reader() const;
        rectangle_writer writer() const;

        std::string rectangle_file_name() const;

        void add_child_nodes() const;

        bool is_leaf_node() const;

        uint32_t index() const;
        uint32_t level() const;

    private:
        friend class quadtree;
        node(quadtree& tree, uint32_t index, uint32_t level);

        quadtree& tree_;
        uint32_t index_;
        uint32_t level_;
    };

public:
    enum {
        ROOT_NODE_INDEX = 0
        , QUADRANT_COUNT = 4
    };

    quadtree(quadtree&& other);
    ~quadtree();

    static quadtree create(std::string const& dir_name
        , rectangle const& bounds);
    static quadtree load(std::string const& dir_name);

    void save();

    node get_node(uint32_t i = ROOT_NODE_INDEX);
    uint32_t node_count() const;

private:
    quadtree(std::string const& dir_name);
    std::string index_file_name() const;

    uint32_t add_node(rectangle const& bounds);
    void add_child_nodes(uint32_t n);

private:
    struct node_info
    {
        node_info();
        explicit node_info(rectangle const& bounds);

        rectangle bounds;
        uint32_t child[4];
    };
    typedef std::vector<node_info> node_list;

    std::string dir_name_;
    node_list nodes_;
};

inline quadtree::node::node(quadtree& tree, uint32_t index, uint32_t level)
    : tree_(tree)
    , index_(index)
    , level_(level)
{
}

inline rectangle& quadtree::node::bounds()
{
    return tree_.nodes_[index_].bounds;
}

inline rectangle const& quadtree::node::bounds() const
{
    return tree_.nodes_[index_].bounds;
}

inline quadtree::node quadtree::node::child(uint32_t i) const
{
    return node(tree_, tree_.nodes_[index_].child[i], level_ + 1);
}

inline bool quadtree::node::is_leaf_node() const
{
    return !((tree_.nodes_[index_].child[0])
        || (tree_.nodes_[index_].child[1])
        || (tree_.nodes_[index_].child[2])
        || (tree_.nodes_[index_].child[3]));
}

inline uint32_t quadtree::node::index() const
{
    return index_;
}

inline uint32_t quadtree::node::level() const
{
    return level_;
}

四叉树序列化

磁盘上的布局再次对应于对象在内存中的表示方式。

节点文件是一个包含单个对象序列的简单二进制文件：

为了说明，这是如何在磁盘上出现具有1000个矩形的3级四叉树（root + 2级子级）：

配置

<强> config.hpp

#pragma once

#define BLOCK_SIZE (1024 * 8)

#define QUADTREE_LOGGING 0
#define WORKQUEUE_LOGGING 0
#define PROGRESS_LOGGING 1

的处理

我们的处理基于以下观察：

只有根节点的树仍然是有效的树。
我们可以细分任何有效的树，以获得更详细分类的更深层树。

四叉树初始化

最初的步骤是创建最简单的有效四叉树：一个只有根节点，包含所有边界框。

由于我没有可以使用的任何数据，我编写了一个简单的生成器，它创建了一个可配置数量的随机矩形，并使用它们来初始化树。

<强> gen_rnd_tree.cpp

#include "rectangle.hpp"
#include "rectangle_file.hpp"
#include "quadtree.hpp"
#include "config.hpp"

#include <algorithm>
#include <cstdint>
#include <chrono>
#include <iostream>
#include <random>
#include <vector>

#if defined(_WIN32)
#include <direct.h>
#endif

void generate_random(uint32_t n, quadtree& qt)
{
    rectangle_writer writer(qt.get_node().writer());

    std::vector<rectangle> buffer;
    buffer.reserve(BLOCK_SIZE);

    std::random_device rd;
    std::mt19937 gen(rd());
    std::uniform_real_distribution<rectangle::value_type> dis_x(-179.5f, 179.5f);
    std::uniform_real_distribution<rectangle::value_type> dis_y(-89.5f, 89.5f);
    std::exponential_distribution<rectangle::value_type> dis_wh(1.0f);

    for (uint32_t i(0); i < n; ++i) {
        rectangle::value_type x(dis_x(gen));
        rectangle::value_type y(dis_y(gen));
        rectangle::value_type half_w(std::min(dis_wh(gen), 10.0f) * 0.05f);
        rectangle::value_type half_h(std::min(dis_wh(gen), 10.0f) * 0.05f);
        buffer.emplace_back(x - half_w, y - half_h, x + half_w, y + half_h);

        if (buffer.size() >= BLOCK_SIZE) {
            writer.write_block(buffer);
            buffer.clear();
#if(PROGRESS_LOGGING)
            std::cout << ".";
#endif
        }
    }

    if (!buffer.empty()) {
        writer.write_block(buffer);
    }
#if(PROGRESS_LOGGING)
    std::cout << ".\n";
#endif
}

int main(int argc, char* argv[])
{
    using std::chrono::high_resolution_clock;
    using std::chrono::duration_cast;
    using std::chrono::microseconds;

    if (argc != 2) return -1;

    std::string const TREE_DIR("tree");

#if defined(_WIN32)
    _mkdir(TREE_DIR.c_str());
#else 
    mkdir(TREE_DIR.c_str(), 0777);
#endif

    uint32_t const N_POLYGONS(atoi(argv[1]));

    std::cout << "Polygon count = " << N_POLYGONS << "\n";
    std::cout << "Polygon size = " << sizeof(rectangle) << " B\n";
    std::cout << "Total size = " << N_POLYGONS * sizeof(rectangle) << " B\n";

    std::cout << "\nGenerating...\n";

    high_resolution_clock::time_point t1 = high_resolution_clock::now();

    quadtree qt(quadtree::create("tree", rectangle(-180,-90,180,90)));

    generate_random(N_POLYGONS, qt);

    high_resolution_clock::time_point t2 = high_resolution_clock::now();

    std::cout << "\n";

    double dt1_us(static_cast<double>(duration_cast<microseconds>(t2 - t1).count()));
    std::cout << "Generate: " << (dt1_us / 1000.0) << " ms\n";
    std::cout << "\nDone.\n\n";
    return 0;
}

四叉树细分

函数subdivide(quadtree& qt,...)使用堆栈执行树的深度优先遍历。我们可以使用队列进行广度优先遍历，但是一旦我们在树中足够深，队列就会变得非常大。

我们反复使用堆栈顶部的节点，尝试细分它们，并将它们的子节点推送到堆栈上。

函数subdivide(quadtree::node const& qtn, ...)决定是否细分给定节点，并为copy_elements(...)准备参数。一旦节点被细分，并且所有匹配的矩形都已移动到子节点，我们清除给定节点的矩形文件。

函数copy_elements(...)从父节点读取匹配矩形的列表，并将它们复制到它们相交的边界框的所有子节点。

#include "rectangle.hpp"
#include "rectangle_file.hpp"
#include "quadtree.hpp"

#include <algorithm>
#include <cstdint>
#include <chrono>
#include <iostream>
#include <stack>

using std::chrono::high_resolution_clock;
using std::chrono::duration_cast;
using std::chrono::microseconds;

void copy_elements(rectangle_reader& reader, quadtree::node child_node[4])
{
    rectangle target[quadtree::QUADRANT_COUNT] {
         child_node[0].bounds()
        , child_node[1].bounds()
        , child_node[2].bounds()
        , child_node[3].bounds()
    };

    rectangle_writer writer[quadtree::QUADRANT_COUNT] {
        child_node[0].writer()
        , child_node[1].writer()
        , child_node[2].writer()
        , child_node[3].writer()
    };

    rectangle_vec buffer_in;
    buffer_in.reserve(BLOCK_SIZE);
    rectangle_vec buffer_out[quadtree::QUADRANT_COUNT];
    for (auto& buffer : buffer_out) {
        buffer.reserve(BLOCK_SIZE);
    }

#if(PROGRESS_LOGGING)
    for (; reader.remaining_count(); std::cout << ".") {
#else
    for (; reader.remaining_count();) {
#endif
        reader.read_block(buffer_in, BLOCK_SIZE);

        for (auto const& rect : buffer_in) {
            for (uint32_t i(0); i < quadtree::QUADRANT_COUNT; ++i) {
                if (target[i].intersects(rect)) {
                    buffer_out[i].push_back(rect);
                }
            }
        }

        for (uint32_t i(0); i < quadtree::QUADRANT_COUNT; ++i) {
            if (!buffer_out[i].empty()) {
                writer[i].write_block(buffer_out[i]);
                buffer_out[i].clear();
            }
        }
    }
}

// Return true if we should subdivide further, false otherwise
bool subdivide(quadtree::node const& qtn, uint32_t max_depth, uint32_t max_leaf_size)
{
    bool at_max_depth(qtn.level() >= max_depth);
    std::cout << (at_max_depth ? "Skipping" : "Subdividing")
        << " node #" << qtn.index() << " @ level " << qtn.level() << ".\n";
    if (at_max_depth) {
        return false;
    } else {
        // Make sure reader goes out of scope before writer is created.
        rectangle_reader reader(qtn.reader());
        if (qtn.is_leaf_node()) {
            if (reader.total_count() <= max_leaf_size) {
                std::cout << "Leaf node (" << reader.total_count() << ").\n";
                return false;
            }
            qtn.add_child_nodes();
        } else if (!reader.total_count()) {
            std::cout << "Branch node.\n";
            return (qtn.level() < max_depth);
        }

        quadtree::node child_nodes[4] {
            qtn.child(0)
            , qtn.child(1)
            , qtn.child(2)
            , qtn.child(3)
        };

        high_resolution_clock::time_point t1(high_resolution_clock::now());

        copy_elements(reader, child_nodes);

        high_resolution_clock::time_point t2(high_resolution_clock::now());
        double dt_us(static_cast<double>(duration_cast<microseconds>(t2 - t1).count()));

        std::cout << ". (" << reader.count() << ") " << (dt_us / 1000.0) << " ms\n";
    }

    rectangle_writer writer(qtn.writer()); // Clean the file

    std::cout << "Branch node.\n";
    return (qtn.level() < max_depth);
}

void subdivide(quadtree& qt, uint32_t max_depth, uint32_t max_leaf_size)
{
    std::stack<quadtree::node> work;
    work.emplace(qt.get_node());
    std::size_t max_queue_size(work.size());

    for (; !work.empty();) {
        quadtree::node node(work.top());
        work.pop();

        if (subdivide(node, max_depth, max_leaf_size)) {
            for (uint32_t i(0); i < quadtree::QUADRANT_COUNT; ++i) {
                work.emplace(node.child(i));
            }
        }
        max_queue_size = std::max(max_queue_size, work.size());
#if(WORKQUEUE_LOGGING)
        std::cout << "* Work queue " << work.size() << " (" << max_queue_size << ").\n";
#endif
    }
}

int main(int argc, char* argv[])
{
    uint32_t const MAX_DEPTH(atoi((argc >= 2) ? argv[1] : "2"));
    uint32_t const MAX_LEAF_SIZE(atoi((argc >= 3) ? argv[2] : "100"));

    std::cout << "Loading...\n";

    high_resolution_clock::time_point t1(high_resolution_clock::now());

    quadtree qt(quadtree::load("tree"));

    if (qt.node_count() < 1) {
        std::cerr << "Invalid tree.\n";
        return -1;
    }

    std::cout << "Building tree (max_depth=" << MAX_DEPTH
        << ", max_leaf_size=" << MAX_LEAF_SIZE << ")...\n";

    high_resolution_clock::time_point t2(high_resolution_clock::now());

    subdivide(qt, MAX_DEPTH, MAX_LEAF_SIZE);

    high_resolution_clock::time_point t3(high_resolution_clock::now());

    std::cout << "\n";

    std::cout << "Tree completed (" << qt.node_count() << " nodes).\n\n";

    double dt1_us(static_cast<double>(duration_cast<microseconds>(t2 - t1).count()));
    double dt2_us(static_cast<double>(duration_cast<microseconds>(t3 - t2).count()));
    std::cout << "Load: " << (dt1_us / 1000.0) << " ms\n";
    std::cout << "Process: " << (dt2_us / 1000.0) << " ms\n";
    std::cout << "\nDone.\n\n";
    return 0;
}

用法

gen_rnd_tree <count> - 在根节点中使用 count 矩形生成树。
build_tree <max_depth> <max_node_size> - 细分 max_node_size 矩形的节点，深度 max_depth （root位于深度0处）。

样本输出

Polygon count = 1000
Polygon size = 16 B
Total size = 16000 B

Generating...
.

Generate: 0 ms

Done.

Loading...
Building tree (max_depth=5, max_leaf_size=100)...
Subdividing node #0 @ level 0.
.. (1000) 15.624 ms
Branch node.
Subdividing node #4 @ level 1.
.. (288) 15.625 ms
Branch node.
Subdividing node #8 @ level 2.
Leaf node (71).
Subdividing node #7 @ level 2.
Leaf node (59).
Subdividing node #6 @ level 2.
Leaf node (81).
Subdividing node #5 @ level 2.
Leaf node (77).
Subdividing node #3 @ level 1.
.. (212) 0 ms
Branch node.
Subdividing node #12 @ level 2.
Leaf node (46).
Subdividing node #11 @ level 2.
Leaf node (55).
Subdividing node #10 @ level 2.
Leaf node (55).
Subdividing node #9 @ level 2.
Leaf node (58).
Subdividing node #2 @ level 1.
.. (260) 15.626 ms
Branch node.
Subdividing node #16 @ level 2.
Leaf node (68).
Subdividing node #15 @ level 2.
Leaf node (69).
Subdividing node #14 @ level 2.
Leaf node (71).
Subdividing node #13 @ level 2.
Leaf node (53).
Subdividing node #1 @ level 1.
.. (240) 0 ms
Branch node.
Subdividing node #20 @ level 2.
Leaf node (68).
Subdividing node #19 @ level 2.
Leaf node (60).
Subdividing node #18 @ level 2.
Leaf node (62).
Subdividing node #17 @ level 2.
Leaf node (50).

Tree completed (21 nodes).

Load: 0 ms
Process: 109.377 ms

Done.

当尝试使用10个⁸矩形，64k记录的BLOCK_SIZE时，构建一个max_depth为6的树花了大约45秒。这已经为节点提供了大约。使用内存算法可以轻松处理的10个⁵项目。

程序在整个过程中只使用了几个MiB的RAM。

进一步改进

错误检查，单元测试（我不能在这里填写代码）。
将元数据添加到矩形文件中，以便您可以找到它们匹配的多边形。我会保持记录的大小为16字节（对齐）的倍数。
并行
- 互斥用于同步quadtree，互斥锁以同步stack，线程池以运行for (; !work.empty();) { ...循环。
- 由于我们只在细分后推送子节点，因此每个线程将始终在树的孤立部分上工作。
混合方法
- 磁盘I / O成为此类处理的瓶颈。一旦我们得到足够小的节点（例如10个⁵ - 10 ⁶条目），我们就可以方便地在内存中处理数据。
- 使用此算法中的节点列表作为查找来加载＆＃34; small＆＃34;内存四叉树。实施缓存机制，以保持最近的查找＆＃34;小＆＃34;四叉树可用。
矢量化（可能会加速匹配大量的矩形）。

Answer 2

log2（10亿）约为30

为了减少您的操作次数，请考虑更快速到达正确邻居的数据结构。

例如，如果您知道您的对象位于10km x 10km的网格内，请考虑将其分解为10x10网格（1kmx1km）然后，任何属于特定网格的对象都可以立即跳转到1％的对象（假设它们均匀分布）。

显然，你可以有一个递归结构，但你真的不需要超过一个或两个10x10分割。为什么不尝试顶级，每个子网格是四叉树？

我也注意到你有一个奇怪的结构：

mbr.yTop >= spatialId.yTop + std::numeric_limits<double>::epsilon()

我认为您可以将其简化为：

spatialId.yTop < mbr.yTop

这是浮点分辨率的定义，不是吗？如果我是对的，这应该会加速你的代码，但这只是一个不变的因素。

class Grid {
private:
  stackQuadTree qt[100]; // 10x10 array of quadtrees
public:
  Grid(double xmin, double xmax, double ymin, double ymax) {
    // store your 10x10 grid in the grid object
    gridSizeX = 1/10 of the size of grid in the x
    gridSizeY = 1/10 of the size of grid in the y
  }

  stackQuadTree& findGrid(MBR& mbr) {
    int i = (mbr.xLeft - xmin) / gridSizeX;
    int j = (mbr.yTop - ymin) / gridSizeY;
    return qt[i*10+j];
  }

  void add(MBR& mbr) {
    // add the right quadtree and add the object in
  }
};

Answer 3

嗯，有几个主角：

您可以在不改变结构的情况下加速代码
您可以加快代码更改结构，以便成为多线程，因此您将使用计算机的多个核心。
最佳解决方案是应用1然后再应用2.

1）

a- sizeof(MBR)应该提供76字节+向量dyn内存空间，因此应删除intersects，touches和contains中复制的所有对象。使用bool myfunc(const MBR & spatialId, const MBR & mbr)代替3种方法myfunc={intersects, touches , contains}.

B- 将std::numeric_limits<double>::epsilon()存储在const变量中。编译器会喜欢它！

2）

多线程化过程主要是对内部for循环进行并列化。一种简单的方法是使用OpenMP。

尝试使用for指令包围#pragma循环，类似：

#pragma omp parallel for
for(vector<MBR>::iterator itSpatialId=spatialIds.begin(),lSpatialId=spatialIds.end();itSpatialId!=lSpatialId;++itSpatialId)
{
   // ....
}
#pragma omp barrier

但这还不够，因为会同时访问某些共享数据（导致崩溃）。所以你必须使用lock / mutex / atomics来保护stackQuadTree上的MBR::result和push_back

在四叉树中存储十亿个多边形

3 个答案:

四叉树图书馆

矩形表示

矩形序列化

四叉树代表

Node Flyweight

四叉树序列化

配置

的处理

四叉树初始化

四叉树细分

用法

样本输出

进一步改进