doc/ogdf/_f_m_e_multipole_kernel_8h_source.html

#pragma once


#include <ogdf/energybased/fast_multipole_embedder/FMEFunc.h>

#include <ogdf/energybased/fast_multipole_embedder/FMEKernel.h>


namespace ogdf {

namespace fast_multipole_embedder {


//! Closed index interval [begin, end] describing one slice of an array.
/**
 * Both bounds are inclusive. A partition with begin > end is empty.
 */
struct ArrayPartition {
    uint32_t begin; //!< first index of the slice (inclusive)
    uint32_t end; //!< last index of the slice (inclusive)

    //! Invokes \p func with every index from begin up to and including end, in ascending order.
    template<typename Func>
    void for_loop(Func& func) {
        uint32_t index = begin;
        // the upper bound is inclusive, hence "<=" and not "<"
        while (index <= end) {
            func(index);
            index++;
        }
    }
};


//! Kernel of the fast multipole embedder that is executed by every worker thread.
/**
 * Besides the multipole approximation entry points, this class provides small
 * helpers to split index ranges among the threads of the pool and to sort an
 * array cooperatively.
 */
class FMEMultipoleKernel : public FMEKernel {
public:
    explicit FMEMultipoleKernel(FMEThread* pThread) : FMEKernel(pThread) { }

    //! allocate the global and local contexts used by an instance of this kernel
    static FMEGlobalContext* allocateContext(ArrayGraph* pGraph, FMEGlobalOptions* pOptions,
            uint32_t numThreads);

    //! free the global and local context
    static void deallocateContext(FMEGlobalContext* globalContext);

    //! sub procedure for quadtree construction
    void quadtreeConstruction(ArrayPartition& nodePointPartition);

    //! the single threaded version without fences
    void multipoleApproxSingleThreaded(ArrayPartition& nodePointPartition);

    //! the original algorithm which runs the WSPD completely single threaded
    void multipoleApproxSingleWSPD(ArrayPartition& nodePointPartition);

    //! new but slower method, parallel WSPD computation without using the WSPD structure
    void multipoleApproxNoWSPDStructure(ArrayPartition& nodePointPartition);

    //! the final version, the WSPD structure is only used for the top of the tree
    void multipoleApproxFinal(ArrayPartition& nodePointPartition);

    //! main function of the kernel
    void operator()(FMEGlobalContext* globalContext);

    //! creates an array partition for the calling thread with a default chunk size of 16
    inline ArrayPartition arrayPartition(uint32_t n) {
        return arrayPartition(n, threadNr(), numThreads(), 16);
    }

    //! returns an array partition for the given threadNr and thread count
    /**
     * Splits the indices 0..n-1 into consecutive slices whose length is a
     * multiple of \p chunkSize; the last thread additionally receives the
     * remainder. If \p n is smaller than numThreads * chunkSize, thread 0
     * receives the whole range and all other threads an empty partition.
     *
     * @param n          number of elements to distribute
     * @param threadNr   index of the thread the partition is computed for
     * @param numThreads total number of threads sharing the range
     * @param chunkSize  granularity of a slice
     * @return inclusive index range; empty ranges are encoded as begin = 1, end = 0
     */
    inline ArrayPartition arrayPartition(uint32_t n, uint32_t threadNr, uint32_t numThreads,
            uint32_t chunkSize) {
        ArrayPartition result;
        // start with the empty range (begin > end); overwritten below where needed
        result.begin = 1;
        result.end = 0;
        if (!n) {
            return result;
        }

        const uint32_t stride = numThreads * chunkSize;
        // stride == 0 (no threads or zero chunk size) must not reach the division
        // below; such a call is served by the "thread 0 takes everything" branch.
        if (stride != 0 && n >= stride) {
            uint32_t s = n / stride; // chunks per thread
            uint32_t o = s * chunkSize * threadNr; // offset of this thread's slice
            result.begin = o;
            if (threadNr == numThreads - 1) {
                // the last thread also takes the elements left over by the division
                result.end = n - 1;
            } else {
                result.end = o + s * chunkSize - 1;
            }
        } else if (threadNr == 0) {
            // too few elements to be worth splitting
            result.begin = 0;
            result.end = n - 1;
        }
        return result;
    }

    //! for loop on a partition
    /**
     * Calls \p func for every index in the inclusive range of \p partition;
     * does nothing for an empty partition (begin > end).
     */
    template<typename F>
    inline void for_loop(const ArrayPartition& partition, F func) {
        if (partition.begin > partition.end) {
            return;
        }
        for (uint32_t i = partition.begin; i <= partition.end; i++) {
            func(i);
        }
    }

    //! for loop on the tree partition
    /**
     * Calls \p functor for every node id stored in the tree partition of the
     * local context of this kernel.
     */
    template<typename F>
    inline void for_tree_partition(F functor) {
        for (LinearQuadtree::NodeID id : m_pLocalContext->treePartition.nodes) {
            functor(id);
        }
    }

    //! sorting single threaded
    /**
     * Only the main thread sorts; every other thread returns immediately.
     * No synchronization is performed here.
     */
    template<typename T, typename C>
    inline void sort_single(T* ptr, uint32_t n, C comparer) {
        if (isMainThread()) {
            std::sort(ptr, ptr + n, comparer);
        }
    }

    //! lazy parallel sorting for num_threads = power of two
    /**
     * Falls back to sort_single() if there is only one thread, if the array
     * has fewer than 1000 elements per thread, or if the number of threads is
     * not a power of two. The recursive overload halves the thread count on
     * every level; with any other count two threads would be assigned the
     * same sub-range and sort it concurrently.
     */
    template<typename T, typename C>
    inline void sort_parallel(T* ptr, uint32_t n, C comparer) {
        const uint32_t threads = numThreads();
        const bool powerOfTwo = threads != 0 && (threads & (threads - 1)) == 0;
        if (threads == 1 || !powerOfTwo || n < threads * 1000) {
            sort_single(ptr, n, comparer);
        } else {
            sort_parallel(ptr, n, comparer, 0, threads);
        }
    }

    //! lazy parallel sorting for num_threads = power of two
    /**
     * Recursive worker: the threads threadNrBegin .. threadNrBegin+numThreads-1
     * cooperate on sorting \p n elements starting at \p ptr. The lower half of
     * the threads sorts the first half of the array, the upper half of the
     * threads the second one; afterwards the thread \p threadNrBegin merges
     * both halves.
     *
     * \pre \p numThreads is a power of two. sync() is called once per
     * recursion level, so every participating thread has to take part in the
     * call.
     *
     * @param ptr           first element of the range to sort
     * @param n             number of elements in the range
     * @param comparer      strict weak ordering used for sorting and merging
     * @param threadNrBegin index of the first thread working on this range
     * @param numThreads    number of threads working on this range
     */
    template<typename T, typename C>
    inline void sort_parallel(T* ptr, uint32_t n, C comparer, uint32_t threadNrBegin,
            uint32_t numThreads) {
        if (n <= 1) {
            return;
        }
        if (numThreads == 1) {
            std::sort(ptr, ptr + n, comparer);
        } else {
            uint32_t half = n >> 1;
            uint32_t halfThreads = numThreads >> 1;
            if (this->threadNr() < threadNrBegin + halfThreads) {
                sort_parallel(ptr, half, comparer, threadNrBegin, halfThreads);
            } else {
                sort_parallel(ptr + half, n - half, comparer, threadNrBegin + halfThreads,
                        halfThreads);
            }

            // wait until all threads are ready.
            sync();
            // both halves are sorted now; a single thread merges them
            if (this->threadNr() == threadNrBegin) {
                std::inplace_merge(ptr, ptr + half, ptr + n, comparer);
            }
        }
    }

private:
    FMEGlobalContext* m_pGlobalContext = nullptr;
    FMELocalContext* m_pLocalContext = nullptr;
};


}

}

FMEFunc.h
Definitions of various auxiliary classes for FME layout.

FMEKernel.h
Declaration of FME kernel.

ogdf::fast_multipole_embedder::ArrayGraph
Definition ArrayGraph.h:40

ogdf::fast_multipole_embedder::FMEKernel
Definition FMEKernel.h:44

ogdf::fast_multipole_embedder::FMEKernel::isMainThread
bool isMainThread() const
returns true if this is the main thread (the main thread is always the first thread)
Definition FMEKernel.h:57

ogdf::fast_multipole_embedder::FMEKernel::threadNr
uint32_t threadNr() const
returns the index of the thread (0 .. numThreads()-1)
Definition FMEKernel.h:51

ogdf::fast_multipole_embedder::FMEKernel::numThreads
uint32_t numThreads() const
returns the total number of threads in the pool
Definition FMEKernel.h:54

ogdf::fast_multipole_embedder::FMEKernel::sync
void sync()
Definition FMEKernel.h:48

ogdf::fast_multipole_embedder::FMEMultipoleKernel
Definition FMEMultipoleKernel.h:52

ogdf::fast_multipole_embedder::FMEMultipoleKernel::arrayPartition
ArrayPartition arrayPartition(uint32_t n, uint32_t threadNr, uint32_t numThreads, uint32_t chunkSize)
returns an array partition for the given threadNr and thread count
Definition FMEMultipoleKernel.h:87

ogdf::fast_multipole_embedder::FMEMultipoleKernel::multipoleApproxSingleThreaded
void multipoleApproxSingleThreaded(ArrayPartition &nodePointPartition)
the single threaded version without fences

ogdf::fast_multipole_embedder::FMEMultipoleKernel::m_pLocalContext
FMELocalContext * m_pLocalContext
Definition FMEMultipoleKernel.h:183

ogdf::fast_multipole_embedder::FMEMultipoleKernel::allocateContext
static FMEGlobalContext * allocateContext(ArrayGraph *pGraph, FMEGlobalOptions *pOptions, uint32_t numThreads)
allocate the global and local contexts used by an instance of this kernel

ogdf::fast_multipole_embedder::FMEMultipoleKernel::sort_parallel
void sort_parallel(T *ptr, uint32_t n, C comparer)
lazy parallel sorting for num_threads = power of two
Definition FMEMultipoleKernel.h:146

ogdf::fast_multipole_embedder::FMEMultipoleKernel::sort_single
void sort_single(T *ptr, uint32_t n, C comparer)
sorting single threaded
Definition FMEMultipoleKernel.h:138

ogdf::fast_multipole_embedder::FMEMultipoleKernel::quadtreeConstruction
void quadtreeConstruction(ArrayPartition &nodePointPartition)
sub procedure for quadtree construction

ogdf::fast_multipole_embedder::FMEMultipoleKernel::m_pGlobalContext
FMEGlobalContext * m_pGlobalContext
Definition FMEMultipoleKernel.h:182

ogdf::fast_multipole_embedder::FMEMultipoleKernel::multipoleApproxNoWSPDStructure
void multipoleApproxNoWSPDStructure(ArrayPartition &nodePointPartition)
new but slower method, parallel wspd computation without using the wspd structure

ogdf::fast_multipole_embedder::FMEMultipoleKernel::FMEMultipoleKernel
FMEMultipoleKernel(FMEThread *pThread)
Definition FMEMultipoleKernel.h:54

ogdf::fast_multipole_embedder::FMEMultipoleKernel::arrayPartition
ArrayPartition arrayPartition(uint32_t n)
creates an array partition with a default chunksize of 16
Definition FMEMultipoleKernel.h:82

ogdf::fast_multipole_embedder::FMEMultipoleKernel::deallocateContext
static void deallocateContext(FMEGlobalContext *globalContext)
free the global and local context

ogdf::fast_multipole_embedder::FMEMultipoleKernel::sort_parallel
void sort_parallel(T *ptr, uint32_t n, C comparer, uint32_t threadNrBegin, uint32_t numThreads)
lazy parallel sorting for num_threads = power of two
Definition FMEMultipoleKernel.h:156

ogdf::fast_multipole_embedder::FMEMultipoleKernel::multipoleApproxFinal
void multipoleApproxFinal(ArrayPartition &nodePointPartition)
the final version, the wspd structure is only used for the top of the tree

ogdf::fast_multipole_embedder::FMEMultipoleKernel::multipoleApproxSingleWSPD
void multipoleApproxSingleWSPD(ArrayPartition &nodePointPartition)
the original algorithm which runs the WSPD completely single threaded

ogdf::fast_multipole_embedder::FMEMultipoleKernel::for_loop
void for_loop(const ArrayPartition &partition, F func)
for loop on a partition
Definition FMEMultipoleKernel.h:119

ogdf::fast_multipole_embedder::FMEMultipoleKernel::for_tree_partition
void for_tree_partition(F functor)
for loop on the tree partition
Definition FMEMultipoleKernel.h:130

ogdf::fast_multipole_embedder::FMEMultipoleKernel::operator()
void operator()(FMEGlobalContext *globalContext)
main function of the kernel

ogdf::fast_multipole_embedder::FMEThread
The fast multipole embedder work thread class.
Definition FMEThread.h:77

ogdf::fast_multipole_embedder::LinearQuadtree::NodeID
unsigned int NodeID
Definition LinearQuadtree.h:52

getDoubleFactoredZeroAdjustedMerger
static MultilevelBuilder * getDoubleFactoredZeroAdjustedMerger()
Definition multilevelmixer.cpp:36

ogdf
The namespace for all OGDF objects.
Definition AugmentationModule.h:36

ogdf::fast_multipole_embedder::ArrayPartition
Definition FMEMultipoleKernel.h:40

ogdf::fast_multipole_embedder::ArrayPartition::end
uint32_t end
Definition FMEMultipoleKernel.h:42

ogdf::fast_multipole_embedder::ArrayPartition::begin
uint32_t begin
Definition FMEMultipoleKernel.h:41

ogdf::fast_multipole_embedder::ArrayPartition::for_loop
void for_loop(Func &func)
Definition FMEMultipoleKernel.h:45

ogdf::fast_multipole_embedder::FMEGlobalContext
Global Context.
Definition FMEFunc.h:94

ogdf::fast_multipole_embedder::FMEGlobalOptions
the main global options for a run
Definition FMEFunc.h:66

ogdf::fast_multipole_embedder::FMELocalContext
Local thread Context.
Definition FMEFunc.h:115

ogdf::fast_multipole_embedder::FMELocalContext::treePartition
FMETreePartition treePartition
tree partition assigned to the thread
Definition FMEFunc.h:126

ogdf::fast_multipole_embedder::FMETreePartition::nodes
std::list< LinearQuadtree::NodeID > nodes
Definition FMEFunc.h:49