#include "knnCPU.h"
#include <omp.h>
#include <algorithm>

Include dependency graph for knnCPU.cpp:

Functions
std::pair< Point2D, Point2D >	GetGabarit (const std::vector< Vortex2D > &vtx)
	Computes the bounding box (minimum and maximum corners) of the vortex positions. More...

unsigned int	ExpandBits (unsigned int v)

unsigned int	Morton2D (const Point2D &r)

void	RSort_Parallel (TParticleCode *m, TParticleCode *m_temp, unsigned int n, unsigned int *s)
	Parallel byte-wise radix sort of particle codes by key. More...

size_t	BinSearch (const std::vector< std::pair< double, size_t >> &currentNN, double x, int low, int high)

void	newSort (std::vector< std::pair< double, size_t >> &mass, std::vector< std::pair< double, size_t >> &dstKeys)

void	newMerge (std::vector< std::pair< double, size_t >> &currentNN, const std::vector< std::pair< double, size_t >> &candidateNN, std::vector< size_t > &loc, std::vector< size_t > &counter, std::vector< size_t > &offset, std::vector< size_t > &counterScan, std::vector< std::pair< double, size_t >> &updateNN)

void	mainCycle (const int k, const std::vector< Vortex2D > &vtx, const std::pair< Point2D, Point2D > &gab, const double scale, const int sdvig, std::vector< TParticleCode > &mortonCodeBoth, std::vector< unsigned int > &s, std::vector< TParticleCode > &mortonCodeBoth_temp, std::vector< TParticleCode > &mcdata, std::vector< TParticleCode > &mcquery, std::vector< unsigned int > &iq, std::vector< size_t > &initneig, std::vector< std::vector< std::pair< double, size_t >>> &initdist, double *time)

void	WakekNN (const std::vector< Vortex2D > &vtx, const size_t k, std::vector< std::vector< std::pair< double, size_t >>> &initdist)

Variables
const int	codeLength = 15

const int	twoPowCodeLength = (1 << codeLength)

Function Documentation

/// Locates the merge slot of distance `x` inside the ascending range
/// currentNN[low..high] (both bounds inclusive).
///
/// Doxygen: definition at line 139 of file knnCPU.cpp.
///
/// @param currentNN  neighbour list sorted by ascending `.first` (distance)
/// @param x          distance being located
/// @param low        first index of the searched range
/// @param high       last index of the searched range
/// @return Index of the first element in [low, high] whose distance is strictly
///         greater than `x`, or `high + 1` when no such element exists.
///         Consequently, when `x` equals a stored distance, the element at
///         `result - 1` carries that same distance (this is what newMerge tests),
///         and a value larger than every stored distance maps to `high + 1`
///         (the slot newMerge discards).
///
/// An empty range (`high < low`) yields `low`.
inline size_t BinSearch(const std::vector<std::pair<double, size_t>>& currentNN, double x, int low, int high)
{
    // Nothing to search: avoid touching currentNN[high] with high == low - 1.
    if (high < low)
        return static_cast<size_t>(low);

    const auto rangeBegin = currentNN.begin() + low;
    const auto rangeEnd = currentNN.begin() + (high + 1);

    // upper_bound gives the true insertion point. Returning the last probed
    // midpoint instead can be one slot too small, and returning `high` for a
    // value above the whole range places a farther candidate in front of the
    // current farthest neighbour.
    const auto pos = std::upper_bound(rangeBegin, rangeEnd, x,
        [](double value, const std::pair<double, size_t>& entry) { return value < entry.first; });

    return static_cast<size_t>(pos - currentNN.begin());
}

Here is the caller graph for this function:

/// Spreads the 16 low bits of `v` so that one zero bit follows each of them:
/// bit i of the input ends up at bit 2*i of the result.
///
/// Doxygen: definition at line 24 of file knnCPU.cpp.
///
/// @param v  value whose low 16 bits are expanded; higher bits are ignored
/// @return   32-bit value with the input bits on even positions and zeros on odd ones
unsigned int ExpandBits(unsigned int v)
{
    // Keep only the 16 bits the diagrams below assume; without this, bits 16..23
    // of the input survive the first mask and collide with expanded bits.
    v &= 0x0000FFFF;

    // insert 1 zero after every bit
    v = (v | (v << 8)) & 0x00FF00FF;      //  00000000`00000000`abcdefgh`ijklmnop
    //                                      | 00000000`abcdefgh`ijklmnop`00000000
    //                                      = 00000000`abcdefgh`XXXXXXXX`ijklmnop
    //                                      & 00000000`11111111`00000000`11111111
    //                                      = 00000000`abcdefgh`00000000`ijklmnop

    v = (v | (v << 4)) & 0x0F0F0F0F;      //  00000000`abcdefgh`00000000`ijklmnop
    //                                      | 0000abcd`efgh0000`0000ijkl`mnop0000
    //                                      = 0000abcd`XXXXefgh`0000ijkl`XXXXmnop
    //                                      & 00001111`00001111`00001111`00001111
    //                                      = 0000abcd`0000efgh`0000ijkl`0000mnop

    v = (v | (v << 2)) & 0x33333333;      //  0000abcd`0000efgh`0000ijkl`0000mnop
    //                                      | 00abcd00`00efgh00`00ijkl00`00mnop00
    //                                      = 00abXXcd`00efXXgh`00ijXXkl`00mnXXop
    //                                      & 00110011`00110011`00110011`00110011
    //                                      = 00ab00cd`00ef00gh`00ij00kl`00mn00op

    v = (v | (v << 1)) & 0x55555555;      //  00ab00cd`00ef00gh`00ij00kl`00mn00op
    //                                      | 0ab00cd0`0ef00gh0`0ij00kl0`0mn00op0
    //                                      = 0aXb0cXd`0eXf0gXh`0iXj0kXl`0mXn0oXp
    //                                      & 01010101`01010101`01010101`01010101
    //                                      = 0a0b0c0d`0e0f0g0h`0i0j0k0l`0m0n0o0p
    return v;
}

Here is the caller graph for this function:

std::pair<Point2D, Point2D> GetGabarit ( const std::vector< Vortex2D > & vtx )

�� (�� )

Definition at line 13 of file knnCPU.cpp.

 {
     auto xx = std::minmax_element(vtx.begin(), vtx.end(), [](const Vortex2D& P1, const Vortex2D& P2) {return P1.r()[0] < P2.r()[0]; });
     auto yy = std::minmax_element(vtx.begin(), vtx.end(), [](const Vortex2D& P1, const Vortex2D& P2) {return P1.r()[1] < P2.r()[1]; });
 
     return { { xx.first->r()[0], yy.first->r()[1] }, { xx.second->r()[0], yy.second->r()[1] } };
 }

Here is the call graph for this function:

Here is the caller graph for this function:

void mainCycle	(	const int	k,
		const std::vector< Vortex2D > &	vtx,
		const std::pair< Point2D, Point2D > &	gab,
		const double	scale,
		const int	sdvig,
		std::vector< TParticleCode > &	mortonCodeBoth,
		std::vector< unsigned int > &	s,
		std::vector< TParticleCode > &	mortonCodeBoth_temp,
		std::vector< TParticleCode > &	mcdata,
		std::vector< TParticleCode > &	mcquery,
		std::vector< unsigned int > &	iq,
		std::vector< size_t > &	initneig,
		std::vector< std::vector< std::pair< double, size_t >>> &	initdist,
		double *	time
	)

Definition at line 264 of file knnCPU.cpp.

 {
     // One pass of the approximate k-nearest-neighbour search for a given shift `sdvig`:
     //   1. build Morton keys for every vortex twice (as "data" and as "query" entry),
     //   2. sort the combined array by key,
     //   3. split it back into data/query arrays and remember, for each query, the
     //      index of the data entry preceding it in sorted order,
     //   4. take a window of 2*k data entries around that index as candidates,
     //   5. sdvig == 0: initialise initdist from the candidates;
     //      otherwise:  merge the candidates into the existing initdist.
     // time[0..7] receive omp_get_wtime() stamps taken between the stages.
     //
     // NOTE(review): the window arithmetic below assumes vtx.size() >= 2*k; for smaller
     // inputs the unsigned subtractions wrap around -- confirm callers guarantee this.

     // Positions are shifted by -gab.first, scaled by 0.75/scale and offset by sdvig*0.05
     // along both axes before encoding (presumably keeps them inside the unit square for
     // every shift when scale is the bounding-box extent -- TODO confirm).
 
     time[0] = omp_get_wtime();
 #pragma omp parallel for
     for (int i = 0; i < vtx.size(); ++i)
     {
         // "data" entry: Morton key shifted left by one, lowest bit left at 0
         mortonCodeBoth[i].key = Morton2D((vtx[i].r() - gab.first) * (0.75 / scale) + sdvig * Point2D{ 0.05, 0.05 });
         mortonCodeBoth[i].key <<= 1;
         //mortonCodeBoth[i].isQuery = 0;
         mortonCodeBoth[i].originNumber = i;
 
         // "query" entry: same key with the lowest bit set to 1
         mortonCodeBoth[vtx.size() + i].key = mortonCodeBoth[i].key;// Morton2D((vtx[i].r() - gab.first) * (0.75 / scale) + sdvig * Point2D{ 0.05, 0.05 });
 
         mortonCodeBoth[vtx.size() + i].key |= 1;
         mortonCodeBoth[vtx.size() + i].originNumber = i;
 
         //std::cout << "code_data[" << i << "] = " << std::bitset<8>(mortonCodeData[i].key) << std::endl;
     }
 
     time[1] = omp_get_wtime();
     //std::cout << "----------" << std::endl;
 
 
     //for (size_t i = 0; i < mortonCodeBoth.size(); ++i)
     //{
     //  std::cout << "code[" << i << "] = " << std::bitset<2 * codeLength + 1>(mortonCodeBoth[i].key) << std::endl;
     //}
 
     // sort the combined array (data and query entries) by key
     RSort_Parallel(mortonCodeBoth.data(), mortonCodeBoth_temp.data(), (int)mortonCodeBoth.size(), s.data());
 
     time[2] = omp_get_wtime();
 
     // debugging aid (disabled): randomly swap neighbouring entries of the sorted array
     //for (size_t i = 0; i < mortonCodeBoth.size() / 2; ++i)
     //  if (rand() > RAND_MAX / 2)
     //      std::swap(mortonCodeBoth[2 * i], mortonCodeBoth[2 * i + 1]);
 
 
 
     //std::cout << "----------" << std::endl;
 
     // Split the sorted mortonCodeBoth into mcquery (entries with the low key bit set)
     // and mcdata (the rest); for every query store in iq the index, within mcdata,
     // of the last data entry that precedes it in sorted order.
     mcdata.resize(0);
     mcquery.resize(0);
     mcdata.reserve(vtx.size());
     mcquery.reserve(vtx.size());
 
     time[3] = omp_get_wtime();
 
     iq.resize(0);
     iq.reserve(vtx.size());
     // j is the index of the most recent data entry; it starts at size_t(-1) = "none yet"
     for (size_t i = 0, j = -1; i < mortonCodeBoth.size(); ++i)
     {
         if (mortonCodeBoth[i].key & 1)
         {
             mcquery.push_back(mortonCodeBoth[i]);
             // no data entry seen so far -> use index 0
             iq.push_back((unsigned)(j + 1) == 0 ? 0 : (unsigned int)j);
         }
         else
         {
             ++j;
             mcdata.push_back(mortonCodeBoth[i]);
         }
     }
 
     time[4] = omp_get_wtime();
 
     //std::cout << "----------" << std::endl;
     //
     //for (size_t i = 0; i < iq.size(); ++i)
     //  std::cout << "iq[" << i << "] = " << iq[i] << std::endl;
     //
     //std::cout << "----------" << std::endl;
 
     //for (size_t i = 0; i < mcdata.size(); ++i)
     //  std::cout << "mcdata[" << i << "] = " << std::bitset<8>(mcdata[i].key) << ", isQuery = " << (int)mcdata[i].isQuery << std::endl;
 
     // For every query choose a window of 2*k consecutive data entries around iq[q]
     // (nominally [pt - k + 1, pt + k], moved inwards at either end of the array);
     // initneig[q] stores the first index of that window.
 
 #pragma omp parallel for
     for (int q = 0; q < mcquery.size(); ++q)
     {
         size_t pt = iq[q];
         size_t left = pt - k + 1;// , right = pt + k;
         // window would start before index 0 -> start at 0
         if (pt < k - 1)
         {
             left = 0;
             //right = 2 * k - 1;
         }
         // window would run past the last entry -> make it end at the last entry
         // NOTE(review): mcquery.size() is used as the bound for indices into mcdata;
         // the two have equal size only if every vortex produced one entry of each kind
         if (pt > mcquery.size() - k - 1)
         {
             //right = mcquery.size() - 1;
             left = (mcquery.size() - 1) - (2 * k - 1);
         }
 
         initneig[q] = left;
     }
 
     time[5] = omp_get_wtime();
 
     //std::cout << "----------" << std::endl;
 
     //for (size_t i = 0; i < initneig.size(); ++i)
     //  std::cout << "initneig[" << i << "] = from " << initneig[i] << std::endl;
 
 
     //std::cout << "----------" << std::endl;
 
     // Scratch buffers; each OpenMP thread gets its own copy through firstprivate below.
     std::vector<std::pair<double, size_t>> dist(2 * k, { -1.0, -1 });
     //std::vector<std::pair<double, size_t>>    mergeArray(3 * k);
 
     std::vector<size_t> loc(2 * k);
     std::vector<size_t> counter(2 * k, 0);
     std::vector<size_t> offset(2 * k, 0);
     std::vector<size_t> counterScan(2 * k, 0);
     std::vector<std::pair<double, size_t>> updateNN(k, { 0.0, 0 });
 
     std::vector<std::pair<double, size_t>> dstKeys1(2 * k, { 0.0, 0 });
     std::vector<std::pair<double, size_t>> dstKeys(k, { 0.0, 0 });
 
     time[6] = omp_get_wtime();
 
     // First shift: fill initdist directly from the 2*k candidates, sort, keep the first k.
     // Writes initdist[...][j] for j < 2*k, so each inner vector must already hold 2*k elements.
     if (sdvig == 0)
 #pragma omp parallel for firstprivate(dstKeys1)
         for (int i = 0; i < initdist.size(); ++i)
         {
 
             // pair = { length2() of the position difference (presumably the squared distance), original index of the data vortex }
             for (size_t j = 0; j < 2 * k; ++j)
                 initdist[mcquery[i].originNumber][j] = { (vtx[mcquery[i].originNumber].r() - vtx[mcdata[initneig[i] + j].originNumber].r()).length2(),  mcdata[initneig[i] + j].originNumber };
 
             //std::sort(initdist[mcquery[i].originNumber].begin(), initdist[mcquery[i].originNumber].end(), [](const std::pair<double, size_t>& pr1, const std::pair<double, size_t>& pr2) {return pr1.first < pr2.first; });
             newSort(initdist[mcquery[i].originNumber], dstKeys1);
 
             initdist[mcquery[i].originNumber].resize(k);
         }
     // Later shifts: compute the 2*k candidates into dist, merge them into the current
     // list with newMerge, then re-sort the list with newSort.
     else
 #pragma omp parallel for firstprivate(dist) firstprivate(loc, counter, offset, counterScan, updateNN, dstKeys)//, firstprivate(mergeArray)
         for (int i = 0; i < initdist.size(); ++i)
         {
             for (size_t j = 0; j < 2 * k; ++j)
                 dist[j] = { (vtx[mcquery[i].originNumber].r() - vtx[mcdata[initneig[i] + j].originNumber].r()).length2(),  mcdata[initneig[i] + j].originNumber };
 
             //std::sort(dist.begin(), dist.end(), [](const std::pair<double, size_t>& pr1, const std::pair<double, size_t>& pr2) {return pr1.first < pr2.first; });
 
             //std::cout << "dist[" << i << "] = "; 
             //for (size_t j = 0; j < k; ++j)
             //  std::cout << "(" << dist[j].first << ", " << dist[j].second << "), ";
             //std::cout << std::endl;
 
             //Mymerge(initdist[mcquery[i].originNumber].begin(), initdist[mcquery[i].originNumber].end(), dist.begin(), dist.end(), mergeArray.begin());
             newMerge(initdist[mcquery[i].originNumber], dist, loc, counter, offset, counterScan, updateNN);
 
             newSort(initdist[mcquery[i].originNumber], dstKeys);
 
             //std::sort(initdist[mcquery[i].originNumber].begin(), initdist[mcquery[i].originNumber].end());
 
             //std::copy(mergeArray.begin(), mergeArray.begin() + k, initdist[mcquery[i].originNumber].begin());
         }
 
     time[7] = omp_get_wtime();
 }

Here is the call graph for this function:

Here is the caller graph for this function:

unsigned int Morton2D ( const Point2D & r )

Definition at line 56 of file knnCPU.cpp.

 {
     const Point2D& rscale = twoPowCodeLength * r;
     const unsigned int& xx = ExpandBits((unsigned int)(rscale[0]));
     const unsigned int& yy = ExpandBits((unsigned int)(rscale[1]));
     return yy | (xx << 1);
 }

Here is the call graph for this function:

Here is the caller graph for this function:

void newMerge	(	std::vector< std::pair< double, size_t >> &	currentNN,
		const std::vector< std::pair< double, size_t >> &	candidateNN,
		std::vector< size_t > &	loc,
		std::vector< size_t > &	counter,
		std::vector< size_t > &	offset,
		std::vector< size_t > &	counterScan,
		std::vector< std::pair< double, size_t >> &	updateNN
	)

Definition at line 180 of file knnCPU.cpp.

 {
     const size_t k = candidateNN.size() / 2;  //���������� ��������� �������    //std::cout << "loc: " << std::endl;        
    for (size_t j = 0; j < 2 * k; ++j)
    {
        loc[j] = BinSearch(currentNN, candidateNN[j].first, 0, (int)k - 1);
        //std::cout << loc[j] << " ";
    }
    //std::cout << std::endl;

    for (size_t j = 0; j < 2 * k; ++j)
        counter[j] = j & 1;

    //std::cout << "counter: " << std::endl;
    //for (size_t j = 0; j < 2 * k; ++j)
    //    std::cout << counter[j] << " ";
    //std::cout << std::endl;

    for (size_t j = 0; j < 2 * k; ++j)
    {
        if ((loc[j] > 0) && ((loc[j] == k) || (candidateNN[j].first == currentNN[loc[j] - 1].first))) //����� ����� second, ���������!!
            offset[j] = k;
        else
            offset[j] = counter[2 * loc[j]]++;
    }

    //std::cout << "counter: " << std::endl;
    //for (size_t j = 0; j < 2 * k; ++j)
    //    std::cout << counter[j] << " ";
    //std::cout << std::endl;

    //std::cout << "offset: " << std::endl;
    //for (size_t j = 0; j < 2 * k; ++j)
    //    std::cout << offset[j] << " ";
    //std::cout << std::endl;


    counterScan[0] = 0;
    for (size_t j = 1; j < 2 * k; ++j)
        counterScan[j] = counterScan[j - 1] + counter[j - 1];

    //std::cout << "counterScan: " << std::endl;
    //for (size_t j = 0; j < 2 * k; ++j)
    //    std::cout << counterScan[j] << " ";
    //std::cout << std::endl;



    size_t index;
    for (size_t j = 0; j < k; ++j)
    {
        index = counterScan[2 * j + 1];
        //std::cout << index << std::endl;
        if (index < k)
            updateNN[index] = currentNN[j];
    }
    //std::cout << "updateNN: " << std::endl;
    //for (size_t j = 0; j < k; ++j)
    //    std::cout << "(" << updateNN[j].first << ", " << updateNN[j].second << "), ";
    //std::cout << std::endl;

    for (size_t j = 0; j < 2 * k; ++j)
    {
        if (2 * loc[j] < 2 * k)
        {
            index = counterScan[2 * loc[j]] + offset[j];
            if (index < k)
                updateNN[index] = candidateNN[j];
        }
    }

    currentNN.swap(updateNN);
}
 
     //std::cout << "loc: " << std::endl;        
     for (size_t j = 0; j < 2 * k; ++j)
     {
         loc[j] = BinSearch(currentNN, candidateNN[j].first, 0, (int)k - 1);
         //std::cout << loc[j] << " ";
     }
     //std::cout << std::endl;
 
     for (size_t j = 0; j < 2 * k; ++j)
         counter[j] = j & 1;
 
     //std::cout << "counter: " << std::endl;
     //for (size_t j = 0; j < 2 * k; ++j)
     //    std::cout << counter[j] << " ";
     //std::cout << std::endl;
 
     for (size_t j = 0; j < 2 * k; ++j)
     {
         if ((loc[j] > 0) && ((loc[j] == k) || (candidateNN[j].first == currentNN[loc[j] - 1].first))) //����� ����� second, ���������!!
             offset[j] = k;
         else
             offset[j] = counter[2 * loc[j]]++;
     }
 
     //std::cout << "counter: " << std::endl;
     //for (size_t j = 0; j < 2 * k; ++j)
     //    std::cout << counter[j] << " ";
     //std::cout << std::endl;
 
     //std::cout << "offset: " << std::endl;
     //for (size_t j = 0; j < 2 * k; ++j)
     //    std::cout << offset[j] << " ";
     //std::cout << std::endl;
 
 
     counterScan[0] = 0;
     for (size_t j = 1; j < 2 * k; ++j)
         counterScan[j] = counterScan[j - 1] + counter[j - 1];
 
     //std::cout << "counterScan: " << std::endl;
     //for (size_t j = 0; j < 2 * k; ++j)
     //    std::cout << counterScan[j] << " ";
     //std::cout << std::endl;
 
 
 
     size_t index;
     for (size_t j = 0; j < k; ++j)
     {
         index = counterScan[2 * j + 1];
         //std::cout << index << std::endl;
         if (index < k)
             updateNN[index] = currentNN[j];
     }
     //std::cout << "updateNN: " << std::endl;
     //for (size_t j = 0; j < k; ++j)
     //    std::cout << "(" << updateNN[j].first << ", " << updateNN[j].second << "), ";
     //std::cout << std::endl;
 
     for (size_t j = 0; j < 2 * k; ++j)
     {
         if (2 * loc[j] < 2 * k)
         {
             index = counterScan[2 * loc[j]] + offset[j];
             if (index < k)
                 updateNN[index] = candidateNN[j];
         }
     }
 
     currentNN.swap(updateNN);
 }

Here is the call graph for this function:

Here is the caller graph for this function:

/// Stable rank (counting) sort of {distance, index} pairs by ascending distance.
///
/// Doxygen: definition at line 160 of file knnCPU.cpp.
///
/// For every element its final position is the number of elements with a smaller
/// distance plus the number of equal-distance elements that precede it. The work is
/// quadratic in mass.size().
///
/// @param mass     in: pairs to sort; out: the same pairs ordered by `.first`,
///                 ties kept in their original relative order
/// @param dstKeys  scratch buffer; it is resized to mass.size(), receives the sorted
///                 sequence and is then swapped with `mass`, so on return it holds
///                 the unsorted input
///
/// NOTE(review): NaN distances compare false in both tests, so several of them would
/// map to the same position -- inputs are assumed to be NaN-free.
void newSort(std::vector<std::pair<double, size_t>>& mass, std::vector<std::pair<double, size_t>>& dstKeys)
{
    const size_t count = mass.size();

    // A shorter scratch buffer would be written out of bounds, a longer one would
    // change the size of `mass` after the swap; make the sizes agree.
    dstKeys.resize(count);

    for (size_t i = 0; i < count; ++i)
    {
        const double key = mass[i].first;

        size_t rank = 0;
        for (size_t j = 0; j < count; ++j)
        {
            const bool smaller = mass[j].first < key;
            const bool earlierTie = (j < i) && (mass[j].first == key);
            rank += (smaller || earlierTie) ? 1 : 0;
        }

        dstKeys[rank] = mass[i];
    }

    mass.swap(dstKeys);
}

Here is the caller graph for this function:

void RSort_Parallel	(	TParticleCode *	m,
		TParticleCode *	m_temp,
		unsigned int	n,
		unsigned int *	s
	)

��

Definition at line 66 of file knnCPU.cpp.

 {
     if (n == 0)
         return;
     // ���������� ��������������� �������    //std::cout << "threads = " << (int)threads << std::endl;

#pragma omp parallel num_threads(threads)
    {
        TParticleCode* source = m;
        TParticleCode* dest = m_temp;
        unsigned int l = omp_get_thread_num();
        unsigned int div = n / omp_get_num_threads();
        unsigned int mod = n % omp_get_num_threads();
        unsigned int left_index = l < mod ? (div + (mod == 0 ? 0 : 1)) * l : n - (omp_get_num_threads() - l) * div;
        unsigned int right_index = left_index + div - (mod > l ? 0 : 1);

        for (unsigned int digit = 0; digit < sizeof(m->key); ++digit)
        {
            unsigned int s_sum[256] = { 0 };
            unsigned int s0[256] = { 0 };
            unsigned char* b1 = (unsigned char*)&source[right_index].key;
            unsigned char* b2 = (unsigned char*)&source[left_index].key;
            while (b1 >= b2)
            {
                ++s0[*(b1 + digit)];
                b1 -= sizeof(TParticleCode);
            }
            for (unsigned int i = 0; i < 256; i++)
            {
                s[i + 256 * l] = s0[i];
            }

#pragma omp barrier
            for (unsigned int j = 0; j < threads; j++)
            {
                for (unsigned int i = 0; i < 256; i++)
                {
                    s_sum[i] += s[i + 256 * j];
                    if (j < l)
                    {
                        s0[i] += s[i + 256 * j];
                    }
                }
            }

            for (unsigned int i = 1; i < 256; ++i)
            {
                s_sum[i] += s_sum[i - 1];
                s0[i] += s_sum[i - 1];
            }
            unsigned char* b = (unsigned char*)&source[right_index].key + digit;
            TParticleCode* v1 = &source[right_index];
            TParticleCode* v2 = &source[left_index];
            while (v1 >= v2)
            {
                dest[--s0[*b]] = *v1--;
                b -= sizeof(TParticleCode);
            }
#pragma omp barrier
            std::swap(source, dest);
        }
    }

    // ���� ���� ��������� ������������, ������ �������� � �������� ������
    if (sizeof(m->key) == 1)
    {
        memcpy(m, m_temp, n * sizeof(TParticleCode));
    }
}
     unsigned char threads = omp_get_max_threads();
     //std::cout << "threads = " << (int)threads << std::endl;
 
 #pragma omp parallel num_threads(threads)
     {
         TParticleCode* source = m;
         TParticleCode* dest = m_temp;
         unsigned int l = omp_get_thread_num();
         unsigned int div = n / omp_get_num_threads();
         unsigned int mod = n % omp_get_num_threads();
         unsigned int left_index = l < mod ? (div + (mod == 0 ? 0 : 1)) * l : n - (omp_get_num_threads() - l) * div;
         unsigned int right_index = left_index + div - (mod > l ? 0 : 1);
 
         for (unsigned int digit = 0; digit < sizeof(m->key); ++digit)
         {
             unsigned int s_sum[256] = { 0 };
             unsigned int s0[256] = { 0 };
             unsigned char* b1 = (unsigned char*)&source[right_index].key;
             unsigned char* b2 = (unsigned char*)&source[left_index].key;
             while (b1 >= b2)
             {
                 ++s0[*(b1 + digit)];
                 b1 -= sizeof(TParticleCode);
             }
             for (unsigned int i = 0; i < 256; i++)
             {
                 s[i + 256 * l] = s0[i];
             }
 
 #pragma omp barrier
             for (unsigned int j = 0; j < threads; j++)
             {
                 for (unsigned int i = 0; i < 256; i++)
                 {
                     s_sum[i] += s[i + 256 * j];
                     if (j < l)
                     {
                         s0[i] += s[i + 256 * j];
                     }
                 }
             }
 
             for (unsigned int i = 1; i < 256; ++i)
             {
                 s_sum[i] += s_sum[i - 1];
                 s0[i] += s_sum[i - 1];
             }
             unsigned char* b = (unsigned char*)&source[right_index].key + digit;
             TParticleCode* v1 = &source[right_index];
             TParticleCode* v2 = &source[left_index];
             while (v1 >= v2)
             {
                 dest[--s0[*b]] = *v1--;
                 b -= sizeof(TParticleCode);
             }
 #pragma omp barrier
             std::swap(source, dest);
         }
     }
 
     // ���� ���� ��������� ������������, ������ �������� � �������� ������
     if (sizeof(m->key) == 1)
     {
         memcpy(m, m_temp, n * sizeof(TParticleCode));
     }
 }

Here is the caller graph for this function:

void WakekNN	(	const std::vector< Vortex2D > &	vtx,
		const size_t	k,
		std::vector< std::vector< std::pair< double, size_t >>> &	initdist
	)

Definition at line 447 of file knnCPU.cpp.

                                                                                                                       {
     const size_t n = vtx.size();
 
     auto gab = GetGabarit(vtx);
     double scale = std::max(gab.second[0] - gab.first[0], gab.second[1] - gab.first[1]);
 
     //�������� ������� ������� data � query 
     std::vector<TParticleCode> mortonCodeBoth(2 * vtx.size());
 
     //���������� ������� ������� (data � query) �� ������������ �����    std::vector<TParticleCode> mortonCodeBoth_temp(2 * vtx.size());

    //��� ������� ������� ���������� ������ iq -- ������ ���������� ������ �������� ������
    //������������� ������ mortonCodeBoth ��������� �� mcquery (������ �������) � mcdata (������ ������)
    std::vector<TParticleCode> mcdata, mcquery;

    std::vector<unsigned int> iq;


    //����� ��� ������� ������� k ����� ������ ����� � k ����� ������ ������ (��� �������� ������ � ����� �������, ��������� � ������)
    //��� ������� ������� ������� ������ �������� ������, � �������� ����� ������������� 2*k �������
    std::vector<size_t> initneig(vtx.size(), -1);

    //����� �� 2*k ���������� k ������� (����� �� ���������� �� ������ �� �������)
    // initdist = {����������; �� �������� ������}
    // ���������� �� ����������
    /*std::vector < std::vector < std::pair<double, size_t> >> initdist(vtx.size());
    for (auto& d : initdist)
        d.resize(2 * k, { -1.0, -1 });*/

        //�������� ��� �����
    double t1 = omp_get_wtime();
    double tStart[5], tFinish[5];
    double time[5][8];
    for (size_t sdvig = 0; sdvig <= 4; ++sdvig) //4
    {

        tStart[sdvig] = omp_get_wtime();
        mainCycle((int)k, vtx, gab, scale, (int)sdvig,
            mortonCodeBoth,
            s, mortonCodeBoth_temp, mcdata, mcquery,
            iq, initneig, initdist, time[sdvig]);
        tFinish[sdvig] = omp_get_wtime();

        //std::cout << "time_knn:" 
        //  << " " << time[sdvig][1] - time[sdvig][0] 
        //  << " " << time[sdvig][2] - time[sdvig][1] 
        //  << " " << time[sdvig][3] - time[sdvig][2] 
        //  << " " << time[sdvig][4] - time[sdvig][3] 
        //  << " " << time[sdvig][5] - time[sdvig][4] 
        //  << " " << time[sdvig][6] - time[sdvig][5] 
        //  << " " << time[sdvig][7] - time[sdvig][6] << std::endl;
    }//for sdvig
}
     std::vector<unsigned int> s(256 * omp_get_max_threads());
     std::vector<TParticleCode> mortonCodeBoth_temp(2 * vtx.size());
 
     //��� ������� ������� ���������� ������ iq -- ������ ���������� ������ �������� ������
     //������������� ������ mortonCodeBoth ��������� �� mcquery (������ �������) � mcdata (������ ������)
     std::vector<TParticleCode> mcdata, mcquery;
 
     std::vector<unsigned int> iq;
 
 
     //����� ��� ������� ������� k ����� ������ ����� � k ����� ������ ������ (��� �������� ������ � ����� �������, ��������� � ������)
     //��� ������� ������� ������� ������ �������� ������, � �������� ����� ������������� 2*k �������
    //����� �� 2*k ���������� k ������� (����� �� ���������� �� ������ �� �������)
    // initdist = {����������; �� �������� ������}
    // ���������� �� ����������
    /*std::vector < std::vector < std::pair<double, size_t> >> initdist(vtx.size());
    for (auto& d : initdist)
        d.resize(2 * k, { -1.0, -1 });*/

        //�������� ��� �����
    double t1 = omp_get_wtime();
    double tStart[5], tFinish[5];
    double time[5][8];
    for (size_t sdvig = 0; sdvig <= 4; ++sdvig) //4
    {

        tStart[sdvig] = omp_get_wtime();
        mainCycle((int)k, vtx, gab, scale, (int)sdvig,
            mortonCodeBoth,
            s, mortonCodeBoth_temp, mcdata, mcquery,
            iq, initneig, initdist, time[sdvig]);
        tFinish[sdvig] = omp_get_wtime();

        //std::cout << "time_knn:" 
        //  << " " << time[sdvig][1] - time[sdvig][0] 
        //  << " " << time[sdvig][2] - time[sdvig][1] 
        //  << " " << time[sdvig][3] - time[sdvig][2] 
        //  << " " << time[sdvig][4] - time[sdvig][3] 
        //  << " " << time[sdvig][5] - time[sdvig][4] 
        //  << " " << time[sdvig][6] - time[sdvig][5] 
        //  << " " << time[sdvig][7] - time[sdvig][6] << std::endl;
    }//for sdvig
}
     std::vector<size_t> initneig(vtx.size(), -1);
 
     //����� �� 2*k ���������� k ������� (����� �� ���������� �� ������ �� �������)
     // initdist = {����������; �� �������� ������}
     // ���������� �� ����������
     /*std::vector < std::vector < std::pair<double, size_t> >> initdist(vtx.size());
     for (auto& d : initdist)
         d.resize(2 * k, { -1.0, -1 });*/
 
         //�������� ��� �����    double tStart[5], tFinish[5];
    double time[5][8];
    for (size_t sdvig = 0; sdvig <= 4; ++sdvig) //4
    {

        tStart[sdvig] = omp_get_wtime();
        mainCycle((int)k, vtx, gab, scale, (int)sdvig,
            mortonCodeBoth,
            s, mortonCodeBoth_temp, mcdata, mcquery,
            iq, initneig, initdist, time[sdvig]);
        tFinish[sdvig] = omp_get_wtime();

        //std::cout << "time_knn:" 
        //  << " " << time[sdvig][1] - time[sdvig][0] 
        //  << " " << time[sdvig][2] - time[sdvig][1] 
        //  << " " << time[sdvig][3] - time[sdvig][2] 
        //  << " " << time[sdvig][4] - time[sdvig][3] 
        //  << " " << time[sdvig][5] - time[sdvig][4] 
        //  << " " << time[sdvig][6] - time[sdvig][5] 
        //  << " " << time[sdvig][7] - time[sdvig][6] << std::endl;
    }//for sdvig
}
     double t1 = omp_get_wtime();
     double tStart[5], tFinish[5];
     double time[5][8];
     for (size_t sdvig = 0; sdvig <= 4; ++sdvig) //4
     {
 
         tStart[sdvig] = omp_get_wtime();
         mainCycle((int)k, vtx, gab, scale, (int)sdvig,
             mortonCodeBoth,
             s, mortonCodeBoth_temp, mcdata, mcquery,
             iq, initneig, initdist, time[sdvig]);
         tFinish[sdvig] = omp_get_wtime();
 
         //std::cout << "time_knn:" 
         //  << " " << time[sdvig][1] - time[sdvig][0] 
         //  << " " << time[sdvig][2] - time[sdvig][1] 
         //  << " " << time[sdvig][3] - time[sdvig][2] 
         //  << " " << time[sdvig][4] - time[sdvig][3] 
         //  << " " << time[sdvig][5] - time[sdvig][4] 
         //  << " " << time[sdvig][6] - time[sdvig][5] 
         //  << " " << time[sdvig][7] - time[sdvig][6] << std::endl;
     }//for sdvig
 }

Here is the call graph for this function:












Here is the caller graph for this function:

Variable Documentation

const int codeLength = 15

Definition at line 8 of file knnCPU.cpp.

const int twoPowCodeLength = (1 << codeLength)

Definition at line 9 of file knnCPU.cpp.

Functions

Variables

Function Documentation

Variable Documentation