C# HashSet VS C++ std::unordered_set 自定义类键。 C++ 更慢……不可能。如何达到C#的速度?

标签 c# c++ performance hashset unordered-set

我将我的程序移植到 C++ 以获得更好的速度,但遇到了一些可怕的事情!我找不到一种快速方法来从数组中获取按值自定义类实例的唯一性。

为了比较,我做了两个最小的示例项目。

C++程序发布结果(VC++ 2010 express): 唯一 vector 计数为 666791。耗时 5 秒。

C#程序调试!!!结果: 唯一 vector 计数为 666533。耗时 0,9060004 秒。

我需要一种方法来仅从数组中获取唯一元素。

C++代码:

#include <conio.h>
#include <time.h>
#include <vector>
#include <unordered_set>

struct XVFields
{
    unsigned char JointPromosCountSinceBeginning;
    unsigned char PromoWeeksCountSinceCurrPromoBeginning;
    unsigned char NoPromoWeeksCountSinceLastJointPromo;
    unsigned char IsPromo;
};

class XVector
{
public:
        XVFields XVFs;
        unsigned char *DiscountUsagesCounts;

    XVector()
    {
        this->DiscountUsagesCounts = (unsigned char*)malloc(5);
    }
};

struct XVectorHasher
{
    size_t operator()(const XVector *k) const
    {
        size_t result = 0;
        const size_t prime = 31;

        int unibytes_count = sizeof(XVFields) + 5;
        unsigned char *unibytes = (unsigned char*)malloc(unibytes_count);
        memcpy(unibytes, &k->XVFs, sizeof(XVFields));
        memcpy(&unibytes[sizeof(XVFields)], k->DiscountUsagesCounts, 5);

        for (size_t i = 0; i < unibytes_count; i++)
            result = unibytes[i] + (result * prime);

        free(unibytes);

        return result;
    }
};

struct XVectorComparator
{
    bool operator()(const XVector *xv1, const XVector *xv2) const
    {
        if (memcmp(&xv1->XVFs, &xv2->XVFs, sizeof(XVFields)) != 0)
            return false;

        if (memcmp(xv1->DiscountUsagesCounts, xv2->DiscountUsagesCounts, 5) != 0)
            return false;

        return true;
    }
};

void main()
{
    srand(time(NULL));
    std::vector<XVector*> xvectors;

    for (int i = 0; i < 1500000; i++)
    {
        XVector *temp_xv = new XVector();
        temp_xv->XVFs.IsPromo = rand() % 2 > 0;
        temp_xv->XVFs.JointPromosCountSinceBeginning = rand() % 5;
        temp_xv->XVFs.NoPromoWeeksCountSinceLastJointPromo = rand() % 5;
        temp_xv->XVFs.PromoWeeksCountSinceCurrPromoBeginning = rand() % 5;

        for (int j = 0; j < 5; j++)
            temp_xv->DiscountUsagesCounts[j] = rand() % 5;

        xvectors.push_back(temp_xv);
    }

    time_t start_dt = time(NULL);
    std::unordered_set<XVector*, XVectorHasher, XVectorComparator> *unique_xvs = new std::unordered_set<XVector*, XVectorHasher, XVectorComparator>();

    for (int i = 0; i < xvectors.size(); i++)
        if (unique_xvs->find(xvectors[i]) == unique_xvs->end())
            unique_xvs->insert(xvectors[i]);

    printf("Unique vectors count is %i. Took %i seconds.", unique_xvs->size(), time(NULL) - start_dt);
    getch();
}

C#代码:

using System;
using System.Text;
using System.Linq;
using System.Collections.Generic;

namespace DictSpeedTest
{
    class Program
    {
        static void Main(string[] args)
        {
            Random rnd = new Random((int)(DateTime.Now - new DateTime(1970, 1, 1)).TotalSeconds);
            List<XVector> xvectors = new List<XVector>();

            for (int i = 0; i < 1500000; i++)
            {
                XVector temp_xv = new XVector();
                temp_xv.XVFs.IsPromo = rnd.Next(2) > 0;
                temp_xv.XVFs.JointPromosCountSinceBeginning = (byte)rnd.Next(0, 5);
                temp_xv.XVFs.NoPromoWeeksCountSinceLastJointPromo = (byte)rnd.Next(0, 5);
                temp_xv.XVFs.PromoWeeksCountSinceCurrPromoBeginning = (byte)rnd.Next(0, 5);

                for (int j = 0; j < temp_xv.DiscountUsagesCounts.Length; j++)
                    temp_xv.DiscountUsagesCounts[j] = (byte)rnd.Next(0, 5);

                xvectors.Add(temp_xv);
            }

            DateTime start_dt = DateTime.Now;
            HashSet<XVector> unique_xvs = new HashSet<XVector>(new XVectorEqualityComparer());

            for (int i = 0; i < xvectors.Count; i++)
                if (!unique_xvs.Contains(xvectors[i]))
                    unique_xvs.Add(xvectors[i]);

            Console.WriteLine("Unique vectors count is " + unique_xvs.Count + ". Took " + (DateTime.Now - start_dt).TotalSeconds + " seconds.");
            Console.ReadKey();
        }
    }

    struct XVFields
    {
        public byte JointPromosCountSinceBeginning;
        public byte PromoWeeksCountSinceCurrPromoBeginning;
        public byte NoPromoWeeksCountSinceLastJointPromo;
        public bool IsPromo;
    }

    class XVector
    {
        public XVFields XVFs;
        public byte[] DiscountUsagesCounts;

        public XVector()
        {
            this.DiscountUsagesCounts = new byte[5];
        }

        public override bool Equals(object obj)
        {
            byte[] my_low_lvl_dump = new byte[4 + 5];

            my_low_lvl_dump[0] = this.XVFs.IsPromo ? (byte)1 : (byte)0;
            my_low_lvl_dump[1] = this.XVFs.JointPromosCountSinceBeginning;
            my_low_lvl_dump[2] = this.XVFs.PromoWeeksCountSinceCurrPromoBeginning;
            my_low_lvl_dump[3] = this.XVFs.NoPromoWeeksCountSinceLastJointPromo;
            my_low_lvl_dump[4] = this.DiscountUsagesCounts[0];
            my_low_lvl_dump[5] = this.DiscountUsagesCounts[1];
            my_low_lvl_dump[6] = this.DiscountUsagesCounts[2];
            my_low_lvl_dump[7] = this.DiscountUsagesCounts[3];
            my_low_lvl_dump[8] = this.DiscountUsagesCounts[4];

            XVector xv = (XVector)obj;
            byte[] obj_low_lvl_dump = new byte[4 + 5];

            obj_low_lvl_dump[0] = xv.XVFs.IsPromo ? (byte)1 : (byte)0;
            obj_low_lvl_dump[1] = xv.XVFs.JointPromosCountSinceBeginning;
            obj_low_lvl_dump[2] = xv.XVFs.PromoWeeksCountSinceCurrPromoBeginning;
            obj_low_lvl_dump[3] = xv.XVFs.NoPromoWeeksCountSinceLastJointPromo;
            obj_low_lvl_dump[4] = xv.DiscountUsagesCounts[0];
            obj_low_lvl_dump[5] = xv.DiscountUsagesCounts[1];
            obj_low_lvl_dump[6] = xv.DiscountUsagesCounts[2];
            obj_low_lvl_dump[7] = xv.DiscountUsagesCounts[3];
            obj_low_lvl_dump[8] = xv.DiscountUsagesCounts[4];

            return my_low_lvl_dump.SequenceEqual<byte>(obj_low_lvl_dump);
        }

        public override int GetHashCode()
        {
            byte[] low_lvl_dump = new byte[4 + 5];

            low_lvl_dump[0] = this.XVFs.IsPromo ? (byte)1 : (byte)0;
            low_lvl_dump[1] = this.XVFs.JointPromosCountSinceBeginning;
            low_lvl_dump[2] = this.XVFs.PromoWeeksCountSinceCurrPromoBeginning;
            low_lvl_dump[3] = this.XVFs.NoPromoWeeksCountSinceLastJointPromo;
            low_lvl_dump[4] = this.DiscountUsagesCounts[0];
            low_lvl_dump[5] = this.DiscountUsagesCounts[1];
            low_lvl_dump[6] = this.DiscountUsagesCounts[2];
            low_lvl_dump[7] = this.DiscountUsagesCounts[3];
            low_lvl_dump[8] = this.DiscountUsagesCounts[4];

            int result = 0;
            int prime = 31;

            for (int i = 0; i < low_lvl_dump.Length; i++)
                result = low_lvl_dump[i] + (result * prime);

            return result;
        }
    }

    class XVectorEqualityComparer : IEqualityComparer<XVector>
    {
        public bool Equals(XVector xv1, XVector xv2)
        {
            return xv1.Equals(xv2);
        }

        public int GetHashCode(XVector xv)
        {
            return xv.GetHashCode();
        }
    }
}

C# 在为散列函数生成数组时采用了昂贵的操作方式,但最终结果更快。

最佳答案

我使用的是 Visual Studio 2019,我的 RELEASE 构建代码运行时间约为 700 毫秒。

您肯定可以通过一些改进战胜这次。

  1. 当您向哈希集中插入 1,500,000 个元素时,它会被重新哈希大约 10 次。您可以通过在构造该集合时指定桶数来避免这种情况。将其设置为 800,000 可节省约 20%。

  2. 在您的哈希函数中,您创建和销毁了一个 9 字节的数组。一百五十万次!您可以有一个静态数组并简单地用所需的数据填充它。然而,您可以直接在您的字段上简单地进行数学运算,这将为您节省大约 50%:

    struct XVectorHasher
    {
    size_t operator()(const XVector* k) const
    {
        size_t result = 0;
        const size_t prime = 31;
    
        result = k->XVFs.IsPromo;
        result = k->XVFs.JointPromosCountSinceBeginning + (result * prime);
        result = k->XVFs.PromoWeeksCountSinceCurrPromoBeginning + (result * prime);
        result = k->XVFs.NoPromoWeeksCountSinceLastJointPromo + (result * prime);
        for (size_t i = 0; i < 5; i++)
            result = k->DiscountUsagesCounts[i] + (result * prime);
        return result;
    }
    };
    
  3. 您示例中的数据结构是真实的还是简化的?这些 unsigned char 字段的有效范围是多少?我问的原因是你只有 8 个字节 + 1 个 bool 值。如果您可以在这 8 个字节中的任何一个字节中节省一个位,您可以简单地组成一个 long long 键,而不必提供您自己的自定义哈希和比较。这将为您再节省 50%

关于C# HashSet VS C++ std::unordered_set 自定义类键。 C++ 更慢……不可能。如何达到C#的速度?,我们在Stack Overflow上找到一个类似的问题: https://stackoverflow.com/questions/59396081/

相关文章:

c# - 使用自动布局约束时,Syncfusion SfRangeSlider slider 和标签未正确对齐

c# - 在构建项目引用和包期间正在安装和引用不同版本的 nuget 包

c++ - 可执行文件在 Wine 上的运行速度比 Windows 快——为什么?

performance - 编写更短的代码/算法,是否更高效(性能)?

c - 分支预测器条目在程序完成后失效?

c# - 如何从不同的主机连接到我的 SignalR 集线器?

c# - 优化 C#/.NET 程序的技巧

c++ - 将输出流对象和其他参数传递给多个线程

c++ - 读取 PNG header 的第一个字节时出现奇怪的结果

javascript - 将 "min.js"文件放入 MVC 包中是否有意义?