Question

输入：

BC
BD
BC
BC
BD
CD

输出：

BC 3
BD 2
CD 1

如果我使用char类型作为键它是可用的。但似乎Thrust不支持字符串作为键。

#include <thrust/device_vector.h>
#include <thrust/iterator/constant_iterator.h>
#include <thrust/reduce.h>
#include <string>

int main(void)
{
  std::string data = "aaabbbbbcddeeeeeeeeeff";

  size_t N = data.size();

  thrust::device_vector<char> input(data.begin(), data.end());

  thrust::device_vector<char> output(N);
  thrust::device_vector<int>  lengths(N);

  size_t num_runs =
    thrust::reduce_by_key(input.begin(), input.end(),        
                      thrust::constant_iterator<int>(1), 
                      output.begin(),                    
                      lengths.begin()                    
                      ).first - output.begin();
   return 0;
}

如何使用Thrust实现它？

Answer 1

向@AngryLettuce道歉，这里有两种可能的方法：

方法1：

1. 创建一个结构体来保存您的键。该结构体为键中的每个字符包含一个char成员。
2. 对键进行排序（sort），把相同的键排到一起。看起来您想要的只是每种键的计数，而不管它出现在序列中的什么位置。为了能够使用reduce_by_key，首先需要把相同的键聚集在一起；否则，reduce_by_key会把被其他键隔开的相同键视为不同的键序列。从您期望的输入和输出可以看出，这不是您想要的。
3. 现在对已排序的键使用reduce_by_key，统计相同键的个数。

步骤2（对于此方法）需要一个仿函数来对键进行排序，步骤3需要一个仿函数来定义reduce_by_key所需的“相等”键的含义。

方法2：

1. 创建两个单独的char类型device_vector，一个用于保存每个键的第一个字母，另一个用于保存每个键的第二个字母。然后，我们将在代码的其余部分中使用zip_iterator把这两个向量视为一个统一的“键”向量。
2. 对压缩（zipped）后的键向量执行sort。在这种情况下，Thrust知道如何对基本类型的压缩向量进行排序，不需要单独的排序仿函数。
3. 对压缩（且已排序）的键向量执行reduce_by_key。这同样不需要单独的相等性仿函数：Thrust知道如何判断基本类型压缩向量的相等性。

除了不需要任何仿函数定义之外，第二种方法可能也会更快，因为与第一种方法中存在的AoS（结构数组）相比，zip_iterator倾向于改善数据访问。

$ cat t1004.cu
#include <thrust/device_vector.h>
#include <thrust/sort.h>
#include <thrust/reduce.h>
#include <thrust/iterator/constant_iterator.h>
#include <iostream>

#include <thrust/iterator/zip_iterator.h>

struct key {
  char k1;
  char k2;
};

struct sort_functor{
  __host__ __device__ bool operator()(key &k1, key &k2){
    if (k1.k1 < k2.k1) return true;
    if (k1.k1 > k2.k1) return false;
    if (k1.k2 < k2.k2) return true;
    return false;}
};

struct equal_key{
  __host__ __device__ bool operator()(key k1, key k2){
    if ((k1.k1 == k2.k1)&&(k1.k2 == k2.k2)) return true;
    return false;}
};

int main(){

  key data[] = {{'B','C'},{'B','D'},{'B','C'},{'B','C'},{'B','D'},{'C','D'}};;
  size_t dsize = sizeof(data)/sizeof(key);

//method 1

  thrust::device_vector<key> keys(data, data+dsize);
  thrust::device_vector<key> keys_out(dsize);
  thrust::device_vector<int> lengths(dsize);
  thrust::sort(keys.begin(), keys.end(), sort_functor());
  int rsize = thrust::reduce_by_key(keys.begin(), keys.end(), thrust::constant_iterator<int>(1), keys_out.begin(), lengths.begin(),equal_key()).first - keys_out.begin();
  std::cout << "Method1:" << std::endl;
  for (int i = 0; i < rsize; i++){
    key temp = keys_out[i];
    int len = lengths[i];
    std::cout << " " << temp.k1 << temp.k2 << " " << len << std::endl;}

//method 2

  //get the key data into 2 separate vectors.
  //there are more efficient ways to do this
  //but this is not the crux of your question

  thrust::device_vector<char> k1;
  thrust::device_vector<char> k2;
  for (int i = 0; i < dsize; i++){
    k1.push_back(data[i].k1);
    k2.push_back(data[i].k2);}

  thrust::sort(thrust::make_zip_iterator(thrust::make_tuple(k1.begin(), k2.begin())), thrust::make_zip_iterator(thrust::make_tuple(k1.end(), k2.end())));

  thrust::device_vector<char> k1r(dsize);
  thrust::device_vector<char> k2r(dsize);

  rsize = thrust::reduce_by_key(thrust::make_zip_iterator(thrust::make_tuple(k1.begin(), k2.begin())), thrust::make_zip_iterator(thrust::make_tuple(k1.end(), k2.end())), thrust::constant_iterator<int>(1), thrust::make_zip_iterator(thrust::make_tuple(k1r.begin(), k2r.begin())), lengths.begin()).first - thrust::make_zip_iterator(thrust::make_tuple(k1r.begin(),k2r.begin()));
  std::cout << "Method2:" << std::endl;
  for (int i = 0; i < rsize; i++){
    char c1 = k1r[i];
    char c2 = k2r[i];
    int len = lengths[i];
    std::cout << " " << c1 << c2 << " " << len << std::endl;}

  return 0;
}
$ nvcc -o t1004 t1004.cu
$ ./t1004
Method1:
 BC 3
 BD 2
 CD 1
Method2:
 BC 3
 BD 2
 CD 1
$

上面的t1004.cu清单是一个同时展示这两种方法的完整示例。

$ cat t1004.cu
#include <iostream>
#include <vector>

#include <thrust/device_vector.h>
#include <thrust/sort.h>
#include <thrust/reduce.h>
#include <thrust/iterator/constant_iterator.h>
#include <thrust/iterator/counting_iterator.h>
#include <thrust/iterator/zip_iterator.h>
#include <thrust/iterator/transform_iterator.h>
#include <thrust/iterator/permutation_iterator.h>

template <typename Iterator>
class strided_range
{
    public:

    typedef typename thrust::iterator_difference<Iterator>::type difference_type;

    struct stride_functor : public thrust::unary_function<difference_type,difference_type>
    {
        difference_type stride;

        stride_functor(difference_type stride)
            : stride(stride) {}

        __host__ __device__
        difference_type operator()(const difference_type& i) const
        {
            return stride * i;
        }
    };

    typedef typename thrust::counting_iterator<difference_type>                   CountingIterator;
    typedef typename thrust::transform_iterator<stride_functor, CountingIterator> TransformIterator;
    typedef typename thrust::permutation_iterator<Iterator,TransformIterator>     PermutationIterator;

    // type of the strided_range iterator
    typedef PermutationIterator iterator;

    // construct strided_range for the range [first,last)
    strided_range(Iterator first, Iterator last, difference_type stride)
        : first(first), last(last), stride(stride) {}

    iterator begin(void) const
    {
        return PermutationIterator(first, TransformIterator(CountingIterator(0), stride_functor(stride)));
    }

    iterator end(void) const
    {
        return begin() + ((last - first) + (stride - 1)) / stride;
    }

    protected:
    Iterator first;
    Iterator last;
    difference_type stride;
};

typedef thrust::device_vector<char>::iterator cIterator;

int main(){

//method 2

  //get the key data into separate vectors, one per character in key.
#define KEYLEN 2
  const char data[] = "BCBDBCBCBDCD";
  size_t dsize = sizeof(data)/sizeof(char);
  size_t numkeys = dsize/KEYLEN;
  thrust::device_vector<char> keys(data, data+dsize);
  strided_range<cIterator>  *str_k[KEYLEN];
  for (int i = 0; i < KEYLEN; i++)
    str_k[i] = new strided_range<cIterator>(keys.begin()+i, keys.end(), KEYLEN);

//modify this line also if KEYLEN changes (max 10)
  auto my_z = thrust::make_zip_iterator(thrust::make_tuple((*str_k[0]).begin(), (*str_k[1]).begin()));

  thrust::sort(my_z, my_z+numkeys);

  thrust::device_vector<char> kr[KEYLEN];
  for (int i = 0; i < KEYLEN; i++)
    kr[i].resize(numkeys);

//modify this line also if KEYLEN changes (max 10)
  auto my_zr = thrust::make_zip_iterator(thrust::make_tuple(kr[0].begin(), kr[1].begin()));

  thrust::device_vector<int> lengths(numkeys);

  size_t rsize = thrust::reduce_by_key(my_z, my_z + numkeys, thrust::constant_iterator<int>(1), my_zr, lengths.begin()).first - my_zr;
  std::cout << "Method2:" << std::endl;

  for (int i = 0; i < rsize; i++){
    std::cout << " ";
    for (int j = 0; j < KEYLEN; j++){
      char c = kr[j][i];
      std::cout << c; }
    int len = lengths[i];
    std::cout <<" " <<  len << std::endl;}

  return 0;
}
$ nvcc -std=c++11 t1004.cu -o t1004
$ ./t1004
Method2:
 BC 3
 BD 2
 CD 1
$

上面的清单（使用strided_range的t1004.cu）是方法2的改进版本。您应该能够直接使用字符串/字符数组，并且可以相当容易地修改此版本以适应2到10个字符的键长度。此方法使用跨步范围迭代器（strided range iterator）直接从数据数组中提取各个键字符。

# Mailer that sends the "Critical Documentation Needed" message.
class SendLink < ApplicationMailer
  default from: 'info@mysite.com'

  # Builds the message for +object+; the address is read from object.recipient.
  def email(object)
    @object = object
    options = {
      subject: 'Critical Documentation Needed',
      to: @object.recipient,
      track_opens: 'true'
    }
    mail(options)
  end
end

当键是字符串或char数组时，如何使用Thrust实现按键归约（reduce_by_key）

1 个答案: