使用LINQ查询输出“键-计数”键值对

时间:2012-09-25 19:38:13

标签: linq list dictionary ravendb

RavenDB中大约有50万个客户(Customer)文档,其中一个属性是“City”。如何编写LINQ查询,以获取每个城市的出现次数(即每个城市对应的客户文档数量)?例如,如果有一千个客户文档的City值为“NY”,那么我需要得到类似这样的城市列表:NY 1000、LA 200、OR 1300、BO 5000 等。

这是我最初写的......

 // The asker's original attempt: ToList() materializes the query on the client,
 // after which grouping and counting are done in memory by LINQ to Objects.
 // NOTE(review): session.Query results are presumably paged/capped by RavenDB, so
 // ToList() likely returns only part of the ~500k documents, which would explain
 // the inaccurate counts -- confirm against the RavenDB paging documentation.
 Dictionary<string,int> cityStats = session.Query<Customer>()
                    .ToList()
                    .GroupBy(x => x.City)
                    // Sorts groups by ascending size; note that Dictionary<TKey,TValue>
                    // does not guarantee enumeration order, so this ordering is not
                    // something callers of cityStats can rely on.
                    .OrderBy(x => x.Count())
                    // Key = city name, value = number of customers in that group.
                    .ToDictionary(x => x.Key, x => x.Count());

但这似乎没有给出准确的结果。于是我修改了“最大请求数”设置(我知道不推荐这样做),只是想看看结果是否会改变;但即使把maxrequest的值设为500000,得到的结果仍然一样。我确定大约有50万个客户文档,所以各城市的计数加起来应该与这个总数相符。

1 个答案:

答案 0 :(得分:2)

您需要map-reduce索引才能执行此操作。这是一个简短的控制台程序,演示了:

using System;
using System.Linq;
using Raven.Client.Document;
using Raven.Client.Indexes;

namespace ConsoleApplication1
{
  /// <summary>
  /// Customer document as stored by the demo program and consumed by the
  /// <c>Customers_ByCity</c> index.
  /// </summary>
  public class Customer
  {
    /// <summary>
    /// Document identifier. The sample code never sets it explicitly;
    /// presumably RavenDB assigns it when the document is stored -- confirm.
    /// </summary>
    public string Id { get; set; }

    /// <summary>Customer's name (e.g. "John").</summary>
    public string Name { get; set; }

    /// <summary>City code the customer belongs to (e.g. "NY"); the index groups on this value.</summary>
    public string City { get; set; }
  }

  /// <summary>
  /// Map-reduce index definition that yields one <see cref="Result"/> per distinct
  /// <see cref="Customer.City"/> value, carrying the number of customers in that city.
  /// </summary>
  public class Customers_ByCity : AbstractIndexCreationTask<Customer, Customers_ByCity.Result>
  {
    /// <summary>Shape of a reduced index entry: a city and its customer count.</summary>
    public class Result
    {
      /// <summary>The city the entry was grouped on.</summary>
      public string City { get; set; }

      /// <summary>Sum of the per-document counts for <see cref="City"/>.</summary>
      public int Count { get; set; }
    }

    /// <summary>Defines the map and reduce steps of the index.</summary>
    public Customers_ByCity()
    {
      // Map: each customer document contributes exactly one (City, 1) entry.
      Map = docs =>
        from doc in docs
        select new { City = doc.City, Count = 1 };

      // Reduce: entries sharing a city are collapsed into one entry whose Count is
      // the sum of the individual counts. The output has the same shape as the map
      // output (City, Count).
      Reduce = entries =>
        from entry in entries
        group entry by entry.City into byCity
        select new { City = byCity.Key, Count = byCity.Sum(e => e.Count) };
    }
  }

  /// <summary>
  /// Console demo: registers the indexes declared in this assembly, stores seven sample
  /// customers, then prints the per-city counts read from <see cref="Customers_ByCity"/>.
  /// </summary>
  class Program
  {
    /// <summary>
    /// Entry point. Talks to the server configured at http://localhost:8080 and waits
    /// for Enter before exiting.
    /// </summary>
    private static void Main()
    {
      // The document store is disposable; the using block releases it once the demo
      // has finished, instead of leaving it undisposed until process exit.
      using (var documentStore = new DocumentStore { Url = "http://localhost:8080" })
      {
        documentStore.Initialize();

        // Registers every index class found in this assembly (here: Customers_ByCity).
        IndexCreation.CreateIndexes(typeof(Program).Assembly, documentStore);

        // Seed data: three customers in NY and four in LA.
        using (var session = documentStore.OpenSession())
        {
          session.Store(new Customer { Name = "John", City = "NY" });
          session.Store(new Customer { Name = "Jane", City = "NY" });
          session.Store(new Customer { Name = "Jim", City = "NY" });
          session.Store(new Customer { Name = "Sally", City = "LA" });
          session.Store(new Customer { Name = "Sam", City = "LA" });
          session.Store(new Customer { Name = "Suzie", City = "LA" });
          session.Store(new Customer { Name = "Sarah", City = "LA" });

          session.SaveChanges();
        }

        using (var session = documentStore.OpenSession())
        {
          // In a real app, you probably don't want to wait for nonstale results.
          // You will also want to consider what to do if you have more than one page of results (more than 1024 cities)

          var counts = session.Query<Customers_ByCity.Result, Customers_ByCity>()
            .Customize(x => x.WaitForNonStaleResults())
            .Take(1024);

          // Enumerating the query executes it; one line is printed per city.
          foreach (var result in counts)
          {
            Console.WriteLine("{0}: {1}", result.City, result.Count);
          }

          Console.WriteLine();
        }
      }

      // Keep the console window open until the user presses Enter.
      Console.ReadLine();
    }
  }
}