寻找热门查询,300万个查询字符串中统计最热门的10个查询
#include
#include
#include
struct QueryInfo{
string s;
int times;
QueryInfo(string s1, int t): s(s1), times(t){}
};
int QueryCompare(const QueryInfo &q1, const QueryInfo &q2)
{
return q1.times < q2.times;
}
void FindHottest(vector &s)
{
hash_map table;
int size = s.size();
for (int i = 0; i < size; ++i)
{
if (table.find(s[i]) == table.end())
{
table[s[i]] = 1;
}else
++table[s[i]];
}
vector heap;
auto it = table.begin();
for (int i = 0; it != table.end() && i < 10; ++it, ++i)
{
QueryInfo temp(it->first, it->second);
heap.push_back(temp);
}
make_heap(heap.begin(), heap.end(), QueryCompare);
if (it == table.end())
return;
for ( ; it != table.end(); ++it)
{
if (it->second > heap[0].times){
pop_heap(heap.begin(), heap.end(), QueryCompare);
heap.pop_back();
heap.push_back(QueryInfo(it->first, it->second));
push_heap(heap.begin(), heap.end(), QueryCompare);
}
}
for (auto it2 = heap.begin(); it2 != heap.end(); ++it2)
{
cout << it2->s <<" "<times< s(t, t+sizeof(t)/sizeof(string));
FindHottest(s);
}