C++:计算哈希表中每个槽位的冲突数

时间:2013-08-01 20:41:08

标签: c++ list class hashtable

我想用带链表的哈希表实现一个字典,用来对文本文档做拼写检查。我通过读取“words.txt”文件来创建字典。此外,在加载字典“words.txt”时,我还必须统计并显示哈希表中每个槽位的冲突次数。

带链表的 HashTable 类的源代码如下:

hashtable.cpp(其中 #include 了 "listtools.cpp",因为它使用了模板)

#include <iostream>
#include <string>
#include "listtools.h"
#include "listtools.cpp"
#include "hashtable.h"

using LinkedListSavitch::Node;
using LinkedListSavitch::search;
using LinkedListSavitch::headInsert;
using namespace std;

#define HASH_WEIGHT 31

namespace HashTableSavitch
{
   // Default constructor: leaves every bucket without a chain and resets
   // every per-slot collision counter to zero.
   HashTable::HashTable()
   {
      int slot = 0;
      while (slot < SIZE)
      {
         hashArray[slot] = NULL;     // no chain in this bucket yet
         collisionArray[slot] = 0;   // collision counter for this slot
         ++slot;
      }
   }

   // Destructor: walks the chain stored in each bucket and deletes every node.
   HashTable::~HashTable()
   {
      for (int slot = 0; slot < SIZE; ++slot)
      {
         for (Node<string> *cursor = hashArray[slot]; cursor != NULL; )
         {
            Node<string> *doomed = cursor;
            cursor = cursor->getLink();   // step forward before the node is freed
            delete doomed;
         }
      }
   }

   // Maps s to a bucket index: folds the characters into an unsigned
   // accumulator (multiply by HASH_WEIGHT, add the next character) and
   // reduces the result modulo SIZE.
   unsigned int HashTable::computeHash(string s) const
   {
      unsigned int accumulated = 0;
      for (string::size_type pos = 0; pos != s.length(); ++pos)
      {
         accumulated = accumulated * HASH_WEIGHT + s[pos];
      }
      return accumulated % SIZE;
   }

   // Returns true when target is found in the chain of the bucket it hashes
   // to, false otherwise.
   bool HashTable::containsString(string target) const
   {
      const int bucket = computeHash(target);
      return search(hashArray[bucket], target) != NULL;
   }

   // Inserts s at the head of the chain for its bucket unless s is already
   // stored there. A collision is recorded for the bucket when a new word
   // lands in a slot that already holds at least one other word; re-adding a
   // word that is already present is a duplicate and is not counted.
   void HashTable::put(string s)
   {
      int hash = computeHash(s);
      if (search(hashArray[hash], s) != NULL)
      {
         // Already stored: nothing to insert and nothing to count.
         return;
      }
      if (hashArray[hash] != NULL)
      {
         // The slot is occupied by a different word, so this insert collides.
         collisionArray[hash]++;
      }
      headInsert(hashArray[hash], s);
   }
   void HashTable::printArray()
   {
   int number;
   for(int i = 0; i < SIZE; i++)
   {
       number = collisionArray[i];
       cout << "----------------\n";
       cout << "index = " << i << endl;
       cout << "Collisions = " << number << endl;
       cout << "----------------\n";
   }
   }
} // HashTableSavitch

我的main.cpp文件

#include <iostream>
#include <fstream>
#include <cctype>
#include <algorithm>
#include <cstring>
#include <string>
#include "hashtable.h"
using namespace std;
using HashTableSavitch::HashTable;

void upToLow(string & str);
void removePunct(string & str);

// Builds a dictionary hash table from "words.txt", prints the per-slot
// collision counts, then spell-checks "gettysburg_address.txt": each word is
// stripped of punctuation, lower-cased and looked up; words not found are
// printed (20 per line) and counted as misspelled.
// Returns 0 on success, 1 when either input file cannot be opened.
int main()
{
    HashTable h;
    string currWord;
    string word;
    int countMisspelled = 0;
    int countCorrect = 0;

    //Get input from words.txt
    ifstream dictionary("words.txt");

    //File checking
    if (dictionary.fail())
    {
        cout << "File does not exist" << endl;
        cout << "Exit program" << endl;
        return 1; // stop here; continuing would spell-check against an empty dictionary
    }

    //Create the dictionary as a hash table
    while (dictionary >> currWord)
    {
        h.put(currWord);
    }
    dictionary.close();

    //display collisions
    h.printArray();

    //Get input from gettysburg_address.txt
    ifstream input("gettysburg_address.txt");

    //File checking
    if (input.fail())
    {
        cout << "File does not exist" << endl;
        cout << "Exit program" << endl;
        return 1; // nothing to spell-check
    }

    //Spell check gettysburg_address.txt
    cout << "Misspelled words : " << endl;
    cout << endl;

    //If a word is not in the dictionary assume misspelled
    while (input >> word)
    {
        removePunct(word);
        upToLow(word);
        if (!h.containsString(word))
        {
            countMisspelled++; // Increment misspelled words count
            cout << word << " ";
            if (countMisspelled % 20 == 0) // Display misspelled words 20 per line
            {
                cout << endl;
            }
        }
        else
        {
            countCorrect++; // Increment correct words count
        }
    }
    input.close();

    cout << endl;
    cout << endl;

    cout << "Number of misspelled words : " << countMisspelled << endl;
    cout << "Number of correct words : " << countCorrect << endl;

    return 0;
}


/* Converts every ASCII uppercase letter ('A'-'Z') in str to lowercase, in
 * place; all other characters are left untouched.
 * The length is taken once from the string itself, so the whole string is
 * processed (including any bytes after an embedded '\0') and the loop does
 * not rescan the buffer on every iteration. */
void upToLow(std::string & str)
{
    const std::string::size_type length = str.size();
    for (std::string::size_type i = 0; i < length; i++)
    {
        if (str[i] >= 'A' && str[i] <= 'Z')
        {
            // 'a' - 'A' is the fixed distance between the two ASCII cases.
            str[i] = static_cast<char>(str[i] + ('a' - 'A'));
        }
    }
}


/* Predicate for removePunct: reports whether c is punctuation according to
 * std::ispunct. The character is converted to unsigned char first because
 * the <cctype> classification functions have undefined behavior when given
 * a negative value other than EOF, which a plain char holding a non-ASCII
 * byte can be. */
static bool isPunctuationChar(char c)
{
    return std::ispunct(static_cast<unsigned char>(c)) != 0;
}

/* Removes every punctuation character from str, in place, keeping the
 * remaining characters in their original order. */
void removePunct(std::string & str)
{
    str.erase(std::remove_if(str.begin(), str.end(), isPunctuationChar), str.end());
}

在加载“words.txt”时,有没有一种简单的方法可以统计每个槽位的冲突次数?如果我在“put”函数中使用 count 变量,我可以得到冲突的总数,但我不太确定如何统计并显示哈希表中每个槽位的冲突次数。非常感谢任何帮助或提示。

编辑:按照 Joe 的建议修改之后,现在我想知道如何显示每个槽位的冲突次数。我写了一个 void 函数,但它显示每个槽位的冲突次数都是 0。有人知道我应该怎么做吗?

1 个答案:

答案 0 :(得分:0)

可能最简单的方法是在适当的地方声明一个数组:

int collisionArray[SIZE]; 

并在构造函数 HashTable::HashTable() 中将其初始化为 0:
// Default constructor: leaves every bucket without a chain and resets every
// per-slot collision counter to zero.
HashTable::HashTable()
{
    int slot = 0;
    while (slot < SIZE)
    {
        hashArray[slot] = NULL;
        collisionArray[slot] = 0;
        ++slot;
    }
}

然后在发现碰撞时增加相应的元素

// Inserts s at the head of the chain for its bucket unless s is already
// stored there. The bucket's collision counter is incremented only when the
// new word lands in a slot that already holds another word, so the first
// word placed in an empty slot is not counted as a collision.
void HashTable::put(string s)
{
    int hash = computeHash(s);
    if (search(hashArray[hash], s) == NULL)
    {
        if (hashArray[hash] != NULL)
        {
            // Slot already occupied by a different word: this is a collision.
            collisionArray[hash]++;
        }
        // Only add the target if it's not in the list
        headInsert(hashArray[hash], s);
    }
}