我正在尝试将HTML转换为文本转换后的文件到哈希表中,以便稍后检索它们。我不明白如何实现它。请帮我。如何将文本文件存储到哈希表中?
package hashTable;
import java.io.BufferedReader;
import java.io.BufferedWriter;
import java.io.File;
import java.io.FileReader;
import java.io.FileWriter;
import java.io.IOException;
import java.math.BigInteger;
import java.util.Scanner;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
public class HashMap {
// Setting table size to a max of 32, value used to modulus for hash value.
private final static int TABLE_SIZE = 32;
HashEntry[] table;
HashMap() {
table = new HashEntry[TABLE_SIZE];
for (int i = 0; i < TABLE_SIZE; i++)
table[i] = null;
}
/* function to retrieve value from the table according to key */
public int get(String key) {
int hash = new BigInteger(toAscii(key)).mod(new BigInteger(((Integer)TABLE_SIZE).toString())).intValue();
while (table[hash] != null && table[hash].getKey() != key)
hash = (hash + 1) % TABLE_SIZE;
if (table[hash] == null)
return -1;
else
return table[hash].getValue();
}
/* function to add value to the table */
public void put(String key, int value) {
//creating hash code using key value given as a string
int hash = new BigInteger(toAscii(key)).mod(new BigInteger(((Integer)TABLE_SIZE).toString())).intValue();
while (table[hash] != null && table[hash].getKey() != key)
hash = (hash + 1) % TABLE_SIZE;
table[hash] = new HashEntry(key, value);
}
/* value to create the Hash code from he name entered, basically converting name to ASCII */
public static String toAscii(String s){
StringBuilder sb = new StringBuilder();
long asciiInt;
// loop through all values in the string, including blanks
for (int i = 0; i < s.length(); i++){
//getting Ascii value of character and adding it to the string.
char c = s.charAt(i);
asciiInt = (int)c;
sb.append(asciiInt);
}
return String.valueOf(sb);
}
public void HtmltoText(String fn){
try{
String uri="C:/Users/Bharadwaj/Downloads/W3C Web Pages";
BufferedReader in = new BufferedReader(new FileReader(uri));
String st=new String();
String str;
while((str=in.readLine())!=null){
st += "\n" + str.replace("<br", "\n<br");
}
Document s=Jsoup.parse(st);
// System.out.println(s1);
String text=s.text();
// System.out.println(filename.substring(0,filename.length()-4));
String txtpath="C:/Users/Bharadwaj/Downloads/W3C Web Pages/Text";
System.out.println(text);
String newname=txtpath+fn.substring(0,(fn.length()-4))+".txt";
BufferedWriter writerTxt = new BufferedWriter(new FileWriter(newname));
writerTxt.write(text);
writerTxt.close();
}catch(Exception e){
e.printStackTrace();
}
}
public static void main(String[]args) throws IOException{
HashMap entry = new HashMap();
String uri="C:/Users/Bharadwaj/Downloads/W3C Web Pages";
File fil=new File(uri);
System.out.println(fil);
entry.HtmltoText(uri);
}
}
答案 0 :(得分:1)
将一些大型文件存储在一个hashmap中并不是一个好主意,但如果你坚持认为可以尝试以下方法:
<Integer, String>
&#39}插入到散列图中。瞧! 现在你有一个包含所有文件的hashmap。当然可能会发生异常,例如在阅读反斜杠等特殊字符时......
答案 1 :(得分:0)
为什么不将文件存储在filesytem上,只是将路径放到地图中的文件中?