1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59
| public static void main(String[] args) { LinkedHashMap<String,Integer> map =new LinkedHashMap<>(); String[] docxFiles= IOHelpers.getFilesRecursively("D:/JavaTest1/ExcelTest2","docx"); for (String docxFile:docxFiles) { String str = WordHelpers.readAllText(docxFile); String[] texts = str.toLowerCase().split("\\s|\\.|\\,|\\:|\\!|\\?|;|\\(|\\)"); for (String text :texts) { if (!isEnglishWord(text)) { continue; }
if (text.equals("")) { continue; } Integer frqe =map.get(text); if (frqe==null) { map.put(text,1); } else { map.put(text,frqe+1);
}
} String outputString =""; for (String word:map.keySet()) { int freq =map.get(word); outputString =outputString+word+"="+freq+"\r\n";
} IOHelpers.writeAllText("D:/JavaTest1/ExcelTest2/1.txt",outputString);
}
} public static boolean isEnglishWord(String s) { int numbers=s.length(); for (int i =0;i<numbers;i++) { char ch =s.charAt(i); if (Character.isLowerCase(ch)==false) { return false; } } return true; }
|