|
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113 |
#include <string.h>

#include <algorithm>
#include <cctype>
#include <cstddef>
#include <fstream>
#include <iostream>
#include <map>
#include <string>
#include <utility>
#include <vector>

namespace {

// Maximum number of words listed in the report.
const std::size_t kTopWordCount = 10;

// A word together with the number of times it occurred.
typedef std::pair<std::string, int> WordCount;

// Returns true for characters that terminate a word: ',', '.' and any
// whitespace. Newlines and tabs are included so that words on adjacent
// lines are not glued together.
bool isDelimiter(char ch) {
    return ch == ',' || ch == '.' ||
           std::isspace(static_cast<unsigned char>(ch)) != 0;
}

// Folds ASCII 'A'-'Z' to lower case and leaves every other byte untouched,
// so multi-byte text passes through unchanged.
char toLowerAscii(char ch) {
    return (ch >= 'A' && ch <= 'Z') ? static_cast<char>(ch - 'A' + 'a') : ch;
}

// Reads `in` to end-of-stream and returns how often each lower-cased word
// occurs. Runs of consecutive delimiters never produce an empty word.
std::map<std::string, int> countWords(std::istream& in) {
    std::map<std::string, int> counts;
    std::string word;
    char ch;
    while (in.get(ch)) {
        if (isDelimiter(ch)) {
            if (!word.empty()) {
                ++counts[word];
                word.clear();
            }
        } else {
            word += toLowerAscii(ch);
        }
    }
    // The last word may be terminated by end-of-file instead of a delimiter.
    if (!word.empty()) {
        ++counts[word];
    }
    return counts;
}

// Ordering for the report: higher count first; equal counts are ordered
// alphabetically so the output is deterministic.
bool moreFrequent(const WordCount& lhs, const WordCount& rhs) {
    if (lhs.second != rhs.second) {
        return lhs.second > rhs.second;
    }
    return lhs.first < rhs.first;
}

}  // namespace

// Prints the (up to) ten most frequent words of the input text file together
// with their occurrence counts. Comparison is case-insensitive for ASCII
// letters. Returns 0 on success and 1 if the file cannot be opened.
int main() {
    // NOTE(review): "F:wen\\wenben.txt" is a drive-relative path; it may have
    // been meant as "F:\\wen\\wenben.txt" -- confirm before changing.
    std::ifstream inFile("F:wen\\wenben.txt", std::ios::in);
    if (!inFile) {
        std::cout << "打开文件失败" << '\n';
        return 1;
    }

    const std::map<std::string, int> counts = countWords(inFile);

    // Only the leading `shown` entries need to be in order.
    std::vector<WordCount> ranked(counts.begin(), counts.end());
    const std::size_t shown = std::min(kTopWordCount, ranked.size());
    std::partial_sort(ranked.begin(),
                      ranked.begin() + static_cast<std::ptrdiff_t>(shown),
                      ranked.end(), moreFrequent);

    std::cout << "该文档中出现次数最高的10个单词依次是:" << '\n';
    for (std::size_t i = 0; i < shown; ++i) {
        std::cout << ranked[i].first << " ";
        std::cout << "出现的次数为" << ranked[i].second << '\n';
    }
    return 0;
}
统计文本文档中出现次数最多的前10个单词,布布扣,bubuko.com
原文:http://www.cnblogs.com/xuxiaoyi/p/3577538.html