2 * SARG Squid Analysis Report Generator http://sarg.sourceforge.net
6 * please look at http://sarg.sourceforge.net/donations.php
8 * http://sourceforge.net/projects/sarg/forums/forum/363374
9 * ---------------------------------------------------------------------
11 * This program is free software; you can redistribute it and/or modify
12 * it under the terms of the GNU General Public License as published by
13 * the Free Software Foundation; either version 2 of the License, or
14 * (at your option) any later version.
16 * This program is distributed in the hope that it will be useful,
17 * but WITHOUT ANY WARRANTY; without even the implied warranty of
18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
19 * GNU General Public License for more details.
21 * You should have received a copy of the GNU General Public License
22 * along with this program; if not, write to the Free Software
23 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111, USA.
27 #include "include/conf.h"
28 #include "include/defs.h"
30 #ifdef ENABLE_DOUBLE_CHECK_DATA
31 extern struct globalstatstruct globstat
;
43 char general2
[MAXLEN
];
44 char general3
[MAXLEN
];
52 long long int tnacc
=0;
53 long long int tnbytes
=0;
54 long long int tntime
=0;
55 long long int twork1
=0, twork2
=0, twork3
=0;
56 #ifdef ENABLE_DOUBLE_CHECK_DATA
57 long long int ttnacc
=0;
58 long long int ttnbytes
=0;
59 long long int ttntime
=0;
65 struct getwordstruct gwarea
;
67 struct generalitemstruct item
;
70 if (debugz
) debugaz(_("Top sites report not produced because privacy option is on\n"));
74 sprintf(general
,"%s/sarg-general",outdirname
);
75 sprintf(sites
,"%s/sarg-sites",outdirname
);
76 sprintf(general2
,"%s/sarg-general2",outdirname
);
77 sprintf(general3
,"%s/sarg-general3",outdirname
);
79 sprintf(report
,"%s/topsites.html",outdirname
);
81 if (snprintf(csort
,sizeof(csort
),"sort -t \"\t\" -k 4,4 -o \"%s\" \"%s\"",general2
,general
)>=sizeof(csort
)) {
82 debuga(_("Sort command too long when sorting file \"%s\" to \"%s\"\n"),general
,general2
);
85 cstatus
=system(csort
);
86 if (!WIFEXITED(cstatus
) || WEXITSTATUS(cstatus
)) {
87 debuga(_("sort command return status %d\n"),WEXITSTATUS(cstatus
));
88 debuga(_("sort command: %s\n"),csort
);
92 if((fp_in
=fopen(general2
,"r"))==NULL
) {
93 debuga(_("(topsites) Cannot open log file %s\n"),general2
);
94 debuga(_("sort command: %s\n"),csort
);
98 if((fp_ou
=fopen(general3
,"w"))==NULL
) {
99 debuga(_("(topsites) Cannot open log file %s\n"),general3
);
103 if ((line
=longline_create())==NULL
) {
104 debuga(_("Not enough memory to read file %s\n"),general2
);
108 while((buf
=longline_read(fp_in
,line
))!=NULL
) {
109 ger_read(buf
,&item
,general2
);
110 if(item
.total
) continue;
113 url_len
=strlen(item
.url
);
114 if (!ourl
|| url_len
>=ourl_size
) {
116 ourl
=realloc(ourl
,ourl_size
);
118 debuga(_("Not enough memory to store the url\n"));
122 strcpy(ourl
,item
.url
);
126 if(strcmp(item
.url
,ourl
) != 0) {
128 This complicated printf is due to Microsoft's inability to comply with any standard. Msvcrt is unable
129 to print a long long int unless it is exactly 64-bits long.
131 fprintf(fp_ou
,"%"PRIu64
"\t%"PRIu64
"\t%"PRIu64
"\t%s\n",(uint64_t)tnacc
,(uint64_t)tnbytes
,(uint64_t)tntime
,ourl
);
132 url_len
=strlen(item
.url
);
133 if (url_len
>=ourl_size
) {
135 ourl
=realloc(ourl
,ourl_size
);
137 debuga(_("Not enough memory to store the url\n"));
141 strcpy(ourl
,item
.url
);
148 tnbytes
+=item
.nbytes
;
150 #ifdef ENABLE_DOUBLE_CHECK_DATA
152 ttnbytes
+=item
.nbytes
;
157 longline_destroy(&line
);
161 This complicated printf is due to Microsoft's inability to comply with any standard. Msvcrt is unable
162 to print a long long int unless it is exactly 64-bits long.
164 fprintf(fp_ou
,"%"PRIu64
"\t%"PRIu64
"\t%"PRIu64
"\t%s\n",(uint64_t)tnacc
,(uint64_t)tnbytes
,(uint64_t)tntime
,ourl
);
170 #ifdef ENABLE_DOUBLE_CHECK_DATA
171 if (ttnacc
!=globstat
.nacc
|| ttnbytes
!=globstat
.nbytes
|| ttntime
!=globstat
.elap
) {
172 debuga(_("Total statistics mismatch when reading %s to produce the top sites\n"),general2
);
177 if (unlink(general2
)) {
178 debuga(_("Cannot delete %s - %s\n"),general2
,strerror(errno
));
182 if((TopsitesSort
& TOPSITE_SORT_CONNECT
) != 0) {
183 sortf
="-k 1,1 -k 2,2";
184 } else if((TopsitesSort
& TOPSITE_SORT_BYTES
) != 0) {
185 sortf
="-k 2,2 -k 1,1";
186 } else if((TopsitesSort
& TOPSITE_SORT_TIME
) != 0) {
189 sortf
="-k 2,2 -k 1,1"; //default is BYTES
191 if((TopsitesSort
& TOPSITE_SORT_REVERSE
) != 0) {
197 if (snprintf(csort
,sizeof(csort
),"sort -t \"\t\" %s -n %s -o \"%s\" \"%s\"",sortt
,sortf
,sites
,general3
)>=sizeof(csort
)) {
198 debuga(_("Sort command too long when sorting file \"%s\" to \"%s\"\n"),general3
,sites
);
201 cstatus
=system(csort
);
202 if (!WIFEXITED(cstatus
) || WEXITSTATUS(cstatus
)) {
203 debuga(_("sort command return status %d\n"),WEXITSTATUS(cstatus
));
204 debuga(_("sort command: %s\n"),csort
);
207 if((fp_in
=fopen(sites
,"r"))==NULL
) {
208 debuga(_("(topsites) Cannot open log file %s\n"),sites
);
209 debuga(_("sort command: %s\n"),csort
);
213 if (unlink(general3
)) {
214 debuga(_("Cannot delete %s - %s\n"),general3
,strerror(errno
));
218 if((fp_ou
=fopen(report
,"w"))==NULL
) {
219 debuga(_("(topsites) Cannot open log file %s\n"),report
);
223 write_html_header(fp_ou
,(IndexTree
== INDEX_TREE_DATE
) ? 3 : 1,_("Top sites"),HTML_JS_SORTTABLE
);
224 fputs("<tr><td class=\"header_c\">",fp_ou
);
225 fprintf(fp_ou
,_("Period: %s"),period
.html
);
226 fputs("</td></tr>\n",fp_ou
);
227 fputs("<tr><th class=\"header_c\">",fp_ou
);
228 fprintf(fp_ou
,_("Top %d sites"),TopSitesNum
);
229 fputs("</th></tr>\n",fp_ou
);
230 close_html_header(fp_ou
);
232 fputs("<div class=\"report\"><table cellpadding=\"1\" cellspacing=\"2\"",fp_ou
);
233 if (SortTableJs
[0]) fputs(" class=\"sortable\"",fp_ou
);
235 fprintf(fp_ou
,"<thead><tr><th class=\"header_l\">%s</th><th class=\"header_l",_("NUM"));
236 if (SortTableJs
[0]) fputs(" sorttable_alpha",fp_ou
);
237 fprintf(fp_ou
,"\">%s</th><th class=\"header_l\">%s</th><th class=\"header_l\">%s</th><th class=\"header_l\">%s</th></tr></thead>\n",_("ACCESSED SITE"),_("CONNECT"),_("BYTES"),_("TIME"));
242 if ((line
=longline_create())==NULL
) {
243 debuga(_("Not enough memory to read file %s\n"),sites
);
247 while(regs
<TopSitesNum
&& (buf
=longline_read(fp_in
,line
))!=NULL
) {
248 getword_start(&gwarea
,buf
);
249 if (getword_atoll(&nacc
,&gwarea
,'\t')<0) {
250 debuga(_("Maybe you have a broken record or garbage in your %s file\n"),sites
);
253 if (nacc
== 0) continue;
254 if (getword_atoll(&nbytes
,&gwarea
,'\t')<0 || getword_atoll(&ntime
,&gwarea
,'\t')<0) {
255 debuga(_("Maybe you have a broken record or garbage in your %s file\n"),sites
);
258 if (getword_ptr(buf
,&url
,&gwarea
,'\t')<0) {
259 debuga(_("The url is invalid in file %s\n"),sites
);
267 fprintf(fp_ou
,"<tr><td class=\"data\">%d</td><td class=\"data2\">",++regs
);
269 if(BlockIt
[0] != '\0' && url
[0]!=ALIAS_PREFIX
) {
270 fprintf(fp_ou
,"<a href=\"%s%s?url=\"",wwwDocumentRoot
,BlockIt
);
271 output_html_url(fp_ou
,url
);
272 fputs("\"><img src=\"../images/sarg-squidguard-block.png\"></a> ",fp_ou
);
275 output_html_link(fp_ou
,url
,100);
276 fputs("</td><td class=\"data\"",fp_ou
);
277 if (SortTableJs
[0]) fprintf(fp_ou
," sorttable_customkey=\"%"PRId64
"\"",(uint64_t)twork1
);
278 fprintf(fp_ou
,">%s</td>",fixnum(twork1
,1));
279 fputs("<td class=\"data\"",fp_ou
);
280 if (SortTableJs
[0]) fprintf(fp_ou
," sorttable_customkey=\"%"PRId64
"\"",(uint64_t)twork2
);
281 fprintf(fp_ou
,">%s</td>",fixnum(twork2
,1));
282 fputs("<td class=\"data\"",fp_ou
);
283 if (SortTableJs
[0]) fprintf(fp_ou
," sorttable_customkey=\"%"PRId64
"\"",(uint64_t)twork3
);
284 fprintf(fp_ou
,">%s</td></tr>\n",fixtime(twork3
));
287 longline_destroy(&line
);
289 fputs("</table></div>\n",fp_ou
);
290 if (write_html_trailer(fp_ou
)<0)
291 debuga(_("Write error in file %s\n"),report
);
292 if (fclose(fp_ou
)==EOF
)
293 debuga(_("Failed to close file %s - %s\n"),report
,strerror(errno
));