X-Git-Url: https://code.th-h.de/?p=usenet%2Fnewsstats.git;a=blobdiff_plain;f=groupstats.pl;h=ccd7f869682483e27c7540acf8c548194d62c681;hp=e21aeb78f5380b455ede631a4ff7319508d019a0;hb=89db2f904dc9ddd07bfce9c3fe1fe81b58c1aa8b;hpb=f2ddfd8a923d3276c00daf243a0abf1cbdd8b35b diff --git a/groupstats.pl b/groupstats.pl index e21aeb7..ccd7f86 100755 --- a/groupstats.pl +++ b/groupstats.pl @@ -26,7 +26,7 @@ use DBI; ################################# Main program ################################# ### read commandline options -my %Options = &ReadOptions('m:p:an:o:t:l:b:iscqdg:'); +my %Options = &ReadOptions('m:p:an:o:t:l:b:iscqdf:g:'); ### read configuration my %Conf = %{ReadConfig('newsstats.conf')}; @@ -39,7 +39,13 @@ $ConfOverride{'DBTableGrps'} = $Options{'g'} if $Options{'g'}; ### check for incompatible command line options # you can't mix '-t', '-b' and '-l' # -b/-l take preference over -t, and -b takes preference over -l +# you can't use '-f' with '-b' or '-l' if ($Options{'b'} or $Options{'l'}) { + if ($Options{'f'}) { + # drop -f + warn ("$MySelf: W: You cannot save the report to monthly files when using top lists (-b) or levels (-l). Filename template '-f $Options{'f'}' was ignored.\n"); + undef($Options{'f'}); + }; if ($Options{'t'}) { # drop -t warn ("$MySelf: W: You cannot combine thresholds (-t) and top lists (-b) or levels (-l). Threshold '-t $Options{'t'}' was ignored.\n"); @@ -56,8 +62,8 @@ if ($Options{'b'} or $Options{'l'}) { }; ### check output type -# default output type to 'dump' -$Options{'o'} = 'dump' if !$Options{'o'}; +# default output type to 'pretty' +$Options{'o'} = 'pretty' if !$Options{'o'}; # fail if more than one newsgroup is combined with 'dumpgroup' type die ("$MySelf: E: You cannot combine newsgroup lists (-n) with more than one group with '-o dumpgroup'!\n") if ($Options{'o'} eq 'dumpgroup' and defined($Options{'n'}) and $Options{'n'} =~ /:|\*/); # accept 'dumpgroup' only with -n @@ -66,10 +72,15 @@ if ($Options{'o'} eq 'dumpgroup' and !defined($Options{'n'})) { warn ("$MySelf: W: You must submit exactly one newsgroup ('-n news.group') for '-o dumpgroup'. Output type was set to 'dump'.\n"); }; # set output type to 'pretty' for -l -if ($Options{'l'}) { +if ($Options{'l'} and $Options{'o'} ne 'pretty') { $Options{'o'} = 'pretty'; warn ("$MySelf: W: Output type forced to '-o pretty' due to usage of '-l'.\n"); }; +# set output type to 'dump' for -f +if ($Options{'f'} and $Options{'o'} ne 'dump') { + $Options{'o'} = 'dump'; + warn ("$MySelf: W: Output type forced to '-o dump' due to usage of '-f'.\n"); +}; ### init database my $DBHandle = InitDB(\%Conf,1); @@ -88,14 +99,18 @@ if ($Options{'a'}) { } else { ($StartMonth,$EndMonth) = &GetTimePeriod($Options{'m'},$Options{'p'}); }; -# if time period is more than one month: set output type to '-o pretty' or '-o dumpgroup' +# if -p or -a are set: drop -m +undef $Options{'m'} if ($Options{'p'} or $Options{'a'}); +# if time period is more than one month: force output type to '-o pretty' or '-o dumpgroup' if ($Options{'o'} eq 'dump' and ($Options{'p'} or $Options{'a'})) { if (defined($Options{'n'}) and $Options{'n'} !~ /:|\*/) { - warn ("$MySelf: W: You cannot combine time periods (-p) with '-o dump', changing output type to '-o dumpgroup'.\n"); - $Options{'o'} = 'dumpgroup'; - } else { - warn ("$MySelf: W: You cannot combine time periods (-p) with '-o dump', changing output type to '-o pretty'.\n"); - $Options{'o'} = 'pretty'; + # just one newsgroup is defined + warn ("$MySelf: W: You cannot combine time periods (-p) with '-o dump', changing output type to '-o dumpgroup'.\n"); + $Options{'o'} = 'dumpgroup'; + } elsif (!defined($Options{'f'})) { + # more than one newsgroup - and no file output + warn ("$MySelf: W: You cannot combine time periods (-p) with '-o dump', changing output type to '-o pretty'.\n"); + $Options{'o'} = 'pretty'; } }; @@ -190,12 +205,14 @@ $DBQuery->execute($StartMonth,$EndMonth,@GroupList,@Params) or die sprintf("$MySelf: E: Can't get groups data for %s to %s from %s.%s: %s\n",$StartMonth,$EndMonth,$Conf{'DBDatabase'},$Conf{'DBTableGrps'},$DBI::errstr); # output results +# reset caption (-c) if -f is set +undef($Options{'c'}) if $Options{'f'}; # print caption (-c) with time period if -m or -p is set if ($Options{'c'}) { - if ($Options{'p'}) { - printf ("----- Report from %s to %s\n",$StartMonth,$EndMonth); - } elsif ($Options{'m'}) { + if ($Options{'m'}) { printf ("----- Report for %s\n",$StartMonth); + } else { + printf ("----- Report from %s to %s %s\n",$StartMonth,$EndMonth,$Options{'a'} ? '(all months)' : ''); }; }; # print caption (-c) with newsgroup list if -n is set @@ -204,7 +221,7 @@ printf ("----- Newsgroups: %s\n",join(',',split(/:/,$Newsgroups))) if $Options{' printf ("----- Threshold: %s %u\n",$Options{'i'} ? '<' : '>',$Options{'t'}) if $Options{'c'} and $Options{'t'}; if (!defined($Options{'b'}) and !defined($Options{'l'})) { # default: neither -b nor -l - &OutputData($Options{'o'},$DBQuery,$MaxLength); + &OutputData($Options{'o'},$Options{'f'},$DBQuery,$MaxLength); } elsif ($Options{'b'}) { # -b is set (then -l can't be!) # we have to read in the query results ourselves, as they do not have standard layout @@ -236,7 +253,7 @@ groupstats - create reports on newsgroup usage =head1 SYNOPSIS -B [B<-Vhiscqd>] [B<-m> I | B<-p> I | B<-a>] [B<-n> I] [B<-t> I] [B<-l> I] [B<-b> I] [B<-o> I] [B<-g> I] +B [B<-Vhiscqd>] [B<-m> I | B<-p> I | B<-a>] [B<-n> I] [B<-t> I] [B<-l> I] [B<-b> I] [B<-o> I] [B<-f> I] [B<-g> I] =head1 REQUIREMENTS @@ -286,10 +303,9 @@ period by using B<-l> (together with B as needed). Last but not least you can create a "best of" list of the top x newsgroups via B<-b> (or a "worst of" list by adding B). -By default, B will dump a very simple alphabetical list of -newsgroups, one per line, followed by the number of postings in that -month. This output format of course cannot sensibly be combined with -time periods, so you can set the output format by using B<-o> (see +By default, B will dump an alphabetical list of newsgroups, +one per line, followed by the number of postings in that group, for +every month. You can change the output format by using B<-o> (see below). Captions can be added by setting the B<-c> switch. =head2 Configuration @@ -355,7 +371,7 @@ postings every single month will be included. Output will be ordered by newsgroup name, followed by month. This setting will be ignored if B<-b> is set. Overrides B<-t> and -can't be used together with B<-q> or B<-d>. +can't be used together with B<-q>, B<-d> or B<-f>. =item B<-b> I (best of) @@ -364,8 +380,8 @@ whole reporting period. Can be inverted by the B<-i> switch so that a list of the I newsgroups with the least postings over the whole period is generated. Output will be ordered by sum of postings. -Overrides B<-t> and B<-l> and can't be used together with B<-q> or -B<-d>. Output format is set to I (see below). +Overrides B<-t> and B<-l> and can't be used together with B<-q>, B<-d> +or B<-f>. Output format is set to I (see below). =item B<-i> (invert) @@ -385,10 +401,18 @@ See the B man page for details. =item B<-o> I (output format) -Set output format. Default is I, consisting of an alphabetical -list of newsgroups, each on a new line, followed by the number of -postings in that month. This default format can't be used with time -periods of more than one month. +Set output format. Default is I, which will print a header for +each new month, followed by an alphabetical list of newsgroups, each +on a new line, followed by the number of postings in that month. +B will try to align newsgroup names and posting counts. +Usage of B<-b> will force this format; it cannot be used together with +B<-f>. + +I format is used to create an easily parsable output consisting +of an alphabetical list of newsgroups, each on a new line, followed by +the number of postings in that month, without any alignment. This +default format can't be used with time periods of more than one month. +Usage of B<-f> will force this format. I format is like I, but will print the month in front of the newsgroup name. @@ -397,14 +421,12 @@ I format can only be use with a group list (see B<-n>) of exactly one newsgroup and is like I, but will output months, followed by the number of postings. -If you don't need easily parsable output, you'll mostly use I -format, which will print a header for each new month and try to align -newsgroup names and posting counts. Usage of B<-b> will force this -format. - =item B<-c> (captions) -Add captions to output (reporting period, newsgroups list, threshold). +Add captions to output (reporting period, newsgroups list, threshold +and so on). + +This setting will be ignored if B<-f> is set. =item B<-q> (quantity of postings) @@ -418,6 +440,20 @@ Change sort order to descending. Cannot be used with B<-l> or B<-b>. +=item B<-f> I (output file) + +Save output to file instead of dumping it to STDOUT. B +will create one file for each month, with filenames composed by +adding year and month to the I, for example +with B<-f> I: + + stats-2010-01 + stats-2010-02 + ... and so on + +This setting will be ignored if B<-l> or B<-b> is set. Output format +is set to I (see above). + =item B<-g> I (postings per group table) Override I from F.