Jump to content

User:AnomieBOT/source/tasks/WikiProjectWorker.pm: Difference between revisions

From Wikipedia, the free encyclopedia
Content deleted Content added
AnomieBOT (talk | contribs)
Updating published sources: WikiProjectWorker: * Start run for WikiProject Geology.
AnomieBOT (talk | contribs)
Updating published sources: WikiProjectWorker: * Actually start run for WikiProject Geology.
Line 102: Line 102:


sub approved {
sub approved {
return -1;
return 1;
}
}



Revision as of 19:03, 7 September 2012

package tasks::WikiProjectWorker;

=pod

=begin metadata

Bot:      AnomieBOT
Task:     WikiProjectWorker
BRFA:     Wikipedia:Bots/Requests for approval/AnomieBOT 28
Status:   Approved 2009-04-08
Created:  2009-03-27
OnDemand: true

Perform various tasks at the request of the affected WikiProjects:
* Add or remove banners on a specific set of pages (e.g. pages in a category, pages transcluding a template).
* Adjust banner parameters, particularly assessments and task forces.
* Fix banner shells on pages edited for the above reasons.

=end metadata

=cut

use utf8;
use strict;

use Data::Dumper;
use Digest::SHA qw/sha256_base64/;
use AnomieBOT::Task;
use vars qw/@ISA/;
@ISA=qw/AnomieBOT::Task/;

### Request link, for edit summary.
# run() appends this to every edit summary as "... per $req".
my $req="[[User:AnomieBOT/req/WikiProject Geology 1|request]]";

### Increment this number every time a new run is started, so we don't have to
### mess around with deleting previous runs' database entries.
# run() records this value in the task store under each processed page id and
# skips any page whose stored value is already >= $seq.
my $seq=19;

### How to find the pages?
# Category titles handed to the categorymembers generator below.
my @cats=(
	'Category:Unknown-importance Geology articles',
);
# One hash of query parameters per iterator; run() shifts them off one at a
# time and passes each to $api->iterator().
my @iterators=(
    {
        generator  => 'categorymembers',
        gcmtitle   => [@cats],
        gcmlimit   => 100,
    },
);

### Filter function: given a page record (hashref with 'title' and 'ns'),
### work out which talk page should be tagged and return its title (or undef
### to skip the page).
###
### Note that the record's 'title' is rewritten in place, so the caller sees
### the talk-page title in the hash it passed in:
###  * namespace 0 gets a "Talk:" prefix;
###  * any other even-numbered namespace gets " talk" appended to its prefix;
###  * odd-numbered namespaces are left untouched.
sub filter {
    my $page = $_[0];
    my $ns   = $page->{'ns'};

    if($ns == 0){
        $page->{'title'} = 'Talk:' . $page->{'title'};
    }
    elsif(!($ns & 1)){
        # Even and non-zero: turn "Prefix:Name" into "Prefix talk:Name".
        $page->{'title'} =~ s/^([^:]*):/$1 talk:/;
    }

    return $page->{'title'};
}

### How to copy other projects' assessments
### copy_class: the class value to apply to the banner. For this run no class
### is copied, so the result is always the empty string; the WPBmax-based
### alternative is kept below for runs that do want it.
sub copy_class {
    #return ($_[0]->WPBmax($_[2]))[0];
    my $class = '';
    return $class;
}

# copy_importance: the importance value to apply to the banner. For this run
# every page gets the fixed value 'Low'; the WPBmax-based alternative is kept
# below for runs that copy it from other banners instead.
sub copy_importance {
    #return ($_[0]->WPBmax($_[2]))[1];
    my $importance = 'Low';
    return $importance;
}

# Banner configurations.
# Name of the banner template that run() checks for and adds/updates.
my $main_banner='WikiProject Geology';
# Templates to be merged into the main banner. While this list is empty, run()
# skips its preprocessing step entirely.
my @preprocess_templates=();
# Per-banner settings, keyed by banner name. As used in run():
#  * meta         - when the key exists, the config is passed through
#                   $api->WPBMetaConfig() before being handed to WPBconfig.
#  * canonicalize - name that replaces the template name when run() rewrites
#                   the banner.
# run() also stores a 'stubauto' entry into each banner's hash at load time.
my %banner_cfgs=(
    'WikiProject Geology' => {
        meta => 1,
        canonicalize => 'WikiProject Geology',
    },
);

# Banner names that the callbacks in run() treat as "the main banner".
my @main_banners=(
    $main_banner,
);

# Constructor. Lets the parent class build the object, then adds the state
# that run() keeps between calls:
#   'config loaded' - false until the banner configs have been loaded
#   'iter'          - the iterator currently being walked, if any
#   'iterators'     - a private copy of the iterator specs still to be run
sub new {
    my ($class) = @_;

    my $self = $class->SUPER::new();
    @{$self}{'config loaded', 'iter', 'iterators'} = (0, undef, [@iterators]);

    return bless $self, $class;
}

=pod

=for info
Approved 2009-04-08<br />[[Wikipedia:Bots/Requests for approval/AnomieBOT 28]]

=cut

sub approved {
    # Approval flag for this task; see the "=for info" block above for the
    # approval record. Presumably read by the bot framework to decide whether
    # the task may run -- confirm against AnomieBOT::Task.
    my $approval = 1;
    return $approval;
}

# Main task entry point: walk the configured iterators and tag or update the
# talk page of every page they yield.
#
# Parameters:
#   $self - this task object; its 'config loaded', 'iter' and 'iterators'
#           fields carry state from one call to the next.
#   $api  - bot API object used for all queries, edits, logging and storage.
#
# Returns a number. Judging by the comments in the body this is presumably the
# number of seconds to wait before run() is called again (TODO confirm against
# the caller):
#   60  - the iterator or the page-info query reported an error
#   300 - the edit-token request said the task is shut off
#   0   - the 5-minute time budget was used up
#   600 - every iterator has been exhausted
sub run {
    my ($self, $api)=@_;
    # NOTE(review): $res is never used in this sub.
    my $res;

    $api->task('WikiProjectWorker', 0, 10, qw/d::WikiProjectTagging/);
    # Trailer appended to every edit summary, pointing at the shutoff page.
    my $errto = 'Errors? [[User:'.$api->user.'/shutoff/WikiProjectWorker]]';

    # Load configs, if necessary
    if(!$self->{'config loaded'}){
        my %cfg=();
        while(my ($banner,$cfg)=each %banner_cfgs){
            # Banners with a 'meta' key get their config from WPBMetaConfig.
            $cfg=$api->WPBMetaConfig($cfg->{'meta'}, %$cfg) if exists($cfg->{'meta'});
            $cfg{$banner}=$cfg;
            # Keep the resulting stubauto value so the WPBadd callback below
            # can read it from %banner_cfgs.
            $banner_cfgs{$banner}{'stubauto'}=$cfg->{'stubauto'};
        }
        $api->WPBconfig(%cfg);

        $self->{'config loaded'}=1;
    }
    # NOTE(review): this block is empty and 'configured' is never written
    # here, so the condition currently has no effect.
    if(($api->store->{'configured'} // 0) < $seq){
        ### Initialize configuration here
    }

    # Spend a max of 5 minutes on this task before restarting
    my $endtime=time()+300;

    while(1){
        # Resume the iterator left over from a previous call, or start the
        # next one from the list; stop when the list is empty.
        my $iter=$self->{'iter'};
        if(!defined($iter)){
            my $i=shift @{$self->{'iterators'}};
            last unless $i;
            $iter=$api->iterator(%$i);
            $self->{'iter'}=$iter;
        }
        while(my $page=$iter->next()){
            if(!$page->{'_ok_'}){
                $api->warn("Could not retrieve page from iterator: ".$page->{'error'}."\n");
                return 60;
            }

            # Skip pages already handled in this run (or a later one).
            my $pageid=$page->{'pageid'};
            next if ($api->store->{$pageid} // 0) >= $seq;

            # filter() rewrites $page->{'title'} in place, so from here on
            # $page->{'title'} holds the same talk-page title as $title.
            my $title=filter($page);
            if(!defined($title)){
                $api->log("Skipping ".$page->{'title'}.", filter returned undef");
                $api->store->{$pageid}=$seq;
                next;
            }

            my $tok=$api->edittoken($title, EditRedir => 1);
            if($tok->{'code'} eq 'shutoff'){
                $api->warn("Task disabled: ".$tok->{'content'}."\n");
                return 300;
            }
            if($tok->{'code'} ne 'success'){
                # Not recorded in the store, so the page is retried later.
                $api->warn("Failed to get edit token for $title: ".$tok->{'error'}."\n");
                next;
            }
            # Only odd-numbered (talk) namespaces are edited.
            if(($tok->{'ns'}&1)==0){
                $api->log("Cannot edit $title: namespace ".$tok->{'ns'}." is non-talk");
                $api->store->{$pageid}=$seq;
                next;
            }
            if(exists($tok->{'redirect'})){
                $api->log("$title is a redirect, skipping.");
                $api->store->{$pageid}=$seq;
                next;
            }

            $api->log("Checking $title...");

            # Current page text (empty if there is no revision); the
            # stripped portions are put back by replace_nowiki before the
            # comparison with $intxt below.
            my $intxt=$tok->{'revisions'}[0]{'*'} // '';
            my ($outtxt,$nowiki)=$api->strip_nowiki($intxt);

            # "name=value" strings to apply to the main banner.
            my @params=();

            my $assess = undef;
            my $class = copy_class($api, $title, $intxt);
            # A hashref result is treated as an error record.
            if(ref($class) eq 'HASH'){
                $api->warn("Processing $title failed: ".$class->{'error'}."\n");
                next;
            }
            $class=~s/^\s+|\s+$//g;
            $assess=$api->WPBassess($title);
            if(ref($assess) eq 'HASH'){
                if($assess->{'code'} eq 'pagemissing'){
                    # No subject page, doesn't matter
                    $assess=undef;
                } else {
                    $api->warn("Processing $title failed: ".$assess->{'error'}."\n");
                    next;
                }
            }
            # No explicit class is set when there is nothing to copy or when
            # it equals the WPBassess result; otherwise the explicit class
            # is used and the WPBassess result is dropped.
            if($class eq '' || lc($class) eq lc($assess)){
                $class='';
            } else {
                $assess=undef;
                push @params, "class=$class";
                my $imp = copy_importance($api, $title, $intxt);
                if(ref($imp) eq 'HASH'){
                    $api->warn("Processing $title failed: ".$imp->{'error'}."\n");
                    next;
                }
                push @params, "importance=$imp" if ($imp//'') ne '';
            }

            # NOTE(review): when the else-branch above has already pushed an
            # importance parameter, this block pushes it a second time.
            if(1){ # Always copy importance?
                my $imp = copy_importance($api, $title, $intxt);
                if(ref($imp) eq 'HASH'){
                    $api->warn("Processing $title failed: ".$imp->{'error'}."\n");
                    next;
                }
                push @params, "importance=$imp" if ($imp//'') ne '';
            }

            # True when WPBcheck reports 0 for the main banner -- presumably
            # meaning the banner is not on the page yet (TODO confirm).
            my $need_main_banner = ($api->WPBcheck($outtxt, $main_banner) == 0);
            # Disabled alternative check, kept for reference.
            if(0){
                # grr, already redirected so the above always returns true
                $need_main_banner=1;
                $api->WPBcheck($outtxt, sub {
                        my $banner=shift;
                        my $name=shift;
                        $need_main_banner=0 if(grep $name eq $_, @main_banners);
                        return undef;
                    }, $main_banner);
            }

            ### PROCESSING ###

            # @merge: names of templates folded into the main banner.
            # @summary: fragments that are joined into the edit summary.
            my @merge=();
            my @summary=();

            # Only runs when there are templates to merge into the main banner.
            if(@preprocess_templates){
                (undef,$outtxt)=$api->WPBcheck($outtxt, sub {
                    my $banner=shift;
                    my $name=shift;
                    my $oname=shift;
                    my $params=shift;
                    my $wikitext=shift;

                    # Leave the main banner(s) alone.
                    return undef if(grep $name eq $_, @main_banners);

                    push @merge, $oname;

                    # The first merged template is replaced by a bare main
                    # banner if one is still needed; the rest are replaced
                    # by the empty string.
                    return '' unless $need_main_banner;
                    $need_main_banner=0;
                    return "{{$main_banner}}";
                }, @preprocess_templates);
                if(ref($outtxt) eq 'HASH'){
                    $api->warn("Preprocessing $title failed: ".$outtxt->{'error'}."\n");
                    next;
                }
                if(@merge){
                    $merge[-1]='and '.$merge[-1] if @merge>1;
                    push @summary, "merging ".join((@merge>2)?', ':' ', @merge)." into $main_banner" if @merge;
                } else {
                    # Nothing was merged: skip the page without recording it.
                #    $api->warn("$title contains ".$iter->iterval.", but not in section 0\n");
                    next;
                }
            }

            # NOTE(review): $tag is never used, and the $page value
            # reloaded below is not read again in this sub.
            my $tag;
            my $pg=$title;
            $pg=~s/^Talk://;
            # Because filter() already rewrote $page->{'title'}, this
            # compares the talk-page title with $pg.
            if($page->{'title'} ne $pg){
                $page=$api->query(
                    titles       => $pg,
                    prop         => 'info',
                    redirects    => 1,
                );
                if($page->{'code'} ne 'success'){
                    $api->warn("Could not load $pg info: ".$page->{'error'}."\n");
                    return 60;
                }

                $page=(values %{$page->{'query'}{'pages'}})[0];
            }

            # Add or update the main banner. The callback returns undef for
            # banners it does not handle, the unchanged $wikitext when no
            # parameter changed, or freshly built template text.
            $outtxt=$api->WPBadd($outtxt, $assess, sub {
                my $banner=shift; # banner
                my $name=shift; # name
                my $oname=shift;
                my $params=shift;
                my $wikitext=shift;
                my $new=shift;
                #return '' if $new;

                return undef unless(grep $banner eq $_, @main_banners);
                my %cfg=%{$banner_cfgs{$banner}};

                # Set to 1 once something changed that is worth rewriting
                # the banner for.
                my $any=0;
                foreach my $p (@params){
                    # Split "key=value"; anything else is ignored.
                    next unless $p=~/^(.+?)=(.*)$/;
                    my ($k,$v)=($1,$2);
                    # Existing values matching $re are left alone.
                    # NOTE(review): as interpolated below, this only matches
                    # a value that is exactly one non-whitespace character;
                    # confirm that is intended.
                    my $re=qr/\S/;
                    unless(grep(/^\s*\Q$k\E\s*=\s*$re\s*$/, @$params)){
                        # Already set to exactly this value: nothing to do.
                        next if(grep(/^\s*\Q$k\E\s*=\s*\Q$v\E\s*$/s, @$params));
                        # Replace the value of an existing "$k=" entry in
                        # place, keeping its surrounding whitespace; if there
                        # is no such entry, put "$k=$v" at the front.
                        unshift @$params, "$k=$v" unless(grep(s/^(\s*\Q$k\E\s*=\s*?)(?:\S.*?)?(\s*)$/$1$v$2/s, @$params));
                        $any=1 unless $v eq '';
                        # When the class changes on a meta banner that has a
                        # stubauto setting, set that parameter to "inherit".
                        if($k eq 'class' && ($cfg{'meta'}//0) && ($cfg{'stubauto'}//'')){
                            my $aa=$cfg{'stubauto'};
                            # Drop everything from the first "=" onwards.
                            $aa=~s/\s*=.*//;
                            push @$params, "$aa=inherit" unless(grep(s/^(\s*\Q$aa\E\s*=\s*?)(?:\S.*?)?(\s*)$/$1inherit$2/s, @$params));
                        }
                    }
                }
                # Same stubauto handling for a newly added banner that
                # carries an explicit class.
                if($new && $class && (grep /^class=/, @$params) && ($cfg{'meta'}//0) && ($cfg{'stubauto'}//'')){
                    my $aa=$cfg{'stubauto'};
                    $aa=~s/\s*=.*//;
                    push @$params, "$aa=inherit" unless(grep(s/^(\s*\Q$aa\E\s*=\s*?)(?:\S.*?)?(\s*)$/$1inherit$2/s, @$params));
                    $any=1;
                }
                return $wikitext unless $any;

                # Swap the template name for the canonical one, keeping any
                # leading and trailing whitespace.
                if(defined($cfg{'canonicalize'})){
                    my $n=$cfg{'canonicalize'};
                    $oname=~s/_/ /g;
                    $oname=~s/^(\s*)\S(?:.*\S)?(\s*)$/$1$n$2/is;
                }
                my $out="{{$oname";
                $out.="|".join("|", @$params) if @$params;
                $out.="}}";
                return $out;
            }, $main_banner, @params);
            if(ref($outtxt) eq 'HASH'){
                $api->warn("Processing $title failed: ".$outtxt->{'error'}."\n");
                next;
            }
            # Default summary when no merge summary was recorded.
            push @summary, "Tagging with {{$main_banner}}" unless @summary;

            $outtxt=$api->replace_nowiki($outtxt, $nowiki);

            # Need to edit?
            if($outtxt ne $intxt){
                # NOTE(review): @summary always has an entry after the push
                # above, so this guard cannot trigger as the code stands.
                if(!@summary){
                    $api->warn("$title changed, but nothing in \@summary\n");
                    next;
                }
                # NOTE(review): $cat is never used.
                my $cat=$iter->iterval;
                $summary[-1]='and '.$summary[-1] if @summary>1;
                my $summary = ucfirst(join((@summary>2)?', ':' ', @summary))." per $req";

                # Banner-shell cleanup; descriptions of what was cleaned up
                # are collected in @cleanup for the summary.
                my @cleanup=();
                $outtxt=$api->WPBfixshell($outtxt, \@cleanup);
                if(ref($outtxt) eq 'HASH'){
                    $api->warn("Processing $title failed: ".$outtxt->{'error'}."\n");
                    next;
                }
                $summary.="; general banner cleanup (".join(', ', @cleanup).")" if @cleanup;
                $summary.=". $errto";

                $api->log("$summary in $title");
                my $r=$api->edit($tok, $outtxt, $summary, 1, 1);
                if($r->{'code'} ne 'success'){
                    # Not recorded in the store, so the page is retried later.
                    $api->warn("Write failed on $title: ".$r->{'error'}."\n");
                    next;
                }
            } else {
                $api->log("Nothing to do in $title");
            }

            # Remember that we processed this page already
            $api->store->{$pageid}=$seq;

            # If we've been at it long enough, let another task have a go.
            # NOTE(review): every "next" above bypasses this check, so the
            # time budget is only enforced after a page was fully processed.
            return 0 if time()>=$endtime;
        }
        # This iterator is exhausted; move on to the next one.
        $self->{'iter'}=undef;
    }

    # No more pages to check, try again in 10 minutes or so in case of errors.
    # The iterator list is reset so the next call starts from the beginning.
    $self->{'iter'}=undef;
    $self->{'iterators'}=[@iterators];
    $api->log("WikiProjectWorker may be DONE!");
    return 600;
}