-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathTemplateTranslatePreparseXML.pl
59 lines (46 loc) · 1.42 KB
/
TemplateTranslatePreparseXML.pl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
#!/usr/bin/perl
# Fluffbot translates templates to Swedish parameters, preparser
# Copyright (C) User:Fluff 2015
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
use strict;
use warnings;
use XML::LibXML::Reader;
# Preparser: reads an XML document from STDIN that consists of <page>
# elements (each carrying <title>, <ns> and <text>; presumably a MediaWiki
# dump -- confirm) and prints, one per line, the title of every page in
# namespace 0 whose text contains the citation template selected by the
# first command-line argument.
#
# Usage: TemplateTranslatePreparseXML.pl (web|book|news) < dump.xml

# Template patterns keyed by the type given on the command line. The
# separator between "cite" and the template name is a space or an
# underscore. Note that "|" inside [...] is a literal pipe, not alternation,
# so it must not appear in the character class.
my %pattern_for = (
    web  => qr/\{\{cite[ _]?web/i,
    book => qr/\{\{cite[ _]?book/i,
    # NOTE(review): unlike web/book the separator is mandatory here; this is
    # kept as it was -- confirm that it is intended.
    news => qr/\{\{cite[ _](?:news|article)/i,
);

my $usage = "Usage: $0 (" . join('|', sort keys %pattern_for) . ") < dump.xml\n";

my $t = $ARGV[0];
die $usage unless defined $t;
chomp($t);

# Refuse unknown types: matching against an undefined pattern would
# silently produce meaningless output.
my $pattern = $pattern_for{$t};
die "Unknown template type '$t'\n$usage" unless defined $pattern;

my $r = XML::LibXML::Reader->new(FD => fileno(STDIN))
    or die "Cannot create an XML reader on STDIN\n";

while ($r->nextElement('page')) {
    my $title;
    if ($r->nextElement('title')) {
        # NOTE(review): readInnerXml returns serialized markup, so characters
        # such as "&" presumably stay entity-escaped in the printed title --
        # confirm that the consumer of this list expects that.
        $title = $r->readInnerXml();
    }

    next unless $r->nextElement('ns');

    # Only pages in namespace 0 are of interest.
    next unless $r->readInnerXml() == 0;

    my $text;
    if ($r->nextElement('text')) {
        $text = $r->readInnerXml();
    }

    # Nothing to test or print when the title or the text is missing.
    next unless defined $title && defined $text;

    if ($text =~ $pattern) {
        print $title . "\n";
    }
}