In Deinen bestehenden Code integriert sieht es in etwas so aus:
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
use HTML::Parser;
my $string = "";
sub search {
my @terms = split(/\s+/, $FORM{'terms'});
my $parser = HTML::Parser->new(
api_version => 3,
start_h => [\&start,"self,tagname,attr"],
text_h => [\&text,"self,dtext"],
end_h => [\&end,"self,tagname"]);
for my $html_file(@FILES){
$string = '';
$parser->parse_file($html_file);
foreach $term (@terms) {
&Umlaute;
if ($string =~ /$term/) {
$include{$FILE} = 'yes';
last;
}
else {
$include{$FILE} = 'no';
}
}
}
}
sub start{
my ($self,$tag,$attr) = @_;
if($tag eq 'div' && $attr->{class} eq 'scroll'){
$self->{search} = 1;
}
}
sub text{
my ($self,$dtext) = @_;
$string .= $dtext if($self->{search});
}
sub end{
my ($self,$tag) = @_;
if($tag eq 'div'){
$self->{search} = 0;
}
}
Deine Version etwas abgewandelt:
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
sub search {
@terms = split(/\s+/, $FORM{'terms'});
foreach $FILE (@FILES) {
local $/;
open(FILE,"<",$FILE) or die $!;
my $string = <FILE>;
close(FILE);
($string) = $string =~ m~<div class="scroll">(.*?)</div>~;
$string =~ s/\n//g;
foreach $term (@terms) {
&Umlaute;
if ($string =~ /$term/) {
$include{$FILE} = 'yes';
last;
}
else {
$include{$FILE} = 'no';
}
}
}
}
Du solltest unbeding
use strict verwenden!
Und zu regulaeren Ausdruecken kannst Du Dir mal
perlre,
perlretut und
perlrequick anschauen...\n\n
<!--EDIT|renee|1151077815-->