eg/hstrip - metacpan.org


            
              1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
              #!/usr/bin/perl
# This script cleans up an HTML document
use strict;
use warnings;
use HTML::Parser ();
# ---- configuration: adjust these lists to taste ----

# Attribute names that tag() deletes from every start tag.
my @ignore_attr = (
    qw(bgcolor background color face style),
    qw(link alink vlink text),
    qw(onblur onchange onclick ondblclick onfocus),
    qw(onkeydown onkeyup onload),
    qw(onmousedown onmousemove onmouseout onmouseover onmouseup),
    qw(onreset onselect onunload),
);

# Handed to HTML::Parser as its ignore_tags option.
my @ignore_tags = ('font', 'big', 'small', 'b', 'i');

# Handed to HTML::Parser as its ignore_elements option.
my @ignore_elements = ('script', 'style');

# Hash view of @ignore_attr so membership is a single lookup.
my %ignore_attr;
@ignore_attr{@ignore_attr} = (1) x @ignore_attr;
# Start-tag handler: print the tag's source text with every attribute whose
# (lower-cased) name is a key of %ignore_attr removed.
#
#   $pos  - array ref of offsets/lengths into $text.  The trailing elements
#           are read four at a time as (name offset, name length,
#           value offset, value length), one group per attribute; any
#           leading elements that do not fill a group of four are left
#           alone (per HTML::Parser's "tokenpos" these locate the tag name).
#           The attribute groups are spliced off, so the array is consumed.
#   $text - original source text of the start tag.
sub tag {
    my ($pos, $text) = @_;
    if (@$pos >= 4) {
        # kill some attributes
        my ($k_offset, $k_len, $v_offset, $v_len) = @{$pos}[-4 .. -1];
        # Where the last attribute ends: after its value, or after its name
        # when the value offset is false (attribute without a value).
        my $next_attr = $v_offset ? $v_offset + $v_len : $k_offset + $k_len;
        my $edited;
        # Work from the last attribute to the first so that deleting text
        # never shifts the offsets of attributes still to be examined.
        while (@$pos >= 4) {
            ($k_offset, $k_len, $v_offset, $v_len) = splice @$pos, -4;
            if ($ignore_attr{lc substr($text, $k_offset, $k_len)}) {
                # Delete from the attribute's name up to the start of the
                # following attribute (or the end of the last attribute).
                substr($text, $k_offset, $next_attr - $k_offset) = "";
                $edited++;
            }
            $next_attr = $k_offset;
        }
        # Deleting the trailing attribute(s) leaves behind the whitespace
        # that separated them from whatever precedes; drop it so we emit
        # <a href="x"> rather than <a href="x" >, and <p> rather than <p >.
        $text =~ s/\s+>\z/>/ if $edited;
    }
    print $text;
}
# Declaration handler: echo the declaration's source text only when its
# type is "doctype"; every other declaration produces no output.
#
#   first argument  - declaration type (compared against "doctype")
#   second argument - source text of the declaration
sub decl {
    my ($kind, $markup) = @_;
    if ($kind eq "doctype") {
        print $markup;
    }
}
# Default handler: write the event's source text to the selected output
# handle unchanged.
sub text {
    my ($chunk) = @_;
    print $chunk;
}
# Main program: parse the file named on the command line and write the
# cleaned-up document to STDOUT via the handlers defined in this file.
my $file = shift @ARGV;

# Without this check an undefined filename would reach parse_file() and
# surface as a confusing "Can't open file" error.
die "Usage: $0 <file>\n" unless defined $file;

HTML::Parser->new(
    api_version   => 3,
    # Start tags go through tag(), which strips unwanted attributes.
    start_h       => [\&tag, "tokenpos, text"],
    # Empty handlers: processing instructions and comments are not printed.
    process_h     => ["", ""],
    comment_h     => ["", ""],
    # decl() prints only doctype declarations.
    declaration_h => [\&decl, "tagname, text"],
    # Every other event is echoed verbatim by text().
    default_h     => [\&text, "text"],
    ignore_tags     => \@ignore_tags,
    ignore_elements => \@ignore_elements,
)->parse_file($file)
    || die "Can't open file: $!\n";

	Global
`s`	Focus search bar
`?`	Bring up this help dialog

	GitHub
`g` `p`	Go to pull requests
`g` `i`	Go to GitHub issues (only if GitHub is the preferred repository)

	POD
`g` `a`	Go to author
`g` `c`	Go to changes
`g` `i`	Go to issues
`g` `d`	Go to dist
`g` `r`	Go to repository/SCM
`g` `s`	Go to source
`g` `b`	Go to file browse

	Search terms
module: (e.g. module:Plugin)
distribution: (e.g. distribution:Dancer auth)
author: (e.g. author:SONGMU Redis)
version: (e.g. version:1.00)