line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
package WikiText::Sample::Parser; |
2
|
5
|
|
|
5
|
|
4119
|
use base 'WikiText::Parser'; |
|
5
|
|
|
|
|
10
|
|
|
5
|
|
|
|
|
1090
|
|
3
|
|
|
|
|
|
|
|
4
|
|
|
|
|
|
|
# Build the grammar table for this sample wiki dialect.
#
# Returns a hash reference keyed by rule name. The 'top' entry lists the
# block rules a document may contain; every other entry describes one block
# rule (h1, h2, h3, hr, p, pre) or phrase rule (b, i) through a 'match'
# regexp and, where present, 'phrases' and 'filter' entries.
# NOTE(review): how these keys are consumed is decided by the
# WikiText::Parser base class, which is not visible here -- confirm there.
sub create_grammar {
    # One list per rule family; the same array reference is handed to every
    # rule that accepts that family.
    my $block_rules  = [qw(h1 h2 h3 hr p pre)];
    my $phrase_rules = [qw(b i)];

    # Paragraph: one or more non-blank lines, stopping before a line that
    # starts with '=' or with whitespace followed by a non-space character.
    # NOTE(review): a '----' line directly after paragraph text is not in the
    # stop list, so this pattern collects it into the paragraph -- confirm
    # that is intended.
    my $paragraph_re = qr/^             # Blocks must start at beginning
        (                               # Capture paragraph in $1
            ((?!(?:                     # Stop at certain blocks
                [\=] |                  # Headings
                \s+\S
            ))
            .*\S.*\n)+                  # Otherwise, collect non-empty lines
        )
        (?:\s*\n)?                      # Eat trailing newlines
    /x;

    # Preformatted text: one or more non-blank lines that each start with at
    # least one space, plus any blank lines that follow them.
    my $preformatted_re = qr/^
        (
            ((?!(?:                     # Stop at certain blocks
                \S                      # Anything starting with nonspace
            ))
            (?m: ^\ +.*\S.*\n))+        # otherwise grab lines starting with space
        )
        (\s*\n)*                        # and all blank lines after
    /x;

    my %grammar = (
        # Parsing starts at the "top" level document
        top => {
            blocks => $block_rules,     # A document consists of top level blocks
        },
        p => {
            match   => $paragraph_re,
            phrases => $phrase_rules,
            # Works on $_: drops the trailing newline of the captured text.
            filter  => sub { chomp($_) },
        },
        pre => {
            match  => $preformatted_re,
            # Works on $_: removes whitespace at the start and at the end of
            # each line of the captured text.
            filter => sub { s/^\s*//mg; s/\s*$//mg; },
        },
        hr => {
            match => qr/^----\n(?:\s*\n)?/,
        },
    );

    # Heading rules h1..h3 differ only in the number of '=' characters.
    for my $level (1 .. 3) {
        $grammar{"h$level"} = { match => re_header($level) };
    }

    # Bold and italic share one shape: delimited text that may itself
    # contain further phrases.
    for my $rule ( [ b => "'''" ], [ i => "''" ] ) {
        my ($name, $markup) = @{$rule};
        $grammar{$name} = {
            phrases => $phrase_rules,
            match   => phrase($markup),
        };
    }

    return \%grammar;
}
62
|
|
|
|
|
|
|
|
63
|
|
|
|
|
|
|
# Reusable regexp generators used by the grammar |
64
|
|
|
|
|
|
|
# Build a regexp that matches one inline phrase wrapped in literal markup.
#
#   $brace1 - opening delimiter, matched literally
#   $brace2 - closing delimiter, matched literally; falls back to $brace1
#             when it is omitted, undefined or empty
#
# Returns a compiled regexp that captures the phrase content in $1.
sub phrase {
    my ($brace1, $brace2) = @_;

    # Fall back only when no usable closing delimiter was given, so that a
    # delimiter such as "0" is not mistaken for "missing".
    $brace2 = $brace1 unless defined $brace2 && length $brace2;

    # \Q...\E keeps the delimiters literal: regexp metacharacters such as
    # '*' or '[' would otherwise break or change the pattern, and under /x
    # unescaped whitespace is skipped while '#' starts a comment.
    return qr/
        \Q${brace1}\E   # Opening phrase markup
        (.*?'*)         # Capture content in $1
        \Q${brace2}\E   # Closing phrase markup
    /x;
}
74
|
|
|
|
|
|
|
|
75
|
|
|
|
|
|
|
# Build the block regexp for a heading of the given level.
#
#   $level - number of '=' characters that introduce the heading
#
# Returns a compiled regexp, anchored with ^, that requires exactly $level
# '=' characters followed by at least one space, captures the heading text
# in $1, and consumes the whitespace and newlines that follow it.
sub re_header {
    my ($level) = @_;

    my $header_re = qr/^    # Block must begin at position 0
        \={$level}          # Proper number of '=' chars
        \ +                 # 1 or more spaces
        (.*?)               # Capture header content in $1
        \s*\n               # Eat trailing whitespace and newlines
    /x;

    return $header_re;
}
84
|
|
|
|
|
|
|
|
85
|
|
|
|
|
|
|
1; |