line |
true |
false |
branch |
124
|
1 |
0 |
if defined(@_ > 0) |
125
|
0 |
1 |
@_ ? : |
127
|
0 |
1 |
if $$self{'verbose'} |
128
|
0 |
1 |
if $$self{'verbose'} |
156
|
0 |
1 |
unless open VOCAB, ">$VOCAB_FILE" |
157
|
0 |
1 |
unless open SNT, ">$SNT_FILE" |
160
|
0 |
1 |
if ($NONTOKEN_FILE ne '') |
170
|
0 |
1 |
unless open CORPUS, $_ |
179
|
18 |
4 |
if (not exists $vocab_hash{$token}) { } |
188
|
0 |
3 |
if $new_line |
223
|
1 |
0 |
if (-e $TOKEN_FILE) { } |
224
|
0 |
1 |
unless open TOKEN, $TOKEN_FILE |
228
|
0 |
1 |
if (length $_ <= 0) |
229
|
0 |
1 |
unless (m[^/] and m[/$]) |
246
|
0 |
1 |
if (length $tokenizerRegex > 0) |
256
|
0 |
1 |
if ($#tokenRegex < 0) |
272
|
0 |
0 |
if ($NONTOKEN_FILE) { } |
275
|
0 |
0 |
unless open NOTOK, $NONTOKEN_FILE |
282
|
0 |
0 |
if (/^\s*$/) |
284
|
0 |
0 |
unless (m[^/]) |
288
|
0 |
0 |
unless (m[/$]) |
301
|
0 |
0 |
if (length $nontokenizerRegex <= 0) |
325
|
0 |
0 |
unless open FILE, $file |
333
|
0 |
0 |
if (/^\s*$/) |
336
|
0 |
0 |
unless (m[^/]) |
340
|
0 |
0 |
unless (m[/$]) |
353
|
0 |
0 |
if (length $stop_regex <= 0) |
371
|
0 |
1 |
unless open VOCAB, $VOCAB_FILE |
515
|
1 |
0 |
if $window_size == 0 |
519
|
0 |
1 |
if $window_size > $ngram_size |
537
|
0 |
1 |
unless open SNT, $SNT_FILE |
567
|
4 |
84 |
if ($i + $ngram_size > $N + 1) |
570
|
42 |
42 |
if ($bits[0] != 1) |
573
|
21 |
21 |
if ($size != $ngram_size) |
598
|
0 |
0 |
if (vec($win, $j, $win_bit) == 1) |
613
|
0 |
1 |
unless open SNTNGRAM, ">$SNTNGRAM_FILE" |
617
|
1 |
0 |
unless (@vocab_array) |
626
|
42 |
0 |
if vec($win, $_, $win_bit) == 1 |
629
|
0 |
21 |
if ($ngram[$#ngram] == 0) |
632
|
1 |
20 |
if ($#prev == -1) { } |
|
20 |
0 |
elsif (join(' ', @ngram) ne join(' ', @prev)) { } |
642
|
20 |
0 |
if ($return_value == 1) |
651
|
1 |
0 |
if ($return_value == 1) |
669
|
0 |
21 |
if ($stop_flag) |
672
|
0 |
0 |
if ($stop_mode =~ /OR|or/) { } |
676
|
0 |
0 |
if ($token_ngram[$i] =~ /$stop_regex/) |
|
0 |
0 |
if ($stop_mode =~ /OR|or/) { } |
679
|
0 |
0 |
unless ($token_ngram[$i] =~ /$stop_regex/) |
682
|
0 |
0 |
if ($doStop and $marginals) |
684
|
0 |
0 |
if (exists $remove_hash{$_ . ':' . $ngram[$_]}) { } |
693
|
0 |
0 |
if ($_ == 1) |
|
0 |
21 |
if ($new_line) |
698
|
21 |
0 |
if ($doStop == 0 and $line == 0) |
699
|
21 |
0 |
if ($remove <= $freq) { } |
701
|
21 |
0 |
if ($frequency <= $freq) |
705
|
0 |
0 |
if (exists $remove_hash{$_ . ':' . $ngram[$_]}) { } |
721
|
0 |
1 |
unless open SNTNGRAM, $SNTNGRAM_FILE |
724
|
0 |
1 |
unless open NGRAM, ">$NGRAM_FILE" |
727
|
0 |
1 |
unless (@vocab_array) |
738
|
21 |
0 |
if ($marginals) |
757
|
21 |
21 |
if ($i == 0) |
758
|
0 |
21 |
if ($_[$i] == vec($corpus, $N, $bit)) |
760
|
21 |
21 |
if ($i == $#_) |
761
|
0 |
21 |
if ($_[$i] == vec($corpus, 0, $bit)) |
764
|
0 |
42 |
if ($stop_flag or $remove > 0) |
765
|
0 |
0 |
if (exists $remove_hash{$i . ':' . $_[$i]}) |
782
|
120 |
0 |
if (vec($a, $i, $win_bit) == 1) |
783
|
120 |
0 |
if (vec($b, $i, $win_bit) == 1) |
787
|
115 |
5 |
if ($a_array[$z] != $b_array[$z]) |
789
|
30 |
0 |
$a_array[$x] < $b_array[$x] ? : |
|
30 |
30 |
$a_array[$x] > $b_array[$x] ? : |