… | |
… | |
7 | and $self->selection (map { y/A-Za-z/N-ZA-Mn-za-m/; $_ } $self->selection); |
7 | and $self->selection (map { y/A-Za-z/N-ZA-Mn-za-m/; $_ } $self->selection); |
8 | |
8 | |
9 | () |
9 | () |
10 | } |
10 | } |
11 | |
11 | |
|
|
# Initialisation hook: reads the user-configured X resources
# "selection.pattern-0", "selection.pattern-1", ... (stopping at the first
# index that is not defined) and appends each one, compiled as a regex, to
# $self->{patterns}.
#
# Returns the empty list.
sub on_init {
   my ($self) = @_;

   for (my $idx = 0; defined (my $res = $self->x_resource ("selection.pattern-$idx")); $idx++) {
      no re 'eval'; # just to be sure

      # utf8::encode converts its argument in place and returns nothing, so
      # its result must not be assigned: decode into $res first, then encode
      # $res itself. The patterns are stored UTF-8 encoded because
      # on_sel_extend matches them against UTF-8 encoded line text.
      $res = $self->locale_decode ($res);
      utf8::encode $res;

      push @{ $self->{patterns} }, qr/$res/;
   }

   ()
}
|
|
23 | |
12 | # "find interesting things"-patterns |
24 | # "find interesting things"-patterns |
13 | my @mark_patterns = ( |
25 | my @mark_patterns = ( |
|
|
26 | # common types of "parentheses" |
|
|
27 | qr{ (?<![^[:space:]]) ‘ ([^‘’]+) ’ (?![^[:space]]) }x, |
|
|
28 | qr{ (?<![^[:space:]]) ` ([^`']+) ' (?![^[:space]]) }x, |
|
|
29 | qr{ (?<![^[:space:]]) (" [^[:space:]] [^"]* ") }x, |
|
|
30 | qr{ (" [^"]* [^[:space:]] ") (?![^[:space]]) }x, |
|
|
31 | qr{ \< ([^<>[:space:]]+) \> }x, |
|
|
32 | qr{ \{ ([^{}[:space:]]+) \} }x, |
|
|
33 | qr{ \[ ([^{}[:space:]]+) \] }x, |
|
|
34 | qr{ \( ([^()[:space:]]+) \) }x, |
|
|
35 | |
14 | # urls, just a heuristic |
36 | # urls, just a heuristic |
15 | qr{( |
37 | qr{( |
16 | (?:https?|ftp|news|mailto|file)://[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~]+ |
38 | (?:https?|ftp|news|mailto|file)://[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~]+ |
17 | [ab-zA-Z0-9\-\@;\/?:&=%\$_+!*\x27(),~] # do not include a trailing dot, its wrong too often |
39 | [ab-zA-Z0-9\-\@;\/?:&=%\$_+!*\x27()~] # exclude some trailing characters (heuristic) |
18 | )}x, |
40 | )}x, |
19 | |
|
|
20 | # common "parentheses" |
|
|
21 | qr{(?:^|\s) ‘ ([^‘’]+?) ’ (?:\s|$)}x, |
|
|
22 | qr{(?:^|\s) ` ([^`']+?) ' (?:\s|$)}x, |
|
|
23 | qr{ \{ ([^{}]+?) \} }x, |
|
|
24 | qr{ \[ ([^{}]+?) \] }x, |
|
|
25 | |
41 | |
26 | # shell-like argument quoting, basically always matches |
42 | # shell-like argument quoting, basically always matches |
27 | qr{\G [\ \t|&;<>()] *( |
43 | qr{\G [\ \t|&;<>()] *( |
28 | (?: |
44 | (?: |
29 | [^\\"'\ \t|&;<>()]+ |
45 | [^\\"'\ \t|&;<>()]+ |
… | |
… | |
39 | qr{^"([^\\"'\ \t|&;<>()*?]+)"$}, # "simple" => simple |
55 | qr{^"([^\\"'\ \t|&;<>()*?]+)"$}, # "simple" => simple |
40 | qr{^(.*)[,\-]$}, # strip off trailing , and - |
56 | qr{^(.*)[,\-]$}, # strip off trailing , and - |
41 | ); |
57 | ); |
42 | |
58 | |
# Selection-extend hook: grows the current selection to the next larger
# "interesting" region around the selection mark.
#
# Candidates are all matches of @mark_patterns and of the user patterns in
# $self->{patterns} whose first capture group covers the mark, each narrowed
# by every entry of @simplify_patterns that matches it, plus the whole
# logical line. Candidates are tried shortest first (ties: larger offset
# first); the first one that is longer than the current selection becomes
# the new selection.
#
# Returns 1 when the selection was changed, the empty list otherwise.
sub on_sel_extend {
   my ($self, $time) = @_;

   my ($row, $col) = $self->selection_mark;
   my $line = $self->line ($row);
   my $text = $line->t;
   my $markofs = $line->offset_of ($row, $col);
   my $curlen = $line->offset_of ($self->selection_end)
              - $line->offset_of ($self->selection_beg);

   # The matching below runs on UTF-8 encoded bytes, so @- and @+ are byte
   # offsets. Translate the mark (a character offset) into the matching byte
   # offset. Any overshoot past the end of the text is carried over
   # unchanged so that such a mark still lies beyond every possible match.
   my $prefix = $markofs > 0 ? substr ($text, 0, $markofs) : "";
   my $markbytes = $markofs - length $prefix;
   utf8::encode $prefix;
   $markbytes += length $prefix;

   # Number of characters in a UTF-8 encoded byte string: every byte that
   # is not a continuation byte (0x80-0xBF) starts one character.
   my $char_count = sub {
      my ($bytes) = @_;
      return scalar ($bytes =~ tr/\x80-\xBF//c);
   };

   my @matches;

   # not doing matches in unicode mode helps speed
   # enormously here. the matches themselves are the same
   # on utf-8 bytes, but all offsets and lengths are in bytes.
   utf8::encode $text;
   study $text; # _really_ helps, too :)

   for my $regex (@mark_patterns, @{ $self->{patterns} }) {
      while ($text =~ /$regex/g) {
         if ($-[1] <= $markbytes and $markbytes <= $+[1]) {
            my $ofs = $-[1];
            my $match = $1;

            for my $simplify (@simplify_patterns) {
               if ($match =~ $simplify) {
                  $match = $1;
                  $ofs += $-[1];
               }
            }

            # convert back to character units, which is what
            # coord_of and $curlen work in
            push @matches, [
               $char_count->(substr $text, 0, $ofs),
               $char_count->($match),
            ];
         }
      }
   }

   # whole line
   push @matches, [0, ($line->end - $line->beg + 1) * $self->ncol];

   for (sort { $a->[1] <=> $b->[1] or $b->[0] <=> $a->[0] } @matches) {
      my ($ofs, $len) = @$_;

      next if $len <= $curlen;

      $self->selection_beg ($line->coord_of ($ofs));
      $self->selection_end ($line->coord_of ($ofs + $len));
      return 1;
   }

   ()
}