… | |
… | |
19 | Uses per-line display filtering (C<on_line_update>) to underline text |
19 | Uses per-line display filtering (C<on_line_update>) to underline text |
20 | matching a certain pattern and make it clickable. When clicked with the |
20 | matching a certain pattern and make it clickable. When clicked with the |
21 | mouse button specified in the C<matcher.button> resource (default 2, or |
21 | mouse button specified in the C<matcher.button> resource (default 2, or |
22 | middle), the program specified in the C<matcher.launcher> resource |
22 | middle), the program specified in the C<matcher.launcher> resource |
23 | (default: the C<url-launcher> resource if set, otherwise C<sensible-browser>) will be started |
23 | (default: the C<url-launcher> resource if set, otherwise C<sensible-browser>) will be started |
24 | with the matched text as first argument. The default configuration is |
24 | with the matched text as first argument. The default configuration is |
25 | suitable for matching URLs and launching a web browser, like the |
25 | suitable for matching URLs and launching a web browser, like the |
26 | former "mark-urls" extension. |
26 | former "mark-urls" extension. |
27 | |
27 | |
28 | The default pattern to match URLs can be overridden with the |
28 | The default pattern to match URLs can be overridden with the |
29 | C<matcher.pattern.0> resource, and additional patterns can be specified |
29 | C<matcher.pattern.0> resource, and additional patterns can be specified |
30 | with numbered patterns, in a manner similar to the "selection" extension. |
30 | with numbered patterns, in a manner similar to the "selection" extension. |
31 | The launcher can also be overridden on a per-pattern basis. |
31 | The launcher can also be overridden on a per-pattern basis. |
32 | |
32 | |
33 | It is possible to activate the most recently seen match or a list of matches |
33 | It is possible to activate the most recently seen match or a list of matches |
34 | from the keyboard. Simply bind a keysym to "matcher:last" or |
34 | from the keyboard. Simply bind a keysym to "matcher:last" or |
35 | "matcher:list" as seen in the example below. |
35 | "matcher:list" as seen in the example below. |
36 | |
36 | |
37 | The C<matcher:select> action enables a mode in which it is possible to |
37 | The C<matcher:select> action enables a mode in which it is possible to |
38 | iterate over the matches using the keyboard and either activate them |
38 | iterate over the matches using the keyboard and either activate them |
39 | or copy them to the clipboard. While the mode is active, normal terminal |
39 | or copy them to the clipboard. While the mode is active, normal terminal |
40 | input/output is suspended and the following bindings are recognized: |
40 | input/output is suspended and the following bindings are recognized: |
41 | |
41 | |
42 | =over 4 |
42 | =over |
43 | |
43 | |
44 | =item C<Up> |
44 | =item C<Up> |
45 | |
45 | |
46 | Search for a match upwards. |
46 | Search for a match upwards. |
47 | |
47 | |
… | |
… | |
86 | URxvt.matcher.button: 1 |
86 | URxvt.matcher.button: 1 |
87 | URxvt.matcher.pattern.1: \\bwww\\.[\\w-]+\\.[\\w./?&@#-]*[\\w/-] |
87 | URxvt.matcher.pattern.1: \\bwww\\.[\\w-]+\\.[\\w./?&@#-]*[\\w/-] |
88 | URxvt.matcher.pattern.2: \\B(/\\S+?):(\\d+)(?=:|$) |
88 | URxvt.matcher.pattern.2: \\B(/\\S+?):(\\d+)(?=:|$) |
89 | URxvt.matcher.launcher.2: gvim +$2 $1 |
89 | URxvt.matcher.launcher.2: gvim +$2 $1 |
90 | |
90 | |
|
|
91 | =head2 Regex encoding/wide character matching |
|
|
92 | |
|
|
93 | urxvt stores all text as Unicode, in a special encoding that uses |
|
|
94 | one character/code point per column. For various reasons, the regular |
|
|
95 | expressions are matched directly against this encoding, which means there are a few things |
|
|
96 | you need to keep in mind: |
|
|
97 | |
|
|
98 | =over |
|
|
99 | |
|
|
100 | =item X resources/command line arguments are locale-encoded |
|
|
101 | |
|
|
102 | The regexes taken from the command line or resources will be converted |
|
|
103 | from locale encoding to Unicode. This can change the number of code points |
|
|
104 | per character. |
|
|
105 | |
|
|
106 | =item Wide characters are column-padded with C<$urxvt::NOCHAR> |
|
|
107 | |
|
|
108 | Wide characters (such as kanji and sometimes tabs) are padded with |
|
|
109 | a special character value (C<$urxvt::NOCHAR>). That means that |
|
|
110 | constructs such as C<\w> or C<.> will only match part of a character, as |
|
|
111 | C<$urxvt::NOCHAR> is not matched by C<\w> and both only match the first |
|
|
112 | "column" of a wide character. |
|
|
113 | |
|
|
114 | That means you have to incorporate C<$urxvt::NOCHAR> into parts of regexes |
|
|
115 | that may match wide characters. For example, to match C<\w+> you might |
|
|
116 | want to use C<[\w$urxvt::NOCHAR]+> instead, and to match a single character |
|
|
117 | (C<.>) you might want to use C<.$urxvt::NOCHAR*> instead. |
|
|
118 | |
|
|
119 | =back |
|
|
120 | |
91 | =cut |
121 | =cut |
92 | |
122 | |
93 | my $url = |
123 | my $url = |
94 | qr{ |
124 | qr{ |
95 | (?:https?://|ftp://|news://|mailto:|file://|\bwww\.) |
125 | (?:https?://|ftp://|news://|mailto:|file://|\bwww\.) |
96 | [\w\-\@;\/?:&=%\$.+!*\x27,~#]* |
126 | [\w\-\@;\/?:&=%\$.+!*\x27,~#$urxvt::NOCHAR]* |
97 | ( |
127 | ( |
98 | \([\w\-\@;\/?:&=%\$.+!*\x27,~#]*\)| # Allow a pair of matched parentheses |
128 | \([\w\-\@;\/?:&=%\$.+!*\x27,~#$urxvt::NOCHAR]*\)| # Allow a pair of matched parentheses |
99 | [\w\-\@;\/?:&=%\$+*~] # exclude some trailing characters (heuristic) |
129 | [\w\-\@;\/?:&=%\$+*~] # exclude some trailing characters (heuristic) |
100 | )+ |
130 | )+ |
101 | }x; |
131 | }x; |
102 | |
132 | |
103 | sub matchlist_key_press { |
133 | sub matchlist_key_press { |
… | |
… | |
193 | |
223 | |
194 | sub most_recent { |
224 | sub most_recent { |
195 | my ($self) = shift; |
225 | my ($self) = shift; |
196 | my $row = $self->nrow - 1; |
226 | my $row = $self->nrow - 1; |
197 | my @exec; |
227 | my @exec; |
|
|
228 | |
198 | while ($row >= $self->top_row) { |
229 | while ($row >= $self->top_row) { |
199 | my $line = $self->line ($row); |
230 | my $line = $self->line ($row); |
200 | @exec = $self->command_for($row); |
231 | @exec = $self->command_for ($row); |
201 | last if(@exec); |
232 | last if @exec; |
202 | |
233 | |
203 | $row = $line->beg - 1; |
234 | $row = $line->beg - 1; |
204 | } |
235 | } |
|
|
236 | |
205 | if(@exec) { |
237 | if (@exec) { |
206 | return $self->exec_async (@exec); |
238 | return $self->exec_async (@exec); |
207 | } |
239 | } |
|
|
240 | |
208 | () |
241 | () |
209 | } |
242 | } |
210 | |
243 | |
211 | sub my_resource { |
244 | sub my_resource { |
212 | $_[0]->x_resource ("%.$_[1]") |
245 | $_[0]->x_resource ("%.$_[1]") |
… | |
… | |
251 | } |
284 | } |
252 | } |
285 | } |
253 | |
286 | |
254 | my @defaults = ($url); |
287 | my @defaults = ($url); |
255 | my @matchers; |
288 | my @matchers; |
256 | for (my $idx = 0; defined (my $res = $self->my_resource ("pattern.$idx") || $defaults[$idx]); $idx++) { |
289 | for (my $idx = 0; defined (my $res = $self->locale_decode ($self->my_resource ("pattern.$idx")) || $defaults[$idx]); $idx++) { |
257 | $res = $self->locale_decode ($res); |
|
|
258 | utf8::encode $res; |
|
|
259 | my $launcher = $self->my_resource ("launcher.$idx"); |
290 | my $launcher = $self->my_resource ("launcher.$idx"); |
260 | $launcher =~ s/\$&|\$\{&\}/\${0}/g if $launcher; |
291 | $launcher =~ s/\$&|\$\{&\}/\${0}/g if $launcher; |
261 | my $rend = $self->parse_rend($self->my_resource ("rend.$idx")); |
292 | my $rend = $self->parse_rend($self->my_resource ("rend.$idx")); |
262 | unshift @matchers, [qr($res)x,$launcher,$rend]; |
293 | unshift @matchers, [qr($res)x,$launcher,$rend]; |
263 | } |
294 | } |
… | |
… | |
313 | my $match = substr $text, $-[0], $+[0] - $-[0]; |
344 | my $match = substr $text, $-[0], $+[0] - $-[0]; |
314 | my @begin = @-; |
345 | my @begin = @-; |
315 | my @end = @+; |
346 | my @end = @+; |
316 | my @exec; |
347 | my @exec; |
317 | |
348 | |
318 | if (!defined($off) || ($-[0] <= $off && $+[0] >= $off)) { |
349 | if (!(defined $off) || ($-[0] <= $off && $+[0] >= $off)) { |
319 | if ($launcher !~ /\$/) { |
350 | if ($launcher !~ /\$/) { |
320 | @exec = ($launcher, $match); |
351 | @exec = ($launcher, $match); |
321 | } else { |
352 | } else { |
322 | # It'd be nice to just access a list like ($&,$1,$2...), |
353 | # It'd be nice to just access a list like ($&,$1,$2...), |
323 | # but alas, m//g behaves differently in list context. |
354 | # but alas, m//g behaves differently in list context. |
324 | @exec = map { s/\$(\d+)|\$\{(\d+)\}/ |
355 | @exec = map { |
|
|
356 | s{\$(\d+)|\$\{(\d+)\}}{ |
325 | substr $text, $begin[$1 || $2], $end[$1 || $2] - $begin[$1 || $2] |
357 | substr $text, $begin[$1 || $2], $end[$1 || $2] - $begin[$1 || $2] |
|
|
358 | }egx; |
|
|
359 | $_ |
326 | /egx; $_ } split /\s+/, $launcher; |
360 | } split /\s+/, $launcher; |
327 | } |
361 | } |
328 | |
362 | |
329 | push @matches, [ $line->coord_of ($begin[0]), $line->coord_of ($end[0]), $match, @exec ]; |
363 | push @matches, [ $line->coord_of ($begin[0]), $line->coord_of ($end[0]), $match, @exec ]; |
330 | } |
364 | } |
331 | } |
365 | } |
332 | } |
366 | } |
333 | |
367 | |
334 | @matches; |
368 | @matches |
335 | } |
369 | } |
336 | |
370 | |
337 | sub command_for { |
371 | sub command_for { |
338 | my ($self, $row, $col) = @_; |
372 | my ($self, $row, $col) = @_; |
339 | |
373 | |
… | |
… | |
346 | () |
380 | () |
347 | } |
381 | } |
348 | |
382 | |
349 | sub on_button_press { |
383 | sub on_button_press { |
350 | my ($self, $event) = @_; |
384 | my ($self, $event) = @_; |
|
|
385 | |
|
|
386 | if ( |
351 | if($self->valid_button($event) |
387 | $self->valid_button ($event) |
352 | && (my @exec = $self->command_for($event->{row},$event->{col}))) { |
388 | && (my @exec = $self->command_for ($event->{row}, $event->{col})) |
|
|
389 | ) { |
353 | $self->{row} = $event->{row}; |
390 | $self->{row} = $event->{row}; |
354 | $self->{col} = $event->{col}; |
391 | $self->{col} = $event->{col}; |
355 | $self->{cmd} = \@exec; |
392 | $self->{cmd} = \@exec; |
356 | return 1; |
393 | return 1; |
357 | } else { |
394 | } else { |
… | |
… | |
370 | my $col = delete $self->{col}; |
407 | my $col = delete $self->{col}; |
371 | my $cmd = delete $self->{cmd}; |
408 | my $cmd = delete $self->{cmd}; |
372 | |
409 | |
373 | return if !defined $row; |
410 | return if !defined $row; |
374 | |
411 | |
375 | if($row == $event->{row} && abs($col-$event->{col}) < 2 |
412 | if ( |
|
|
413 | $row == $event->{row} |
|
|
414 | && (abs $col-$event->{col}) < 2 |
376 | && join("\x00", @$cmd) eq join("\x00", $self->command_for($row,$col))) { |
415 | && (join "\x00", @$cmd) eq (join "\x00", $self->command_for ($row, $col)) |
|
|
416 | ) { |
377 | if($self->valid_button($event)) { |
417 | if ($self->valid_button ($event)) { |
378 | |
|
|
379 | $self->exec_async (@$cmd); |
418 | $self->exec_async (@$cmd); |
380 | |
|
|
381 | } |
419 | } |
382 | } |
420 | } |
383 | |
421 | |
384 | 1; |
422 | 1; |
385 | } |
423 | } |