--- rxvt-unicode/src/perl/selection 2006/07/06 19:06:40 1.39 +++ rxvt-unicode/src/perl/selection 2014/05/31 08:33:47 1.60 @@ -1,9 +1,66 @@ #! perl -sub on_user_command { - my ($self, $cmd) = @_; +#:META:RESOURCE:%.pattern-0:string:first selection pattern - $cmd eq "selection:rot13" +=head1 NAME + +selection - more intelligent selection (enabled by default) + +=head1 DESCRIPTION + +This extension tries to be more intelligent when the user extends +selections (double-click and further clicks). Right now, it tries to +select words, urls and complete shell-quoted arguments, which is very +convenient, too, if your F<ls> supports C<--quoting-style=shell>. + +A double-click usually selects the word under the cursor, further clicks +will enlarge the selection. + +The selection works by trying to match a number of regexes and displaying +them in increasing order of length. You can add your own regexes by +specifying resources of the form: + + URxvt.selection.pattern-0: perl-regex + URxvt.selection.pattern-1: perl-regex + ... + +The index number (0, 1...) must not have any holes, and each regex must +contain at least one pair of capturing parentheses, which will be used for +the match. For example, the following adds a regex that matches everything +between two vertical bars: + + URxvt.selection.pattern-0: \\|([^|]+)\\| + +Another example: Programs I use often output "absolute path: " at the +beginning of a line when they process multiple files. The following +pattern matches the filename (note, there is a single space at the very +end): + + URxvt.selection.pattern-0: ^(/[^:]+):\ + +You can look at the source of the selection extension to see more +interesting uses, such as parsing a line from beginning to end. + +This extension also offers the following actions: + +=over 4 + +=item rot13 + +Rot-13 the selection when activated. 
+ +Example: + + URxvt.keysym.C-M-r: selection:rot13 + +=back + +=cut + +sub on_action { + my ($self, $action) = @_; + + $action eq "rot13" and $self->selection (map { y/A-Za-z/N-ZA-Mn-za-m/; $_ } $self->selection); () @@ -19,7 +76,6 @@ for (my $idx = 0; defined (my $res = $self->x_resource ("selection.pattern-$idx")); $idx++) { $res = $self->locale_decode ($res); - utf8::encode $res; push @{ $self->{patterns} }, qr/$res/; } @@ -34,20 +90,30 @@ # "find interesting things"-patterns my @mark_patterns = ( +# qr{ ([[:word:]]+) }x, + qr{ ([^[:space:]]+) }x, + # common types of "parentheses" - qr{ (?[:space:]]+) \> }x, - qr{ \{ ([^{}[:space:]]+) \} }x, - qr{ \[ ([^{}[:space:]]+) \] }x, - qr{ \( ([^()[:space:]]+) \) }x, + qr{ (?]+) \> }x, # urls, just a heuristic qr{( - (?:https?://|ftp://|news://|mailto:|file://)[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~#]+ - [ab-zA-Z0-9\-\@;\/?:&=%\$_+!*\x27()~] # exclude some trailing characters (heuristic) + (?:https?://|ftp://|news://|mailto:|file://|\bwww\.)[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~#]+ + [ab-zA-Z0-9\-\@;\/?:&=%\$_+*()~] # exclude some trailing characters (heuristic) )}x, # shell-like argument quoting, basically always matches @@ -83,17 +149,6 @@ my @matches; if ($markofs < $line->l) { - # convert markofs form character to UTF-8 offset space - { - my $prefix = substr $text, 0, $markofs; - utf8::encode $prefix; - $markofs = length $prefix; - } - - # not doing matches in unicode mode helps speed - # enourmously here. working in utf-8 should be - # equivalent due to the magic of utf-8 encoding. 
- utf8::encode $text; study $text; # _really_ helps, too :) for my $regex (@mark_patterns, @{ $self->{patterns} }) { @@ -123,18 +178,6 @@ next if $len <= $curlen; - # convert back from UTF-8 offset space to character space - { - my $length = substr "$text ", $ofs, $len; - utf8::decode $length; - $len = length $length; - } - { - my $prefix = substr $text, 0, $ofs; - utf8::decode $prefix; - $ofs = length $prefix; - } - $self->selection_beg ($line->coord_of ($ofs)); $self->selection_end ($line->coord_of ($ofs + $len)); return 1;