ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/rxvt-unicode/src/perl/selection
(Generate patch)

Comparing rxvt-unicode/src/perl/selection (file contents):
Revision 1.43 by root, Mon Nov 19 09:26:41 2007 UTC vs.
Revision 1.54 by root, Wed Jun 6 15:06:41 2012 UTC

1#! perl 1#! perl
2
3#:META:X_RESOURCE:%.pattern-0:string:first selection pattern
2 4
3sub on_user_command { 5sub on_user_command {
4 my ($self, $cmd) = @_; 6 my ($self, $cmd) = @_;
5 7
6 $cmd eq "selection:rot13" 8 $cmd eq "selection:rot13"
17 push @{ $self->{patterns} }, qr{\G [\Q$res\E[:space:]]* ([^\Q$res\E[:space:]]+) }x; 19 push @{ $self->{patterns} }, qr{\G [\Q$res\E[:space:]]* ([^\Q$res\E[:space:]]+) }x;
18 } 20 }
19 21
20 for (my $idx = 0; defined (my $res = $self->x_resource ("selection.pattern-$idx")); $idx++) { 22 for (my $idx = 0; defined (my $res = $self->x_resource ("selection.pattern-$idx")); $idx++) {
21 $res = $self->locale_decode ($res); 23 $res = $self->locale_decode ($res);
22 utf8::encode $res;
23 push @{ $self->{patterns} }, qr/$res/; 24 push @{ $self->{patterns} }, qr/$res/;
24 } 25 }
25 26
26 $self->{enabled} = 1; 27 $self->{enabled} = 1;
27 28
32 () 33 ()
33} 34}
34 35
35# "find interesting things"-patterns 36# "find interesting things"-patterns
36my @mark_patterns = ( 37my @mark_patterns = (
37 qr{ ([[:word:]]+) }x, 38# qr{ ([[:word:]]+) }x,
38 qr{ ([^[:space:]]+) }x, 39 qr{ ([^[:space:]]+) }x,
39 40
40 # common types of "parentheses" 41 # common types of "parentheses"
41 qr{ (?<![^[:space:]]) ` ([^‘’]+) ` (?![^[:space:]]) }x, 42 qr{ (?<![^[:space:]]) [`'] ([^`']+) [`'] (?![^[:space:]]) }x,
42 qr{ (?<![^[:space:]]) ‘ ([^‘’]+) ’ (?![^[:space:]]) }x, 43 qr{ (?<![^[:space:]]) ‘ ([^‘’]+) ’ (?![^[:space:]]) }x,
43 qr{ (?<![^[:space:]]) ` ([^`']+) ' (?![^[:space:]]) }x, 44 qr{ (?<![^[:space:]]) ([^“”]+) (?![^[:space:]]) }x,
44 45
45 qr{ (?<![^[:space:]]) ‘ ([^`']+) ’ (?![^[:space:]]) }x,
46 qr{ (?<![^[:space:]]) “ ([^`']+) ” (?![^[:space:]]) }x,
47
48 qr{ (?<![^[:space:]]) (' [^[:space:]] [^']* ') }x, 46 qr{ (?<![^[:space:]]) (' [^[:space:]] [^']* ') }x,
49 qr{ (' [^']* [^[:space:]] ') (?![^[:space:]]) }x, 47 qr{ (' [^']* [^[:space:]] ') (?![^[:space:]]) }x,
48 qr{ (?<![^[:space:]]) (` [^[:space:]] [^']* ') }x,
49 qr{ (` [^']* [^[:space:]] ') (?![^[:space:]]) }x,
50 qr{ (?<![^[:space:]]) (" [^[:space:]] [^"]* ") }x, 50 qr{ (?<![^[:space:]]) (" [^[:space:]] [^"]* ") }x,
51 qr{ (" [^"]* [^[:space:]] ") (?![^[:space:]]) }x, 51 qr{ (" [^"]* [^[:space:]] ") (?![^[:space:]]) }x,
52 52
53 qr{ \< ([^`']+) \> }x,
54 qr{ \( ([^`']+) \) }x,
55 qr{ \{ ([^`']+) \} }x, 53 qr{ \{ ([^\{\}]+) \} }x,
54 qr{ \( ([^\(\)]+) \) }x,
56 qr{ \[ ([^`']+) \] }x, 55 qr{ \[ ([^\[\]]+) \] }x,
56 qr{ \< ([^\<\>]+) \> }x,
57 57
58 # urls, just a heuristic 58 # urls, just a heuristic
59 qr{( 59 qr{(
60 (?:https?://|ftp://|news://|mailto:|file://|\bwww\.)[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~#]+ 60 (?:https?://|ftp://|news://|mailto:|file://|\bwww\.)[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~#]+
61 [ab-zA-Z0-9\-\@;\/?:&=%\$_+*()~] # exclude some trailing characters (heuristic) 61 [ab-zA-Z0-9\-\@;\/?:&=%\$_+*()~] # exclude some trailing characters (heuristic)
92 - $line->offset_of ($self->selection_beg); 92 - $line->offset_of ($self->selection_beg);
93 93
94 my @matches; 94 my @matches;
95 95
96 if ($markofs < $line->l) { 96 if ($markofs < $line->l) {
97 # convert markofs from character to UTF-8 offset space
98 {
99 my $prefix = substr $text, 0, $markofs;
100 utf8::encode $prefix;
101 $markofs = length $prefix;
102 }
103
104 # not doing matches in unicode mode helps speed
105 # enormously here. working in utf-8 should be
106 # equivalent due to the magic of utf-8 encoding.
107 utf8::encode $text;
108 study $text; # _really_ helps, too :) 97 study $text; # _really_ helps, too :)
109 98
110 for my $regex (@mark_patterns, @{ $self->{patterns} }) { 99 for my $regex (@mark_patterns, @{ $self->{patterns} }) {
111 while ($text =~ /$regex/g) { 100 while ($text =~ /$regex/g) {
112 if ($-[1] <= $markofs and $markofs <= $+[1]) { 101 if ($-[1] <= $markofs and $markofs <= $+[1]) {
132 for (sort { $a->[1] <=> $b->[1] or $b->[0] <=> $a->[0] } @matches) { 121 for (sort { $a->[1] <=> $b->[1] or $b->[0] <=> $a->[0] } @matches) {
133 my ($ofs, $len) = @$_; 122 my ($ofs, $len) = @$_;
134 123
135 next if $len <= $curlen; 124 next if $len <= $curlen;
136 125
137 # convert back from UTF-8 offset space to character space
138 {
139 my $length = substr "$text ", $ofs, $len;
140 utf8::decode $length;
141 $len = length $length;
142 }
143 {
144 my $prefix = substr $text, 0, $ofs;
145 utf8::decode $prefix;
146 $ofs = length $prefix;
147 }
148
149 $self->selection_beg ($line->coord_of ($ofs)); 126 $self->selection_beg ($line->coord_of ($ofs));
150 $self->selection_end ($line->coord_of ($ofs + $len)); 127 $self->selection_end ($line->coord_of ($ofs + $len));
151 return 1; 128 return 1;
152 } 129 }
153 130

Diff Legend

- Removed lines
+ Added lines
< Changed lines
> Changed lines