ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/rxvt-unicode/src/perl/selection
(Generate patch)

Comparing rxvt-unicode/src/perl/selection (file contents):
Revision 1.23 by root, Thu Jan 12 12:05:28 2006 UTC vs.
Revision 1.36 by root, Wed Jan 25 15:33:43 2006 UTC

1#! perl 1#! perl
2 2
3sub on_keyboard_command { 3sub on_user_command {
4 my ($self, $cmd) = @_; 4 my ($self, $cmd) = @_;
5 5
6 $cmd eq "selection:rot13" 6 $cmd eq "selection:rot13"
7 and $self->selection (map { y/A-Za-z/N-ZA-Mn-za-m/; $_ } $self->selection); 7 and $self->selection (map { y/A-Za-z/N-ZA-Mn-za-m/; $_ } $self->selection);
8 8
10} 10}
11 11
12sub on_init { 12sub on_init {
13 my ($self) = @_; 13 my ($self) = @_;
14 14
15 if (defined (my $res = $self->resource ("cutchars"))) {
16 $res = $self->locale_decode ($res);
17 push @{ $self->{patterns} }, qr{\G [\Q$res\E[:space:]]* ([^\Q$res\E[:space:]]+) }x;
18 }
19
15 for (my $idx = 0; defined (my $res = $self->x_resource ("selection.pattern-$idx")); $idx++) { 20 for (my $idx = 0; defined (my $res = $self->x_resource ("selection.pattern-$idx")); $idx++) {
16 no re 'eval'; # just to be sure 21 $res = $self->locale_decode ($res);
22 utf8::encode $res;
17 push @{ $self->{patterns} }, qr/$res/; 23 push @{ $self->{patterns} }, qr/$res/;
18 } 24 }
19 25
20 () 26 ()
21} 27}
22 28
23# "find interetsing things"-patterns 29# "find interesting things"-patterns
24my @mark_patterns = ( 30my @mark_patterns = (
25 qr{([[:word:]]+)},
26
27 # common "parentheses" 31 # common types of "parentheses"
28 qr{(?:^|\s) ‘ ([^‘’]+?) ’ (?:\s|\)|$)}x, 32 qr{ (?<![^[:space:]]) ‘ ([^‘’]+) ’ (?![^[:space]]) }x,
29 qr{(?:^|\s) ` ([^`']+?) ' (?:\s|\)|$)}x, 33 qr{ (?<![^[:space:]]) ` ([^`']+) ' (?![^[:space]]) }x,
30 qr{ \{ ([^{}]+?) \} }x, 34 qr{ (?<![^[:space:]]) (" [^[:space:]] [^"]* ") }x,
31 qr{ \[ ([^{}]+?) \] }x, 35 qr{ (" [^"]* [^[:space:]] ") (?![^[:space]]) }x,
32 qr{ \( ([^()]+?) \) }x, 36 qr{ \< ([^<>[:space:]]+) \> }x,
37 qr{ \{ ([^{}[:space:]]+) \} }x,
38 qr{ \[ ([^{}[:space:]]+) \] }x,
39 qr{ \( ([^()[:space:]]+) \) }x,
33 40
34 # urls, just a heuristic 41 # urls, just a heuristic
35 qr{( 42 qr{(
36 (?:https?|ftp|news|mailto|file)://[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~]+ 43 (?:https?|ftp|news|mailto|file)://[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~]+
37 [ab-zA-Z0-9\-\@;\/?:&=%\$_+!*\x27()~] # exclude some trailing characters (heuristic) 44 [ab-zA-Z0-9\-\@;\/?:&=%\$_+!*\x27()~] # exclude some trailing characters (heuristic)
38 )}x, 45 )}x,
39 46
40 # shell-like argument quoting, basically always matches 47 # shell-like argument quoting, basically always matches
41 qr{\G [\ \t|&;<>()] *( 48 qr{\G [\ \t|&;<>()]* (
42 (?: 49 (?:
43 [^\\"'\ \t|&;<>()]+ 50 [^\\"'\ \t|&;<>()]+
44 | \\. 51 | \\.
45 | " (?: [^\\"]+ | \\. )* " 52 | " (?: [^\\"]+ | \\. )* "
46 | ' [^']* ' 53 | ' [^']* '
64 my $curlen = $line->offset_of ($self->selection_end) 71 my $curlen = $line->offset_of ($self->selection_end)
65 - $line->offset_of ($self->selection_beg); 72 - $line->offset_of ($self->selection_beg);
66 73
67 my @matches; 74 my @matches;
68 75
69 for my $regex (@mark_patterns, @{ $self->{patterns} }) { 76 if ($markofs < $line->l) {
70 while ($text =~ /$regex/g) { 77 # convert markofs from character to UTF-8 offset space
71 if ($-[1] <= $markofs and $markofs <= $+[1]) { 78 {
72 my $ofs = $-[1]; 79 my $prefix = substr $text, 0, $markofs;
73 my $match = $1; 80 utf8::encode $prefix;
81 $markofs = length $prefix;
82 }
74 83
75 push @matches, [$ofs, length $match]; 84 # not doing matches in unicode mode helps speed
85 # enormously here. working in utf-8 should be
86 # equivalent due to the magic of utf-8 encoding.
87 utf8::encode $text;
88 study $text; # _really_ helps, too :)
76 89
90 for my $regex (@mark_patterns, @{ $self->{patterns} }) {
91 while ($text =~ /$regex/g) {
92 if ($-[1] <= $markofs and $markofs <= $+[1]) {
93 my $ofs = $-[1];
94 my $match = $1;
95
77 for my $regex (@simplify_patterns) { 96 for my $regex (@simplify_patterns) {
78 if ($match =~ $regex) { 97 if ($match =~ $regex) {
79 $match = $1; 98 $match = $1;
80 $ofs += $-[1]; 99 $ofs += $-[1];
100 }
81 } 101 }
102
103 push @matches, [$ofs, length $match];
82 } 104 }
83
84 push @matches, [$ofs, length $match];
85 } 105 }
86 } 106 }
87 } 107 }
88 108
89 # whole line 109 # whole line
92 for (sort { $a->[1] <=> $b->[1] or $b->[0] <=> $a->[0] } @matches) { 112 for (sort { $a->[1] <=> $b->[1] or $b->[0] <=> $a->[0] } @matches) {
93 my ($ofs, $len) = @$_; 113 my ($ofs, $len) = @$_;
94 114
95 next if $len <= $curlen; 115 next if $len <= $curlen;
96 116
117 # convert back from UTF-8 offset space to character space
118 {
119 my $length = substr "$text ", $ofs, $len;
120 utf8::decode $length;
121 $len = length $length;
122 }
123 {
124 my $prefix = substr $text, 0, $ofs;
125 utf8::decode $prefix;
126 $ofs = length $prefix;
127 }
128
97 $self->selection_beg ($line->coord_of ($ofs)); 129 $self->selection_beg ($line->coord_of ($ofs));
98 $self->selection_end ($line->coord_of ($ofs + $len)); 130 $self->selection_end ($line->coord_of ($ofs + $len));
99 return 1; 131 return 1;
100 } 132 }
101 133

Diff Legend

- Removed lines
+ Added lines
< Changed lines (old revision)
> Changed lines (new revision)