ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/rxvt-unicode/src/perl/selection
(Generate patch)

Comparing rxvt-unicode/src/perl/selection (file contents):
Revision 1.24 by root, Thu Jan 12 23:11:23 2006 UTC vs.
Revision 1.44 by root, Mon Nov 19 09:27:08 2007 UTC

1#! perl 1#! perl
2 2
3sub on_keyboard_command { 3sub on_user_command {
4 my ($self, $cmd) = @_; 4 my ($self, $cmd) = @_;
5 5
6 $cmd eq "selection:rot13" 6 $cmd eq "selection:rot13"
7 and $self->selection (map { y/A-Za-z/N-ZA-Mn-za-m/; $_ } $self->selection); 7 and $self->selection (map { y/A-Za-z/N-ZA-Mn-za-m/; $_ } $self->selection);
8 8
10} 10}
11 11
12sub on_init { 12sub on_init {
13 my ($self) = @_; 13 my ($self) = @_;
14 14
15 if (defined (my $res = $self->resource ("cutchars"))) {
16 $res = $self->locale_decode ($res);
17 push @{ $self->{patterns} }, qr{\G [\Q$res\E[:space:]]* ([^\Q$res\E[:space:]]+) }x;
18 }
19
15 for (my $idx = 0; defined (my $res = $self->x_resource ("selection.pattern-$idx")); $idx++) { 20 for (my $idx = 0; defined (my $res = $self->x_resource ("selection.pattern-$idx")); $idx++) {
16 no re 'eval'; # just to be sure 21 $res = $self->locale_decode ($res);
22 utf8::encode $res;
17 push @{ $self->{patterns} }, qr/$res/; 23 push @{ $self->{patterns} }, qr/$res/;
18 } 24 }
25
26 $self->{enabled} = 1;
27
28 push @{ $self->{term}{option_popup_hook} }, sub {
29 ("new selection" => $self->{enabled}, sub { $self->{enabled} = shift })
30 };
19 31
20 () 32 ()
21} 33}
22 34
23# "find interetsing things"-patterns 35# "find interesting things"-patterns
24my @mark_patterns = ( 36my @mark_patterns = (
37 qr{ ([[:word:]]+) }x,
38 qr{ ([^[:space:]]+) }x,
39
25 # common types of "parentheses" 40 # common types of "parentheses"
26 qr{(?:^|\s) ‘ ([^‘’]+?) ’ (?:\s|\)|$)}x, 41 qr{ (?<![^[:space:]]) ` ([^‘’]+) ` (?![^[:space:]]) }x,
27 qr{(?:^|\s) ` ([^`']+?) ' (?:\s|\)|$)}x, 42 qr{ (?<![^[:space:]]) ‘ ([^‘’]+) ’ (?![^[:space:]]) }x,
28 qr{ \{ ([^{}]+?) \} }x, 43 qr{ (?<![^[:space:]]) ` ([^`']+) ' (?![^[:space:]]) }x,
29 qr{ \[ ([^{}]+?) \] }x, 44
45 qr{ (?<![^[:space:]]) ‘ ([^`']+) ’ (?![^[:space:]]) }x,
46 qr{ (?<![^[:space:]]) “ ([^`']+) ” (?![^[:space:]]) }x,
47
48 qr{ (?<![^[:space:]]) (' [^[:space:]] [^']* ') }x,
49 qr{ (' [^']* [^[:space:]] ') (?![^[:space:]]) }x,
50 qr{ (?<![^[:space:]]) (" [^[:space:]] [^"]* ") }x,
51 qr{ (" [^"]* [^[:space:]] ") (?![^[:space:]]) }x,
52
53 qr{ \< ([^>]+) \> }x,
30 qr{ \( ([^()]+?) \) }x, 54 qr{ \( ([^)]+) \) }x,
55 qr{ \{ ([^}]+) \} }x,
56 qr{ \[ ([^]]+) \] }x,
31 57
32 # urls, just a heuristic 58 # urls, just a heuristic
33 qr{( 59 qr{(
34 (?:https?|ftp|news|mailto|file)://[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~]+ 60 (?:https?://|ftp://|news://|mailto:|file://|\bwww\.)[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~#]+
35 [ab-zA-Z0-9\-\@;\/?:&=%\$_+!*\x27()~] # exclude some trailing characters (heuristic) 61 [ab-zA-Z0-9\-\@;\/?:&=%\$_+*()~] # exclude some trailing characters (heuristic)
36 )}x, 62 )}x,
37 63
38 # shell-like argument quoting, basically always matches 64 # shell-like argument quoting, basically always matches
39 qr{\G [\ \t|&;<>()] *( 65 qr{\G [\ \t|&;<>()]* (
40 (?: 66 (?:
41 [^\\"'\ \t|&;<>()]+ 67 [^\\"'\ \t|&;<>()]+
42 | \\. 68 | \\.
43 | " (?: [^\\"]+ | \\. )* " 69 | " (?: [^\\"]+ | \\. )* "
44 | ' [^']* ' 70 | ' [^']* '
53); 79);
54 80
55sub on_sel_extend { 81sub on_sel_extend {
56 my ($self, $time) = @_; 82 my ($self, $time) = @_;
57 83
84 $self->{enabled}
85 or return;
86
58 my ($row, $col) = $self->selection_mark; 87 my ($row, $col) = $self->selection_mark;
59 my $line = $self->line ($row); 88 my $line = $self->line ($row);
60 my $text = $line->t; 89 my $text = $line->t;
61 my $markofs = $line->offset_of ($row, $col); 90 my $markofs = $line->offset_of ($row, $col);
62 my $curlen = $line->offset_of ($self->selection_end) 91 my $curlen = $line->offset_of ($self->selection_end)
63 - $line->offset_of ($self->selection_beg); 92 - $line->offset_of ($self->selection_beg);
64 93
65 my @matches; 94 my @matches;
66 95
67 for my $regex (@mark_patterns, @{ $self->{patterns} }) { 96 if ($markofs < $line->l) {
68 while ($text =~ /$regex/g) { 97 # convert markofs from character to UTF-8 offset space
69 if ($-[1] <= $markofs and $markofs <= $+[1]) { 98 {
70 my $ofs = $-[1]; 99 my $prefix = substr $text, 0, $markofs;
71 my $match = $1; 100 utf8::encode $prefix;
101 $markofs = length $prefix;
102 }
72 103
73 push @matches, [$ofs, length $match]; 104 # not doing matches in unicode mode helps speed
105 # enormously here. working in utf-8 should be
106 # equivalent due to the magic of utf-8 encoding.
107 utf8::encode $text;
108 study $text; # _really_ helps, too :)
74 109
110 for my $regex (@mark_patterns, @{ $self->{patterns} }) {
111 while ($text =~ /$regex/g) {
112 if ($-[1] <= $markofs and $markofs <= $+[1]) {
113 my $ofs = $-[1];
114 my $match = $1;
115
75 for my $regex (@simplify_patterns) { 116 for my $regex (@simplify_patterns) {
76 if ($match =~ $regex) { 117 if ($match =~ $regex) {
77 $match = $1; 118 $match = $1;
78 $ofs += $-[1]; 119 $ofs += $-[1];
120 }
79 } 121 }
122
123 push @matches, [$ofs, length $match];
80 } 124 }
81
82 push @matches, [$ofs, length $match];
83 } 125 }
84 } 126 }
85 } 127 }
86 128
87 # whole line 129 # whole line
90 for (sort { $a->[1] <=> $b->[1] or $b->[0] <=> $a->[0] } @matches) { 132 for (sort { $a->[1] <=> $b->[1] or $b->[0] <=> $a->[0] } @matches) {
91 my ($ofs, $len) = @$_; 133 my ($ofs, $len) = @$_;
92 134
93 next if $len <= $curlen; 135 next if $len <= $curlen;
94 136
137 # convert back from UTF-8 offset space to character space
138 {
139 my $length = substr "$text ", $ofs, $len;
140 utf8::decode $length;
141 $len = length $length;
142 }
143 {
144 my $prefix = substr $text, 0, $ofs;
145 utf8::decode $prefix;
146 $ofs = length $prefix;
147 }
148
95 $self->selection_beg ($line->coord_of ($ofs)); 149 $self->selection_beg ($line->coord_of ($ofs));
96 $self->selection_end ($line->coord_of ($ofs + $len)); 150 $self->selection_end ($line->coord_of ($ofs + $len));
97 return 1; 151 return 1;
98 } 152 }
99 153

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines