ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/rxvt-unicode/src/perl/selection
(Generate patch)

Comparing rxvt-unicode/src/perl/selection (file contents):
Revision 1.18 by root, Mon Jan 9 01:06:55 2006 UTC vs.
Revision 1.50 by root, Sat Jan 12 22:13:47 2008 UTC

1#! perl 1#! perl
2 2
# Side-by-side diff rows: the first numbered column is the older revision (1.18),
# the second numbered column is the newer revision (1.50).
# The handler is renamed from on_keyboard_command to on_user_command; its body is
# the same in both columns.
# When $cmd equals "selection:rot13", the text returned by $self->selection is
# ROT13-transformed (y/A-Za-z/N-ZA-Mn-za-m/) and passed back to $self->selection.
# The sub always returns the empty list.
3sub on_keyboard_command { 3sub on_user_command {
4 my ($self, $cmd) = @_; 4 my ($self, $cmd) = @_;
5 5
6 $cmd eq "selection:rot13" 6 $cmd eq "selection:rot13"
7 and $self->selection (map { y/A-Za-z/N-ZA-Mn-za-m/; $_ } $self->selection); 7 and $self->selection (map { y/A-Za-z/N-ZA-Mn-za-m/; $_ } $self->selection);
8 8
9 () 9 ()
10} 10}
11 11
# on_init appears only in the newer column of this diff; the leading numbers are
# its line numbers in that revision.
# It collects extra match patterns into $self->{patterns}, switches the extension
# on, registers an option-popup entry, and returns the empty list.
12sub on_init {
13 my ($self) = @_;
14
# If the "cutchars" resource is defined: build a pattern that, starting at \G,
# skips any run of cutchars/whitespace and captures the following run of
# characters that are neither cutchars nor whitespace.
15 if (defined (my $res = $self->resource ("cutchars"))) {
16 $res = $self->locale_decode ($res);
17 push @{ $self->{patterns} }, qr{\G [\Q$res\E[:space:]]* ([^\Q$res\E[:space:]]+) }x;
18 }
19
# Read selection.pattern-0, selection.pattern-1, ... and stop at the first index
# whose resource is undefined. Each pattern is UTF-8 encoded before compilation;
# on_sel_extend also UTF-8 encodes the line text before matching against it.
20 for (my $idx = 0; defined (my $res = $self->x_resource ("selection.pattern-$idx")); $idx++) {
21 $res = $self->locale_decode ($res);
22 utf8::encode $res;
23 push @{ $self->{patterns} }, qr/$res/;
24 }
25
# Enabled by default; on_sel_extend returns early when this flag is false.
26 $self->{enabled} = 1;
27
# The hook returns a "new selection" popup entry: label, current flag value, and
# a callback that stores its first argument into $self->{enabled}.
28 push @{ $self->{term}{option_popup_hook} }, sub {
29 ("new selection" => $self->{enabled}, sub { $self->{enabled} = shift })
30 };
31
32 ()
33}
34
12# "find interetsing things"-patterns 35# "find interesting things"-patterns
13my @mark_patterns = ( 36my @mark_patterns = (
37# qr{ ([[:word:]]+) }x,
38 qr{ ([^[:space:]]+) }x,
39
40 # common types of "parentheses"
41 qr{ (?<![^[:space:]]) [`'] ([^`']+) [`'] (?![^[:space:]]) }x,
42 qr{ (?<![^[:space:]]) ‘ ([^‘’]+) ’ (?![^[:space:]]) }x,
43 qr{ (?<![^[:space:]]) “ ([^“”]+) ” (?![^[:space:]]) }x,
44
45 qr{ (?<![^[:space:]]) (' [^[:space:]] [^']* ') }x,
46 qr{ (' [^']* [^[:space:]] ') (?![^[:space:]]) }x,
47 qr{ (?<![^[:space:]]) (" [^[:space:]] [^"]* ") }x,
48 qr{ (" [^"]* [^[:space:]] ") (?![^[:space:]]) }x,
49
50 qr{ \{ ([^\{\}]+) \} }x,
51 qr{ \( ([^\(\)]+) \) }x,
52 qr{ \[ ([^\[\]]+) \] }x,
53 qr{ \< ([^\<\>]+) \> }x,
54
14 # urls, just a heuristic 55 # urls, just a heuristic
15 qr{( 56 qr{(
16 (?:https?|ftp|news|mailto|file)://[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~]+ 57 (?:https?://|ftp://|news://|mailto:|file://|\bwww\.)[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~#]+
17 [ab-zA-Z0-9\-\@;\/?:&=%\$_+!*\x27(),~] # do not include a trailing dot, its wrong too often 58 [ab-zA-Z0-9\-\@;\/?:&=%\$_+*()~] # exclude some trailing characters (heuristic)
18 )}x, 59 )}x,
19 60
20 # common "parentheses"
21 qr{(?:^|\s) ‘ ([^‘’]+?) ’ (?:\s|\)|$)}x,
22 qr{(?:^|\s) ` ([^`']+?) ' (?:\s|\)|$)}x,
23 qr{ \{ ([^{}]+?) \} }x,
24 qr{ \[ ([^{}]+?) \] }x,
25
26 # shell-like argument quoting, basically always matches 61 # shell-like argument quoting, basically always matches
27 qr{\G [\ \t|&;<>()] *( 62 qr{\G [\ \t|&;<>()]* (
28 (?: 63 (?:
29 [^\\"'\ \t|&;<>()]+ 64 [^\\"'\ \t|&;<>()]+
30 | \\. 65 | \\.
31 | " (?: [^\\"]+ | \\. )* " 66 | " (?: [^\\"]+ | \\. )* "
32 | ' [^']* ' 67 | ' [^']* '
39 qr{^"([^\\"'\ \t|&;<>()*?]+)"$}, # "simple" => simple 74 qr{^"([^\\"'\ \t|&;<>()*?]+)"$}, # "simple" => simple
40 qr{^(.*)[,\-]$}, # strip off trailing , and - 75 qr{^(.*)[,\-]$}, # strip off trailing , and -
41); 76);
42 77
# on_sel_extend, shown as side-by-side diff rows (older revision numbers first,
# newer revision numbers second; rows with a single number exist in one revision only).
# Older column: the first pattern match whose capture contains the mark offset
# becomes the selection and the sub returns 1 immediately.
# Newer column: every such match is collected in @matches, the whole line is added
# as a final candidate, and the shortest candidate that is longer than the current
# selection is chosen. Both columns return the empty list when nothing was selected.
43sub on_sel_extend { 78sub on_sel_extend {
44 my ($self) = @_; 79 my ($self, $time) = @_;
80
# Newer column only: do nothing when the extension has been switched off.
81 $self->{enabled}
82 or return;
45 83
46 my ($row, $col) = $self->selection_mark; 84 my ($row, $col) = $self->selection_mark;
47 my $line = $self->line ($row); 85 my $line = $self->line ($row);
48 my $offset = $line->offset_of ($row, $col);
49 my $text = $line->t; 86 my $text = $line->t;
# Newer column: the mark offset is called $markofs, and $curlen is the length of
# the current selection (offset of selection_end minus offset of selection_beg).
87 my $markofs = $line->offset_of ($row, $col);
88 my $curlen = $line->offset_of ($self->selection_end)
89 - $line->offset_of ($self->selection_beg);
50 90
# Older column: iterate over @mark_patterns only and test against $offset.
# Newer column: start with an empty candidate list.
51 for my $regex (@mark_patterns) { 91 my @matches;
52 while ($text =~ /$regex/g) {
53 if ($-[1] <= $offset and $offset <= $+[1]) {
54 my $ofs = $-[1];
55 my $match = $1;
56 92
# Newer column: pattern matching is attempted only when the mark offset is below $line->l.
93 if ($markofs < $line->l) {
94 # convert markofs from character to UTF-8 offset space
95 {
96 my $prefix = substr $text, 0, $markofs;
97 utf8::encode $prefix;
98 $markofs = length $prefix;
99 }
100
101 # not doing matches in unicode mode helps speed
102 # enormously here. working in utf-8 should be
103 # equivalent due to the magic of utf-8 encoding.
104 utf8::encode $text;
105 study $text; # _really_ helps, too :)
106
# Newer column: the built-in patterns plus the patterns collected in $self->{patterns}.
107 for my $regex (@mark_patterns, @{ $self->{patterns} }) {
108 while ($text =~ /$regex/g) {
109 if ($-[1] <= $markofs and $markofs <= $+[1]) {
110 my $ofs = $-[1];
111 my $match = $1;
112
# Both columns: each simplify pattern that matches replaces $match with its first
# capture and advances $ofs by the start of that capture.
57 for my $regex (@simplify_patterns) { 113 for my $regex (@simplify_patterns) {
58 if ($match =~ $regex) { 114 if ($match =~ $regex) {
59 $match = $1; 115 $match = $1;
60 $ofs += $-[1]; 116 $ofs += $-[1];
117 }
61 } 118 }
119
# Newer column: record the candidate as [offset, length] instead of selecting it right away.
120 push @matches, [$ofs, length $match];
62 } 121 }
63
# Older column: select the match and stop at the first hit.
64 $self->selection_beg ($line->coord_of ($ofs));
65 $self->selection_end ($line->coord_of ($ofs + length $match));
66 return 1;
67 } 122 }
68 } 123 }
69 } 124 }
70 125
126 # whole line
127 push @matches, [0, ($line->end - $line->beg + 1) * $self->ncol];
128
# Candidates are tried shortest first; for equal lengths the larger offset comes first.
129 for (sort { $a->[1] <=> $b->[1] or $b->[0] <=> $a->[0] } @matches) {
130 my ($ofs, $len) = @$_;
131
# Skip candidates that would not grow the current selection.
132 next if $len <= $curlen;
133
134 # convert back from UTF-8 offset space to character space
# NOTE(review): the space appended to $text presumably keeps substr from running
# off the end of the string for the whole-line candidate - confirm.
135 {
136 my $length = substr "$text ", $ofs, $len;
137 utf8::decode $length;
138 $len = length $length;
139 }
140 {
141 my $prefix = substr $text, 0, $ofs;
142 utf8::decode $prefix;
143 $ofs = length $prefix;
144 }
145
146 $self->selection_beg ($line->coord_of ($ofs));
147 $self->selection_end ($line->coord_of ($ofs + $len));
148 return 1;
149 }
150
71 () 151 ()
72} 152}

Diff Legend

- Removed lines
+ Added lines
< Changed lines
> Changed lines