ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/rxvt-unicode/src/perl/selection
Revision: 1.52
Committed: Sat Dec 26 10:50:46 2009 UTC (14 years, 5 months ago) by root
Branch: MAIN
CVS Tags: before_dynamic_fontidx, rel-9_10, dynamic_fontidx, rel-9_09, rel-9_07
Changes since 1.51: +2 -1 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 #! perl
2
# Hook for user commands. Only "selection:rot13" is handled here: the
# current selection is read, rot13-transformed and written back as the new
# selection. Always returns the empty list.
sub on_user_command {
   my ($self, $cmd) = @_;

   if ($cmd eq "selection:rot13") {
      my @rotated = $self->selection;

      # rot13 only touches ASCII letters, everything else passes through
      tr/A-Za-z/N-ZA-Mn-za-m/ for @rotated;

      $self->selection (@rotated);
   }

   ()
}
11
# Initialisation hook.
#
# Collects additional match patterns into $self->{patterns}:
#   - one derived from the "cutchars" resource, if it is set, and
#   - one per "selection.pattern-N" resource, for N = 0, 1, 2, ... up to
#     the first N that is not defined.
# Then marks the extension as enabled and appends an entry to the
# terminal's option_popup_hook list that lets $self->{enabled} be toggled.
# Always returns the empty list.
sub on_init {
   my ($self) = @_;

   my $patterns = $self->{patterns} ||= [];

   {
      my $res = $self->resource ("cutchars");

      if (defined $res) {
         $res = $self->locale_decode ($res);

         # skip any run of cutchars/whitespace, then capture the following
         # run of everything else
         push @$patterns, qr{\G [\Q$res\E[:space:]]* ([^\Q$res\E[:space:]]+) }x;
      }
   }

   my $idx = 0;

   while (1) {
      my $res = $self->x_resource ("selection.pattern-$idx");

      defined $res
         or last;

      $res = $self->locale_decode ($res);
      # compiled from the UTF-8 encoded form of the resource string
      utf8::encode $res;
      push @$patterns, qr/$res/;

      $idx++;
   }

   $self->{enabled} = 1;

   my $popup_entry = sub {
      ("new selection" => $self->{enabled}, sub { $self->{enabled} = shift })
   };

   push @{ $self->{term}{option_popup_hook} }, $popup_entry;

   ()
}
34
# Built-in patterns used to find "interesting" stretches of text. Each
# pattern is applied repeatedly to the line, and capture group 1 of every
# match is a candidate selection.
my @mark_patterns = (
   # runs of non-whitespace (a [[:word:]]+ variant is kept for reference)
   # qr{ ([[:word:]]+) }x,
   qr{ ([^[:space:]]+) }x,

   # quoted text delimited by whitespace (or line edges) on both sides;
   # the quote characters themselves are not captured
   qr{ (?<![^[:space:]]) [`'] ([^`']+) [`'] (?![^[:space:]]) }x,
   qr{ (?<![^[:space:]]) ‘ ([^‘’]+) ’ (?![^[:space:]]) }x,
   qr{ (?<![^[:space:]]) “ ([^“”]+) ” (?![^[:space:]]) }x,

   # quoted text including its quotes, anchored by whitespace on one side
   # only: '...', `...' and "..."
   qr{ (?<![^[:space:]]) (' [^[:space:]] [^']* ') }x,
   qr{ (' [^']* [^[:space:]] ') (?![^[:space:]]) }x,
   qr{ (?<![^[:space:]]) (` [^[:space:]] [^']* ') }x,
   qr{ (` [^']* [^[:space:]] ') (?![^[:space:]]) }x,
   qr{ (?<![^[:space:]]) (" [^[:space:]] [^"]* ") }x,
   qr{ (" [^"]* [^[:space:]] ") (?![^[:space:]]) }x,

   # innermost contents of bracket pairs
   qr{ \{ ([^\{\}]+) \} }x,
   qr{ \( ([^\(\)]+) \) }x,
   qr{ \[ ([^\[\]]+) \] }x,
   qr{ \< ([^\<\>]+) \> }x,

   # things that look like urls (heuristic only)
   qr{(
      (?:https?://|ftp://|news://|mailto:|file://|\bwww\.)[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~#]+
      [ab-zA-Z0-9\-\@;\/?:&=%\$_+*()~] # exclude some trailing characters (heuristic)
   )}x,

   # one shell-style argument, honouring backslash escapes and quoting;
   # this matches almost anything
   qr{\G [\ \t|&;<>()]* (
      (?:
         [^\\"'\ \t|&;<>()]+
         | \\.
         | " (?: [^\\"]+ | \\. )* "
         | ' [^']* '
      )+
   )}x,
);
73
# Clean-up patterns applied to a candidate match: whenever one of them
# matches, the candidate is replaced by its capture group 1.
my @simplify_patterns = (
   # "simple" => simple
   qr{^"([^\\"'\ \t|&;<>()*?]+)"$},

   # strip off trailing , and -
   qr{^(.*)[,\-]$},
);
79
# Selection-extend hook: grow the current selection to the next larger
# "interesting" stretch of text around the selection mark.
#
# Candidates are capture group 1 of every match of @mark_patterns and
# $self->{patterns} that contains the mark, each refined by
# @simplify_patterns, plus the whole line as a final fallback. The
# shortest candidate that is longer than the current selection wins; on
# equal length the candidate starting further right is tried first.
#
# Returns 1 when the selection was changed, and nothing (empty list/undef)
# when the extension is disabled or no candidate is larger than the current
# selection.
#
# Matching runs on the UTF-8 encoded line for speed, so the regex engine
# reports offsets in bytes. Every candidate is converted to character
# offsets as soon as it is recorded, so that it is compared against
# $curlen and against the whole-line entry in the same unit. Comparing
# byte lengths against character lengths made a match containing
# multi-byte characters look longer than itself, so it was re-selected
# forever; it also truncated the whole-line fallback on such lines.
sub on_sel_extend {
   my ($self, $time) = @_;

   $self->{enabled}
      or return;

   my ($row, $col) = $self->selection_mark;
   my $line = $self->line ($row);
   my $text = $line->t;
   my $markofs = $line->offset_of ($row, $col);
   my $curlen = $line->offset_of ($self->selection_end)
              - $line->offset_of ($self->selection_beg);

   # number of characters encoded by a UTF-8 byte string; if the bytes do
   # not decode (a pattern may have split a multi-byte sequence) this is
   # expected to fall back to the byte count, as the old code did
   my $char_length = sub {
      my ($bytes) = @_;
      utf8::decode $bytes;
      length $bytes
   };

   # candidates as [offset, length], both in characters
   my @matches;

   if ($markofs < $line->l) {
      # byte offset of the mark within the encoded line
      my $markpos = do {
         my $prefix = substr $text, 0, $markofs;
         utf8::encode $prefix;
         length $prefix
      };

      # matching the encoded bytes instead of the character string helps
      # speed enormously; $text itself stays a character string
      my $octets = $text;
      utf8::encode $octets;
      study $octets; # _really_ helps, too :)

      for my $regex (@mark_patterns, @{ $self->{patterns} }) {
         while ($octets =~ /$regex/g) {
            if ($-[1] <= $markpos and $markpos <= $+[1]) {
               # save these before any further match clobbers $1 and @-
               my $ofs = $-[1];
               my $match = $1;

               for my $simplify (@simplify_patterns) {
                  if ($match =~ $simplify) {
                     $match = $1;
                     $ofs += $-[1];
                  }
               }

               push @matches, [
                  $char_length->(substr $octets, 0, $ofs),
                  $char_length->($match),
               ];
            }
         }
      }
   }

   # whole line, measured in cells
   push @matches, [0, ($line->end - $line->beg + 1) * $self->ncol];

   for (sort { $a->[1] <=> $b->[1] or $b->[0] <=> $a->[0] } @matches) {
      my ($ofs, $len) = @$_;

      next if $len <= $curlen;

      # clamp to the text plus one trailing position; this only ever
      # shortens the whole-line entry, regex candidates lie within $text
      $len = length substr "$text ", $ofs, $len;

      $self->selection_beg ($line->coord_of ($ofs));
      $self->selection_end ($line->coord_of ($ofs + $len));
      return 1;
   }

   ()
}