ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/rxvt-unicode/src/perl/selection
Revision: 1.40
Committed: Tue Oct 3 11:32:20 2006 UTC (17 years, 7 months ago) by root
Branch: MAIN
CVS Tags: rel-8_0
Changes since 1.39: +2 -2 lines
Log Message:
matcher

File Contents

# User Rev Content
1 root 1.4 #! perl
2    
# Handle a user command sent to this extension.
#
# Only "selection:rot13" is acted upon: the current selection is fetched,
# ROT13-transformed (ASCII letters only) and stored back via
# $self->selection. Any other command is ignored.
#
# Always returns the empty list.
sub on_user_command {
   my ($self, $cmd) = @_;

   if ($cmd eq "selection:rot13") {
      my @rotated = $self->selection;

      # ROT13 is its own inverse, so the same command also decodes
      tr/A-Za-z/N-ZA-Mn-za-m/ for @rotated;

      $self->selection (@rotated);
   }

   ()
}
11 root 1.5
# Extension initialisation.
#
# Collects the user-configured selection patterns into $self->{patterns},
# switches the extension on ($self->{enabled}) and appends an entry to the
# terminal's option_popup_hook list that exposes that flag as "new selection".
#
# Always returns the empty list.
sub on_init {
   my ($self) = @_;

   # the "cutchars" resource becomes a word pattern: skip any run of
   # cut characters/whitespace, then capture the following run of others
   my $cutchars = $self->resource ("cutchars");
   if (defined $cutchars) {
      my $res = $self->locale_decode ($cutchars);
      push @{ $self->{patterns} }, qr{\G [\Q$res\E[:space:]]* ([^\Q$res\E[:space:]]+) }x;
   }

   # selection.pattern-0, selection.pattern-1, ... up to the first gap
   my $idx = 0;
   while (defined (my $pattern = $self->x_resource ("selection.pattern-$idx"))) {
      my $res = $self->locale_decode ($pattern);
      # on_sel_extend matches against UTF-8 encoded line text, so the
      # pattern is encoded the same way before compiling
      utf8::encode $res;
      push @{ $self->{patterns} }, qr/$res/;
      $idx++;
   }

   $self->{enabled} = 1;

   # the hook yields (label, current value, setter callback)
   my $popup_entry = sub {
      ("new selection" => $self->{enabled}, sub { $self->{enabled} = shift })
   };
   push @{ $self->{term}{option_popup_hook} }, $popup_entry;

   ()
}
34    
# "find interesting things"-patterns
#
# on_sel_extend tries every pattern against the (UTF-8 encoded) line text
# and uses capture group 1 of each match as a selection candidate, so every
# pattern must put the interesting part into group 1.
my @mark_patterns = (
   # common types of "parentheses"
   # the quote forms must be delimited by whitespace (or the text boundary)
   # on the outside: (?<![^[:space:]]) / (?![^[:space:]])
   qr{ (?<![^[:space:]]) ‘ ([^‘’]+) ’ (?![^[:space:]]) }x,
   qr{ (?<![^[:space:]]) ` ([^`']+) ' (?![^[:space:]]) }x,
   qr{ (?<![^[:space:]]) (" [^[:space:]] [^"]* ") }x,
   qr{ (" [^"]* [^[:space:]] ") (?![^[:space:]]) }x,
   # bracket pairs: the content may contain neither whitespace nor the
   # pair's own delimiters
   qr{ \< ([^<>[:space:]]+) \> }x,
   qr{ \{ ([^{}[:space:]]+) \} }x,
   qr{ \[ ([^\[\][:space:]]+) \] }x,
   qr{ \( ([^()[:space:]]+) \) }x,

   # urls, just a heuristic
   # NOTE(review): "ab-z" is equivalent to "a-z"; the spelling is kept exactly
   # as committed since the reason for it is not visible here
   qr{(
      (?:https?://|ftp://|news://|mailto:|file://|\bwww\.)[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~#]+
      [ab-zA-Z0-9\-\@;\/?:&=%\$_+*()~]   # exclude some trailing characters (heuristic)
   )}x,

   # shell-like argument quoting, basically always matches
   qr{\G [\ \t|&;<>()]* (
      (?:
         [^\\"'\ \t|&;<>()]+
         | \\.
         | " (?: [^\\"]+ | \\. )* "
         | ' [^']* '
      )+
   )}x,
);
63    
# "correct obvious? crap"-patterns
#
# applied by on_sel_extend to each candidate match; when one matches, the
# candidate is replaced by its capture group 1
my @simplify_patterns = (
   # "simple" => simple
   qr{^"([^\\"'\ \t|&;<>()*?]+)"$},

   # strip off trailing , and -
   qr{^(.*)[,\-]$},
);
69 root 1.14
# Try to grow the current selection to the next larger "interesting" range
# around the selection mark.
#
# Candidates are capture group 1 of every match of @mark_patterns and the
# user patterns in $self->{patterns} that contains the mark (after being
# trimmed by @simplify_patterns), plus the whole line. The shortest
# candidate that is longer than the current selection wins.
#
# Arguments: $self, $time ($time is not used here).
# Returns 1 after changing the selection; returns nothing when the
# extension is disabled and the empty list when no candidate is larger
# than the current selection.
sub on_sel_extend {
   my ($self, $time) = @_;

   $self->{enabled}
      or return;

   my ($row, $col) = $self->selection_mark;
   my $line = $self->line ($row);
   my $text = $line->t;
   my $markofs = $line->offset_of ($row, $col);
   my $curlen = $line->offset_of ($self->selection_end)
              - $line->offset_of ($self->selection_beg);

   # candidate ranges as [offset, length], both in character units
   my @matches;

   if ($markofs < $line->l) {
      # convert markofs from character to UTF-8 offset space
      {
         my $prefix = substr $text, 0, $markofs;
         utf8::encode $prefix;
         $markofs = length $prefix;
      }

      # not doing matches in unicode mode helps speed
      # enormously here. working in utf-8 should be
      # equivalent due to the magic of utf-8 encoding.
      utf8::encode $text;
      study $text; # _really_ helps, too :)

      for my $regex (@mark_patterns, @{ $self->{patterns} }) {
         while ($text =~ /$regex/g) {
            # group 1 is missing or did not participate in this match
            # (possible with user-supplied patterns): nothing to select
            defined $-[1]
               or next;

            if ($-[1] <= $markofs and $markofs <= $+[1]) {
               my $ofs = $-[1];
               my $match = $1;

               for my $regex (@simplify_patterns) {
                  if ($match =~ $regex) {
                     $match = $1;
                     $ofs += $-[1];
                  }
               }

               # convert back from UTF-8 offset space to character space
               # right away, so that every candidate is measured in the same
               # units as $curlen and the whole-line candidate below
               my $prefix = substr $text, 0, $ofs;
               utf8::decode $prefix;
               utf8::decode $match;

               push @matches, [length $prefix, length $match];
            }
         }
      }
   }

   # whole line (already in character units)
   push @matches, [0, ($line->end - $line->beg + 1) * $self->ncol];

   # shortest candidate first; among equally long ones, the rightmost first
   for (sort { $a->[1] <=> $b->[1] or $b->[0] <=> $a->[0] } @matches) {
      my ($ofs, $len) = @$_;

      # only candidates that actually enlarge the selection are useful
      next if $len <= $curlen;

      $self->selection_beg ($line->coord_of ($ofs));
      $self->selection_end ($line->coord_of ($ofs + $len));
      return 1;
   }

   ()
}