ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/rxvt-unicode/src/perl/selection
(Generate patch)

Comparing rxvt-unicode/src/perl/selection (file contents):
Revision 1.19 by root, Tue Jan 10 21:20:53 2006 UTC vs.
Revision 1.32 by root, Sat Jan 21 21:20:34 2006 UTC

7 and $self->selection (map { y/A-Za-z/N-ZA-Mn-za-m/; $_ } $self->selection); 7 and $self->selection (map { y/A-Za-z/N-ZA-Mn-za-m/; $_ } $self->selection);
8 8
9 () 9 ()
10} 10}
11 11
# on_init exists only in r1.32 (single line numbers). It reads the X resources
# selection.pattern-0, selection.pattern-1, ... and stores each one, compiled
# as a regex, in $self->{patterns}; on_sel_extend later tries these patterns
# in addition to @mark_patterns.
12sub on_init {
13 my ($self) = @_;
14
# the loop ends at the first index whose resource is not defined
15 for (my $idx = 0; defined (my $res = $self->x_resource ("selection.pattern-$idx")); $idx++) {
# keep the re eval pragma off so an interpolated user pattern cannot embed code blocks
16 no re 'eval'; # just to be sure
17 $res = $self->locale_decode ($res);
# on_sel_extend matches against UTF-8 encoded text, so the pattern is encoded the same way
18 utf8::encode $res;
19 push @{ $self->{patterns} }, qr/$res/;
20 }
21
# return an empty list
22 ()
23}
24
12# "find interesting things"-patterns 25# "find interesting things"-patterns
13my @mark_patterns = ( 26my @mark_patterns = (
27 # common types of "parentheses"
# Quote patterns: the lookbehind (?<![^[:space:]]) and lookahead (?![^[:space:]])
# require whitespace or the edge of the text on the outside of the delimiter.
# The POSIX class must be spelled [:space:] with both colons, otherwise Perl
# reads it as a plain list of characters and the check silently stops working.
28 qr{ (?<![^[:space:]]) ‘ ([^‘’]+) ’ (?![^[:space:]]) }x,
29 qr{ (?<![^[:space:]]) ` ([^`']+) ' (?![^[:space:]]) }x,
# double quotes: the capture keeps the quotes; one pattern anchors on the
# opening quote, the other on the closing quote
30 qr{ (?<![^[:space:]]) (" [^[:space:]] [^"]* ") }x,
31 qr{ (" [^"]* [^[:space:]] ") (?![^[:space:]]) }x,
# bracket pairs: the capture is the whitespace-free content, and each pattern
# excludes its own delimiters so adjacent groups are matched separately
32 qr{ \< ([^<>[:space:]]+) \> }x,
33 qr{ \{ ([^{}[:space:]]+) \} }x,
34 qr{ \[ ([^\[\][:space:]]+) \] }x,
35 qr{ \( ([^()[:space:]]+) \) }x,
36
14 # urls, just a heuristic 37 # urls, just a heuristic
15 qr{( 38 qr{(
16 (?:https?|ftp|news|mailto|file)://[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~]+ 39 (?:https?|ftp|news|mailto|file)://[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~]+
17 [ab-zA-Z0-9\-\@;\/?:&=%\$_+!*\x27()~] # exclude some trailing characters (heuristic) 40 [ab-zA-Z0-9\-\@;\/?:&=%\$_+!*\x27()~] # exclude some trailing characters (heuristic)
18 )}x, 41 )}x,
19
20 # common "parentheses"
21 qr{(?:^|\s) ‘ ([^‘’]+?) ’ (?:\s|\)|$)}x,
22 qr{(?:^|\s) ` ([^`']+?) ' (?:\s|\)|$)}x,
23 qr{ \{ ([^{}]+?) \} }x,
24 qr{ \[ ([^{}]+?) \] }x,
25 42
26 # shell-like argument quoting, basically always matches 43 # shell-like argument quoting, basically always matches
27 qr{\G [\ \t|&;<>()] *( 44 qr{\G [\ \t|&;<>()] *(
28 (?: 45 (?:
29 [^\\"'\ \t|&;<>()]+ 46 [^\\"'\ \t|&;<>()]+
39 qr{^"([^\\"'\ \t|&;<>()*?]+)"$}, # "simple" => simple 56 qr{^"([^\\"'\ \t|&;<>()*?]+)"$}, # "simple" => simple
40 qr{^(.*)[,\-]$}, # strip off trailing , and - 57 qr{^(.*)[,\-]$}, # strip off trailing , and -
41); 58);
42 59
# on_sel_extend, shown as a side-by-side diff: the first number on a line is
# the r1.19 line number, a second number further right is the r1.32 line
# number; a line carrying a single number exists in only one revision.
# r1.19: selects the first pattern match that contains the selection mark and
# returns 1.
# r1.32: collects every pattern match that contains the mark in @matches, adds
# a whole-line entry, then selects the shortest entry that is longer than the
# current selection and returns 1 (presumably so that repeated extension grows
# the selection step by step - confirm against the caller).
# Both revisions return an empty list when nothing was selected.
43sub on_sel_extend { 60sub on_sel_extend {
44 my ($self) = @_; 61 my ($self, $time) = @_;
45 62
46 my ($row, $col) = $self->selection_mark; 63 my ($row, $col) = $self->selection_mark;
47 my $line = $self->line ($row); 64 my $line = $self->line ($row);
48 my $offset = $line->offset_of ($row, $col);
49 my $text = $line->t; 65 my $text = $line->t;
66 my $markofs = $line->offset_of ($row, $col);
# length of the current selection, computed from offsets before any UTF-8 encoding
67 my $curlen = $line->offset_of ($self->selection_end)
68 - $line->offset_of ($self->selection_beg);
50 69
51 for my $regex (@mark_patterns) { 70 my @matches;
52 while ($text =~ /$regex/g) {
53 if ($-[1] <= $offset and $offset <= $+[1]) {
54 my $ofs = $-[1];
55 my $match = $1;
56 71
# patterns are only tried when the mark lies before $line->l
72 if ($markofs < $line->l) {
73 # convert markofs from character to UTF-8 offset space
74 {
75 my $prefix = substr $text, 0, $markofs;
76 utf8::encode $prefix;
77 $markofs = length $prefix;
78 }
79
80 # not doing matches in unicode mode helps speed
81 # enormously here. working in utf-8 should be
82 # equivalent due to the magic of utf-8 encoding.
83 utf8::encode $text;
84 study $text; # _really_ helps, too :)
85
# built-in patterns first, then the user patterns collected by on_init
86 for my $regex (@mark_patterns, @{ $self->{patterns} }) {
87 while ($text =~ /$regex/g) {
# keep the match only if the mark lies inside capture group 1
88 if ($-[1] <= $markofs and $markofs <= $+[1]) {
89 my $ofs = $-[1];
90 my $match = $1;
91
# each simplify pattern that matches narrows the match to its group 1 and shifts the offset accordingly
57 for my $regex (@simplify_patterns) { 92 for my $regex (@simplify_patterns) {
58 if ($match =~ $regex) { 93 if ($match =~ $regex) {
59 $match = $1; 94 $match = $1;
60 $ofs += $-[1]; 95 $ofs += $-[1];
96 }
61 } 97 }
98
# offset and length are recorded in UTF-8 offset space
99 push @matches, [$ofs, length $match];
62 } 100 }
63
64 $self->selection_beg ($line->coord_of ($ofs));
65 $self->selection_end ($line->coord_of ($ofs + length $match));
66 return 1;
67 } 101 }
68 } 102 }
69 } 103 }
70 104
105 # whole line
106 push @matches, [0, ($line->end - $line->beg + 1) * $self->ncol];
107
# shortest entry first; among equal lengths the larger start offset first
108 for (sort { $a->[1] <=> $b->[1] or $b->[0] <=> $a->[0] } @matches) {
109 my ($ofs, $len) = @$_;
110
# NOTE(review): $len is still a UTF-8 length here (it is converted only below,
# and the whole-line entry is a column count), while $curlen was computed from
# character offsets; the units differ for non-ASCII text - confirm this is intended
111 next if $len <= $curlen;
112
113 # convert back from UTF-8 offset space to character space
114 {
115 my $length = substr $text, $ofs, $len;
116 utf8::decode $length;
117 $len = length $length;
118 }
119 {
120 my $prefix = substr $text, 0, $ofs;
121 utf8::decode $prefix;
122 $ofs = length $prefix;
123 }
124
125 $self->selection_beg ($line->coord_of ($ofs));
126 $self->selection_end ($line->coord_of ($ofs + $len));
127 return 1;
128 }
129
71 () 130 ()
72} 131}

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines