… | |
… | |
9 | () |
9 | () |
10 | } |
10 | } |
11 | |
11 | |
12 | # "find interesting things"-patterns |
12 | # "find interesting things"-patterns |
13 | my @mark_patterns = ( |
13 | my @mark_patterns = ( |
|
|
14 | qr{([[:alnum:]]+)}, |
|
|
15 | |
|
|
16 | # common "parentheses" |
|
|
17 | qr{(?:^|\s) ‘ ([^‘’]+?) ’ (?:\s|\)|$)}x, |
|
|
18 | qr{(?:^|\s) ` ([^`']+?) ' (?:\s|\)|$)}x, |
|
|
19 | qr{ \{ ([^{}]+?) \} }x, |
|
|
20 | qr{ \[ ([^{}]+?) \] }x, |
|
|
21 | |
14 | # urls, just a heuristic |
22 | # urls, just a heuristic |
15 | qr{( |
23 | qr{( |
16 | (?:https?|ftp|news|mailto|file)://[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~]+ |
24 | (?:https?|ftp|news|mailto|file)://[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~]+ |
17 | [ab-zA-Z0-9\-\@;\/?:&=%\$_+!*\x27(),~] # do not include a trailing dot, its wrong too often |
25 | [ab-zA-Z0-9\-\@;\/?:&=%\$_+!*\x27()~] # exclude some trailing characters (heuristic) |
18 | )}x, |
26 | )}x, |
19 | |
27 | |
20 | # common forms of quoting |
28 | # shell-like argument quoting, basically always matches |
21 | qr{(?:^|\s) [‘`] ([^‘`’']+) [’'] (?:\s|$)}x, |
|
|
22 | |
|
|
23 | # shell-like argument quoting |
|
|
24 | qr{\G [\ \t|&;<>()] *( |
29 | qr{\G [\ \t|&;<>()] *( |
25 | (?: |
30 | (?: |
26 | [^\\"'\ \t|&;<>()]+ |
31 | [^\\"'\ \t|&;<>()]+ |
27 | | \\. |
32 | | \\. |
28 | | " (?: [^\\"]+ | \\. )* " |
33 | | " (?: [^\\"]+ | \\. )* " |
… | |
… | |
36 | qr{^"([^\\"'\ \t|&;<>()*?]+)"$}, # "simple" => simple |
41 | qr{^"([^\\"'\ \t|&;<>()*?]+)"$}, # "simple" => simple |
37 | qr{^(.*)[,\-]$}, # strip off trailing , and - |
42 | qr{^(.*)[,\-]$}, # strip off trailing , and - |
38 | ); |
43 | ); |
39 | |
44 | |
40 | sub on_sel_extend { |
45 | sub on_sel_extend { |
41 | my ($self) = @_; |
46 | my ($self, $time) = @_; |
42 | |
47 | |
43 | my ($row, $col) = $self->selection_mark; |
48 | my ($row, $col) = $self->selection_mark; |
44 | my $line = $self->line ($row); |
49 | my $line = $self->line ($row); |
45 | my $offset = $line->offset_of ($row, $col); |
|
|
46 | my $text = $line->t; |
50 | my $text = $line->t; |
|
|
51 | my $markofs = $line->offset_of ($row, $col); |
|
|
52 | my $curlen = $line->offset_of ($self->selection_end) |
|
|
53 | - $line->offset_of ($self->selection_beg); |
|
|
54 | |
|
|
55 | my @matches; |
47 | |
56 | |
48 | for my $regex (@mark_patterns) { |
57 | for my $regex (@mark_patterns) { |
49 | while ($text =~ /$regex/g) { |
58 | while ($text =~ /$regex/g) { |
50 | if ($-[1] <= $offset and $offset <= $+[1]) { |
59 | if ($-[1] <= $markofs and $markofs <= $+[1]) { |
51 | my $ofs = $-[1]; |
60 | my $ofs = $-[1]; |
52 | my $match = $1; |
61 | my $match = $1; |
|
|
62 | |
|
|
63 | push @matches, [$ofs, length $match]; |
53 | |
64 | |
54 | for my $regex (@simplify_patterns) { |
65 | for my $regex (@simplify_patterns) { |
55 | if ($match =~ $regex) { |
66 | if ($match =~ $regex) { |
56 | $match = $1; |
67 | $match = $1; |
57 | $ofs += $-[1]; |
68 | $ofs += $-[1]; |
58 | } |
69 | } |
59 | } |
70 | } |
60 | |
71 | |
61 | $self->selection_beg ($line->coord_of ($ofs)); |
72 | push @matches, [$ofs, length $match]; |
62 | $self->selection_end ($line->coord_of ($ofs + length $match)); |
|
|
63 | return 1; |
|
|
64 | } |
73 | } |
65 | } |
74 | } |
66 | } |
75 | } |
67 | |
76 | |
|
|
77 | # whole line |
|
|
78 | push @matches, [0, ($line->end - $line->beg + 1) * $self->ncol]; |
|
|
79 | |
|
|
80 | for (sort { $a->[1] <=> $b->[1] or $b->[0] <=> $a->[0] } @matches) { |
|
|
81 | my ($ofs, $len) = @$_; |
|
|
82 | |
|
|
83 | next if $len <= $curlen; |
|
|
84 | |
|
|
85 | $self->selection_beg ($line->coord_of ($ofs)); |
|
|
86 | $self->selection_end ($line->coord_of ($ofs + $len)); |
|
|
87 | return 1; |
|
|
88 | } |
|
|
89 | |
68 | () |
90 | () |
69 | } |
91 | } |