--- rxvt-unicode/src/perl/selection 2006/02/06 06:14:08 1.37 +++ rxvt-unicode/src/perl/selection 2008/01/12 22:13:47 1.50 @@ -34,20 +34,28 @@ # "find interesting things"-patterns my @mark_patterns = ( +# qr{ ([[:word:]]+) }x, + qr{ ([^[:space:]]+) }x, + # common types of "parentheses" - qr{ (?[:space:]]+) \> }x, - qr{ \{ ([^{}[:space:]]+) \} }x, - qr{ \[ ([^{}[:space:]]+) \] }x, - qr{ \( ([^()[:space:]]+) \) }x, + qr{ (?]+) \> }x, # urls, just a heuristic qr{( - (?:https?|ftp|news|mailto|file)://[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~]+ - [ab-zA-Z0-9\-\@;\/?:&=%\$_+!*\x27()~] # exclude some trailing characters (heuristic) + (?:https?://|ftp://|news://|mailto:|file://|\bwww\.)[ab-zA-Z0-9\-\@;\/?:&=%\$_.+!*\x27(),~#]+ + [ab-zA-Z0-9\-\@;\/?:&=%\$_+*()~] # exclude some trailing characters (heuristic) )}x, # shell-like argument quoting, basically always matches @@ -83,7 +91,7 @@ my @matches; if ($markofs < $line->l) { - # convert markofs form character to UTF-8 offset space + # convert markofs from character to UTF-8 offset space { my $prefix = substr $text, 0, $markofs; utf8::encode $prefix;