Correct underline processing and more UTF-8 support for w3mman2html.cgi
Patch from <https://bugs.launchpad.net/ubuntu/+source/w3m/+bug/680202>, provided by Piotr P. Karwasz.
This commit is contained in:
@@ -126,12 +126,14 @@ while(<F>) {
|
||||
s/\&/\&/g;
|
||||
s/\</\</g;
|
||||
s/\>/\>/g;
|
||||
# non ASCII UTF-8 codepoint
|
||||
my $utf8="[\300-\337][\200-\277]|[\340-\357][\200-\277]{2}|[\360-\367][\200-\277]{3}|[\370-\373][\200-\277]{4}|[\374\375][\200-\277]{5}";
|
||||
|
||||
s@([\200-\377].)(\010{1,2}\1)+@<b>$1</b>@g;
|
||||
s@($utf8)(\010\1)+@<b>$1</b>@g;
|
||||
s@(\&\w+;|.)(\010\1)+@<b>$1</b>@g;
|
||||
s@__\010{1,2}((\<b\>)?[\200-\377].(\</b\>)?)@<u>$1</u>@g;
|
||||
s@_\010((\<b\>)?($utf8)(\</b\>)?)@<u>$1</u>@g;
|
||||
s@_\010((\<b\>)?(\&\w+\;|.)(\</b\>)?)@<u>$1</u>@g;
|
||||
s@((\<b\>)?[\200-\377].(\</b\>)?)\010{1,2}__@<u>$1</u>@g;
|
||||
s@((\<b\>)?($utf8)(\</b\>)?)\010_@<u>$1</u>@g;
|
||||
s@((\<b\>)?(\&\w+\;|.)(\</b\>)?)\010_@<u>$1</u>@g;
|
||||
s@.\010(.)@$1@g;
|
||||
|
||||
|
Reference in New Issue
Block a user