From 0561dc969f7e1e5bdc52248b75b5d1e555ffaf01 Mon Sep 17 00:00:00 2001 From: Rocco Rutte Date: Mon, 6 Jul 2009 15:28:04 +0200 Subject: [PATCH] Manual: Add a note about when/why to use utf-8 --- doc/manual.xml.head | 48 +++++++++++++++++++++++++-------------------- 1 file changed, 27 insertions(+), 21 deletions(-) diff --git a/doc/manual.xml.head b/doc/manual.xml.head index 3990c6d0..bf244cce 100644 --- a/doc/manual.xml.head +++ b/doc/manual.xml.head @@ -46,7 +46,7 @@ The official homepage can be found at To subscribe to one of the following mailing lists, send a message with the word subscribe in the body to -list-name-request@mutt.org. +list-name-request@mutt.org. @@ -73,14 +73,11 @@ feature requests - -All messages posted to -mutt-announce are automatically forwarded to -mutt-users, so you do not need to be subscribed to -both lists. +All messages posted to mutt-announce are +automatically forwarded to mutt-users, so you do +not need to be subscribed to both lists. - @@ -4571,13 +4568,11 @@ set index_format="%4C %Z %{%b %d} %-15.15L (%?l?%4l&%4c?)%* %s" Character Set Handling -Mutt supports all character sets the system supports which can be -determined by running locale -a. A character -set is basically a mapping between bytes and glyphs and implies -a certain character encoding scheme. For example, for the ISO 8859 -family of character sets, an encoding of 8bit per character is used. For -the Unicode character set, different character encodings may be used, -UTF-8 being the most popular. +A character set is basically a mapping between bytes and +glyphs and implies a certain character encoding scheme. For example, for +the ISO 8859 family of character sets, an encoding of 8bit per character +is used. For the Unicode character set, different character encodings +may be used, UTF-8 being the most popular. @@ -4601,19 +4596,30 @@ setup itself. -Warning: A mismatch between what these functions think the locale is and -what mutt was told what the locale is may make it behave badly with -non-ascii input. This warning is to be taken seriously since not only -local mail handling may suffer: sent messages may carry wrong character -set information the receiver has too deal with. The +If you happen to work with several character sets on a regular basis, +it's highly advisable to use Unicode and an UTF-8 locale. Unicode can +represent nearly all characters in a message at the same time, making +all conversions superfluous which eliminates the risk of conversion +errors. It also eliminates potentially wrong expectations about the +character set between Mutt and external programs. + + + +Warning: A mismatch between what system and library functions think the +locale is and what Mutt was told what the locale is may make it behave +badly with non-ascii input: it will fail at seemingly random +places. This warning is to be taken seriously since not only local mail +handling may suffer: sent messages may carry wrong character set +information the receiver has too deal with. The need to set $charset directly in most cases points at terminal and environment variable setup problems, not Mutt problems. A list of officially assigned and known character sets can be found at -IANA. +IANA, +a list of locally supported locales can be obtained by +running locale -a. -- 2.49.0