Blame nkf.1

Packit 5b6b86
.\" Automatically generated by Pod::Man 2.28 (Pod::Simple 3.28)
Packit 5b6b86
.\"
Packit 5b6b86
.\" Standard preamble:
Packit 5b6b86
.\" ========================================================================
Packit 5b6b86
.de Sp \" Vertical space (when we can't use .PP)
Packit 5b6b86
.if t .sp .5v
Packit 5b6b86
.if n .sp
Packit 5b6b86
..
Packit 5b6b86
.de Vb \" Begin verbatim text
Packit 5b6b86
.ft CW
Packit 5b6b86
.nf
Packit 5b6b86
.ne \\$1
Packit 5b6b86
..
Packit 5b6b86
.de Ve \" End verbatim text
Packit 5b6b86
.ft R
Packit 5b6b86
.fi
Packit 5b6b86
..
Packit 5b6b86
.\" Set up some character translations and predefined strings.  \*(-- will
Packit 5b6b86
.\" give an unbreakable dash, \*(PI will give pi, \*(L" will give a left
Packit 5b6b86
.\" double quote, and \*(R" will give a right double quote.  \*(C+ will
Packit 5b6b86
.\" give a nicer C++.  Capital omega is used to do unbreakable dashes and
Packit 5b6b86
.\" therefore won't be available.  \*(C` and \*(C' expand to `' in nroff,
Packit 5b6b86
.\" nothing in troff, for use with C<>.
Packit 5b6b86
.tr \(*W-
Packit 5b6b86
.ds C+ C\v'-.1v'\h'-1p'\s-2+\h'-1p'+\s0\v'.1v'\h'-1p'
Packit 5b6b86
.ie n \{\
Packit 5b6b86
.    ds -- \(*W-
Packit 5b6b86
.    ds PI pi
Packit 5b6b86
.    if (\n(.H=4u)&(1m=24u) .ds -- \(*W\h'-12u'\(*W\h'-12u'-\" diablo 10 pitch
Packit 5b6b86
.    if (\n(.H=4u)&(1m=20u) .ds -- \(*W\h'-12u'\(*W\h'-8u'-\"  diablo 12 pitch
Packit 5b6b86
.    ds L" ""
Packit 5b6b86
.    ds R" ""
Packit 5b6b86
.    ds C` ""
Packit 5b6b86
.    ds C' ""
Packit 5b6b86
'br\}
Packit 5b6b86
.el\{\
Packit 5b6b86
.    ds -- \|\(em\|
Packit 5b6b86
.    ds PI \(*p
Packit 5b6b86
.    ds L" ``
Packit 5b6b86
.    ds R" ''
Packit 5b6b86
.    ds C`
Packit 5b6b86
.    ds C'
Packit 5b6b86
'br\}
Packit 5b6b86
.\"
Packit 5b6b86
.\" Escape single quotes in literal strings from groff's Unicode transform.
Packit 5b6b86
.ie \n(.g .ds Aq \(aq
Packit 5b6b86
.el       .ds Aq '
Packit 5b6b86
.\"
Packit 5b6b86
.\" If the F register is turned on, we'll generate index entries on stderr for
Packit 5b6b86
.\" titles (.TH), headers (.SH), subsections (.SS), items (.Ip), and index
Packit 5b6b86
.\" entries marked with X<> in POD.  Of course, you'll have to process the
Packit 5b6b86
.\" output yourself in some meaningful fashion.
Packit 5b6b86
.\"
Packit 5b6b86
.\" Avoid warning from groff about undefined register 'F'.
Packit 5b6b86
.de IX
Packit 5b6b86
..
Packit 5b6b86
.nr rF 0
Packit 5b6b86
.if \n(.g .if rF .nr rF 1
Packit 5b6b86
.if (\n(rF:(\n(.g==0)) \{
Packit 5b6b86
.    if \nF \{
Packit 5b6b86
.        de IX
Packit 5b6b86
.        tm Index:\\$1\t\\n%\t"\\$2"
Packit 5b6b86
..
Packit 5b6b86
.        if !\nF==2 \{
Packit 5b6b86
.            nr % 0
Packit 5b6b86
.            nr F 2
Packit 5b6b86
.        \}
Packit 5b6b86
.    \}
Packit 5b6b86
.\}
Packit 5b6b86
.rr rF
Packit 5b6b86
.\"
Packit 5b6b86
.\" Accent mark definitions (@(#)ms.acc 1.5 88/02/08 SMI; from UCB 4.2).
Packit 5b6b86
.\" Fear.  Run.  Save yourself.  No user-serviceable parts.
Packit 5b6b86
.    \" fudge factors for nroff and troff
Packit 5b6b86
.if n \{\
Packit 5b6b86
.    ds #H 0
Packit 5b6b86
.    ds #V .8m
Packit 5b6b86
.    ds #F .3m
Packit 5b6b86
.    ds #[ \f1
Packit 5b6b86
.    ds #] \fP
Packit 5b6b86
.\}
Packit 5b6b86
.if t \{\
Packit 5b6b86
.    ds #H ((1u-(\\\\n(.fu%2u))*.13m)
Packit 5b6b86
.    ds #V .6m
Packit 5b6b86
.    ds #F 0
Packit 5b6b86
.    ds #[ \&
Packit 5b6b86
.    ds #] \&
Packit 5b6b86
.\}
Packit 5b6b86
.    \" simple accents for nroff and troff
Packit 5b6b86
.if n \{\
Packit 5b6b86
.    ds ' \&
Packit 5b6b86
.    ds ` \&
Packit 5b6b86
.    ds ^ \&
Packit 5b6b86
.    ds , \&
Packit 5b6b86
.    ds ~ ~
Packit 5b6b86
.    ds /
Packit 5b6b86
.\}
Packit 5b6b86
.if t \{\
Packit 5b6b86
.    ds ' \\k:\h'-(\\n(.wu*8/10-\*(#H)'\'\h"|\\n:u"
Packit 5b6b86
.    ds ` \\k:\h'-(\\n(.wu*8/10-\*(#H)'\`\h'|\\n:u'
Packit 5b6b86
.    ds ^ \\k:\h'-(\\n(.wu*10/11-\*(#H)'^\h'|\\n:u'
Packit 5b6b86
.    ds , \\k:\h'-(\\n(.wu*8/10)',\h'|\\n:u'
Packit 5b6b86
.    ds ~ \\k:\h'-(\\n(.wu-\*(#H-.1m)'~\h'|\\n:u'
Packit 5b6b86
.    ds / \\k:\h'-(\\n(.wu*8/10-\*(#H)'\z\(sl\h'|\\n:u'
Packit 5b6b86
.\}
Packit 5b6b86
.    \" troff and (daisy-wheel) nroff accents
Packit 5b6b86
.ds : \\k:\h'-(\\n(.wu*8/10-\*(#H+.1m+\*(#F)'\v'-\*(#V'\z.\h'.2m+\*(#F'.\h'|\\n:u'\v'\*(#V'
Packit 5b6b86
.ds 8 \h'\*(#H'\(*b\h'-\*(#H'
Packit 5b6b86
.ds o \\k:\h'-(\\n(.wu+\w'\(de'u-\*(#H)/2u'\v'-.3n'\*(#[\z\(de\v'.3n'\h'|\\n:u'\*(#]
Packit 5b6b86
.ds d- \h'\*(#H'\(pd\h'-\w'~'u'\v'-.25m'\f2\(hy\fP\v'.25m'\h'-\*(#H'
Packit 5b6b86
.ds D- D\\k:\h'-\w'D'u'\v'-.11m'\z\(hy\v'.11m'\h'|\\n:u'
Packit 5b6b86
.ds th \*(#[\v'.3m'\s+1I\s-1\v'-.3m'\h'-(\w'I'u*2/3)'\s-1o\s+1\*(#]
Packit 5b6b86
.ds Th \*(#[\s+2I\s-2\h'-\w'I'u*3/5'\v'-.3m'o\v'.3m'\*(#]
Packit 5b6b86
.ds ae a\h'-(\w'a'u*4/10)'e
Packit 5b6b86
.ds Ae A\h'-(\w'A'u*4/10)'E
Packit 5b6b86
.    \" corrections for vroff
Packit 5b6b86
.if v .ds ~ \\k:\h'-(\\n(.wu*9/10-\*(#H)'\s-2\u~\d\s+2\h'|\\n:u'
Packit 5b6b86
.if v .ds ^ \\k:\h'-(\\n(.wu*10/11-\*(#H)'\v'-.4m'^\v'.4m'\h'|\\n:u'
Packit 5b6b86
.    \" for low resolution devices (crt and lpr)
Packit 5b6b86
.if \n(.H>23 .if \n(.V>19 \
Packit 5b6b86
\{\
Packit 5b6b86
.    ds : e
Packit 5b6b86
.    ds 8 ss
Packit 5b6b86
.    ds o a
Packit 5b6b86
.    ds d- d\h'-1'\(ga
Packit 5b6b86
.    ds D- D\h'-1'\(hy
Packit 5b6b86
.    ds th \o'bp'
Packit 5b6b86
.    ds Th \o'LP'
Packit 5b6b86
.    ds ae ae
Packit 5b6b86
.    ds Ae AE
Packit 5b6b86
.\}
Packit 5b6b86
.rm #[ #] #H #V #F C
Packit 5b6b86
.\" ========================================================================
Packit 5b6b86
.\"
Packit 5b6b86
.IX Title "nkf 1"
Packit 5b6b86
.TH nkf 1 "2015-12-12" "nkf 2.1.4" " "
Packit 5b6b86
.\" For nroff, turn off justification.  Always turn off hyphenation; it makes
Packit 5b6b86
.\" way too many mistakes in technical documents.
Packit 5b6b86
.if n .ad l
Packit 5b6b86
.nh
Packit 5b6b86
.SH "NAME"
Packit 5b6b86
nkf \- Network Kanji Filter
Packit 5b6b86
.SH "SYNOPSIS"
Packit 5b6b86
.IX Header "SYNOPSIS"
Packit 5b6b86
nkf \fB[\-butjnesliohrTVvwWJESZxXFfmMBOcdILg]\fR \fB[\fR\fIfile ...\fR\fB]\fR
Packit 5b6b86
.SH "DESCRIPTION"
Packit 5b6b86
.IX Header "DESCRIPTION"
Packit 5b6b86
\&\fBNkf\fR is yet another kanji code converter among networks, hosts and terminals.
Packit 5b6b86
It converts input kanji code to designated kanji code
Packit 5b6b86
such as \s-1ISO\-2022\-JP,\s0 Shift_JIS, EUC-JP, \s-1UTF\-8, UTF\-16\s0 or \s-1UTF\-32.\s0
Packit 5b6b86
.PP
Packit 5b6b86
One of the most distinctive features of \fBnkf\fR is its guessing of the input kanji encoding.
Packit 5b6b86
It currently recognizes \s-1ISO\-2022\-JP,\s0 Shift_JIS, EUC-JP, \s-1UTF\-8, UTF\-16\s0 and \s-1UTF\-32.\s0
Packit 5b6b86
So users needn't set the input kanji code explicitly.
Packit 5b6b86
.PP
Packit 5b6b86
By default, X0201 kana is converted into X0208 kana.
Packit 5b6b86
For X0201 kana, \s-1SO/SI, SSO\s0 and \s-1ESC\-\s0(\-I methods are supported.
Packit 5b6b86
For automatic code detection, nkf assumes no X0201 kana in Shift_JIS.
Packit 5b6b86
To accept X0201 in Shift_JIS, use \fB\-X\fR, \fB\-x\fR or \fB\-S\fR.
Packit 5b6b86
.PP
Packit 5b6b86
Multiple options are specified as separate strings, such as
Packit 5b6b86
.PP
Packit 5b6b86
.Vb 1
Packit 5b6b86
\&  print nkf(\*(Aq\-\-ic=UTF8\-MAC\*(Aq, \*(Aq\-w\*(Aq, $string), "\en";
Packit 5b6b86
.Ve
Packit 5b6b86
.PP
Packit 5b6b86
except for the last argument.
Packit 5b6b86
.SH "OPTIONS"
Packit 5b6b86
.IX Header "OPTIONS"
Packit 5b6b86
.IP "\fB\-J \-S \-E \-W \-W16 \-W32 \-j \-s \-e \-w \-w16 \-w32\fR" 4
Packit 5b6b86
.IX Item "-J -S -E -W -W16 -W32 -j -s -e -w -w16 -w32"
Packit 5b6b86
Specify input and output encodings. Upper case is input.
Packit 5b6b86
cf. \-\-ic and \-\-oc.
Packit 5b6b86
.RS 4
Packit 5b6b86
.IP "\fB\-J\fR" 4
Packit 5b6b86
.IX Item "-J"
Packit 5b6b86
\&\s-1ISO\-2022\-JP \s0(\s-1JIS\s0 code).
Packit 5b6b86
.IP "\fB\-S\fR" 4
Packit 5b6b86
.IX Item "-S"
Packit 5b6b86
Shift_JIS and \s-1JIS X 0201\s0 kana.
Packit 5b6b86
EUC-JP is recognized as X0201 kana. Without \fB\-x\fR flag,
Packit 5b6b86
\&\s-1JIS X 0201\s0 Katakana (a.k.a. halfwidth kana) is converted into \s-1JIS X 0208.\s0
Packit 5b6b86
If you use Windows, see Windows\-31J (\s-1CP932\s0).
Packit 5b6b86
.IP "\fB\-E\fR" 4
Packit 5b6b86
.IX Item "-E"
Packit 5b6b86
EUC-JP.
Packit 5b6b86
.IP "\fB\-W\fR" 4
Packit 5b6b86
.IX Item "-W"
Packit 5b6b86
\&\s-1UTF\-8N.\s0
Packit 5b6b86
.IP "\fB\-W16[\s-1BL\s0][0]\fR" 4
Packit 5b6b86
.IX Item "-W16[BL][0]"
Packit 5b6b86
\&\s-1UTF\-16.
Packit 5b6b86
B\s0 or L gives whether Big Endian or Little Endian.
Packit 5b6b86
0 gives whether to put \s-1BOM\s0 or not.
Packit 5b6b86
.IP "\fB\-W32[\s-1BL\s0][0]\fR" 4
Packit 5b6b86
.IX Item "-W32[BL][0]"
Packit 5b6b86
\&\s-1UTF\-32.
Packit 5b6b86
B\s0 or L gives whether Big Endian or Little Endian.
Packit 5b6b86
0 gives whether to put \s-1BOM\s0 or not.
Packit 5b6b86
.RE
Packit 5b6b86
.RS 4
Packit 5b6b86
.RE
Packit 5b6b86
.IP "\fB\-b \-u\fR" 4
Packit 5b6b86
.IX Item "-b -u"
Packit 5b6b86
Output is buffered (\s-1DEFAULT\s0), Output is unbuffered.
Packit 5b6b86
.IP "\fB\-t\fR" 4
Packit 5b6b86
.IX Item "-t"
Packit 5b6b86
No conversion.
Packit 5b6b86
.IP "\fB\-i[@B]\fR" 4
Packit 5b6b86
.IX Item "-i[@B]"
Packit 5b6b86
Specify the escape sequence for \s-1JIS X 0208.\s0
Packit 5b6b86
.RS 4
Packit 5b6b86
.IP "\fB\-i@\fR" 4
Packit 5b6b86
.IX Item "-i@"
Packit 5b6b86
Use \s-1ESC \s0( @. (\s-1JIS X 0208\-1978\s0)
Packit 5b6b86
.IP "\fB\-iB\fR" 4
Packit 5b6b86
.IX Item "-iB"
Packit 5b6b86
Use \s-1ESC \s0( B. (\s-1JIS X 0208\-1983/1990 DEFAULT\s0)
Packit 5b6b86
.RE
Packit 5b6b86
.RS 4
Packit 5b6b86
.RE
Packit 5b6b86
.IP "\fB\-o[\s-1BJ\s0]\fR" 4
Packit 5b6b86
.IX Item "-o[BJ]"
Packit 5b6b86
Specify the escape sequence for \s-1US\-ASCII/JIS X 0201\s0 Roman. (\s-1DEFAULT B\s0)
Packit 5b6b86
.IP "\fB\-r\fR" 4
Packit 5b6b86
.IX Item "-r"
Packit 5b6b86
{de/en}crypt \s-1ROT13/47\s0
Packit 5b6b86
.IP "\fB\-h[123] \-\-hiragana \-\-katakana \-\-katakana\-hiragana\fR" 4
Packit 5b6b86
.IX Item "-h[123] --hiragana --katakana --katakana-hiragana"
Packit 5b6b86
.RS 4
Packit 5b6b86
.PD 0
Packit 5b6b86
.IP "\fB\-h1 \-\-hiragana\fR" 4
Packit 5b6b86
.IX Item "-h1 --hiragana"
Packit 5b6b86
.PD
Packit 5b6b86
Katakana to Hiragana conversion.
Packit 5b6b86
.IP "\fB\-h2 \-\-katakana\fR" 4
Packit 5b6b86
.IX Item "-h2 --katakana"
Packit 5b6b86
Hiragana to Katakana conversion.
Packit 5b6b86
.IP "\fB\-h3 \-\-katakana\-hiragana\fR" 4
Packit 5b6b86
.IX Item "-h3 --katakana-hiragana"
Packit 5b6b86
Katakana to Hiragana and Hiragana to Katakana conversion.
Packit 5b6b86
.RE
Packit 5b6b86
.RS 4
Packit 5b6b86
.RE
Packit 5b6b86
.IP "\fB\-T\fR" 4
Packit 5b6b86
.IX Item "-T"
Packit 5b6b86
Text mode output (MS-DOS)
Packit 5b6b86
.IP "\fB\-f[\f(BIm\fB [\- \f(BIn\fB]]\fR" 4
Packit 5b6b86
.IX Item "-f[m [- n]]"
Packit 5b6b86
Folding on \fIm\fR length with \fIn\fR margin in a line.
Packit 5b6b86
Without this option, fold length is 60 and fold margin is 10.
Packit 5b6b86
.IP "\fB\-F\fR" 4
Packit 5b6b86
.IX Item "-F"
Packit 5b6b86
New line preserving line folding.
Packit 5b6b86
.IP "\fB\-Z[0\-3]\fR" 4
Packit 5b6b86
.IX Item "-Z[0-3]"
Packit 5b6b86
Convert X0208 alphabet (Fullwidth Alphabets) to \s-1ASCII.\s0
Packit 5b6b86
.RS 4
Packit 5b6b86
.IP "\fB\-Z \-Z0\fR" 4
Packit 5b6b86
.IX Item "-Z -Z0"
Packit 5b6b86
Convert X0208 alphabet to \s-1ASCII.\s0
Packit 5b6b86
.IP "\fB\-Z1\fR" 4
Packit 5b6b86
.IX Item "-Z1"
Packit 5b6b86
Convert X0208 kankaku to single \s-1ASCII\s0 space.
Packit 5b6b86
.IP "\fB\-Z2\fR" 4
Packit 5b6b86
.IX Item "-Z2"
Packit 5b6b86
Convert X0208 kankaku to double \s-1ASCII\s0 spaces.
Packit 5b6b86
.IP "\fB\-Z3\fR" 4
Packit 5b6b86
.IX Item "-Z3"
Packit 5b6b86
Replacing fullwidth >, <, ", & into '&gt;', '&lt;', '&quot;', '&amp;' as in \s-1HTML.\s0
Packit 5b6b86
.RE
Packit 5b6b86
.RS 4
Packit 5b6b86
.RE
Packit 5b6b86
.IP "\fB\-X \-x\fR" 4
Packit 5b6b86
.IX Item "-X -x"
Packit 5b6b86
With \fB\-X\fR or without this option, X0201 is converted into X0208 Kana.
Packit 5b6b86
With \fB\-x\fR, try to preserve X0201 kana and do not convert X0201 kana to X0208.
Packit 5b6b86
In \s-1JIS\s0 output, \s-1ESC\-\s0(\-I is used. In \s-1EUC\s0 output, \s-1SS2\s0 is used.
Packit 5b6b86
.IP "\fB\-B[0\-2]\fR" 4
Packit 5b6b86
.IX Item "-B[0-2]"
Packit 5b6b86
Assume broken JIS-Kanji input, which lost \s-1ESC.\s0
Packit 5b6b86
Useful when your site is using old B\-News Nihongo patch.
Packit 5b6b86
.RS 4
Packit 5b6b86
.IP "\fB\-B1\fR" 4
Packit 5b6b86
.IX Item "-B1"
Packit 5b6b86
allows any chars after \s-1ESC\-\s0( or \s-1ESC\-$.\s0
Packit 5b6b86
.IP "\fB\-B2\fR" 4
Packit 5b6b86
.IX Item "-B2"
Packit 5b6b86
force \s-1ASCII\s0 after \s-1NL.\s0
Packit 5b6b86
.RE
Packit 5b6b86
.RS 4
Packit 5b6b86
.RE
Packit 5b6b86
.IP "\fB\-I\fR" 4
Packit 5b6b86
.IX Item "-I"
Packit 5b6b86
Replace non\-ISO\-2022\-JP characters with a geta character
Packit 5b6b86
(substitute character in Japanese).
Packit 5b6b86
.IP "\fB\-m[\s-1BQN0\s0]\fR" 4
Packit 5b6b86
.IX Item "-m[BQN0]"
Packit 5b6b86
\&\s-1MIME ISO\-2022\-JP/ISO8859\-1\s0 decode. (\s-1DEFAULT\s0)
Packit 5b6b86
To see \s-1ISO8859\-1 \s0(Latin\-1) \-l is necessary.
Packit 5b6b86
.RS 4
Packit 5b6b86
.IP "\fB\-mB\fR" 4
Packit 5b6b86
.IX Item "-mB"
Packit 5b6b86
Decode \s-1MIME\s0 base64 encoded stream. Remove header or other part before
Packit 5b6b86
conversion.
Packit 5b6b86
.IP "\fB\-mQ\fR" 4
Packit 5b6b86
.IX Item "-mQ"
Packit 5b6b86
Decode \s-1MIME\s0 quoted stream. '_' in quoted stream is converted to space.
Packit 5b6b86
.IP "\fB\-mN\fR" 4
Packit 5b6b86
.IX Item "-mN"
Packit 5b6b86
Non-strict decoding.
Packit 5b6b86
It allows line break in the middle of the base64 encoding.
Packit 5b6b86
.IP "\fB\-m0\fR" 4
Packit 5b6b86
.IX Item "-m0"
Packit 5b6b86
No \s-1MIME\s0 decode.
Packit 5b6b86
.RE
Packit 5b6b86
.RS 4
Packit 5b6b86
.RE
Packit 5b6b86
.IP "\fB\-M\fR" 4
Packit 5b6b86
.IX Item "-M"
Packit 5b6b86
\&\s-1MIME\s0 encode. Header style. All \s-1ASCII\s0 code and control characters are left intact.
Packit 5b6b86
.RS 4
Packit 5b6b86
.IP "\fB\-MB\fR" 4
Packit 5b6b86
.IX Item "-MB"
Packit 5b6b86
\&\s-1MIME\s0 encode Base64 stream.
Packit 5b6b86
Kanji conversion is performed before encoding, so this cannot be used as a picture encoder.
Packit 5b6b86
.IP "\fB\-MQ\fR" 4
Packit 5b6b86
.IX Item "-MQ"
Packit 5b6b86
Perform quoted encoding.
Packit 5b6b86
.RE
Packit 5b6b86
.RS 4
Packit 5b6b86
.RE
Packit 5b6b86
.IP "\fB\-l\fR" 4
Packit 5b6b86
.IX Item "-l"
Packit 5b6b86
Input and output code is \s-1ISO8859\-1 \s0(Latin\-1) and \s-1ISO\-2022\-JP.
Packit 5b6b86
\&\s0\fB\-s\fR, \fB\-e\fR and \fB\-x\fR are not compatible with this option.
Packit 5b6b86
.IP "\fB\-L[uwm] \-d \-c\fR" 4
Packit 5b6b86
.IX Item "-L[uwm] -d -c"
Packit 5b6b86
Convert line breaks.
Packit 5b6b86
.RS 4
Packit 5b6b86
.IP "\fB\-Lu \-d\fR" 4
Packit 5b6b86
.IX Item "-Lu -d"
Packit 5b6b86
unix (\s-1LF\s0)
Packit 5b6b86
.IP "\fB\-Lw \-c\fR" 4
Packit 5b6b86
.IX Item "-Lw -c"
Packit 5b6b86
windows (\s-1CRLF\s0)
Packit 5b6b86
.IP "\fB\-Lm\fR" 4
Packit 5b6b86
.IX Item "-Lm"
Packit 5b6b86
mac (\s-1CR\s0)
Packit 5b6b86
.Sp
Packit 5b6b86
Without this option, nkf doesn't convert line breaks.
Packit 5b6b86
.RE
Packit 5b6b86
.RS 4
Packit 5b6b86
.RE
Packit 5b6b86
.IP "\fB\-\-fj \-\-unix \-\-mac \-\-msdos \-\-windows\fR" 4
Packit 5b6b86
.IX Item "--fj --unix --mac --msdos --windows"
Packit 5b6b86
Convert for these systems.
Packit 5b6b86
.IP "\fB\-\-jis \-\-euc \-\-sjis \-\-mime \-\-base64\fR" 4
Packit 5b6b86
.IX Item "--jis --euc --sjis --mime --base64"
Packit 5b6b86
Convert to named code.
Packit 5b6b86
.IP "\fB\-\-jis\-input \-\-euc\-input \-\-sjis\-input \-\-mime\-input \-\-base64\-input\fR" 4
Packit 5b6b86
.IX Item "--jis-input --euc-input --sjis-input --mime-input --base64-input"
Packit 5b6b86
Assume input system
Packit 5b6b86
.IP "\fB\-\-ic=\f(BIinput codeset\fB \-\-oc=\f(BIoutput codeset\fB\fR" 4
Packit 5b6b86
.IX Item "--ic=input codeset --oc=output codeset"
Packit 5b6b86
Set the input or output codeset.
Packit 5b6b86
\&\s-1NKF\s0 supports the following codesets; codeset names are case insensitive.
Packit 5b6b86
.RS 4
Packit 5b6b86
.IP "\s-1ISO\-2022\-JP\s0" 4
Packit 5b6b86
.IX Item "ISO-2022-JP"
Packit 5b6b86
a.k.a. \s-1RFC1468,\s0 7bit \s-1JIS, JUNET\s0
Packit 5b6b86
.IP "EUC-JP (eucJP-nkf)" 4
Packit 5b6b86
.IX Item "EUC-JP (eucJP-nkf)"
Packit 5b6b86
a.k.a. \s-1AT&T JIS,\s0 Japanese \s-1EUC, UJIS\s0
Packit 5b6b86
.IP "eucJP-ascii" 4
Packit 5b6b86
.IX Item "eucJP-ascii"
Packit 5b6b86
.PD 0
Packit 5b6b86
.IP "eucJP-ms" 4
Packit 5b6b86
.IX Item "eucJP-ms"
Packit 5b6b86
.IP "\s-1CP51932\s0" 4
Packit 5b6b86
.IX Item "CP51932"
Packit 5b6b86
.PD
Packit 5b6b86
Microsoft Version of EUC-JP.
Packit 5b6b86
.IP "Shift_JIS" 4
Packit 5b6b86
.IX Item "Shift_JIS"
Packit 5b6b86
a.k.a. \s-1SJIS,\s0 MS_Kanji
Packit 5b6b86
.IP "Windows\-31J" 4
Packit 5b6b86
.IX Item "Windows-31J"
Packit 5b6b86
a.k.a. \s-1CP932\s0
Packit 5b6b86
.IP "\s-1UTF\-8\s0" 4
Packit 5b6b86
.IX Item "UTF-8"
Packit 5b6b86
same as \s-1UTF\-8N\s0
Packit 5b6b86
.IP "\s-1UTF\-8N\s0" 4
Packit 5b6b86
.IX Item "UTF-8N"
Packit 5b6b86
\&\s-1UTF\-8\s0 without \s-1BOM\s0
Packit 5b6b86
.IP "\s-1UTF\-8\-BOM\s0" 4
Packit 5b6b86
.IX Item "UTF-8-BOM"
Packit 5b6b86
\&\s-1UTF\-8\s0 with \s-1BOM\s0
Packit 5b6b86
.IP "\s-1UTF8\-MAC \s0(input only)" 4
Packit 5b6b86
.IX Item "UTF8-MAC (input only)"
Packit 5b6b86
decomposed \s-1UTF\-8\s0
Packit 5b6b86
.IP "\s-1UTF\-16\s0" 4
Packit 5b6b86
.IX Item "UTF-16"
Packit 5b6b86
same as \s-1UTF\-16BE\s0
Packit 5b6b86
.IP "\s-1UTF\-16BE\s0" 4
Packit 5b6b86
.IX Item "UTF-16BE"
Packit 5b6b86
\&\s-1UTF\-16\s0 Big Endian without \s-1BOM\s0
Packit 5b6b86
.IP "\s-1UTF\-16BE\-BOM\s0" 4
Packit 5b6b86
.IX Item "UTF-16BE-BOM"
Packit 5b6b86
\&\s-1UTF\-16\s0 Big Endian with \s-1BOM\s0
Packit 5b6b86
.IP "\s-1UTF\-16LE\s0" 4
Packit 5b6b86
.IX Item "UTF-16LE"
Packit 5b6b86
\&\s-1UTF\-16\s0 Little Endian without \s-1BOM\s0
Packit 5b6b86
.IP "\s-1UTF\-16LE\-BOM\s0" 4
Packit 5b6b86
.IX Item "UTF-16LE-BOM"
Packit 5b6b86
\&\s-1UTF\-16\s0 Little Endian with \s-1BOM\s0
Packit 5b6b86
.IP "\s-1UTF\-32\s0" 4
Packit 5b6b86
.IX Item "UTF-32"
Packit 5b6b86
same as \s-1UTF\-32BE\s0
Packit 5b6b86
.IP "\s-1UTF\-32BE\s0" 4
Packit 5b6b86
.IX Item "UTF-32BE"
Packit 5b6b86
\&\s-1UTF\-32\s0 Big Endian without \s-1BOM\s0
Packit 5b6b86
.IP "\s-1UTF\-32BE\-BOM\s0" 4
Packit 5b6b86
.IX Item "UTF-32BE-BOM"
Packit 5b6b86
\&\s-1UTF\-32\s0 Big Endian with \s-1BOM\s0
Packit 5b6b86
.IP "\s-1UTF\-32LE\s0" 4
Packit 5b6b86
.IX Item "UTF-32LE"
Packit 5b6b86
\&\s-1UTF\-32\s0 Little Endian without \s-1BOM\s0
Packit 5b6b86
.IP "\s-1UTF\-32LE\-BOM\s0" 4
Packit 5b6b86
.IX Item "UTF-32LE-BOM"
Packit 5b6b86
\&\s-1UTF\-32\s0 Little Endian with \s-1BOM\s0
Packit 5b6b86
.RE
Packit 5b6b86
.RS 4
Packit 5b6b86
.RE
Packit 5b6b86
.IP "\fB\-\-fb\-{skip, html, xml, perl, java, subchar}\fR" 4
Packit 5b6b86
.IX Item "--fb-{skip, html, xml, perl, java, subchar}"
Packit 5b6b86
Specify the way that nkf handles unassigned characters.
Packit 5b6b86
Without this option, \-\-fb\-skip is assumed.
Packit 5b6b86
.IP "\fB\-\-prefix=\f(BIescape character\fB\f(BItarget character\fB..\fR" 4
Packit 5b6b86
.IX Item "--prefix=escape charactertarget character.."
Packit 5b6b86
When nkf converts to Shift_JIS,
Packit 5b6b86
nkf adds a specified escape character to specified 2nd byte of Shift_JIS characters.
Packit 5b6b86
1st byte of argument is the escape character and following bytes are target characters.
Packit 5b6b86
.IP "\fB\-\-no\-cp932ext\fR" 4
Packit 5b6b86
.IX Item "--no-cp932ext"
Packit 5b6b86
Handle the characters extended in \s-1CP932\s0 as unassigned characters.
Packit 5b6b86
.IP "\fB\-\-no\-best\-fit\-chars\fR" 4
Packit 5b6b86
.IX Item "--no-best-fit-chars"
Packit 5b6b86
When converting from Unicode to an encoded byte sequence,
Packit 5b6b86
don't convert characters which are not round trip safe.
Packit 5b6b86
When converting from Unicode to Unicode,
Packit 5b6b86
with this and the \-x option, nkf can be used as a \s-1UTF\s0 converter.
Packit 5b6b86
(In other words, without this and the \-x option, nkf doesn't preserve some characters.)
Packit 5b6b86
.Sp
Packit 5b6b86
When nkf converts strings that relate to paths, you should use this option.
Packit 5b6b86
.IP "\fB\-\-cap\-input\fR" 4
Packit 5b6b86
.IX Item "--cap-input"
Packit 5b6b86
Decode hex encoded characters.
Packit 5b6b86
.IP "\fB\-\-url\-input\fR" 4
Packit 5b6b86
.IX Item "--url-input"
Packit 5b6b86
Unescape percent escaped characters.
Packit 5b6b86
.IP "\fB\-\-numchar\-input\fR" 4
Packit 5b6b86
.IX Item "--numchar-input"
Packit 5b6b86
Decode character reference, such as \*(L"&#....;\*(R".
Packit 5b6b86
.IP "\fB\-\-in\-place[=\fR\fI\s-1SUFFIX\s0\fR\fB]\fR  \fB\-\-overwrite[=\fR\fI\s-1SUFFIX\s0\fR\fB]\fR" 4
Packit 5b6b86
.IX Item "--in-place[=SUFFIX] --overwrite[=SUFFIX]"
Packit 5b6b86
Overwrite the \fBoriginal\fR listed files with the filtered result.
Packit 5b6b86
.Sp
Packit 5b6b86
\&\fBNote\fR \-\-overwrite preserves timestamps of original files.
Packit 5b6b86
.IP "\fB\-\-guess=[12]\fR" 4
Packit 5b6b86
.IX Item "--guess=[12]"
Packit 5b6b86
Print guessed encoding and newline. (2 is default, 1 is only encoding)
Packit 5b6b86
.IP "\fB\-\-help\fR" 4
Packit 5b6b86
.IX Item "--help"
Packit 5b6b86
Print nkf's help.
Packit 5b6b86
.IP "\fB\-\-version\fR" 4
Packit 5b6b86
.IX Item "--version"
Packit 5b6b86
Print nkf's version.
Packit 5b6b86
.IP "\fB\-\-\fR" 4
Packit 5b6b86
.IX Item "--"
Packit 5b6b86
Ignore the rest of the \-options.
Packit 5b6b86
.SH "AUTHOR"
Packit 5b6b86
.IX Header "AUTHOR"
Packit 5b6b86
Copyright (c) 1987, Fujitsu \s-1LTD. \s0(Itaru \s-1ICHIKAWA\s0).
Packit 5b6b86
.PP
Packit 5b6b86
Copyright (c) 1996\-2015, The nkf Project.