|
Packit |
575503 |
# Date: Sun, 16 Mar 2008 18:51:14 +0100
|
|
Packit |
575503 |
# From: Hermann Peifer <peifer@gmx.eu>
|
|
Packit |
575503 |
# Subject: [Fwd: Gawk FIELDWIDTHS and multibyte characters]
|
|
Packit |
575503 |
# To: bug-gawk@gnu.org
|
|
Packit |
575503 |
# Message-id: <47DD5E12.2010403@gmx.eu>
|
|
Packit |
575503 |
#
|
|
Packit |
575503 |
# See below. Regards, Hermann
|
|
Packit |
575503 |
#
|
|
Packit |
575503 |
# --- Original Message ---
|
|
Packit |
575503 |
#
|
|
Packit |
575503 |
# Newsgroups: comp.lang.awk
|
|
Packit |
575503 |
# From: Hermann Peifer <peifer@gmx.eu>
|
|
Packit |
575503 |
# Date: Sun, 16 Mar 2008 01:23:38 -0700 (PDT)
|
|
Packit |
575503 |
# Subject: Gawk FIELDWIDTHS and multibyte characters
|
|
Packit |
575503 |
#
|
|
Packit |
575503 |
# Hi,
|
|
Packit |
575503 |
#
|
|
Packit |
575503 |
# It looks to me that Gawk's FIELDWIDTHS extension is not aware of
|
|
Packit |
575503 |
# multibyte characters, see my example below.
|
|
Packit |
575503 |
#
|
|
Packit |
575503 |
# $ cat testdata
|
|
Packit |
575503 |
# CDRegion              Commune             Site
|
|
Packit |
575503 |
# SEVästsverige         Hallands län        Kungsbacka
|
|
Packit |
575503 |
# SESmåland med öarna   Västra Götalands länGöteborg
|
|
Packit |
575503 |
# SEKronoberg           Alvesta             Stenungsund
|
|
Packit |
575503 |
#
|
|
Packit |
575503 |
# $ file testdata
|
|
Packit |
575503 |
# testdata: UTF-8 Unicode text
|
|
Packit |
575503 |
#
|
|
Packit |
575503 |
# $ awk 'BEGIN{FIELDWIDTHS = "2 20 20 20"}{print $4}' testdata
|
|
Packit |
575503 |
# Site
|
|
Packit |
575503 |
# Kungsbacka
|
|
Packit |
575503 |
# länGöteborg
|
|
Packit |
575503 |
# Stenungsund
|
|
Packit |
575503 |
#
|
|
Packit |
575503 |
# Can someone confirm?
|
|
Packit |
575503 |
#
|
|
Packit |
575503 |
# Hermann
|
|
Packit |
575503 |
# Before any input is read, switch to fixed-width field splitting
# (gawk's FIELDWIDTHS extension) with four fields of widths 2, 20, 20 and 20.
BEGIN {
	FIELDWIDTHS = "2 20 20 20"
}
|
|
Packit |
575503 |
# For every input record, write out its fourth field.
{
	print $4
}
|