Blame libarchive/test/test_zip_filename_encoding.c

Packit Service 1d0348
/*-
Packit Service 1d0348
 * Copyright (c) 2011 Michihiro NAKAJIMA
Packit Service 1d0348
 * All rights reserved.
Packit Service 1d0348
 *
Packit Service 1d0348
 * Redistribution and use in source and binary forms, with or without
Packit Service 1d0348
 * modification, are permitted provided that the following conditions
Packit Service 1d0348
 * are met:
Packit Service 1d0348
 * 1. Redistributions of source code must retain the above copyright
Packit Service 1d0348
 *    notice, this list of conditions and the following disclaimer.
Packit Service 1d0348
 * 2. Redistributions in binary form must reproduce the above copyright
Packit Service 1d0348
 *    notice, this list of conditions and the following disclaimer in the
Packit Service 1d0348
 *    documentation and/or other materials provided with the distribution.
Packit Service 1d0348
 *
Packit Service 1d0348
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR(S) ``AS IS'' AND ANY EXPRESS OR
Packit Service 1d0348
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
Packit Service 1d0348
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
Packit Service 1d0348
 * IN NO EVENT SHALL THE AUTHOR(S) BE LIABLE FOR ANY DIRECT, INDIRECT,
Packit Service 1d0348
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
Packit Service 1d0348
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
Packit Service 1d0348
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
Packit Service 1d0348
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
Packit Service 1d0348
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
Packit Service 1d0348
 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
Packit Service 1d0348
 */
Packit Service 1d0348
#include "test.h"
Packit Service 1d0348
__FBSDID("$FreeBSD$");
Packit Service 1d0348
Packit Service 1d0348
#include <locale.h>
Packit Service 1d0348
Packit Service 1d0348
DEFINE_TEST(test_zip_filename_encoding_UTF8)
Packit Service 1d0348
{
Packit Service 1d0348
  	struct archive *a;
Packit Service 1d0348
  	struct archive_entry *entry;
Packit Service 1d0348
	char buff[4096];
Packit Service 1d0348
	size_t used;
Packit Service 1d0348
Packit Service 1d0348
	if (NULL == setlocale(LC_ALL, "en_US.UTF-8")) {
Packit Service 1d0348
		skipping("en_US.UTF-8 locale not available on this system.");
Packit Service 1d0348
		return;
Packit Service 1d0348
	}
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that UTF-8 filenames are correctly stored with
Packit Service 1d0348
	 * hdrcharset=UTF-8 option.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	if (archive_write_set_options(a, "hdrcharset=UTF-8") != ARCHIVE_OK) {
Packit Service 1d0348
		skipping("This system cannot convert character-set"
Packit Service 1d0348
		    " for UTF-8.");
Packit Service 1d0348
		archive_write_free(a);
Packit Service 1d0348
		return;
Packit Service 1d0348
	}
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set a UTF-8 filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "\xD0\xBF\xD1\x80\xD0\xB8");
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0x08,
Packit Service 1d0348
	 * which indicates the filename charset is UTF-8. */
Packit Service 1d0348
	assertEqualInt(0x08, buff[7]);
Packit Service 1d0348
	assertEqualMem(buff + 30, "\xD0\xBF\xD1\x80\xD0\xB8", 6);
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that UTF-8 filenames are correctly stored without
Packit Service 1d0348
	 * hdrcharset=UTF-8 option.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set a UTF-8 filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "\xD0\xBF\xD1\x80\xD0\xB8");
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0x08,
Packit Service 1d0348
	 * which indicates the filename charset is UTF-8. */
Packit Service 1d0348
	assertEqualInt(0x08, buff[7]);
Packit Service 1d0348
	assertEqualMem(buff + 30, "\xD0\xBF\xD1\x80\xD0\xB8", 6);
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that A bit 11 of general purpose flag is not set
Packit Service 1d0348
	 * when ASCII filenames are stored.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set an ASCII filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "abcABC");
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0,
Packit Service 1d0348
	 * which indicates the filename charset is unknown. */
Packit Service 1d0348
	assertEqualInt(0, buff[7]);
Packit Service 1d0348
	assertEqualMem(buff + 30, "abcABC", 6);
Packit Service 1d0348
}
Packit Service 1d0348
Packit Service 1d0348
DEFINE_TEST(test_zip_filename_encoding_KOI8R)
Packit Service 1d0348
{
Packit Service 1d0348
  	struct archive *a;
Packit Service 1d0348
  	struct archive_entry *entry;
Packit Service 1d0348
	char buff[4096];
Packit Service 1d0348
	size_t used;
Packit Service 1d0348
Packit Service 1d0348
	if (NULL == setlocale(LC_ALL, "ru_RU.KOI8-R")) {
Packit Service 1d0348
		skipping("KOI8-R locale not available on this system.");
Packit Service 1d0348
		return;
Packit Service 1d0348
	}
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that KOI8-R filenames are correctly translated to UTF-8.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	if (archive_write_set_options(a, "hdrcharset=UTF-8") != ARCHIVE_OK) {
Packit Service 1d0348
		skipping("This system cannot convert character-set"
Packit Service 1d0348
		    " from KOI8-R to UTF-8.");
Packit Service 1d0348
		archive_write_free(a);
Packit Service 1d0348
		return;
Packit Service 1d0348
	}
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set a KOI8-R filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "\xD0\xD2\xC9");
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0x08,
Packit Service 1d0348
	 * which indicates the filename charset is UTF-8. */
Packit Service 1d0348
	assertEqualInt(0x08, buff[7]);
Packit Service 1d0348
	/* Above three characters in KOI8-R should translate to the following
Packit Service 1d0348
	 * three characters (two bytes each) in UTF-8. */
Packit Service 1d0348
	assertEqualMem(buff + 30, "\xD0\xBF\xD1\x80\xD0\xB8", 6);
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that KOI8-R filenames are not translated to UTF-8.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set a KOI8-R filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "\xD0\xD2\xC9");
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0,
Packit Service 1d0348
	 * which indicates the filename charset is unknown. */
Packit Service 1d0348
	assertEqualInt(0, buff[7]);
Packit Service 1d0348
	/* Above three characters in KOI8-R should not translate to
Packit Service 1d0348
	 * any character-set. */
Packit Service 1d0348
	assertEqualMem(buff + 30, "\xD0\xD2\xC9", 3);
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that A bit 11 of general purpose flag is not set
Packit Service 1d0348
	 * when ASCII filenames are stored even if hdrcharset=UTF-8
Packit Service 1d0348
	 * is specified.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	if (archive_write_set_options(a, "hdrcharset=UTF-8") != ARCHIVE_OK) {
Packit Service 1d0348
		skipping("This system cannot convert character-set"
Packit Service 1d0348
		    " from KOI8-R to UTF-8.");
Packit Service 1d0348
		archive_write_free(a);
Packit Service 1d0348
		return;
Packit Service 1d0348
	}
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set an ASCII filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "abcABC");
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0,
Packit Service 1d0348
	 * which indicates the filename charset is unknown. */
Packit Service 1d0348
	assertEqualInt(0, buff[7]);
Packit Service 1d0348
	assertEqualMem(buff + 30, "abcABC", 6);
Packit Service 1d0348
}
Packit Service 1d0348
Packit Service 1d0348
/*
Packit Service 1d0348
 * Do not translate CP1251 into CP866 if non Windows platform.
Packit Service 1d0348
 */
Packit Service 1d0348
DEFINE_TEST(test_zip_filename_encoding_ru_RU_CP1251)
Packit Service 1d0348
{
Packit Service 1d0348
  	struct archive *a;
Packit Service 1d0348
  	struct archive_entry *entry;
Packit Service 1d0348
	char buff[4096];
Packit Service 1d0348
	size_t used;
Packit Service 1d0348
Packit Service 1d0348
	if (NULL == setlocale(LC_ALL, "ru_RU.CP1251")) {
Packit Service 1d0348
		skipping("Russian_Russia locale not available on this system.");
Packit Service 1d0348
		return;
Packit Service 1d0348
	}
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that CP1251 filenames are not translated into any
Packit Service 1d0348
	 * other character-set, in particular, CP866.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set a CP1251 filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "\xEF\xF0\xE8");
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0,
Packit Service 1d0348
	 * which indicates the filename charset is unknown. */
Packit Service 1d0348
	assertEqualInt(0, buff[7]);
Packit Service 1d0348
	/* Above three characters in CP1251 should not translate into
Packit Service 1d0348
	 * any other character-set. */
Packit Service 1d0348
	assertEqualMem(buff + 30, "\xEF\xF0\xE8", 3);
Packit Service 1d0348
}
Packit Service 1d0348
Packit Service 1d0348
/*
Packit Service 1d0348
 * Other archiver applications on Windows translate CP1251 filenames
Packit Service 1d0348
 * into CP866 filenames and store it in the zip file.
Packit Service 1d0348
 * Test above behavior works well.
Packit Service 1d0348
 */
Packit Service 1d0348
DEFINE_TEST(test_zip_filename_encoding_Russian_Russia)
Packit Service 1d0348
{
Packit Service 1d0348
  	struct archive *a;
Packit Service 1d0348
  	struct archive_entry *entry;
Packit Service 1d0348
	char buff[4096];
Packit Service 1d0348
	size_t used;
Packit Service 1d0348
Packit Service 1d0348
	if (NULL == setlocale(LC_ALL, "Russian_Russia")) {
Packit Service 1d0348
		skipping("Russian_Russia locale not available on this system.");
Packit Service 1d0348
		return;
Packit Service 1d0348
	}
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that Russian_Russia(CP1251) filenames are correctly translated
Packit Service 1d0348
	 * to UTF-8.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	if (archive_write_set_options(a, "hdrcharset=UTF-8") != ARCHIVE_OK) {
Packit Service 1d0348
		skipping("This system cannot convert character-set"
Packit Service 1d0348
		    " from Russian_Russia.CP1251 to UTF-8.");
Packit Service 1d0348
		archive_write_free(a);
Packit Service 1d0348
		return;
Packit Service 1d0348
	}
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set a CP1251 filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "\xEF\xF0\xE8");
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0x08,
Packit Service 1d0348
	 * which indicates the filename charset is UTF-8. */
Packit Service 1d0348
	assertEqualInt(0x08, buff[7]);
Packit Service 1d0348
	/* Above three characters in CP1251 should translate to the following
Packit Service 1d0348
	 * three characters (two bytes each) in UTF-8. */
Packit Service 1d0348
	assertEqualMem(buff + 30, "\xD0\xBF\xD1\x80\xD0\xB8", 6);
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that Russian_Russia(CP1251) filenames are correctly translated
Packit Service 1d0348
	 * to CP866.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set a CP1251 filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "\xEF\xF0\xE8");
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0,
Packit Service 1d0348
	 * which indicates the filename charset is unknown. */
Packit Service 1d0348
	assertEqualInt(0, buff[7]);
Packit Service 1d0348
	/* Above three characters in CP1251 should translate to the following
Packit Service 1d0348
	 * three characters in CP866. */
Packit Service 1d0348
	assertEqualMem(buff + 30, "\xAF\xE0\xA8", 3);
Packit Service 1d0348
}
Packit Service 1d0348
Packit Service 1d0348
DEFINE_TEST(test_zip_filename_encoding_EUCJP)
Packit Service 1d0348
{
Packit Service 1d0348
  	struct archive *a;
Packit Service 1d0348
  	struct archive_entry *entry;
Packit Service 1d0348
	char buff[4096];
Packit Service 1d0348
	size_t used;
Packit Service 1d0348
Packit Service 1d0348
	if (NULL == setlocale(LC_ALL, "ja_JP.eucJP")) {
Packit Service 1d0348
		skipping("eucJP locale not available on this system.");
Packit Service 1d0348
		return;
Packit Service 1d0348
	}
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that EUC-JP filenames are correctly translated to UTF-8.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	if (archive_write_set_options(a, "hdrcharset=UTF-8") != ARCHIVE_OK) {
Packit Service 1d0348
		skipping("This system cannot convert character-set"
Packit Service 1d0348
		    " from eucJP to UTF-8.");
Packit Service 1d0348
		archive_write_free(a);
Packit Service 1d0348
		return;
Packit Service 1d0348
	}
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set an EUC-JP filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "\xC9\xBD.txt");
Packit Service 1d0348
	/* Check the Unicode version. */
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0x08,
Packit Service 1d0348
	 * which indicates the filename charset is UTF-8. */
Packit Service 1d0348
	assertEqualInt(0x08, buff[7]);
Packit Service 1d0348
	/* Check UTF-8 version. */
Packit Service 1d0348
	assertEqualMem(buff + 30, "\xE8\xA1\xA8.txt", 7);
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that EUC-JP filenames are not translated to UTF-8.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set an EUC-JP filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "\xC9\xBD.txt");
Packit Service 1d0348
	/* Check the Unicode version. */
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0,
Packit Service 1d0348
	 * which indicates the filename charset is unknown. */
Packit Service 1d0348
	assertEqualInt(0, buff[7]);
Packit Service 1d0348
	/* Above three characters in EUC-JP should not translate to
Packit Service 1d0348
	 * any character-set. */
Packit Service 1d0348
	assertEqualMem(buff + 30, "\xC9\xBD.txt", 6);
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that A bit 11 of general purpose flag is not set
Packit Service 1d0348
	 * when ASCII filenames are stored even if hdrcharset=UTF-8
Packit Service 1d0348
	 * is specified.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	if (archive_write_set_options(a, "hdrcharset=UTF-8") != ARCHIVE_OK) {
Packit Service 1d0348
		skipping("This system cannot convert character-set"
Packit Service 1d0348
		    " from eucJP to UTF-8.");
Packit Service 1d0348
		archive_write_free(a);
Packit Service 1d0348
		return;
Packit Service 1d0348
	}
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set an ASCII filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "abcABC");
Packit Service 1d0348
	/* Check the Unicode version. */
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0,
Packit Service 1d0348
	 * which indicates the filename charset is unknown. */
Packit Service 1d0348
	assertEqualInt(0, buff[7]);
Packit Service 1d0348
	assertEqualMem(buff + 30, "abcABC", 6);
Packit Service 1d0348
}
Packit Service 1d0348
Packit Service 1d0348
DEFINE_TEST(test_zip_filename_encoding_CP932)
Packit Service 1d0348
{
Packit Service 1d0348
  	struct archive *a;
Packit Service 1d0348
  	struct archive_entry *entry;
Packit Service 1d0348
	char buff[4096];
Packit Service 1d0348
	size_t used;
Packit Service 1d0348
Packit Service 1d0348
	if (NULL == setlocale(LC_ALL, "Japanese_Japan") &&
Packit Service 1d0348
	    NULL == setlocale(LC_ALL, "ja_JP.SJIS")) {
Packit Service 1d0348
		skipping("CP932/SJIS locale not available on this system.");
Packit Service 1d0348
		return;
Packit Service 1d0348
	}
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that EUC-JP filenames are correctly translated to UTF-8.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	if (archive_write_set_options(a, "hdrcharset=UTF-8") != ARCHIVE_OK) {
Packit Service 1d0348
		skipping("This system cannot convert character-set"
Packit Service 1d0348
		    " from CP932/SJIS to UTF-8.");
Packit Service 1d0348
		archive_write_free(a);
Packit Service 1d0348
		return;
Packit Service 1d0348
	}
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set a CP932/SJIS filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "\x95\x5C.txt");
Packit Service 1d0348
	/* Check the Unicode version. */
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0x08,
Packit Service 1d0348
	 * which indicates the filename charset is UTF-8. */
Packit Service 1d0348
	assertEqualInt(0x08, buff[7]);
Packit Service 1d0348
	/* Check UTF-8 version. */
Packit Service 1d0348
	assertEqualMem(buff + 30, "\xE8\xA1\xA8.txt", 7);
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that CP932/SJIS filenames are not translated to UTF-8.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set a CP932/SJIS filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "\x95\x5C.txt");
Packit Service 1d0348
	/* Check the Unicode version. */
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0,
Packit Service 1d0348
	 * which indicates the filename charset is unknown. */
Packit Service 1d0348
	assertEqualInt(0, buff[7]);
Packit Service 1d0348
	/* Above three characters in CP932/SJIS should not translate to
Packit Service 1d0348
	 * any character-set. */
Packit Service 1d0348
	assertEqualMem(buff + 30, "\x95\x5C.txt", 6);
Packit Service 1d0348
Packit Service 1d0348
	/*
Packit Service 1d0348
	 * Verify that A bit 11 of general purpose flag is not set
Packit Service 1d0348
	 * when ASCII filenames are stored even if hdrcharset=UTF-8
Packit Service 1d0348
	 * is specified.
Packit Service 1d0348
	 */
Packit Service 1d0348
	a = archive_write_new();
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_set_format_zip(a));
Packit Service 1d0348
	if (archive_write_set_options(a, "hdrcharset=UTF-8") != ARCHIVE_OK) {
Packit Service 1d0348
		skipping("This system cannot convert character-set"
Packit Service 1d0348
		    " from CP932/SJIS to UTF-8.");
Packit Service 1d0348
		archive_write_free(a);
Packit Service 1d0348
		return;
Packit Service 1d0348
	}
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK,
Packit Service 1d0348
	    archive_write_open_memory(a, buff, sizeof(buff), &used));
Packit Service 1d0348
Packit Service 1d0348
	entry = archive_entry_new2(a);
Packit Service 1d0348
	/* Set an ASCII filename. */
Packit Service 1d0348
	archive_entry_set_pathname(entry, "abcABC");
Packit Service 1d0348
	/* Check the Unicode version. */
Packit Service 1d0348
	archive_entry_set_filetype(entry, AE_IFREG);
Packit Service 1d0348
	archive_entry_set_size(entry, 0);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_header(a, entry));
Packit Service 1d0348
	archive_entry_free(entry);
Packit Service 1d0348
	assertEqualInt(ARCHIVE_OK, archive_write_free(a));
Packit Service 1d0348
Packit Service 1d0348
	/* A bit 11 of general purpose flag should be 0,
Packit Service 1d0348
	 * which indicates the filename charset is unknown. */
Packit Service 1d0348
	assertEqualInt(0, buff[7]);
Packit Service 1d0348
	assertEqualMem(buff + 30, "abcABC", 6);
Packit Service 1d0348
}