Blame extension/rwarray.c

Packit 575503
/*
Packit 575503
 * rwarray.c - Builtin functions to binary read / write arrays to a file.
Packit 575503
 *
Packit 575503
 * Arnold Robbins
Packit 575503
 * May 2009
Packit 575503
 * Redone June 2012
Packit 575503
 * Improved September 2017
Packit 575503
 */
Packit 575503
Packit 575503
/*
Packit 575503
 * Copyright (C) 2009-2014, 2017 the Free Software Foundation, Inc.
Packit 575503
 *
Packit 575503
 * This file is part of GAWK, the GNU implementation of the
Packit 575503
 * AWK Programming Language.
Packit 575503
 *
Packit 575503
 * GAWK is free software; you can redistribute it and/or modify
Packit 575503
 * it under the terms of the GNU General Public License as published by
Packit 575503
 * the Free Software Foundation; either version 3 of the License, or
Packit 575503
 * (at your option) any later version.
Packit 575503
 *
Packit 575503
 * GAWK is distributed in the hope that it will be useful,
Packit 575503
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit 575503
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
Packit 575503
 * GNU General Public License for more details.
Packit 575503
 *
Packit 575503
 * You should have received a copy of the GNU General Public License
Packit 575503
 * along with this program; if not, write to the Free Software
Packit 575503
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA
Packit 575503
 */
Packit 575503
Packit 575503
#ifdef HAVE_CONFIG_H
Packit 575503
#include <config.h>
Packit 575503
#endif
Packit 575503
Packit 575503
#include <stdio.h>
Packit 575503
#include <assert.h>
Packit 575503
#include <errno.h>
Packit 575503
#include <fcntl.h>
Packit 575503
#include <stdlib.h>
Packit 575503
#include <string.h>
Packit 575503
#include <unistd.h>
Packit 575503
Packit 575503
#ifdef __MINGW32__
Packit 575503
#include <winsock2.h>
Packit 575503
#include <stdint.h>
Packit 575503
#else
Packit 575503
#include <arpa/inet.h>
Packit 575503
#endif
Packit 575503
#include <sys/types.h>
Packit 575503
#include <sys/stat.h>
Packit 575503
Packit 575503
#include "gawkapi.h"
Packit 575503
Packit 575503
#include "gettext.h"
Packit 575503
#define _(msgid)  gettext(msgid)
Packit 575503
#define N_(msgid) msgid
Packit 575503
Packit 575503
/*
 * File signature and format version.  do_writea() emits MAGIC followed by
 * MAJOR and MINOR at the start of every dump; do_reada() refuses any file
 * whose magic string, major version or minor version differs.
 */
#define MAGIC "awkrulz\n"
Packit 575503
#define MAJOR 3
Packit 575503
#define MINOR 1
Packit 575503
Packit 575503
static const gawk_api_t *api;	/* for convenience macros to work */
Packit 575503
/* identifier handed to API calls such as warning() in this file */
static awk_ext_id_t ext_id;
Packit 575503
/* NOTE(review): presumably consumed by the dl_load_func boilerplate -- confirm in gawkapi.h */
static const char *ext_version = "rwarray extension: version 1.2";
Packit 575503
/* no extension-specific initialization routine is supplied */
static awk_bool_t (*init_func)(void) = NULL;
Packit 575503
Packit 575503
/* NOTE(review): presumably the symbol gawk looks for before loading a plugin -- confirm */
int plugin_is_GPL_compatible;
Packit 575503
Packit 575503
/*
 * Forward declarations.  The writers call each other recursively
 * (write_array -> write_elem -> write_value -> write_array for nested
 * arrays), and the readers mirror that structure.
 */
static awk_bool_t write_array(FILE *fp, awk_array_t array);
Packit 575503
static awk_bool_t write_elem(FILE *fp, awk_element_t *element);
Packit 575503
static awk_bool_t write_value(FILE *fp, awk_value_t *val);
Packit 575503
Packit 575503
static awk_bool_t read_array(FILE *fp, awk_array_t array);
Packit 575503
static awk_bool_t read_elem(FILE *fp, awk_element_t *element);
Packit 575503
static awk_bool_t read_value(FILE *fp, awk_value_t *value);
Packit 575503
Packit 575503
/*
Packit 575503
 * Format of array info:
Packit 575503
 *
Packit 575503
 * MAGIC		8 bytes
Packit 575503
 * Major version	4 bytes - network order
Packit 575503
 * Minor version	4 bytes - network order
Packit 575503
 * Element count	4 bytes - network order
Packit 575503
 * Elements
Packit 575503
 *
Packit 575503
 * For each element:
Packit 575503
 * Length of index val:	4 bytes - network order
Packit 575503
 * Index val as characters (N bytes)
Packit 575503
 * Value type		4 bytes (0 = string, 1 = number, 2 = array, 3 = regex, 4 = strnum, 5 = undefined)
Packit 575503
 * IF string, regex, strnum or undefined:
Packit 575503
 * 	Length of value	4 bytes
Packit 575503
 * 	Value as characters (N bytes)
Packit 575503
 * ELSE IF number:
Packit 575503
 * 	8 bytes as native double
Packit 575503
 * ELSE
Packit 575503
 * 	Element count
Packit 575503
 * 	Elements
Packit 575503
 * END IF
Packit 575503
 */
Packit 575503
Packit 575503
/* do_writea --- write an array */
Packit 575503
Packit 575503
static awk_value_t *
Packit 575503
do_writea(int nargs, awk_value_t *result, struct awk_ext_func *unused)
Packit 575503
{
Packit 575503
	awk_value_t filename, array;
Packit 575503
	FILE *fp = NULL;
Packit 575503
	uint32_t major = MAJOR;
Packit 575503
	uint32_t minor = MINOR;
Packit 575503
Packit 575503
	assert(result != NULL);
Packit 575503
	make_number(0.0, result);
Packit 575503
Packit 575503
	if (nargs < 2)
Packit 575503
		goto out;
Packit 575503
Packit 575503
	/* filename is first arg, array to dump is second */
Packit 575503
	if (! get_argument(0, AWK_STRING, & filename)) {
Packit 575503
		fprintf(stderr, _("do_writea: argument 0 is not a string\n"));
Packit 575503
		errno = EINVAL;
Packit 575503
		goto done1;
Packit 575503
	}
Packit 575503
Packit 575503
	if (! get_argument(1, AWK_ARRAY, & array)) {
Packit 575503
		fprintf(stderr, _("do_writea: argument 1 is not an array\n"));
Packit 575503
		errno = EINVAL;
Packit 575503
		goto done1;
Packit 575503
	}
Packit 575503
Packit 575503
	/* open the file, if error, set ERRNO and return */
Packit 575503
	fp = fopen(filename.str_value.str, "wb");
Packit 575503
	if (fp == NULL)
Packit 575503
		goto done1;
Packit 575503
Packit 575503
	if (fwrite(MAGIC, 1, strlen(MAGIC), fp) != strlen(MAGIC))
Packit 575503
		goto done1;
Packit 575503
Packit 575503
	major = htonl(major);
Packit 575503
	if (fwrite(& major, 1, sizeof(major), fp) != sizeof(major))
Packit 575503
		goto done1;
Packit 575503
Packit 575503
	minor = htonl(minor);
Packit 575503
	if (fwrite(& minor, 1, sizeof(minor), fp) != sizeof(minor))
Packit 575503
		goto done1;
Packit 575503
Packit 575503
	if (write_array(fp, array.array_cookie)) {
Packit 575503
		make_number(1.0, result);
Packit 575503
		goto done0;
Packit 575503
	}
Packit 575503
Packit 575503
done1:
Packit 575503
	update_ERRNO_int(errno);
Packit 575503
	unlink(filename.str_value.str);
Packit 575503
Packit 575503
done0:
Packit 575503
	fclose(fp);
Packit 575503
out:
Packit 575503
	return result;
Packit 575503
}
Packit 575503
Packit 575503
Packit 575503
/* write_array --- write out an array or a sub-array */
Packit 575503
Packit 575503
static awk_bool_t
Packit 575503
write_array(FILE *fp, awk_array_t array)
Packit 575503
{
Packit 575503
	uint32_t i;
Packit 575503
	uint32_t count;
Packit 575503
	awk_flat_array_t *flat_array;
Packit 575503
Packit 575503
	if (! flatten_array(array, & flat_array)) {
Packit 575503
		fprintf(stderr, _("write_array: could not flatten array\n"));
Packit 575503
		return awk_false;
Packit 575503
	}
Packit 575503
Packit 575503
	count = htonl(flat_array->count);
Packit 575503
	if (fwrite(& count, 1, sizeof(count), fp) != sizeof(count))
Packit 575503
		return awk_false;
Packit 575503
Packit 575503
	for (i = 0; i < flat_array->count; i++) {
Packit 575503
		if (! write_elem(fp, & flat_array->elements[i])) {
Packit 575503
			(void) release_flattened_array(array, flat_array);
Packit 575503
			return awk_false;
Packit 575503
		}
Packit 575503
	}
Packit 575503
Packit 575503
	if (! release_flattened_array(array, flat_array)) {
Packit 575503
		fprintf(stderr, _("write_array: could not release flattened array\n"));
Packit 575503
		return awk_false;
Packit 575503
	}
Packit 575503
Packit 575503
	return awk_true;
Packit 575503
}
Packit 575503
Packit 575503
/* write_elem --- write out a single element */
Packit 575503
Packit 575503
static awk_bool_t
Packit 575503
write_elem(FILE *fp, awk_element_t *element)
Packit 575503
{
Packit 575503
	uint32_t indexval_len;
Packit 575503
	ssize_t write_count;
Packit 575503
Packit 575503
	indexval_len = htonl(element->index.str_value.len);
Packit 575503
	if (fwrite(& indexval_len, 1, sizeof(indexval_len), fp) != sizeof(indexval_len))
Packit 575503
		return awk_false;
Packit 575503
Packit 575503
	if (element->index.str_value.len > 0) {
Packit 575503
		write_count = fwrite(element->index.str_value.str,
Packit 575503
				1, element->index.str_value.len, fp);
Packit 575503
		if (write_count != (ssize_t) element->index.str_value.len)
Packit 575503
			return awk_false;
Packit 575503
	}
Packit 575503
Packit 575503
	return write_value(fp, & element->value);
Packit 575503
}
Packit 575503
Packit 575503
/* write_value --- write a number or a string or a strnum or a regex or an array */
Packit 575503
Packit 575503
static awk_bool_t
Packit 575503
write_value(FILE *fp, awk_value_t *val)
Packit 575503
{
Packit 575503
	uint32_t code, len;
Packit 575503
Packit 575503
	if (val->val_type == AWK_ARRAY) {
Packit 575503
		code = htonl(2);
Packit 575503
		if (fwrite(& code, 1, sizeof(code), fp) != sizeof(code))
Packit 575503
			return awk_false;
Packit 575503
		return write_array(fp, val->array_cookie);
Packit 575503
	}
Packit 575503
Packit 575503
	if (val->val_type == AWK_NUMBER) {
Packit 575503
		code = htonl(1);
Packit 575503
		if (fwrite(& code, 1, sizeof(code), fp) != sizeof(code))
Packit 575503
			return awk_false;
Packit 575503
Packit 575503
		if (fwrite(& val->num_value, 1, sizeof(val->num_value), fp) != sizeof(val->num_value))
Packit 575503
			return awk_false;
Packit 575503
	} else {
Packit 575503
		switch (val->val_type) {
Packit 575503
		case AWK_STRING:
Packit 575503
			code = htonl(0);
Packit 575503
			break;
Packit 575503
		case AWK_STRNUM:
Packit 575503
			code = htonl(4);
Packit 575503
			break;
Packit 575503
		case AWK_REGEX:
Packit 575503
			code = htonl(3);
Packit 575503
			break;
Packit 575503
		case AWK_UNDEFINED:
Packit 575503
			code = htonl(5);
Packit 575503
			break;
Packit 575503
		default:
Packit 575503
			/* XXX can this happen? */
Packit 575503
			code = htonl(0);
Packit 575503
			warning(ext_id, _("array value has unknown type %d"), val->val_type);
Packit 575503
			break;
Packit 575503
		}
Packit 575503
		if (fwrite(& code, 1, sizeof(code), fp) != sizeof(code))
Packit 575503
			return awk_false;
Packit 575503
Packit 575503
		len = htonl(val->str_value.len);
Packit 575503
		if (fwrite(& len, 1, sizeof(len), fp) != sizeof(len))
Packit 575503
			return awk_false;
Packit 575503
Packit 575503
		if (fwrite(val->str_value.str, 1, val->str_value.len, fp)
Packit 575503
				!= (ssize_t) val->str_value.len)
Packit 575503
			return awk_false;
Packit 575503
	}
Packit 575503
Packit 575503
	return awk_true;
Packit 575503
}
Packit 575503
Packit 575503
/* do_reada --- read an array */
Packit 575503
Packit 575503
static awk_value_t *
Packit 575503
do_reada(int nargs, awk_value_t *result, struct awk_ext_func *unused)
Packit 575503
{
Packit 575503
	awk_value_t filename, array;
Packit 575503
	FILE *fp = NULL;
Packit 575503
	uint32_t major;
Packit 575503
	uint32_t minor;
Packit 575503
	char magic_buf[30];
Packit 575503
Packit 575503
	assert(result != NULL);
Packit 575503
	make_number(0.0, result);
Packit 575503
Packit 575503
	if (nargs < 2)
Packit 575503
		goto out;
Packit 575503
Packit 575503
	/* directory is first arg, array to read is second */
Packit 575503
	if (! get_argument(0, AWK_STRING, & filename)) {
Packit 575503
		fprintf(stderr, _("do_reada: argument 0 is not a string\n"));
Packit 575503
		errno = EINVAL;
Packit 575503
		goto done1;
Packit 575503
	}
Packit 575503
Packit 575503
	if (! get_argument(1, AWK_ARRAY, & array)) {
Packit 575503
		fprintf(stderr, _("do_reada: argument 1 is not an array\n"));
Packit 575503
		errno = EINVAL;
Packit 575503
		goto done1;
Packit 575503
	}
Packit 575503
Packit 575503
	fp = fopen(filename.str_value.str, "rb");
Packit 575503
	if (fp == NULL)
Packit 575503
		goto done1;
Packit 575503
Packit 575503
	memset(magic_buf, '\0', sizeof(magic_buf));
Packit 575503
	if (fread(magic_buf, 1, strlen(MAGIC), fp) != strlen(MAGIC)) {
Packit 575503
		errno = EBADF;
Packit 575503
		goto done1;
Packit 575503
	}
Packit 575503
Packit 575503
	if (strcmp(magic_buf, MAGIC) != 0) {
Packit 575503
		errno = EBADF;
Packit 575503
		goto done1;
Packit 575503
	}
Packit 575503
Packit 575503
	if (fread(& major, 1, sizeof(major), fp) != sizeof(major)) {
Packit 575503
		errno = EBADF;
Packit 575503
		goto done1;
Packit 575503
	}
Packit 575503
	major = ntohl(major);
Packit 575503
Packit 575503
	if (major != MAJOR) {
Packit 575503
		errno = EBADF;
Packit 575503
		goto done1;
Packit 575503
	}
Packit 575503
Packit 575503
	if (fread(& minor, 1, sizeof(minor), fp) != sizeof(minor)) {
Packit 575503
		/* read() sets errno */
Packit 575503
		goto done1;
Packit 575503
	}
Packit 575503
Packit 575503
	minor = ntohl(minor);
Packit 575503
	if (minor != MINOR) {
Packit 575503
		errno = EBADF;
Packit 575503
		goto done1;
Packit 575503
	}
Packit 575503
Packit 575503
	if (! clear_array(array.array_cookie)) {
Packit 575503
		errno = ENOMEM;
Packit 575503
		fprintf(stderr, _("do_reada: clear_array failed\n"));
Packit 575503
		goto done1;
Packit 575503
	}
Packit 575503
Packit 575503
	if (read_array(fp, array.array_cookie)) {
Packit 575503
		make_number(1.0, result);
Packit 575503
		goto done0;
Packit 575503
	}
Packit 575503
Packit 575503
done1:
Packit 575503
	update_ERRNO_int(errno);
Packit 575503
done0:
Packit 575503
	if (fp != NULL)
Packit 575503
		fclose(fp);
Packit 575503
out:
Packit 575503
	return result;
Packit 575503
}
Packit 575503
Packit 575503
Packit 575503
/* read_array --- read in an array or sub-array */
Packit 575503
Packit 575503
static awk_bool_t
Packit 575503
read_array(FILE *fp, awk_array_t array)
Packit 575503
{
Packit 575503
	uint32_t i;
Packit 575503
	uint32_t count;
Packit 575503
	awk_element_t new_elem;
Packit 575503
Packit 575503
	if (fread(& count, 1, sizeof(count), fp) != sizeof(count))
Packit 575503
		return awk_false;
Packit 575503
Packit 575503
	count = ntohl(count);
Packit 575503
Packit 575503
	for (i = 0; i < count; i++) {
Packit 575503
		if (read_elem(fp, & new_elem)) {
Packit 575503
			/* add to array */
Packit 575503
			if (! set_array_element_by_elem(array, & new_elem)) {
Packit 575503
				fprintf(stderr, _("read_array: set_array_element failed\n"));
Packit 575503
				return awk_false;
Packit 575503
			}
Packit 575503
		} else
Packit 575503
			break;
Packit 575503
	}
Packit 575503
Packit 575503
	if (i != count)
Packit 575503
		return awk_false;
Packit 575503
Packit 575503
	return awk_true;
Packit 575503
}
Packit 575503
Packit 575503
/* read_elem --- read in a single element */
Packit 575503
Packit 575503
static awk_bool_t
Packit 575503
read_elem(FILE *fp, awk_element_t *element)
Packit 575503
{
Packit 575503
	uint32_t index_len;
Packit 575503
	static char *buffer;
Packit 575503
	static uint32_t buflen;
Packit 575503
	ssize_t ret;
Packit 575503
Packit 575503
	if ((ret = fread(& index_len, 1, sizeof(index_len), fp)) != sizeof(index_len)) {
Packit 575503
		return awk_false;
Packit 575503
	}
Packit 575503
	index_len = ntohl(index_len);
Packit 575503
Packit 575503
	memset(element, 0, sizeof(*element));
Packit 575503
Packit 575503
	if (index_len > 0) {
Packit 575503
		if (buffer == NULL) {
Packit 575503
			/* allocate buffer */
Packit 575503
			emalloc(buffer, char *, index_len, "read_elem");
Packit 575503
			buflen = index_len;
Packit 575503
		} else if (buflen < index_len) {
Packit 575503
			/* reallocate buffer */
Packit 575503
			char *cp = gawk_realloc(buffer, index_len);
Packit 575503
Packit 575503
			if (cp == NULL)
Packit 575503
				return awk_false;
Packit 575503
Packit 575503
			buffer = cp;
Packit 575503
			buflen = index_len;
Packit 575503
		}
Packit 575503
Packit 575503
		if (fread(buffer, 1, index_len, fp) != (ssize_t) index_len) {
Packit 575503
			return awk_false;
Packit 575503
		}
Packit 575503
		make_const_string(buffer, index_len, & element->index);
Packit 575503
	} else {
Packit 575503
		make_null_string(& element->index);
Packit 575503
	}
Packit 575503
Packit 575503
	if (! read_value(fp, & element->value))
Packit 575503
		return awk_false;
Packit 575503
Packit 575503
	return awk_true;
Packit 575503
}
Packit 575503
Packit 575503
/* read_value --- read a number or a string */
Packit 575503
Packit 575503
static awk_bool_t
Packit 575503
read_value(FILE *fp, awk_value_t *value)
Packit 575503
{
Packit 575503
	uint32_t code, len;
Packit 575503
Packit 575503
	if (fread(& code, 1, sizeof(code), fp) != sizeof(code))
Packit 575503
		return awk_false;
Packit 575503
Packit 575503
	code = ntohl(code);
Packit 575503
Packit 575503
	if (code == 2) {
Packit 575503
		awk_array_t array = create_array();
Packit 575503
Packit 575503
		if (! read_array(fp, array))
Packit 575503
			return awk_false;
Packit 575503
Packit 575503
		/* hook into value */
Packit 575503
		value->val_type = AWK_ARRAY;
Packit 575503
		value->array_cookie = array;
Packit 575503
	} else if (code == 1) {
Packit 575503
		double d;
Packit 575503
Packit 575503
		if (fread(& d, 1, sizeof(d), fp) != sizeof(d))
Packit 575503
			return awk_false;
Packit 575503
Packit 575503
		/* hook into value */
Packit 575503
		value->val_type = AWK_NUMBER;
Packit 575503
		value->num_value = d;
Packit 575503
	} else {
Packit 575503
		if (fread(& len, 1, sizeof(len), fp) != sizeof(len)) {
Packit 575503
			return awk_false;
Packit 575503
		}
Packit 575503
		len = ntohl(len);
Packit 575503
		switch (code) {
Packit 575503
		case 0:
Packit 575503
			value->val_type = AWK_STRING;
Packit 575503
			break;
Packit 575503
		case 3:
Packit 575503
			value->val_type = AWK_REGEX;
Packit 575503
			break;
Packit 575503
		case 4:
Packit 575503
			value->val_type = AWK_STRNUM;
Packit 575503
			break;
Packit 575503
		case 5:
Packit 575503
			value->val_type = AWK_UNDEFINED;
Packit 575503
			break;
Packit 575503
		default:
Packit 575503
			/* this cannot happen! */
Packit 575503
			warning(ext_id, _("treating recovered value with unknown type code %d as a string"), code);
Packit 575503
			value->val_type = AWK_STRING;
Packit 575503
			break;
Packit 575503
		}
Packit 575503
		value->str_value.len = len;
Packit 575503
		value->str_value.str = gawk_malloc(len + 1);
Packit 575503
Packit 575503
		if (fread(value->str_value.str, 1, len, fp) != (ssize_t) len) {
Packit 575503
			gawk_free(value->str_value.str);
Packit 575503
			return awk_false;
Packit 575503
		}
Packit 575503
		value->str_value.str[len] = '\0';
Packit 575503
	}
Packit 575503
Packit 575503
	return awk_true;
Packit 575503
}
Packit 575503
Packit 575503
/*
 * Functions this extension provides: the name used from awk code and the
 * C function implementing it.
 * NOTE(review): the remaining fields are presumably the maximum and
 * minimum argument counts (both 2), a flag and a data pointer -- confirm
 * against the awk_ext_func_t definition in gawkapi.h.
 */
static awk_ext_func_t func_table[] = {
Packit 575503
	{ "writea", do_writea, 2, 2, awk_false, NULL },
Packit 575503
	{ "reada", do_reada, 2, 2, awk_false, NULL },
Packit 575503
};
Packit 575503
Packit 575503
Packit 575503
/* define the dl_load function using the boilerplate macro */
Packit 575503
Packit 575503
dl_load_func(func_table, rwarray, "")