Blob Blame History Raw
/*
 * Copyright (c) 2008-2009 Voltaire, Inc. All rights reserved.
 * Copyright (c) 2007 The Regents of the University of California.
 * Copyright (c) 2009 HNR Consulting. All rights reserved.
 *
 * This software is available to you under a choice of one of two
 * licenses.  You may choose to be licensed under the terms of the GNU
 * General Public License (GPL) Version 2, available from the file
 * COPYING in the main directory of this source tree, or the
 * OpenIB.org BSD license below:
 *
 *     Redistribution and use in source and binary forms, with or
 *     without modification, are permitted provided that the following
 *     conditions are met:
 *
 *      - Redistributions of source code must retain the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer.
 *
 *      - Redistributions in binary form must reproduce the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer in the documentation and/or other materials
 *        provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 */

#if HAVE_CONFIG_H
#  include <config.h>
#endif				/* HAVE_CONFIG_H */

#ifdef ENABLE_OSM_PERF_MGR

#include <stdlib.h>
#include <errno.h>
#include <limits.h>
#include <dlfcn.h>
#include <sys/stat.h>

#include <opensm/osm_file_ids.h>
#define FILE_ID OSM_FILE_PERFMGR_DB_C
#include <opensm/osm_perfmgr_db.h>
#include <opensm/osm_perfmgr.h>
#include <opensm/osm_opensm.h>

static void free_node(db_node_t * node);

/** =========================================================================
 */
/*
 * Allocate a performance-manager database and bind it to its owning perfmgr.
 *
 * The counter map is initialized empty and the database lock is constructed
 * and initialized before the pointer is handed back.
 *
 * Returns the new database, or NULL when the allocation fails.
 */
perfmgr_db_t *perfmgr_db_construct(osm_perfmgr_t *perfmgr)
{
	perfmgr_db_t *new_db;

	new_db = malloc(sizeof(*new_db));
	if (new_db == NULL)
		return NULL;

	new_db->perfmgr = perfmgr;
	cl_qmap_init(&new_db->pc_data);
	cl_plock_construct(&new_db->lock);
	cl_plock_init(&new_db->lock);

	return new_db;
}

/** =========================================================================
 */
/*
 * Release a database and everything stored in it.
 *
 * Every node still held in the map is freed, then the lock is destroyed and
 * the database structure itself is released.  A NULL db is ignored.
 */
void perfmgr_db_destroy(perfmgr_db_t * db)
{
	cl_map_item_t *cur;

	if (db == NULL)
		return;

	cur = cl_qmap_head(&db->pc_data);
	while (cur != cl_qmap_end(&db->pc_data)) {
		/* Fetch the successor first: free_node() releases cur. */
		cl_map_item_t *following = cl_qmap_next(cur);

		free_node((db_node_t *)cur);
		cur = following;
	}

	cl_plock_destroy(&db->lock);
	free(db);
}

/**********************************************************************
 * Look up the node stored under "guid".
 *
 * Internal helper: db->lock should be held by the caller.
 * Returns NULL when the map has no entry for that GUID.
 **********************************************************************/
static inline db_node_t *get(perfmgr_db_t * db, uint64_t guid)
{
	cl_map_item_t *found = cl_qmap_get(&db->pc_data, guid);

	/* cl_qmap_get() hands back the map's end marker on a miss. */
	return (found != cl_qmap_end(&db->pc_data)) ? (db_node_t *) found : NULL;
}

/*
 * Validate a node/port pair before its counters are touched.
 *
 * Returns PERFMGR_EVENT_DB_GUIDNOTFOUND for a NULL node,
 * PERFMGR_EVENT_DB_PORTNOTFOUND when the port index is not below the node's
 * num_ports or is port 0 on a node whose esp0 flag is not set, and
 * PERFMGR_EVENT_DB_SUCCESS otherwise.
 */
static inline perfmgr_db_err_t bad_node_port(db_node_t * node, uint8_t port)
{
	if (node == NULL)
		return PERFMGR_EVENT_DB_GUIDNOTFOUND;

	/* port 0 only exists on nodes flagged esp0 */
	if (port == 0 && !node->esp0)
		return PERFMGR_EVENT_DB_PORTNOTFOUND;

	if (port >= node->num_ports)
		return PERFMGR_EVENT_DB_PORTNOTFOUND;

	return PERFMGR_EVENT_DB_SUCCESS;
}

/*
 * Set the "valid" flag of one port of a node.  No bounds check is done
 * here; the port index must already have been validated by the caller.
 */
static inline void mark_port_valid(db_node_t * node, uint8_t port)
{
	(node->ports + port)->valid = TRUE;
}

/** =========================================================================
 */
/*
 * Allocate and initialize a node record with room for "num_ports" ports.
 *
 * guid:      stored as the node's node_guid
 * esp0:      stored as the node's esp0 flag
 * num_ports: number of entries allocated in the ports array
 * name:      copied (truncated if necessary) into node_name
 *
 * Each port starts with valid == FALSE and with last_reset and the
 * "previous" reading timestamps set to the current time; the node itself
 * starts with active == FALSE.
 *
 * Returns the new node, or NULL if either allocation fails.
 */
static db_node_t *malloc_node(uint64_t guid, boolean_t esp0,
			      uint8_t num_ports, char *name)
{
	db_node_t *node;
	time_t now;
	int idx;

	node = malloc(sizeof(*node));
	if (node == NULL)
		return NULL;

	node->ports = calloc(num_ports, sizeof(db_port_t));
	if (node->ports == NULL) {
		free(node);
		return NULL;
	}

	node->node_guid = guid;
	node->esp0 = esp0;
	node->num_ports = num_ports;

	now = time(NULL);
	for (idx = 0; idx < num_ports; idx++) {
		db_port_t *p = &node->ports[idx];

		p->last_reset = now;
		p->err_previous.time = now;
		p->dc_previous.time = now;
		p->valid = FALSE;
	}

	snprintf(node->node_name, sizeof(node->node_name), "%s", name);
	node->active = FALSE;

	return node;
}

/** =========================================================================
 */
/*
 * Release a node record together with its ports array.
 * A NULL node is ignored.
 */
static void free_node(db_node_t * node)
{
	if (node != NULL) {
		free(node->ports);	/* free(NULL) is a no-op */
		free(node);
	}
}

/*
 * Add "node" to the database map, keyed by its node_guid.
 *
 * Returns PERFMGR_EVENT_DB_FAIL when cl_qmap_insert() hands back an item
 * other than the one passed in, PERFMGR_EVENT_DB_SUCCESS otherwise.
 */
static perfmgr_db_err_t insert(perfmgr_db_t * db, db_node_t * node)
{
	cl_map_item_t *stored;

	stored = cl_qmap_insert(&db->pc_data, node->node_guid,
				(cl_map_item_t *) node);

	if ((void *)stored == (void *)node)
		return PERFMGR_EVENT_DB_SUCCESS;

	return PERFMGR_EVENT_DB_FAIL;
}

/*
 * Create a database entry for "guid" unless one already exists.
 *
 * Runs with db->lock held exclusively.  An existing entry is left untouched
 * and reported as success.
 *
 * Returns PERFMGR_EVENT_DB_SUCCESS, PERFMGR_EVENT_DB_NOMEM when the node
 * cannot be allocated, or PERFMGR_EVENT_DB_FAIL when the map insert fails
 * (the freshly allocated node is freed in that case).
 */
perfmgr_db_err_t
perfmgr_db_create_entry(perfmgr_db_t * db, uint64_t guid, boolean_t esp0,
			uint8_t num_ports, char *name)
{
	perfmgr_db_err_t status = PERFMGR_EVENT_DB_SUCCESS;
	db_node_t *fresh;

	cl_plock_excl_acquire(&db->lock);

	if (get(db, guid) == NULL) {
		fresh = malloc_node(guid, esp0, num_ports, name);
		if (fresh == NULL) {
			status = PERFMGR_EVENT_DB_NOMEM;
		} else if (insert(db, fresh)) {
			free_node(fresh);
			status = PERFMGR_EVENT_DB_FAIL;
		}
	}

	cl_plock_release(&db->lock);
	return status;
}

/*
 * Replace the stored name of the node identified by "node_guid".
 *
 * The name is copied (truncated if necessary) under the exclusive db lock.
 * An unknown GUID is silently ignored; the function always returns
 * PERFMGR_EVENT_DB_SUCCESS.
 */
perfmgr_db_err_t
perfmgr_db_update_name(perfmgr_db_t * db, uint64_t node_guid, char *name)
{
	db_node_t *target;

	cl_plock_excl_acquire(&db->lock);
	target = get(db, node_guid);
	if (target != NULL) {
		snprintf(target->node_name, sizeof(target->node_name),
			 "%s", name);
	}
	cl_plock_release(&db->lock);

	return PERFMGR_EVENT_DB_SUCCESS;
}

/*
 * Remove the node stored under "guid" from the map and free it.
 *
 * This function does not acquire db->lock itself.
 *
 * Returns PERFMGR_EVENT_DB_GUIDNOTFOUND when the map has no such entry,
 * PERFMGR_EVENT_DB_SUCCESS otherwise.
 */
perfmgr_db_err_t
perfmgr_db_delete_entry(perfmgr_db_t * db, uint64_t guid)
{
	cl_map_item_t *removed = cl_qmap_remove(&db->pc_data, guid);

	if (removed != cl_qmap_end(&db->pc_data)) {
		free_node((db_node_t *)removed);
		return PERFMGR_EVENT_DB_SUCCESS;
	}

	return PERFMGR_EVENT_DB_GUIDNOTFOUND;
}

/*
 * Remove every node whose "active" flag is FALSE.
 *
 * The GUIDs of the inactive nodes are collected in a first pass and the
 * entries are deleted in a second pass, so the map is never modified while
 * it is being walked.
 *
 * cnt: optional; receives the number of entries selected for deletion, or 0
 *      when the GUID list could not be allocated.
 *
 * Returns PERFMGR_EVENT_DB_SUCCESS, or PERFMGR_EVENT_DB_NOMEM if the GUID
 * list could not be grown (nothing is deleted in that case).
 *
 * NOTE(review): this function does not acquire db->lock itself - confirm
 * that callers serialize access to the database.
 */
perfmgr_db_err_t
perfmgr_db_delete_inactive(perfmgr_db_t * db, unsigned *cnt)
{
	perfmgr_db_err_t rc = PERFMGR_EVENT_DB_SUCCESS;
	int i = 0;
	int num = 0;
	uint64_t * guid_list = NULL;
	cl_map_item_t * p_map_item = cl_qmap_head(&db->pc_data);

	/* An empty map simply skips the loop and falls through with num == 0. */
	while (p_map_item != cl_qmap_end(&db->pc_data)) {
		db_node_t *n = (db_node_t *)p_map_item;
		if (n->active == FALSE) {
			/*
			 * Grow through a temporary: assigning realloc()'s
			 * result straight to guid_list would leak the old
			 * buffer when the call fails.
			 */
			uint64_t *grown = realloc(guid_list,
					sizeof(*guid_list) * (num+1));
			if (!grown) {
				free(guid_list);
				guid_list = NULL;
				num = 0;
				rc = PERFMGR_EVENT_DB_NOMEM;
				goto Done;
			}
			guid_list = grown;
			guid_list[num] = n->node_guid;
			num++;
		}
		p_map_item = cl_qmap_next(p_map_item);
	}

	for (i = 0 ; i < num; i++)
		perfmgr_db_delete_entry(db, guid_list[i]);

	free(guid_list);

Done:
	if (cnt)
		*cnt = num;

	return(rc);
}

/*
 * Set the "active" flag of the node identified by "guid".
 *
 * The update happens under the exclusive db lock.  An unknown GUID is
 * silently ignored; the function always returns PERFMGR_EVENT_DB_SUCCESS.
 */
perfmgr_db_err_t
perfmgr_db_mark_active(perfmgr_db_t *db, uint64_t guid, boolean_t active)
{
	db_node_t *target;

	cl_plock_excl_acquire(&db->lock);
	target = get(db, guid);
	if (target != NULL) {
		target->active = active;
	}
	cl_plock_release(&db->lock);

	return PERFMGR_EVENT_DB_SUCCESS;
}


/**********************************************************************
 * Log a new error-counter reading next to the previous reading and the
 * running total of one port, one line per counter, at OSM_LOG_DEBUG
 * level.  Nothing is emitted when that level is not active on the log.
 **********************************************************************/
static inline void
debug_dump_err_reading(perfmgr_db_t * db, uint64_t guid, uint8_t port_num,
		       db_port_t * port, perfmgr_db_err_reading_t * cur)
{
	osm_log_t *log = db->perfmgr->log;

/* Emit one "<tag> current <-- previous (total)" line for a counter. */
#define LOG_ERR_COUNTER(tag, field)					\
	osm_log_v2(log, OSM_LOG_DEBUG, FILE_ID,				\
		   tag " %" PRIu64 " <-- %" PRIu64 " (%" PRIu64 ")\n",	\
		   cur->field, port->err_previous.field,		\
		   port->err_total.field)

	/* Skip all of the formatting work unless debug logging is on. */
	if (!OSM_LOG_IS_ACTIVE_V2(log, OSM_LOG_DEBUG))
		return;

	osm_log_v2(log, OSM_LOG_DEBUG, FILE_ID,
		   "GUID 0x%" PRIx64 " Port %u:\n", guid, port_num);

	LOG_ERR_COUNTER("sym", symbol_err_cnt);
	LOG_ERR_COUNTER("ler", link_err_recover);
	LOG_ERR_COUNTER("ld", link_downed);
	LOG_ERR_COUNTER("re", rcv_err);
	LOG_ERR_COUNTER("rrp", rcv_rem_phys_err);
	LOG_ERR_COUNTER("rsr", rcv_switch_relay_err);
	LOG_ERR_COUNTER("xd", xmit_discards);
	LOG_ERR_COUNTER("xce", xmit_constraint_err);
	LOG_ERR_COUNTER("rce", rcv_constraint_err);
	LOG_ERR_COUNTER("li", link_integrity);
	LOG_ERR_COUNTER("bo", buffer_overrun);
	LOG_ERR_COUNTER("vld", vl15_dropped);
	LOG_ERR_COUNTER("xw", xmit_wait);

#undef LOG_ERR_COUNTER
}

/**********************************************************************
 * perfmgr_db_err_reading_t functions
 **********************************************************************/

/*
 * Record a new error-counter reading for one port.
 *
 * Under the exclusive db lock the function validates guid/port, marks the
 * port valid, computes for each counter the difference between "reading"
 * and the stored previous reading, adds that difference to the port's
 * running total, stores "reading" as the new previous reading and reports
 * the differences through an OSM_EVENT_ID_PORT_ERRORS event.
 *
 * Returns PERFMGR_EVENT_DB_SUCCESS, or the error from bad_node_port() when
 * the node or port is unknown (nothing is modified in that case).
 */
perfmgr_db_err_t
perfmgr_db_add_err_reading(perfmgr_db_t * db, uint64_t guid, uint8_t port,
			   perfmgr_db_err_reading_t * reading)
{
	osm_epi_pe_event_t epi_pe_data;
	perfmgr_db_err_reading_t *previous;
	db_port_t *p_port;
	db_node_t *node;
	perfmgr_db_err_t status;

/* Delta since the previous reading goes to the event and into the total. */
#define ACCUMULATE_ERR(field)						\
	do {								\
		epi_pe_data.field =					\
		    (reading->field - previous->field);			\
		p_port->err_total.field += epi_pe_data.field;		\
	} while (0)

	cl_plock_excl_acquire(&db->lock);

	node = get(db, guid);
	status = bad_node_port(node, port);
	if (status != PERFMGR_EVENT_DB_SUCCESS) {
		cl_plock_release(&db->lock);
		return status;
	}

	mark_port_valid(node, port);

	p_port = &(node->ports[port]);
	previous = &(p_port->err_previous);

	debug_dump_err_reading(db, guid, port, p_port, reading);

	epi_pe_data.time_diff_s = (reading->time - previous->time);
	osm_epi_create_port_id(&epi_pe_data.port_id, guid, port,
			       node->node_name);

	/* calculate changes from previous reading */
	ACCUMULATE_ERR(symbol_err_cnt);
	ACCUMULATE_ERR(link_err_recover);
	ACCUMULATE_ERR(link_downed);
	ACCUMULATE_ERR(rcv_err);
	ACCUMULATE_ERR(rcv_rem_phys_err);
	ACCUMULATE_ERR(rcv_switch_relay_err);
	ACCUMULATE_ERR(xmit_discards);
	ACCUMULATE_ERR(xmit_constraint_err);
	ACCUMULATE_ERR(rcv_constraint_err);
	ACCUMULATE_ERR(link_integrity);
	ACCUMULATE_ERR(buffer_overrun);
	ACCUMULATE_ERR(vl15_dropped);
	ACCUMULATE_ERR(xmit_wait);

	/* the deltas are done: this reading becomes the new baseline */
	p_port->err_previous = *reading;

	/* mark the time this total was updated */
	p_port->err_total.time = reading->time;

	osm_opensm_report_event(db->perfmgr->osm, OSM_EVENT_ID_PORT_ERRORS,
				&epi_pe_data);

	cl_plock_release(&db->lock);
	return status;

#undef ACCUMULATE_ERR
}

/*
 * Copy the stored previous error-counter reading of one port into
 * "reading".  The db lock is held (non-exclusively) for the lookup and copy.
 *
 * Returns PERFMGR_EVENT_DB_SUCCESS, or the error from bad_node_port() when
 * the node or port is unknown ("reading" is left untouched in that case).
 */
perfmgr_db_err_t perfmgr_db_get_prev_err(perfmgr_db_t * db, uint64_t guid,
					 uint8_t port,
					 perfmgr_db_err_reading_t * reading)
{
	db_node_t *node;
	perfmgr_db_err_t status;

	cl_plock_acquire(&db->lock);

	node = get(db, guid);
	status = bad_node_port(node, port);
	if (status == PERFMGR_EVENT_DB_SUCCESS) {
		*reading = node->ports[port].err_previous;
	}

	cl_plock_release(&db->lock);
	return status;
}

/*
 * Zero the stored previous error-counter reading of one port and stamp it
 * with the current time.  Runs under the exclusive db lock.
 *
 * Returns PERFMGR_EVENT_DB_SUCCESS, or the error from bad_node_port() when
 * the node or port is unknown.
 */
perfmgr_db_err_t
perfmgr_db_clear_prev_err(perfmgr_db_t * db, uint64_t guid, uint8_t port)
{
	db_node_t *node;
	perfmgr_db_err_t status;

	cl_plock_excl_acquire(&db->lock);

	node = get(db, guid);
	status = bad_node_port(node, port);
	if (status == PERFMGR_EVENT_DB_SUCCESS) {
		memset(&node->ports[port].err_previous, 0,
		       sizeof(node->ports[port].err_previous));
		node->ports[port].err_previous.time = time(NULL);
	}

	cl_plock_release(&db->lock);
	return status;
}

/*
 * Log a new data-counter reading next to the previous reading and the
 * running total of one port at OSM_LOG_DEBUG level.  Nothing is emitted
 * when that level is not active on the log.  guid and port_num are not
 * used by the body.
 */
static inline void
debug_dump_dc_reading(perfmgr_db_t * db, uint64_t guid, uint8_t port_num,
		      db_port_t * port, perfmgr_db_data_cnt_reading_t * cur)
{
	osm_log_t *log = db->perfmgr->log;

/* Emit one "<tag> current <-- previous (total)" line for a counter. */
#define LOG_DC_COUNTER(tag, field)					\
	osm_log_v2(log, OSM_LOG_DEBUG, FILE_ID,				\
		   tag " %" PRIu64 " <-- %" PRIu64 " (%" PRIu64 ")\n",	\
		   cur->field, port->dc_previous.field,			\
		   port->dc_total.field)

	if (!OSM_LOG_IS_ACTIVE_V2(log, OSM_LOG_DEBUG))
		return;

	LOG_DC_COUNTER("xd", xmit_data);
	LOG_DC_COUNTER("rd", rcv_data);
	LOG_DC_COUNTER("xp", xmit_pkts);
	LOG_DC_COUNTER("rp", rcv_pkts);

#undef LOG_DC_COUNTER
}

/**********************************************************************
 * perfmgr_db_data_cnt_reading_t functions
 **********************************************************************/

/*
 * Record a new data-counter reading for one port.
 *
 * Under the exclusive db lock the function validates guid/port, marks the
 * port valid, computes for each counter the difference between "reading"
 * and the stored previous reading, adds that difference to the port's
 * running total, stores "reading" as the new previous reading and reports
 * the differences through an OSM_EVENT_ID_PORT_DATA_COUNTERS event.
 *
 * ietf_sup: when non-zero the unicast/multicast packet counters are
 *           processed as well; otherwise they are reported as 0 in the
 *           event and the totals are left unchanged.
 *
 * Returns PERFMGR_EVENT_DB_SUCCESS, or the error from bad_node_port() when
 * the node or port is unknown (nothing is modified in that case).
 */
perfmgr_db_err_t
perfmgr_db_add_dc_reading(perfmgr_db_t * db, uint64_t guid, uint8_t port,
			  perfmgr_db_data_cnt_reading_t * reading,
			  int ietf_sup)
{
	db_port_t *p_port = NULL;
	db_node_t *node = NULL;
	perfmgr_db_data_cnt_reading_t *previous = NULL;
	perfmgr_db_err_t rc = PERFMGR_EVENT_DB_SUCCESS;
	osm_epi_dc_event_t epi_dc_data;

	/*
	 * Start from an all-zero event: the unicast/multicast fields are only
	 * filled in when ietf_sup is set, and the event must not carry
	 * uninitialized stack contents to its consumers otherwise.
	 */
	memset(&epi_dc_data, 0, sizeof(epi_dc_data));

	cl_plock_excl_acquire(&db->lock);
	node = get(db, guid);
	if ((rc = bad_node_port(node, port)) != PERFMGR_EVENT_DB_SUCCESS)
		goto Exit;

	mark_port_valid(node, port);

	p_port = &node->ports[port];
	previous = &node->ports[port].dc_previous;

	debug_dump_dc_reading(db, guid, port, p_port, reading);

	epi_dc_data.time_diff_s = reading->time - previous->time;
	osm_epi_create_port_id(&epi_dc_data.port_id, guid, port,
			       node->node_name);

	/* calculate changes from previous reading */
	epi_dc_data.xmit_data = reading->xmit_data - previous->xmit_data;
	p_port->dc_total.xmit_data += epi_dc_data.xmit_data;
	epi_dc_data.rcv_data = reading->rcv_data - previous->rcv_data;
	p_port->dc_total.rcv_data += epi_dc_data.rcv_data;
	epi_dc_data.xmit_pkts = reading->xmit_pkts - previous->xmit_pkts;
	p_port->dc_total.xmit_pkts += epi_dc_data.xmit_pkts;
	epi_dc_data.rcv_pkts = reading->rcv_pkts - previous->rcv_pkts;
	p_port->dc_total.rcv_pkts += epi_dc_data.rcv_pkts;

	if (ietf_sup)
	{
		epi_dc_data.unicast_xmit_pkts =
		    reading->unicast_xmit_pkts - previous->unicast_xmit_pkts;
		p_port->dc_total.unicast_xmit_pkts += epi_dc_data.unicast_xmit_pkts;
		epi_dc_data.unicast_rcv_pkts =
		    reading->unicast_rcv_pkts - previous->unicast_rcv_pkts;
		p_port->dc_total.unicast_rcv_pkts += epi_dc_data.unicast_rcv_pkts;
		epi_dc_data.multicast_xmit_pkts =
		    reading->multicast_xmit_pkts - previous->multicast_xmit_pkts;
		p_port->dc_total.multicast_xmit_pkts += epi_dc_data.multicast_xmit_pkts;
		epi_dc_data.multicast_rcv_pkts =
		    reading->multicast_rcv_pkts - previous->multicast_rcv_pkts;
		p_port->dc_total.multicast_rcv_pkts += epi_dc_data.multicast_rcv_pkts;
	}

	/* the deltas are done: this reading becomes the new baseline */
	p_port->dc_previous = *reading;

	/* mark the time this total was updated */
	p_port->dc_total.time = reading->time;

	osm_opensm_report_event(db->perfmgr->osm,
				OSM_EVENT_ID_PORT_DATA_COUNTERS, &epi_dc_data);

Exit:
	cl_plock_release(&db->lock);
	return rc;
}

/*
 * Copy the stored previous data-counter reading of one port into
 * "reading".  The db lock is held (non-exclusively) for the lookup and copy.
 *
 * Returns PERFMGR_EVENT_DB_SUCCESS, or the error from bad_node_port() when
 * the node or port is unknown ("reading" is left untouched in that case).
 */
perfmgr_db_err_t perfmgr_db_get_prev_dc(perfmgr_db_t * db, uint64_t guid,
					uint8_t port,
					perfmgr_db_data_cnt_reading_t * reading)
{
	db_node_t *node;
	perfmgr_db_err_t status;

	cl_plock_acquire(&db->lock);

	node = get(db, guid);
	status = bad_node_port(node, port);
	if (status == PERFMGR_EVENT_DB_SUCCESS) {
		*reading = node->ports[port].dc_previous;
	}

	cl_plock_release(&db->lock);
	return status;
}

/*
 * Zero the stored previous data-counter reading of one port and stamp it
 * with the current time.  Runs under the exclusive db lock.
 *
 * Returns PERFMGR_EVENT_DB_SUCCESS, or the error from bad_node_port() when
 * the node or port is unknown.
 */
perfmgr_db_err_t
perfmgr_db_clear_prev_dc(perfmgr_db_t * db, uint64_t guid, uint8_t port)
{
	db_node_t *node;
	perfmgr_db_err_t status;

	cl_plock_excl_acquire(&db->lock);

	node = get(db, guid);
	status = bad_node_port(node, port);
	if (status == PERFMGR_EVENT_DB_SUCCESS) {
		memset(&node->ports[port].dc_previous, 0,
		       sizeof(node->ports[port].dc_previous));
		node->ports[port].dc_previous.time = time(NULL);
	}

	cl_plock_release(&db->lock);
	return status;
}

/*
 * Map callback: reset the accumulated error and data totals of every port
 * of one node.  Each total's timestamp and the port's last_reset are set to
 * the current time.  The "previous" readings are not touched, and "context"
 * is not used.
 */
static void clear_counters(cl_map_item_t * const p_map_item, void *context)
{
	db_node_t *node = (db_node_t *) p_map_item;
	const time_t now = time(NULL);
	int port_idx;

#define ZERO_ERR(field)	(node->ports[port_idx].err_total.field = 0)
#define ZERO_DC(field)	(node->ports[port_idx].dc_total.field = 0)

	for (port_idx = 0; port_idx < node->num_ports; port_idx++) {
		/* error totals */
		ZERO_ERR(symbol_err_cnt);
		ZERO_ERR(link_err_recover);
		ZERO_ERR(link_downed);
		ZERO_ERR(rcv_err);
		ZERO_ERR(rcv_rem_phys_err);
		ZERO_ERR(rcv_switch_relay_err);
		ZERO_ERR(xmit_discards);
		ZERO_ERR(xmit_constraint_err);
		ZERO_ERR(rcv_constraint_err);
		ZERO_ERR(link_integrity);
		ZERO_ERR(buffer_overrun);
		ZERO_ERR(vl15_dropped);
		ZERO_ERR(xmit_wait);
		node->ports[port_idx].err_total.time = now;

		/* data totals */
		ZERO_DC(xmit_data);
		ZERO_DC(rcv_data);
		ZERO_DC(xmit_pkts);
		ZERO_DC(rcv_pkts);
		ZERO_DC(unicast_xmit_pkts);
		ZERO_DC(unicast_rcv_pkts);
		ZERO_DC(multicast_xmit_pkts);
		ZERO_DC(multicast_rcv_pkts);
		node->ports[port_idx].dc_total.time = now;

		node->ports[port_idx].last_reset = now;
	}

#undef ZERO_DC
#undef ZERO_ERR
}

/**********************************************************************
 * Reset the accumulated totals of every node in the db.
 * The db lock is held exclusively while clear_counters() is applied to
 * each map entry.
 **********************************************************************/
void perfmgr_db_clear_counters(perfmgr_db_t * db)
{
	cl_plock_excl_acquire(&db->lock);
	cl_qmap_apply_func(&db->pc_data, clear_counters, db);
	cl_plock_release(&db->lock);
}

/**********************************************************************
 * Write the accumulated counters of one node as tab-delimited text:
 * a header line followed by one line per valid port.  Port 0 is only
 * considered when the node's esp0 flag is set.
 **********************************************************************/
static void dump_node_mr(db_node_t * node, FILE * fp)
{
	int port_idx;

	/* column header; the counter names are passed in as arguments */
	fprintf(fp, "\nName\tGUID\tActive\tPort\tLast Reset\t"
		"Last Error Update\tLast Data Update\t"
		"%s\t%s\t"
		"%s\t%s\t%s\t%s\t%s\t%s\t%s\t"
		"%s\t%s\t%s\t%s\t%s\t%s\t%s\t"
		"%s\t%s\t%s\t%s\t%s\n",
		"symbol_err_cnt",
		"link_err_recover",
		"link_downed",
		"rcv_err",
		"rcv_rem_phys_err",
		"rcv_switch_relay_err",
		"xmit_discards",
		"xmit_constraint_err",
		"rcv_constraint_err",
		"link_int_err",
		"buf_overrun_err",
		"vl15_dropped",
		"xmit_wait",
		"xmit_data",
		"rcv_data",
		"xmit_pkts",
		"rcv_pkts",
		"unicast_xmit_pkts",
		"unicast_rcv_pkts",
		"multicast_xmit_pkts",
		"multicast_rcv_pkts");

	port_idx = node->esp0 ? 0 : 1;
	for (; port_idx < node->num_ports; port_idx++) {
		char reset_buf[128];
		char err_buf[128];
		char data_buf[128];
		char *reset_str;
		char *err_str;
		char *data_str;

		/* ports that were never marked valid produce no line */
		if (!node->ports[port_idx].valid)
			continue;

		reset_str = ctime_r(&node->ports[port_idx].last_reset,
				    reset_buf);
		err_str = ctime_r(&node->ports[port_idx].err_total.time,
				  err_buf);
		data_str = ctime_r(&node->ports[port_idx].dc_total.time,
				   data_buf);

		/* remove the trailing \n that ctime_r() appends */
		reset_str[strlen(reset_str) - 1] = '\0';
		err_str[strlen(err_str) - 1] = '\0';
		data_str[strlen(data_str) - 1] = '\0';

		fprintf(fp,
			"%s\t0x%" PRIx64 "\t%s\t%d\t%s\t%s\t%s\t%" PRIu64 "\t%" PRIu64 "\t"
			"%" PRIu64 "\t%" PRIu64 "\t%" PRIu64 "\t%" PRIu64 "\t"
			"%" PRIu64 "\t%" PRIu64 "\t%" PRIu64 "\t" "%" PRIu64
			"\t%" PRIu64 "\t%" PRIu64 "\t" "%" PRIu64 "\t%" PRIu64
			"\t%" PRIu64 "\t%" PRIu64 "\t" "%" PRIu64 "\t%" PRIu64
			"\t%" PRIu64 "\t%" PRIu64 "\t%" PRIu64 "\n",
			node->node_name,
			node->node_guid,
			node->active ? "TRUE" : "FALSE",
			port_idx, reset_str, err_str, data_str,
			node->ports[port_idx].err_total.symbol_err_cnt,
			node->ports[port_idx].err_total.link_err_recover,
			node->ports[port_idx].err_total.link_downed,
			node->ports[port_idx].err_total.rcv_err,
			node->ports[port_idx].err_total.rcv_rem_phys_err,
			node->ports[port_idx].err_total.rcv_switch_relay_err,
			node->ports[port_idx].err_total.xmit_discards,
			node->ports[port_idx].err_total.xmit_constraint_err,
			node->ports[port_idx].err_total.rcv_constraint_err,
			node->ports[port_idx].err_total.link_integrity,
			node->ports[port_idx].err_total.buffer_overrun,
			node->ports[port_idx].err_total.vl15_dropped,
			node->ports[port_idx].err_total.xmit_wait,
			node->ports[port_idx].dc_total.xmit_data,
			node->ports[port_idx].dc_total.rcv_data,
			node->ports[port_idx].dc_total.xmit_pkts,
			node->ports[port_idx].dc_total.rcv_pkts,
			node->ports[port_idx].dc_total.unicast_xmit_pkts,
			node->ports[port_idx].dc_total.unicast_rcv_pkts,
			node->ports[port_idx].dc_total.multicast_xmit_pkts,
			node->ports[port_idx].dc_total.multicast_rcv_pkts);
	}
}

/*
 * Print a counter value scaled to a 1024-based unit, in the form
 * " (<value><unit>[B])\n" where <unit> is one of "", K, M, G, T, P, E.
 *
 * fp:    output stream
 * val64: raw counter value
 * data:  non-zero for a data counter; the value is then multiplied by 4
 *        before scaling and a "B" suffix is appended (presumably because
 *        data counters are kept in 4-byte units - confirm against caller)
 */
static void dump_hr_dc(FILE *fp, uint64_t val64, int data)
{
	static const char *const units[] = { "", "K", "M", "G", "T", "P", "E" };
	uint64_t div = 1;
	uint64_t rest;
	double val;
	unsigned ui = 0;

	/* find the largest power of 1024 that does not exceed val64 */
	for (rest = val64 / 1024; rest; rest /= 1024) {
		ui++;
		div *= 1024;
	}

	/* double keeps far more of a 64-bit counter's precision than float */
	val = (double)val64;
	if (data) {
		val *= 4;
		/*
		 * The multiplication may push the value into the next unit.
		 * ">=" so that exactly 1024 of a unit prints as 1.000 of the
		 * next one, matching what the loop above does for raw values.
		 */
		if (val / div >= 1024) {
			ui++;
			div *= 1024;
		}
	}
	val /= div;

	fprintf(fp, " (%5.3f%s%s)\n", val,
		ui < sizeof(units) / sizeof(units[0]) ? units[ui] : "",
		data ? "B" : "");
}

/*
 * Parse "str" as a port number within [lo, hi).
 * Returns 0 and stores the number in *out on success; returns -1 when the
 * string is empty, has trailing characters, overflows or is out of range.
 */
static int parse_port_arg(const char *str, int lo, int hi, int *out)
{
	char *end = NULL;
	unsigned long val;

	errno = 0;
	val = strtoul(str, &end, 0);

	if (end == str || *end != '\0' || errno != 0)
		return -1;

	/* compare as unsigned long so huge inputs cannot wrap into range */
	if (lo < 0 || hi <= 0 ||
	    val < (unsigned long)lo || val >= (unsigned long)hi)
		return -1;

	*out = (int)val;
	return 0;
}

/**********************************************************************
 * Output a human readable output of the port counters
 *
 * node:     node whose ports are printed
 * fp:       output stream
 * port:     optional port number as a string; when it names a usable port
 *           only that port is printed, otherwise a warning is written and
 *           all ports are printed.  NULL prints all ports.
 * err_only: when non-zero, ports with no error totals are skipped, only
 *           the non-zero error counters are printed and the data counters
 *           are omitted.
 *
 * Ports that were never marked valid are skipped; port 0 is only
 * considered when the node's esp0 flag is set.
 **********************************************************************/
static void dump_node_hr(db_node_t * node, FILE * fp, char *port, int err_only)
{
	int i = (node->esp0) ? 0 : 1;
	int num_ports = node->num_ports;

	if (port) {
		int p = 0;

		if (parse_port_arg(port, i, num_ports, &p) == 0) {
			i = p;
			num_ports = p+1;
		} else {
			fprintf(fp, "Warning: \"%s\" is not a valid port\n", port);
		}
	}
	for (/* set above */; i < num_ports; i++) {
		char lr[128];
		char leu[128];
		char ldu[128];
		char *last_reset;
		char *last_err_update;
		char *last_data_update;
		perfmgr_db_err_reading_t *err;

		if (!node->ports[i].valid)
			continue;

		last_reset = ctime_r(&node->ports[i].last_reset, lr);
		last_err_update = ctime_r(&node->ports[i].err_total.time, leu);
		last_data_update = ctime_r(&node->ports[i].dc_total.time, ldu);

		last_reset[strlen(last_reset) - 1] = '\0';	/* remove \n */
		last_err_update[strlen(last_err_update) - 1] = '\0';	/* remove \n */
		last_data_update[strlen(last_data_update) - 1] = '\0';	/* remove \n */

		err = &node->ports[i].err_total;

		/* in err_only mode a port without any error is not shown */
		if (err_only
		    && err->symbol_err_cnt == 0
		    && err->link_err_recover == 0
		    && err->link_downed == 0
		    && err->rcv_err == 0
		    && err->rcv_rem_phys_err == 0
		    && err->rcv_switch_relay_err == 0
		    && err->xmit_discards == 0
		    && err->xmit_constraint_err == 0
		    && err->rcv_constraint_err == 0
		    && err->link_integrity == 0
		    && err->buffer_overrun == 0
		    && err->vl15_dropped == 0
		    && err->xmit_wait == 0)
			continue;

		fprintf(fp, "\"%s\" 0x%" PRIx64 " active %s port %d\n"
				    "     Last Reset           : %s\n"
				    "     Last Error Update    : %s\n",
			node->node_name, node->node_guid,
			node->active ? "TRUE":"FALSE", i, last_reset,
			last_err_update);

		if (!err_only || err->symbol_err_cnt != 0)
			fprintf(fp, "     symbol_err_cnt       : %" PRIu64 "\n",
				err->symbol_err_cnt);
		if (!err_only || err->link_err_recover != 0)
			fprintf(fp, "     link_err_recover     : %" PRIu64 "\n",
				err->link_err_recover);
		if (!err_only || err->link_downed != 0)
			fprintf(fp, "     link_downed          : %" PRIu64 "\n",
				err->link_downed);
		if (!err_only || err->rcv_err != 0)
			fprintf(fp, "     rcv_err              : %" PRIu64 "\n",
				err->rcv_err);
		if (!err_only || err->rcv_rem_phys_err != 0)
			fprintf(fp, "     rcv_rem_phys_err     : %" PRIu64 "\n",
				err->rcv_rem_phys_err);
		if (!err_only || err->rcv_switch_relay_err != 0)
			fprintf(fp, "     rcv_switch_relay_err : %" PRIu64 "\n",
				err->rcv_switch_relay_err);
		if (!err_only || err->xmit_discards != 0)
			fprintf(fp, "     xmit_discards        : %" PRIu64 "\n",
				err->xmit_discards);
		if (!err_only || err->xmit_constraint_err != 0)
			fprintf(fp, "     xmit_constraint_err  : %" PRIu64 "\n",
				err->xmit_constraint_err);
		if (!err_only || err->rcv_constraint_err != 0)
			fprintf(fp, "     rcv_constraint_err   : %" PRIu64 "\n",
				err->rcv_constraint_err);
		if (!err_only || err->link_integrity != 0)
			fprintf(fp, "     link_integrity_err   : %" PRIu64 "\n",
				err->link_integrity);
		if (!err_only || err->buffer_overrun != 0)
			fprintf(fp, "     buf_overrun_err      : %" PRIu64 "\n",
				err->buffer_overrun);
		if (!err_only || err->vl15_dropped != 0)
			fprintf(fp, "     vl15_dropped         : %" PRIu64 "\n",
				err->vl15_dropped);
		if (!err_only || err->xmit_wait != 0)
			fprintf(fp, "     xmit_wait            : %" PRIu64 "\n",
				err->xmit_wait);

		/* data counters are not part of the error-only report */
		if (err_only)
			continue;

		fprintf(fp, "     Last Data Update     : %s\n",
			last_data_update);
		fprintf(fp, "     xmit_data            : %" PRIu64,
			node->ports[i].dc_total.xmit_data);
		dump_hr_dc(fp, node->ports[i].dc_total.xmit_data, 1);
		fprintf(fp, "     rcv_data             : %" PRIu64,
			node->ports[i].dc_total.rcv_data);
		dump_hr_dc(fp, node->ports[i].dc_total.rcv_data, 1);
		fprintf(fp, "     xmit_pkts            : %" PRIu64,
			node->ports[i].dc_total.xmit_pkts);
		dump_hr_dc(fp, node->ports[i].dc_total.xmit_pkts, 0);
		fprintf(fp, "     rcv_pkts             : %" PRIu64,
			node->ports[i].dc_total.rcv_pkts);
		dump_hr_dc(fp, node->ports[i].dc_total.rcv_pkts, 0);
		fprintf(fp, "     unicast_xmit_pkts    : %" PRIu64,
			node->ports[i].dc_total.unicast_xmit_pkts);
		dump_hr_dc(fp, node->ports[i].dc_total.unicast_xmit_pkts, 0);
		fprintf(fp, "     unicast_rcv_pkts     : %" PRIu64,
			node->ports[i].dc_total.unicast_rcv_pkts);
		dump_hr_dc(fp, node->ports[i].dc_total.unicast_rcv_pkts, 0);
		fprintf(fp, "     multicast_xmit_pkts  : %" PRIu64,
			node->ports[i].dc_total.multicast_xmit_pkts);
		dump_hr_dc(fp, node->ports[i].dc_total.multicast_xmit_pkts, 0);
		fprintf(fp, "     multicast_rcv_pkts   : %" PRIu64,
			node->ports[i].dc_total.multicast_rcv_pkts);
		dump_hr_dc(fp, node->ports[i].dc_total.multicast_rcv_pkts, 0);

	}
}

/*
 * Context handed to the db_dump() map callback: the stream to write to and
 * the dump format to use.
 */
typedef struct {
	FILE *fp;	/* stream the dump is written to */
	perfmgr_db_dump_t dump_type;	/* format selector examined by db_dump() */
} dump_context_t;

/*
 * Map callback: dump one node to the stream carried in the context.
 * PERFMGR_EVENT_DB_DUMP_MR selects the tab-delimited format; every other
 * dump type (including PERFMGR_EVENT_DB_DUMP_HR) selects the human readable
 * format with all ports and all counters.
 */
static void db_dump(cl_map_item_t * const p_map_item, void *context)
{
	dump_context_t *ctx = (dump_context_t *) context;
	db_node_t *node = (db_node_t *) p_map_item;

	if (ctx->dump_type == PERFMGR_EVENT_DB_DUMP_MR) {
		dump_node_mr(node, ctx->fp);
		return;
	}

	dump_node_hr(node, ctx->fp, NULL, 0);
}

/**********************************************************************
 * Print every node in the db to fp in human readable form.
 * err_only is passed through to dump_node_hr() for each node.
 * The db lock is held (non-exclusively) for the whole walk.
 **********************************************************************/
void
perfmgr_db_print_all(perfmgr_db_t * db, FILE *fp, int err_only)
{
	cl_map_item_t *cur;

	cl_plock_acquire(&db->lock);
	for (cur = cl_qmap_head(&db->pc_data);
	     cur != cl_qmap_end(&db->pc_data);
	     cur = cl_qmap_next(cur)) {
		dump_node_hr((db_node_t *)cur, fp, NULL, err_only);
	}
	cl_plock_release(&db->lock);
}

/**********************************************************************
 * Print the first node whose name equals "nodename" to fp in human
 * readable form; port and err_only are passed through to dump_node_hr().
 * Writes a "not found" line to fp when no node has that name.
 * The db lock is held (non-exclusively) for the search and the dump.
 **********************************************************************/
void
perfmgr_db_print_by_name(perfmgr_db_t * db, char *nodename, FILE *fp,
			 char *port, int err_only)
{
	cl_map_item_t *cur;
	db_node_t *match = NULL;

	cl_plock_acquire(&db->lock);

	/* linear search: the map is keyed by GUID, not by name */
	for (cur = cl_qmap_head(&db->pc_data);
	     cur != cl_qmap_end(&db->pc_data);
	     cur = cl_qmap_next(cur)) {
		db_node_t *candidate = (db_node_t *)cur;

		if (strcmp(candidate->node_name, nodename) == 0) {
			match = candidate;
			break;
		}
	}

	if (match != NULL)
		dump_node_hr(match, fp, port, err_only);
	else
		fprintf(fp, "Node %s not found...\n", nodename);

	cl_plock_release(&db->lock);
}

/**********************************************************************
 * Print the node stored under "nodeguid" to fp in human readable form;
 * port and err_only are passed through to dump_node_hr().
 * Writes a "not found" line to fp when the db has no such node.
 * The db lock is held (non-exclusively) for the lookup and the dump.
 **********************************************************************/
void
perfmgr_db_print_by_guid(perfmgr_db_t * db, uint64_t nodeguid, FILE *fp,
			 char *port, int err_only)
{
	cl_map_item_t *found;

	cl_plock_acquire(&db->lock);

	found = cl_qmap_get(&db->pc_data, nodeguid);
	if (found == cl_qmap_end(&db->pc_data)) {
		fprintf(fp, "Node 0x%" PRIx64 " not found...\n", nodeguid);
	} else {
		dump_node_hr((db_node_t *)found, fp, port, err_only);
	}

	cl_plock_release(&db->lock);
}

/**********************************************************************
 * dump the data to the file "file"
 *
 * The file is created or truncated and every node is written to it in the
 * format selected by dump_type, with the db lock held (non-exclusively)
 * during the walk.
 *
 * Returns PERFMGR_EVENT_DB_FAIL when the file cannot be opened or when
 * writing or closing it reports an error, PERFMGR_EVENT_DB_SUCCESS
 * otherwise.
 **********************************************************************/
perfmgr_db_err_t
perfmgr_db_dump(perfmgr_db_t * db, char *file, perfmgr_db_dump_t dump_type)
{
	perfmgr_db_err_t rc = PERFMGR_EVENT_DB_SUCCESS;
	dump_context_t context;

	context.fp = fopen(file, "w+");
	if (!context.fp)
		return PERFMGR_EVENT_DB_FAIL;
	context.dump_type = dump_type;

	cl_plock_acquire(&db->lock);
	cl_qmap_apply_func(&db->pc_data, db_dump, (void *)&context);
	cl_plock_release(&db->lock);

	/*
	 * stdio buffers the output, so a failed write (e.g. a full disk) may
	 * only become visible through the stream's error flag or when
	 * fclose() flushes the remaining data.
	 */
	if (ferror(context.fp))
		rc = PERFMGR_EVENT_DB_FAIL;
	if (fclose(context.fp) != 0)
		rc = PERFMGR_EVENT_DB_FAIL;

	return rc;
}

/**********************************************************************
 * Fill in the various DB objects from their wire counter parts
 **********************************************************************/

/*
 * Fill an error reading from a wire-format port counters record and stamp
 * it with the current time.
 *
 * xmit_wait_sup: when FALSE the xmit_wait field of the reading is set to 0
 *                instead of being taken from the wire record.
 */
void
perfmgr_db_fill_err_read(ib_port_counters_t * wire_read,
			 perfmgr_db_err_reading_t * reading,
			 boolean_t xmit_wait_sup)
{
	/* counters converted with cl_ntoh16() */
	reading->symbol_err_cnt = cl_ntoh16(wire_read->symbol_err_cnt);
	reading->rcv_err = cl_ntoh16(wire_read->rcv_err);
	reading->rcv_rem_phys_err = cl_ntoh16(wire_read->rcv_rem_phys_err);
	reading->rcv_switch_relay_err =
	    cl_ntoh16(wire_read->rcv_switch_relay_err);
	reading->xmit_discards = cl_ntoh16(wire_read->xmit_discards);
	reading->vl15_dropped = cl_ntoh16(wire_read->vl15_dropped);

	/* counters copied without conversion */
	reading->link_err_recover = wire_read->link_err_recover;
	reading->link_downed = wire_read->link_downed;
	reading->xmit_constraint_err = wire_read->xmit_constraint_err;
	reading->rcv_constraint_err = wire_read->rcv_constraint_err;

	/* two counters share the link_int_buffer_overrun wire field */
	reading->link_integrity =
	    PC_LINK_INT(wire_read->link_int_buffer_overrun);
	reading->buffer_overrun =
	    PC_BUF_OVERRUN(wire_read->link_int_buffer_overrun);

	if (!xmit_wait_sup)
		reading->xmit_wait = 0;
	else
		reading->xmit_wait = cl_ntoh32(wire_read->xmit_wait);

	reading->time = time(NULL);
}

/*
 * Fill a data-counter reading from a wire-format port counters record.
 * The four data/packet counters are converted with cl_ntoh32(); the
 * unicast/multicast packet counters are set to 0 and the reading is stamped
 * with the current time.
 */
void
perfmgr_db_fill_data_cnt_read_pc(ib_port_counters_t * wire_read,
				 perfmgr_db_data_cnt_reading_t * reading)
{
	/* no unicast/multicast breakdown is taken from this record */
	reading->unicast_xmit_pkts = 0;
	reading->unicast_rcv_pkts = 0;
	reading->multicast_xmit_pkts = 0;
	reading->multicast_rcv_pkts = 0;

	reading->xmit_data = cl_ntoh32(wire_read->xmit_data);
	reading->rcv_data = cl_ntoh32(wire_read->rcv_data);
	reading->xmit_pkts = cl_ntoh32(wire_read->xmit_pkts);
	reading->rcv_pkts = cl_ntoh32(wire_read->rcv_pkts);

	reading->time = time(NULL);
}

/*
 * Fill a data-counter reading from a wire-format extended port counters
 * record and stamp it with the current time.  All counters are converted
 * with cl_ntoh64().
 *
 * ietf_sup: when non-zero the unicast/multicast packet counters are taken
 *           from the wire record; otherwise they are set to 0, as
 *           perfmgr_db_fill_data_cnt_read_pc() does, so that the reading
 *           never carries uninitialized values.
 */
void
perfmgr_db_fill_data_cnt_read_pce(ib_port_counters_ext_t * wire_read,
				  perfmgr_db_data_cnt_reading_t * reading,
				  int ietf_sup)
{
	reading->xmit_data = cl_ntoh64(wire_read->xmit_data);
	reading->rcv_data = cl_ntoh64(wire_read->rcv_data);
	reading->xmit_pkts = cl_ntoh64(wire_read->xmit_pkts);
	reading->rcv_pkts = cl_ntoh64(wire_read->rcv_pkts);
	if (ietf_sup)
	{
		reading->unicast_xmit_pkts = cl_ntoh64(wire_read->unicast_xmit_pkts);
		reading->unicast_rcv_pkts = cl_ntoh64(wire_read->unicast_rcv_pkts);
		reading->multicast_xmit_pkts =
		    cl_ntoh64(wire_read->multicast_xmit_pkts);
		reading->multicast_rcv_pkts = cl_ntoh64(wire_read->multicast_rcv_pkts);
	}
	else
	{
		/* the caller's reading may be uninitialized storage */
		reading->unicast_xmit_pkts = 0;
		reading->unicast_rcv_pkts = 0;
		reading->multicast_xmit_pkts = 0;
		reading->multicast_rcv_pkts = 0;
	}
	reading->time = time(NULL);
}
#endif				/* ENABLE_OSM_PERF_MGR */