Blob Blame History Raw
/****************************/
/* THIS IS OPEN SOURCE CODE */
/****************************/

/** 
 * @file    linux-bgq.c
 * @author  Heike Jagode
 *          jagode@eecs.utk.edu
 * Mods:	< your name here >
 *			< your email address >
 * Blue Gene/Q CPU component: BGPM / Punit
 * 
 * Tested version of bgpm (early access)
 *
 * @brief
 *  This file has the source code for a component that enables PAPI-C to 
 *  access hardware monitoring counters for BG/Q through the BGPM library.
 */

#include "papi.h"
#include "papi_internal.h"
#include "papi_lock.h"
#include "papi_memory.h"
#include "extras.h"

#include "linux-bgq.h"

#include "papi_vector.h"
#include "error.h"

/*
 * BG/Q specific 'stuff'
 */
#include <ucontext.h>
#include <stdlib.h>
#include <signal.h>
#include <sys/time.h>
#include <errno.h>
#include <stdio.h>
#include <string.h>
#include <sys/utsname.h>
#include "spi/include/upci/upci.h"
#ifdef DEBUG_BGQ
#include <inttypes.h>
#endif

// BG/Q macros
#define get_cycles GetTimeBase

// BG/Q external structures/functions/stuff
#if 1
UPC_Lock_t thdLocks[PAPI_MAX_LOCK];
#else
pthread_mutex_t thdLocks[PAPI_MAX_LOCK];
#endif

/* Defined in papi_data.c */
//extern papi_mdi_t _papi_hwi_system_info;

papi_vector_t _bgq_vectors;
PAPI_os_info_t _papi_os_info;

#define OPCODE_EVENT_CHUNK 8
static int allocated_opcode_events = 0;
static int num_opcode_events = 0;

struct bgq_generic_events_t {
	int idx;
	int eventId;
	char mask[PAPI_MIN_STR_LEN];
	char opcode[PAPI_MIN_STR_LEN];
	uint64_t opcode_mask;
};

static struct bgq_generic_events_t *GenericEvent;

/* Defined in linux-bgq-memory.c */
extern int _bgq_get_memory_info( PAPI_hw_info_t * pHwInfo, int pCPU_Type );
extern int _bgq_get_dmem_info( PAPI_dmem_info_t * pDmemInfo );

/* prototypes */
void user_signal_handler( int hEvtSet, uint64_t address, uint64_t ovfVector, const ucontext_t *pContext );

/*******************************************************************************
 ********  BEGIN FUNCTIONS USED INTERNALLY SPECIFIC TO THIS COMPONENT **********
 ******************************************************************************/


/*
 * Lock
 */
void
_papi_hwd_lock( int lock ) 
{
#ifdef DEBUG_BGQ
	printf( _AT_ " _papi_hwd_lock %d\n", lock);
#endif
	assert( lock < PAPI_MAX_LOCK );
#if 1
	UPC_Lock( &thdLocks[lock] );
#else
	pthread_mutex_lock( &thdLocks[lock] );
#endif
	
#ifdef DEBUG_BGQ
	printf( _AT_ " _papi_hwd_lock got lock %d\n", lock );
#endif
	
	return;
}

/*
 * Unlock
 */
void
_papi_hwd_unlock( int lock )
{
#ifdef DEBUG_BGQ
    printf( _AT_ " _papi_hwd_unlock %d\n", lock );
#endif
    assert( lock < PAPI_MAX_LOCK );
#if 1
	UPC_Unlock( &thdLocks[lock] );
#else
	pthread_mutex_unlock( &thdLocks[lock] );
#endif
	
	return;
}


/*
 * Get System Information
 *
 * Initialize system information structure
 */
int
_bgq_get_system_info( papi_mdi_t *mdi )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_get_system_info\n" );
#endif
	
	( void ) mdi;
	Personality_t personality;
	int retval;
	
	/* Hardware info */
	retval = Kernel_GetPersonality( &personality, sizeof( Personality_t ) );
	if ( retval ) {
		fprintf( stdout, "Kernel_GetPersonality returned %d (sys error=%d).\n"
				"\t%s\n", retval, errno, strerror( errno ) );
		return PAPI_ESYS;
	}

	/* Returns the number of processors that are associated with the currently
	 * running process */
	_papi_hwi_system_info.hw_info.ncpu = Kernel_ProcessorCount( );
	// TODO: HJ Those values need to be fixed
	_papi_hwi_system_info.hw_info.nnodes = Kernel_ProcessCount( );
	_papi_hwi_system_info.hw_info.totalcpus = _papi_hwi_system_info.hw_info.ncpu;
	
	_papi_hwi_system_info.hw_info.cpu_max_mhz = personality.Kernel_Config.FreqMHz;
	_papi_hwi_system_info.hw_info.cpu_min_mhz = personality.Kernel_Config.FreqMHz;

	_papi_hwi_system_info.hw_info.mhz = ( float ) personality.Kernel_Config.FreqMHz;
	SUBDBG( "_bgq_get_system_info:  Detected MHZ is %f\n",
		   _papi_hwi_system_info.hw_info.mhz );

	return ( PAPI_OK );
}


/*
 * Initialize Control State
 *
 */
int
_bgq_init_control_state( hwd_control_state_t * ptr )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_init_control_state\n" );
#endif
	int retval;
	
	ptr->EventGroup = Bgpm_CreateEventSet();
	retval = _check_BGPM_error( ptr->EventGroup, "Bgpm_CreateEventSet" );
	if ( retval < 0 ) return retval;

	// initialize multiplexing flag to OFF (0)
	ptr->muxOn = 0;
	// initialize overflow flag to OFF (0)
	ptr->overflow = 0;
    ptr->overflow_count = 0;
	// initialized BGPM eventGroup flag to NOT applied yet (0)
	ptr->bgpm_eventset_applied = 0;
	
	return PAPI_OK;
}


/*
 * Set Domain
 */
int
_bgq_set_domain( hwd_control_state_t * cntrl, int domain )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_set_domain\n" );
#endif
	int found = 0;
	( void ) cntrl;
	
	if ( PAPI_DOM_USER & domain )
		found = 1;
	
	if ( PAPI_DOM_KERNEL & domain )
		found = 1;
	
	if ( PAPI_DOM_OTHER & domain )
		found = 1;
	
	if ( !found )
		return ( PAPI_EINVAL );
	
	return ( PAPI_OK );
}

/*
 * PAPI Initialization
 * This is called whenever a thread is initialized
 */
int
_bgq_init( hwd_context_t * ctx )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_init\n" );
#endif
	( void ) ctx;
	int retval;

#ifdef DEBUG_BGPM
	Bgpm_PrintOnError(1);
	Bgpm_ExitOnError(0);
#else
	Bgpm_PrintOnError(0);
	// avoid bgpm default of exiting when error occurs - caller will check return code instead.
	Bgpm_ExitOnError(0);	
#endif
	
	retval = Bgpm_Init( BGPM_MODE_SWDISTRIB );
	retval = _check_BGPM_error( retval, "Bgpm_Init" );
	if ( retval < 0 ) return retval;

	//_common_initBgpm();
	
	return PAPI_OK;	
}


int
_bgq_multiplex( hwd_control_state_t * bgq_state )
{
	int retval;
	uint64_t bgpm_period;
	double Sec, Hz;	

#ifdef DEBUG_BGQ
	printf("_bgq_multiplex BEGIN: Num of Events = %d (vs %d)\n", Bgpm_NumEvents( bgq_state->EventGroup ), bgq_state->count );
#endif
	
	// convert Mhz to Hz ( = cycles / sec )
	Hz = (double) _papi_hwi_system_info.hw_info.cpu_max_mhz * 1000 * 1000;
	// convert PAPI multiplex period (in ns) to BGPM period (in cycles)
	Sec = (double) _papi_os_info.itimer_ns / ( 1000 * 1000 * 1000 );
	bgpm_period = Hz * Sec;

	// if EventGroup is not empty -- which is required by BGPM before 
	// we can call SetMultiplex() -- then drain the events from the 
	// BGPM EventGroup, turn on multiplex flag, and rebuild BGPM EventGroup.
	if ( 0 < bgq_state->count ) {
		// Delete and re-create BGPM eventset
		retval = _common_deleteRecreate( &bgq_state->EventGroup );
		if ( retval < 0 ) return retval;

		// turn on multiplex for BGPM
		retval = Bgpm_SetMultiplex( bgq_state->EventGroup, bgpm_period, BGPM_NORMAL ); 		
		retval = _check_BGPM_error( retval, "Bgpm_SetMultiplex" );
		if ( retval < 0 ) return retval;

		// rebuild BGPM EventGroup
		retval = _common_rebuildEventgroup( bgq_state->count, 
								   bgq_state->EventGroup_local, 
								   &bgq_state->EventGroup );	
		if ( retval < 0 ) return retval;
	}
	else {
		// need to pass either BGPM_NORMAL or BGPM_NOTNORMAL 
		// BGPM_NORMAL: numbers reported by Bgpm_ReadEvent() are normalized 
		// to the maximum time spent in a multiplexed group
		retval = Bgpm_SetMultiplex( bgq_state->EventGroup, bgpm_period, BGPM_NORMAL ); 		
		retval = _check_BGPM_error( retval, "Bgpm_SetMultiplex" );
		if ( retval < 0 ) return retval;
	}

#ifdef DEBUG_BGQ
	printf("_bgq_multiplex END: Num of Events = %d (vs %d) --- retval = %d\n", 
		   Bgpm_NumEvents( bgq_state->EventGroup ), bgq_state->count, retval );
#endif
	
	return ( retval );
}





/*
 * Register Allocation
 *
 */
int
_bgq_allocate_registers( EventSetInfo_t * ESI )
{
#ifdef DEBUG_BGQ
	printf("_bgq_allocate_registers\n");
#endif
	int i, natNum;
	int xEventId;

	/*
	 * Start monitoring the events...
	 */
	natNum = ESI->NativeCount;

	for ( i = 0; i < natNum; i++ ) {
		xEventId = ( ESI->NativeInfoArray[i].ni_event & PAPI_NATIVE_AND_MASK ) + 1;
		ESI->NativeInfoArray[i].ni_position = i;		
	}

	return PAPI_OK;
}


/*
 * PAPI Cleanup Eventset
 *
 * Destroy and re-create the BGPM / Punit EventSet
 */
int
_bgq_cleanup_eventset( hwd_control_state_t * ctrl )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_cleanup_eventset\n" );
#endif
	
	// set multiplexing flag to OFF (0)
	ctrl->muxOn = 0;
	// set overflow flag to OFF (0)
	ctrl->overflow = 0;
    ctrl->overflow_count = 0;
	// set BGPM eventGroup flag back to NOT applied yet (0)
	ctrl->bgpm_eventset_applied = 0;

	return ( PAPI_OK );
}


/*
 * Update Control State
 *
 * This function clears the current contents of the control
 * structure and updates it with whatever resources are allocated
 * for all the native events in the native info structure array.
 */
int
_bgq_update_control_state( hwd_control_state_t * ptr,
						   NativeInfo_t * native, int count,
						   hwd_context_t * ctx )
{
#ifdef DEBUG_BGQ
	printf( _AT_ " _bgq_update_control_state: count = %d, EventGroup=%d\n", count, ptr->EventGroup );
#endif
	( void ) ctx;
	int i, j, k, index, retval;
	unsigned evtIdx;
	
	// Delete and re-create BGPM eventset
	retval = _common_deleteRecreate( &ptr->EventGroup );
	if ( retval < 0 ) return retval;

#ifdef DEBUG_BGQ
    printf( _AT_ " _bgq_update_control_state: EventGroup=%d, muxOn = %d, overflow = %d\n",
		   ptr->EventGroup, ptr->muxOn, ptr->overflow );
#endif
	
	// add the events to the eventset
	for ( i = 0; i < count; i++ ) {
		index = ( native[i].ni_event & PAPI_NATIVE_AND_MASK ) + 1;
		
		ptr->EventGroup_local[i] = index;

		// we found an opcode event
		if ( index > BGQ_PUNIT_MAX_EVENTS ) {
			for( j = 0; j < num_opcode_events; j++ ) {
#ifdef DEBUG_BGQ
				printf(_AT_ " _bgq_update_control_state: %d out of %d OPCODES\n",
					   j, num_opcode_events );
#endif
#ifdef DEBUG_BGQ
				printf(_AT_ " _bgq_update_control_state: j's idx = %d, index = %d\n",
					   GenericEvent[j].idx, index );
#endif
				if ( GenericEvent[j].idx == ( index - 1) ) {
					/* Add events to the BGPM eventGroup */
					retval = Bgpm_AddEvent( ptr->EventGroup, GenericEvent[j].eventId );
					retval = _check_BGPM_error( retval, "Bgpm_AddEvent" );
					if ( retval < 0 ) return retval;
#ifdef DEBUG_BGQ
					printf(_AT_ " _bgq_update_control_state: ADD event: i = %d, eventId = %d\n", i, GenericEvent[j].eventId );
#endif
					
					evtIdx = Bgpm_GetEventIndex( ptr->EventGroup,
												 GenericEvent[j].eventId,
												 i );
#ifdef DEBUG_BGQ
					printf(_AT_ " _bgq_update_control_state: evtIdx in EventGroup = %d\n",
						   evtIdx );
#endif
					if ( 0 == strcmp( GenericEvent[j].mask, "PEVT_INST_XU_GRP_MASK" ) ) {
						retval = Bgpm_SetXuGrpMask( ptr->EventGroup,
												    evtIdx,
												    GenericEvent[j].opcode_mask );
						retval = _check_BGPM_error( retval, "Bgpm_SetXuGrpMask" );
						if ( retval < 0 ) return retval;
#ifdef DEBUG_BGQ
						printf(_AT_ " _bgq_update_control_state: it's PEVT_INST_XU_GRP_MASK\n" );
#endif
					} else if ( 0 == strcmp( GenericEvent[j].mask, "PEVT_INST_QFPU_GRP_MASK" ) ) {
						retval = Bgpm_SetQfpuGrpMask( ptr->EventGroup,
												      evtIdx,
													  GenericEvent[j].opcode_mask );
						retval = _check_BGPM_error( retval, "Bgpm_SetQfpuGrpMask" );
						if ( retval < 0 ) return retval;
#ifdef DEBUG_BGQ
						printf(_AT_ " _bgq_update_control_state: it's PEVT_INST_QFPU_GRP_MASK\n" );
#endif
					}
				}	
			}
		}
		else {
#ifdef DEBUG_BGQ
			printf(_AT_ " _bgq_update_control_state: no OPCODE\n" );
#endif
			
			/* Add events to the BGPM eventGroup */
			retval = Bgpm_AddEvent( ptr->EventGroup, index );
			retval = _check_BGPM_error( retval, "Bgpm_AddEvent" );
			if ( retval < 0 ) return retval;
#ifdef DEBUG_BGQ
			printf(_AT_ " _bgq_update_control_state: ADD event: i = %d, index = %d\n", i, index );
#endif
			
		}
	}
	
	// store how many events we added to an EventSet
	ptr->count = count;

	// if muxOn and EventGroup is not empty -- which is required by BGPM before 
	// we can call SetMultiplex() -- then drain the events from the 
	// BGPM EventGroup, turn on multiplex flag, and rebuild BGPM EventGroup.
	if ( 1 == ptr->muxOn ) {
		retval = _bgq_multiplex( ptr );
	}
		
    // since update_control_state trashes overflow settings, this puts things
    // back into balance for BGPM
    if ( 1 == ptr->overflow ) {
        for ( k = 0; k < ptr->overflow_count; k++ ) {
            retval = _common_set_overflow_BGPM( ptr->EventGroup,
                                       ptr->overflow_list[k].EventIndex,
                                       ptr->overflow_list[k].threshold,
                                       user_signal_handler );
			if ( retval < 0 ) return retval;
        }
    }
		
	return ( PAPI_OK );
}



/*
 * PAPI Start
 */
int
_bgq_start( hwd_context_t * ctx, hwd_control_state_t * ptr )
{
#ifdef DEBUG_BGQ
	printf( "BEGIN _bgq_start\n" );
#endif
	( void ) ctx;
	int retval;
		
	retval = Bgpm_Apply( ptr->EventGroup ); 
	retval = _check_BGPM_error( retval, "Bgpm_Apply" );
	if ( retval < 0 ) return retval;
	
	// set flag to 1: BGPM eventGroup HAS BEEN applied
	ptr->bgpm_eventset_applied = 1;

#ifdef DEBUG_BGQ
	int i;
	int numEvts = Bgpm_NumEvents( ptr->EventGroup );
	for ( i = 0; i < numEvts; i++ ) {
		printf("%d = %s\n", i, Bgpm_GetEventLabel( ptr->EventGroup, i) );
	}
#endif	
	
	/* Bgpm_Apply() does an implicit reset; 
	 hence no need to use Bgpm_ResetStart */
	retval = Bgpm_Start( ptr->EventGroup );
	retval = _check_BGPM_error( retval, "Bgpm_Start" );
	if ( retval < 0 ) return retval;
	
	return ( PAPI_OK );
}

/*
 * PAPI Stop
 */
int
_bgq_stop( hwd_context_t * ctx, hwd_control_state_t * ptr )
{
#ifdef DEBUG_BGQ
	printf( "BEGIN _bgq_stop\n" );
#endif
	( void ) ctx;
	int retval;
	
	retval = Bgpm_Stop( ptr->EventGroup );
	retval = _check_BGPM_error( retval, "Bgpm_Stop" );
	if ( retval < 0 ) return retval;
	
	return ( PAPI_OK );
}

/*
 * PAPI Read Counters
 *
 * Read the counters into local storage
 */
int
_bgq_read( hwd_context_t * ctx, hwd_control_state_t * ptr,
		   long_long ** dp, int flags )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_read\n" );
#endif
	( void ) ctx;
	( void ) flags;
	int i, numEvts;
	
	numEvts = Bgpm_NumEvents( ptr->EventGroup );
	if ( numEvts == 0 ) {
#ifdef DEBUG_BGPM
		printf ("Error: ret value is %d for BGPM API function Bgpm_NumEvents.\n", numEvts );
		//return ( EXIT_FAILURE );
#endif
	}
	
	for ( i = 0; i < numEvts; i++ ) 
		ptr->counters[i] = _common_getEventValue( i, ptr->EventGroup );

	*dp = ptr->counters;
		
	return ( PAPI_OK );
}

/*
 * PAPI Reset
 *
 * Zero the counter values
 */
int
_bgq_reset( hwd_context_t * ctx, hwd_control_state_t * ptr )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_reset\n" );
#endif
	( void ) ctx;
	int retval;
	
	/* we can't simply call Bgpm_Reset() since PAPI doesn't have the 
	   restriction that an EventSet has to be stopped before resetting is
	   possible. However, BGPM does have this restriction. 
	   Hence we need to stop, reset and start */
	retval = Bgpm_Stop( ptr->EventGroup );
	retval = _check_BGPM_error( retval, "Bgpm_Stop" );
	if ( retval < 0 ) return retval;
	
	retval = Bgpm_ResetStart( ptr->EventGroup );
	retval = _check_BGPM_error( retval, "Bgpm_ResetStart" );
	if ( retval < 0 ) return retval;

	return ( PAPI_OK );
}


/*
 * PAPI Shutdown
 *
 * This routine is for shutting down threads,
 * including the master thread.
 * Effectively a no-op, same as BG/L/P...
 */
int
_bgq_shutdown( hwd_context_t * ctx )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_shutdown\n" );
#endif
	( void ) ctx;
	int retval;
	
	/* Disable BGPM library */	
	retval = Bgpm_Disable();
	retval = _check_BGPM_error( retval, "Bgpm_Disable" );
	if ( retval < 0 ) return retval;

	return ( PAPI_OK );
}

/*
 * PAPI Write
 *
 * Write counter values
 * NOTE:  Could possible support, but signal error as BG/L/P does...
 */
int
_bgq_write( hwd_context_t * ctx, hwd_control_state_t * cntrl, long_long * from )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_write\n" );
#endif
	( void ) ctx;
	( void ) cntrl;
	( void ) from;
	
	return PAPI_ECMP;
}

/*
 * Dispatch Timer
 *
 * NOT the same as BG/L/P where we simply return
 * This function is used when hardware overflows are working or when
 * software overflows are forced
 */
void
_bgq_dispatch_timer( int signal, hwd_siginfo_t * info, void *uc )
{
	( void ) signal;
	( void ) info;
	( void ) uc;
#ifdef DEBUG_BGQ
	printf("BEGIN _bgq_dispatch_timer\n");
#endif
	
	return;
}



/*
 * user_signal_handler
 *
 * This function is used when hardware overflows are working or when
 * software overflows are forced
 */
void
user_signal_handler( int hEvtSet, uint64_t address, uint64_t ovfVector, const ucontext_t *pContext )
{
#ifdef DEBUG_BGQ
	printf( "user_signal_handler start\n" );
#endif
	( void ) address;
	int retval; 
	unsigned i;
	int isHardware = 1;
	int cidx = _bgq_vectors.cmp_info.CmpIdx;
	long_long overflow_bit = 0;
	caddr_t address1;
	_papi_hwi_context_t ctx;
	ctx.ucontext = ( hwd_ucontext_t * ) pContext;
	ThreadInfo_t *thread = _papi_hwi_lookup_thread( 0 );
	
	//printf(_AT_ " thread = %p\n", thread);	// <<<<<<<<<<<<<<<<<<
	
	EventSetInfo_t *ESI;
	ESI = thread->running_eventset[cidx];
    // Get the indices of all events which have overflowed.
    unsigned ovfIdxs[BGPM_MAX_OVERFLOW_EVENTS];
    unsigned len = BGPM_MAX_OVERFLOW_EVENTS;
	
    retval = Bgpm_GetOverflowEventIndices( hEvtSet, ovfVector, ovfIdxs, &len );

	if ( retval < 0 ) {
#ifdef DEBUG_BGPM
		printf ( "Error: ret value is %d for BGPM API function Bgpm_GetOverflowEventIndices.\n", 
				 retval ); 
#endif
		return;
	}
		
	if ( thread == NULL ) {
		PAPIERROR( "thread == NULL in user_signal_handler!" );
		return;
	}
		
	if ( ESI == NULL ) {
		PAPIERROR( "ESI == NULL in user_signal_handler!");
		return;
	}
		
	if ( ESI->overflow.flags == 0 ) {
		PAPIERROR( "ESI->overflow.flags == 0 in user_signal_handler!");
		return;
	}

	for ( i = 0; i < len; i++ ) {
		uint64_t hProf;
        Bgpm_GetEventUser1( hEvtSet, ovfIdxs[i], &hProf );
        if ( hProf ) {
			overflow_bit ^= 1 << ovfIdxs[i];
			break;
        }
		
	}
	
	if ( ESI->overflow.flags & PAPI_OVERFLOW_FORCE_SW ) {
#ifdef DEBUG_BGQ
		printf("OVERFLOW_SOFTWARE\n");
#endif
		address1 = GET_OVERFLOW_ADDRESS( ctx );
		_papi_hwi_dispatch_overflow_signal( ( void * ) &ctx, address1, NULL, 0, 0, &thread, cidx );
		return;
	}
	else if ( ESI->overflow.flags & PAPI_OVERFLOW_HARDWARE ) {
#ifdef DEBUG_BGQ
		printf("OVERFLOW_HARDWARE\n");
#endif
		address1 = GET_OVERFLOW_ADDRESS( ctx );
		_papi_hwi_dispatch_overflow_signal( ( void * ) &ctx, address1, &isHardware, overflow_bit, 0, &thread, cidx );
	}
	else {
#ifdef DEBUG_BGQ
		printf("OVERFLOW_NONE\n");
#endif
		PAPIERROR( "ESI->overflow.flags is set to something other than PAPI_OVERFLOW_HARDWARE or PAPI_OVERFLOW_FORCE_SW (%#x)", thread->running_eventset[cidx]->overflow.flags);
	}
}


/*
 * Set Overflow
 *
 * This is commented out in BG/L/P - need to explore and complete...
 * However, with true 64-bit counters in BG/Q and all counters for PAPI
 * always starting from a true zero (we don't allow write...), the possibility
 * for overflow is remote at best...
 */
int
_bgq_set_overflow( EventSetInfo_t * ESI, int EventIndex, int threshold )
{
#ifdef DEBUG_BGQ
	printf("BEGIN _bgq_set_overflow\n");
#endif
	hwd_control_state_t * this_state = ( hwd_control_state_t * ) ESI->ctl_state;
	int retval;
	int evt_idx;
	
	/*
	 * In case an BGPM eventGroup HAS BEEN applied or attached before
	 * overflow is set, delete the eventGroup and create an new empty one,
	 * and rebuild as it was prior to deletion
	 */
#ifdef DEBUG_BGQ
	printf( "_bgq_set_overflow: bgpm_eventset_applied = %d, threshold = %d\n",
		    this_state->bgpm_eventset_applied, threshold );
#endif	
	if ( 1 == this_state->bgpm_eventset_applied && 0 != threshold ) {
		retval = _common_deleteRecreate( &this_state->EventGroup );
		if ( retval < 0 ) return retval;

		retval = _common_rebuildEventgroup( this_state->count,
								   this_state->EventGroup_local,
								   &this_state->EventGroup );
		if ( retval < 0 ) return retval;

		/* set BGPM eventGroup flag back to NOT applied yet (0) 
		 * because the eventGroup has been recreated from scratch */
		this_state->bgpm_eventset_applied = 0;
	}
	
	
	evt_idx = ESI->EventInfoArray[EventIndex].pos[0];
	//evt_id = ( ESI->NativeInfoArray[EventIndex].ni_event & PAPI_NATIVE_AND_MASK ) + 1;
	SUBDBG( "Hardware counter %d (vs %d) used in overflow, threshold %d\n",
		    evt_idx, EventIndex, threshold );
#ifdef DEBUG_BGQ
	printf( "Hardware counter %d (vs %d) used in overflow, threshold %d\n",
		    evt_idx, EventIndex, threshold );
#endif
	
	/* If this counter isn't set to overflow, it's an error */
	if ( threshold == 0 ) {
		/* Remove the signal handler */
		retval = _papi_hwi_stop_signal( _bgq_vectors.cmp_info.hardware_intr_sig );
		if ( retval != PAPI_OK )
			return ( retval );
	}
	else {
		this_state->overflow = 1;
        this_state->overflow_count++;
		this_state->overflow_list[this_state->overflow_count-1].threshold = threshold;
		this_state->overflow_list[this_state->overflow_count-1].EventIndex = evt_idx;
	
#ifdef DEBUG_BGQ
		printf( "_bgq_set_overflow: Enable the signal handler\n" );
#endif		
		/* Enable the signal handler */
		retval = _papi_hwi_start_signal( _bgq_vectors.cmp_info.hardware_intr_sig, 
										 NEED_CONTEXT, 
										 _bgq_vectors.cmp_info.CmpIdx );
		if ( retval != PAPI_OK )
			return ( retval );
		
		retval = _common_set_overflow_BGPM( this_state->EventGroup,
                                  this_state->overflow_list[this_state->overflow_count-1].EventIndex,
                                  this_state->overflow_list[this_state->overflow_count-1].threshold,
                                  user_signal_handler );
		if ( retval < 0 ) return retval;
	}

	return ( PAPI_OK );
}


/*
 * Set Profile
 *
 * Same as for BG/L/P, routine not used and returns error
 */
int
_bgq_set_profile( EventSetInfo_t * ESI, int EventIndex, int threshold )
{
#ifdef DEBUG_BGQ
	printf("BEGIN _bgq_set_profile\n");
#endif
	
	( void ) ESI;
	( void ) EventIndex;
	( void ) threshold;
	
	return PAPI_ECMP;
}

/*
 * Stop Profiling
 *
 * Same as for BG/L/P...
 */
int
_bgq_stop_profiling( ThreadInfo_t * master, EventSetInfo_t * ESI )
{
#ifdef DEBUG_BGQ
	printf("BEGIN _bgq_stop_profiling\n");
#endif
	
	( void ) master;
	( void ) ESI;
	
	return ( PAPI_OK );
}

/*
 * PAPI Control
 *
 * Same as for BG/L/P - initialize the domain
 */
int
_bgq_ctl( hwd_context_t * ctx, int code, _papi_int_option_t * option )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_ctl\n" );
#endif
	( void ) ctx;
	int retval;
	
	switch ( code ) {
		case PAPI_MULTIPLEX:
		{
			hwd_control_state_t * bgq_state = ( ( hwd_control_state_t * ) option->multiplex.ESI->ctl_state );
			bgq_state->muxOn = 1;
			retval = _bgq_multiplex( bgq_state );
			return ( retval );
		}
		default:
			return ( PAPI_OK );
	}
}

/*
 * Get Real Micro-seconds
 */
long long
_bgq_get_real_usec( void )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_get_real_usec\n" );
#endif
	
	/*
	 * NOTE:  _papi_hwi_system_info.hw_info.mhz is really a representation of unit of time per cycle.
	 *        On BG/P, it's value is 8.5e-4.  Therefore, to get cycles per sec, we have to multiply
	 *        by 1.0e12.  To then convert to usec, we have to divide by 1.0e-3.
	 */
	return ( ( long long ) ( ( ( float ) get_cycles(  ) ) /
							 ( ( _papi_hwi_system_info.hw_info.cpu_max_mhz ) ) ) );

}

/*
 * Get Real Cycles
 *
 * Same for BG/L/P, using native function...
 */
long long
_bgq_get_real_cycles( void )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_get_real_cycles\n" );
#endif

	return ( ( long long ) get_cycles(  ) );

}

/*
 * Get Virtual Micro-seconds
 *
 * Same calc as for BG/L/P, returns real usec...
 */
long long
_bgq_get_virt_usec( void )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_get_virt_usec\n" );
#endif
	
	return _bgq_get_real_usec(  );
}

/*
 * Get Virtual Cycles
 *
 * Same calc as for BG/L/P, returns real cycles...
 */
long long
_bgq_get_virt_cycles( void )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_get_virt_cycles\n" );
#endif
	
	return _bgq_get_real_cycles(  );
}

/*
 * Component setup and shutdown
 *
 * Initialize hardware counters, setup the function vector table
 * and get hardware information, this routine is called when the
 * PAPI process is initialized (IE PAPI_library_init)
 */
int
_bgq_init_component( int cidx )
{	
#ifdef DEBUG_BGQ
	printf("_bgq_init_substrate\n");
	//printf("_bgq_init_substrate: 1. BGPM_INITIALIZED = %d \n", BGPM_INITIALIZED);
#endif
	int retval;
	int i;
		
	/* allocate the opcode event structure */
	GenericEvent = calloc( OPCODE_EVENT_CHUNK, sizeof( struct bgq_generic_events_t ) );
	if ( NULL == GenericEvent ) {
		return PAPI_ENOMEM;
	}
	
	/* init opcode event stuff */
	allocated_opcode_events = OPCODE_EVENT_CHUNK;
	num_opcode_events = 0;
		
	_bgq_vectors.cmp_info.CmpIdx = cidx;

	/*
	 * Fill in what we can of the papi_system_info
	 */
	SUBDBG( "Before _bgq_get_system_info()...\n" );
	retval = _bgq_get_system_info( &_papi_hwi_system_info );
	SUBDBG( "After _bgq_get_system_info(), retval=%d...\n", retval );
	if ( retval != PAPI_OK )
		return ( retval );

	/*
	 * Setup memory info
	 */

	SUBDBG( "Before _bgq_get_memory_info...\n" );
	retval = _bgq_get_memory_info( &_papi_hwi_system_info.hw_info,
								  ( int ) _papi_hwi_system_info.hw_info.
								  model );
	SUBDBG( "After _bgq_get_memory_info, retval=%d...\n", retval );
	if ( retval )
		return ( retval );
#if 1
	/* Setup Locks */
	for ( i = 0; i < PAPI_MAX_LOCK; i++ )
		thdLocks[i] = 0;  // MUTEX_OPEN
#else
	for( i = 0; i < PAPI_MAX_LOCK; i++ ) {
		pthread_mutex_init( &thdLocks[i], NULL );
	}
#endif
	
	/* Setup presets */
	retval = _papi_load_preset_table( "BGQ", 0, cidx );
	if ( retval ) {
		return retval;
	}	
	
	
	return ( PAPI_OK );
}


/*************************************/
/* CODE TO SUPPORT OPAQUE NATIVE MAP */
/*************************************/

/*
 * Event Name to Native Code
 */
int
_bgq_ntv_name_to_code( const char *name, unsigned int *event_code )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_ntv_name_to_code\n" );
#endif
	int ret;
#ifdef DEBUG_BGQ
	printf( "name = ===%s===\n", name );
#endif	

	/* Treat events differently if BGPM Opcodes are used */
	/* Opcode group selection values are "OR"ed together to create a desired 
	 mask of instruction group events to accumulate in the same counter */	
	if ( 0 == strncmp( name, "PEVT_INST_XU_GRP_MASK", strlen( "PEVT_INST_XU_GRP_MASK" ) ) ||
		 0 == strncmp( name, "PEVT_INST_QFPU_GRP_MASK", strlen( "PEVT_INST_QFPU_GRP_MASK" ) ) ) {

		char *pcolon;
		pcolon = strchr( name, ':' );
		
		// Found colon separator
		if ( pcolon != NULL ) {
			int mask_len = pcolon - name;
			strncpy( GenericEvent[num_opcode_events].mask, name,  mask_len  );
			strncpy( GenericEvent[num_opcode_events].opcode, pcolon+1, strlen(name) - 1 - mask_len );
			/* opcode_mask needs to be 'uint64_t',
			   hence we use strtoull() which returns an 'unsigned long long int' */
			GenericEvent[num_opcode_events].opcode_mask = strtoull( GenericEvent[num_opcode_events].opcode, (char **)NULL, 16 );
			GenericEvent[num_opcode_events].idx = OPCODE_BUF + num_opcode_events;
			/* Return event id matching the generic XU/QFPU event string */
			GenericEvent[num_opcode_events].eventId = Bgpm_GetEventIdFromLabel( GenericEvent[num_opcode_events].mask );
			if ( GenericEvent[num_opcode_events].eventId <= 0 ) {
#ifdef DEBUG_BGPM
				printf ("Error: ret value is %d for BGPM API function '%s'.\n",
						ret, "Bgpm_GetEventIdFromLabel" );
#endif
				return PAPI_ENOEVNT;
			}
			
			*event_code = GenericEvent[num_opcode_events].idx;
			
			num_opcode_events++;
			
			/* If there are too many opcode events than allocated, then allocate more room */
			if( num_opcode_events >= allocated_opcode_events ) {
				
				SUBDBG("Allocating more room for BGPM opcode events (%d %ld)\n",
					   ( allocated_opcode_events + NATIVE_OPCODE_CHUNK ),
					   ( long )sizeof( struct bgq_generic_events_t ) *
					   ( allocated_opcode_events + NATIVE_OPCODE_CHUNK ) );
				
				GenericEvent = realloc( GenericEvent, sizeof( struct bgq_generic_events_t ) *
									   ( allocated_opcode_events + OPCODE_EVENT_CHUNK ) );
				if ( NULL == GenericEvent ) {
					return PAPI_ENOMEM;
				}
				allocated_opcode_events += OPCODE_EVENT_CHUNK;
			}
        }
		else {
			SUBDBG( "Error: Found a generic BGPM event mask without opcode string\n" );
			return PAPI_ENOEVNT;
		}
		
		
#ifdef DEBUG_BGQ
		printf(_AT_ " _bgq_ntv_name_to_code: GenericEvent no. %d: \n", num_opcode_events-1 );
		printf(	"idx         = %d\n", GenericEvent[num_opcode_events-1].idx);
		printf(	"eventId     = %d\n", GenericEvent[num_opcode_events-1].eventId);
		printf(	"mask        = %s\n", GenericEvent[num_opcode_events-1].mask);
		printf(	"opcode      = %s\n", GenericEvent[num_opcode_events-1].opcode);
		printf( "opcode_mask = %#lX (%lu)\n", GenericEvent[num_opcode_events-1].opcode_mask,
			   GenericEvent[num_opcode_events-1].opcode_mask );
#endif
	}
	else {
		/* Return event id matching a given event label string */
		ret = Bgpm_GetEventIdFromLabel ( name );
		
		if ( ret <= 0 ) {
#ifdef DEBUG_BGPM
			printf ("Error: ret value is %d for BGPM API function '%s'.\n",
					ret, "Bgpm_GetEventIdFromLabel" );
#endif
			return PAPI_ENOEVNT;
		}
		else if ( ret > BGQ_PUNIT_MAX_EVENTS ) // not a PUnit event
			return PAPI_ENOEVNT;
		else
			*event_code = ( ret - 1 );		
	}
	
	return PAPI_OK;
}


/*
 * Native Code to Event Name
 *
 * Given a native event code, returns the short text label
 */
int
_bgq_ntv_code_to_name( unsigned int EventCode, char *name, int len )
{	
#ifdef DEBUG_BGQ	
	printf( "_bgq_ntv_code_to_name\n" );
#endif
	int index = ( EventCode & PAPI_NATIVE_AND_MASK ) + 1;
	
	if ( index >= MAX_COUNTERS )
		return PAPI_ENOEVNT;
			
	strncpy( name, Bgpm_GetEventIdLabel( index ), len );
	
	if ( name == NULL ) {
#ifdef DEBUG_BGPM
		printf ("Error: ret value is NULL for BGPM API function Bgpm_GetEventIdLabel.\n" );
#endif
		return PAPI_ENOEVNT;
	}
#ifdef DEBUG_BGQ
	printf( "name = ===%s===\n", name );
#endif	
	
	return ( PAPI_OK );
}

/*
 * Native Code to Event Description
 *
 * Given a native event code, returns the longer native event description
 */
int
_bgq_ntv_code_to_descr( unsigned int EventCode, char *name, int len )
{	
#ifdef DEBUG_BGQ
	printf( "_bgq_ntv_code_to_descr\n" );
#endif
	int retval;
	int index = ( EventCode & PAPI_NATIVE_AND_MASK ) + 1;

	retval = Bgpm_GetLongDesc( index, name, &len );
	retval = _check_BGPM_error( retval, "Bgpm_GetLongDesc" );						 
	if ( retval < 0 ) return retval;

	return ( PAPI_OK );
}

/*
 * Native Code to Bit Configuration
 *
 * Given a native event code, assigns the native event's
 * information to a given pointer.
 * NOTE: The info must be COPIED to location addressed by
 *       the provided pointer, not just referenced!
 * NOTE: For BG/Q, the bit configuration is not needed,
 *       as the native SPI is used to configure events.
 */
int
_bgq_ntv_code_to_bits( unsigned int EventCode, hwd_register_t * bits )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_ntv_code_to_bits\n" );
#endif
	
	( void ) EventCode;
	( void ) bits;
	
	return ( PAPI_OK );
}

/*
 * Native ENUM Events
 *
 */
int
_bgq_ntv_enum_events( unsigned int *EventCode, int modifier )
{
#ifdef DEBUG_BGQ
	printf( "_bgq_ntv_enum_events\n" );
#endif
	
	switch ( modifier ) {
		case PAPI_ENUM_FIRST:
			*EventCode = PAPI_NATIVE_MASK;
			
			return ( PAPI_OK );
			break;
			
		case PAPI_ENUM_EVENTS:
		{
			int index = ( *EventCode & PAPI_NATIVE_AND_MASK ) + 1;
			
			if ( index < BGQ_PUNIT_MAX_EVENTS ) {
				*EventCode = *EventCode + 1;
				return ( PAPI_OK );
			} else
				return ( PAPI_ENOEVNT );
			
			break;
		}
		default:
			return ( PAPI_EINVAL );
	}
	
	return ( PAPI_EINVAL );	
}


int 
_papi_hwi_init_os(void) {
	
	struct utsname uname_buffer;
	
	/* Get the kernel info */
    uname(&uname_buffer);
	
    strncpy(_papi_os_info.name,uname_buffer.sysname,PAPI_MAX_STR_LEN);
	
    strncpy(_papi_os_info.version,uname_buffer.release,PAPI_MAX_STR_LEN);
	
    _papi_os_info.itimer_sig = PAPI_INT_MPX_SIGNAL;
    _papi_os_info.itimer_num = PAPI_INT_ITIMER;
    _papi_os_info.itimer_res_ns = 1;
	
    return PAPI_OK;
}


/*
 * PAPI Vector Table for BG/Q
 */
papi_vector_t _bgq_vectors = {
	.cmp_info = {
				 /* Default component information (unspecified values are initialized to 0) */
				 .name = "linux-bgq",
				 .short_name = "bgq",
				 .description = "Blue Gene/Q component",
				 .num_cntrs = BGQ_PUNIT_MAX_COUNTERS,
				 .num_mpx_cntrs = BGQ_PUNIT_MAX_COUNTERS,
				 .num_native_events = BGQ_PUNIT_MAX_EVENTS,
				 .default_domain = PAPI_DOM_USER,
				 .available_domains = PAPI_DOM_USER | PAPI_DOM_KERNEL,
				 .default_granularity = PAPI_GRN_THR,
				 .available_granularities = PAPI_GRN_THR,
				 .hardware_intr_sig = PAPI_INT_SIGNAL,
				 .hardware_intr = 1,
				 .kernel_multiplex = 1,
		
				 /* component specific cmp_info initializations */
				 .fast_real_timer = 1,
				 .fast_virtual_timer = 0,
				 }
	,

	/* Sizes of framework-opaque component-private structures */
	.size = {
			 .context = sizeof ( hwd_context_t ),
			 .control_state = sizeof ( hwd_control_state_t ),
			 .reg_value = sizeof ( hwd_register_t ),
			 .reg_alloc = sizeof ( hwd_reg_alloc_t ),
			 }
	,
	/* Function pointers in this component */
//   .get_overflow_address =
	.start = _bgq_start,
	.stop = _bgq_stop,
	.read = _bgq_read,
	.reset = _bgq_reset,
	.write = _bgq_write,
	.stop_profiling = _bgq_stop_profiling,
	.init_component = _bgq_init_component,
	.init_thread = _bgq_init,
	.init_control_state = _bgq_init_control_state,
	.update_control_state = _bgq_update_control_state,
	.ctl = _bgq_ctl,
	.set_overflow = _bgq_set_overflow,
	//.dispatch_timer = _bgq_dispatch_timer,
	.set_profile = _bgq_set_profile,
	.set_domain = _bgq_set_domain,
	.ntv_enum_events = _bgq_ntv_enum_events,
	.ntv_name_to_code = _bgq_ntv_name_to_code,
	.ntv_code_to_name = _bgq_ntv_code_to_name,
	.ntv_code_to_descr = _bgq_ntv_code_to_descr,
	.ntv_code_to_bits = _bgq_ntv_code_to_bits,
	.allocate_registers = _bgq_allocate_registers,
	.cleanup_eventset = _bgq_cleanup_eventset,
	.shutdown_thread = _bgq_shutdown
//  .shutdown_global      =
//  .user                 =
};

papi_os_vector_t _papi_os_vector = {
	.get_memory_info = _bgq_get_memory_info,
	.get_dmem_info = _bgq_get_dmem_info,
	.get_real_cycles = _bgq_get_real_cycles,
	.get_real_usec = _bgq_get_real_usec,
	.get_virt_cycles = _bgq_get_virt_cycles,
	.get_virt_usec = _bgq_get_virt_usec,
	.get_system_info = _bgq_get_system_info
};