/****************************/ /* THIS IS OPEN SOURCE CODE */ /****************************/ /** * @file linux-bgq.c * @author Heike Jagode * jagode@eecs.utk.edu * Mods: < your name here > * < your email address > * Blue Gene/Q CPU component: BGPM / Punit * * Tested version of bgpm (early access) * * @brief * This file has the source code for a component that enables PAPI-C to * access hardware monitoring counters for BG/Q through the BGPM library. */ #include "papi.h" #include "papi_internal.h" #include "papi_lock.h" #include "papi_memory.h" #include "extras.h" #include "linux-bgq.h" #include "papi_vector.h" #include "error.h" /* * BG/Q specific 'stuff' */ #include #include #include #include #include #include #include #include #include "spi/include/upci/upci.h" #ifdef DEBUG_BGQ #include #endif // BG/Q macros #define get_cycles GetTimeBase // BG/Q external structures/functions/stuff #if 1 UPC_Lock_t thdLocks[PAPI_MAX_LOCK]; #else pthread_mutex_t thdLocks[PAPI_MAX_LOCK]; #endif /* Defined in papi_data.c */ //extern papi_mdi_t _papi_hwi_system_info; papi_vector_t _bgq_vectors; PAPI_os_info_t _papi_os_info; #define OPCODE_EVENT_CHUNK 8 static int allocated_opcode_events = 0; static int num_opcode_events = 0; struct bgq_generic_events_t { int idx; int eventId; char mask[PAPI_MIN_STR_LEN]; char opcode[PAPI_MIN_STR_LEN]; uint64_t opcode_mask; }; static struct bgq_generic_events_t *GenericEvent; /* Defined in linux-bgq-memory.c */ extern int _bgq_get_memory_info( PAPI_hw_info_t * pHwInfo, int pCPU_Type ); extern int _bgq_get_dmem_info( PAPI_dmem_info_t * pDmemInfo ); /* prototypes */ void user_signal_handler( int hEvtSet, uint64_t address, uint64_t ovfVector, const ucontext_t *pContext ); /******************************************************************************* ******** BEGIN FUNCTIONS USED INTERNALLY SPECIFIC TO THIS COMPONENT ********** ******************************************************************************/ /* * Lock */ void _papi_hwd_lock( int lock ) { #ifdef DEBUG_BGQ printf( _AT_ " _papi_hwd_lock %d\n", lock); #endif assert( lock < PAPI_MAX_LOCK ); #if 1 UPC_Lock( &thdLocks[lock] ); #else pthread_mutex_lock( &thdLocks[lock] ); #endif #ifdef DEBUG_BGQ printf( _AT_ " _papi_hwd_lock got lock %d\n", lock ); #endif return; } /* * Unlock */ void _papi_hwd_unlock( int lock ) { #ifdef DEBUG_BGQ printf( _AT_ " _papi_hwd_unlock %d\n", lock ); #endif assert( lock < PAPI_MAX_LOCK ); #if 1 UPC_Unlock( &thdLocks[lock] ); #else pthread_mutex_unlock( &thdLocks[lock] ); #endif return; } /* * Get System Information * * Initialize system information structure */ int _bgq_get_system_info( papi_mdi_t *mdi ) { #ifdef DEBUG_BGQ printf( "_bgq_get_system_info\n" ); #endif ( void ) mdi; Personality_t personality; int retval; /* Hardware info */ retval = Kernel_GetPersonality( &personality, sizeof( Personality_t ) ); if ( retval ) { fprintf( stdout, "Kernel_GetPersonality returned %d (sys error=%d).\n" "\t%s\n", retval, errno, strerror( errno ) ); return PAPI_ESYS; } /* Returns the number of processors that are associated with the currently * running process */ _papi_hwi_system_info.hw_info.ncpu = Kernel_ProcessorCount( ); // TODO: HJ Those values need to be fixed _papi_hwi_system_info.hw_info.nnodes = Kernel_ProcessCount( ); _papi_hwi_system_info.hw_info.totalcpus = _papi_hwi_system_info.hw_info.ncpu; _papi_hwi_system_info.hw_info.cpu_max_mhz = personality.Kernel_Config.FreqMHz; _papi_hwi_system_info.hw_info.cpu_min_mhz = personality.Kernel_Config.FreqMHz; _papi_hwi_system_info.hw_info.mhz = ( float ) personality.Kernel_Config.FreqMHz; SUBDBG( "_bgq_get_system_info: Detected MHZ is %f\n", _papi_hwi_system_info.hw_info.mhz ); return ( PAPI_OK ); } /* * Initialize Control State * */ int _bgq_init_control_state( hwd_control_state_t * ptr ) { #ifdef DEBUG_BGQ printf( "_bgq_init_control_state\n" ); #endif int retval; ptr->EventGroup = Bgpm_CreateEventSet(); retval = _check_BGPM_error( ptr->EventGroup, "Bgpm_CreateEventSet" ); if ( retval < 0 ) return retval; // initialize multiplexing flag to OFF (0) ptr->muxOn = 0; // initialize overflow flag to OFF (0) ptr->overflow = 0; ptr->overflow_count = 0; // initialized BGPM eventGroup flag to NOT applied yet (0) ptr->bgpm_eventset_applied = 0; return PAPI_OK; } /* * Set Domain */ int _bgq_set_domain( hwd_control_state_t * cntrl, int domain ) { #ifdef DEBUG_BGQ printf( "_bgq_set_domain\n" ); #endif int found = 0; ( void ) cntrl; if ( PAPI_DOM_USER & domain ) found = 1; if ( PAPI_DOM_KERNEL & domain ) found = 1; if ( PAPI_DOM_OTHER & domain ) found = 1; if ( !found ) return ( PAPI_EINVAL ); return ( PAPI_OK ); } /* * PAPI Initialization * This is called whenever a thread is initialized */ int _bgq_init( hwd_context_t * ctx ) { #ifdef DEBUG_BGQ printf( "_bgq_init\n" ); #endif ( void ) ctx; int retval; #ifdef DEBUG_BGPM Bgpm_PrintOnError(1); Bgpm_ExitOnError(0); #else Bgpm_PrintOnError(0); // avoid bgpm default of exiting when error occurs - caller will check return code instead. Bgpm_ExitOnError(0); #endif retval = Bgpm_Init( BGPM_MODE_SWDISTRIB ); retval = _check_BGPM_error( retval, "Bgpm_Init" ); if ( retval < 0 ) return retval; //_common_initBgpm(); return PAPI_OK; } int _bgq_multiplex( hwd_control_state_t * bgq_state ) { int retval; uint64_t bgpm_period; double Sec, Hz; #ifdef DEBUG_BGQ printf("_bgq_multiplex BEGIN: Num of Events = %d (vs %d)\n", Bgpm_NumEvents( bgq_state->EventGroup ), bgq_state->count ); #endif // convert Mhz to Hz ( = cycles / sec ) Hz = (double) _papi_hwi_system_info.hw_info.cpu_max_mhz * 1000 * 1000; // convert PAPI multiplex period (in ns) to BGPM period (in cycles) Sec = (double) _papi_os_info.itimer_ns / ( 1000 * 1000 * 1000 ); bgpm_period = Hz * Sec; // if EventGroup is not empty -- which is required by BGPM before // we can call SetMultiplex() -- then drain the events from the // BGPM EventGroup, turn on multiplex flag, and rebuild BGPM EventGroup. if ( 0 < bgq_state->count ) { // Delete and re-create BGPM eventset retval = _common_deleteRecreate( &bgq_state->EventGroup ); if ( retval < 0 ) return retval; // turn on multiplex for BGPM retval = Bgpm_SetMultiplex( bgq_state->EventGroup, bgpm_period, BGPM_NORMAL ); retval = _check_BGPM_error( retval, "Bgpm_SetMultiplex" ); if ( retval < 0 ) return retval; // rebuild BGPM EventGroup retval = _common_rebuildEventgroup( bgq_state->count, bgq_state->EventGroup_local, &bgq_state->EventGroup ); if ( retval < 0 ) return retval; } else { // need to pass either BGPM_NORMAL or BGPM_NOTNORMAL // BGPM_NORMAL: numbers reported by Bgpm_ReadEvent() are normalized // to the maximum time spent in a multiplexed group retval = Bgpm_SetMultiplex( bgq_state->EventGroup, bgpm_period, BGPM_NORMAL ); retval = _check_BGPM_error( retval, "Bgpm_SetMultiplex" ); if ( retval < 0 ) return retval; } #ifdef DEBUG_BGQ printf("_bgq_multiplex END: Num of Events = %d (vs %d) --- retval = %d\n", Bgpm_NumEvents( bgq_state->EventGroup ), bgq_state->count, retval ); #endif return ( retval ); } /* * Register Allocation * */ int _bgq_allocate_registers( EventSetInfo_t * ESI ) { #ifdef DEBUG_BGQ printf("_bgq_allocate_registers\n"); #endif int i, natNum; int xEventId; /* * Start monitoring the events... */ natNum = ESI->NativeCount; for ( i = 0; i < natNum; i++ ) { xEventId = ( ESI->NativeInfoArray[i].ni_event & PAPI_NATIVE_AND_MASK ) + 1; ESI->NativeInfoArray[i].ni_position = i; } return PAPI_OK; } /* * PAPI Cleanup Eventset * * Destroy and re-create the BGPM / Punit EventSet */ int _bgq_cleanup_eventset( hwd_control_state_t * ctrl ) { #ifdef DEBUG_BGQ printf( "_bgq_cleanup_eventset\n" ); #endif // set multiplexing flag to OFF (0) ctrl->muxOn = 0; // set overflow flag to OFF (0) ctrl->overflow = 0; ctrl->overflow_count = 0; // set BGPM eventGroup flag back to NOT applied yet (0) ctrl->bgpm_eventset_applied = 0; return ( PAPI_OK ); } /* * Update Control State * * This function clears the current contents of the control * structure and updates it with whatever resources are allocated * for all the native events in the native info structure array. */ int _bgq_update_control_state( hwd_control_state_t * ptr, NativeInfo_t * native, int count, hwd_context_t * ctx ) { #ifdef DEBUG_BGQ printf( _AT_ " _bgq_update_control_state: count = %d, EventGroup=%d\n", count, ptr->EventGroup ); #endif ( void ) ctx; int i, j, k, index, retval; unsigned evtIdx; // Delete and re-create BGPM eventset retval = _common_deleteRecreate( &ptr->EventGroup ); if ( retval < 0 ) return retval; #ifdef DEBUG_BGQ printf( _AT_ " _bgq_update_control_state: EventGroup=%d, muxOn = %d, overflow = %d\n", ptr->EventGroup, ptr->muxOn, ptr->overflow ); #endif // add the events to the eventset for ( i = 0; i < count; i++ ) { index = ( native[i].ni_event & PAPI_NATIVE_AND_MASK ) + 1; ptr->EventGroup_local[i] = index; // we found an opcode event if ( index > BGQ_PUNIT_MAX_EVENTS ) { for( j = 0; j < num_opcode_events; j++ ) { #ifdef DEBUG_BGQ printf(_AT_ " _bgq_update_control_state: %d out of %d OPCODES\n", j, num_opcode_events ); #endif #ifdef DEBUG_BGQ printf(_AT_ " _bgq_update_control_state: j's idx = %d, index = %d\n", GenericEvent[j].idx, index ); #endif if ( GenericEvent[j].idx == ( index - 1) ) { /* Add events to the BGPM eventGroup */ retval = Bgpm_AddEvent( ptr->EventGroup, GenericEvent[j].eventId ); retval = _check_BGPM_error( retval, "Bgpm_AddEvent" ); if ( retval < 0 ) return retval; #ifdef DEBUG_BGQ printf(_AT_ " _bgq_update_control_state: ADD event: i = %d, eventId = %d\n", i, GenericEvent[j].eventId ); #endif evtIdx = Bgpm_GetEventIndex( ptr->EventGroup, GenericEvent[j].eventId, i ); #ifdef DEBUG_BGQ printf(_AT_ " _bgq_update_control_state: evtIdx in EventGroup = %d\n", evtIdx ); #endif if ( 0 == strcmp( GenericEvent[j].mask, "PEVT_INST_XU_GRP_MASK" ) ) { retval = Bgpm_SetXuGrpMask( ptr->EventGroup, evtIdx, GenericEvent[j].opcode_mask ); retval = _check_BGPM_error( retval, "Bgpm_SetXuGrpMask" ); if ( retval < 0 ) return retval; #ifdef DEBUG_BGQ printf(_AT_ " _bgq_update_control_state: it's PEVT_INST_XU_GRP_MASK\n" ); #endif } else if ( 0 == strcmp( GenericEvent[j].mask, "PEVT_INST_QFPU_GRP_MASK" ) ) { retval = Bgpm_SetQfpuGrpMask( ptr->EventGroup, evtIdx, GenericEvent[j].opcode_mask ); retval = _check_BGPM_error( retval, "Bgpm_SetQfpuGrpMask" ); if ( retval < 0 ) return retval; #ifdef DEBUG_BGQ printf(_AT_ " _bgq_update_control_state: it's PEVT_INST_QFPU_GRP_MASK\n" ); #endif } } } } else { #ifdef DEBUG_BGQ printf(_AT_ " _bgq_update_control_state: no OPCODE\n" ); #endif /* Add events to the BGPM eventGroup */ retval = Bgpm_AddEvent( ptr->EventGroup, index ); retval = _check_BGPM_error( retval, "Bgpm_AddEvent" ); if ( retval < 0 ) return retval; #ifdef DEBUG_BGQ printf(_AT_ " _bgq_update_control_state: ADD event: i = %d, index = %d\n", i, index ); #endif } } // store how many events we added to an EventSet ptr->count = count; // if muxOn and EventGroup is not empty -- which is required by BGPM before // we can call SetMultiplex() -- then drain the events from the // BGPM EventGroup, turn on multiplex flag, and rebuild BGPM EventGroup. if ( 1 == ptr->muxOn ) { retval = _bgq_multiplex( ptr ); } // since update_control_state trashes overflow settings, this puts things // back into balance for BGPM if ( 1 == ptr->overflow ) { for ( k = 0; k < ptr->overflow_count; k++ ) { retval = _common_set_overflow_BGPM( ptr->EventGroup, ptr->overflow_list[k].EventIndex, ptr->overflow_list[k].threshold, user_signal_handler ); if ( retval < 0 ) return retval; } } return ( PAPI_OK ); } /* * PAPI Start */ int _bgq_start( hwd_context_t * ctx, hwd_control_state_t * ptr ) { #ifdef DEBUG_BGQ printf( "BEGIN _bgq_start\n" ); #endif ( void ) ctx; int retval; retval = Bgpm_Apply( ptr->EventGroup ); retval = _check_BGPM_error( retval, "Bgpm_Apply" ); if ( retval < 0 ) return retval; // set flag to 1: BGPM eventGroup HAS BEEN applied ptr->bgpm_eventset_applied = 1; #ifdef DEBUG_BGQ int i; int numEvts = Bgpm_NumEvents( ptr->EventGroup ); for ( i = 0; i < numEvts; i++ ) { printf("%d = %s\n", i, Bgpm_GetEventLabel( ptr->EventGroup, i) ); } #endif /* Bgpm_Apply() does an implicit reset; hence no need to use Bgpm_ResetStart */ retval = Bgpm_Start( ptr->EventGroup ); retval = _check_BGPM_error( retval, "Bgpm_Start" ); if ( retval < 0 ) return retval; return ( PAPI_OK ); } /* * PAPI Stop */ int _bgq_stop( hwd_context_t * ctx, hwd_control_state_t * ptr ) { #ifdef DEBUG_BGQ printf( "BEGIN _bgq_stop\n" ); #endif ( void ) ctx; int retval; retval = Bgpm_Stop( ptr->EventGroup ); retval = _check_BGPM_error( retval, "Bgpm_Stop" ); if ( retval < 0 ) return retval; return ( PAPI_OK ); } /* * PAPI Read Counters * * Read the counters into local storage */ int _bgq_read( hwd_context_t * ctx, hwd_control_state_t * ptr, long_long ** dp, int flags ) { #ifdef DEBUG_BGQ printf( "_bgq_read\n" ); #endif ( void ) ctx; ( void ) flags; int i, numEvts; numEvts = Bgpm_NumEvents( ptr->EventGroup ); if ( numEvts == 0 ) { #ifdef DEBUG_BGPM printf ("Error: ret value is %d for BGPM API function Bgpm_NumEvents.\n", numEvts ); //return ( EXIT_FAILURE ); #endif } for ( i = 0; i < numEvts; i++ ) ptr->counters[i] = _common_getEventValue( i, ptr->EventGroup ); *dp = ptr->counters; return ( PAPI_OK ); } /* * PAPI Reset * * Zero the counter values */ int _bgq_reset( hwd_context_t * ctx, hwd_control_state_t * ptr ) { #ifdef DEBUG_BGQ printf( "_bgq_reset\n" ); #endif ( void ) ctx; int retval; /* we can't simply call Bgpm_Reset() since PAPI doesn't have the restriction that an EventSet has to be stopped before resetting is possible. However, BGPM does have this restriction. Hence we need to stop, reset and start */ retval = Bgpm_Stop( ptr->EventGroup ); retval = _check_BGPM_error( retval, "Bgpm_Stop" ); if ( retval < 0 ) return retval; retval = Bgpm_ResetStart( ptr->EventGroup ); retval = _check_BGPM_error( retval, "Bgpm_ResetStart" ); if ( retval < 0 ) return retval; return ( PAPI_OK ); } /* * PAPI Shutdown * * This routine is for shutting down threads, * including the master thread. * Effectively a no-op, same as BG/L/P... */ int _bgq_shutdown( hwd_context_t * ctx ) { #ifdef DEBUG_BGQ printf( "_bgq_shutdown\n" ); #endif ( void ) ctx; int retval; /* Disable BGPM library */ retval = Bgpm_Disable(); retval = _check_BGPM_error( retval, "Bgpm_Disable" ); if ( retval < 0 ) return retval; return ( PAPI_OK ); } /* * PAPI Write * * Write counter values * NOTE: Could possible support, but signal error as BG/L/P does... */ int _bgq_write( hwd_context_t * ctx, hwd_control_state_t * cntrl, long_long * from ) { #ifdef DEBUG_BGQ printf( "_bgq_write\n" ); #endif ( void ) ctx; ( void ) cntrl; ( void ) from; return PAPI_ECMP; } /* * Dispatch Timer * * NOT the same as BG/L/P where we simply return * This function is used when hardware overflows are working or when * software overflows are forced */ void _bgq_dispatch_timer( int signal, hwd_siginfo_t * info, void *uc ) { ( void ) signal; ( void ) info; ( void ) uc; #ifdef DEBUG_BGQ printf("BEGIN _bgq_dispatch_timer\n"); #endif return; } /* * user_signal_handler * * This function is used when hardware overflows are working or when * software overflows are forced */ void user_signal_handler( int hEvtSet, uint64_t address, uint64_t ovfVector, const ucontext_t *pContext ) { #ifdef DEBUG_BGQ printf( "user_signal_handler start\n" ); #endif ( void ) address; int retval; unsigned i; int isHardware = 1; int cidx = _bgq_vectors.cmp_info.CmpIdx; long_long overflow_bit = 0; caddr_t address1; _papi_hwi_context_t ctx; ctx.ucontext = ( hwd_ucontext_t * ) pContext; ThreadInfo_t *thread = _papi_hwi_lookup_thread( 0 ); //printf(_AT_ " thread = %p\n", thread); // <<<<<<<<<<<<<<<<<< EventSetInfo_t *ESI; ESI = thread->running_eventset[cidx]; // Get the indices of all events which have overflowed. unsigned ovfIdxs[BGPM_MAX_OVERFLOW_EVENTS]; unsigned len = BGPM_MAX_OVERFLOW_EVENTS; retval = Bgpm_GetOverflowEventIndices( hEvtSet, ovfVector, ovfIdxs, &len ); if ( retval < 0 ) { #ifdef DEBUG_BGPM printf ( "Error: ret value is %d for BGPM API function Bgpm_GetOverflowEventIndices.\n", retval ); #endif return; } if ( thread == NULL ) { PAPIERROR( "thread == NULL in user_signal_handler!" ); return; } if ( ESI == NULL ) { PAPIERROR( "ESI == NULL in user_signal_handler!"); return; } if ( ESI->overflow.flags == 0 ) { PAPIERROR( "ESI->overflow.flags == 0 in user_signal_handler!"); return; } for ( i = 0; i < len; i++ ) { uint64_t hProf; Bgpm_GetEventUser1( hEvtSet, ovfIdxs[i], &hProf ); if ( hProf ) { overflow_bit ^= 1 << ovfIdxs[i]; break; } } if ( ESI->overflow.flags & PAPI_OVERFLOW_FORCE_SW ) { #ifdef DEBUG_BGQ printf("OVERFLOW_SOFTWARE\n"); #endif address1 = GET_OVERFLOW_ADDRESS( ctx ); _papi_hwi_dispatch_overflow_signal( ( void * ) &ctx, address1, NULL, 0, 0, &thread, cidx ); return; } else if ( ESI->overflow.flags & PAPI_OVERFLOW_HARDWARE ) { #ifdef DEBUG_BGQ printf("OVERFLOW_HARDWARE\n"); #endif address1 = GET_OVERFLOW_ADDRESS( ctx ); _papi_hwi_dispatch_overflow_signal( ( void * ) &ctx, address1, &isHardware, overflow_bit, 0, &thread, cidx ); } else { #ifdef DEBUG_BGQ printf("OVERFLOW_NONE\n"); #endif PAPIERROR( "ESI->overflow.flags is set to something other than PAPI_OVERFLOW_HARDWARE or PAPI_OVERFLOW_FORCE_SW (%#x)", thread->running_eventset[cidx]->overflow.flags); } } /* * Set Overflow * * This is commented out in BG/L/P - need to explore and complete... * However, with true 64-bit counters in BG/Q and all counters for PAPI * always starting from a true zero (we don't allow write...), the possibility * for overflow is remote at best... */ int _bgq_set_overflow( EventSetInfo_t * ESI, int EventIndex, int threshold ) { #ifdef DEBUG_BGQ printf("BEGIN _bgq_set_overflow\n"); #endif hwd_control_state_t * this_state = ( hwd_control_state_t * ) ESI->ctl_state; int retval; int evt_idx; /* * In case an BGPM eventGroup HAS BEEN applied or attached before * overflow is set, delete the eventGroup and create an new empty one, * and rebuild as it was prior to deletion */ #ifdef DEBUG_BGQ printf( "_bgq_set_overflow: bgpm_eventset_applied = %d, threshold = %d\n", this_state->bgpm_eventset_applied, threshold ); #endif if ( 1 == this_state->bgpm_eventset_applied && 0 != threshold ) { retval = _common_deleteRecreate( &this_state->EventGroup ); if ( retval < 0 ) return retval; retval = _common_rebuildEventgroup( this_state->count, this_state->EventGroup_local, &this_state->EventGroup ); if ( retval < 0 ) return retval; /* set BGPM eventGroup flag back to NOT applied yet (0) * because the eventGroup has been recreated from scratch */ this_state->bgpm_eventset_applied = 0; } evt_idx = ESI->EventInfoArray[EventIndex].pos[0]; //evt_id = ( ESI->NativeInfoArray[EventIndex].ni_event & PAPI_NATIVE_AND_MASK ) + 1; SUBDBG( "Hardware counter %d (vs %d) used in overflow, threshold %d\n", evt_idx, EventIndex, threshold ); #ifdef DEBUG_BGQ printf( "Hardware counter %d (vs %d) used in overflow, threshold %d\n", evt_idx, EventIndex, threshold ); #endif /* If this counter isn't set to overflow, it's an error */ if ( threshold == 0 ) { /* Remove the signal handler */ retval = _papi_hwi_stop_signal( _bgq_vectors.cmp_info.hardware_intr_sig ); if ( retval != PAPI_OK ) return ( retval ); } else { this_state->overflow = 1; this_state->overflow_count++; this_state->overflow_list[this_state->overflow_count-1].threshold = threshold; this_state->overflow_list[this_state->overflow_count-1].EventIndex = evt_idx; #ifdef DEBUG_BGQ printf( "_bgq_set_overflow: Enable the signal handler\n" ); #endif /* Enable the signal handler */ retval = _papi_hwi_start_signal( _bgq_vectors.cmp_info.hardware_intr_sig, NEED_CONTEXT, _bgq_vectors.cmp_info.CmpIdx ); if ( retval != PAPI_OK ) return ( retval ); retval = _common_set_overflow_BGPM( this_state->EventGroup, this_state->overflow_list[this_state->overflow_count-1].EventIndex, this_state->overflow_list[this_state->overflow_count-1].threshold, user_signal_handler ); if ( retval < 0 ) return retval; } return ( PAPI_OK ); } /* * Set Profile * * Same as for BG/L/P, routine not used and returns error */ int _bgq_set_profile( EventSetInfo_t * ESI, int EventIndex, int threshold ) { #ifdef DEBUG_BGQ printf("BEGIN _bgq_set_profile\n"); #endif ( void ) ESI; ( void ) EventIndex; ( void ) threshold; return PAPI_ECMP; } /* * Stop Profiling * * Same as for BG/L/P... */ int _bgq_stop_profiling( ThreadInfo_t * master, EventSetInfo_t * ESI ) { #ifdef DEBUG_BGQ printf("BEGIN _bgq_stop_profiling\n"); #endif ( void ) master; ( void ) ESI; return ( PAPI_OK ); } /* * PAPI Control * * Same as for BG/L/P - initialize the domain */ int _bgq_ctl( hwd_context_t * ctx, int code, _papi_int_option_t * option ) { #ifdef DEBUG_BGQ printf( "_bgq_ctl\n" ); #endif ( void ) ctx; int retval; switch ( code ) { case PAPI_MULTIPLEX: { hwd_control_state_t * bgq_state = ( ( hwd_control_state_t * ) option->multiplex.ESI->ctl_state ); bgq_state->muxOn = 1; retval = _bgq_multiplex( bgq_state ); return ( retval ); } default: return ( PAPI_OK ); } } /* * Get Real Micro-seconds */ long long _bgq_get_real_usec( void ) { #ifdef DEBUG_BGQ printf( "_bgq_get_real_usec\n" ); #endif /* * NOTE: _papi_hwi_system_info.hw_info.mhz is really a representation of unit of time per cycle. * On BG/P, it's value is 8.5e-4. Therefore, to get cycles per sec, we have to multiply * by 1.0e12. To then convert to usec, we have to divide by 1.0e-3. */ return ( ( long long ) ( ( ( float ) get_cycles( ) ) / ( ( _papi_hwi_system_info.hw_info.cpu_max_mhz ) ) ) ); } /* * Get Real Cycles * * Same for BG/L/P, using native function... */ long long _bgq_get_real_cycles( void ) { #ifdef DEBUG_BGQ printf( "_bgq_get_real_cycles\n" ); #endif return ( ( long long ) get_cycles( ) ); } /* * Get Virtual Micro-seconds * * Same calc as for BG/L/P, returns real usec... */ long long _bgq_get_virt_usec( void ) { #ifdef DEBUG_BGQ printf( "_bgq_get_virt_usec\n" ); #endif return _bgq_get_real_usec( ); } /* * Get Virtual Cycles * * Same calc as for BG/L/P, returns real cycles... */ long long _bgq_get_virt_cycles( void ) { #ifdef DEBUG_BGQ printf( "_bgq_get_virt_cycles\n" ); #endif return _bgq_get_real_cycles( ); } /* * Component setup and shutdown * * Initialize hardware counters, setup the function vector table * and get hardware information, this routine is called when the * PAPI process is initialized (IE PAPI_library_init) */ int _bgq_init_component( int cidx ) { #ifdef DEBUG_BGQ printf("_bgq_init_substrate\n"); //printf("_bgq_init_substrate: 1. BGPM_INITIALIZED = %d \n", BGPM_INITIALIZED); #endif int retval; int i; /* allocate the opcode event structure */ GenericEvent = calloc( OPCODE_EVENT_CHUNK, sizeof( struct bgq_generic_events_t ) ); if ( NULL == GenericEvent ) { return PAPI_ENOMEM; } /* init opcode event stuff */ allocated_opcode_events = OPCODE_EVENT_CHUNK; num_opcode_events = 0; _bgq_vectors.cmp_info.CmpIdx = cidx; /* * Fill in what we can of the papi_system_info */ SUBDBG( "Before _bgq_get_system_info()...\n" ); retval = _bgq_get_system_info( &_papi_hwi_system_info ); SUBDBG( "After _bgq_get_system_info(), retval=%d...\n", retval ); if ( retval != PAPI_OK ) return ( retval ); /* * Setup memory info */ SUBDBG( "Before _bgq_get_memory_info...\n" ); retval = _bgq_get_memory_info( &_papi_hwi_system_info.hw_info, ( int ) _papi_hwi_system_info.hw_info. model ); SUBDBG( "After _bgq_get_memory_info, retval=%d...\n", retval ); if ( retval ) return ( retval ); #if 1 /* Setup Locks */ for ( i = 0; i < PAPI_MAX_LOCK; i++ ) thdLocks[i] = 0; // MUTEX_OPEN #else for( i = 0; i < PAPI_MAX_LOCK; i++ ) { pthread_mutex_init( &thdLocks[i], NULL ); } #endif /* Setup presets */ retval = _papi_load_preset_table( "BGQ", 0, cidx ); if ( retval ) { return retval; } return ( PAPI_OK ); } /*************************************/ /* CODE TO SUPPORT OPAQUE NATIVE MAP */ /*************************************/ /* * Event Name to Native Code */ int _bgq_ntv_name_to_code( const char *name, unsigned int *event_code ) { #ifdef DEBUG_BGQ printf( "_bgq_ntv_name_to_code\n" ); #endif int ret; #ifdef DEBUG_BGQ printf( "name = ===%s===\n", name ); #endif /* Treat events differently if BGPM Opcodes are used */ /* Opcode group selection values are "OR"ed together to create a desired mask of instruction group events to accumulate in the same counter */ if ( 0 == strncmp( name, "PEVT_INST_XU_GRP_MASK", strlen( "PEVT_INST_XU_GRP_MASK" ) ) || 0 == strncmp( name, "PEVT_INST_QFPU_GRP_MASK", strlen( "PEVT_INST_QFPU_GRP_MASK" ) ) ) { char *pcolon; pcolon = strchr( name, ':' ); // Found colon separator if ( pcolon != NULL ) { int mask_len = pcolon - name; strncpy( GenericEvent[num_opcode_events].mask, name, mask_len ); strncpy( GenericEvent[num_opcode_events].opcode, pcolon+1, strlen(name) - 1 - mask_len ); /* opcode_mask needs to be 'uint64_t', hence we use strtoull() which returns an 'unsigned long long int' */ GenericEvent[num_opcode_events].opcode_mask = strtoull( GenericEvent[num_opcode_events].opcode, (char **)NULL, 16 ); GenericEvent[num_opcode_events].idx = OPCODE_BUF + num_opcode_events; /* Return event id matching the generic XU/QFPU event string */ GenericEvent[num_opcode_events].eventId = Bgpm_GetEventIdFromLabel( GenericEvent[num_opcode_events].mask ); if ( GenericEvent[num_opcode_events].eventId <= 0 ) { #ifdef DEBUG_BGPM printf ("Error: ret value is %d for BGPM API function '%s'.\n", ret, "Bgpm_GetEventIdFromLabel" ); #endif return PAPI_ENOEVNT; } *event_code = GenericEvent[num_opcode_events].idx; num_opcode_events++; /* If there are too many opcode events than allocated, then allocate more room */ if( num_opcode_events >= allocated_opcode_events ) { SUBDBG("Allocating more room for BGPM opcode events (%d %ld)\n", ( allocated_opcode_events + NATIVE_OPCODE_CHUNK ), ( long )sizeof( struct bgq_generic_events_t ) * ( allocated_opcode_events + NATIVE_OPCODE_CHUNK ) ); GenericEvent = realloc( GenericEvent, sizeof( struct bgq_generic_events_t ) * ( allocated_opcode_events + OPCODE_EVENT_CHUNK ) ); if ( NULL == GenericEvent ) { return PAPI_ENOMEM; } allocated_opcode_events += OPCODE_EVENT_CHUNK; } } else { SUBDBG( "Error: Found a generic BGPM event mask without opcode string\n" ); return PAPI_ENOEVNT; } #ifdef DEBUG_BGQ printf(_AT_ " _bgq_ntv_name_to_code: GenericEvent no. %d: \n", num_opcode_events-1 ); printf( "idx = %d\n", GenericEvent[num_opcode_events-1].idx); printf( "eventId = %d\n", GenericEvent[num_opcode_events-1].eventId); printf( "mask = %s\n", GenericEvent[num_opcode_events-1].mask); printf( "opcode = %s\n", GenericEvent[num_opcode_events-1].opcode); printf( "opcode_mask = %#lX (%lu)\n", GenericEvent[num_opcode_events-1].opcode_mask, GenericEvent[num_opcode_events-1].opcode_mask ); #endif } else { /* Return event id matching a given event label string */ ret = Bgpm_GetEventIdFromLabel ( name ); if ( ret <= 0 ) { #ifdef DEBUG_BGPM printf ("Error: ret value is %d for BGPM API function '%s'.\n", ret, "Bgpm_GetEventIdFromLabel" ); #endif return PAPI_ENOEVNT; } else if ( ret > BGQ_PUNIT_MAX_EVENTS ) // not a PUnit event return PAPI_ENOEVNT; else *event_code = ( ret - 1 ); } return PAPI_OK; } /* * Native Code to Event Name * * Given a native event code, returns the short text label */ int _bgq_ntv_code_to_name( unsigned int EventCode, char *name, int len ) { #ifdef DEBUG_BGQ printf( "_bgq_ntv_code_to_name\n" ); #endif int index = ( EventCode & PAPI_NATIVE_AND_MASK ) + 1; if ( index >= MAX_COUNTERS ) return PAPI_ENOEVNT; strncpy( name, Bgpm_GetEventIdLabel( index ), len ); if ( name == NULL ) { #ifdef DEBUG_BGPM printf ("Error: ret value is NULL for BGPM API function Bgpm_GetEventIdLabel.\n" ); #endif return PAPI_ENOEVNT; } #ifdef DEBUG_BGQ printf( "name = ===%s===\n", name ); #endif return ( PAPI_OK ); } /* * Native Code to Event Description * * Given a native event code, returns the longer native event description */ int _bgq_ntv_code_to_descr( unsigned int EventCode, char *name, int len ) { #ifdef DEBUG_BGQ printf( "_bgq_ntv_code_to_descr\n" ); #endif int retval; int index = ( EventCode & PAPI_NATIVE_AND_MASK ) + 1; retval = Bgpm_GetLongDesc( index, name, &len ); retval = _check_BGPM_error( retval, "Bgpm_GetLongDesc" ); if ( retval < 0 ) return retval; return ( PAPI_OK ); } /* * Native Code to Bit Configuration * * Given a native event code, assigns the native event's * information to a given pointer. * NOTE: The info must be COPIED to location addressed by * the provided pointer, not just referenced! * NOTE: For BG/Q, the bit configuration is not needed, * as the native SPI is used to configure events. */ int _bgq_ntv_code_to_bits( unsigned int EventCode, hwd_register_t * bits ) { #ifdef DEBUG_BGQ printf( "_bgq_ntv_code_to_bits\n" ); #endif ( void ) EventCode; ( void ) bits; return ( PAPI_OK ); } /* * Native ENUM Events * */ int _bgq_ntv_enum_events( unsigned int *EventCode, int modifier ) { #ifdef DEBUG_BGQ printf( "_bgq_ntv_enum_events\n" ); #endif switch ( modifier ) { case PAPI_ENUM_FIRST: *EventCode = PAPI_NATIVE_MASK; return ( PAPI_OK ); break; case PAPI_ENUM_EVENTS: { int index = ( *EventCode & PAPI_NATIVE_AND_MASK ) + 1; if ( index < BGQ_PUNIT_MAX_EVENTS ) { *EventCode = *EventCode + 1; return ( PAPI_OK ); } else return ( PAPI_ENOEVNT ); break; } default: return ( PAPI_EINVAL ); } return ( PAPI_EINVAL ); } int _papi_hwi_init_os(void) { struct utsname uname_buffer; /* Get the kernel info */ uname(&uname_buffer); strncpy(_papi_os_info.name,uname_buffer.sysname,PAPI_MAX_STR_LEN); strncpy(_papi_os_info.version,uname_buffer.release,PAPI_MAX_STR_LEN); _papi_os_info.itimer_sig = PAPI_INT_MPX_SIGNAL; _papi_os_info.itimer_num = PAPI_INT_ITIMER; _papi_os_info.itimer_res_ns = 1; return PAPI_OK; } /* * PAPI Vector Table for BG/Q */ papi_vector_t _bgq_vectors = { .cmp_info = { /* Default component information (unspecified values are initialized to 0) */ .name = "linux-bgq", .short_name = "bgq", .description = "Blue Gene/Q component", .num_cntrs = BGQ_PUNIT_MAX_COUNTERS, .num_mpx_cntrs = BGQ_PUNIT_MAX_COUNTERS, .num_native_events = BGQ_PUNIT_MAX_EVENTS, .default_domain = PAPI_DOM_USER, .available_domains = PAPI_DOM_USER | PAPI_DOM_KERNEL, .default_granularity = PAPI_GRN_THR, .available_granularities = PAPI_GRN_THR, .hardware_intr_sig = PAPI_INT_SIGNAL, .hardware_intr = 1, .kernel_multiplex = 1, /* component specific cmp_info initializations */ .fast_real_timer = 1, .fast_virtual_timer = 0, } , /* Sizes of framework-opaque component-private structures */ .size = { .context = sizeof ( hwd_context_t ), .control_state = sizeof ( hwd_control_state_t ), .reg_value = sizeof ( hwd_register_t ), .reg_alloc = sizeof ( hwd_reg_alloc_t ), } , /* Function pointers in this component */ // .get_overflow_address = .start = _bgq_start, .stop = _bgq_stop, .read = _bgq_read, .reset = _bgq_reset, .write = _bgq_write, .stop_profiling = _bgq_stop_profiling, .init_component = _bgq_init_component, .init_thread = _bgq_init, .init_control_state = _bgq_init_control_state, .update_control_state = _bgq_update_control_state, .ctl = _bgq_ctl, .set_overflow = _bgq_set_overflow, //.dispatch_timer = _bgq_dispatch_timer, .set_profile = _bgq_set_profile, .set_domain = _bgq_set_domain, .ntv_enum_events = _bgq_ntv_enum_events, .ntv_name_to_code = _bgq_ntv_name_to_code, .ntv_code_to_name = _bgq_ntv_code_to_name, .ntv_code_to_descr = _bgq_ntv_code_to_descr, .ntv_code_to_bits = _bgq_ntv_code_to_bits, .allocate_registers = _bgq_allocate_registers, .cleanup_eventset = _bgq_cleanup_eventset, .shutdown_thread = _bgq_shutdown // .shutdown_global = // .user = }; papi_os_vector_t _papi_os_vector = { .get_memory_info = _bgq_get_memory_info, .get_dmem_info = _bgq_get_dmem_info, .get_real_cycles = _bgq_get_real_cycles, .get_real_usec = _bgq_get_real_usec, .get_virt_cycles = _bgq_get_virt_cycles, .get_virt_usec = _bgq_get_virt_usec, .get_system_info = _bgq_get_system_info };