Blob Blame History Raw
/*
* File:    linux-common.c
*/

#include <unistd.h>
#include <string.h>
#include <stdlib.h>
#include <ctype.h>
#include <err.h>
#include <stdarg.h>
#include <stdio.h>
#include <errno.h>
#include <syscall.h>
#include <sys/utsname.h>
#include <sys/time.h>

#include "papi.h"
#include "papi_internal.h"
#include "papi_vector.h"

#include "linux-memory.h"
#include "linux-common.h"
#include "linux-timer.h"

#include "x86_cpuid_info.h"

PAPI_os_info_t _papi_os_info;

/* The locks used by Linux */

#if defined(USE_PTHREAD_MUTEXES)
pthread_mutex_t _papi_hwd_lock_data[PAPI_MAX_LOCK];
#else
volatile unsigned int _papi_hwd_lock_data[PAPI_MAX_LOCK];
#endif


static int _linux_init_locks(void) {

   int i;

   for ( i = 0; i < PAPI_MAX_LOCK; i++ ) {
#if defined(USE_PTHREAD_MUTEXES)
       pthread_mutex_init(&_papi_hwd_lock_data[i],NULL);
#else
       _papi_hwd_lock_data[i] = MUTEX_OPEN;
#endif
   }

   return PAPI_OK;
}


int
_linux_detect_hypervisor(char *virtual_vendor_name) {

	int retval=0;

#if defined(__i386__)||defined(__x86_64__)
	retval=_x86_detect_hypervisor(virtual_vendor_name);
#else
	(void) virtual_vendor_name;
#endif

	return retval;
}


#define _PATH_SYS_SYSTEM "/sys/devices/system"
#define _PATH_SYS_CPU0	 _PATH_SYS_SYSTEM "/cpu/cpu0"

static char pathbuf[PATH_MAX] = "/";

static char *
search_cpu_info( FILE * f, char *search_str)
{
	static char line[PAPI_HUGE_STR_LEN] = "";
	char *s, *start = NULL;

	rewind(f);

	while (fgets(line,PAPI_HUGE_STR_LEN,f)!=NULL) {
		s=strstr(line,search_str);
		if (s!=NULL) {
			/* skip all characters in line up to the colon */
			/* and then spaces */
			s=strchr(s,':');
			if (s==NULL) break;
			s++;
			while (isspace(*s)) {
				s++;
			}
			start = s;
			/* Find and clear newline */
			s=strrchr(start,'\n');
			if (s!=NULL) *s = 0;
			break;
		}
	}
	return start;
}

static void
decode_vendor_string( char *s, int *vendor )
{
	if ( strcasecmp( s, "GenuineIntel" ) == 0 )
		*vendor = PAPI_VENDOR_INTEL;
	else if ( ( strcasecmp( s, "AMD" ) == 0 ) ||
			  ( strcasecmp( s, "AuthenticAMD" ) == 0 ) )
		*vendor = PAPI_VENDOR_AMD;
	else if ( strcasecmp( s, "IBM" ) == 0 )
		*vendor = PAPI_VENDOR_IBM;
	else if ( strcasecmp( s, "Cray" ) == 0 )
		*vendor = PAPI_VENDOR_CRAY;
	else if ( strcasecmp( s, "ARM" ) == 0 )
		*vendor = PAPI_VENDOR_ARM;
	else if ( strcasecmp( s, "MIPS" ) == 0 )
		*vendor = PAPI_VENDOR_MIPS;
	else if ( strcasecmp( s, "SiCortex" ) == 0 )
		*vendor = PAPI_VENDOR_MIPS;
	else
		*vendor = PAPI_VENDOR_UNKNOWN;
}

static FILE *
xfopen( const char *path, const char *mode )
{
	FILE *fd = fopen( path, mode );
	if ( !fd )
		err( EXIT_FAILURE, "error: %s", path );
	return fd;
}

static FILE *
path_vfopen( const char *mode, const char *path, va_list ap )
{
	vsnprintf( pathbuf, sizeof ( pathbuf ), path, ap );
	return xfopen( pathbuf, mode );
}


static int
path_sibling( const char *path, ... )
{
	int c;
	long n;
	int result = 0;
	char s[2];
	FILE *fp;
	va_list ap;
	va_start( ap, path );
	fp = path_vfopen( "r", path, ap );
	va_end( ap );

	while ( ( c = fgetc( fp ) ) != EOF ) {
		if ( isxdigit( c ) ) {
			s[0] = ( char ) c;
			s[1] = '\0';
			for ( n = strtol( s, NULL, 16 ); n > 0; n /= 2 ) {
				if ( n % 2 )
					result++;
			}
		}
	}

	fclose( fp );
	return result;
}

static int
path_exist( const char *path, ... )
{
	va_list ap;
	va_start( ap, path );
	vsnprintf( pathbuf, sizeof ( pathbuf ), path, ap );
	va_end( ap );
	return access( pathbuf, F_OK ) == 0;
}

static int
decode_cpuinfo_x86( FILE *f, PAPI_hw_info_t *hwinfo )
{
	int tmp;
	unsigned int strSize;
	char *s;

	/* Stepping */
	s = search_cpu_info( f, "stepping");
	if ( s ) {
		if (sscanf( s, "%d", &tmp ) ==1 ) {
			hwinfo->revision = ( float ) tmp;
			hwinfo->cpuid_stepping = tmp;
		}
	}

	/* Model Name */
	s = search_cpu_info( f, "model name");
	strSize = sizeof(hwinfo->model_string);
	if ( s ) {
		strncpy( hwinfo->model_string, s, strSize);
	}

	/* Family */
	s = search_cpu_info( f, "cpu family");
	if ( s ) {
		sscanf( s, "%d", &tmp );
		hwinfo->cpuid_family = tmp;
	}


	/* CPU Model */
	s = search_cpu_info( f, "model");
	if ( s ) {
		sscanf( s , "%d", &tmp );
		hwinfo->model = tmp;
		hwinfo->cpuid_model = tmp;
	}

	return PAPI_OK;
}

static int
decode_cpuinfo_power(FILE *f, PAPI_hw_info_t *hwinfo )
{

	int tmp;
	unsigned int strSize;
	char *s;

	/* Revision */
	s = search_cpu_info( f, "revision");
	if ( s ) {
		sscanf( s, "%d", &tmp );
		hwinfo->revision = ( float ) tmp;
		hwinfo->cpuid_stepping = tmp;
	}

       /* Model Name */
	s = search_cpu_info( f, "model");
	strSize = sizeof(hwinfo->model_string);
	if ( s ) {
		strncpy( hwinfo->model_string, s, strSize);
	}

	return PAPI_OK;
}



static int
decode_cpuinfo_arm(FILE *f, PAPI_hw_info_t *hwinfo )
{

	int tmp;
	unsigned int strSize;
	char *s, *t;

	/* revision */
	s = search_cpu_info( f, "CPU revision");
	if ( s ) {
		sscanf( s, "%d", &tmp );
		hwinfo->revision = ( float ) tmp;
		/* For compatability with old PAPI */
		hwinfo->model = tmp;
	}

	/* Model Name */
	s = search_cpu_info( f, "model name");
	strSize = sizeof(hwinfo->model_string);
	if ( s ) {
		strncpy( hwinfo->model_string, s, strSize );
	}

	/* Architecture (ARMv6, ARMv7, ARMv8, etc.) */
	/* Note the Raspberry Pi lies in the CPU architecture line */
	/* (it's ARMv6 not ARMv7)                                  */
	/* So we should actually get the value from the            */
	/*	Processor/ model name line                         */

	s = search_cpu_info( f, "CPU architecture");
	if ( s ) {

		if (strstr(s,"AArch64")) {
			hwinfo->cpuid_family = 8;
		}
		else {
			s = search_cpu_info( f, "Processor" );
			if (s) {
				t=strchr(s,'(');
				tmp=*(t+2)-'0';
				hwinfo->cpuid_family = tmp;
			}
			else {
				s = search_cpu_info( f, "model name" );
				if (s) {
					t=strchr(s,'(');
					tmp=*(t+2)-'0';
					hwinfo->cpuid_family = tmp;
				}
			}
		}
	}

	/* CPU Model */
	s = search_cpu_info( f, "CPU part" );
	if ( s ) {
		sscanf( s, "%x", &tmp );
		hwinfo->cpuid_model = tmp;
	}

	/* CPU Variant */
	s = search_cpu_info( f, "CPU variant" );
	if ( s ) {
		sscanf( s, "%x", &tmp );
		hwinfo->cpuid_stepping = tmp;
	}

	return PAPI_OK;

}


int
_linux_get_cpu_info( PAPI_hw_info_t *hwinfo, int *cpuinfo_mhz )
{
	int retval = PAPI_OK;
	char *s;
	float mhz = 0.0;
	FILE *f;
	char cpuinfo_filename[]="/proc/cpuinfo";

	if ( ( f = fopen( cpuinfo_filename, "r" ) ) == NULL ) {
		PAPIERROR( "fopen(/proc/cpuinfo) errno %d", errno );
		return PAPI_ESYS;
	}

	/* All of this information may be overwritten by the component */

	/***********************/
	/* Attempt to find MHz */
	/***********************/
	s = search_cpu_info( f, "cpu MHz" );
	if ( !s ) {
		s = search_cpu_info( f, "clock" );
	}
	if ( s ) {
		sscanf( s, "%f", &mhz );
		*cpuinfo_mhz = mhz;
	}
	else {
	//	PAPIWARN("Failed to find a clock speed in /proc/cpuinfo");
	}

	/*******************************/
	/* Vendor Name and Vendor Code */
	/*******************************/

	/* First try to read "vendor_id" field */
	/* Which is the most common field      */
	s = search_cpu_info( f, "vendor_id");
	if ( s ) {
		strcpy( hwinfo->vendor_string, s );
	}
	else {
		/* If not found, try "vendor" which seems to be Itanium specific */
		s = search_cpu_info( f, "vendor" );
		if ( s ) {
			strcpy( hwinfo->vendor_string, s );
		}
		else {
			/* "system type" seems to be MIPS and Alpha */
			s = search_cpu_info( f, "system type");
			if ( s ) {
				strcpy( hwinfo->vendor_string, s );
			}
			else {
				/* "platform" indicates Power */
				s = search_cpu_info( f, "platform");
				if ( s ) {
					if ( ( strcasecmp( s, "pSeries" ) == 0 ) ||
						( strcasecmp( s, "PowerNV" ) == 0 ) ||
						( strcasecmp( s, "PowerMac" ) == 0 ) ) {
						strcpy( hwinfo->vendor_string, "IBM" );
					}
				}
				else {
					/* "CPU implementer" indicates ARM */
					s = search_cpu_info( f, "CPU implementer");
					if ( s ) {
						strcpy( hwinfo->vendor_string, "ARM" );
					}
				}
			}
		}
	}

	/* Decode the string to a PAPI specific implementer value */
	if ( strlen( hwinfo->vendor_string ) ) {
		decode_vendor_string( hwinfo->vendor_string, &hwinfo->vendor );
	}

	/**********************************************/
	/* Provide more stepping/model/family numbers */
	/**********************************************/

	if ((hwinfo->vendor==PAPI_VENDOR_INTEL) ||
		(hwinfo->vendor==PAPI_VENDOR_AMD)) {

		decode_cpuinfo_x86(f,hwinfo);
	}

	if (hwinfo->vendor==PAPI_VENDOR_IBM) {

		decode_cpuinfo_power(f,hwinfo);
	}

	if (hwinfo->vendor==PAPI_VENDOR_ARM) {

		decode_cpuinfo_arm(f,hwinfo);
	}




	/* The following members are set using the same methodology */
	/* used in lscpu.                                           */

	/* Total number of CPUs */
	/* The following line assumes totalcpus was initialized to zero! */
	while ( path_exist( _PATH_SYS_SYSTEM "/cpu/cpu%d", hwinfo->totalcpus ) )
		hwinfo->totalcpus++;

	/* Number of threads per core */
	if ( path_exist( _PATH_SYS_CPU0 "/topology/thread_siblings" ) )
		hwinfo->threads =
			path_sibling( _PATH_SYS_CPU0 "/topology/thread_siblings" );

	/* Number of cores per socket */
	if ( path_exist( _PATH_SYS_CPU0 "/topology/core_siblings" ) &&
		 hwinfo->threads > 0 )
		hwinfo->cores =
			path_sibling( _PATH_SYS_CPU0 "/topology/core_siblings" ) /
			hwinfo->threads;

	/* Number of NUMA nodes */
	/* The following line assumes nnodes was initialized to zero! */
	while ( path_exist( _PATH_SYS_SYSTEM "/node/node%d", hwinfo->nnodes ) ) {
		hwinfo->nnodes++;
	}

	/* Number of CPUs per node */
	hwinfo->ncpu = hwinfo->nnodes > 1 ?
			hwinfo->totalcpus / hwinfo->nnodes : hwinfo->totalcpus;

	/* Number of sockets */
	if ( hwinfo->threads > 0 && hwinfo->cores > 0 ) {
		hwinfo->sockets = hwinfo->totalcpus / hwinfo->cores / hwinfo->threads;
	}

#if 0
	int *nodecpu;
	/* cpumap data is not currently part of the _papi_hw_info struct */
        nodecpu = malloc( (unsigned int) hwinfo->nnodes * sizeof(int) );
	if ( nodecpu ) {
	   int i;
	   for ( i = 0; i < hwinfo->nnodes; ++i ) {
	       nodecpu[i] = path_sibling(
                             _PATH_SYS_SYSTEM "/node/node%d/cpumap", i );
	   }
	} else {
		PAPIERROR( "malloc failed for variable not currently used" );
	}
#endif


	/* Fixup missing Megahertz Value */
	/* This is missing from cpuinfo on ARM and MIPS */
	if (*cpuinfo_mhz < 1.0) {
		s = search_cpu_info( f, "BogoMIPS" );
		if ((!s) || (sscanf( s, "%f", &mhz ) != 1)) {
			INTDBG("MHz detection failed. "
				"Please edit file %s at line %d.\n",
				__FILE__,__LINE__);
		}

		if (hwinfo->vendor == PAPI_VENDOR_MIPS) {
			/* MIPS has 2x clock multiplier */
			*cpuinfo_mhz = 2*(((int)mhz)+1);

			/* Also update version info on MIPS */
			s = search_cpu_info( f, "cpu model");
			s = strstr(s," V")+2;
			strtok(s," ");
			sscanf(s, "%f ", &hwinfo->revision );
		}
		else {
			/* In general bogomips is proportional to number of CPUs */
			if (hwinfo->totalcpus) {
				if (mhz!=0) *cpuinfo_mhz = mhz / hwinfo->totalcpus;
			}
		}
	}

	fclose( f );

	return retval;
}

int
_linux_get_mhz( int *sys_min_mhz, int *sys_max_mhz ) {

  FILE *fff;
  int result;

  /* Try checking for min MHz */
  /* Assume cpu0 exists */
  fff=fopen("/sys/devices/system/cpu/cpu0/cpufreq/cpuinfo_min_freq","r");
  if (fff==NULL) return PAPI_EINVAL;
  result=fscanf(fff,"%d",sys_min_mhz);
  fclose(fff);
  if (result!=1) return PAPI_EINVAL;

  fff=fopen("/sys/devices/system/cpu/cpu0/cpufreq/cpuinfo_max_freq","r");
  if (fff==NULL) return PAPI_EINVAL;
  result=fscanf(fff,"%d",sys_max_mhz);
  fclose(fff);
  if (result!=1) return PAPI_EINVAL;

  return PAPI_OK;

}

int
_linux_get_system_info( papi_mdi_t *mdi ) {

	int retval;
	char maxargs[PAPI_HUGE_STR_LEN];
	pid_t pid;
	int cpuinfo_mhz,sys_min_khz,sys_max_khz;

	/* Software info */

	/* Path and args */

	pid = getpid(  );
	if ( pid < 0 ) {
		PAPIERROR( "getpid() returned < 0" );
		return PAPI_ESYS;
	}
	mdi->pid = pid;

	sprintf( maxargs, "/proc/%d/exe", ( int ) pid );
	retval = readlink( maxargs, mdi->exe_info.fullname,
			PAPI_HUGE_STR_LEN-1 );
	if ( retval < 0 ) {
		PAPIERROR( "readlink(%s) returned < 0", maxargs );
		return PAPI_ESYS;
	}

	if (retval > PAPI_HUGE_STR_LEN-1) {
		retval=PAPI_HUGE_STR_LEN-1;
	}
	mdi->exe_info.fullname[retval] = '\0';

	/* Careful, basename can modify its argument */
	strcpy( maxargs, mdi->exe_info.fullname );

	strncpy( mdi->exe_info.address_info.name, basename( maxargs ),
		PAPI_HUGE_STR_LEN-1);
	mdi->exe_info.address_info.name[PAPI_HUGE_STR_LEN-1] = '\0';

	SUBDBG( "Executable is %s\n", mdi->exe_info.address_info.name );
	SUBDBG( "Full Executable is %s\n", mdi->exe_info.fullname );

	/* Executable regions, may require reading /proc/pid/maps file */

	retval = _linux_update_shlib_info( mdi );
	SUBDBG( "Text: Start %p, End %p, length %d\n",
			mdi->exe_info.address_info.text_start,
			mdi->exe_info.address_info.text_end,
			( int ) ( mdi->exe_info.address_info.text_end -
					  mdi->exe_info.address_info.text_start ) );
	SUBDBG( "Data: Start %p, End %p, length %d\n",
			mdi->exe_info.address_info.data_start,
			mdi->exe_info.address_info.data_end,
			( int ) ( mdi->exe_info.address_info.data_end -
					  mdi->exe_info.address_info.data_start ) );
	SUBDBG( "Bss: Start %p, End %p, length %d\n",
			mdi->exe_info.address_info.bss_start,
			mdi->exe_info.address_info.bss_end,
			( int ) ( mdi->exe_info.address_info.bss_end -
					  mdi->exe_info.address_info.bss_start ) );

	/* PAPI_preload_option information */

	strcpy( mdi->preload_info.lib_preload_env, "LD_PRELOAD" );
	mdi->preload_info.lib_preload_sep = ' ';
	strcpy( mdi->preload_info.lib_dir_env, "LD_LIBRARY_PATH" );
	mdi->preload_info.lib_dir_sep = ':';

	/* Hardware info */

	retval = _linux_get_cpu_info( &mdi->hw_info, &cpuinfo_mhz );
	if ( retval )
		return retval;

	/* Handle MHz */

	retval = _linux_get_mhz( &sys_min_khz, &sys_max_khz );
	if ( retval ) {

		mdi->hw_info.cpu_max_mhz=cpuinfo_mhz;
		mdi->hw_info.cpu_min_mhz=cpuinfo_mhz;

	   /*
	   mdi->hw_info.mhz=cpuinfo_mhz;
	   mdi->hw_info.clock_mhz=cpuinfo_mhz;
	   */
	}
	else {
		mdi->hw_info.cpu_max_mhz=sys_max_khz/1000;
		mdi->hw_info.cpu_min_mhz=sys_min_khz/1000;

	   /*
	   mdi->hw_info.mhz=sys_max_khz/1000;
	   mdi->hw_info.clock_mhz=sys_max_khz/1000;
	   */
	}

	/* Set Up Memory */

	retval = _linux_get_memory_info( &mdi->hw_info, mdi->hw_info.model );
	if ( retval )
		return retval;

	SUBDBG( "Found %d %s(%d) %s(%d) CPUs at %d Mhz.\n",
			mdi->hw_info.totalcpus,
			mdi->hw_info.vendor_string,
			mdi->hw_info.vendor,
		        mdi->hw_info.model_string,
		        mdi->hw_info.model,
		        mdi->hw_info.cpu_max_mhz);

	/* Get virtualization info */
	mdi->hw_info.virtualized=_linux_detect_hypervisor(mdi->hw_info.virtual_vendor_string);

	return PAPI_OK;
}

int
_papi_hwi_init_os(void) {

    int major=0,minor=0,sub=0;
    char *ptr;
    struct utsname uname_buffer;

    /* Initialize the locks */
    _linux_init_locks();

    /* Get the kernel info */
    uname(&uname_buffer);

    SUBDBG("Native kernel version %s\n",uname_buffer.release);

    strncpy(_papi_os_info.name,uname_buffer.sysname,PAPI_MAX_STR_LEN);

#ifdef ASSUME_KERNEL
    strncpy(_papi_os_info.version,ASSUME_KERNEL,PAPI_MAX_STR_LEN);
    SUBDBG("Assuming kernel version %s\n",_papi_os_info.name);
#else
    strncpy(_papi_os_info.version,uname_buffer.release,PAPI_MAX_STR_LEN);
#endif

    ptr=strtok(_papi_os_info.version,".");
    if (ptr!=NULL) major=atoi(ptr);

    ptr=strtok(NULL,".");
    if (ptr!=NULL) minor=atoi(ptr);

    ptr=strtok(NULL,".");
    if (ptr!=NULL) sub=atoi(ptr);

   _papi_os_info.os_version=LINUX_VERSION(major,minor,sub);

   _papi_os_info.itimer_sig = PAPI_INT_MPX_SIGNAL;
   _papi_os_info.itimer_num = PAPI_INT_ITIMER;
   _papi_os_info.itimer_ns = PAPI_INT_MPX_DEF_US * 1000;
   _papi_os_info.itimer_res_ns = 1;
   _papi_os_info.clock_ticks = sysconf( _SC_CLK_TCK );

   /* Get Linux-specific system info */
   _linux_get_system_info( &_papi_hwi_system_info );

   return PAPI_OK;
}



int _linux_detect_nmi_watchdog() {

  int watchdog_detected=0,watchdog_value=0;
  FILE *fff;

  fff=fopen("/proc/sys/kernel/nmi_watchdog","r");
  if (fff!=NULL) {
     if (fscanf(fff,"%d",&watchdog_value)==1) {
        if (watchdog_value>0) watchdog_detected=1;
     }
     fclose(fff);
  }

  return watchdog_detected;
}

papi_os_vector_t _papi_os_vector = {
  .get_memory_info =   _linux_get_memory_info,
  .get_dmem_info =     _linux_get_dmem_info,
  .get_real_cycles =   _linux_get_real_cycles,
  .update_shlib_info = _linux_update_shlib_info,
  .get_system_info =   _linux_get_system_info,


#if defined(HAVE_CLOCK_GETTIME)
  .get_real_usec =  _linux_get_real_usec_gettime,
#elif defined(HAVE_GETTIMEOFDAY)
  .get_real_usec =  _linux_get_real_usec_gettimeofday,
#else
  .get_real_usec =  _linux_get_real_usec_cycles,
#endif


#if defined(USE_PROC_PTTIMER)
  .get_virt_usec =   _linux_get_virt_usec_pttimer,
#elif defined(HAVE_CLOCK_GETTIME_THREAD)
  .get_virt_usec =   _linux_get_virt_usec_gettime,
#elif defined(HAVE_PER_THREAD_TIMES)
  .get_virt_usec =   _linux_get_virt_usec_times,
#elif defined(HAVE_PER_THREAD_GETRUSAGE)
  .get_virt_usec =   _linux_get_virt_usec_rusage,
#endif


#if defined(HAVE_CLOCK_GETTIME)
  .get_real_nsec =  _linux_get_real_nsec_gettime,
#endif

#if defined(HAVE_CLOCK_GETTIME_THREAD)
  .get_virt_nsec =   _linux_get_virt_nsec_gettime,
#endif


};