Blame irqlist.c

Packit 9eaa09
/* 
Packit 9eaa09
 * Copyright (C) 2006, Intel Corporation
Packit 9eaa09
 * Copyright (C) 2012, Neil Horman <nhorman@tuxdriver.com> 
Packit 9eaa09
 * 
Packit 9eaa09
 * This file is part of irqbalance
Packit 9eaa09
 *
Packit 9eaa09
 * This program file is free software; you can redistribute it and/or modify it
Packit 9eaa09
 * under the terms of the GNU General Public License as published by the
Packit 9eaa09
 * Free Software Foundation; version 2 of the License.
Packit 9eaa09
 * 
Packit 9eaa09
 * This program is distributed in the hope that it will be useful, but WITHOUT
Packit 9eaa09
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
Packit 9eaa09
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
Packit 9eaa09
 * for more details.
Packit 9eaa09
 * 
Packit 9eaa09
 * You should have received a copy of the GNU General Public License
Packit 9eaa09
 * along with this program in a file named COPYING; if not, write to the 
Packit 9eaa09
 * Free Software Foundation, Inc., 
Packit 9eaa09
 * 51 Franklin Street, Fifth Floor, 
Packit 9eaa09
 * Boston, MA 02110-1301 USA
Packit 9eaa09
 */
Packit 9eaa09
Packit 9eaa09
/*
Packit 9eaa09
 * This file has the basic functions to manipulate interrupt metadata
Packit 9eaa09
 */
Packit 9eaa09
#include "config.h"
Packit 9eaa09
#include <stdio.h>
Packit 9eaa09
#include <stdlib.h>
Packit 9eaa09
#include <unistd.h>
Packit 9eaa09
#include <sys/types.h>
Packit 9eaa09
#include <dirent.h>
Packit 9eaa09
#include <errno.h>
Packit 9eaa09
#include <math.h>
Packit 9eaa09
Packit 9eaa09
#include "types.h"
Packit 9eaa09
#include "irqbalance.h"
Packit 9eaa09
Packit 9eaa09
Packit 9eaa09
Packit 9eaa09
struct load_balance_info {
Packit 9eaa09
	unsigned long long int total_load;
Packit 9eaa09
	unsigned long long avg_load;
Packit 9eaa09
	unsigned long long min_load;
Packit 9eaa09
	unsigned long long adjustment_load;
Packit 9eaa09
	int load_sources;
Packit 9eaa09
	unsigned long long int deviations;
Packit 9eaa09
	long double std_deviation;
Packit 9eaa09
	unsigned int num_over;
Packit 9eaa09
	unsigned int num_under;
Packit 9eaa09
	unsigned int num_powersave;
Packit 9eaa09
	struct topo_obj *powersave;
Packit 9eaa09
};
Packit 9eaa09
Packit 9eaa09
static void gather_load_stats(struct topo_obj *obj, void *data)
Packit 9eaa09
{
Packit 9eaa09
	struct load_balance_info *info = data;
Packit 9eaa09
Packit 9eaa09
	if (info->load_sources == 0 || obj->load < info->min_load)
Packit 9eaa09
		info->min_load = obj->load;
Packit 9eaa09
	info->total_load += obj->load;
Packit 9eaa09
	info->load_sources += 1;
Packit 9eaa09
}
Packit 9eaa09
Packit 9eaa09
static void compute_deviations(struct topo_obj *obj, void *data)
Packit 9eaa09
{
Packit 9eaa09
	struct load_balance_info *info = data;
Packit 9eaa09
	unsigned long long int deviation;
Packit 9eaa09
Packit 9eaa09
	deviation = (obj->load > info->avg_load) ?
Packit 9eaa09
		obj->load - info->avg_load :
Packit 9eaa09
		info->avg_load - obj->load;
Packit 9eaa09
Packit 9eaa09
	info->deviations += (deviation * deviation);
Packit 9eaa09
}
Packit 9eaa09
Packit 9eaa09
static void move_candidate_irqs(struct irq_info *info, void *data)
Packit 9eaa09
{
Packit 9eaa09
	struct load_balance_info *lb_info = data;
Packit 9eaa09
Packit 9eaa09
	/* Don't rebalance irqs that don't want it */
Packit 9eaa09
	if (info->level == BALANCE_NONE)
Packit 9eaa09
		return;
Packit 9eaa09
Packit 9eaa09
	/* Don't move cpus that only have one irq, regardless of load */
Packit 9eaa09
	if (g_list_length(info->assigned_obj->interrupts) <= 1)
Packit 9eaa09
		return;
Packit 9eaa09
Packit 9eaa09
	/* IRQs with a load of 1 have most likely not had any interrupts and
Packit 9eaa09
	 * aren't worth migrating
Packit 9eaa09
	 */
Packit 9eaa09
	if (info->load <= 1)
Packit 9eaa09
		return;
Packit 9eaa09
Packit 9eaa09
	/* If we can migrate an irq without swapping the imbalance do it. */
Packit 9eaa09
	if ((lb_info->adjustment_load - info->load) > (lb_info->min_load + info->load)) {
Packit 9eaa09
		lb_info->adjustment_load -= info->load;
Packit 9eaa09
		lb_info->min_load += info->load;
Packit 9eaa09
	} else
Packit 9eaa09
		return;
Packit 9eaa09
Packit 9eaa09
	log(TO_CONSOLE, LOG_INFO, "Selecting irq %d for rebalancing\n", info->irq);
Packit 9eaa09
Packit 9eaa09
	migrate_irq(&info->assigned_obj->interrupts, &rebalance_irq_list, info);
Packit 9eaa09
Packit 9eaa09
	info->assigned_obj = NULL;
Packit 9eaa09
}
Packit 9eaa09
Packit 9eaa09
static void migrate_overloaded_irqs(struct topo_obj *obj, void *data)
Packit 9eaa09
{
Packit 9eaa09
	struct load_balance_info *info = data;
Packit 9eaa09
Packit 9eaa09
	if (obj->powersave_mode)
Packit 9eaa09
		info->num_powersave++;
Packit 9eaa09
Packit 9eaa09
	if ((obj->load + info->std_deviation) <= info->avg_load) {
Packit 9eaa09
		info->num_under++;
Packit 9eaa09
		if (power_thresh != ULONG_MAX && !info->powersave)
Packit 9eaa09
			if (!obj->powersave_mode)
Packit 9eaa09
				info->powersave = obj;
Packit 9eaa09
	} else if ((obj->load - info->std_deviation) >=info->avg_load) {
Packit 9eaa09
		info->num_over++;
Packit 9eaa09
	}
Packit 9eaa09
Packit 9eaa09
	if ((obj->load > info->min_load) &&
Packit 9eaa09
	    (g_list_length(obj->interrupts) > 1)) {
Packit 9eaa09
		/* order the list from greatest to least workload */
Packit 9eaa09
		sort_irq_list(&obj->interrupts);
Packit 9eaa09
		/*
Packit 9eaa09
		 * Each irq carries a weighted average amount of load
Packit 9eaa09
		 * we think it's responsible for. This object's load is larger
Packit 9eaa09
		 * than the object with the minimum load. Select irqs for
Packit 9eaa09
		 * migration if we could move them to the minimum object
Packit 9eaa09
		 * without reversing the imbalance or until we only have one
Packit 9eaa09
		 * left.
Packit 9eaa09
		 */
Packit 9eaa09
		info->adjustment_load = obj->load;
Packit 9eaa09
		for_each_irq(obj->interrupts, move_candidate_irqs, info);
Packit 9eaa09
	}
Packit 9eaa09
}
Packit 9eaa09
Packit 9eaa09
static void force_irq_migration(struct irq_info *info, void *data __attribute__((unused)))
Packit 9eaa09
{
Packit 9eaa09
	migrate_irq(&info->assigned_obj->interrupts, &rebalance_irq_list, info);
Packit 9eaa09
	info->assigned_obj = NULL;
Packit 9eaa09
}
Packit 9eaa09
Packit 9eaa09
static void clear_powersave_mode(struct topo_obj *obj, void *data __attribute__((unused)))
Packit 9eaa09
{
Packit 9eaa09
	obj->powersave_mode = 0;
Packit 9eaa09
}
Packit 9eaa09
Packit 9eaa09
static void find_overloaded_objs(GList *name, struct load_balance_info *info) {
Packit 9eaa09
	memset(info, 0, sizeof(struct load_balance_info));
Packit 9eaa09
	for_each_object(name, gather_load_stats, info);
Packit 9eaa09
	info->load_sources = (info->load_sources == 0) ? 1 : (info->load_sources);
Packit 9eaa09
	info->avg_load = info->total_load / info->load_sources;
Packit 9eaa09
	for_each_object(name, compute_deviations, info);
Packit 9eaa09
	/* Don't divide by zero if there is a single load source */
Packit 9eaa09
	if (info->load_sources == 1)
Packit 9eaa09
		info->std_deviation = 0;
Packit 9eaa09
	else {
Packit 9eaa09
		info->std_deviation = (long double)(info->deviations / (info->load_sources - 1));
Packit 9eaa09
		info->std_deviation = sqrt(info->std_deviation);
Packit 9eaa09
	}
Packit 9eaa09
Packit 9eaa09
	for_each_object(name, migrate_overloaded_irqs, info);
Packit 9eaa09
}
Packit 9eaa09
Packit 9eaa09
void update_migration_status(void)
Packit 9eaa09
{
Packit 9eaa09
	struct load_balance_info info;
Packit 9eaa09
	find_overloaded_objs(cpus, &info;;
Packit 9eaa09
	if (power_thresh != ULONG_MAX && cycle_count > 5) {
Packit 9eaa09
		if (!info.num_over && (info.num_under >= power_thresh) && info.powersave) {
Packit 9eaa09
			log(TO_ALL, LOG_INFO, "cpu %d entering powersave mode\n", info.powersave->number);
Packit 9eaa09
			info.powersave->powersave_mode = 1;
Packit 9eaa09
			if (g_list_length(info.powersave->interrupts) > 0)
Packit 9eaa09
				for_each_irq(info.powersave->interrupts, force_irq_migration, NULL);
Packit 9eaa09
		} else if ((info.num_over) && (info.num_powersave)) {
Packit 9eaa09
			log(TO_ALL, LOG_INFO, "Load average increasing, re-enabling all cpus for irq balancing\n");
Packit 9eaa09
			for_each_object(cpus, clear_powersave_mode, NULL);
Packit 9eaa09
		}
Packit 9eaa09
	}
Packit 9eaa09
	find_overloaded_objs(cache_domains, &info;;
Packit 9eaa09
	find_overloaded_objs(packages, &info;;
Packit 9eaa09
	find_overloaded_objs(numa_nodes, &info;;
Packit 9eaa09
}
Packit 9eaa09
Packit 9eaa09
static void dump_workload(struct irq_info *info, void *unused __attribute__((unused)))
Packit 9eaa09
{
Packit 9eaa09
	log(TO_CONSOLE, LOG_INFO, "Interrupt %i node_num %d (class %s) has workload %lu \n",
Packit 9eaa09
	    info->irq, irq_numa_node(info)->number, classes[info->class], (unsigned long)info->load);
Packit 9eaa09
}
Packit 9eaa09
Packit 9eaa09
void dump_workloads(void)
Packit 9eaa09
{
Packit 9eaa09
	for_each_irq(NULL, dump_workload, NULL);
Packit 9eaa09
}
Packit 9eaa09