/*
* EMU10k1 loader
*
* Copyright (c) 2003,2004 by Peter Zubaj
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*
*/
#include "ld10k1.h"
#include "ld10k1_fnc.h"
#include "ld10k1_tram.h"
#include "ld10k1_error.h"
#include <stdlib.h>
int ld10k1_tram_res_alloc_hwacc(ld10k1_dsp_mgr_t *dsp_mgr, ld10k1_dsp_tram_resolve_t *res);
int ld10k1_tram_realloc_space(ld10k1_dsp_mgr_t *dsp_mgr, ld10k1_dsp_tram_resolve_t *res);
void ld10k1_tram_init_res(ld10k1_dsp_mgr_t *dsp_mgr, ld10k1_dsp_tram_resolve_t *res)
{
res->isize = dsp_mgr->i_tram.size;
res->ifree = dsp_mgr->i_tram.size;
res->iacc_count = dsp_mgr->i_tram.max_hwacc;
res->iacc_free_count = dsp_mgr->i_tram.max_hwacc;
res->esize = dsp_mgr->e_tram.size;
res->efree = dsp_mgr->e_tram.size;
res->eacc_count = dsp_mgr->e_tram.max_hwacc;
res->eacc_free_count = dsp_mgr->e_tram.max_hwacc;
res->grp_free = res->iacc_free_count + res->eacc_free_count;
res->item_count = 0;
}
void ld10k1_tram_init_res_from_dsp_mgr(ld10k1_dsp_mgr_t *dsp_mgr, ld10k1_dsp_tram_resolve_t *res)
{
/* throught all groups */
int i;
for (i = 0; i < dsp_mgr->max_tram_grp; i++) {
if (dsp_mgr->tram_grp[i].used) {
/* get position */
res->grp_free--;
switch (dsp_mgr->tram_grp[i].req_pos) {
case TRAM_POS_NONE:
case TRAM_POS_AUTO:
/* add to res */
res->items[res->item_count].grp_idx = i;
res->items[res->item_count].grp_size = dsp_mgr->tram_grp[i].size;
res->items[res->item_count].grp_acc_count = dsp_mgr->tram_grp[i].acc_count;
res->items[res->item_count].res_value = 0;
res->items[res->item_count].pos = TRAM_POS_NONE;
res->item_count++;
break;
case TRAM_POS_INTERNAL:
/* decrease resources */
res->ifree -= dsp_mgr->tram_grp[i].size;
res->iacc_free_count -= dsp_mgr->tram_grp[i].acc_count;
break;
case TRAM_POS_EXTERNAL:
res->efree -= dsp_mgr->tram_grp[i].size;
res->eacc_free_count -= dsp_mgr->tram_grp[i].acc_count;
break;
}
}
}
}
int ld10k1_tram_acc_count_from_patch(ld10k1_patch_t *patch, int grp)
{
int i, count;
for (count = 0, i = 0; i < patch->tram_acc_count; i++)
if (patch->tram_acc[i].grp == grp)
count++;
return count;
}
int ld10k1_tram_init_res_from_patch(ld10k1_dsp_mgr_t *dsp_mgr, ld10k1_dsp_tram_resolve_t *res, ld10k1_patch_t *patch)
{
int i;
int acc_count;
/* through all groups */
for (i = 0; i < patch->tram_count; i++) {
if (res->grp_free <= 0)
return LD10K1_ERR_TRAM_FULL_GRP;
/* get acc count */
acc_count = ld10k1_tram_acc_count_from_patch(patch, i);
if (acc_count <= 0)
continue;
/* get position */
switch (patch->tram_grp[i].grp_pos) {
case TRAM_POS_NONE:
case TRAM_POS_AUTO:
/* add to res */
res->items[res->item_count].grp_idx = -i - 1;
res->items[res->item_count].grp_size = patch->tram_grp[i].grp_size;
res->items[res->item_count].grp_acc_count = acc_count;
res->items[res->item_count].res_value = 0;
res->items[res->item_count].pos = TRAM_POS_NONE;
res->item_count++;
break;
case TRAM_POS_INTERNAL:
/* decrease resources */
if (res->ifree < patch->tram_grp[i].grp_size)
return LD10K1_ERR_ITRAM_FULL;
if (res->iacc_free_count < acc_count)
return LD10K1_ERR_ITRAM_FULL_ACC;
res->ifree -= patch->tram_grp[i].grp_size;
res->iacc_free_count -= acc_count;
break;
case TRAM_POS_EXTERNAL:
/* decrease resources */
if (res->efree < patch->tram_grp[i].grp_size)
return LD10K1_ERR_ETRAM_FULL;
if (res->eacc_free_count < acc_count)
return LD10K1_ERR_ETRAM_FULL_ACC;
res->efree -= patch->tram_grp[i].grp_size;
res->eacc_free_count -= acc_count;
break;
}
}
return 0;
}
int ld10k1_tram_init_res_from_patch_copy(ld10k1_dsp_mgr_t *dsp_mgr, ld10k1_dsp_tram_resolve_t *res, ld10k1_patch_t *patch)
{
/* throught all groups */
int i;
int acc_count;
for (i = 0; i < patch->tram_count; i++) {
/* get acc count */
acc_count = ld10k1_tram_acc_count_from_patch(patch, i);
/* get position */
if (patch->tram_grp[i].grp_pos == TRAM_POS_INTERNAL ||
patch->tram_grp[i].grp_pos == TRAM_POS_EXTERNAL) {
res->items[res->item_count].grp_idx = -i - 1;
res->items[res->item_count].grp_size = patch->tram_grp[i].grp_size;
res->items[res->item_count].grp_acc_count = acc_count;
res->items[res->item_count].pos = patch->tram_grp[i].grp_pos;
res->items[res->item_count].res_value = 0;
res->item_count++;
}
}
return 0;
}
int ld10k1_tram_calc_res_value(ld10k1_dsp_tram_resolve_t *res)
{
/* res_value is calculated as grp_size / acc_count */
int i;
for (i = 0; i < res->item_count; i++)
res->items[i].res_value = res->items[i].grp_size / res->items[i].grp_acc_count;
return 0;
}
static int ld10k1_tram_sort_res_compare(const void *item1, const void *item2)
{
ld10k1_dsp_tram_resolve_item_t *i1 = (ld10k1_dsp_tram_resolve_item_t *)item1;
ld10k1_dsp_tram_resolve_item_t *i2 = (ld10k1_dsp_tram_resolve_item_t *)item2;
if (i1->res_value == i2->res_value)
return 0;
else if (i1->res_value > i2->res_value)
return 1;
else
return -1;
}
int ld10k1_tram_sort_res(ld10k1_dsp_tram_resolve_t *res)
{
qsort(res->items, res->item_count, sizeof(ld10k1_dsp_tram_resolve_item_t), ld10k1_tram_sort_res_compare);
return 0;
}
int ld10k1_tram_resolve_res(ld10k1_dsp_tram_resolve_t *res)
{
int i;
for (i = 0; i < res->item_count; i++) {
/* first try internal tram then external tram */
if (res->items[i].grp_size <= res->ifree &&
res->items[i].grp_acc_count <= res->iacc_free_count) {
/* put it into itram */
res->ifree -= res->items[i].grp_size;
res->iacc_free_count -= res->items[i].grp_acc_count;
res->items[i].pos = TRAM_POS_INTERNAL;
} else if (res->items[i].grp_size <= res->efree &&
res->items[i].grp_acc_count <= res->eacc_free_count) {
/* put it into etram */
res->efree -= res->items[i].grp_size;
res->eacc_free_count -= res->items[i].grp_acc_count;
res->items[i].pos = TRAM_POS_EXTERNAL;
} else
return LD10K1_ERR_TRAM_FULL;
}
return 0;
}
int ld10k1_tram_grp_alloc(ld10k1_dsp_mgr_t *dsp_mgr)
{
int i;
for (i = 0; i < dsp_mgr->max_tram_grp; i++) {
if (!dsp_mgr->tram_grp[i].used) {
dsp_mgr->tram_grp[i].used = 1;
return i;
}
}
return LD10K1_ERR_TRAM_FULL_GRP;
}
void ld10k1_tram_grp_free(ld10k1_dsp_mgr_t *dsp_mgr, int grp)
{
dsp_mgr->tram_grp[grp].used = 0;
}
int ld10k1_tram_acc_alloc(ld10k1_dsp_mgr_t *dsp_mgr)
{
int i;
for (i = 0; i < dsp_mgr->max_tram_acc; i++) {
if (!dsp_mgr->tram_acc[i].used) {
dsp_mgr->tram_acc[i].used = 1;
return i;
}
}
return LD10K1_ERR_TRAM_FULL_ACC;
}
void ld10k1_tram_acc_free(ld10k1_dsp_mgr_t *dsp_mgr, int acc)
{
dsp_mgr->tram_acc[acc].used = 0;
}
int ld10k1_tram_reserve_for_patch(ld10k1_dsp_mgr_t *dsp_mgr, ld10k1_patch_t *patch, ld10k1_dsp_tram_resolve_t *res)
{
int err;
ld10k1_tram_init_res(dsp_mgr, res);
ld10k1_tram_init_res_from_dsp_mgr(dsp_mgr, res);
if ((err = ld10k1_tram_init_res_from_patch(dsp_mgr, res, patch)) < 0)
return err;
ld10k1_tram_calc_res_value(res);
ld10k1_tram_sort_res(res);
if ((err = ld10k1_tram_resolve_res(res)) < 0)
return err;
ld10k1_tram_init_res_from_patch_copy(dsp_mgr, res, patch);
return 0;
}
int ld10k1_tram_alloc_for_patch(ld10k1_dsp_mgr_t *dsp_mgr, ld10k1_patch_t *patch, ld10k1_dsp_tram_resolve_t *res)
{
int i;
int grp;
int acc;
/* allocate tram grp and acc for patch */
for (i = 0; i < patch->tram_count; i++) {
grp = ld10k1_tram_grp_alloc(dsp_mgr);
patch->tram_grp[i].grp_idx = grp;
dsp_mgr->tram_grp[grp].type = patch->tram_grp[i].grp_type;
dsp_mgr->tram_grp[grp].size = patch->tram_grp[i].grp_size;
}
for (i = 0; i < res->item_count; i++) {
if (res->items[i].grp_idx < 0) {
res->items[i].grp_idx = patch->tram_grp[-(res->items[i].grp_idx + 1)].grp_idx;
dsp_mgr->tram_grp[res->items[i].grp_idx].pos = TRAM_POS_NONE;
dsp_mgr->tram_grp[res->items[i].grp_idx].acc_count = res->items[i].grp_acc_count;
}
}
for (i = 0; i < patch->tram_acc_count; i++) {
acc = ld10k1_tram_acc_alloc(dsp_mgr);
patch->tram_acc[i].acc_idx = acc;
dsp_mgr->tram_acc[acc].type = patch->tram_acc[i].acc_type;
dsp_mgr->tram_acc[acc].offset = patch->tram_acc[i].acc_offset;
dsp_mgr->tram_acc[acc].grp = patch->tram_grp[patch->tram_acc[i].grp].grp_idx;
}
ld10k1_tram_res_alloc_hwacc(dsp_mgr, res);
ld10k1_tram_realloc_space(dsp_mgr, res);
return 0;
}
int ld10k1_tram_hwacc_alloc(ld10k1_dsp_mgr_t *dsp_mgr, int external)
{
int i;
if (!external) {
for (i = 0; i < dsp_mgr->max_itram_hwacc; i++) {
if (!dsp_mgr->itram_hwacc[i].used) {
dsp_mgr->itram_hwacc[i].used = 1;
dsp_mgr->i_tram.used_hwacc++;
return i;
}
}
} else {
for (i = 0; i < dsp_mgr->max_etram_hwacc; i++) {
if (!dsp_mgr->etram_hwacc[i].used) {
dsp_mgr->etram_hwacc[i].used = 1;
dsp_mgr->e_tram.used_hwacc++;
return i + dsp_mgr->max_itram_hwacc;
}
}
}
return LD10K1_ERR_TRAM_FULL_ACC;
}
void ld10k1_tram_hwacc_free(ld10k1_dsp_mgr_t *dsp_mgr, int acc)
{
if (acc < dsp_mgr->max_itram_hwacc) {
dsp_mgr->itram_hwacc[acc].used = 0;
dsp_mgr->itram_hwacc[acc].addr_val = 0;
dsp_mgr->itram_hwacc[acc].data_val = 0;
dsp_mgr->itram_hwacc[acc].modified = 1;
dsp_mgr->i_tram.used_hwacc--;
} else {
int nacc = acc - dsp_mgr->max_itram_hwacc;
dsp_mgr->etram_hwacc[nacc].used = 0;
dsp_mgr->etram_hwacc[nacc].used = 0;
dsp_mgr->etram_hwacc[nacc].addr_val = 0;
dsp_mgr->etram_hwacc[nacc].data_val = 0;
dsp_mgr->etram_hwacc[nacc].modified = 1;
dsp_mgr->e_tram.used_hwacc--;
}
}
void ld10k1_tram_actualize_hwacc(ld10k1_dsp_mgr_t *dsp_mgr, int acc, unsigned int op, unsigned int addr, unsigned int data)
{
if (acc < dsp_mgr->max_itram_hwacc) {
dsp_mgr->itram_hwacc[acc].op = op;
dsp_mgr->itram_hwacc[acc].addr_val = addr;
dsp_mgr->itram_hwacc[acc].data_val = data;
dsp_mgr->itram_hwacc[acc].modified = 1;
} else {
int nacc = acc - dsp_mgr->max_itram_hwacc;
dsp_mgr->etram_hwacc[nacc].op = op;
dsp_mgr->etram_hwacc[nacc].addr_val = addr;
dsp_mgr->etram_hwacc[nacc].data_val = data;
dsp_mgr->etram_hwacc[nacc].modified = 1;
}
}
void ld10k1_tram_get_hwacc(ld10k1_dsp_mgr_t *dsp_mgr, int acc, unsigned int *addr, unsigned int *data)
{
int nacc;
if (acc < dsp_mgr->max_itram_hwacc) {
*addr = dsp_mgr->itram_hwacc[acc].addr_val;
*data = dsp_mgr->itram_hwacc[acc].data_val;
} else {
nacc = acc - dsp_mgr->max_itram_hwacc;
*addr = dsp_mgr->etram_hwacc[nacc].addr_val;
*data = dsp_mgr->etram_hwacc[nacc].data_val;
}
}
int ld10k1_tram_res_alloc_hwacc(ld10k1_dsp_mgr_t *dsp_mgr, ld10k1_dsp_tram_resolve_t *res)
{
int i, j;
int grp_idx;
int hwacc;
/* free hw acc - where pos changed */
for (i = 0; i < res->item_count; i++) {
grp_idx = res->items[i].grp_idx;
if (dsp_mgr->tram_grp[grp_idx].pos != TRAM_POS_NONE &&
dsp_mgr->tram_grp[grp_idx].pos != res->items[i].pos) {
for (j = 0; j < dsp_mgr->max_tram_acc; j++)
if (dsp_mgr->tram_acc[j].used &&
dsp_mgr->tram_acc[j].grp == grp_idx)
ld10k1_tram_hwacc_free(dsp_mgr, dsp_mgr->tram_acc[j].hwacc);
dsp_mgr->tram_grp[grp_idx].pos = TRAM_POS_NONE;
}
}
/* now allocate */
for (i = 0; i < res->item_count; i++) {
grp_idx = res->items[i].grp_idx;
if (dsp_mgr->tram_grp[grp_idx].pos == TRAM_POS_NONE &&
dsp_mgr->tram_grp[grp_idx].pos != res->items[i].pos) {
dsp_mgr->tram_grp[grp_idx].pos = res->items[i].pos;
for (j = 0; j < dsp_mgr->max_tram_acc; j++)
if (dsp_mgr->tram_acc[j].used &&
dsp_mgr->tram_acc[j].grp == grp_idx) {
hwacc = ld10k1_tram_hwacc_alloc(dsp_mgr, res->items[i].pos == TRAM_POS_EXTERNAL ? 1 : 0);
dsp_mgr->tram_acc[j].hwacc = hwacc;
}
}
}
return 0;
}
int ld10k1_tram_realloc_space(ld10k1_dsp_mgr_t *dsp_mgr, ld10k1_dsp_tram_resolve_t *res)
{
int itram_size = res->isize;
int etram_size = res->esize;
int i;
/* allocate from end */
for (i = 0; i < dsp_mgr->max_tram_grp; i++)
if (dsp_mgr->tram_grp[i].used) {
if (dsp_mgr->tram_grp[i].pos == TRAM_POS_INTERNAL) {
itram_size -= dsp_mgr->tram_grp[i].size;
dsp_mgr->tram_grp[i].offset = itram_size;
} else if (dsp_mgr->tram_grp[i].pos == TRAM_POS_EXTERNAL) {
etram_size -= dsp_mgr->tram_grp[i].size;
dsp_mgr->tram_grp[i].offset = etram_size;
}
}
return 0;
}
int ld10k1_tram_actualize_tram_for_patch(ld10k1_dsp_mgr_t *dsp_mgr, ld10k1_patch_t *patch)
{
int i;
int grp_idx;
int acc_idx;
int tram_op;
/* for all patch accs */
for (i = 0; i < patch->tram_acc_count; i++) {
grp_idx = patch->tram_grp[patch->tram_acc[i].grp].grp_idx;
acc_idx = patch->tram_acc[i].acc_idx;
tram_op = 0;
if (dsp_mgr->tram_acc[acc_idx].type == TRAM_ACC_WRITE)
tram_op = TRAM_OP_WRITE;
else
tram_op = TRAM_OP_READ;
ld10k1_tram_actualize_hwacc(dsp_mgr, dsp_mgr->tram_acc[acc_idx].hwacc,
tram_op, dsp_mgr->tram_grp[grp_idx].offset + patch->tram_acc[i].acc_offset, 0);
}
return 0;
}
int ld10k1_tram_free_tram_for_patch(ld10k1_dsp_mgr_t *dsp_mgr, ld10k1_patch_t *patch)
{
int i;
int acc_idx;
int grp_idx;
/* free all patch accs */
for (i = 0; i < patch->tram_acc_count; i++) {
acc_idx = patch->tram_acc[i].acc_idx;
ld10k1_tram_hwacc_free(dsp_mgr, dsp_mgr->tram_acc[acc_idx].hwacc);
ld10k1_tram_acc_free(dsp_mgr, acc_idx);
}
/* free all patch grps */
for (i = 0; i < patch->tram_count; i++) {
grp_idx = patch->tram_grp[i].grp_idx;
ld10k1_tram_grp_free(dsp_mgr, grp_idx);
}
return 0;
}