Use algorithm to speed up fespi flash programming.
It's still really slow, at 854b/s, but it seems to work and it's a lot of new code. Change-Id: I9dd057bbcc81a56eb558b4f33ac35f6f03c23588
This commit is contained in:
parent
6686e71bd6
commit
18eedf996c
|
@ -41,6 +41,7 @@
|
|||
#include "spi.h"
|
||||
#include <jtag/jtag.h>
|
||||
#include <helper/time_support.h>
|
||||
#include <target/algorithm.h>
|
||||
|
||||
/* Register offsets */
|
||||
|
||||
|
@ -357,27 +358,16 @@ static int fespi_protect(struct flash_bank *bank, int set,
|
|||
return ERROR_OK;
|
||||
}
|
||||
|
||||
/* This should write something less than or equal to a page.*/
|
||||
static int fespi_write_buffer(struct flash_bank *bank, const uint8_t *buffer,
|
||||
uint32_t offset, uint32_t len)
|
||||
static int slow_fespi_write_buffer(struct flash_bank *bank,
|
||||
const uint8_t *buffer, uint32_t offset, uint32_t len)
|
||||
{
|
||||
struct target *target = bank->target;
|
||||
struct fespi_flash_bank *fespi_info = bank->driver_priv;
|
||||
uint32_t ctrl_base = fespi_info->ctrl_base;
|
||||
|
||||
uint32_t ii;
|
||||
|
||||
//TODO!!! assert that len < page size
|
||||
|
||||
LOG_DEBUG("%s: offset=0x%08" PRIx32 " len=0x%08" PRIx32,
|
||||
__func__, offset, len);
|
||||
|
||||
|
||||
printf("%s: offset=0x%08" PRIx32 " len=0x%08" PRIx32,
|
||||
__func__, offset, len);
|
||||
|
||||
|
||||
|
||||
fespi_tx(bank, SPIFLASH_WRITE_ENABLE);
|
||||
fespi_txwm_wait(bank);
|
||||
|
||||
|
@ -400,6 +390,102 @@ static int fespi_write_buffer(struct flash_bank *bank, const uint8_t *buffer,
|
|||
return ERROR_OK;
|
||||
}
|
||||
|
||||
/* This should write something less than or equal to a page.*/
|
||||
static int fespi_write_buffer(struct flash_bank *bank, const uint8_t *buffer,
|
||||
uint32_t chip_offset, uint32_t len,
|
||||
struct working_area *algorithm_wa)
|
||||
{
|
||||
struct target *target = bank->target;
|
||||
struct fespi_flash_bank *fespi_info = bank->driver_priv;
|
||||
uint32_t ctrl_base = fespi_info->ctrl_base;
|
||||
|
||||
LOG_DEBUG("%s: chip_offset=0x%08" PRIx32 " len=0x%08" PRIx32,
|
||||
__func__, chip_offset, len);
|
||||
|
||||
if (!algorithm_wa) {
|
||||
return slow_fespi_write_buffer(bank, buffer, chip_offset, len);
|
||||
}
|
||||
|
||||
struct working_area *data_wa;
|
||||
unsigned data_wa_size = len + 4;
|
||||
while (1) {
|
||||
if (data_wa_size < 128) {
|
||||
LOG_WARNING("Couldn't allocate data working area.");
|
||||
return slow_fespi_write_buffer(bank, buffer, chip_offset, len);
|
||||
}
|
||||
if (target_alloc_working_area_try(target, data_wa_size, &data_wa) ==
|
||||
ERROR_OK) {
|
||||
break;
|
||||
}
|
||||
|
||||
data_wa_size /= 2;
|
||||
}
|
||||
|
||||
fespi_tx(bank, SPIFLASH_WRITE_ENABLE);
|
||||
fespi_txwm_wait(bank);
|
||||
|
||||
FESPI_WRITE_REG(FESPI_REG_CSMODE, FESPI_CSMODE_HOLD);
|
||||
|
||||
// Make the biggest possible block of txdata so we can write it in the
|
||||
// minimum number of operations.
|
||||
uint8_t *tx_data = malloc(4 + len);
|
||||
if (!tx_data) {
|
||||
LOG_ERROR("Couldn't allocate tx_data.");
|
||||
return ERROR_FAIL;
|
||||
}
|
||||
|
||||
tx_data[0] = SPIFLASH_PAGE_PROGRAM;
|
||||
tx_data[1] = chip_offset >> 16;
|
||||
tx_data[2] = chip_offset >> 8;
|
||||
tx_data[3] = chip_offset;
|
||||
memcpy(tx_data + 4, buffer, len);
|
||||
len += 4;
|
||||
|
||||
struct reg_param reg_params[3];
|
||||
init_reg_param(®_params[0], "x10", 32, PARAM_OUT);
|
||||
init_reg_param(®_params[1], "x11", 32, PARAM_OUT);
|
||||
init_reg_param(®_params[2], "x12", 32, PARAM_OUT);
|
||||
buf_set_u32(reg_params[0].value, 0, 32, ctrl_base + FESPI_REG_TXFIFO);
|
||||
buf_set_u32(reg_params[1].value, 0, 32, data_wa->address);
|
||||
unsigned offset = 0;
|
||||
while (len > 0) {
|
||||
unsigned bytes = MIN(len, data_wa->size);
|
||||
buf_set_u32(reg_params[2].value, 0, 32, bytes);
|
||||
int retval = target_write_buffer(target, data_wa->address, bytes,
|
||||
tx_data + offset);
|
||||
if (retval != ERROR_OK) {
|
||||
LOG_ERROR("Failed to write data to 0x%x: %d", data_wa->address,
|
||||
retval);
|
||||
goto error;
|
||||
}
|
||||
|
||||
retval = target_run_algorithm(target, 0, NULL, 3, reg_params,
|
||||
algorithm_wa->address,
|
||||
algorithm_wa->address + algorithm_wa->size - 4,
|
||||
10000, NULL);
|
||||
if (retval != ERROR_OK) {
|
||||
LOG_ERROR("Failed to execute algorithm at 0x%x: %d", algorithm_wa->address,
|
||||
retval);
|
||||
goto error;
|
||||
}
|
||||
|
||||
len -= bytes;
|
||||
offset += bytes;
|
||||
}
|
||||
|
||||
target_free_working_area(target, data_wa);
|
||||
|
||||
fespi_txwm_wait(bank);
|
||||
FESPI_WRITE_REG(FESPI_REG_CSMODE, FESPI_CSMODE_AUTO);
|
||||
|
||||
return ERROR_OK;
|
||||
|
||||
error:
|
||||
target_free_working_area(target, data_wa);
|
||||
LOG_ERROR("Falling back to slow write.");
|
||||
return slow_fespi_write_buffer(bank, buffer, chip_offset, len);
|
||||
}
|
||||
|
||||
static int fespi_write(struct flash_bank *bank, const uint8_t *buffer,
|
||||
uint32_t offset, uint32_t count)
|
||||
{
|
||||
|
@ -436,6 +522,39 @@ static int fespi_write(struct flash_bank *bank, const uint8_t *buffer,
|
|||
}
|
||||
}
|
||||
|
||||
struct working_area *algorithm_wa;
|
||||
static const uint32_t riscv_write_buffer_code[] = {
|
||||
// a0 - address of FESPI_REG_TXFIFO
|
||||
// a1 - start address of buffer
|
||||
// a2 - size of buffer, in bytes
|
||||
/* 0 */ 0x00052283, // lw t0,0(a0)
|
||||
/* 4 */ 0xfe02cee3, // bltz t0,0
|
||||
/* 8 */ 0x00058283, // lb t0,0(a1)
|
||||
/* c */ 0x00552023, // sw t0,0(a0)
|
||||
/* 10 */ 0x00158593, // addi a1,a1,1
|
||||
/* 14 */ 0xfff60613, // addi a2,a2,-1
|
||||
/* 18 */ 0xfec044e3, // bgtz a2,0
|
||||
/* 1c */ 0x00100073, // ebreak
|
||||
};
|
||||
if (target_alloc_working_area(target, sizeof(riscv_write_buffer_code),
|
||||
&algorithm_wa) != ERROR_OK) {
|
||||
LOG_WARNING("Couldn't allocate %ld-byte working area.",
|
||||
sizeof(riscv_write_buffer_code));
|
||||
algorithm_wa = NULL;
|
||||
} else {
|
||||
uint8_t code[sizeof(riscv_write_buffer_code)];
|
||||
target_buffer_set_u32_array(target, code,
|
||||
ARRAY_SIZE(riscv_write_buffer_code), riscv_write_buffer_code);
|
||||
retval = target_write_buffer(target, algorithm_wa->address,
|
||||
sizeof(code), code);
|
||||
if (retval != ERROR_OK) {
|
||||
LOG_ERROR("Failed to write code to 0x%x: %d", algorithm_wa->address,
|
||||
retval);
|
||||
target_free_working_area(target, algorithm_wa);
|
||||
algorithm_wa = NULL;
|
||||
}
|
||||
}
|
||||
|
||||
page_size = fespi_info->dev->pagesize;
|
||||
|
||||
fespi_txwm_wait(bank);
|
||||
|
@ -454,7 +573,7 @@ static int fespi_write(struct flash_bank *bank, const uint8_t *buffer,
|
|||
if (cur_count > count)
|
||||
cur_count = count;
|
||||
retval = fespi_write_buffer(bank, buffer, offset,
|
||||
cur_count);
|
||||
cur_count, algorithm_wa);
|
||||
if (retval != ERROR_OK)
|
||||
goto err;
|
||||
offset += cur_count;
|
||||
|
@ -472,7 +591,7 @@ static int fespi_write(struct flash_bank *bank, const uint8_t *buffer,
|
|||
cur_count = count & ~3;
|
||||
|
||||
retval = fespi_write_buffer(bank, buffer, offset,
|
||||
cur_count);
|
||||
cur_count, algorithm_wa);
|
||||
if (retval != ERROR_OK)
|
||||
goto err;
|
||||
|
||||
|
@ -486,9 +605,13 @@ static int fespi_write(struct flash_bank *bank, const uint8_t *buffer,
|
|||
|
||||
/* buffer tail */
|
||||
if (count > 0)
|
||||
retval = fespi_write_buffer(bank, buffer, offset, count);
|
||||
retval = fespi_write_buffer(bank, buffer, offset, count, algorithm_wa);
|
||||
|
||||
err:
|
||||
if (algorithm_wa) {
|
||||
target_free_working_area(target, algorithm_wa);
|
||||
}
|
||||
|
||||
/* Switch to HW mode before return to prompt */
|
||||
FESPI_ENABLE_HW_MODE();
|
||||
return retval;
|
||||
|
|
|
@ -7,12 +7,14 @@
|
|||
#endif
|
||||
|
||||
#include "target.h"
|
||||
#include "target/algorithm.h"
|
||||
#include "target_type.h"
|
||||
#include "log.h"
|
||||
#include "jtag/jtag.h"
|
||||
#include "opcodes.h"
|
||||
#include "register.h"
|
||||
#include "breakpoints.h"
|
||||
#include "helper/time_support.h"
|
||||
|
||||
/**
|
||||
* Since almost everything can be accomplish by scanning the dbus register, all
|
||||
|
@ -1291,6 +1293,7 @@ static int register_get(struct reg *reg)
|
|||
return ERROR_OK;
|
||||
} else if (reg->number == REG_PC) {
|
||||
buf_set_u32(reg->value, 0, 32, info->dpc);
|
||||
reg->valid = true;
|
||||
LOG_DEBUG("%s=0x%" PRIx64 " (cached)", reg->name, info->dpc);
|
||||
return ERROR_OK;
|
||||
} else if (reg->number >= REG_FPR0 && reg->number <= REG_FPR31) {
|
||||
|
@ -2628,11 +2631,114 @@ static int riscv_get_gdb_reg_list(struct target *target,
|
|||
return ERROR_OK;
|
||||
}
|
||||
|
||||
int riscv_arch_state(struct target *target)
|
||||
static int riscv_arch_state(struct target *target)
|
||||
{
|
||||
return ERROR_OK;
|
||||
}
|
||||
|
||||
// Algorithm must end with a software breakpoint instruction.
|
||||
static int riscv_run_algorithm(struct target *target, int num_mem_params,
|
||||
struct mem_param *mem_params, int num_reg_params,
|
||||
struct reg_param *reg_params, uint32_t entry_point,
|
||||
uint32_t exit_point, int timeout_ms, void *arch_info)
|
||||
{
|
||||
riscv_info_t *info = (riscv_info_t *) target->arch_info;
|
||||
|
||||
if (num_mem_params > 0) {
|
||||
LOG_ERROR("Memory parameters are not supported for RISC-V algorithms.");
|
||||
return ERROR_FAIL;
|
||||
}
|
||||
|
||||
if (target->state != TARGET_HALTED) {
|
||||
LOG_WARNING("target not halted");
|
||||
return ERROR_TARGET_NOT_HALTED;
|
||||
}
|
||||
|
||||
/// Save registers
|
||||
if (register_get(&target->reg_cache->reg_list[REG_PC]) != ERROR_OK) {
|
||||
return ERROR_FAIL;
|
||||
}
|
||||
uint64_t saved_pc = reg_cache_get(target, REG_PC);
|
||||
|
||||
uint64_t saved_regs[32];
|
||||
for (int i = 0; i < num_reg_params; i++) {
|
||||
LOG_DEBUG("save %s", reg_params[i].reg_name);
|
||||
struct reg *r = register_get_by_name(target->reg_cache, reg_params[i].reg_name, 0);
|
||||
if (!r) {
|
||||
LOG_ERROR("Couldn't find register named '%s'", reg_params[i].reg_name);
|
||||
return ERROR_FAIL;
|
||||
}
|
||||
|
||||
if (r->size != reg_params[i].size) {
|
||||
LOG_ERROR("Register %s is %d bits instead of %d bits.",
|
||||
reg_params[i].reg_name, r->size, reg_params[i].size);
|
||||
return ERROR_FAIL;
|
||||
}
|
||||
|
||||
if (r->number > REG_XPR31) {
|
||||
LOG_ERROR("Only GPRs can be use as argument registers.");
|
||||
return ERROR_FAIL;
|
||||
}
|
||||
|
||||
if (register_get(r) != ERROR_OK) {
|
||||
return ERROR_FAIL;
|
||||
}
|
||||
saved_regs[r->number] = buf_get_u64(r->value, 0, info->xlen);
|
||||
if (register_set(r, reg_params[i].value) != ERROR_OK) {
|
||||
return ERROR_FAIL;
|
||||
}
|
||||
}
|
||||
|
||||
/// Run algorithm
|
||||
LOG_DEBUG("resume at 0x%x", entry_point);
|
||||
if (riscv_resume(target, 0, entry_point, 0, 0) != ERROR_OK) {
|
||||
return ERROR_FAIL;
|
||||
}
|
||||
|
||||
int64_t start = timeval_ms();
|
||||
while (target->state != TARGET_HALTED) {
|
||||
LOG_DEBUG("poll()");
|
||||
int64_t now = timeval_ms();
|
||||
if (now - start > timeout_ms) {
|
||||
LOG_ERROR("Algorithm timed out after %d ms.", timeout_ms);
|
||||
return ERROR_TARGET_TIMEOUT;
|
||||
}
|
||||
|
||||
int result = riscv_poll(target);
|
||||
if (result != ERROR_OK) {
|
||||
return result;
|
||||
}
|
||||
}
|
||||
|
||||
if (register_get(&target->reg_cache->reg_list[REG_PC]) != ERROR_OK) {
|
||||
return ERROR_FAIL;
|
||||
}
|
||||
uint64_t final_pc = reg_cache_get(target, REG_PC);
|
||||
if (final_pc != exit_point) {
|
||||
LOG_ERROR("PC ended up at 0x%" PRIx64 " instead of 0x%" PRIx32,
|
||||
final_pc, exit_point);
|
||||
return ERROR_FAIL;
|
||||
}
|
||||
|
||||
/// Restore registers
|
||||
uint8_t buf[8];
|
||||
buf_set_u64(buf, 0, info->xlen, saved_pc);
|
||||
if (register_set(&target->reg_cache->reg_list[REG_PC], buf) != ERROR_OK) {
|
||||
return ERROR_FAIL;
|
||||
}
|
||||
|
||||
for (int i = 0; i < num_reg_params; i++) {
|
||||
LOG_DEBUG("restore %s", reg_params[i].reg_name);
|
||||
struct reg *r = register_get_by_name(target->reg_cache, reg_params[i].reg_name, 0);
|
||||
buf_set_u64(buf, 0, info->xlen, saved_regs[r->number]);
|
||||
if (register_set(r, buf) != ERROR_OK) {
|
||||
return ERROR_FAIL;
|
||||
}
|
||||
}
|
||||
|
||||
return ERROR_OK;
|
||||
}
|
||||
|
||||
struct target_type riscv_target =
|
||||
{
|
||||
.name = "riscv",
|
||||
|
@ -2663,4 +2769,6 @@ struct target_type riscv_target =
|
|||
.remove_watchpoint = riscv_remove_watchpoint,
|
||||
|
||||
.arch_state = riscv_arch_state,
|
||||
|
||||
.run_algorithm = riscv_run_algorithm,
|
||||
};
|
||||
|
|
Loading…
Reference in New Issue