port stuff to rpi and zynq

This commit is contained in:
Triss 2022-01-29 02:26:40 +01:00
parent 809ad7cf87
commit 6742aa38e3
6 changed files with 487 additions and 72 deletions

284
jazelle.c
View File

@ -1,9 +1,45 @@
#if !defined(__arm__) || (__SIZE_WIDTH__ != 32)
#error "This code is 32-bit ARM only!"
#endif
#if defined(__ARM_ARCH_6M__) || defined(__ARM_ARCH_7EM__) || defined(__ARM_ARCH_8M_MAIN__) \
|| defined(__ARM_ARCH_7R__) || defined(__ARM_ARCH_8R__)
#error "This code is only available on ARM7, ARM9, ARM11 and Cortex-A devices, not on Cortex-M or Cortex-R."
#endif
#include <stddef.h> #include <stddef.h>
#include <stdint.h> #include <stdint.h>
#include <stdbool.h> #include <stdbool.h>
#if defined(__linux__) && !defined(__KERNEL__)
#include <stdlib.h>
#include <stdio.h> #include <stdio.h>
#include <string.h> #include <string.h>
#define iprintf(fmt, ...) printf((fmt), ##__VA_ARGS__)
#elif defined(__KERNEL__)
#include <linux/kernel.h>
#include <linux/module.h>
#define iprintf(fmt, ...) printk(KERN_ERR " " fmt, ##__VA_ARGS__)
// TODO: is a memcpy impl needed?
#elif defined(ZYNQ) /* zynq baremetal */
#include <stdarg.h>
#include <string.h>
#include "xil_printf.h"
#include "zynq_printf.h"
#define iprintf(fmt, ...) printf((fmt), ##__VA_ARGS__)
#else
// newlib assumed
#include <stdio.h>
#include <string.h>
#endif // platform
// known ID table: // known ID table:
// Chip name | ARM core | ARM CPUID | JTAG IDCODE | Jazelle ID // Chip name | ARM core | ARM CPUID | JTAG IDCODE | Jazelle ID
@ -45,12 +81,66 @@ bytecode IDs that use a handler:
*/ */
#if !defined(__linux__) || defined(_LINUX_KERNEL_H) #ifdef __linux__
static bool getstr(char** ap, const char* name, uint32_t* out) {
char* a = *ap, *aa = a;
a = strstr(a, name); if (!a) { /*printf("no name\n");*/ return false; }
a = strstr(a, ": "); if (!a) { /*printf("no colon\n");*/ return false; }
a = a + strlen(": ");
*out = strtoul(a, &aa, 0);
if (a == aa) { /*printf("no int: %s\n", a);*/ return false; }
*ap = aa;
return true;
}
#endif
#if !defined(__linux__) || defined(__KERNEL__)
inline inline
#endif #endif
static uint32_t arm_get_id(void) { static uint32_t arm_get_id(void) {
#if defined(__linux__) && !defined(_LINUX_KERNEL_H) #if defined(__linux__) && !defined(__KERNEL__)
// TODO: read out /sys/devices/system/cpu/cpu*/regs/identification/midr_el1 or /proc/cpuinfo // NOTE: better to read out /sys/devices/system/cpu/cpu*/regs/identification/midr_el1 ,
// but this one doesn't seem to be available on my rpi running 5.4.x,
// so, /proc/cpuinfo it is
uint32_t midr = 0;
FILE* f = fopen("/proc/cpuinfo", "rb");
if (!f) return 0;
void* dest = malloc(4096); // should be enough
size_t rrr = fread(dest, 1, 4096, f);
fclose(f);
if (rrr == 0) goto EXIT;
char* a = (char*)dest;
uint32_t impl, arch, var, part, rev;
if (!getstr(&a, "CPU implementer", &impl)) { printf("no impl\n"); goto EXIT; }
if (!getstr(&a, "CPU architecture", &arch)) { printf("no arch\n"); goto EXIT; }
if (!getstr(&a, "CPU variant", &var)) { printf("no var\n"); goto EXIT; }
if (!getstr(&a, "CPU part", &part)) { printf("no part\n"); goto EXIT; }
if (!getstr(&a, "CPU revision", &rev)) { printf("no rev\n"); goto EXIT; }
midr = (impl << 24) | (arch << 20) | (var << 16) | (part << 4) | (rev << 0);
do {
// try to read more values, may be useful in eg. a big.LITTLE setup
if (!getstr(&a, "CPU implementer", &impl)) break;
if (!getstr(&a, "CPU architecture", &arch)) break;
if (!getstr(&a, "CPU variant", &var)) break;
if (!getstr(&a, "CPU part", &part)) break;
if (!getstr(&a, "CPU revision", &rev)) break;
uint32_t m2 = (impl << 24) | (arch << 20) | (var << 16) | (part << 4) | (rev << 0);
if (m2 != midr) {
printf("found different MIDR on other core: 0x%08lx\n", m2);
}
} while (a);
EXIT:
free(dest);
return midr;
#else #else
// NOTE: requires kernel mode execution level to read // NOTE: requires kernel mode execution level to read
uint32_t res; uint32_t res;
@ -65,40 +155,77 @@ inline static uint32_t jazelle_get_id(void) {
return res; return res;
} }
// TODO: use different implementations when porting to other stuff #if defined(__linux__) && !defined(__KERNEL__)
#if defined(__linux__) && !defined(_LINUX_KERNEL_H) // TODO: better implementation lmao
#error "TODO: implement cache flushes for Linux userspace" static void DC_FlushAll(void) {
#elif defined(ARM9) const size_t size = 65536*4;
__attribute__((__naked__)) // shrug
static void DC_FlushAll() { void* v = (void*)malloc(size);
if (!v) return; // a
for (size_t i = 0; i < size; i += 4) {
volatile uint32_t* p = (volatile uint32_t*)v;
p[i >> 2] = 0;
asm volatile("":::"memory");
}
free(v);
}
__attribute__((__unused__))
static void DC_InvalidateAll(void) {
DC_FlushAll();
}
__attribute__((__naked__, __no_inline__))
static void IC_InvalidateAll(void) {
asm volatile( asm volatile(
" mov r1, #0\n" ".fill 65536, 4, 0\n" // 64k nop instructions because eh
"bx lr\n"
:
:
:"memory"
);
}
#elif (__ARM_ARCH == 5 /* ARM9 */) || (__ARM_ARCH == 6 && defined(__ARM_ARCH_6KZ__))
__attribute__((__naked__))
static void DC_FlushAll(void) {
// lifted from libnds
asm volatile(
#if __ARM_ARCH == 5
"mov r1, #0\n"
"outer_loop:\n" "outer_loop:\n"
" mov r0, #0\n" "mov r0, #0\n"
"inner_loop:\n" "inner_loop:\n"
" orr r2, r1, r0 @ generate segment and line address\n" "orr r2, r1, r0 @ generate segment and line address\n"
" mcr p15, 0, r2, c7, c14, 2 @ clean and flush the line\n" "mcr p15, 0, r2, c7, c14, 2 @ clean and flush the line\n"
" add r0, r0, #32\n" "add r0, r0, #32\n" // FIXME hardcoded cache line size
" cmp r0, #0x1000/4\n" "cmp r0, #0x1000/4\n" // FIXME hardcoded cache size
" bne inner_loop\n" "bne inner_loop\n"
" add r1, r1, #0x40000000\n" "add r1, r1, #0x40000000\n"
" cmp r1, #0\n" "cmp r1, #0\n"
" bne outer_loop\n" "bne outer_loop\n"
#elif __ARM_ARCH == 6 && defined(__ARM_ARCH_6KZ__)
" mov r0, #0\n" "mov r0, #0\n"
" mcr p15, 0, r0, c7, c10, 4 @ drain write buffer\n" "mcr p15, 0, r0, c7, c10, 0\n" // clean & flush entire data cache
" bx lr\n" #else
:::"memory"); #error "wut"
} #endif
static inline void DC_InvalidateAll() {
asm volatile("mcr p15, 0, %0, c7, c6, 0" : : "r"(0)); "mov r0, #0\n"
} "mcr p15, 0, r0, c7, c10, 4 @ drain write buffer\n" // ARM9, ARM11 ok
static inline void IC_InvalidateAll() { "bx lr\n"
asm volatile("mcr p15, 0, %0, c7, c5, 0" : : "r"(0)); :
} :
:"memory"
);
}
__attribute__((__unused__))
static inline void DC_InvalidateAll(void) {
asm volatile("mcr p15, 0, %0, c7, c6, 0" : : "r"(0)); // ARM9, ARM11 ok
}
static inline void IC_InvalidateAll(void) {
asm volatile("mcr p15, 0, %0, c7, c5, 0" : : "r"(0)); // ARM9, ARM11 ok
}
#elif __ARM_ARCH == 7 && defined(__ARM_ARCH_7A__)
#include "cache_cortexa.c" /* go sue me */
#else #else
// TODO: ARM11
// TODO: Cortex-A[89]
#error "TODO: define data and instruction cache functions for your target!" #error "TODO: define data and instruction cache functions for your target!"
#endif #endif
@ -111,25 +238,25 @@ static struct {
/* /*
* c0: Jazelle Identity register (read-only) * c0: Jazelle Identity register (read-only)
Bits 0-11: Subarchitecture-defined bits (reads as 4, meaning unknown) * Bits 0-11: Subarchitecture-defined bits (reads as 4, meaning unknown)
Bits 12-19: Subarchitecture (reads as 0, Jazelle V1 according to documentation) * Bits 12-19: Subarchitecture (reads as 0, Jazelle V1 according to documentation)
Bits 20-27: Implementor (reads as 0x41, ARM Limited according to documentation) * Bits 20-27: Implementor (reads as 0x41, ARM Limited according to documentation)
Bits 28-31: Architecture (reads as 6, ARMv5TEJ according to documentation) * Bits 28-31: Architecture (reads as 6, ARMv5TEJ according to documentation)
c1: Operating System Control register * c1: Operating System Control register
Bit 0: Configuration Disabled (CD) (documented) * Bit 0: Configuration Disabled (CD) (documented)
Bit 1: Configuration Valid (CV) (documented) * Bit 1: Configuration Valid (CV) (documented)
c2: Main Configuration register * c2: Main Configuration register
Bit 0: Jazelle Enable (JE) (documented) * Bit 0: Jazelle Enable (JE) (documented)
Bits 26-28: Unknown * Bits 26-28: Unknown
Bit 29: If set, array object contains its elements directly, otherwise it contains a pointer to its elements * Bit 29: If set, array object contains its elements directly, otherwise it contains a pointer to its elements
Bit 31: Disable array instructions if set? * Bit 31: Disable array instructions if set?
c3: Array object layout register * c3: Array object layout register
Bits 0-7: Unknown * Bits 0-7: Unknown
Bits 8-11: Offset (in words) within array object of first element or of pointer to first element * Bits 8-11: Offset (in words) within array object of first element or of pointer to first element
Bits 12-15: Offset (in words) within array object of length * Bits 12-15: Offset (in words) within array object of length
Bit 16: If set, offset to length is subtracted, otherwise added * Bit 16: If set, offset to length is subtracted, otherwise added
Bits 17-19: Array length shift value (number of elements = stored length >> this) * Bits 17-19: Array length shift value (number of elements = stored length >> this)
Bits 20-21: Disable array instructions if set? * Bits 20-21: Disable array instructions if set?
*/ */
static uint32_t jazelle_exit_save; static uint32_t jazelle_exit_save;
@ -148,6 +275,7 @@ static int jazelle_exec_native(const void* bytecode, const void* block) {
"add r6, r5, #0x800\n" "add r6, r5, #0x800\n"
"add r7, r5, #0x900\n" "add r7, r5, #0x900\n"
// "r8: Pointer to constant pool? (haven't checked this yet)" -Hackspire // "r8: Pointer to constant pool? (haven't checked this yet)" -Hackspire
// libjz contradicts this...
// set configuration valid & jazelle enable bits // set configuration valid & jazelle enable bits
"mov r0, #2\n" "mov r0, #2\n"
@ -185,6 +313,24 @@ static int jazelle_exec_native(const void* bytecode, const void* block) {
} }
extern uint32_t backup_r5;
uint32_t backup_r5 = 0;
__attribute__((__naked__))
static void handler_0xfe(void) {
(void)&backup_r5;
asm volatile(
"ldr r0, =backup_r5\n"
"str r5, [r0]\n"
// return to jazelle (yes lr has to be incremented otherwise the
// current instruction keeps getting executed in a loop)
"add lr, #1\n"
"bxj r12\n" // FIXME: r12 can be modified by jazelle so it should be restored to something
//:
//:[br5]"m"(backup_r5)
);
}
__attribute__((__naked__)) __attribute__((__naked__))
static void handler_idiv(void) { static void handler_idiv(void) {
@ -243,7 +389,6 @@ static void handler_ireturn(void) {
:[exsav]"m"(jazelle_exit_save) :[exsav]"m"(jazelle_exit_save)
:"r12" :"r12"
); );
__builtin_unreachable();
} }
@ -267,7 +412,6 @@ static void handler_wasexec() {
,[we]"m"(was_exec) ,[we]"m"(was_exec)
:"r0","r12" :"r0","r12"
); );
__builtin_unreachable();
} }
__attribute__((__naked__)) __attribute__((__naked__))
@ -280,7 +424,6 @@ static void handler_noexec() {
:[exsav]"m"(jazelle_exit_save) :[exsav]"m"(jazelle_exit_save)
:"r0","r12" :"r0","r12"
); );
__builtin_unreachable();
} }
static uint8_t bytecode_testh[] = { static uint8_t bytecode_testh[] = {
@ -290,7 +433,7 @@ static uint8_t bytecode_testh[] = {
0x04, 0x04, 0x04, 0x04,
0x6C, // +8 0x6C, // +8
0x00, 0x00, 0x00, 0x00, // up to 4 nops of argument bytes eg for invokeXYZ 0x00, 0x00, 0x00, 0x00, // up to 4 nops of argument bytes eg for invokeXYZ
0x00, 0x00, 0x00, 0x00, // except 2nd byte is 3 for goto offset (BE) (3 aka iconst_0) 0x00, 0x00, 0x00, 0x00, // also needs to be modified to make some insns work
0xBA, // +17 // invokedynamic, complex enough to never be implemented in hw 0xBA, // +17 // invokedynamic, complex enough to never be implemented in hw
0x00, 0x00, 0x00, 0x00, // up to 4 nops of argument bytes eg for invokeXYZ 0x00, 0x00, 0x00, 0x00, // up to 4 nops of argument bytes eg for invokeXYZ
}; };
@ -321,19 +464,20 @@ static void jazelle_test_handlers(uint8_t hflags[256/8]) {
} }
memset(&jazelle_block, 0, sizeof jazelle_block); memset(&jazelle_block, 0, sizeof jazelle_block);
// initialize local 1 for a return address for the 'ret' opcode // initialize local 1 for a return address for the 'ret' opcode
uint32_t retval = &bytecode_testh[17]; uint32_t retval = (uint32_t)&bytecode_testh[17];
jazelle_block.locals[4] = retval >> 0; jazelle_block.locals[4] = retval >> 0;
jazelle_block.locals[5] = retval >> 8; jazelle_block.locals[5] = retval >> 8;
jazelle_block.locals[6] = retval >>16; jazelle_block.locals[6] = retval >>16;
jazelle_block.locals[7] = retval >>24; jazelle_block.locals[7] = retval >>24;
DC_FlushAll(); DC_FlushAll();
DC_InvalidateAll(); //DC_InvalidateAll();
IC_InvalidateAll(); IC_InvalidateAll();
jazelle_block.handlers[i] = handler_wasexec; jazelle_block.handlers[i] = handler_wasexec;
jazelle_block.handlers[0xba] = handler_noexec; jazelle_block.handlers[0xba] = handler_noexec;
//iprintf("bc 0x%02x\r\n", i);
was_exec = 0; was_exec = 0;
jazelle_exec_native(bytecode_testh, &jazelle_block); jazelle_exec_native(bytecode_testh, &jazelle_block);
@ -353,6 +497,7 @@ static uint8_t bytecode_test1[] = {
0x06, // iconst_3 0x06, // iconst_3
0x07, // iconst_4 0x07, // iconst_4
0x05, // iconst_2 0x05, // iconst_2
0xFE, // ??? (r5 readout)
0x6C, // idiv 0x6C, // idiv
0x04, // iconst_1 0x04, // iconst_1
0x60, // iadd 0x60, // iadd
@ -364,16 +509,19 @@ static uint8_t bytecode_test1[] = {
static int jazelle_exec(const uint8_t* bytecode) { static int jazelle_exec(const uint8_t* bytecode) {
jazelle_block.handlers[0x6C] = handler_idiv; jazelle_block.handlers[0x6C] = handler_idiv;
jazelle_block.handlers[0xAC] = handler_ireturn; jazelle_block.handlers[0xAC] = handler_ireturn;
/* jazelle_block.handlers[0xFE] = handler_0xfe;
/*
* +000-3FF: Unhandled bytecodes * +000-3FF: Unhandled bytecodes
The stack is flushed to memory before calling any of these handlers, so they may modify r0-r3 freely * The stack is flushed to memory before calling any of these handlers, so
+400: Null pointer exception * they may modify r0-r3 freely
+404: Array index out of bounds exception * +400: Null pointer exception
+40C: Jazelle mode entered with JE = 0 * +404: Array index out of bounds exception
+410: Configuration invalid (Jazelle mode entered with CV = 0) * +40C: Jazelle mode entered with JE = 0
CV is automatically set to 1 on entering this handler * +410: Configuration invalid (Jazelle mode entered with CV = 0)
+414: Prefetch abort occurred in middle of instruction * CV is automatically set to 1 on entering this handler
-Hackspire * +414: Prefetch abort occurred in middle of instruction
*
* -Hackspire
*/ */
const void* block = &jazelle_block; const void* block = &jazelle_block;
@ -387,7 +535,7 @@ void jazelle_main(void) {
while (jid == 0) ; while (jid == 0) ;
int r = jazelle_exec(bytecode_test1); int r = jazelle_exec(bytecode_test1);
iprintf("retcode=%d\r\n", r); iprintf("retcode=%d; r5 was 0x%08lx\r\n", r, backup_r5);
if (r == 0) { if (r == 0) {
static uint8_t hflags[256/8]; static uint8_t hflags[256/8];

View File

@ -5,7 +5,7 @@ OPENOCD_PORT_TELNET ?= 4444
PREFIX ?= arm-none-eabi- PREFIX ?= arm-none-eabi-
CC = $(PREFIX)gcc CC = $(PREFIX)gcc
CFLAGS = -mcpu=arm1176jzf-s CFLAGS = -mcpu=arm1176jzf-s -Wall
LDFLAGS = -T rpi.ld -nostartfiles -nostdlib LDFLAGS = -T rpi.ld -nostartfiles -nostdlib
GDB ?= $(PREFIX)gdb GDB ?= $(PREFIX)gdb
PYTHON3 ?= python3 PYTHON3 ?= python3
@ -21,6 +21,12 @@ rpi.o: rpi.c
rpi.elf: rpi.o rpi.elf: rpi.o
$(CC) $(CFLAGS) $(LDFLAGS) -o "$@" $^ $(CC) $(CFLAGS) $(LDFLAGS) -o "$@" $^
#jazelle.S: ../jazelle.c
# $(CC) $(CFLAGS) -S -o "$@" "$<"
jazelle.o: ../jazelle.c
$(CC) $(CFLAGS) -c -o "$@" "$<"
openocd-launch: openocd-launch:
openocd -f interface/cmsis-dap.cfg -c "transport select jtag" \ openocd -f interface/cmsis-dap.cfg -c "transport select jtag" \
-c "adapter speed 50" -f target/bcm2835.cfg \ -c "adapter speed 50" -f target/bcm2835.cfg \

1
zynq/.gitignore vendored
View File

@ -1,3 +1,4 @@
*.elf *.elf
*.o *.o
__pycache__/ __pycache__/
xil_printf.h

View File

@ -1,7 +1,7 @@
PREFIX ?= arm-none-eabi- PREFIX ?= arm-none-eabi-
CC = $(PREFIX)gcc CC = $(PREFIX)gcc
CFLAGS = -mcpu=cortex-a9 CFLAGS = -mcpu=cortex-a9 -I. -DZYNQ -Wall
LDFLAGS = -T zynq.ld -nostartfiles -nostdlib LDFLAGS = -T zynq.ld -nostartfiles -nostdlib
GDB ?= $(PREFIX)gdb GDB ?= $(PREFIX)gdb
PYTHON3 ?= python3 PYTHON3 ?= python3
@ -21,6 +21,9 @@ zynq.o: zynq.c
zynq.elf: zynq.o zynq.elf: zynq.o
$(CC) $(CFLAGS) $(LDFLAGS) -o "$@" $^ $(CC) $(CFLAGS) $(LDFLAGS) -o "$@" $^
jazelle.o: ../jazelle.c cache_cortexa.c zynq_printf.h
$(CC) $(CFLAGS) -c -o "$@" "$<"
openocd-load: zynq.elf openocd-load: zynq.elf
{ $(PYTHON3) ./elf2oocd.py "$<"; echo exit; } | $(NC) $(OPENOCD_HOST) $(OPENOCD_PORT_TELNET) { $(PYTHON3) ./elf2oocd.py "$<"; echo exit; } | $(NC) $(OPENOCD_HOST) $(OPENOCD_PORT_TELNET)
# printf 'halt\nload_image zynq.elf\nexit\n' \ # printf 'halt\nload_image zynq.elf\nexit\n' \

176
zynq/cache_cortexa.c Normal file
View File

@ -0,0 +1,176 @@
// stolen from
// https://github.com/Xilinx/embeddedsw/blob/master/lib/bsp/standalone/src/arm/cortexa9/xil_cache.c
#define IRQ_FIQ_MASK 0xC0
// CP15_CACHE_SIZE_SEL, CP15_CACHE_SIZE_ID, CP15_INVAL_IC_POU
// asm_cp15_inval_dc_line_sw
// asm_cp15_clean_inval_dc_line_sw
#define XREG_CP15_CACHE_SIZE_SEL "p15, 2, %0, c0, c0, 0"
#define XREG_CP15_CACHE_SIZE_ID "p15, 1, %0, c0, c0, 0"
#define XREG_CP15_INVAL_IC_POU "p15, 0, %0, c7, c5, 0"
#define XREG_CP15_INVAL_DC_LINE_SW "p15, 0, %0, c7, c6, 2"
#define XREG_CP15_CLEAN_INVAL_DC_LINE_SW "p15, 0, %0, c7, c14, 2"
#define asm_cp15_inval_dc_line_sw(param) __asm__ __volatile__("mcr " \
XREG_CP15_INVAL_DC_LINE_SW :: "r" (param)); \
#define asm_cp15_clean_inval_dc_line_sw(param) __asm__ __volatile__("mcr " \
XREG_CP15_CLEAN_INVAL_DC_LINE_SW :: "r" (param)); \
#define dsb() asm volatile("dsb":::"memory")
#define isb() asm volatile("isb":::"memory")
#define mfcpsr() ({uint32_t rval = 0U; \
__asm__ __volatile__(\
"mrs %0, cpsr\n"\
: "=r" (rval)\
);\
rval;\
}) \
#define mtcpsr(v) __asm__ __volatile__(\
"msr cpsr,%0\n"\
: : "r" (v) : "cc" \
) \
/* CP15 operations */
#define mtcp(rn, v) __asm__ __volatile__(\
"mcr " rn "\n"\
: : "r" (v)\
); \
#define mfcp(rn) ({uint32_t rval = 0U; \
__asm__ __volatile__(\
"mrc " rn "\n"\
: "=r" (rval)\
);\
rval;\
}) \
__attribute__((__unused__))
static void DC_InvalidateAll(void) {
register uint32_t CsidReg, C7Reg;
uint32_t CacheSize, LineSize, NumWays;
uint32_t Way, WayIndex, Set, SetIndex, NumSet;
uint32_t currmask;
currmask = mfcpsr();
mtcpsr(currmask | IRQ_FIQ_MASK);
/* Select cache level 0 and D cache in CSSR */
mtcp(XREG_CP15_CACHE_SIZE_SEL, 0U);
CsidReg = mfcp(XREG_CP15_CACHE_SIZE_ID);
/* Determine Cache Size */
CacheSize = (CsidReg >> 13U) & 0x1FFU;
CacheSize +=1U;
CacheSize *=128U; /* to get number of bytes */
/* Number of Ways */
NumWays = (CsidReg & 0x3ffU) >> 3U;
NumWays += 1U;
/* Get the cacheline size, way size, index size from csidr */
LineSize = (CsidReg & 0x07U) + 4U;
NumSet = CacheSize/NumWays;
NumSet /= (0x00000001U << LineSize);
Way = 0U;
Set = 0U;
/* Invalidate all the cachelines */
for (WayIndex =0U; WayIndex < NumWays; WayIndex++) {
for (SetIndex =0U; SetIndex < NumSet; SetIndex++) {
C7Reg = Way | Set;
/* Invalidate by Set/Way */
asm_cp15_inval_dc_line_sw(C7Reg);
Set += (0x00000001U << LineSize);
}
Set=0U;
Way += 0x40000000U;
}
/* Wait for L1 invalidate to complete */
dsb();
mtcpsr(currmask);
}
static void DC_FlushAll(void) {
register uint32_t CsidReg, C7Reg;
uint32_t CacheSize, LineSize, NumWays;
uint32_t Way;
uint32_t WayIndex, Set, SetIndex, NumSet;
uint32_t currmask;
currmask = mfcpsr();
mtcpsr(currmask | IRQ_FIQ_MASK);
/* Select cache level 0 and D cache in CSSR */
mtcp(XREG_CP15_CACHE_SIZE_SEL, 0);
CsidReg = mfcp(XREG_CP15_CACHE_SIZE_ID);
/* Determine Cache Size */
CacheSize = (CsidReg >> 13U) & 0x1FFU;
CacheSize +=1U;
CacheSize *=128U; /* to get number of bytes */
/* Number of Ways */
NumWays = (CsidReg & 0x3ffU) >> 3U;
NumWays += 1U;
/* Get the cacheline size, way size, index size from csidr */
LineSize = (CsidReg & 0x07U) + 4U;
NumSet = CacheSize/NumWays;
NumSet /= (0x00000001U << LineSize);
Way = 0U;
Set = 0U;
/* Invalidate all the cachelines */
for (WayIndex =0U; WayIndex < NumWays; WayIndex++) {
for (SetIndex =0U; SetIndex < NumSet; SetIndex++) {
C7Reg = Way | Set;
/* Flush by Set/Way */
asm_cp15_clean_inval_dc_line_sw(C7Reg);
Set += (0x00000001U << LineSize);
}
Set = 0U;
Way += 0x40000000U;
}
/* Wait for L1 flush to complete */
dsb();
mtcpsr(currmask);
}
static void IC_InvalidateAll(void) {
mtcp(XREG_CP15_CACHE_SIZE_SEL, 1U);
/* invalidate the instruction cache */
mtcp(XREG_CP15_INVAL_IC_POU, 0U);
/* Wait for L1 invalidate to complete */
dsb();
isb();
}
#undef dsb
#undef mfcpsr
#undef mtcpsr
#undef mtcp
#undef mfcp
#undef asm_cp15_inval_dc_line_sw
#undef asm_cp15_clean_inval_dc_line_sw
#undef IRQ_FIQ_MASK

81
zynq/zynq_printf.h Normal file
View File

@ -0,0 +1,81 @@
// because xil_printf's behavior isn't very portable, and the xilinx bare-metal
// libraries don't provide a printf() implementation, we will make one here
// using xil_printf under the hood
#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#define XIL_NEWLINE "\n\r" /* yeah... wat */
static char* pbuf = NULL;
static int psize = 0;
int vdprintf(int fd, const char* fmt, va_list args) {
(void)fd;
if (pbuf == NULL) {
psize = 80; // initial value: "default" terminal width
pbuf = malloc(psize);
}
int r;
do {
r = vsnprintf(pbuf, psize, fmt, args);
if (r < 0) return r;
if (r < psize - 1) // it fits into the buffer, so we can stop
break;
// make buffer larger, and try again
psize <<= 1;
pbuf = realloc(pbuf, psize);
} while (1);
// print line by line
char* start = pbuf;
for (char* c = pbuf; *c && (ptrdiff_t)c < (ptrdiff_t)pbuf + r; ++c) {
if (*c == '\n') {
*c = '\0';
xil_printf("%s" XIL_NEWLINE, start);
start = c + 1;
}
}
if (*start && (ptrdiff_t)start < (ptrdiff_t)pbuf + r) {
xil_printf("%s", start);
}
return r;
}
int dprintf(int fd, const char* fmt, ...) {
va_list args;
va_start(args, fmt);
int r = vdprintf(fd, fmt, args);
va_end(args);
return r;
}
int vprintf(const char* fmt, va_list args) {
return vdprintf(1 /*STDOUT_FILENO*/, fmt, args);
}
int printf(const char* fmt, ...) {
va_list args;
va_start(args, fmt);
int r = vprintf(fmt, args);
va_end(args);
return r;
}
int vfprintf(FILE* f, const char* fmt, va_list args) {
(void)f;
return vdprintf(/*fileno(f)*/ 1, fmt, args);
}
int fprintf(FILE* f, const char* fmt, ...) {
va_list args;
va_start(args, fmt);
int r = vfprintf(f, fmt, args);
va_end(args);
return r;
}