Minimal ARM LPAE support. Sufficient to boot Linux kernel on vexpress-a15
Signed-off-by: Alexey Starikovskiy <aysta...@gmail.com> --- target-arm/cpu.h | 11 +- target-arm/helper.c | 239 ++++++++++++++++++++++++++++++++++++++++++++---- target-arm/helper.h | 2 target-arm/machine.c | 16 +-- target-arm/translate.c | 46 ++++++--- 5 files changed, 262 insertions(+), 52 deletions(-) diff --git a/target-arm/cpu.h b/target-arm/cpu.h index 0d9b39c..1d87c7e 100644 --- a/target-arm/cpu.h +++ b/target-arm/cpu.h @@ -117,11 +117,9 @@ typedef struct CPUARMState { uint32_t c1_coproc; /* Coprocessor access register. */ uint32_t c1_xscaleauxcr; /* XScale auxiliary control register. */ uint32_t c1_scr; /* secure config register. */ - uint32_t c2_base0; /* MMU translation table base 0. */ - uint32_t c2_base1; /* MMU translation table base 1. */ + uint64_t c2_base0; /* MMU translation table base 0. */ + uint64_t c2_base1; /* MMU translation table base 1. */ uint32_t c2_control; /* MMU translation table base control. */ - uint32_t c2_mask; /* MMU translation table base selection mask. */ - uint32_t c2_base_mask; /* MMU translation table base 0 mask. */ uint32_t c2_data; /* MPU data cachable bits. */ uint32_t c2_insn; /* MPU instruction cachable bits. */ uint32_t c3; /* MMU domain access control register @@ -131,7 +129,7 @@ typedef struct CPUARMState { uint32_t c6_region[8]; /* MPU base/size registers. */ uint32_t c6_insn; /* Fault address registers. */ uint32_t c6_data; - uint32_t c7_par; /* Translation result. */ + uint64_t c7_par; /* Translation result. */ uint32_t c9_insn; /* Cache lockdown registers. */ uint32_t c9_data; uint32_t c9_pmcr; /* performance monitor control register */ @@ -383,6 +381,7 @@ enum arm_features { ARM_FEATURE_ARM_DIV, /* divide supported in ARM encoding */ ARM_FEATURE_VFP4, /* VFPv4 (implies that NEON is v2) */ ARM_FEATURE_GENERIC_TIMER, + ARM_FEATURE_LPAE, /* Large Physical Address Extension */ }; static inline int arm_feature(CPUARMState *env, int feature) @@ -455,7 +454,7 @@ void cpu_arm_set_cp_io(CPUARMState *env, int cpnum, #define cpu_signal_handler cpu_arm_signal_handler #define cpu_list arm_cpu_list -#define CPU_SAVE_VERSION 6 +#define CPU_SAVE_VERSION 7 /* MMU modes definitions */ #define MMU_MODE0_SUFFIX _kernel diff --git a/target-arm/helper.c b/target-arm/helper.c index abe1c30..a5d5e7d 100644 --- a/target-arm/helper.c +++ b/target-arm/helper.c @@ -172,6 +172,7 @@ static void cpu_reset_model_id(CPUARMState *env, uint32_t id) set_feature(env, ARM_FEATURE_ARM_DIV); set_feature(env, ARM_FEATURE_V7MP); set_feature(env, ARM_FEATURE_GENERIC_TIMER); + set_feature(env, ARM_FEATURE_LPAE); env->vfp.xregs[ARM_VFP_FPSID] = 0x410430f0; env->vfp.xregs[ARM_VFP_MVFR0] = 0x10110222; env->vfp.xregs[ARM_VFP_MVFR1] = 0x11111111; @@ -325,7 +326,6 @@ void cpu_reset(CPUARMState *env) } } env->vfp.xregs[ARM_VFP_FPEXC] = 0; - env->cp15.c2_base_mask = 0xffffc000u; /* v7 performance monitor control register: same implementor * field as main ID register, and we implement no event counters. */ @@ -671,6 +671,16 @@ uint32_t HELPER(get_cp15)(CPUState *env, uint32_t insn) cpu_abort(env, "cp15 insn %08x\n", insn); } +void HELPER(set_cp15_64)(CPUState *env, uint32_t insn, uint64_t val) +{ + cpu_abort(env, "cp15 insn %08x\n", insn); +} + +uint64_t HELPER(get_cp15_64)(CPUState *env, uint32_t insn) +{ + cpu_abort(env, "cp15 insn %08x\n", insn); +} + /* These should probably raise undefined insn exceptions. */ void HELPER(v7m_msr)(CPUState *env, uint32_t reg, uint32_t val) { @@ -1050,18 +1060,21 @@ static inline int check_ap(CPUState *env, int ap, int domain_prot, static uint32_t get_level1_table_address(CPUState *env, uint32_t address) { uint32_t table; + int t0size = env->cp15.c2_control & 0x7; + uint32_t mask = ~(((uint32_t)0xffffffffu) >> t0size); - if (address & env->cp15.c2_mask) + if (address & mask) table = env->cp15.c2_base1 & 0xffffc000; - else - table = env->cp15.c2_base0 & env->cp15.c2_base_mask; - + else { + mask = ~((uint32_t)0x3fffu >> t0size); + table = env->cp15.c2_base0 & mask; + } table |= (address >> 18) & 0x3ffc; return table; } static int get_phys_addr_v5(CPUState *env, uint32_t address, int access_type, - int is_user, uint32_t *phys_ptr, int *prot, + int is_user, uint64_t *phys_ptr, int *prot, target_ulong *page_size) { int code; @@ -1156,7 +1169,7 @@ do_fault: } static int get_phys_addr_v6(CPUState *env, uint32_t address, int access_type, - int is_user, uint32_t *phys_ptr, int *prot, + int is_user, uint64_t *phys_ptr, int *prot, target_ulong *page_size) { int code; @@ -1260,7 +1273,7 @@ do_fault: } static int get_phys_addr_mpu(CPUState *env, uint32_t address, int access_type, - int is_user, uint32_t *phys_ptr, int *prot) + int is_user, uint64_t *phys_ptr, int *prot) { int n; uint32_t mask; @@ -1319,9 +1332,155 @@ static int get_phys_addr_mpu(CPUState *env, uint32_t address, int access_type, return 0; } +static inline uint64_t bitrange(int m, int n) { + int len = m - n + 1; // inclusive + if (len < 1) + return 0; + return (((1ULL << len) - 1) << n); +} + +static int get_phys_addr_lpae(CPUState *env, uint32_t address, int access_type, + int is_user, uint64_t *phys_ptr, int *prot, + target_ulong *page_size) +{ + uint64_t base_address = 0, ia = address; + bool base_found = false; + bool disabled = false; + int type = 1; // Translation + uint32_t ttbcr = env->cp15.c2_control; + uint64_t ttbr0 = env->cp15.c2_base0; + uint32_t t0size = ttbcr & 0x7; //T0SZ + int level = 0, start_bit; + bool is_secure = 1, lookup_secure = is_secure; + if (t0size || (ia & bitrange(31, 32 - t0size)) == 0) { + level = ((t0size & 6) == 0) ? 1 : 2; + int lowerbound = 9 * level - t0size - 4; + base_address = bitrange(39, lowerbound) & ttbr0; + base_found = true; + disabled = ttbcr & (1 << 7); // EPD0 + start_bit = 31 - t0size; + //TODO unpack type info from TTBCR + } + uint32_t t1size = (ttbcr >> 16) & 0x7; // T1SZ + uint64_t ttbr1 = env->cp15.c2_base1; + if ((t1size == 0 && !base_found) || (bitrange(31, 32 - t1size) & ~ia) == 0) { + level = ((t1size & 6) == 0) ? 1 : 2; + int lowerbound = 9 * level - t1size - 4; + base_address = bitrange(39, lowerbound) & ttbr1; + base_found = true; + disabled = ttbcr & (1 << 23); // EPD1 + start_bit = 31 - t1size; + //TODO unpack type info from TTBCR + } + if (!base_found || disabled) + goto do_fault; + bool first_iteration = true; + bool table_rw = true; + bool table_user = true; + bool table_xn = false; + bool table_pxn = false; + uint32_t attrs = 0; + bool lookup_finished; + do { + lookup_finished = true; + bool block_translate = false; + int offset = 9 * level; + uint64_t ia_select; + if (first_iteration) + ia_select = ((ia & bitrange(start_bit, 39 - offset)) >> (39 - offset - 3)); + else + ia_select = ((ia & bitrange(47 - offset, 39 - offset)) >> (39 - offset - 3)); + uint64_t lookup_address = base_address | ia_select; + first_iteration = false; + uint64_t descriptor = ldq_phys(lookup_address); + if ((descriptor & 1) == 0) { + goto do_fault; + } else { + if ((descriptor & 2) == 0) { + if (level == 3) { + goto do_fault; + } else + block_translate = true; + } else { + if (level == 3) + block_translate = true; + else { + base_address = bitrange(39, 12) & descriptor; + lookup_secure = lookup_secure && !((descriptor >> 63) & 1); + table_rw = table_rw && !((descriptor >> 62) & 1); + table_user = table_user && !((descriptor >> 61) & 1); + table_xn = table_xn || ((descriptor >> 60) & 1); + table_pxn = table_pxn || ((descriptor >> 59) & 1); + lookup_finished = false; + } + } + } + if (block_translate) { + *phys_ptr = (bitrange(39, 39 - offset) & descriptor) | (bitrange(38 - offset, 0) & ia); + attrs = ((descriptor & bitrange(54, 52)) >> 42) | + ((descriptor & bitrange(11, 2)) >> 2); + if (table_xn) + attrs |= 1 << 12; + if (table_pxn) + attrs |= 1 << 11; + if (is_secure && !lookup_secure) + attrs |= 1 << 9; + if (!table_rw) + attrs |= 1 << 5; + if (!table_user) + attrs &= ~(1UL << 4); + if (!lookup_secure) + attrs |= 1 << 3; + } else + ++level; + } while (!lookup_finished); + // checks + type = 2; // AccessFlag + if ((attrs & (1 << 8)) == 0) + goto do_fault; + *prot = 0; + if (((attrs >> 12) & 1) == 0) + *prot |= PAGE_EXEC; // XN + if (!is_user || ((attrs >> 11) & 1) == 0) + *prot |= PAGE_EXEC; // PXN + type = 3; // Permissions + switch ((attrs >> 4) & 3) { + case 0: + if (is_user) + goto do_fault; + // fall through + case 1: + *prot |= PAGE_READ | PAGE_WRITE; + break; + case 2: + if (is_user) + goto do_fault; + // fall through + case 3: + if (access_type == 1) + goto do_fault; + *prot |= PAGE_READ; + break; + } + switch (level) { + case 1: + *page_size = 0x40000000; //1G + break; + case 2: + *page_size = 0x200000; // 2M + break; + case 3: + *page_size = 0x1000; // 4k + break; + } + return 0; +do_fault: + return (1 << 9) | (type << 2) | level; // DFSR value +} + static inline int get_phys_addr(CPUState *env, uint32_t address, int access_type, int is_user, - uint32_t *phys_ptr, int *prot, + uint64_t *phys_ptr, int *prot, target_ulong *page_size) { /* Fast Context Switch Extension. */ @@ -1336,8 +1495,10 @@ static inline int get_phys_addr(CPUState *env, uint32_t address, return 0; } else if (arm_feature(env, ARM_FEATURE_MPU)) { *page_size = TARGET_PAGE_SIZE; - return get_phys_addr_mpu(env, address, access_type, is_user, phys_ptr, - prot); + return get_phys_addr_mpu(env, address, access_type, is_user, phys_ptr, prot); + } else if (env->cp15.c2_control & (1 << 31)) { + return get_phys_addr_lpae(env, address, access_type, is_user, phys_ptr, + prot, page_size); } else if (env->cp15.c1_sys & (1 << 23)) { return get_phys_addr_v6(env, address, access_type, is_user, phys_ptr, prot, page_size); @@ -1350,7 +1511,7 @@ static inline int get_phys_addr(CPUState *env, uint32_t address, int cpu_arm_handle_mmu_fault (CPUState *env, target_ulong address, int access_type, int mmu_idx) { - uint32_t phys_addr; + uint64_t phys_addr; target_ulong page_size; int prot; int ret, is_user; @@ -1366,7 +1527,7 @@ int cpu_arm_handle_mmu_fault (CPUState *env, target_ulong address, return 0; } - if (access_type == 2) { + if (access_type == 2 && !arm_feature(env, ARM_FEATURE_LPAE)) { env->cp15.c5_insn = ret; env->cp15.c6_insn = address; env->exception_index = EXCP_PREFETCH_ABORT; @@ -1382,7 +1543,7 @@ int cpu_arm_handle_mmu_fault (CPUState *env, target_ulong address, target_phys_addr_t cpu_get_phys_page_debug(CPUState *env, target_ulong addr) { - uint32_t phys_addr; + uint64_t phys_addr; target_ulong page_size; int prot; int ret; @@ -1529,10 +1690,7 @@ void HELPER(set_cp15)(CPUState *env, uint32_t insn, uint32_t val) env->cp15.c2_base1 = val; break; case 2: - val &= 7; env->cp15.c2_control = val; - env->cp15.c2_mask = ~(((uint32_t)0xffffffffu) >> val); - env->cp15.c2_base_mask = ~((uint32_t)0x3fffu >> val); break; default: goto bad_reg; @@ -1611,7 +1769,7 @@ void HELPER(set_cp15)(CPUState *env, uint32_t insn, uint32_t val) } break; case 8: { - uint32_t phys_addr; + uint64_t phys_addr; target_ulong page_size; int prot; int ret, is_user = op2 & 2; @@ -2261,6 +2419,51 @@ bad_reg: return 0; } +void HELPER(set_cp15_64)(CPUState *env, uint32_t insn, uint64_t val) +{ + int crm = insn & 0xf; + int opc1 = (insn >> 4) & 0xf; + if (crm == 2) { + switch (opc1) { + case 0: + env->cp15.c2_base0 = val; + tlb_flush(env, 0); // might change ASID + return; + case 1: + env->cp15.c2_base1 = val; + tlb_flush(env, 0); // might change ASID + return; + default:; + } + } else if (crm == 7) { + if (opc1 == 0) { + env->cp15.c7_par = val; + return; + } + } + cpu_abort(env, "Unimplemented cp15 register 64bit write (c%d[%d])\n", crm, opc1); +} + +uint64_t HELPER(get_cp15_64)(CPUState *env, uint32_t insn) +{ + int crm = insn & 0xf; + int opc1 = (insn >> 4) & 0xf; + if (crm == 2) { + switch (opc1) { + case 0: + return env->cp15.c2_base0; + case 1: + return env->cp15.c2_base1; + default:; + } + } else if (crm == 7) { + if (opc1 == 0) + return env->cp15.c7_par; + } + cpu_abort(env, "Unimplemented cp15 register 64bit read (c%d[%d])\n", crm, opc1); + return 0; +} + void HELPER(set_r13_banked)(CPUState *env, uint32_t mode, uint32_t val) { if ((env->uncached_cpsr & CPSR_M) == mode) { diff --git a/target-arm/helper.h b/target-arm/helper.h index 16dd5fc..bc8151c 100644 --- a/target-arm/helper.h +++ b/target-arm/helper.h @@ -60,7 +60,9 @@ DEF_HELPER_3(v7m_msr, void, env, i32, i32) DEF_HELPER_2(v7m_mrs, i32, env, i32) DEF_HELPER_3(set_cp15, void, env, i32, i32) +DEF_HELPER_3(set_cp15_64, void, env, i32, i64) DEF_HELPER_2(get_cp15, i32, env, i32) +DEF_HELPER_2(get_cp15_64, i64, env, i32) DEF_HELPER_3(set_cp, void, env, i32, i32) DEF_HELPER_2(get_cp, i32, env, i32) diff --git a/target-arm/machine.c b/target-arm/machine.c index f66b8df..8fa738e 100644 --- a/target-arm/machine.c +++ b/target-arm/machine.c @@ -27,11 +27,9 @@ void cpu_save(QEMUFile *f, void *opaque) qemu_put_be32(f, env->cp15.c1_coproc); qemu_put_be32(f, env->cp15.c1_xscaleauxcr); qemu_put_be32(f, env->cp15.c1_scr); - qemu_put_be32(f, env->cp15.c2_base0); - qemu_put_be32(f, env->cp15.c2_base1); + qemu_put_be64(f, env->cp15.c2_base0); + qemu_put_be64(f, env->cp15.c2_base1); qemu_put_be32(f, env->cp15.c2_control); - qemu_put_be32(f, env->cp15.c2_mask); - qemu_put_be32(f, env->cp15.c2_base_mask); qemu_put_be32(f, env->cp15.c2_data); qemu_put_be32(f, env->cp15.c2_insn); qemu_put_be32(f, env->cp15.c3); @@ -42,7 +40,7 @@ void cpu_save(QEMUFile *f, void *opaque) } qemu_put_be32(f, env->cp15.c6_insn); qemu_put_be32(f, env->cp15.c6_data); - qemu_put_be32(f, env->cp15.c7_par); + qemu_put_be64(f, env->cp15.c7_par); qemu_put_be32(f, env->cp15.c9_insn); qemu_put_be32(f, env->cp15.c9_data); qemu_put_be32(f, env->cp15.c9_pmcr); @@ -145,11 +143,9 @@ int cpu_load(QEMUFile *f, void *opaque, int version_id) env->cp15.c1_coproc = qemu_get_be32(f); env->cp15.c1_xscaleauxcr = qemu_get_be32(f); env->cp15.c1_scr = qemu_get_be32(f); - env->cp15.c2_base0 = qemu_get_be32(f); - env->cp15.c2_base1 = qemu_get_be32(f); + env->cp15.c2_base0 = qemu_get_be64(f); + env->cp15.c2_base1 = qemu_get_be64(f); env->cp15.c2_control = qemu_get_be32(f); - env->cp15.c2_mask = qemu_get_be32(f); - env->cp15.c2_base_mask = qemu_get_be32(f); env->cp15.c2_data = qemu_get_be32(f); env->cp15.c2_insn = qemu_get_be32(f); env->cp15.c3 = qemu_get_be32(f); @@ -160,7 +156,7 @@ int cpu_load(QEMUFile *f, void *opaque, int version_id) } env->cp15.c6_insn = qemu_get_be32(f); env->cp15.c6_data = qemu_get_be32(f); - env->cp15.c7_par = qemu_get_be32(f); + env->cp15.c7_par = qemu_get_be64(f); env->cp15.c9_insn = qemu_get_be32(f); env->cp15.c9_data = qemu_get_be32(f); env->cp15.c9_pmcr = qemu_get_be32(f); diff --git a/target-arm/translate.c b/target-arm/translate.c index 280bfca..1f1dde0 100644 --- a/target-arm/translate.c +++ b/target-arm/translate.c @@ -2559,17 +2559,9 @@ static int disas_cp15_insn(CPUState *env, DisasContext *s, uint32_t insn) /* M profile cores use memory mapped registers instead of cp15. */ if (arm_feature(env, ARM_FEATURE_M)) - return 1; + return 1; - if ((insn & (1 << 25)) == 0) { - if (insn & (1 << 20)) { - /* mrrc */ - return 1; - } - /* mcrr. Used for block cache operations, so implement as no-op. */ - return 0; - } - if ((insn & (1 << 4)) == 0) { + if ((insn & (1 << 4)) == 0 && (insn & (1 << 25))) { /* cdp */ return 1; } @@ -2636,16 +2628,34 @@ static int disas_cp15_insn(CPUState *env, DisasContext *s, uint32_t insn) tmp2 = tcg_const_i32(insn); if (insn & ARM_CP_RW_BIT) { - tmp = tcg_temp_new_i32(); - gen_helper_get_cp15(tmp, cpu_env, tmp2); - /* If the destination register is r15 then sets condition codes. */ - if (rd != 15) - store_reg(s, rd, tmp); - else - tcg_temp_free_i32(tmp); + if ((insn & (1 << 25))) { + tmp = tcg_temp_new_i32(); + gen_helper_get_cp15(tmp, cpu_env, tmp2); + /* If the destination register is r15 then sets condition codes. */ + if (rd != 15) + store_reg(s, rd, tmp); + else + tcg_temp_free_i32(tmp); + } else { + int rd1 = (insn >> 16) & 0xf; + TCGv_i64 tmp1 = tcg_temp_new_i64(); + gen_helper_get_cp15_64(tmp1, cpu_env, tmp2); + tcg_gen_trunc_i64_i32(cpu_R[rd], tmp1); + tcg_gen_shri_i64(tmp1, tmp1, 32); + tcg_gen_trunc_i64_i32(cpu_R[rd1], tmp1); + tcg_temp_free_i64(tmp1); + } } else { tmp = load_reg(s, rd); - gen_helper_set_cp15(cpu_env, tmp2, tmp); + if ((insn & (1 << 25))) { + gen_helper_set_cp15(cpu_env, tmp2, tmp); + } else { + int rd1 = (insn >> 16) & 0xf; + TCGv_i64 tmp1 = tcg_temp_new_i64(); + tcg_gen_concat_i32_i64(tmp1, cpu_R[rd], cpu_R[rd1]); + gen_helper_set_cp15_64(cpu_env, tmp2, tmp1); + tcg_temp_free_i64(tmp1); + } tcg_temp_free_i32(tmp); /* Normally we would always end the TB here, but Linux * arch/arm/mach-pxa/sleep.S expects two instructions following