[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]
Re: [PATCH 6/6] target/arm: Implement FEAT_LPA2
From: |
Peter Maydell |
Subject: |
Re: [PATCH 6/6] target/arm: Implement FEAT_LPA2 |
Date: |
Fri, 7 Jan 2022 14:39:58 +0000 |
On Wed, 8 Dec 2021 at 23:21, Richard Henderson
<richard.henderson@linaro.org> wrote:
>
> Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
Again, a commit message would be nice.
> ---
> target/arm/cpu.h | 12 +++++++
> target/arm/internals.h | 2 ++
> target/arm/cpu64.c | 2 ++
> target/arm/helper.c | 80 +++++++++++++++++++++++++++++++++++-------
> 4 files changed, 83 insertions(+), 13 deletions(-)
>
> diff --git a/target/arm/cpu.h b/target/arm/cpu.h
> index 3149000004..379585352b 100644
> --- a/target/arm/cpu.h
> +++ b/target/arm/cpu.h
> @@ -4283,6 +4283,18 @@ static inline bool isar_feature_aa64_i8mm(const
> ARMISARegisters *id)
> return FIELD_EX64(id->id_aa64isar1, ID_AA64ISAR1, I8MM) != 0;
> }
>
> +static inline bool isar_feature_aa64_tgran4_lpa2(const ARMISARegisters *id)
> +{
> + return sextract64(id->id_aa64mmfr0,
> + R_ID_AA64MMFR0_TGRAN4_SHIFT,
> + R_ID_AA64MMFR0_TGRAN4_LENGTH) >= 1;
> +}
> +
> +static inline bool isar_feature_aa64_tgran16_lpa2(const ARMISARegisters *id)
> +{
> + return FIELD_EX64(id->id_aa64mmfr0, ID_AA64MMFR0, TGRAN16) >= 2;
> +}
(I wonder if we should have a FIELD_SEX64 etc ?)
> +
> static inline bool isar_feature_aa64_ccidx(const ARMISARegisters *id)
> {
> return FIELD_EX64(id->id_aa64mmfr2, ID_AA64MMFR2, CCIDX) != 0;
> diff --git a/target/arm/internals.h b/target/arm/internals.h
> index 3e801833b4..868cae2a55 100644
> --- a/target/arm/internals.h
> +++ b/target/arm/internals.h
> @@ -1033,12 +1033,14 @@ static inline uint32_t
> aarch64_pstate_valid_mask(const ARMISARegisters *id)
> typedef struct ARMVAParameters {
> unsigned tsz : 8;
> unsigned ps : 3;
> + unsigned sh : 2;
> unsigned select : 1;
> bool tbi : 1;
> bool epd : 1;
> bool hpd : 1;
> bool using16k : 1;
> bool using64k : 1;
> + bool ds : 1;
> } ARMVAParameters;
>
> ARMVAParameters aa64_va_parameters(CPUARMState *env, uint64_t va,
> diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c
> index 3bb79ca744..5a1940aa94 100644
> --- a/target/arm/cpu64.c
> +++ b/target/arm/cpu64.c
> @@ -740,6 +740,8 @@ static void aarch64_max_initfn(Object *obj)
>
> t = cpu->isar.id_aa64mmfr0;
> t = FIELD_DP64(t, ID_AA64MMFR0, PARANGE, 6); /* FEAT_LPA: 52 bits */
> + t = FIELD_DP64(t, ID_AA64MMFR0, TGRAN16, 2); /* FEAT_LPA2: 52 bits */
> + t = FIELD_DP64(t, ID_AA64MMFR0, TGRAN4, 1); /* FEAT_LPA2: 52 bits */
Shouldn't we also set the TGRAN4_2 and TGRAN16_2 fields?
> cpu->isar.id_aa64mmfr0 = t;
>
> t = cpu->isar.id_aa64mmfr1;
> diff --git a/target/arm/helper.c b/target/arm/helper.c
> index e39c1f5b3a..f4a8b37f98 100644
> --- a/target/arm/helper.c
> +++ b/target/arm/helper.c
> @@ -11008,8 +11008,13 @@ static bool check_s2_mmu_setup(ARMCPU *cpu, bool
> is_aa64, int level,
> const int grainsize = stride + 3;
> int startsizecheck;
>
> - /* Negative levels are never allowed. */
> - if (level < 0) {
> + /*
> + * Negative levels are usually not allowed...
> + * Except for FEAT_LPA2, 4k page table, 52-bit address space, which
> + * begins with level -1. Note that previous feature tests will have
> + * eliminated this combination if it is not enabled.
> + */
> + if (level < (inputsize == 52 && stride == 9 ? -1 : 0)) {
> return false;
> }
The checks on validity of 'level' are getting quite complicated:
* we do this check here (which now involves 'stride')
* some values of 'level' will cause the startsizecheck to fail
(calculation of startsizecheck also involves 'stride')
* we then switch on 'stride' and check for 'level' validity
differently in the various cases
Can we simplify this at all ? Or are we just following the logic
the pseudocode uses (I haven't checked) ?
> @@ -11150,8 +11155,8 @@ ARMVAParameters aa64_va_parameters(CPUARMState *env,
> uint64_t va,
> ARMMMUIdx mmu_idx, bool data)
> {
> uint64_t tcr = regime_tcr(env, mmu_idx)->raw_tcr;
> - bool epd, hpd, using16k, using64k;
> - int select, tsz, tbi, ps;
> + bool epd, hpd, using16k, using64k, ds;
> + int select, tsz, tbi, ps, sh;
>
> if (!regime_has_2_ranges(mmu_idx)) {
> select = 0;
> @@ -11165,7 +11170,9 @@ ARMVAParameters aa64_va_parameters(CPUARMState *env,
> uint64_t va,
> hpd = extract32(tcr, 24, 1);
> }
> epd = false;
> + sh = extract64(tcr, 12, 2);
> ps = extract64(tcr, 16, 3);
> + ds = extract64(tcr, 32, 1);
> } else {
> /*
> * Bit 55 is always between the two regions, and is canonical for
> @@ -11175,6 +11182,7 @@ ARMVAParameters aa64_va_parameters(CPUARMState *env,
> uint64_t va,
> if (!select) {
> tsz = extract32(tcr, 0, 6);
> epd = extract32(tcr, 7, 1);
> + sh = extract32(tcr, 12, 2);
> using64k = extract32(tcr, 14, 1);
> using16k = extract32(tcr, 15, 1);
> hpd = extract64(tcr, 41, 1);
> @@ -11184,9 +11192,11 @@ ARMVAParameters aa64_va_parameters(CPUARMState *env,
> uint64_t va,
> using64k = tg == 3;
> tsz = extract32(tcr, 16, 6);
> epd = extract32(tcr, 23, 1);
> + sh = extract32(tcr, 28, 2);
> hpd = extract64(tcr, 42, 1);
> }
> ps = extract64(tcr, 32, 3);
> + ds = extract64(tcr, 59, 1);
> }
>
> /* Present TBI as a composite with TBID. */
> @@ -11199,12 +11209,14 @@ ARMVAParameters aa64_va_parameters(CPUARMState
> *env, uint64_t va,
> return (ARMVAParameters) {
> .tsz = tsz,
> .ps = ps,
> + .sh = sh,
> .select = select,
> .tbi = tbi,
> .epd = epd,
> .hpd = hpd,
> .using16k = using16k,
> .using64k = using64k,
> + .ds = ds,
> };
> }
>
> @@ -11332,15 +11344,31 @@ static bool get_phys_addr_lpae(CPUARMState *env,
> uint64_t address,
> access_type != MMU_INST_FETCH);
> level = 0;
>
> - if (cpu_isar_feature(aa64_st, env_archcpu(env))) {
> + /* Find the minimum allowed input address size. */
> + if (cpu_isar_feature(aa64_st, cpu)) {
> max_tsz = 48 - param.using64k;
> }
> +
> + /*
> + * Find the maximum allowed input address size.
> + * DS is RES0 unless FEAT_LPA2 is supported for the given page size;
> + * adjust param.ds to the effective value of DS, as documented.
> + */
> if (param.using64k) {
> - if (cpu_isar_feature(aa64_lva, env_archcpu(env))) {
> + if (cpu_isar_feature(aa64_lva, cpu)) {
> min_tsz = 12;
> }
> + param.ds = false;
> + } else if (param.ds) {
> + /* ??? Assume tgran{4,16}_2 == 0, i.e. match tgran{4,16}. */
How painful would it be to fix this '???' ? Setting those fields to 0 is
deprecated, so it would be preferable not to start out depending on that.
(We don't currently use the tgran fields at all, I guess because we allow
all page sizes regardless of the ID register values. Maybe we should
correct that too.)
> + if (param.using16k
> + ? cpu_isar_feature(aa64_tgran16_lpa2, cpu)
> + : cpu_isar_feature(aa64_tgran4_lpa2, cpu)) {
> + min_tsz = 12;
> + } else {
> + param.ds = false;
> + }
> }
> - /* TODO: FEAT_LPA2 */
>
> /*
> * If TxSZ is programmed to a value larger than the maximum,
> @@ -11441,10 +11469,19 @@ static bool get_phys_addr_lpae(CPUARMState *env,
> uint64_t address,
> * VTCR_EL2.SL0 field (whose interpretation depends on the page size)
> */
> uint32_t sl0 = extract32(tcr->raw_tcr, 6, 2);
> + uint32_t sl2 = extract64(tcr->raw_tcr, 33, 1);
> uint32_t startlevel;
> bool ok;
>
> - if (!aarch64 || stride == 9) {
> + /* SL2 is RES0 unless DS=1 & 4kb granule. */
> + if (param.ds && stride == 9 && sl2) {
> + if (sl0 != 0) {
> + level = 0;
> + fault_type = ARMFault_Translation;
> + goto do_fault;
> + }
> + startlevel = -1;
> + } else if (!aarch64 || stride == 9) {
> /* AArch32 or 4KB pages */
> startlevel = 2 - sl0;
>
> @@ -11499,7 +11536,9 @@ static bool get_phys_addr_lpae(CPUARMState *env,
> uint64_t address,
> * but in ARMv8 they are checked for zero and an AddressSize fault
> * is raised if they are not.
> */
> - if (aarch64 || arm_feature(env, ARM_FEATURE_V8)) {
> + if (param.ds) {
> + descaddrmask = MAKE_64BIT_MASK(0, 50);
> + } else if (aarch64 || arm_feature(env, ARM_FEATURE_V8)) {
> descaddrmask = MAKE_64BIT_MASK(0, 48);
> } else {
> descaddrmask = MAKE_64BIT_MASK(0, 40);
> @@ -11534,11 +11573,16 @@ static bool get_phys_addr_lpae(CPUARMState *env,
> uint64_t address,
>
> /*
> * For FEAT_LPA and PS=6, bits [51:48] of descaddr are in [15:12]
> - * of descriptor. Otherwise, if descaddr is out of range, raise
> - * AddressSizeFault.
> + * of descriptor. For FEAT_LPA2 and effective DS, bits [51:50] of
> + * descaddr are in [9:8]. Otherwise, if descaddr is out of range,
> + * raise AddressSizeFault.
> */
> if (outputsize > 48) {
> - descaddr |= extract64(descriptor, 12, 4) << 48;
> + if (param.ds) {
> + descaddr |= extract64(descriptor, 8, 2) << 50;
> + } else {
> + descaddr |= extract64(descriptor, 12, 4) << 48;
> + }
> } else if (descaddr >> outputsize) {
> fault_type = ARMFault_AddressSize;
> goto do_fault;
> @@ -11632,7 +11676,17 @@ static bool get_phys_addr_lpae(CPUARMState *env,
> uint64_t address,
> assert(attrindx <= 7);
> cacheattrs->attrs = extract64(mair, attrindx * 8, 8);
> }
> - cacheattrs->shareability = extract32(attrs, 6, 2);
> +
> + /*
> + * For FEAT_LPA2 and effective DS, the SH field in the attributes
> + * was re-purposed for output address bits. The SH attribute in
> + * that case comes from TCR_ELx, which we extracted earlier.
> + */
> + if (param.ds) {
> + cacheattrs->shareability = param.sh;
> + } else {
> + cacheattrs->shareability = extract32(attrs, 6, 2);
> + }
>
> *phys_ptr = descaddr;
> *page_size_ptr = page_size;
The code above looks correct to me. There are some missing pieces
elsewhere, though:
(1) The handling of the BaseADDR field for TLB range
invalidates needs updating (there's a TODO to this effect in
tlbi_aa64_range_get_base()).
Side note: in that function, we shift the field by TARGET_PAGE_BITS,
but the docs say that the shift should depend on the configured
translation granule. Is that a bug?
(2) There are some new long-form fault status codes with FEAT_LPA2,
corresponding to various fault types that can now occur at level -1.
arm_fi_to_lfsc() needs updating to handle fi->level being -1.
(You could do this bit as a preceding patch; it doesn't need to
be squashed into this one.)
thanks
-- PMM
[Prev in Thread] |
Current Thread |
[Next in Thread] |
- Re: [PATCH 6/6] target/arm: Implement FEAT_LPA2,
Peter Maydell <=