lists.openwall.net   lists  /  announce  owl-users  owl-dev  john-users  john-dev  passwdqc-users  yescrypt  popa3d-users  /  oss-security  kernel-hardening  musl  sabotage  tlsify  passwords  /  crypt-dev  xvendor  /  Bugtraq  Full-Disclosure  linux-kernel  linux-netdev  linux-ext4  linux-hardening  linux-cve-announce  PHC 
Open Source and information security mailing list archives
 
Hash Suite: Windows password security audit tool. GUI, reports in PDF.
[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <20210205131800.7d82b1b9@ibm-vm>
Date:   Fri, 5 Feb 2021 13:18:00 +0100
From:   Claudio Imbrenda <imbrenda@...ux.ibm.com>
To:     Janosch Frank <frankja@...ux.ibm.com>
Cc:     linux-kernel@...r.kernel.org, borntraeger@...ibm.com,
        david@...hat.com, kvm@...r.kernel.org, linux-s390@...r.kernel.org,
        stable@...r.kernel.org
Subject: Re: [PATCH v2 1/2] s390/kvm: extend kvm_s390_shadow_fault to return
 entry pointer

On Thu, 4 Feb 2021 18:05:15 +0100
Janosch Frank <frankja@...ux.ibm.com> wrote:

> On 2/4/21 5:34 PM, Janosch Frank wrote:
> > On 2/2/21 7:00 PM, Claudio Imbrenda wrote:  
> >> Extend kvm_s390_shadow_fault to return the pointer to the valid
> >> leaf DAT table entry, or to the invalid entry.
> >>
> >> Also return some flags in the lower bits of the address:
> >> DAT_PROT: indicates that DAT protection applies because of the
> >>           protection bit in the segment (or, if EDAT, region)
> >> tables NOT_PTE: indicates that the address of the DAT table entry
> >> returned does not refer to a PTE, but to a segment or region table.
> >>
> >> Signed-off-by: Claudio Imbrenda <imbrenda@...ux.ibm.com>
> >> Cc: stable@...r.kernel.org
> >> ---
> >>  arch/s390/kvm/gaccess.c | 26 ++++++++++++++++++++++----
> >>  arch/s390/kvm/gaccess.h |  5 ++++-
> >>  arch/s390/kvm/vsie.c    |  8 ++++----
> >>  3 files changed, 30 insertions(+), 9 deletions(-)
> >>
> >> diff --git a/arch/s390/kvm/gaccess.c b/arch/s390/kvm/gaccess.c
> >> index 6d6b57059493..2d7bcbfb185e 100644
> >> --- a/arch/s390/kvm/gaccess.c
> >> +++ b/arch/s390/kvm/gaccess.c
> >> @@ -1034,6 +1034,7 @@ static int kvm_s390_shadow_tables(struct
> >> gmap *sg, unsigned long saddr, rfte.val = ptr;
> >>  			goto shadow_r2t;
> >>  		}
> >> +		*pgt = ptr + vaddr.rfx * 8;  
> > 
> > So pgt either is a table entry if rc > 0 or a pointer to the first
> > pte on rc == 0 after this change?
> > 
> > Hrm, if it is really based on RCs than I might be able to come to
> > terms with having two things in a ptr with the name pgt. But it
> > needs a comment change.
> >   
> >>  		rc = gmap_read_table(parent, ptr + vaddr.rfx * 8,
> >> &rfte.val); if (rc)
> >>  			return rc;
> >> @@ -1060,6 +1061,7 @@ static int kvm_s390_shadow_tables(struct
> >> gmap *sg, unsigned long saddr, rste.val = ptr;
> >>  			goto shadow_r3t;
> >>  		}
> >> +		*pgt = ptr + vaddr.rsx * 8;
> >>  		rc = gmap_read_table(parent, ptr + vaddr.rsx * 8,
> >> &rste.val); if (rc)
> >>  			return rc;
> >> @@ -1087,6 +1089,7 @@ static int kvm_s390_shadow_tables(struct
> >> gmap *sg, unsigned long saddr, rtte.val = ptr;
> >>  			goto shadow_sgt;
> >>  		}
> >> +		*pgt = ptr + vaddr.rtx * 8;
> >>  		rc = gmap_read_table(parent, ptr + vaddr.rtx * 8,
> >> &rtte.val); if (rc)
> >>  			return rc;
> >> @@ -1123,6 +1126,7 @@ static int kvm_s390_shadow_tables(struct
> >> gmap *sg, unsigned long saddr, ste.val = ptr;
> >>  			goto shadow_pgt;
> >>  		}
> >> +		*pgt = ptr + vaddr.sx * 8;
> >>  		rc = gmap_read_table(parent, ptr + vaddr.sx * 8,
> >> &ste.val); if (rc)
> >>  			return rc;
> >> @@ -1157,6 +1161,8 @@ static int kvm_s390_shadow_tables(struct
> >> gmap *sg, unsigned long saddr,
> >>   * @vcpu: virtual cpu
> >>   * @sg: pointer to the shadow guest address space structure
> >>   * @saddr: faulting address in the shadow gmap
> >> + * @pteptr: will contain the address of the faulting DAT table
> >> entry, or of
> >> + *          the valid leaf, plus some flags  
> > 
> > pteptr is not the right name if it can be two things  
> 
> You use it for pei only, right?

yes

> >   
> >>   *
> >>   * Returns: - 0 if the shadow fault was successfully resolved
> >>   *	    - > 0 (pgm exception code) on exceptions while
> >> faulting @@ -1165,11 +1171,11 @@ static int
> >> kvm_s390_shadow_tables(struct gmap *sg, unsigned long saddr,
> >>   *	    - -ENOMEM if out of memory
> >>   */
> >>  int kvm_s390_shadow_fault(struct kvm_vcpu *vcpu, struct gmap *sg,
> >> -			  unsigned long saddr)
> >> +			  unsigned long saddr, unsigned long
> >> *pteptr) {
> >>  	union vaddress vaddr;
> >>  	union page_table_entry pte;
> >> -	unsigned long pgt;
> >> +	unsigned long pgt = 0;
> >>  	int dat_protection, fake;
> >>  	int rc;
> >>  
> >> @@ -1191,8 +1197,20 @@ int kvm_s390_shadow_fault(struct kvm_vcpu
> >> *vcpu, struct gmap *sg, pte.val = pgt + vaddr.px * PAGE_SIZE;
> >>  		goto shadow_page;
> >>  	}
> >> -	if (!rc)
> >> -		rc = gmap_read_table(sg->parent, pgt + vaddr.px *
> >> 8, &pte.val); +
> >> +	switch (rc) {
> >> +	case PGM_SEGMENT_TRANSLATION:
> >> +	case PGM_REGION_THIRD_TRANS:
> >> +	case PGM_REGION_SECOND_TRANS:
> >> +	case PGM_REGION_FIRST_TRANS:
> >> +		pgt |= NOT_PTE;  
> > 
> > GACC_TRANSL_ENTRY_INV ?
> >   
> >> +		break;
> >> +	case 0:
> >> +		pgt += vaddr.px * 8;
> >> +		rc = gmap_read_table(sg->parent, pgt, &pte.val);
> >> +	}
> >> +	if (*pteptr)
> >> +		*pteptr = pgt | dat_protection * DAT_PROT;
> >>  	if (!rc && pte.i)
> >>  		rc = PGM_PAGE_TRANSLATION;
> >>  	if (!rc && pte.z)
> >> diff --git a/arch/s390/kvm/gaccess.h b/arch/s390/kvm/gaccess.h
> >> index f4c51756c462..66a6e2cec97a 100644
> >> --- a/arch/s390/kvm/gaccess.h
> >> +++ b/arch/s390/kvm/gaccess.h
> >> @@ -359,7 +359,10 @@ void ipte_unlock(struct kvm_vcpu *vcpu);
> >>  int ipte_lock_held(struct kvm_vcpu *vcpu);
> >>  int kvm_s390_check_low_addr_prot_real(struct kvm_vcpu *vcpu,
> >> unsigned long gra); 
> >> +#define DAT_PROT 2  
> > 
> > GACC_TRANSL_ENTRY_PROT  
> 
> Ok after a second pass that's not what's going on here.
> Those basically directly correspond to the MVPG PEI indication bits,
> right?

yes :)

> Do we also need to consider bit 63?

no, that can only happen if a specific SIE feature is used, which KVM
neither uses nor supports for VSIE, so it cannot happen

> >   
> >> +#define NOT_PTE 4
> >> +
> >>  int kvm_s390_shadow_fault(struct kvm_vcpu *vcpu, struct gmap
> >> *shadow,
> >> -			  unsigned long saddr);
> >> +			  unsigned long saddr, unsigned long
> >> *pteptr); 
> >>  #endif /* __KVM_S390_GACCESS_H */
> >> diff --git a/arch/s390/kvm/vsie.c b/arch/s390/kvm/vsie.c
> >> index c5d0a58b2c29..7db022141db3 100644
> >> --- a/arch/s390/kvm/vsie.c
> >> +++ b/arch/s390/kvm/vsie.c
> >> @@ -619,10 +619,10 @@ static int map_prefix(struct kvm_vcpu *vcpu,
> >> struct vsie_page *vsie_page) /* with mso/msl, the prefix lies at
> >> offset *mso* */ prefix += scb_s->mso;
> >>  
> >> -	rc = kvm_s390_shadow_fault(vcpu, vsie_page->gmap, prefix);
> >> +	rc = kvm_s390_shadow_fault(vcpu, vsie_page->gmap, prefix,
> >> NULL); if (!rc && (scb_s->ecb & ECB_TE))
> >>  		rc = kvm_s390_shadow_fault(vcpu, vsie_page->gmap,
> >> -					   prefix + PAGE_SIZE);
> >> +					   prefix + PAGE_SIZE,
> >> NULL); /*
> >>  	 * We don't have to mprotect, we will be called for all
> >> unshadows.
> >>  	 * SIE will detect if protection applies and trigger a
> >> validity. @@ -913,7 +913,7 @@ static int handle_fault(struct
> >> kvm_vcpu *vcpu, struct vsie_page *vsie_page)
> >> current->thread.gmap_addr, 1); 
> >>  	rc = kvm_s390_shadow_fault(vcpu, vsie_page->gmap,
> >> -				   current->thread.gmap_addr);
> >> +				   current->thread.gmap_addr,
> >> NULL); if (rc > 0) {
> >>  		rc = inject_fault(vcpu, rc,
> >>  				  current->thread.gmap_addr,
> >> @@ -935,7 +935,7 @@ static void handle_last_fault(struct kvm_vcpu
> >> *vcpu, {
> >>  	if (vsie_page->fault_addr)
> >>  		kvm_s390_shadow_fault(vcpu, vsie_page->gmap,
> >> -				      vsie_page->fault_addr);
> >> +				      vsie_page->fault_addr,
> >> NULL);  
> > 
> > Ok
> >   
> >>  	vsie_page->fault_addr = 0;
> >>  }
> >>  
> >>  
> >   
> 

Powered by blists - more mailing lists

Powered by Openwall GNU/*/Linux Powered by OpenVZ