[Skiboot] [PATCH skiboot v2] opal: Deprecate reading the PHB status

Alexey Kardashevskiy aik at ozlabs.ru
Wed Feb 13 17:14:18 AEDT 2019



On 11/01/2019 15:03, Alexey Kardashevskiy wrote:
> The OPAL_PCI_EEH_FREEZE_STATUS call takes a bunch of parameters, one of
> them is @phb_status. It is defined as __be64* and always NULL in
> the current Linux upstream but if anyone ever decides to read that status,
> then the PHB3's handler will assume it is struct OpalIoPhb3ErrorData*
> (which is a lot bigger than 8 bytes) and zero it causing the stack
> corruption; p7ioc-phb has the same issue.
> 
> This removes @phb_status from all eeh_freeze_status() hooks and moves
> the error message from PHB4 to the affected OPAL handlers.
> 
> Signed-off-by: Alexey Kardashevskiy <aik at ozlabs.ru>

Stewart, ping?


> ---
> Changes:
> v2:
> * instead of fixing just phb3, this removes phb_status from everywhere
> 
> ---
>  include/npu2.h  |  3 +--
>  include/pci.h   |  3 +--
>  core/pci-opal.c | 14 ++++++++++++--
>  core/pci.c      |  2 +-
>  hw/npu.c        |  3 +--
>  hw/npu2.c       |  3 +--
>  hw/p7ioc-phb.c  | 11 +++--------
>  hw/phb3.c       | 10 ++--------
>  hw/phb4.c       |  9 ++-------
>  9 files changed, 24 insertions(+), 34 deletions(-)
> 
> diff --git a/include/npu2.h b/include/npu2.h
> index 1de963d..dc5d48b 100644
> --- a/include/npu2.h
> +++ b/include/npu2.h
> @@ -231,6 +231,5 @@ int64_t npu2_freeze_status(struct phb *phb __unused,
>  			   uint64_t pe_number __unused,
>  			   uint8_t *freeze_state,
>  			   uint16_t *pci_error_type __unused,
> -			   uint16_t *severity __unused,
> -			   uint64_t *phb_status __unused);
> +			   uint16_t *severity __unused);
>  #endif /* __NPU2_H */
> diff --git a/include/pci.h b/include/pci.h
> index 0516561..b49641c 100644
> --- a/include/pci.h
> +++ b/include/pci.h
> @@ -260,8 +260,7 @@ struct phb_ops {
>  	int64_t (*eeh_freeze_status)(struct phb *phb, uint64_t pe_number,
>  				     uint8_t *freeze_state,
>  				     uint16_t *pci_error_type,
> -				     uint16_t *severity,
> -				     uint64_t *phb_status);
> +				     uint16_t *severity);
>  	int64_t (*eeh_freeze_clear)(struct phb *phb, uint64_t pe_number,
>  				    uint64_t eeh_action_token);
>  	int64_t (*eeh_freeze_set)(struct phb *phb, uint64_t pe_number,
> diff --git a/core/pci-opal.c b/core/pci-opal.c
> index a4d6eee..d7abb15 100644
> --- a/core/pci-opal.c
> +++ b/core/pci-opal.c
> @@ -111,8 +111,13 @@ static int64_t opal_pci_eeh_freeze_status(uint64_t phb_id, uint64_t pe_number,
>  	if (!phb->ops->eeh_freeze_status)
>  		return OPAL_UNSUPPORTED;
>  	phb_lock(phb);
> +
> +	if (phb_status)
> +		prlog(PR_ERR, "PHB#%04llx: %s: deprecated PHB status\n",
> +				phb_id, __func__);
> +
>  	rc = phb->ops->eeh_freeze_status(phb, pe_number, freeze_state,
> -					 pci_error_type, NULL, phb_status);
> +					 pci_error_type, NULL);
>  	phb_unlock(phb);
>  
>  	return rc;
> @@ -961,8 +966,13 @@ static int64_t opal_pci_eeh_freeze_status2(uint64_t phb_id, uint64_t pe_number,
>  	if (!phb->ops->eeh_freeze_status)
>  		return OPAL_UNSUPPORTED;
>  	phb_lock(phb);
> +
> +	if (phb_status)
> +		prlog(PR_ERR, "PHB#%04llx: %s: deprecated PHB status\n",
> +				phb_id, __func__);
> +
>  	rc = phb->ops->eeh_freeze_status(phb, pe_number, freeze_state,
> -					 pci_error_type, severity, phb_status);
> +					 pci_error_type, severity);
>  	phb_unlock(phb);
>  
>  	return rc;
> diff --git a/core/pci.c b/core/pci.c
> index 14654d4..454b501 100644
> --- a/core/pci.c
> +++ b/core/pci.c
> @@ -337,7 +337,7 @@ static void pci_check_clear_freeze(struct phb *phb)
>  
>  	/* Retrieve the frozen state */
>  	rc = phb->ops->eeh_freeze_status(phb, pe_number, &freeze_state,
> -					 &pci_error_type, &sev, NULL);
> +					 &pci_error_type, &sev);
>  	if (rc)
>  		return;
>  	if (freeze_state == OPAL_EEH_STOPPED_NOT_FROZEN)
> diff --git a/hw/npu.c b/hw/npu.c
> index 08eee61..f505ac7 100644
> --- a/hw/npu.c
> +++ b/hw/npu.c
> @@ -882,8 +882,7 @@ static int64_t npu_freeze_status(struct phb *phb,
>  				     uint64_t pe_number __unused,
>  				     uint8_t *freeze_state,
>  				     uint16_t *pci_error_type __unused,
> -				     uint16_t *severity __unused,
> -				     uint64_t *phb_status __unused)
> +				     uint16_t *severity __unused)
>  {
>  	/* FIXME: When it's called by skiboot PCI config accessor,
>  	 * the PE number is fixed to 0, which is incorrect. We need
> diff --git a/hw/npu2.c b/hw/npu2.c
> index 4e75eeb..ea465f1 100644
> --- a/hw/npu2.c
> +++ b/hw/npu2.c
> @@ -1319,8 +1319,7 @@ int64_t npu2_freeze_status(struct phb *phb __unused,
>  			   uint64_t pe_number __unused,
>  			   uint8_t *freeze_state,
>  			   uint16_t *pci_error_type,
> -			   uint16_t *severity,
> -			   uint64_t *phb_status __unused)
> +			   uint16_t *severity)
>  {
>  	/*
>  	 * FIXME: When it's called by skiboot PCI config accessor,
> diff --git a/hw/p7ioc-phb.c b/hw/p7ioc-phb.c
> index e8730f4..f09e30c 100644
> --- a/hw/p7ioc-phb.c
> +++ b/hw/p7ioc-phb.c
> @@ -284,8 +284,7 @@ static void p7ioc_eeh_read_phb_status(struct p7ioc_phb *p,
>  static int64_t p7ioc_eeh_freeze_status(struct phb *phb, uint64_t pe_number,
>  				       uint8_t *freeze_state,
>  				       uint16_t *pci_error_type,
> -				       uint16_t *severity,
> -				       uint64_t *phb_status)
> +				       uint16_t *severity)
>  {
>  	struct p7ioc_phb *p = phb_to_p7ioc_phb(phb);
>  	uint64_t peev_bit = PPC_BIT(pe_number & 0x3f);
> @@ -301,7 +300,7 @@ static int64_t p7ioc_eeh_freeze_status(struct phb *phb, uint64_t pe_number,
>  		*pci_error_type = OPAL_EEH_PHB_ERROR;
>  		if (severity)
>  			*severity = OPAL_EEH_SEV_PHB_DEAD;
> -		goto bail;
> +		return OPAL_SUCCESS;
>  	}
>  
>  	/* Check fence */
> @@ -311,7 +310,7 @@ static int64_t p7ioc_eeh_freeze_status(struct phb *phb, uint64_t pe_number,
>  		*pci_error_type = OPAL_EEH_PHB_ERROR;
>  		if (severity)
>  			*severity = OPAL_EEH_SEV_PHB_FENCED;
> -		goto bail;
> +		return OPAL_SUCCESS;
>  	}
>  
>  	/* Check the PEEV */
> @@ -345,10 +344,6 @@ static int64_t p7ioc_eeh_freeze_status(struct phb *phb, uint64_t pe_number,
>  	else
>  		*pci_error_type = OPAL_EEH_PE_DMA_ERROR;
>  
> - bail:
> -	if (phb_status)
> -		p7ioc_eeh_read_phb_status(p, (struct OpalIoP7IOCPhbErrorData *)
> -					  phb_status);
>  	return OPAL_SUCCESS;
>  }
>  
> diff --git a/hw/phb3.c b/hw/phb3.c
> index 04c8b78..956a6f6 100644
> --- a/hw/phb3.c
> +++ b/hw/phb3.c
> @@ -2747,8 +2747,7 @@ static struct pci_slot *phb3_slot_create(struct phb *phb)
>  static int64_t phb3_eeh_freeze_status(struct phb *phb, uint64_t pe_number,
>  				      uint8_t *freeze_state,
>  				      uint16_t *pci_error_type,
> -				      uint16_t *severity,
> -				      uint64_t *phb_status)
> +				      uint16_t *severity)
>  {
>  	struct phb3 *p = phb_to_phb3(phb);
>  	uint64_t peev_bit = PPC_BIT(pe_number & 0x3f);
> @@ -2773,7 +2772,7 @@ static int64_t phb3_eeh_freeze_status(struct phb *phb, uint64_t pe_number,
>  		*pci_error_type = OPAL_EEH_PHB_ERROR;
>  		if (severity)
>  			*severity = OPAL_EEH_SEV_PHB_FENCED;
> -		goto bail;
> +		return OPAL_SUCCESS;
>  	}
>  
>  	/* Check the PEEV */
> @@ -2799,11 +2798,6 @@ static int64_t phb3_eeh_freeze_status(struct phb *phb, uint64_t pe_number,
>  	if (pestb & IODA2_PESTB_DMA_STOPPED)
>  		*freeze_state |= OPAL_EEH_STOPPED_DMA_FREEZE;
>  
> -bail:
> -	if (phb_status)
> -		phb3_read_phb_status(p,
> -			(struct OpalIoPhb3ErrorData *)phb_status);
> -
>  	return OPAL_SUCCESS;
>  }
>  
> diff --git a/hw/phb4.c b/hw/phb4.c
> index c079764..f2a31ab 100644
> --- a/hw/phb4.c
> +++ b/hw/phb4.c
> @@ -3341,8 +3341,7 @@ static bool phb4_freeze_escalate(uint64_t pesta)
>  static int64_t phb4_eeh_freeze_status(struct phb *phb, uint64_t pe_number,
>  				      uint8_t *freeze_state,
>  				      uint16_t *pci_error_type,
> -				      uint16_t *severity,
> -				      uint64_t *phb_status)
> +				      uint16_t *severity)
>  {
>  	struct phb4 *p = phb_to_phb4(phb);
>  	uint64_t peev_bit = PPC_BIT(pe_number & 0x3f);
> @@ -3367,7 +3366,7 @@ static int64_t phb4_eeh_freeze_status(struct phb *phb, uint64_t pe_number,
>  		*pci_error_type = OPAL_EEH_PHB_ERROR;
>  		if (severity)
>  			*severity = OPAL_EEH_SEV_PHB_FENCED;
> -		goto bail;
> +		return OPAL_SUCCESS;
>  	}
>  
>  	/* Check the PEEV */
> @@ -3401,10 +3400,6 @@ static int64_t phb4_eeh_freeze_status(struct phb *phb, uint64_t pe_number,
>  	if (pestb & IODA3_PESTB_DMA_STOPPED)
>  		*freeze_state |= OPAL_EEH_STOPPED_DMA_FREEZE;
>  
> -bail:
> -	if (phb_status)
> -		PHBERR(p, "%s: deprecated PHB status\n", __func__);
> -
>  	return OPAL_SUCCESS;
>  }
>  
> 

-- 
Alexey


More information about the Skiboot mailing list