[PATCH v2] cxl: Export AFU error buffer via sysfs
Michael Neuling
mikeyjo at neuling.org
Wed May 20 22:31:39 AEST 2015
On Wed, 2015-05-20 at 22:12 +1000, Michael Neuling wrote:
> On Wed, 2015-05-20 at 16:26 +0530, Vaibhav Jain wrote:
> > Export the "AFU Error Buffer" via sysfs attribute (afu_err_buf). AFU
> > error buffer is used by the AFU to report application specific
> > errors. The contents of this buffer are AFU specific and are intended to
> > be interpreted by the application interacting with the afu.
> >
> > Testing:
> > - Build against pseries le/be configs.
> > - Run testing with a special version of memcpy afu on a 'be'
> > kernel.
> >
> > Change-log:
> > v1 -> v2
> > - Simplified cxl_afu_read_err_buffer to handle unaligned reads
> > by performing a short read.
> >
> > Signed-off-by: Vaibhav Jain <vaibhav at linux.vnet.ibm.com>
> > ---
> > Documentation/ABI/testing/sysfs-class-cxl | 11 ++++++
> > drivers/misc/cxl/cxl.h | 7 ++++
> > drivers/misc/cxl/pci.c | 60 +++++++++++++++++++++++++++++++
> > drivers/misc/cxl/sysfs.c | 33 +++++++++++++++++
> > 4 files changed, 111 insertions(+)
> >
> > diff --git a/Documentation/ABI/testing/sysfs-class-cxl b/Documentation/ABI/testing/sysfs-class-cxl
> > index d46bba8..45e9ce3 100644
> > --- a/Documentation/ABI/testing/sysfs-class-cxl
> > +++ b/Documentation/ABI/testing/sysfs-class-cxl
> > @@ -6,6 +6,17 @@ Example: The real path of the attribute /sys/class/cxl/afu0.0s/irqs_max is
> >
> > Slave contexts (eg. /sys/class/cxl/afu0.0s):
> >
> > +What: /sys/class/cxl/<afu>/afu_err_buf
> > +Date: September 2014
> > +Contact: linuxppc-dev at lists.ozlabs.org
> > +Description: read only
> > + AFU Error Buffer contents. The contents of this file are
> > + application specific and depend on the AFU being used.
> > + Applications interacting with the AFU can use this attribute
> > + to know about the current error condition and take appropriate
> > + action like logging the event etc.
> > +
> > +
> > What: /sys/class/cxl/<afu>/irqs_max
> > Date: September 2014
> > Contact: linuxppc-dev at lists.ozlabs.org
> > diff --git a/drivers/misc/cxl/cxl.h b/drivers/misc/cxl/cxl.h
> > index a1cee47..789f077 100644
> > --- a/drivers/misc/cxl/cxl.h
> > +++ b/drivers/misc/cxl/cxl.h
> > @@ -362,6 +362,10 @@ struct cxl_afu {
> > struct mutex spa_mutex;
> > spinlock_t afu_cntl_lock;
> >
> > + /* AFU error buffer fields and bin attribute for sysfs */
> > + u64 eb_len, eb_offset;
> > + struct bin_attribute attr_eb;
> > +
> > /*
> > * Only the first part of the SPA is used for the process element
> > * linked list. The only other part that software needs to worry about
> > @@ -563,6 +567,9 @@ static inline void __iomem *_cxl_p2n_addr(struct cxl_afu *afu, cxl_p2n_reg_t reg
> > u16 cxl_afu_cr_read16(struct cxl_afu *afu, int cr, u64 off);
> > u8 cxl_afu_cr_read8(struct cxl_afu *afu, int cr, u64 off);
> >
> > +ssize_t cxl_afu_read_err_buffer(struct cxl_afu *afu, char *buf,
> > + loff_t off, size_t count);
> > +
> >
> > struct cxl_calls {
> > void (*cxl_slbia)(struct mm_struct *mm);
> > diff --git a/drivers/misc/cxl/pci.c b/drivers/misc/cxl/pci.c
> > index 1ef0164..162a8fc 100644
> > --- a/drivers/misc/cxl/pci.c
> > +++ b/drivers/misc/cxl/pci.c
> > @@ -593,6 +593,22 @@ static int cxl_read_afu_descriptor(struct cxl_afu *afu)
> > afu->crs_len = AFUD_CR_LEN(val) * 256;
> > afu->crs_offset = AFUD_READ_CR_OFF(afu);
> >
> > +
> > + /* eb_len is in multiples of 4K */
> > + afu->eb_len = AFUD_EB_LEN(AFUD_READ_EB(afu)) * 4096;
> > + afu->eb_offset = AFUD_READ_EB_OFF(afu);
> > +
> > + /* eb_off is 4K aligned so lower 12 bits are always zero */
> > + if (EXTRACT_PPC_BITS(afu->eb_offset, 0, 11) != 0) {
> > + dev_warn(&afu->dev,
> > + "Invalid AFU error buffer offset %Lx\n",
> > + afu->eb_offset);
> > + dev_info(&afu->dev,
> > + "Ignoring AFU error buffer in the descriptor\n");
> > + /* indicate that no afu buffer exists */
> > + afu->eb_len = 0;
> > + }
> > +
> > return 0;
> > }
> >
> > @@ -672,6 +688,50 @@ static int sanitise_afu_regs(struct cxl_afu *afu)
> > return 0;
> > }
> >
> > +/*
> > + * afu_eb_read:
> > + * Called from sysfs and reads the afu error info buffer. The h/w only supports
> > + * 4/8 bytes aligned access. So most of the code tries to get around this by
> > + * reading full 8 bytes aligned chunks, copying it to a temp buffer and dropping
> > + * unneeded bytes at the beginning & the end of the requested region.
> > + */
> > +ssize_t cxl_afu_read_err_buffer(struct cxl_afu *afu, char *buf,
> > + loff_t off, size_t count)
> > +{
> > + u8 tbuff[8];
> > + const void __iomem *ebuf = afu->afu_desc_mmio + afu->eb_offset;
> > +
> > + count = min((size_t)(afu->eb_len - off), count);
> > +
> > + if (unlikely(count <= 0)) {
> > + /* handle case where no ebuf exists or offset out of bound */
> > + count = 0;
> > +
> > + } else if ((count >= 8) && IS_ALIGNED(off, 8)) {
> > + /* read all the intermediate aligned words */
> > +
> > + count = round_down(off + count, 8) - off;
> > + _memcpy_fromio(buf,
> > + ebuf + off, count);
> > +
> > + } else if (!IS_ALIGNED(off, 8)) {
> > + /* handle unaligned access at the beginning */
> > + _memcpy_fromio(tbuff, ebuf + round_down(off, 8), 8);
> > +
> > + count = min((size_t)(ALIGN(off, 8) - off), count);
> > + memcpy(buf, tbuff + (off & 0x7), count);
> > +
> > + } else {
> > + /* offset is aligned but count < 8 */
> > + _memcpy_fromio(tbuff, ebuf + round_down(off + count, 8), 8);
> > +
> > + count = (off + count) - round_down(off + count, 8);
> > + memcpy(buf, tbuff, count);
> > + }
>
> I still think this is too complex. How about something like this where
> we always use a copy buffer (completely untested):
>
> copy_size_max = PAGESIZE;
>
> ebuf_start = round_down(off, 8);
> ebuf_length = min(count + 16, copy_size_max); // copy extra for alignment at start and end
> count = min(count, copy_size_max); // Adjust for max copy length
> count = count - (off & 7); // Adjust for non aligned offset
>
> tbuff = __get_free_page(GFP_KERNEL);
>
> _memcpy_fromio(tbuff, ebuf_start, ebuf_length);
> memcpy(buf, tbuff + (off & 0x7), count); // grab what we need
>
> free_page(tbuff);
>
> return count;
Slightly updated version as there was a bug in the count calculation.
Still untested.
copy_size_max = PAGESIZE;
ebuf_start = round_down(off, 8);
ebuf_length = min(count + 16, copy_size_max); // copy extra for alignment at start and end
if ((count + (off & 7)) > copy_size_max)
/* adjust count if we go past copy_size_max */
count = copy_size_max - (off & 7);
tbuff = __get_free_page(GFP_KERNEL);
_memcpy_fromio(tbuff, ebuf_start, ebuf_length);
memcpy(buf, tbuff + (off & 0x7), count); // grab what we need
free_page(tbuff);
return count;
Mikey
>
> Mikey
>
>
> > +
> > + return count;
> > +}
> > +
> > static int cxl_init_afu(struct cxl *adapter, int slice, struct pci_dev *dev)
> > {
> > struct cxl_afu *afu;
> > diff --git a/drivers/misc/cxl/sysfs.c b/drivers/misc/cxl/sysfs.c
> > index d0c38c7..4942d55 100644
> > --- a/drivers/misc/cxl/sysfs.c
> > +++ b/drivers/misc/cxl/sysfs.c
> > @@ -356,6 +356,16 @@ static ssize_t api_version_compatible_show(struct device *device,
> > return scnprintf(buf, PAGE_SIZE, "%i\n", CXL_API_VERSION_COMPATIBLE);
> > }
> >
> > +static ssize_t afu_eb_read(struct file *filp, struct kobject *kobj,
> > + struct bin_attribute *bin_attr, char *buf,
> > + loff_t off, size_t count)
> > +{
> > + struct cxl_afu *afu = to_cxl_afu(container_of(kobj,
> > + struct device, kobj));
> > +
> > + return cxl_afu_read_err_buffer(afu, buf, off, count);
> > +}
> > +
> > static struct device_attribute afu_attrs[] = {
> > __ATTR_RO(mmio_size),
> > __ATTR_RO(irqs_min),
> > @@ -534,6 +544,10 @@ void cxl_sysfs_afu_remove(struct cxl_afu *afu)
> > struct afu_config_record *cr, *tmp;
> > int i;
> >
> > + /* remove the err buffer bin attribute */
> > + if (afu->eb_len)
> > + device_remove_bin_file(&afu->dev, &afu->attr_eb);
> > +
> > for (i = 0; i < ARRAY_SIZE(afu_attrs); i++)
> > device_remove_file(&afu->dev, &afu_attrs[i]);
> >
> > @@ -555,6 +569,22 @@ int cxl_sysfs_afu_add(struct cxl_afu *afu)
> > goto err;
> > }
> >
> > + /* conditionally create and add the binary file for error info buffer */
> > + if (afu->eb_len) {
> > + afu->attr_eb.attr.name = "afu_err_buff";
> > + afu->attr_eb.attr.mode = S_IRUGO;
> > + afu->attr_eb.size = afu->eb_len;
> > + afu->attr_eb.read = afu_eb_read;
> > +
> > + rc = device_create_bin_file(&afu->dev, &afu->attr_eb);
> > + if (rc) {
> > + dev_err(&afu->dev,
> > + "Unable to create eb attr for the afu. Err(%d)\n",
> > + rc);
> > + goto err;
> > + }
> > + }
> > +
> > for (i = 0; i < afu->crs_num; i++) {
> > cr = cxl_sysfs_afu_new_cr(afu, i);
> > if (IS_ERR(cr)) {
> > @@ -570,6 +600,9 @@ err1:
> > cxl_sysfs_afu_remove(afu);
> > return rc;
> > err:
> > + /* reset the eb_len as we haven't created the bin attr */
> > + afu->eb_len = 0;
> > +
> > for (i--; i >= 0; i--)
> > device_remove_file(&afu->dev, &afu_attrs[i]);
> > return rc;
>
More information about the Linuxppc-dev
mailing list