* [PATCH 4/6] mpt fusion: Fixing 1078 data corruption issue for 36GB memory region resubmitted with review suggestions included
@ 2008-05-20 19:30 Prakash, Sathya
2008-05-27 20:13 ` James Bottomley
0 siblings, 1 reply; 2+ messages in thread
From: Prakash, Sathya @ 2008-05-20 19:30 UTC (permalink / raw)
To: linux-scsi; +Cc: eric.moore
This patch is resubmitted with the changes suggested by James, except the usage of
dma_get_required_mask instead of dma_addr_t size. This change requires
additional modifications and will be submitted later as a seperate patch
---
The reason for this change is there is a data corruption when four
different physical memory regions in the 36GB to 37GB region are accessed.
This is only affecting 1078.
The solution is we need to use different addressing when filling in
the scatter gather table for the effected memory regions. So instead
of snooping on all four different memory holes, we treat any physical
addresses in the 36GB address with the same algorithm.
The fix is explained below
1) Ensure that the message frames are NOT located in the trouble
region. There is no remapping available for message frames, they must
be allocated outside the problem region.
2) Ensure that Sense buffers are NOT in the trouble region. There is
no remapping available.
3) Walk through the SGE entries and if any are inside the trouble
region then they need to be remapped as discussed below.
1) Set the Local Address bit in the SGE Flags field.
MPI_SGE_FLAGS_LOCAL_ADDRESS
2) Ensure we are using 64-bit SGEs
3) Set MSb (Bit 63) of the 64-bit address, this will indicate buffer
location is Host Memory.
Signed-off-by: Sathya Prakash <sathya.prakash@lsi.com>
---
diff --git a/drivers/message/fusion/mptbase.c b/drivers/message/fusion/mptbase.c
index ff9965d..f64f6b3 100644
--- a/drivers/message/fusion/mptbase.c
+++ b/drivers/message/fusion/mptbase.c
@@ -925,33 +925,75 @@ mpt_free_msg_frame(MPT_ADAPTER *ioc, MPT_FRAME_HDR *mf)
spin_unlock_irqrestore(&ioc->FreeQlock, flags);
}
+
/*=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=*/
/**
- * mpt_add_sge - Place a simple SGE at address pAddr.
- * @pAddr: virtual address for SGE
+ * mpt_add_sge - Place a simple 32 bit SGE at address addr.
+ * @addr: virtual address for SGE
* @flagslength: SGE flags and data transfer length
* @dma_addr: Physical address
- *
- * This routine places a MPT request frame back on the MPT adapter's
- * FreeQ.
*/
-void
-mpt_add_sge(char *pAddr, u32 flagslength, dma_addr_t dma_addr)
+static void
+mpt_add_sge(char *addr, u32 flagslength, dma_addr_t dma_addr)
{
- if (sizeof(dma_addr_t) == sizeof(u64)) {
- SGESimple64_t *pSge = (SGESimple64_t *) pAddr;
- u32 tmp = dma_addr & 0xFFFFFFFF;
+ SGESimple32_t *pSge = (SGESimple32_t *) addr;
+ pSge->FlagsLength = cpu_to_le32(flagslength);
+ pSge->Address = cpu_to_le32(dma_addr);
+}
- pSge->FlagsLength = cpu_to_le32(flagslength);
- pSge->Address.Low = cpu_to_le32(tmp);
- tmp = (u32) ((u64)dma_addr >> 32);
- pSge->Address.High = cpu_to_le32(tmp);
+/*=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=*/
+/**
+ * mpt_add_sge_64bit - Place a simple 64 bit SGE at address addr.
+ * @addr: virtual address for SGE
+ * @flagslength: SGE flags and data transfer length
+ * @dma_addr: Physical address
+ */
+static void
+mpt_add_sge_64bit(char *addr, u32 flagslength, dma_addr_t dma_addr)
+{
+ SGESimple64_t *pSge = (SGESimple64_t *) addr;
+ u32 tmp = dma_addr & 0xFFFFFFFF;
- } else {
- SGESimple32_t *pSge = (SGESimple32_t *) pAddr;
- pSge->FlagsLength = cpu_to_le32(flagslength);
- pSge->Address = cpu_to_le32(dma_addr);
- }
+ pSge->FlagsLength = cpu_to_le32(flagslength);
+ pSge->Address.Low = cpu_to_le32(tmp);
+ tmp = (u32) ((u64)dma_addr >> 32);
+ pSge->Address.High = cpu_to_le32(tmp);
+}
+
+/*=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=*/
+/**
+ * mpt_add_sge_64bit_1078 - Place a simple 64 bit SGE at address addr
+ * (1078 workaround).
+ * @addr: virtual address for SGE
+ * @flagslength: SGE flags and data transfer length
+ * @dma_addr: Physical address
+ */
+static void
+mpt_add_sge_64bit_1078(char *addr, u32 flagslength, dma_addr_t dma_addr)
+{
+ SGESimple64_t *pSge = (SGESimple64_t *) addr;
+ u32 tmp;
+
+ tmp = dma_addr & 0xFFFFFFFF;
+ pSge->Address.Low = cpu_to_le32(tmp);
+ tmp = (u32) ((u64)dma_addr >> 32);
+
+ /*
+ * 1078 errata workaround for the 36GB limitation
+ */
+ if ((((u64)dma_addr + MPI_SGE_LENGTH(flagslength)) >> 32) == 9) {
+ flagslength |=
+ MPI_SGE_SET_FLAGS(MPI_SGE_FLAGS_LOCAL_ADDRESS);
+ tmp |= (1<<31);
+ if (mpt_debug_level & MPT_DEBUG_36GB_MEM)
+ printk(KERN_DEBUG "1078 P0M2 addressing for "
+ "addr = 0x%llx len = %d\n",
+ (unsigned long long)dma_addr,
+ MPI_SGE_LENGTH(flagslength));
+ }
+
+ pSge->FlagsLength = cpu_to_le32(flagslength);
+ pSge->Address.High = cpu_to_le32(tmp);
}
/*=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=*/
@@ -1154,7 +1196,7 @@ mpt_host_page_alloc(MPT_ADAPTER *ioc, pIOCInit_t ioc_init)
}
flags_length = flags_length << MPI_SGE_FLAGS_SHIFT;
flags_length |= ioc->HostPageBuffer_sz;
- mpt_add_sge(psge, flags_length, ioc->HostPageBuffer_dma);
+ ioc->add_sge(psge, flags_length, ioc->HostPageBuffer_dma);
ioc->facts.HostPageBufferSGE = ioc_init->HostPageBufferSGE;
return 0;
@@ -1465,11 +1507,13 @@ mpt_mapresources(MPT_ADAPTER *ioc)
if (!pci_set_dma_mask(pdev, DMA_64BIT_MASK)
&& !pci_set_consistent_dma_mask(pdev, DMA_64BIT_MASK)) {
+ ioc->dma_mask = DMA_64BIT_MASK;
dinitprintk(ioc, printk(MYIOC_s_INFO_FMT
": 64 BIT PCI BUS DMA ADDRESSING SUPPORTED\n",
ioc->name));
} else if (!pci_set_dma_mask(pdev, DMA_32BIT_MASK)
&& !pci_set_consistent_dma_mask(pdev, DMA_32BIT_MASK)) {
+ ioc->dma_mask = DMA_32BIT_MASK;
dinitprintk(ioc, printk(MYIOC_s_INFO_FMT
": 32 BIT PCI BUS DMA ADDRESSING SUPPORTED\n",
ioc->name));
@@ -1573,6 +1617,17 @@ mpt_attach(struct pci_dev *pdev, const struct pci_device_id *id)
dinitprintk(ioc, printk(MYIOC_s_INFO_FMT ": mpt_adapter_install\n", ioc->name));
+ /*
+ * Setting up proper handlers for scatter gather handling
+ */
+ if (sizeof(dma_addr_t) == sizeof(u64)) {
+ if (pdev->device == MPI_MANUFACTPAGE_DEVID_SAS1078)
+ ioc->add_sge = &mpt_add_sge_64bit_1078;
+ else
+ ioc->add_sge = &mpt_add_sge_64bit;
+ } else
+ ioc->add_sge = &mpt_add_sge;
+
ioc->pcidev = pdev;
if (mpt_mapresources(ioc)) {
kfree(ioc);
@@ -3245,7 +3300,7 @@ mpt_do_upload(MPT_ADAPTER *ioc, int sleepFlag)
sgeoffset = sizeof(FWUpload_t) - sizeof(SGE_MPI_UNION) + sizeof(FWUploadTCSGE_t);
flagsLength = MPT_SGE_FLAGS_SSIMPLE_READ | sz;
- mpt_add_sge((char *)ptcsge, flagsLength, ioc->cached_fw_dma);
+ ioc->add_sge((char *)ptcsge, flagsLength, ioc->cached_fw_dma);
sgeoffset += sizeof(u32) + sizeof(dma_addr_t);
dinitprintk(ioc, printk(MYIOC_s_INFO_FMT ": Sending FW Upload (req @ %p) sgeoffset=%d \n",
@@ -4039,12 +4094,33 @@ PrimeIocFifos(MPT_ADAPTER *ioc)
dma_addr_t alloc_dma;
u8 *mem;
int i, reply_sz, sz, total_size, num_chain;
+ u64 dma_mask = 0;
/* Prime reply FIFO... */
if (ioc->reply_frames == NULL) {
if ( (num_chain = initChainBuffers(ioc)) < 0)
return -1;
+ /*
+ * 1078 errata workaround for the 36GB limitation
+ */
+ if (ioc->pcidev->device == MPI_MANUFACTPAGE_DEVID_SAS1078 &&
+ ioc->dma_mask > DMA_35BIT_MASK) {
+ if (!pci_set_dma_mask(ioc->pcidev, DMA_35BIT_MASK)
+ && !pci_set_consistent_dma_mask(ioc->pcidev,
+ DMA_35BIT_MASK)) {
+ dma_mask = DMA_35BIT_MASK;
+ d36memprintk(ioc, printk(MYIOC_s_DEBUG_FMT
+ "setting 35 bit addressing for "
+ "Request/Reply/Chain and Sense Buffers\n",
+ ioc->name));
+ } else {
+ d36memprintk(ioc, printk(MYIOC_s_DEBUG_FMT
+ "failed setting 35 bit addressing for "
+ "Request/Reply/Chain and Sense Buffers\n",
+ ioc->name));
+ }
+ }
total_size = reply_sz = (ioc->reply_sz * ioc->reply_depth);
dinitprintk(ioc, printk(MYIOC_s_DEBUG_FMT "ReplyBuffer sz=%d bytes, ReplyDepth=%d\n",
@@ -4183,6 +4259,12 @@ PrimeIocFifos(MPT_ADAPTER *ioc)
alloc_dma += ioc->reply_sz;
}
+ if (dma_mask == DMA_35BIT_MASK && !pci_set_dma_mask(ioc->pcidev,
+ DMA_64BIT_MASK) && !pci_set_consistent_dma_mask(ioc->pcidev,
+ DMA_64BIT_MASK))
+ d36memprintk(ioc, printk(MYIOC_s_DEBUG_FMT
+ "restoring 64 bit addressing\n", ioc->name));
+
return 0;
out_fail:
@@ -4202,6 +4284,13 @@ out_fail:
ioc->sense_buf_pool, ioc->sense_buf_pool_dma);
ioc->sense_buf_pool = NULL;
}
+
+ if (dma_mask == DMA_35BIT_MASK && !pci_set_dma_mask(ioc->pcidev,
+ DMA_64BIT_MASK) && !pci_set_consistent_dma_mask(ioc->pcidev,
+ DMA_64BIT_MASK))
+ d36memprintk(ioc, printk(MYIOC_s_DEBUG_FMT
+ "restoring 64 bit addressing\n", ioc->name));
+
return -1;
}
@@ -5805,7 +5894,7 @@ mpt_config(MPT_ADAPTER *ioc, CONFIGPARMS *pCfg)
ioc->name, pReq->Header.PageType, pReq->Header.PageNumber, pReq->Action));
}
- mpt_add_sge((char *)&pReq->PageBufferSGE, flagsLength, pCfg->physAddr);
+ ioc->add_sge((char *)&pReq->PageBufferSGE, flagsLength, pCfg->physAddr);
/* Append pCfg pointer to end of mf
*/
@@ -7465,7 +7554,6 @@ EXPORT_SYMBOL(mpt_get_msg_frame);
EXPORT_SYMBOL(mpt_put_msg_frame);
EXPORT_SYMBOL(mpt_put_msg_frame_hi_pri);
EXPORT_SYMBOL(mpt_free_msg_frame);
-EXPORT_SYMBOL(mpt_add_sge);
EXPORT_SYMBOL(mpt_send_handshake_request);
EXPORT_SYMBOL(mpt_verify_adapter);
EXPORT_SYMBOL(mpt_GetIocState);
diff --git a/drivers/message/fusion/mptbase.h b/drivers/message/fusion/mptbase.h
index c8671a3..56630c6 100644
--- a/drivers/message/fusion/mptbase.h
+++ b/drivers/message/fusion/mptbase.h
@@ -562,6 +562,8 @@ struct mptfc_rport_info
u8 flags;
};
+typedef void (*MPT_ADD_SGE)(char *addr, u32 flagslength, dma_addr_t dma_addr);
+
/*
* Adapter Structure - pci_dev specific. Maximum: MPT_MAX_ADAPTERS
*/
@@ -598,6 +600,8 @@ typedef struct _MPT_ADAPTER
int reply_depth; /* Num Allocated reply frames */
int reply_sz; /* Reply frame size */
int num_chain; /* Number of chain buffers */
+ MPT_ADD_SGE add_sge;
+ u64 dma_mask;
/* Pool of buffers for chaining. ReqToChain
* and ChainToChain track index of chain buffers.
* ChainBuffer (DMA) virt/phys addresses.
@@ -901,8 +905,6 @@ extern MPT_FRAME_HDR *mpt_get_msg_frame(u8 cb_idx, MPT_ADAPTER *ioc);
extern void mpt_free_msg_frame(MPT_ADAPTER *ioc, MPT_FRAME_HDR *mf);
extern void mpt_put_msg_frame(u8 cb_idx, MPT_ADAPTER *ioc, MPT_FRAME_HDR *mf);
extern void mpt_put_msg_frame_hi_pri(u8 cb_idx, MPT_ADAPTER *ioc, MPT_FRAME_HDR *mf);
-extern void mpt_add_sge(char *pAddr, u32 flagslength, dma_addr_t dma_addr);
-
extern int mpt_send_handshake_request(u8 cb_idx, MPT_ADAPTER *ioc, int reqBytes, u32 *req, int sleepFlag);
extern int mpt_verify_adapter(int iocid, MPT_ADAPTER **iocpp);
extern u32 mpt_GetIocState(MPT_ADAPTER *ioc, int cooked);
diff --git a/drivers/message/fusion/mptctl.c b/drivers/message/fusion/mptctl.c
index 68c844b..d43d606 100644
--- a/drivers/message/fusion/mptctl.c
+++ b/drivers/message/fusion/mptctl.c
@@ -871,7 +871,7 @@ mptctl_do_fw_download(int ioc, char __user *ufwbuf, size_t fwlen)
if (nib == 0 || nib == 3) {
;
} else if (sgIn->Address) {
- mpt_add_sge(sgOut, sgIn->FlagsLength, sgIn->Address);
+ iocp->add_sge(sgOut, sgIn->FlagsLength, sgIn->Address);
n++;
if (copy_from_user(bl->kptr, ufwbuf+fw_bytes_copied, bl->len)) {
printk(MYIOC_s_ERR_FMT "%s@%d::_ioctl_fwdl - "
@@ -2142,7 +2142,7 @@ mptctl_do_mpt_command (struct mpt_ioctl_command karg, void __user *mfPtr)
/* Set up this SGE.
* Copy to MF and to sglbuf
*/
- mpt_add_sge(psge, flagsLength, dma_addr_out);
+ ioc->add_sge(psge, flagsLength, dma_addr_out);
psge += (sizeof(u32) + sizeof(dma_addr_t));
/* Copy user data to kernel space.
@@ -2176,13 +2176,13 @@ mptctl_do_mpt_command (struct mpt_ioctl_command karg, void __user *mfPtr)
/* Set up this SGE
* Copy to MF and to sglbuf
*/
- mpt_add_sge(psge, flagsLength, dma_addr_in);
+ ioc->add_sge(psge, flagsLength, dma_addr_in);
}
}
} else {
/* Add a NULL SGE
*/
- mpt_add_sge(psge, flagsLength, (dma_addr_t) -1);
+ ioc->add_sge(psge, flagsLength, (dma_addr_t) -1);
}
ioc->ioctl->wait_done = 0;
@@ -2499,7 +2499,7 @@ mptctl_hp_hostinfo(unsigned long arg, unsigned int data_size)
pbuf = pci_alloc_consistent(ioc->pcidev, 4, &buf_dma);
if (!pbuf)
goto out;
- mpt_add_sge((char *)&IstwiRWRequest->SGL,
+ ioc->add_sge((char *)&IstwiRWRequest->SGL,
(MPT_SGE_FLAGS_SSIMPLE_READ|4), buf_dma);
ioc->ioctl->wait_done = 0;
diff --git a/drivers/message/fusion/mptdebug.h b/drivers/message/fusion/mptdebug.h
index 510b9f4..962ccbe 100644
--- a/drivers/message/fusion/mptdebug.h
+++ b/drivers/message/fusion/mptdebug.h
@@ -58,6 +58,7 @@
#define MPT_DEBUG_FC 0x00080000
#define MPT_DEBUG_SAS 0x00100000
#define MPT_DEBUG_SAS_WIDE 0x00200000
+#define MPT_DEBUG_36GB_MEM 0x00400000
/*
* CONFIG_FUSION_LOGGING - enabled in Kconfig
@@ -135,6 +136,8 @@
#define dsaswideprintk(IOC, CMD) \
MPT_CHECK_LOGGING(IOC, CMD, MPT_DEBUG_SAS_WIDE)
+#define d36memprintk(IOC, CMD) \
+ MPT_CHECK_LOGGING(IOC, CMD, MPT_DEBUG_36GB_MEM)
/*
diff --git a/drivers/message/fusion/mptsas.c b/drivers/message/fusion/mptsas.c
index 0cbb562..6d5cf68 100644
--- a/drivers/message/fusion/mptsas.c
+++ b/drivers/message/fusion/mptsas.c
@@ -1327,7 +1327,7 @@ static int mptsas_smp_handler(struct Scsi_Host *shost, struct sas_rphy *rphy,
req->data_len, PCI_DMA_BIDIRECTIONAL);
if (!dma_addr_out)
goto put_mf;
- mpt_add_sge(psge, flagsLength, dma_addr_out);
+ ioc->add_sge(psge, flagsLength, dma_addr_out);
psge += (sizeof(u32) + sizeof(dma_addr_t));
/* response */
@@ -1337,7 +1337,7 @@ static int mptsas_smp_handler(struct Scsi_Host *shost, struct sas_rphy *rphy,
rsp->data_len, PCI_DMA_BIDIRECTIONAL);
if (!dma_addr_in)
goto unmap;
- mpt_add_sge(psge, flagsLength, dma_addr_in);
+ ioc->add_sge(psge, flagsLength, dma_addr_in);
mpt_put_msg_frame(mptsasMgmtCtx, ioc, mf);
diff --git a/drivers/message/fusion/mptscsih.c b/drivers/message/fusion/mptscsih.c
index 63a5199..5297ad8 100644
--- a/drivers/message/fusion/mptscsih.c
+++ b/drivers/message/fusion/mptscsih.c
@@ -115,35 +115,6 @@ int mptscsih_resume(struct pci_dev *pdev);
/*=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=*/
/**
- * mptscsih_add_sge - Place a simple SGE at address pAddr.
- * @pAddr: virtual address for SGE
- * @flagslength: SGE flags and data transfer length
- * @dma_addr: Physical address
- *
- * This routine places a MPT request frame back on the MPT adapter's
- * FreeQ.
- */
-static inline void
-mptscsih_add_sge(char *pAddr, u32 flagslength, dma_addr_t dma_addr)
-{
- if (sizeof(dma_addr_t) == sizeof(u64)) {
- SGESimple64_t *pSge = (SGESimple64_t *) pAddr;
- u32 tmp = dma_addr & 0xFFFFFFFF;
-
- pSge->FlagsLength = cpu_to_le32(flagslength);
- pSge->Address.Low = cpu_to_le32(tmp);
- tmp = (u32) ((u64)dma_addr >> 32);
- pSge->Address.High = cpu_to_le32(tmp);
-
- } else {
- SGESimple32_t *pSge = (SGESimple32_t *) pAddr;
- pSge->FlagsLength = cpu_to_le32(flagslength);
- pSge->Address = cpu_to_le32(dma_addr);
- }
-} /* mptscsih_add_sge() */
-
-/*=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=*/
-/**
* mptscsih_add_chain - Place a chain SGE at address pAddr.
* @pAddr: virtual address for SGE
* @next: nextChainOffset value (u32's)
@@ -299,7 +270,7 @@ nextSGEset:
}
v2 = sg_dma_address(sg);
- mptscsih_add_sge(psge, sgflags | thisxfer, v2);
+ ioc->add_sge(psge, sgflags | thisxfer, v2);
sg = sg_next(sg); /* Get next SG element from the OS */
psge += (sizeof(u32) + sizeof(dma_addr_t));
@@ -320,7 +291,7 @@ nextSGEset:
thisxfer = sg_dma_len(sg);
v2 = sg_dma_address(sg);
- mptscsih_add_sge(psge, sgflags | thisxfer, v2);
+ ioc->add_sge(psge, sgflags | thisxfer, v2);
/*
sg = sg_next(sg);
psge += (sizeof(u32) + sizeof(dma_addr_t));
@@ -1448,8 +1419,8 @@ mptscsih_qcmd(struct scsi_cmnd *SCpnt, void (*done)(struct scsi_cmnd *))
*/
if (datalen == 0) {
/* Add a NULL SGE */
- mptscsih_add_sge((char *)&pScsiReq->SGL, MPT_SGE_FLAGS_SSIMPLE_READ | 0,
- (dma_addr_t) -1);
+ ioc->add_sge((char *)&pScsiReq->SGL,
+ MPT_SGE_FLAGS_SSIMPLE_READ | 0, (dma_addr_t) -1);
} else {
/* Add a 32 or 64 bit SGE */
if (mptscsih_AddSGE(ioc, SCpnt, pScsiReq, my_idx) != SUCCESS)
@@ -3202,11 +3173,11 @@ mptscsih_do_cmd(MPT_SCSI_HOST *hd, INTERNAL_CMD *io)
ioc->name, cmd, io->channel, io->id, io->lun));
if (dir == MPI_SCSIIO_CONTROL_READ) {
- mpt_add_sge((char *) &pScsiReq->SGL,
+ ioc->add_sge((char *) &pScsiReq->SGL,
MPT_SGE_FLAGS_SSIMPLE_READ | io->size,
io->data_dma);
} else {
- mpt_add_sge((char *) &pScsiReq->SGL,
+ ioc->add_sge((char *) &pScsiReq->SGL,
MPT_SGE_FLAGS_SSIMPLE_WRITE | io->size,
io->data_dma);
}
diff --git a/drivers/message/fusion/mptspi.c b/drivers/message/fusion/mptspi.c
index 1cdea1a..bd3a3be 100644
--- a/drivers/message/fusion/mptspi.c
+++ b/drivers/message/fusion/mptspi.c
@@ -300,7 +300,7 @@ mptspi_writeIOCPage4(MPT_SCSI_HOST *hd, u8 channel , u8 id)
flagsLength = MPT_SGE_FLAGS_SSIMPLE_WRITE |
(IOCPage4Ptr->Header.PageLength + ii) * 4;
- mpt_add_sge((char *)&pReq->PageBufferSGE, flagsLength, dataDma);
+ ioc->add_sge((char *)&pReq->PageBufferSGE, flagsLength, dataDma);
ddvprintk(ioc, printk(MYIOC_s_DEBUG_FMT
"writeIOCPage4: MaxSEP=%d ActiveSEP=%d id=%d bus=%d\n",
@@ -642,7 +642,7 @@ mptscsih_quiesce_raid(MPT_SCSI_HOST *hd, int quiesce, u8 channel, u8 id)
pReq->Reserved2 = 0;
pReq->ActionDataWord = 0; /* Reserved for this action */
- mpt_add_sge((char *)&pReq->ActionDataSGE,
+ ioc->add_sge((char *)&pReq->ActionDataSGE,
MPT_SGE_FLAGS_SSIMPLE_READ | 0, (dma_addr_t) -1);
ddvprintk(ioc, printk(MYIOC_s_DEBUG_FMT "RAID Volume action=%x channel=%d id=%d\n",
^ permalink raw reply related [flat|nested] 2+ messages in thread
* Re: [PATCH 4/6] mpt fusion: Fixing 1078 data corruption issue for 36GB memory region resubmitted with review suggestions included
2008-05-20 19:30 [PATCH 4/6] mpt fusion: Fixing 1078 data corruption issue for 36GB memory region resubmitted with review suggestions included Prakash, Sathya
@ 2008-05-27 20:13 ` James Bottomley
0 siblings, 0 replies; 2+ messages in thread
From: James Bottomley @ 2008-05-27 20:13 UTC (permalink / raw)
To: Prakash, Sathya; +Cc: linux-scsi, eric.moore
On Wed, 2008-05-21 at 01:00 +0530, Prakash, Sathya wrote:
> This patch is resubmitted with the changes suggested by James, except the usage of
> dma_get_required_mask instead of dma_addr_t size.
I thought you said it was slightly more efficient to use the 32 bit
addressing mode? So it should be slightly more efficient to use the 32
bit mode even on 64 bit kernels as long as all memory is < 4GB.
> This change requires
> additional modifications and will be submitted later as a seperate patch
So that means this 4/6 can't go in now? but 5/6 and 6/6 are OK (since I
can't see anything in 5 or 6 which is relevant to this)?
Also, just a note about the replacement of a 3 way 'if' that always
takes the same branch with a function pointer: in general, function
pointers are less efficient because they destroy pipelining and
speculation. A simple branch might be better (particularly in this case
where the prediction should always get it right since the logic value
doesn't alter). However, the CPUs that suffer most from this are the
long pipeline ones like ia64 and parisc, I suspect the effect is much
more marginal on x86.
> ---
>
> The reason for this change is there is a data corruption when four
> different physical memory regions in the 36GB to 37GB region are accessed.
> This is only affecting 1078.
>
> The solution is we need to use different addressing when filling in
> the scatter gather table for the effected memory regions. So instead
> of snooping on all four different memory holes, we treat any physical
> addresses in the 36GB address with the same algorithm.
>
> The fix is explained below
> 1) Ensure that the message frames are NOT located in the trouble
> region. There is no remapping available for message frames, they must
> be allocated outside the problem region.
> 2) Ensure that Sense buffers are NOT in the trouble region. There is
> no remapping available.
> 3) Walk through the SGE entries and if any are inside the trouble
> region then they need to be remapped as discussed below.
> 1) Set the Local Address bit in the SGE Flags field.
> MPI_SGE_FLAGS_LOCAL_ADDRESS
> 2) Ensure we are using 64-bit SGEs
> 3) Set MSb (Bit 63) of the 64-bit address, this will indicate buffer
> location is Host Memory.
>
> Signed-off-by: Sathya Prakash <sathya.prakash@lsi.com>
> ---
>
> diff --git a/drivers/message/fusion/mptbase.c b/drivers/message/fusion/mptbase.c
> index ff9965d..f64f6b3 100644
> --- a/drivers/message/fusion/mptbase.c
> +++ b/drivers/message/fusion/mptbase.c
> @@ -925,33 +925,75 @@ mpt_free_msg_frame(MPT_ADAPTER *ioc, MPT_FRAME_HDR *mf)
> spin_unlock_irqrestore(&ioc->FreeQlock, flags);
> }
>
> +
> /*=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=*/
> /**
> - * mpt_add_sge - Place a simple SGE at address pAddr.
> - * @pAddr: virtual address for SGE
> + * mpt_add_sge - Place a simple 32 bit SGE at address addr.
> + * @addr: virtual address for SGE
> * @flagslength: SGE flags and data transfer length
> * @dma_addr: Physical address
> - *
> - * This routine places a MPT request frame back on the MPT adapter's
> - * FreeQ.
> */
> -void
> -mpt_add_sge(char *pAddr, u32 flagslength, dma_addr_t dma_addr)
> +static void
> +mpt_add_sge(char *addr, u32 flagslength, dma_addr_t dma_addr)
if you used void * instead of char * here, you wouldn't need to do all
the recasting (both into and out of this function). Since you get
absolutely zero type safety from any of this, I think void * makes a lot
more sense and is much more readable.
> {
> - if (sizeof(dma_addr_t) == sizeof(u64)) {
> - SGESimple64_t *pSge = (SGESimple64_t *) pAddr;
> - u32 tmp = dma_addr & 0xFFFFFFFF;
> + SGESimple32_t *pSge = (SGESimple32_t *) addr;
> + pSge->FlagsLength = cpu_to_le32(flagslength);
> + pSge->Address = cpu_to_le32(dma_addr);
> +}
>
> - pSge->FlagsLength = cpu_to_le32(flagslength);
> - pSge->Address.Low = cpu_to_le32(tmp);
> - tmp = (u32) ((u64)dma_addr >> 32);
> - pSge->Address.High = cpu_to_le32(tmp);
> +/*=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=*/
> +/**
> + * mpt_add_sge_64bit - Place a simple 64 bit SGE at address addr.
> + * @addr: virtual address for SGE
> + * @flagslength: SGE flags and data transfer length
> + * @dma_addr: Physical address
> + */
> +static void
> +mpt_add_sge_64bit(char *addr, u32 flagslength, dma_addr_t dma_addr)
> +{
> + SGESimple64_t *pSge = (SGESimple64_t *) addr;
> + u32 tmp = dma_addr & 0xFFFFFFFF;
>
> - } else {
> - SGESimple32_t *pSge = (SGESimple32_t *) pAddr;
> - pSge->FlagsLength = cpu_to_le32(flagslength);
> - pSge->Address = cpu_to_le32(dma_addr);
> - }
> + pSge->FlagsLength = cpu_to_le32(flagslength);
> + pSge->Address.Low = cpu_to_le32(tmp);
> + tmp = (u32) ((u64)dma_addr >> 32);
Use the macro upper_32_bits() here.
> + pSge->Address.High = cpu_to_le32(tmp);
> +}
> +
> +/*=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=*/
> +/**
> + * mpt_add_sge_64bit_1078 - Place a simple 64 bit SGE at address addr
> + * (1078 workaround).
> + * @addr: virtual address for SGE
> + * @flagslength: SGE flags and data transfer length
> + * @dma_addr: Physical address
> + */
> +static void
> +mpt_add_sge_64bit_1078(char *addr, u32 flagslength, dma_addr_t dma_addr)
> +{
> + SGESimple64_t *pSge = (SGESimple64_t *) addr;
> + u32 tmp;
> +
> + tmp = dma_addr & 0xFFFFFFFF;
> + pSge->Address.Low = cpu_to_le32(tmp);
> + tmp = (u32) ((u64)dma_addr >> 32);
upper_32_bits() again.
> + /*
> + * 1078 errata workaround for the 36GB limitation
> + */
> + if ((((u64)dma_addr + MPI_SGE_LENGTH(flagslength)) >> 32) == 9) {
> + flagslength |=
> + MPI_SGE_SET_FLAGS(MPI_SGE_FLAGS_LOCAL_ADDRESS);
> + tmp |= (1<<31);
> + if (mpt_debug_level & MPT_DEBUG_36GB_MEM)
> + printk(KERN_DEBUG "1078 P0M2 addressing for "
> + "addr = 0x%llx len = %d\n",
> + (unsigned long long)dma_addr,
> + MPI_SGE_LENGTH(flagslength));
> + }
> +
> + pSge->FlagsLength = cpu_to_le32(flagslength);
> + pSge->Address.High = cpu_to_le32(tmp);
> }
>
> /*=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=*/
> @@ -1154,7 +1196,7 @@ mpt_host_page_alloc(MPT_ADAPTER *ioc, pIOCInit_t ioc_init)
> }
> flags_length = flags_length << MPI_SGE_FLAGS_SHIFT;
> flags_length |= ioc->HostPageBuffer_sz;
> - mpt_add_sge(psge, flags_length, ioc->HostPageBuffer_dma);
> + ioc->add_sge(psge, flags_length, ioc->HostPageBuffer_dma);
> ioc->facts.HostPageBufferSGE = ioc_init->HostPageBufferSGE;
>
> return 0;
> @@ -1465,11 +1507,13 @@ mpt_mapresources(MPT_ADAPTER *ioc)
>
> if (!pci_set_dma_mask(pdev, DMA_64BIT_MASK)
> && !pci_set_consistent_dma_mask(pdev, DMA_64BIT_MASK)) {
> + ioc->dma_mask = DMA_64BIT_MASK;
> dinitprintk(ioc, printk(MYIOC_s_INFO_FMT
> ": 64 BIT PCI BUS DMA ADDRESSING SUPPORTED\n",
> ioc->name));
> } else if (!pci_set_dma_mask(pdev, DMA_32BIT_MASK)
> && !pci_set_consistent_dma_mask(pdev, DMA_32BIT_MASK)) {
> + ioc->dma_mask = DMA_32BIT_MASK;
> dinitprintk(ioc, printk(MYIOC_s_INFO_FMT
> ": 32 BIT PCI BUS DMA ADDRESSING SUPPORTED\n",
> ioc->name));
> @@ -1573,6 +1617,17 @@ mpt_attach(struct pci_dev *pdev, const struct pci_device_id *id)
>
> dinitprintk(ioc, printk(MYIOC_s_INFO_FMT ": mpt_adapter_install\n", ioc->name));
>
> + /*
> + * Setting up proper handlers for scatter gather handling
> + */
> + if (sizeof(dma_addr_t) == sizeof(u64)) {
> + if (pdev->device == MPI_MANUFACTPAGE_DEVID_SAS1078)
> + ioc->add_sge = &mpt_add_sge_64bit_1078;
> + else
> + ioc->add_sge = &mpt_add_sge_64bit;
> + } else
> + ioc->add_sge = &mpt_add_sge;
> +
> ioc->pcidev = pdev;
> if (mpt_mapresources(ioc)) {
> kfree(ioc);
> @@ -3245,7 +3300,7 @@ mpt_do_upload(MPT_ADAPTER *ioc, int sleepFlag)
> sgeoffset = sizeof(FWUpload_t) - sizeof(SGE_MPI_UNION) + sizeof(FWUploadTCSGE_t);
>
> flagsLength = MPT_SGE_FLAGS_SSIMPLE_READ | sz;
> - mpt_add_sge((char *)ptcsge, flagsLength, ioc->cached_fw_dma);
> + ioc->add_sge((char *)ptcsge, flagsLength, ioc->cached_fw_dma);
>
> sgeoffset += sizeof(u32) + sizeof(dma_addr_t);
> dinitprintk(ioc, printk(MYIOC_s_INFO_FMT ": Sending FW Upload (req @ %p) sgeoffset=%d \n",
> @@ -4039,12 +4094,33 @@ PrimeIocFifos(MPT_ADAPTER *ioc)
> dma_addr_t alloc_dma;
> u8 *mem;
> int i, reply_sz, sz, total_size, num_chain;
> + u64 dma_mask = 0;
>
> /* Prime reply FIFO... */
>
> if (ioc->reply_frames == NULL) {
> if ( (num_chain = initChainBuffers(ioc)) < 0)
> return -1;
> + /*
> + * 1078 errata workaround for the 36GB limitation
> + */
> + if (ioc->pcidev->device == MPI_MANUFACTPAGE_DEVID_SAS1078 &&
> + ioc->dma_mask > DMA_35BIT_MASK) {
> + if (!pci_set_dma_mask(ioc->pcidev, DMA_35BIT_MASK)
> + && !pci_set_consistent_dma_mask(ioc->pcidev,
> + DMA_35BIT_MASK)) {
> + dma_mask = DMA_35BIT_MASK;
> + d36memprintk(ioc, printk(MYIOC_s_DEBUG_FMT
> + "setting 35 bit addressing for "
> + "Request/Reply/Chain and Sense Buffers\n",
> + ioc->name));
> + } else {
> + d36memprintk(ioc, printk(MYIOC_s_DEBUG_FMT
> + "failed setting 35 bit addressing for "
> + "Request/Reply/Chain and Sense Buffers\n",
> + ioc->name));
This is a pretty serious failure isn't it? Doesn't it mean that the
sense buffer for the device becomes unusable if it's placed in the wrong
memory and so the device is potentially inoperable? It would seem that
some action stronger than a debug message might be required.
> + }
> + }
>
> total_size = reply_sz = (ioc->reply_sz * ioc->reply_depth);
> dinitprintk(ioc, printk(MYIOC_s_DEBUG_FMT "ReplyBuffer sz=%d bytes, ReplyDepth=%d\n",
> @@ -4183,6 +4259,12 @@ PrimeIocFifos(MPT_ADAPTER *ioc)
> alloc_dma += ioc->reply_sz;
> }
>
> + if (dma_mask == DMA_35BIT_MASK && !pci_set_dma_mask(ioc->pcidev,
> + DMA_64BIT_MASK) && !pci_set_consistent_dma_mask(ioc->pcidev,
> + DMA_64BIT_MASK))
> + d36memprintk(ioc, printk(MYIOC_s_DEBUG_FMT
> + "restoring 64 bit addressing\n", ioc->name));
> +
> return 0;
>
> out_fail:
> @@ -4202,6 +4284,13 @@ out_fail:
> ioc->sense_buf_pool, ioc->sense_buf_pool_dma);
> ioc->sense_buf_pool = NULL;
> }
> +
> + if (dma_mask == DMA_35BIT_MASK && !pci_set_dma_mask(ioc->pcidev,
> + DMA_64BIT_MASK) && !pci_set_consistent_dma_mask(ioc->pcidev,
> + DMA_64BIT_MASK))
> + d36memprintk(ioc, printk(MYIOC_s_DEBUG_FMT
> + "restoring 64 bit addressing\n", ioc->name));
> +
> return -1;
> }
>
> @@ -5805,7 +5894,7 @@ mpt_config(MPT_ADAPTER *ioc, CONFIGPARMS *pCfg)
> ioc->name, pReq->Header.PageType, pReq->Header.PageNumber, pReq->Action));
> }
>
> - mpt_add_sge((char *)&pReq->PageBufferSGE, flagsLength, pCfg->physAddr);
> + ioc->add_sge((char *)&pReq->PageBufferSGE, flagsLength, pCfg->physAddr);
>
> /* Append pCfg pointer to end of mf
> */
> @@ -7465,7 +7554,6 @@ EXPORT_SYMBOL(mpt_get_msg_frame);
> EXPORT_SYMBOL(mpt_put_msg_frame);
> EXPORT_SYMBOL(mpt_put_msg_frame_hi_pri);
> EXPORT_SYMBOL(mpt_free_msg_frame);
> -EXPORT_SYMBOL(mpt_add_sge);
> EXPORT_SYMBOL(mpt_send_handshake_request);
> EXPORT_SYMBOL(mpt_verify_adapter);
> EXPORT_SYMBOL(mpt_GetIocState);
> diff --git a/drivers/message/fusion/mptbase.h b/drivers/message/fusion/mptbase.h
> index c8671a3..56630c6 100644
> --- a/drivers/message/fusion/mptbase.h
> +++ b/drivers/message/fusion/mptbase.h
> @@ -562,6 +562,8 @@ struct mptfc_rport_info
> u8 flags;
> };
>
> +typedef void (*MPT_ADD_SGE)(char *addr, u32 flagslength, dma_addr_t dma_addr);
> +
> /*
> * Adapter Structure - pci_dev specific. Maximum: MPT_MAX_ADAPTERS
> */
> @@ -598,6 +600,8 @@ typedef struct _MPT_ADAPTER
> int reply_depth; /* Num Allocated reply frames */
> int reply_sz; /* Reply frame size */
> int num_chain; /* Number of chain buffers */
> + MPT_ADD_SGE add_sge;
> + u64 dma_mask;
Can we not do this ... as I said before, there doesn't seem to be any
reason not to use ioc->pcidev->dma_mask.
James
^ permalink raw reply [flat|nested] 2+ messages in thread
end of thread, other threads:[~2008-05-27 20:13 UTC | newest]
Thread overview: 2+ messages (download: mbox.gz follow: Atom feed
-- links below jump to the message on this page --
2008-05-20 19:30 [PATCH 4/6] mpt fusion: Fixing 1078 data corruption issue for 36GB memory region resubmitted with review suggestions included Prakash, Sathya
2008-05-27 20:13 ` James Bottomley
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).