From: Ben Chuang <benchuanggli@gmail.com>
To: Jason Lai <jasonlai.genesyslogic@gmail.com>
Cc: Ulf Hansson <ulf.hansson@linaro.org>,
Adrian Hunter <adrian.hunter@intel.com>,
linux-mmc <linux-mmc@vger.kernel.org>,
Ben Chuang <ben.chuang@genesyslogic.com.tw>,
greg.tu@genesyslogic.com.tw, SeanHY.chen@genesyslogic.com.tw,
jason.lai@genesyslogic.com.tw, victor.shih@genesyslogic.com.tw,
Renius Chen <reniuschengl@gmail.com>
Subject: Re: [PATCH] mmc: sdhci-pci-gli: Improve Random 4K Read Performance of GL9763E
Date: Thu, 26 May 2022 09:14:47 +0800 [thread overview]
Message-ID: <CACT4zj9F7J3NgFMK7sG1aL19Y12zrPejPuD2ZEhwKYf0oosEVQ@mail.gmail.com> (raw)
In-Reply-To: <20220525122754.6837-1-jasonlai.genesyslogic@gmail.com>
Hi Jason,
Please check your codebase because the patch removed the gl97[50|55]
ssc patches.
Thanks,
Ben
On Wed, May 25, 2022 at 11:48 PM Jason Lai
<jasonlai.genesyslogic@gmail.com> wrote:
>
> This patch is based on patch [1] and remove data transfer length
> checking.
>
> Due to flaws in hardware design, GL9763E takes long time to exit from L1
> state. The I/O performance will suffer severe impact if it often enter
> and exit L1 state.
>
> Unfortunately, entering and exiting L1 state is signal handshake in
> physical layer, software knows nothiong about it. The only way to stop
> entering L1 state is to disable hardware LPM negotiation on GL9763E.
>
> To improve read performance and take battery life into account, we reject
> L1 negotiation while executing MMC_READ_MULTIPLE_BLOCK command and enable L1
> negotiation again when receiving non-MMC_READ_MULTIPLE_BLOCK command.
>
> [1]
> https://patchwork.kernel.org/project/linux-mmc/list/?series=510801&archive
> =both
>
> Signed-off-by: Renius Chen <reniuschengl@gmail.com>
> Signed-off-by: Jason Lai <jason.lai@genesyslogic.com.tw>
> ---
> drivers/mmc/host/sdhci-pci-gli.c | 193 ++++++++++---------------------
> 1 file changed, 63 insertions(+), 130 deletions(-)
>
> diff --git a/drivers/mmc/host/sdhci-pci-gli.c b/drivers/mmc/host/sdhci-pci-gli.c
> index d09728c37d03..0c5aac8047f8 100644
> --- a/drivers/mmc/host/sdhci-pci-gli.c
> +++ b/drivers/mmc/host/sdhci-pci-gli.c
> @@ -13,7 +13,6 @@
> #include <linux/mmc/mmc.h>
> #include <linux/delay.h>
> #include <linux/of.h>
> -#include <linux/iopoll.h>
> #include "sdhci.h"
> #include "sdhci-pci.h"
> #include "cqhci.h"
> @@ -64,7 +63,6 @@
> #define GLI_9750_MISC_RX_INV_OFF 0x0
> #define GLI_9750_MISC_RX_INV_VALUE GLI_9750_MISC_RX_INV_OFF
> #define GLI_9750_MISC_TX1_DLY_VALUE 0x5
> -#define SDHCI_GLI_9750_MISC_SSC_OFF BIT(26)
>
> #define SDHCI_GLI_9750_TUNING_CONTROL 0x540
> #define SDHCI_GLI_9750_TUNING_CONTROL_EN BIT(4)
> @@ -95,9 +93,12 @@
> #define PCIE_GLI_9763E_SCR 0x8E0
> #define GLI_9763E_SCR_AXI_REQ BIT(9)
>
> +#define PCIE_GLI_9763E_CFG 0x8A0
> +#define GLI_9763E_CFG_LPSN_DIS BIT(12)
> +
> #define PCIE_GLI_9763E_CFG2 0x8A4
> #define GLI_9763E_CFG2_L1DLY GENMASK(28, 19)
> -#define GLI_9763E_CFG2_L1DLY_MID 0x54
> +#define GLI_9763E_CFG2_L1DLY_MID 0x54 // Set L1 entry delay time to 21us
>
> #define PCIE_GLI_9763E_MMC_CTRL 0x960
> #define GLI_9763E_HS400_SLOW BIT(3)
> @@ -139,11 +140,12 @@
> #define PCI_GLI_9755_SerDes 0x70
> #define PCI_GLI_9755_SCP_DIS BIT(19)
>
> -#define PCI_GLI_9755_MISC 0x78
> -#define PCI_GLI_9755_MISC_SSC_OFF BIT(26)
> -
> #define GLI_MAX_TUNING_LOOP 40
>
> +struct gli_host {
> + bool lpm_negotiation_enabled;
> +};
> +
> /* Genesys Logic chipset */
> static inline void gl9750_wt_on(struct sdhci_host *host)
> {
> @@ -376,19 +378,6 @@ static void gl9750_set_pll(struct sdhci_host *host, u8 dir, u16 ldiv, u8 pdiv)
> mdelay(1);
> }
>
> -static bool gl9750_ssc_enable(struct sdhci_host *host)
> -{
> - u32 misc;
> - u8 off;
> -
> - gl9750_wt_on(host);
> - misc = sdhci_readl(host, SDHCI_GLI_9750_MISC);
> - off = FIELD_GET(SDHCI_GLI_9750_MISC_SSC_OFF, misc);
> - gl9750_wt_off(host);
> -
> - return !off;
> -}
> -
> static void gl9750_set_ssc(struct sdhci_host *host, u8 enable, u8 step, u16 ppm)
> {
> u32 pll;
> @@ -410,31 +399,11 @@ static void gl9750_set_ssc(struct sdhci_host *host, u8 enable, u8 step, u16 ppm)
>
> static void gl9750_set_ssc_pll_205mhz(struct sdhci_host *host)
> {
> - bool enable = gl9750_ssc_enable(host);
> -
> - /* set pll to 205MHz and ssc */
> - gl9750_set_ssc(host, enable, 0xF, 0x5A1D);
> + /* set pll to 205MHz and enable ssc */
> + gl9750_set_ssc(host, 0x1, 0x1F, 0xFFE7);
> gl9750_set_pll(host, 0x1, 0x246, 0x0);
> }
>
> -static void gl9750_set_ssc_pll_100mhz(struct sdhci_host *host)
> -{
> - bool enable = gl9750_ssc_enable(host);
> -
> - /* set pll to 100MHz and ssc */
> - gl9750_set_ssc(host, enable, 0xE, 0x51EC);
> - gl9750_set_pll(host, 0x1, 0x244, 0x1);
> -}
> -
> -static void gl9750_set_ssc_pll_50mhz(struct sdhci_host *host)
> -{
> - bool enable = gl9750_ssc_enable(host);
> -
> - /* set pll to 50MHz and ssc */
> - gl9750_set_ssc(host, enable, 0xE, 0x51EC);
> - gl9750_set_pll(host, 0x1, 0x244, 0x3);
> -}
> -
> static void sdhci_gl9750_set_clock(struct sdhci_host *host, unsigned int clock)
> {
> struct mmc_ios *ios = &host->mmc->ios;
> @@ -452,10 +421,6 @@ static void sdhci_gl9750_set_clock(struct sdhci_host *host, unsigned int clock)
> if (clock == 200000000 && ios->timing == MMC_TIMING_UHS_SDR104) {
> host->mmc->actual_clock = 205000000;
> gl9750_set_ssc_pll_205mhz(host);
> - } else if (clock == 100000000) {
> - gl9750_set_ssc_pll_100mhz(host);
> - } else if (clock == 50000000) {
> - gl9750_set_ssc_pll_50mhz(host);
> }
>
> sdhci_enable_clk(host, clk);
> @@ -556,19 +521,6 @@ static void gl9755_set_pll(struct pci_dev *pdev, u8 dir, u16 ldiv, u8 pdiv)
> mdelay(1);
> }
>
> -static bool gl9755_ssc_enable(struct pci_dev *pdev)
> -{
> - u32 misc;
> - u8 off;
> -
> - gl9755_wt_on(pdev);
> - pci_read_config_dword(pdev, PCI_GLI_9755_MISC, &misc);
> - off = FIELD_GET(PCI_GLI_9755_MISC_SSC_OFF, misc);
> - gl9755_wt_off(pdev);
> -
> - return !off;
> -}
> -
> static void gl9755_set_ssc(struct pci_dev *pdev, u8 enable, u8 step, u16 ppm)
> {
> u32 pll;
> @@ -590,31 +542,11 @@ static void gl9755_set_ssc(struct pci_dev *pdev, u8 enable, u8 step, u16 ppm)
>
> static void gl9755_set_ssc_pll_205mhz(struct pci_dev *pdev)
> {
> - bool enable = gl9755_ssc_enable(pdev);
> -
> - /* set pll to 205MHz and ssc */
> - gl9755_set_ssc(pdev, enable, 0xF, 0x5A1D);
> + /* set pll to 205MHz and enable ssc */
> + gl9755_set_ssc(pdev, 0x1, 0x1F, 0xFFE7);
> gl9755_set_pll(pdev, 0x1, 0x246, 0x0);
> }
>
> -static void gl9755_set_ssc_pll_100mhz(struct pci_dev *pdev)
> -{
> - bool enable = gl9755_ssc_enable(pdev);
> -
> - /* set pll to 100MHz and ssc */
> - gl9755_set_ssc(pdev, enable, 0xE, 0x51EC);
> - gl9755_set_pll(pdev, 0x1, 0x244, 0x1);
> -}
> -
> -static void gl9755_set_ssc_pll_50mhz(struct pci_dev *pdev)
> -{
> - bool enable = gl9755_ssc_enable(pdev);
> -
> - /* set pll to 50MHz and ssc */
> - gl9755_set_ssc(pdev, enable, 0xE, 0x51EC);
> - gl9755_set_pll(pdev, 0x1, 0x244, 0x3);
> -}
> -
> static void sdhci_gl9755_set_clock(struct sdhci_host *host, unsigned int clock)
> {
> struct sdhci_pci_slot *slot = sdhci_priv(host);
> @@ -635,10 +567,6 @@ static void sdhci_gl9755_set_clock(struct sdhci_host *host, unsigned int clock)
> if (clock == 200000000 && ios->timing == MMC_TIMING_UHS_SDR104) {
> host->mmc->actual_clock = 205000000;
> gl9755_set_ssc_pll_205mhz(pdev);
> - } else if (clock == 100000000) {
> - gl9755_set_ssc_pll_100mhz(pdev);
> - } else if (clock == 50000000) {
> - gl9755_set_ssc_pll_50mhz(pdev);
> }
>
> sdhci_enable_clk(host, clk);
> @@ -818,6 +746,53 @@ static void sdhci_gl9763e_dumpregs(struct mmc_host *mmc)
> sdhci_dumpregs(mmc_priv(mmc));
> }
>
> +static void gl9763e_set_low_power_negotiation(struct sdhci_pci_slot *slot, bool enable)
> +{
> + struct pci_dev *pdev = slot->chip->pdev;
> + u32 value;
> +
> + pci_read_config_dword(pdev, PCIE_GLI_9763E_VHS, &value);
> + value &= ~GLI_9763E_VHS_REV;
> + value |= FIELD_PREP(GLI_9763E_VHS_REV, GLI_9763E_VHS_REV_W);
> + pci_write_config_dword(pdev, PCIE_GLI_9763E_VHS, value);
> +
> + pci_read_config_dword(pdev, PCIE_GLI_9763E_CFG, &value);
> +
> + if (enable)
> + value &= ~GLI_9763E_CFG_LPSN_DIS;
> + else
> + value |= GLI_9763E_CFG_LPSN_DIS;
> +
> + pci_write_config_dword(pdev, PCIE_GLI_9763E_CFG, value);
> +
> + pci_read_config_dword(pdev, PCIE_GLI_9763E_VHS, &value);
> + value &= ~GLI_9763E_VHS_REV;
> + value |= FIELD_PREP(GLI_9763E_VHS_REV, GLI_9763E_VHS_REV_R);
> + pci_write_config_dword(pdev, PCIE_GLI_9763E_VHS, value);
> +}
> +
> +static void gl9763e_request(struct mmc_host *mmc, struct mmc_request *mrq)
> +{
> + struct sdhci_host *host = mmc_priv(mmc);
> + struct mmc_command *cmd;
> + struct sdhci_pci_slot *slot = sdhci_priv(host);
> + struct gli_host *gli_host = sdhci_pci_priv(slot);
> +
> + cmd = mrq->cmd;
> +
> + if (cmd && (cmd->opcode == MMC_READ_MULTIPLE_BLOCK) && gli_host->lpm_negotiation_enabled) {
> + gl9763e_set_low_power_negotiation(slot, false);
> + gli_host->lpm_negotiation_enabled = false;
> + } else {
> + if (gli_host->lpm_negotiation_enabled == false) {
> + gl9763e_set_low_power_negotiation(slot, true);
> + gli_host->lpm_negotiation_enabled = true;
> + }
> + }
> +
> + sdhci_request(mmc, mrq);
> +}
> +
> static void sdhci_gl9763e_cqe_pre_enable(struct mmc_host *mmc)
> {
> struct cqhci_host *cq_host = mmc->cqe_private;
> @@ -952,47 +927,6 @@ static void gli_set_gl9763e(struct sdhci_pci_slot *slot)
> pci_write_config_dword(pdev, PCIE_GLI_9763E_VHS, value);
> }
>
> -#ifdef CONFIG_PM
> -static int gl9763e_runtime_suspend(struct sdhci_pci_chip *chip)
> -{
> - struct sdhci_pci_slot *slot = chip->slots[0];
> - struct sdhci_host *host = slot->host;
> - u16 clock;
> -
> - clock = sdhci_readw(host, SDHCI_CLOCK_CONTROL);
> - clock &= ~(SDHCI_CLOCK_PLL_EN | SDHCI_CLOCK_CARD_EN);
> - sdhci_writew(host, clock, SDHCI_CLOCK_CONTROL);
> -
> - return 0;
> -}
> -
> -static int gl9763e_runtime_resume(struct sdhci_pci_chip *chip)
> -{
> - struct sdhci_pci_slot *slot = chip->slots[0];
> - struct sdhci_host *host = slot->host;
> - u16 clock;
> -
> - clock = sdhci_readw(host, SDHCI_CLOCK_CONTROL);
> -
> - clock |= SDHCI_CLOCK_PLL_EN;
> - clock &= ~SDHCI_CLOCK_INT_STABLE;
> - sdhci_writew(host, clock, SDHCI_CLOCK_CONTROL);
> -
> - /* Wait max 150 ms */
> - if (read_poll_timeout(sdhci_readw, clock, (clock & SDHCI_CLOCK_INT_STABLE),
> - 1000, 150000, false, host, SDHCI_CLOCK_CONTROL)) {
> - pr_err("%s: PLL clock never stabilised.\n",
> - mmc_hostname(host->mmc));
> - sdhci_dumpregs(host);
> - }
> -
> - clock |= SDHCI_CLOCK_CARD_EN;
> - sdhci_writew(host, clock, SDHCI_CLOCK_CONTROL);
> -
> - return 0;
> -}
> -#endif
> -
> static int gli_probe_slot_gl9763e(struct sdhci_pci_slot *slot)
> {
> struct pci_dev *pdev = slot->chip->pdev;
> @@ -1016,6 +950,9 @@ static int gli_probe_slot_gl9763e(struct sdhci_pci_slot *slot)
> gli_pcie_enable_msi(slot);
> host->mmc_host_ops.hs400_enhanced_strobe =
> gl9763e_hs400_enhanced_strobe;
> +
> + host->mmc_host_ops.request = gl9763e_request;
> +
> gli_set_gl9763e(slot);
> sdhci_enable_v4_mode(host);
>
> @@ -1102,11 +1039,7 @@ const struct sdhci_pci_fixes sdhci_gl9763e = {
> #ifdef CONFIG_PM_SLEEP
> .resume = sdhci_cqhci_gli_resume,
> .suspend = sdhci_cqhci_gli_suspend,
> -#endif
> -#ifdef CONFIG_PM
> - .runtime_suspend = gl9763e_runtime_suspend,
> - .runtime_resume = gl9763e_runtime_resume,
> - .allow_runtime_pm = true,
> #endif
> .add_host = gl9763e_add_host,
> + .priv_size = sizeof(struct gli_host),
> };
> --
> 2.36.1
>
next prev parent reply other threads:[~2022-05-26 1:15 UTC|newest]
Thread overview: 3+ messages / expand[flat|nested] mbox.gz Atom feed top
2022-05-25 12:27 [PATCH] mmc: sdhci-pci-gli: Improve Random 4K Read Performance of GL9763E Jason Lai
2022-05-26 1:14 ` Ben Chuang [this message]
-- strict thread matches above, loose matches on Subject: below --
2021-06-24 2:16 Renius Chen
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=CACT4zj9F7J3NgFMK7sG1aL19Y12zrPejPuD2ZEhwKYf0oosEVQ@mail.gmail.com \
--to=benchuanggli@gmail.com \
--cc=SeanHY.chen@genesyslogic.com.tw \
--cc=adrian.hunter@intel.com \
--cc=ben.chuang@genesyslogic.com.tw \
--cc=greg.tu@genesyslogic.com.tw \
--cc=jason.lai@genesyslogic.com.tw \
--cc=jasonlai.genesyslogic@gmail.com \
--cc=linux-mmc@vger.kernel.org \
--cc=reniuschengl@gmail.com \
--cc=ulf.hansson@linaro.org \
--cc=victor.shih@genesyslogic.com.tw \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).