From: Anthony Liguori <anthony@codemonkey.ws>
To: Alex Williamson <alex.williamson@hp.com>
Cc: qemu-devel <qemu-devel@nongnu.org>, kvm <kvm@vger.kernel.org>
Subject: Re: [PATCH] e1000 VLAN offload emulation
Date: Thu, 20 Nov 2008 17:11:35 -0600 [thread overview]
Message-ID: <4925EEA7.6000804@codemonkey.ws> (raw)
In-Reply-To: <1227127052.7652.20.camel@lappy>
Alex Williamson wrote:
> We're currently ignoring the e1000 VLAN tagging, stripping and filtering
> features in the e1000 emulation. This patch adds backing for the
> relevant registers and provides a software implementation of the
> acceleration, such that a guest can make use of VLANs.
>
> This is mostly (only?) useful for a guest on a bridge (not user mode
> networking). The only caveat beyond that is that you need to make sure
> the host NIC isn't doing it's own tagging, stripping, or filtering.
> This generally means the host NIC on the bridge should not be part of a
> VLAN. Thanks,
>
> Alex
>
> Signed-off-by: Alex Williamson <alex.williamson@hp.com>
> --
>
> Patch against KVM, but applies w/ only one line of offset to qemu.
>
Hi Alex,
The patch looks good but I don't like the idea of taking patches against
kvm-userspace. It suggests that people have only tested in
kvm-userspace which means it's not guaranteed to work (or even compile)
in upstream QEMU. Please rebase against QEMU and resubmit.
Regards,
Anthony Liguori
> diff --git a/qemu/hw/e1000.c b/qemu/hw/e1000.c
> index e2cc7f1..7be87e4 100644
> --- a/qemu/hw/e1000.c
> +++ b/qemu/hw/e1000.c
> @@ -89,9 +89,12 @@ typedef struct E1000State_st {
> int check_rxov;
> struct e1000_tx {
> unsigned char header[256];
> + unsigned char vlan_header[4];
> + unsigned char vlan[4];
> unsigned char data[0x10000];
> uint16_t size;
> unsigned char sum_needed;
> + unsigned char vlan_needed;
> uint8_t ipcss;
> uint8_t ipcso;
> uint16_t ipcse;
> @@ -128,7 +131,8 @@ enum {
> defreg(TDBAL), defreg(TDH), defreg(TDLEN), defreg(TDT),
> defreg(TORH), defreg(TORL), defreg(TOTH), defreg(TOTL),
> defreg(TPR), defreg(TPT), defreg(TXDCTL), defreg(WUFC),
> - defreg(RA), defreg(MTA), defreg(CRCERRS),
> + defreg(RA), defreg(MTA), defreg(CRCERRS),defreg(VFTA),
> + defreg(VET),
> };
>
> enum { PHY_R = 1, PHY_W = 2, PHY_RW = PHY_R | PHY_W };
> @@ -294,6 +298,31 @@ putsum(uint8_t *data, uint32_t n, uint32_t sloc, uint32_t css, uint32_t cse)
> }
> }
>
> +static inline int
> +vlan_enabled(E1000State *s)
> +{
> + return ((s->mac_reg[CTRL] & E1000_CTRL_VME) != 0);
> +}
> +
> +static inline int
> +vlan_rx_filter_enabled(E1000State *s)
> +{
> + return ((s->mac_reg[RCTL] & E1000_RCTL_VFE) != 0);
> +}
> +
> +static inline int
> +is_vlan_packet(E1000State *s, const uint8_t *buf)
> +{
> + return (be16_to_cpup((uint16_t *)(buf + 12)) ==
> + le16_to_cpup((uint16_t *)(s->mac_reg + VET)));
> +}
> +
> +static inline int
> +is_vlan_txd(uint32_t txd_lower)
> +{
> + return ((txd_lower & E1000_TXD_CMD_VLE) != 0);
> +}
> +
> static void
> xmit_seg(E1000State *s)
> {
> @@ -336,7 +365,12 @@ xmit_seg(E1000State *s)
> putsum(tp->data, tp->size, tp->tucso, tp->tucss, tp->tucse);
> if (tp->sum_needed & E1000_TXD_POPTS_IXSM)
> putsum(tp->data, tp->size, tp->ipcso, tp->ipcss, tp->ipcse);
> - qemu_send_packet(s->vc, tp->data, tp->size);
> + if (tp->vlan_needed) {
> + memmove(tp->vlan, tp->data, 12);
> + memcpy(tp->data + 8, tp->vlan_header, 4);
> + qemu_send_packet(s->vc, tp->vlan, tp->size + 4);
> + } else
> + qemu_send_packet(s->vc, tp->data, tp->size);
> s->mac_reg[TPT]++;
> s->mac_reg[GPTC]++;
> n = s->mac_reg[TOTL];
> @@ -383,6 +417,15 @@ process_tx_desc(E1000State *s, struct e1000_tx_desc *dp)
> // legacy descriptor
> tp->cptse = 0;
>
> + if (vlan_enabled(s) && is_vlan_txd(txd_lower) &&
> + (tp->cptse || txd_lower & E1000_TXD_CMD_EOP)) {
> + tp->vlan_needed = 1;
> + cpu_to_be16wu((uint16_t *)(tp->vlan_header),
> + le16_to_cpup((uint16_t *)(s->mac_reg + VET)));
> + cpu_to_be16wu((uint16_t *)(tp->vlan_header + 2),
> + le16_to_cpu(dp->upper.fields.special));
> + }
> +
> addr = le64_to_cpu(dp->buffer_addr);
> if (tp->tse && tp->cptse) {
> hdr = tp->hdr_len;
> @@ -416,6 +459,7 @@ process_tx_desc(E1000State *s, struct e1000_tx_desc *dp)
> xmit_seg(s);
> tp->tso_frames = 0;
> tp->sum_needed = 0;
> + tp->vlan_needed = 0;
> tp->size = 0;
> tp->cptse = 0;
> }
> @@ -482,6 +526,14 @@ receive_filter(E1000State *s, const uint8_t *buf, int size)
> static int mta_shift[] = {4, 3, 2, 0};
> uint32_t f, rctl = s->mac_reg[RCTL], ra[2], *rp;
>
> + if (is_vlan_packet(s, buf) && vlan_rx_filter_enabled(s)) {
> + uint16_t vid = be16_to_cpup((uint16_t *)(buf + 14));
> + uint32_t vfta = le32_to_cpup((uint32_t *)(s->mac_reg + VFTA) +
> + ((vid >> 5) & 0x7f));
> + if ((vfta & (1 << (vid & 0x1f))) == 0)
> + return 0;
> + }
> +
> if (rctl & E1000_RCTL_UPE) // promiscuous
> return 1;
>
> @@ -536,6 +588,8 @@ e1000_receive(void *opaque, const uint8_t *buf, int size)
> target_phys_addr_t base;
> unsigned int n, rdt;
> uint32_t rdh_start;
> + uint16_t vlan_special = 0;
> + uint8_t vlan_status = 0, vlan_offset = 0;
>
> if (!(s->mac_reg[RCTL] & E1000_RCTL_EN))
> return;
> @@ -549,6 +603,14 @@ e1000_receive(void *opaque, const uint8_t *buf, int size)
> if (!receive_filter(s, buf, size))
> return;
>
> + if (vlan_enabled(s) && is_vlan_packet(s, buf)) {
> + vlan_special = cpu_to_le16(be16_to_cpup((uint16_t *)(buf + 14)));
> + memmove((void *)(buf + 4), buf, 12);
> + vlan_status = E1000_RXD_STAT_VP;
> + vlan_offset = 4;
> + size -= 4;
> + }
> +
> rdh_start = s->mac_reg[RDH];
> size += 4; // for the header
> do {
> @@ -559,10 +621,11 @@ e1000_receive(void *opaque, const uint8_t *buf, int size)
> base = ((uint64_t)s->mac_reg[RDBAH] << 32) + s->mac_reg[RDBAL] +
> sizeof(desc) * s->mac_reg[RDH];
> cpu_physical_memory_read(base, (void *)&desc, sizeof(desc));
> - desc.status |= E1000_RXD_STAT_DD;
> + desc.special = vlan_special;
> + desc.status |= (vlan_status | E1000_RXD_STAT_DD);
> if (desc.buffer_addr) {
> cpu_physical_memory_write(le64_to_cpu(desc.buffer_addr),
> - (void *)buf, size);
> + (void *)(buf + vlan_offset), size);
> desc.length = cpu_to_le16(size);
> desc.status |= E1000_RXD_STAT_EOP|E1000_RXD_STAT_IXSM;
> } else // as per intel docs; skip descriptors with null buf addr
> @@ -692,7 +755,7 @@ static uint32_t (*macreg_readops[])(E1000State *, int) = {
> getreg(WUFC), getreg(TDT), getreg(CTRL), getreg(LEDCTL),
> getreg(MANC), getreg(MDIC), getreg(SWSM), getreg(STATUS),
> getreg(TORL), getreg(TOTL), getreg(IMS), getreg(TCTL),
> - getreg(RDH), getreg(RDT),
> + getreg(RDH), getreg(RDT), getreg(VET),
>
> [TOTH] = mac_read_clr8, [TORH] = mac_read_clr8, [GPRC] = mac_read_clr4,
> [GPTC] = mac_read_clr4, [TPR] = mac_read_clr4, [TPT] = mac_read_clr4,
> @@ -700,6 +763,7 @@ static uint32_t (*macreg_readops[])(E1000State *, int) = {
> [CRCERRS ... MPC] = &mac_readreg,
> [RA ... RA+31] = &mac_readreg,
> [MTA ... MTA+127] = &mac_readreg,
> + [VFTA ... VFTA+127] = &mac_readreg,
> };
> enum { NREADOPS = sizeof(macreg_readops) / sizeof(*macreg_readops) };
>
> @@ -707,7 +771,7 @@ enum { NREADOPS = sizeof(macreg_readops) / sizeof(*macreg_readops) };
> static void (*macreg_writeops[])(E1000State *, int, uint32_t) = {
> putreg(PBA), putreg(EERD), putreg(SWSM), putreg(WUFC),
> putreg(TDBAL), putreg(TDBAH), putreg(TXDCTL), putreg(RDBAH),
> - putreg(RDBAL), putreg(LEDCTL),
> + putreg(RDBAL), putreg(LEDCTL), putreg(CTRL), putreg(VET),
> [TDLEN] = set_dlen, [RDLEN] = set_dlen, [TCTL] = set_tctl,
> [TDT] = set_tctl, [MDIC] = set_mdic, [ICS] = set_ics,
> [TDH] = set_16bit, [RDH] = set_16bit, [RDT] = set_rdt,
> @@ -715,6 +779,7 @@ static void (*macreg_writeops[])(E1000State *, int, uint32_t) = {
> [EECD] = set_eecd, [RCTL] = set_rx_control,
> [RA ... RA+31] = &mac_writereg,
> [MTA ... MTA+127] = &mac_writereg,
> + [VFTA ... VFTA+127] = &mac_writereg,
> };
> enum { NWRITEOPS = sizeof(macreg_writeops) / sizeof(*macreg_writeops) };
>
> @@ -789,13 +854,14 @@ static const int mac_regtosave[] = {
> LEDCTL, MANC, MDIC, MPC, PBA, RCTL, RDBAH, RDBAL, RDH,
> RDLEN, RDT, STATUS, SWSM, TCTL, TDBAH, TDBAL, TDH, TDLEN,
> TDT, TORH, TORL, TOTH, TOTL, TPR, TPT, TXDCTL, WUFC,
> + VET,
> };
> enum { MAC_NSAVE = sizeof mac_regtosave/sizeof *mac_regtosave };
>
> static const struct {
> int size;
> int array0;
> -} mac_regarraystosave[] = { {32, RA}, {128, MTA} };
> +} mac_regarraystosave[] = { {32, RA}, {128, MTA}, {128, VFTA} };
> enum { MAC_NARRAYS = sizeof mac_regarraystosave/sizeof *mac_regarraystosave };
>
> static void
>
>
> --
> To unsubscribe from this list: send the line "unsubscribe kvm" in
> the body of a message to majordomo@vger.kernel.org
> More majordomo info at http://vger.kernel.org/majordomo-info.html
>
next prev parent reply other threads:[~2008-11-20 23:11 UTC|newest]
Thread overview: 4+ messages / expand[flat|nested] mbox.gz Atom feed top
2008-11-19 20:37 [PATCH] e1000 VLAN offload emulation Alex Williamson
2008-11-20 23:11 ` Anthony Liguori [this message]
2008-11-21 15:41 ` Alex Williamson
2008-11-21 16:25 ` Anthony Liguori
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=4925EEA7.6000804@codemonkey.ws \
--to=anthony@codemonkey.ws \
--cc=alex.williamson@hp.com \
--cc=kvm@vger.kernel.org \
--cc=qemu-devel@nongnu.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox