Linux CAN drivers development
 help / color / mirror / Atom feed
From: Vincent Mailhol <mailhol@kernel.org>
To: Oliver Hartkopp <socketcan@hartkopp.net>,
	Marc Kleine-Budde <mkl@pengutronix.de>
Cc: linux-can@vger.kernel.org, linux-kernel@vger.kernel.org
Subject: Re: [PATCH 2/3] can: raw: use bitfields to store flags in struct raw_sock
Date: Mon, 15 Sep 2025 19:47:00 +0900	[thread overview]
Message-ID: <f0a34514-19da-4c73-9cd4-ae220fed6447@kernel.org> (raw)
In-Reply-To: <f96cd163-0364-4c14-882b-48c3f8e0f05a@hartkopp.net>

On 15/09/2025 at 19:16, Oliver Hartkopp wrote:
> On 15.09.25 11:23, Vincent Mailhol wrote:
>> The loopback, recv_own_msgs, fd_frames and xl_frames fields of struct
>> raw_sock just need to store one bit of information.
>>
>> Declare all those members as a bitfields of type unsigned int and
>> width one bit.
>>
>> Add a temporary variable to raw_setsockopt() and raw_getsockopt() to
>> make the conversion between the stored bits and the socket interface.
>>
>> This reduces struct raw_sock by eight bytes.
>>
>> Statistics before:
>>
>>    $ pahole --class_name=raw_sock net/can/raw.o
>>    struct raw_sock {
>>        struct sock                sk __attribute__((__aligned__(8))); /*    
>> 0   776 */
>>
>>        /* XXX last struct has 1 bit hole */
>>
>>        /* --- cacheline 12 boundary (768 bytes) was 8 bytes ago --- */
>>        int                        bound;                /*   776     4 */
>>        int                        ifindex;              /*   780     4 */
>>        struct net_device *        dev;                  /*   784     8 */
>>        netdevice_tracker          dev_tracker;          /*   792     0 */
>>        struct list_head           notifier;             /*   792    16 */
>>        int                        loopback;             /*   808     4 */
>>        int                        recv_own_msgs;        /*   812     4 */
>>        int                        fd_frames;            /*   816     4 */
>>        int                        xl_frames;            /*   820     4 */
>>        struct can_raw_vcid_options raw_vcid_opts;       /*   824     4 */
>>        canid_t                    tx_vcid_shifted;      /*   828     4 */
>>        /* --- cacheline 13 boundary (832 bytes) --- */
>>        canid_t                    rx_vcid_shifted;      /*   832     4 */
>>        canid_t                    rx_vcid_mask_shifted; /*   836     4 */
>>        int                        join_filters;         /*   840     4 */
>>        int                        count;                /*   844     4 */
>>        struct can_filter          dfilter;              /*   848     8 */
>>        struct can_filter *        filter;               /*   856     8 */
>>        can_err_mask_t             err_mask;             /*   864     4 */
>>
>>        /* XXX 4 bytes hole, try to pack */
>>
>>        struct uniqframe *         uniq;                 /*   872     8 */
>>
>>        /* size: 880, cachelines: 14, members: 20 */
>>        /* sum members: 876, holes: 1, sum holes: 4 */
>>        /* member types with bit holes: 1, total: 1 */
>>        /* forced alignments: 1 */
>>        /* last cacheline: 48 bytes */
>>    } __attribute__((__aligned__(8)));
>>
>> ...and after:
>>
>>    $ pahole --class_name=raw_sock net/can/raw.o
>>    struct raw_sock {
>>        struct sock                sk __attribute__((__aligned__(8))); /*    
>> 0   776 */
>>
>>        /* XXX last struct has 1 bit hole */
>>
>>        /* --- cacheline 12 boundary (768 bytes) was 8 bytes ago --- */
>>        int                        bound;                /*   776     4 */
>>        int                        ifindex;              /*   780     4 */
>>        struct net_device *        dev;                  /*   784     8 */
>>        netdevice_tracker          dev_tracker;          /*   792     0 */
>>        struct list_head           notifier;             /*   792    16 */
>>        unsigned int               loopback:1;           /*   808: 0  4 */
>>        unsigned int               recv_own_msgs:1;      /*   808: 1  4 */
>>        unsigned int               fd_frames:1;          /*   808: 2  4 */
>>        unsigned int               xl_frames:1;          /*   808: 3  4 */
> 
> This means that the former data structures (int) are not copied but bits are set
> (shifted, ANDed, ORed, etc) right?
> 
> So what's the difference in the code the CPU has to process for this
> improvement? Is implementing this bitmap more efficient or similar to copy the
> (unsigned ints) as-is?

It will indeed have to add a couple assembly instructions. But this is peanuts.
In the best case, the out of order execution might very well optimize this so
that not even a CPU tick is wasted. In the worst case, it is a couple CPU ticks.

On the other hands, reducing the size by 16 bytes lowers the risk to have a
cache miss. And removing one cache miss outperforms by an order of magnitude the
penalty of adding a couple assembly instructions.

Well, I did not benchmark it, but this is a commonly accepted trade off.


Yours sincerely,
Vincent Mailhol


  reply	other threads:[~2025-09-15 10:47 UTC|newest]

Thread overview: 11+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2025-09-15  9:23 [PATCH 0/3] can: raw: optimize the sizes of struct uniqframe and struct raw_sock Vincent Mailhol
2025-09-15  9:23 ` [PATCH 1/3] can: raw: reorder struct uniqframe's members to optimise packing Vincent Mailhol
2025-09-15 10:18   ` Oliver Hartkopp
2025-09-15  9:23 ` [PATCH 2/3] can: raw: use bitfields to store flags in struct raw_sock Vincent Mailhol
2025-09-15 10:16   ` Oliver Hartkopp
2025-09-15 10:47     ` Vincent Mailhol [this message]
2025-09-15 17:41       ` Oliver Hartkopp
2025-09-16 18:35   ` Christophe JAILLET
2025-09-17  4:43     ` Vincent Mailhol
2025-09-15  9:23 ` [PATCH 3/3] can: raw: reorder struct raw_sock's members to optimise packing Vincent Mailhol
2025-09-15 17:42   ` Oliver Hartkopp

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=f0a34514-19da-4c73-9cd4-ae220fed6447@kernel.org \
    --to=mailhol@kernel.org \
    --cc=linux-can@vger.kernel.org \
    --cc=linux-kernel@vger.kernel.org \
    --cc=mkl@pengutronix.de \
    --cc=socketcan@hartkopp.net \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox