Message ID | 20200922023151.387447-12-warthog618@gmail.com |
---|---|
State | Superseded |
Headers | show |
Series | gpio: cdev: add uAPI v2 | expand |
On Tue, Sep 22, 2020 at 5:36 AM Kent Gibson <warthog618@gmail.com> wrote: > > Add support for the GPIO_V2_LINE_SET_VALUES_IOCTL. > +static long linereq_set_values_unlocked(struct linereq *lr, > + struct gpio_v2_line_values *lv) > +{ > + DECLARE_BITMAP(vals, GPIO_V2_LINES_MAX); > + struct gpio_desc **descs; > + unsigned int i, didx, num_set; > + int ret; > + > + bitmap_zero(vals, GPIO_V2_LINES_MAX); > + for (num_set = 0, i = 0; i < lr->num_lines; i++) { > + if (lv->mask & BIT_ULL(i)) { Similar idea DECLARE_BITMAP(mask, 64) = BITMAP_FROM_U64(lv->mask); num_set = bitmap_weight(); for_each_set_bit(i, mask, lr->num_lines) > + if (!test_bit(FLAG_IS_OUT, &lr->lines[i].desc->flags)) > + return -EPERM; > + if (lv->bits & BIT_ULL(i)) > + __set_bit(num_set, vals); > + num_set++; > + descs = &lr->lines[i].desc; > + } > + } > + if (num_set == 0) > + return -EINVAL; > + > + if (num_set != 1) { > + /* build compacted desc array and values */ > + descs = kmalloc_array(num_set, sizeof(*descs), GFP_KERNEL); > + if (!descs) > + return -ENOMEM; > + for (didx = 0, i = 0; i < lr->num_lines; i++) { > + if (lv->mask & BIT_ULL(i)) { > + descs[didx] = lr->lines[i].desc; > + didx++; > + } > + } > + } > + ret = gpiod_set_array_value_complex(false, true, num_set, > + descs, NULL, vals); > + > + if (num_set != 1) > + kfree(descs); > + return ret; > +} > + > +static long linereq_set_values(struct linereq *lr, void __user *ip) > +{ > + struct gpio_v2_line_values lv; > + int ret; > + > + if (copy_from_user(&lv, ip, sizeof(lv))) > + return -EFAULT; > + > + mutex_lock(&lr->config_mutex); > + > + ret = linereq_set_values_unlocked(lr, &lv); > + > + mutex_unlock(&lr->config_mutex); > + > + return ret; > +} > + > static long linereq_set_config_unlocked(struct linereq *lr, > struct gpio_v2_line_config *lc) > { > @@ -889,6 +948,8 @@ static long linereq_ioctl(struct file *file, unsigned int cmd, > > if (cmd == GPIO_V2_LINE_GET_VALUES_IOCTL) > return linereq_get_values(lr, ip); > + else if (cmd == GPIO_V2_LINE_SET_VALUES_IOCTL) > + return linereq_set_values(lr, ip); > else if (cmd == GPIO_V2_LINE_SET_CONFIG_IOCTL) > return linereq_set_config(lr, ip); > > -- > 2.28.0 >
On Wed, Sep 23, 2020 at 07:18:08PM +0300, Andy Shevchenko wrote: > On Tue, Sep 22, 2020 at 5:36 AM Kent Gibson <warthog618@gmail.com> wrote: > > > > Add support for the GPIO_V2_LINE_SET_VALUES_IOCTL. > > > +static long linereq_set_values_unlocked(struct linereq *lr, > > + struct gpio_v2_line_values *lv) > > +{ > > + DECLARE_BITMAP(vals, GPIO_V2_LINES_MAX); > > + struct gpio_desc **descs; > > + unsigned int i, didx, num_set; > > + int ret; > > + > > + bitmap_zero(vals, GPIO_V2_LINES_MAX); > > + for (num_set = 0, i = 0; i < lr->num_lines; i++) { > > + if (lv->mask & BIT_ULL(i)) { > > Similar idea > > DECLARE_BITMAP(mask, 64) = BITMAP_FROM_U64(lv->mask); > > num_set = bitmap_weight(); > I had played with this option, but bitmap_weight() counts all the bits set in the mask - which considers bits >= lr->num_lines. So you would need to mask lv->mask before converting it to a bitmap. (I'm ok with ignoring those bits in case userspace wants to be lazy and use an all 1s mask.) But since we're looping over the bitmap anyway we may as well just count as we go. > for_each_set_bit(i, mask, lr->num_lines) > Yeah, that should work. I vaguely recall trying this and finding it generated larger object code, but I'll give it another try and if it works out then include it in v10. Cheers, Kent.
On Thu, Sep 24, 2020 at 10:32 AM Kent Gibson <warthog618@gmail.com> wrote: > On Wed, Sep 23, 2020 at 07:18:08PM +0300, Andy Shevchenko wrote: > > On Tue, Sep 22, 2020 at 5:36 AM Kent Gibson <warthog618@gmail.com> wrote: > > > > > > Add support for the GPIO_V2_LINE_SET_VALUES_IOCTL. > > > > > +static long linereq_set_values_unlocked(struct linereq *lr, > > > + struct gpio_v2_line_values *lv) > > > +{ > > > + DECLARE_BITMAP(vals, GPIO_V2_LINES_MAX); > > > + struct gpio_desc **descs; > > > + unsigned int i, didx, num_set; > > > + int ret; > > > + > > > + bitmap_zero(vals, GPIO_V2_LINES_MAX); > > > + for (num_set = 0, i = 0; i < lr->num_lines; i++) { > > > + if (lv->mask & BIT_ULL(i)) { > > > > Similar idea > > > > DECLARE_BITMAP(mask, 64) = BITMAP_FROM_U64(lv->mask); > > > > num_set = bitmap_weight(); > > > > I had played with this option, but bitmap_weight() counts all > the bits set in the mask - which considers bits >= lr->num_lines. Does it mean we have a bug in the code and no test case covered it? Because from the API I see the parameter nbits which should prevent this. > So you would need to mask lv->mask before converting it to a bitmap. > (I'm ok with ignoring those bits in case userspace wants to be lazy and > use an all 1s mask.) Can you confirm a bug in bitmap API? If it's so it's a serious one. > But since we're looping over the bitmap anyway we may as well just > count as we go. > > > for_each_set_bit(i, mask, lr->num_lines) > > > > Yeah, that should work. I vaguely recall trying this and finding it > generated larger object code, but I'll give it another try and if it > works out then include it in v10. -- With Best Regards, Andy Shevchenko
On Thu, Sep 24, 2020 at 11:21:05AM +0300, Andy Shevchenko wrote: > On Thu, Sep 24, 2020 at 10:32 AM Kent Gibson <warthog618@gmail.com> wrote: > > On Wed, Sep 23, 2020 at 07:18:08PM +0300, Andy Shevchenko wrote: > > > On Tue, Sep 22, 2020 at 5:36 AM Kent Gibson <warthog618@gmail.com> wrote: > > > > > > > > Add support for the GPIO_V2_LINE_SET_VALUES_IOCTL. > > > > > > > +static long linereq_set_values_unlocked(struct linereq *lr, > > > > + struct gpio_v2_line_values *lv) > > > > +{ > > > > + DECLARE_BITMAP(vals, GPIO_V2_LINES_MAX); > > > > + struct gpio_desc **descs; > > > > + unsigned int i, didx, num_set; > > > > + int ret; > > > > + > > > > + bitmap_zero(vals, GPIO_V2_LINES_MAX); > > > > + for (num_set = 0, i = 0; i < lr->num_lines; i++) { > > > > + if (lv->mask & BIT_ULL(i)) { > > > > > > Similar idea > > > > > > DECLARE_BITMAP(mask, 64) = BITMAP_FROM_U64(lv->mask); > > > > > > num_set = bitmap_weight(); > > > > > > > I had played with this option, but bitmap_weight() counts all > > the bits set in the mask - which considers bits >= lr->num_lines. > > Does it mean we have a bug in the code and no test case covered it? > Because from the API I see the parameter nbits which should prevent > this. > Probably me being thick and using nbits as the size of the mask rather than the number of bits of interest. Cheers, Kent. > > So you would need to mask lv->mask before converting it to a bitmap. > > (I'm ok with ignoring those bits in case userspace wants to be lazy and > > use an all 1s mask.) > > Can you confirm a bug in bitmap API? If it's so it's a serious one. > > > But since we're looping over the bitmap anyway we may as well just > > count as we go. > > > > > for_each_set_bit(i, mask, lr->num_lines) > > > > > > > Yeah, that should work. I vaguely recall trying this and finding it > > generated larger object code, but I'll give it another try and if it > > works out then include it in v10. > > > -- > With Best Regards, > Andy Shevchenko
On Thu, Sep 24, 2020 at 03:32:48PM +0800, Kent Gibson wrote: > On Wed, Sep 23, 2020 at 07:18:08PM +0300, Andy Shevchenko wrote: > > On Tue, Sep 22, 2020 at 5:36 AM Kent Gibson <warthog618@gmail.com> wrote: > > > > > > Add support for the GPIO_V2_LINE_SET_VALUES_IOCTL. > > > > > +static long linereq_set_values_unlocked(struct linereq *lr, > > > + struct gpio_v2_line_values *lv) > > > +{ > > > + DECLARE_BITMAP(vals, GPIO_V2_LINES_MAX); > > > + struct gpio_desc **descs; > > > + unsigned int i, didx, num_set; > > > + int ret; > > > + > > > + bitmap_zero(vals, GPIO_V2_LINES_MAX); > > > + for (num_set = 0, i = 0; i < lr->num_lines; i++) { > > > + if (lv->mask & BIT_ULL(i)) { > > > > Similar idea > > > > DECLARE_BITMAP(mask, 64) = BITMAP_FROM_U64(lv->mask); > > > > num_set = bitmap_weight(); > > > > I had played with this option, but bitmap_weight() counts all > the bits set in the mask - which considers bits >= lr->num_lines. > So you would need to mask lv->mask before converting it to a bitmap. > (I'm ok with ignoring those bits in case userspace wants to be lazy and > use an all 1s mask.) > > But since we're looping over the bitmap anyway we may as well just > count as we go. > > > for_each_set_bit(i, mask, lr->num_lines) > > > > Yeah, that should work. I vaguely recall trying this and finding it > generated larger object code, but I'll give it another try and if it > works out then include it in v10. > Tried it again and, while it works, it does increase the size of gpiolib-cdev.o as follows: u64 -> bitmap x86_64 28360 28616 i386 22056 22100 aarch64 37392 37600 mips32 28008 28016 So for 64-bit platforms changing to bitmap generates larger code, probably as we are forcing them to use 32-bit array semantics where before they could use the native u64. For 32-bit there is a much smaller difference as they were already using 32-bit array semantics to realise the u64. Those are for some of my test builds, so obviously YMMV. It is also only for changing linereq_get_values(), which has three instances of the loop. linereq_set_values_unlocked() has another two, so you could expect another increase of ~2/3 of that seen here if we change that as well. The sizeable increase in x86_64 was what made me revert this last time, and I'm still satisfied with that choice. Are you still eager to switch to for_each_set_bit()? Cheers, Kent.
On Thu, Sep 24, 2020 at 3:46 PM Kent Gibson <warthog618@gmail.com> wrote: > On Thu, Sep 24, 2020 at 03:32:48PM +0800, Kent Gibson wrote: > > On Wed, Sep 23, 2020 at 07:18:08PM +0300, Andy Shevchenko wrote: > > > On Tue, Sep 22, 2020 at 5:36 AM Kent Gibson <warthog618@gmail.com> wrote: > > > > > > > > Add support for the GPIO_V2_LINE_SET_VALUES_IOCTL. > > > > > > > +static long linereq_set_values_unlocked(struct linereq *lr, > > > > + struct gpio_v2_line_values *lv) > > > > +{ > > > > + DECLARE_BITMAP(vals, GPIO_V2_LINES_MAX); > > > > + struct gpio_desc **descs; > > > > + unsigned int i, didx, num_set; > > > > + int ret; > > > > + > > > > + bitmap_zero(vals, GPIO_V2_LINES_MAX); > > > > + for (num_set = 0, i = 0; i < lr->num_lines; i++) { > > > > + if (lv->mask & BIT_ULL(i)) { > > > > > > Similar idea > > > > > > DECLARE_BITMAP(mask, 64) = BITMAP_FROM_U64(lv->mask); > > > > > > num_set = bitmap_weight(); > > > > > > > I had played with this option, but bitmap_weight() counts all > > the bits set in the mask - which considers bits >= lr->num_lines. > > So you would need to mask lv->mask before converting it to a bitmap. > > (I'm ok with ignoring those bits in case userspace wants to be lazy and > > use an all 1s mask.) > > > > But since we're looping over the bitmap anyway we may as well just > > count as we go. > > > > > for_each_set_bit(i, mask, lr->num_lines) > > > > > > > Yeah, that should work. I vaguely recall trying this and finding it > > generated larger object code, but I'll give it another try and if it > > works out then include it in v10. > > > > Tried it again and, while it works, it does increase the size of > gpiolib-cdev.o as follows: > > u64 -> bitmap > x86_64 28360 28616 > i386 22056 22100 > aarch64 37392 37600 > mips32 28008 28016 Yes, that's pity... See below. > So for 64-bit platforms changing to bitmap generates larger code, > probably as we are forcing them to use 32-bit array semantics where > before they could use the native u64. For 32-bit there is a much > smaller difference as they were already using 32-bit array semantics > to realise the u64. > > Those are for some of my test builds, so obviously YMMV. > > It is also only for changing linereq_get_values(), which has three > instances of the loop. linereq_set_values_unlocked() has another two, > so you could expect another increase of ~2/3 of that seen here if we > change that as well. > > The sizeable increase in x86_64 was what made me revert this last time, > and I'm still satisfied with that choice. Are you still eager to switch > to for_each_set_bit()? I already asked once about short cut for for_each_set_bit in case of constant nbits parameter when it's <= BITS_PER_LONG, but here it seems we have variadic amount of lines, dunno if compiler can prove that it's smaller than long. In any case my point is that code readability has a preference vs. memory footprint (except hot paths) and if we are going to fix this it should be done in general. That said, if maintainers are okay with that I would prefer bitmap API over open-coded pieces. Also note, that it will be easier to extend in the future if needed (if we want to have more than BITS_PER_LONG [64] lines to handle). -- With Best Regards, Andy Shevchenko
On Fri, Sep 25, 2020 at 12:57:59PM +0300, Andy Shevchenko wrote: > On Thu, Sep 24, 2020 at 3:46 PM Kent Gibson <warthog618@gmail.com> wrote: > > On Thu, Sep 24, 2020 at 03:32:48PM +0800, Kent Gibson wrote: > > > On Wed, Sep 23, 2020 at 07:18:08PM +0300, Andy Shevchenko wrote: > > > > On Tue, Sep 22, 2020 at 5:36 AM Kent Gibson <warthog618@gmail.com> wrote: > > > > > > > > > > Add support for the GPIO_V2_LINE_SET_VALUES_IOCTL. > > > > > > > > > +static long linereq_set_values_unlocked(struct linereq *lr, > > > > > + struct gpio_v2_line_values *lv) > > > > > +{ > > > > > + DECLARE_BITMAP(vals, GPIO_V2_LINES_MAX); > > > > > + struct gpio_desc **descs; > > > > > + unsigned int i, didx, num_set; > > > > > + int ret; > > > > > + > > > > > + bitmap_zero(vals, GPIO_V2_LINES_MAX); > > > > > + for (num_set = 0, i = 0; i < lr->num_lines; i++) { > > > > > + if (lv->mask & BIT_ULL(i)) { > > > > > > > > Similar idea > > > > > > > > DECLARE_BITMAP(mask, 64) = BITMAP_FROM_U64(lv->mask); > > > > > > > > num_set = bitmap_weight(); > > > > > > > > > > I had played with this option, but bitmap_weight() counts all > > > the bits set in the mask - which considers bits >= lr->num_lines. > > > So you would need to mask lv->mask before converting it to a bitmap. > > > (I'm ok with ignoring those bits in case userspace wants to be lazy and > > > use an all 1s mask.) > > > > > > But since we're looping over the bitmap anyway we may as well just > > > count as we go. > > > > > > > for_each_set_bit(i, mask, lr->num_lines) > > > > > > > > > > Yeah, that should work. I vaguely recall trying this and finding it > > > generated larger object code, but I'll give it another try and if it > > > works out then include it in v10. > > > > > > > Tried it again and, while it works, it does increase the size of > > gpiolib-cdev.o as follows: > > > > u64 -> bitmap > > x86_64 28360 28616 > > i386 22056 22100 > > aarch64 37392 37600 > > mips32 28008 28016 > > Yes, that's pity... See below. > > > So for 64-bit platforms changing to bitmap generates larger code, > > probably as we are forcing them to use 32-bit array semantics where > > before they could use the native u64. For 32-bit there is a much > > smaller difference as they were already using 32-bit array semantics > > to realise the u64. > > > > Those are for some of my test builds, so obviously YMMV. > > > > It is also only for changing linereq_get_values(), which has three > > instances of the loop. linereq_set_values_unlocked() has another two, > > so you could expect another increase of ~2/3 of that seen here if we > > change that as well. > > > > The sizeable increase in x86_64 was what made me revert this last time, > > and I'm still satisfied with that choice. Are you still eager to switch > > to for_each_set_bit()? > > I already asked once about short cut for for_each_set_bit in case of > constant nbits parameter when it's <= BITS_PER_LONG, but here it seems > we have variadic amount of lines, dunno if compiler can prove that > it's smaller than long. In any case my point is that code readability > has a preference vs. memory footprint (except hot paths) and if we are > going to fix this it should be done in general. That said, if > maintainers are okay with that I would prefer bitmap API over > open-coded pieces. > Agreed - if the bitmap ops made better use of the architecure then I'd change to bitmap without question - it is more readable. Bart and Linus - do you have any preference? > Also note, that it will be easier to extend in the future if needed > (if we want to have more than BITS_PER_LONG [64] lines to handle). > Yeah, I think we can rule that one out - while I had initially written the uAPI with the option of > 64 lines we decided on the hard limit to keep things simple. And any user that needs to request more than 64 lines in one request shouldn't be using the GPIO uAPI. Cheers, Kent.
diff --git a/drivers/gpio/gpiolib-cdev.c b/drivers/gpio/gpiolib-cdev.c index debd3b277523..ba951f74e569 100644 --- a/drivers/gpio/gpiolib-cdev.c +++ b/drivers/gpio/gpiolib-cdev.c @@ -813,6 +813,65 @@ static long linereq_get_values(struct linereq *lr, void __user *ip) return 0; } +static long linereq_set_values_unlocked(struct linereq *lr, + struct gpio_v2_line_values *lv) +{ + DECLARE_BITMAP(vals, GPIO_V2_LINES_MAX); + struct gpio_desc **descs; + unsigned int i, didx, num_set; + int ret; + + bitmap_zero(vals, GPIO_V2_LINES_MAX); + for (num_set = 0, i = 0; i < lr->num_lines; i++) { + if (lv->mask & BIT_ULL(i)) { + if (!test_bit(FLAG_IS_OUT, &lr->lines[i].desc->flags)) + return -EPERM; + if (lv->bits & BIT_ULL(i)) + __set_bit(num_set, vals); + num_set++; + descs = &lr->lines[i].desc; + } + } + if (num_set == 0) + return -EINVAL; + + if (num_set != 1) { + /* build compacted desc array and values */ + descs = kmalloc_array(num_set, sizeof(*descs), GFP_KERNEL); + if (!descs) + return -ENOMEM; + for (didx = 0, i = 0; i < lr->num_lines; i++) { + if (lv->mask & BIT_ULL(i)) { + descs[didx] = lr->lines[i].desc; + didx++; + } + } + } + ret = gpiod_set_array_value_complex(false, true, num_set, + descs, NULL, vals); + + if (num_set != 1) + kfree(descs); + return ret; +} + +static long linereq_set_values(struct linereq *lr, void __user *ip) +{ + struct gpio_v2_line_values lv; + int ret; + + if (copy_from_user(&lv, ip, sizeof(lv))) + return -EFAULT; + + mutex_lock(&lr->config_mutex); + + ret = linereq_set_values_unlocked(lr, &lv); + + mutex_unlock(&lr->config_mutex); + + return ret; +} + static long linereq_set_config_unlocked(struct linereq *lr, struct gpio_v2_line_config *lc) { @@ -889,6 +948,8 @@ static long linereq_ioctl(struct file *file, unsigned int cmd, if (cmd == GPIO_V2_LINE_GET_VALUES_IOCTL) return linereq_get_values(lr, ip); + else if (cmd == GPIO_V2_LINE_SET_VALUES_IOCTL) + return linereq_set_values(lr, ip); else if (cmd == GPIO_V2_LINE_SET_CONFIG_IOCTL) return linereq_set_config(lr, ip);
Add support for the GPIO_V2_LINE_SET_VALUES_IOCTL. Signed-off-by: Kent Gibson <warthog618@gmail.com> --- drivers/gpio/gpiolib-cdev.c | 61 +++++++++++++++++++++++++++++++++++++ 1 file changed, 61 insertions(+)