On Thu, Jan 26, 2023 at 01:57:56AM +0300, Vitaliy Makkoveev wrote:
> On Wed, Jan 25, 2023 at 10:43:50PM +0300, Vitaliy Makkoveev wrote:
> > visa@, mpi@, I'm asking you to review, because you are involved in the
> > kevent(9) development.
> >
> > Hrvoje, if you want to test this diff, you need to disable pipex(4) with
> > "net.pipex.enable=0".
> >
>
> I missed we already have klist_init_mutex(), so the redundant *_klistops
> removed from previous diff.
I have a similar patch lying around, shown below. The main differences:
* Use the same mutex for both the read and write sides of the klists.
Having dedicated mutexes feels like overkill.
* Use klist_insert() and klist_remove() for shorter code.
* Share f_modify and f_process functions for read and write filters.
As pppx and pppac do not seem to have forced detaching, the calls to
klist_invalidate() are not needed.
Mutex assertions could be added in filt_pppx_write() and
filt_pppac_write() to make the locking assumption more explicit
(the code that calls these functions needs the lock). However, I have
omitted these assertions as they might not add much value.
diff --git a/sys/net/if_pppx.c b/sys/net/if_pppx.c
index a59c932d276..e4675973a06 100644
--- a/sys/net/if_pppx.c
+++ b/sys/net/if_pppx.c
@@ -56,7 +56,8 @@
#include <sys/socket.h>
#include <sys/ioctl.h>
#include <sys/vnode.h>
-#include <sys/selinfo.h>
+#include <sys/event.h>
+#include <sys/mutex.h>
#include <sys/refcnt.h>
#include <net/if.h>
@@ -118,6 +119,7 @@ struct pppx_if;
* I immutable after creation
* K kernel lock
* N net lock
+ * m pxd_mtx
*/
struct pppx_dev {
@@ -125,10 +127,9 @@ struct pppx_dev {
int pxd_unit; /* [I] */
/* kq shizz */
- struct selinfo pxd_rsel;
- struct mutex pxd_rsel_mtx;
- struct selinfo pxd_wsel;
- struct mutex pxd_wsel_mtx;
+ struct mutex pxd_mtx;
+ struct klist pxd_rklist; /* [m] */
+ struct klist pxd_wklist; /* [m] */
/* queue of packets for userland to service - protected by splnet */
struct mbuf_queue pxd_svcq;
@@ -195,22 +196,28 @@ void pppxattach(int);
void filt_pppx_rdetach(struct knote *);
int filt_pppx_read(struct knote *, long);
+int filt_pppx_modify(struct kevent *, struct knote *);
+int filt_pppx_process(struct knote *, struct kevent *);
const struct filterops pppx_rd_filtops = {
- .f_flags = FILTEROP_ISFD,
+ .f_flags = FILTEROP_ISFD | FILTEROP_MPSAFE,
.f_attach = NULL,
.f_detach = filt_pppx_rdetach,
.f_event = filt_pppx_read,
+ .f_modify = filt_pppx_modify,
+ .f_process = filt_pppx_process,
};
void filt_pppx_wdetach(struct knote *);
int filt_pppx_write(struct knote *, long);
const struct filterops pppx_wr_filtops = {
- .f_flags = FILTEROP_ISFD,
+ .f_flags = FILTEROP_ISFD | FILTEROP_MPSAFE,
.f_attach = NULL,
.f_detach = filt_pppx_wdetach,
.f_event = filt_pppx_write,
+ .f_modify = filt_pppx_modify,
+ .f_process = filt_pppx_process,
};
struct pppx_dev *
@@ -257,8 +264,9 @@ pppxopen(dev_t dev, int flags, int mode, struct proc *p)
}
pxd->pxd_unit = minor(dev);
- mtx_init(&pxd->pxd_rsel_mtx, IPL_NET);
- mtx_init(&pxd->pxd_wsel_mtx, IPL_NET);
+ mtx_init(&pxd->pxd_mtx, IPL_NET);
+ klist_init_mutex(&pxd->pxd_rklist, &pxd->pxd_mtx);
+ klist_init_mutex(&pxd->pxd_wklist, &pxd->pxd_mtx);
LIST_INIT(&pxd->pxd_pxis);
mq_init(&pxd->pxd_svcq, 128, IPL_NET);
@@ -453,29 +461,24 @@ int
pppxkqfilter(dev_t dev, struct knote *kn)
{
struct pppx_dev *pxd = pppx_dev2pxd(dev);
- struct mutex *mtx;
struct klist *klist;
switch (kn->kn_filter) {
case EVFILT_READ:
- mtx = &pxd->pxd_rsel_mtx;
- klist = &pxd->pxd_rsel.si_note;
+ klist = &pxd->pxd_rklist;
kn->kn_fop = &pppx_rd_filtops;
break;
case EVFILT_WRITE:
- mtx = &pxd->pxd_wsel_mtx;
- klist = &pxd->pxd_wsel.si_note;
+ klist = &pxd->pxd_wklist;
kn->kn_fop = &pppx_wr_filtops;
break;
default:
return (EINVAL);
}
- kn->kn_hook = (caddr_t)pxd;
+ kn->kn_hook = pxd;
- mtx_enter(mtx);
- klist_insert_locked(klist, kn);
- mtx_leave(mtx);
+ klist_insert(klist, kn);
return (0);
}
@@ -483,18 +486,17 @@ pppxkqfilter(dev_t dev, struct knote *kn)
void
filt_pppx_rdetach(struct knote *kn)
{
- struct pppx_dev *pxd = (struct pppx_dev *)kn->kn_hook;
- struct klist *klist = &pxd->pxd_rsel.si_note;
+ struct pppx_dev *pxd = kn->kn_hook;
- mtx_enter(&pxd->pxd_rsel_mtx);
- klist_remove_locked(klist, kn);
- mtx_leave(&pxd->pxd_rsel_mtx);
+ klist_remove(&pxd->pxd_rklist, kn);
}
int
filt_pppx_read(struct knote *kn, long hint)
{
- struct pppx_dev *pxd = (struct pppx_dev *)kn->kn_hook;
+ struct pppx_dev *pxd = kn->kn_hook;
+
+ MUTEX_ASSERT_LOCKED(&pxd->pxd_mtx);
kn->kn_data = mq_hdatalen(&pxd->pxd_svcq);
@@ -504,12 +506,9 @@ filt_pppx_read(struct knote *kn, long hint)
void
filt_pppx_wdetach(struct knote *kn)
{
- struct pppx_dev *pxd = (struct pppx_dev *)kn->kn_hook;
- struct klist *klist = &pxd->pxd_wsel.si_note;
+ struct pppx_dev *pxd = kn->kn_hook;
- mtx_enter(&pxd->pxd_wsel_mtx);
- klist_remove_locked(klist, kn);
- mtx_leave(&pxd->pxd_wsel_mtx);
+ klist_remove(&pxd->pxd_wklist, kn);
}
int
@@ -519,6 +518,32 @@ filt_pppx_write(struct knote *kn, long hint)
return (1);
}
+int
+filt_pppx_modify(struct kevent *kev, struct knote *kn)
+{
+ struct pppx_dev *pxd = kn->kn_hook;
+ int active;
+
+ mtx_enter(&pxd->pxd_mtx);
+ active = knote_modify(kev, kn);
+ mtx_leave(&pxd->pxd_mtx);
+
+ return (active);
+}
+
+int
+filt_pppx_process(struct knote *kn, struct kevent *kev)
+{
+ struct pppx_dev *pxd = kn->kn_hook;
+ int active;
+
+ mtx_enter(&pxd->pxd_mtx);
+ active = knote_process(kn, kev);
+ mtx_leave(&pxd->pxd_mtx);
+
+ return (active);
+}
+
int
pppxclose(dev_t dev, int flags, int mode, struct proc *p)
{
@@ -536,6 +561,9 @@ pppxclose(dev_t dev, int flags, int mode, struct proc *p)
mq_purge(&pxd->pxd_svcq);
+ klist_free(&pxd->pxd_rklist);
+ klist_free(&pxd->pxd_wklist);
+
free(pxd, M_DEVBUF, sizeof(*pxd));
return (0);
@@ -875,7 +903,9 @@ pppx_if_output(struct ifnet *ifp, struct mbuf *m, struct sockaddr *dst,
wakeup((caddr_t)pxi->pxi_dev);
pxi->pxi_dev->pxd_waiting = 0;
}
- selwakeup(&pxi->pxi_dev->pxd_rsel);
+ mtx_enter(&pxi->pxi_dev->pxd_mtx);
+ KNOTE(&pxi->pxi_dev->pxd_rklist, 0);
+ mtx_leave(&pxi->pxi_dev->pxd_mtx);
}
}
@@ -921,6 +951,14 @@ pppx_if_ioctl(struct ifnet *ifp, u_long cmd, caddr_t addr)
RBT_GENERATE(pppx_ifs, pppx_if, pxi_entry, pppx_if_cmp);
+/*
+ * Locks used to protect struct members and global data
+ * I immutable after creation
+ * K kernel lock
+ * N net lock
+ * m sc_mtx
+ */
+
struct pppac_softc {
struct ifnet sc_if;
dev_t sc_dev; /* [I] */
@@ -928,10 +966,9 @@ struct pppac_softc {
LIST_ENTRY(pppac_softc)
sc_entry; /* [K] */
- struct mutex sc_rsel_mtx;
- struct selinfo sc_rsel;
- struct mutex sc_wsel_mtx;
- struct selinfo sc_wsel;
+ struct mutex sc_mtx;
+ struct klist sc_rklist; /* [m] */
+ struct klist sc_wklist; /* [m] */
struct pipex_session
*sc_multicast_session;
@@ -944,22 +981,28 @@ LIST_HEAD(pppac_list, pppac_softc); /* [K] */
static void filt_pppac_rdetach(struct knote *);
static int filt_pppac_read(struct knote *, long);
+static int filt_pppac_modify(struct kevent *, struct knote *);
+static int filt_pppac_process(struct knote *, struct kevent *);
static const struct filterops pppac_rd_filtops = {
- .f_flags = FILTEROP_ISFD,
+ .f_flags = FILTEROP_ISFD | FILTEROP_MPSAFE,
.f_attach = NULL,
.f_detach = filt_pppac_rdetach,
- .f_event = filt_pppac_read
+ .f_event = filt_pppac_read,
+ .f_modify = filt_pppac_modify,
+ .f_process = filt_pppac_process,
};
static void filt_pppac_wdetach(struct knote *);
static int filt_pppac_write(struct knote *, long);
static const struct filterops pppac_wr_filtops = {
- .f_flags = FILTEROP_ISFD,
+ .f_flags = FILTEROP_ISFD | FILTEROP_MPSAFE,
.f_attach = NULL,
.f_detach = filt_pppac_wdetach,
- .f_event = filt_pppac_write
+ .f_event = filt_pppac_write,
+ .f_modify = filt_pppac_modify,
+ .f_process = filt_pppac_process,
};
static struct pppac_list pppac_devs = LIST_HEAD_INITIALIZER(pppac_devs);
@@ -1020,8 +1063,9 @@ pppacopen(dev_t dev, int flags, int mode, struct proc *p)
session->ownersc = sc;
sc->sc_multicast_session = session;
- mtx_init(&sc->sc_rsel_mtx, IPL_SOFTNET);
- mtx_init(&sc->sc_wsel_mtx, IPL_SOFTNET);
+ mtx_init(&sc->sc_mtx, IPL_SOFTNET);
+ klist_init_mutex(&sc->sc_rklist, &sc->sc_mtx);
+ klist_init_mutex(&sc->sc_wklist, &sc->sc_mtx);
mq_init(&sc->sc_mq, IFQ_MAXLEN, IPL_SOFTNET);
ifp = &sc->sc_if;
@@ -1205,18 +1249,15 @@ int
pppackqfilter(dev_t dev, struct knote *kn)
{
struct pppac_softc *sc = pppac_lookup(dev);
- struct mutex *mtx;
struct klist *klist;
switch (kn->kn_filter) {
case EVFILT_READ:
- mtx = &sc->sc_rsel_mtx;
- klist = &sc->sc_rsel.si_note;
+ klist = &sc->sc_rklist;
kn->kn_fop = &pppac_rd_filtops;
break;
case EVFILT_WRITE:
- mtx = &sc->sc_wsel_mtx;
- klist = &sc->sc_wsel.si_note;
+ klist = &sc->sc_wklist;
kn->kn_fop = &pppac_wr_filtops;
break;
default:
@@ -1225,9 +1266,7 @@ pppackqfilter(dev_t dev, struct knote *kn)
kn->kn_hook = sc;
- mtx_enter(mtx);
- klist_insert_locked(klist, kn);
- mtx_leave(mtx);
+ klist_insert(klist, kn);
return (0);
}
@@ -1236,11 +1275,8 @@ static void
filt_pppac_rdetach(struct knote *kn)
{
struct pppac_softc *sc = kn->kn_hook;
- struct klist *klist = &sc->sc_rsel.si_note;
- mtx_enter(&sc->sc_rsel_mtx);
- klist_remove_locked(klist, kn);
- mtx_leave(&sc->sc_rsel_mtx);
+ klist_remove(&sc->sc_rklist, kn);
}
static int
@@ -1248,6 +1284,8 @@ filt_pppac_read(struct knote *kn, long hint)
{
struct pppac_softc *sc = kn->kn_hook;
+ MUTEX_ASSERT_LOCKED(&sc->sc_mtx);
+
kn->kn_data = mq_hdatalen(&sc->sc_mq);
return (kn->kn_data > 0);
@@ -1257,11 +1295,8 @@ static void
filt_pppac_wdetach(struct knote *kn)
{
struct pppac_softc *sc = kn->kn_hook;
- struct klist *klist = &sc->sc_wsel.si_note;
- mtx_enter(&sc->sc_wsel_mtx);
- klist_remove_locked(klist, kn);
- mtx_leave(&sc->sc_wsel_mtx);
+ klist_remove(&sc->sc_wklist, kn);
}
static int
@@ -1271,12 +1306,37 @@ filt_pppac_write(struct knote *kn, long hint)
return (1);
}
+static int
+filt_pppac_modify(struct kevent *kev, struct knote *kn)
+{
+ struct pppac_softc *sc = kn->kn_hook;
+ int active;
+
+ mtx_enter(&sc->sc_mtx);
+ active = knote_modify(kev, kn);
+ mtx_leave(&sc->sc_mtx);
+
+ return (active);
+}
+
+static int
+filt_pppac_process(struct knote *kn, struct kevent *kev)
+{
+ struct pppac_softc *sc = kn->kn_hook;
+ int active;
+
+ mtx_enter(&sc->sc_mtx);
+ active = knote_process(kn, kev);
+ mtx_leave(&sc->sc_mtx);
+
+ return (active);
+}
+
int
pppacclose(dev_t dev, int flags, int mode, struct proc *p)
{
struct pppac_softc *sc = pppac_lookup(dev);
struct ifnet *ifp = &sc->sc_if;
- int s;
sc->sc_ready = 0;
@@ -1286,10 +1346,8 @@ pppacclose(dev_t dev, int flags, int mode, struct proc *p)
if_detach(ifp);
- s = splhigh();
- klist_invalidate(&sc->sc_rsel.si_note);
- klist_invalidate(&sc->sc_wsel.si_note);
- splx(s);
+ klist_free(&sc->sc_rklist);
+ klist_free(&sc->sc_wklist);
pool_put(&pipex_session_pool, sc->sc_multicast_session);
pipex_destroy_all_sessions(sc);
@@ -1461,6 +1519,8 @@ bad:
if (!mq_empty(&sc->sc_mq)) {
wakeup(sc);
- selwakeup(&sc->sc_rsel);
+ mtx_enter(&sc->sc_mtx);
+ KNOTE(&sc->sc_rklist, 0);
+ mtx_leave(&sc->sc_mtx);
}
}