blob: cedaf7e024b4615f5fc75cab05568d56a2daa43c [file] [log] [blame]
David K. Bainbridgee05cf0c2021-08-19 03:16:50 +00001// Copyright 2020 The Go Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style
3// license that can be found in the LICENSE file.
4
5//go:build zos && s390x
6// +build zos,s390x
7
8package unix
9
10import (
11 "sync"
12)
13
14// This file simulates epoll on z/OS using poll.
15
16// Analogous to epoll_event on Linux.
17// TODO(neeilan): Pad is because the Linux kernel expects a 96-bit struct. We never pass this to the kernel; remove?
18type EpollEvent struct {
19 Events uint32
20 Fd int32
21 Pad int32
22}
23
24const (
25 EPOLLERR = 0x8
26 EPOLLHUP = 0x10
27 EPOLLIN = 0x1
28 EPOLLMSG = 0x400
29 EPOLLOUT = 0x4
30 EPOLLPRI = 0x2
31 EPOLLRDBAND = 0x80
32 EPOLLRDNORM = 0x40
33 EPOLLWRBAND = 0x200
34 EPOLLWRNORM = 0x100
35 EPOLL_CTL_ADD = 0x1
36 EPOLL_CTL_DEL = 0x2
37 EPOLL_CTL_MOD = 0x3
38 // The following constants are part of the epoll API, but represent
39 // currently unsupported functionality on z/OS.
40 // EPOLL_CLOEXEC = 0x80000
41 // EPOLLET = 0x80000000
42 // EPOLLONESHOT = 0x40000000
43 // EPOLLRDHUP = 0x2000 // Typically used with edge-triggered notis
44 // EPOLLEXCLUSIVE = 0x10000000 // Exclusive wake-up mode
45 // EPOLLWAKEUP = 0x20000000 // Relies on Linux's BLOCK_SUSPEND capability
46)
47
48// TODO(neeilan): We can eliminate these epToPoll / pToEpoll calls by using identical mask values for POLL/EPOLL
49// constants where possible The lower 16 bits of epoll events (uint32) can fit any system poll event (int16).
50
51// epToPollEvt converts epoll event field to poll equivalent.
52// In epoll, Events is a 32-bit field, while poll uses 16 bits.
53func epToPollEvt(events uint32) int16 {
54 var ep2p = map[uint32]int16{
55 EPOLLIN: POLLIN,
56 EPOLLOUT: POLLOUT,
57 EPOLLHUP: POLLHUP,
58 EPOLLPRI: POLLPRI,
59 EPOLLERR: POLLERR,
60 }
61
62 var pollEvts int16 = 0
63 for epEvt, pEvt := range ep2p {
64 if (events & epEvt) != 0 {
65 pollEvts |= pEvt
66 }
67 }
68
69 return pollEvts
70}
71
72// pToEpollEvt converts 16 bit poll event bitfields to 32-bit epoll event fields.
73func pToEpollEvt(revents int16) uint32 {
74 var p2ep = map[int16]uint32{
75 POLLIN: EPOLLIN,
76 POLLOUT: EPOLLOUT,
77 POLLHUP: EPOLLHUP,
78 POLLPRI: EPOLLPRI,
79 POLLERR: EPOLLERR,
80 }
81
82 var epollEvts uint32 = 0
83 for pEvt, epEvt := range p2ep {
84 if (revents & pEvt) != 0 {
85 epollEvts |= epEvt
86 }
87 }
88
89 return epollEvts
90}
91
92// Per-process epoll implementation.
93type epollImpl struct {
94 mu sync.Mutex
95 epfd2ep map[int]*eventPoll
96 nextEpfd int
97}
98
99// eventPoll holds a set of file descriptors being watched by the process. A process can have multiple epoll instances.
100// On Linux, this is an in-kernel data structure accessed through a fd.
101type eventPoll struct {
102 mu sync.Mutex
103 fds map[int]*EpollEvent
104}
105
106// epoll impl for this process.
107var impl epollImpl = epollImpl{
108 epfd2ep: make(map[int]*eventPoll),
109 nextEpfd: 0,
110}
111
112func (e *epollImpl) epollcreate(size int) (epfd int, err error) {
113 e.mu.Lock()
114 defer e.mu.Unlock()
115 epfd = e.nextEpfd
116 e.nextEpfd++
117
118 e.epfd2ep[epfd] = &eventPoll{
119 fds: make(map[int]*EpollEvent),
120 }
121 return epfd, nil
122}
123
124func (e *epollImpl) epollcreate1(flag int) (fd int, err error) {
125 return e.epollcreate(4)
126}
127
128func (e *epollImpl) epollctl(epfd int, op int, fd int, event *EpollEvent) (err error) {
129 e.mu.Lock()
130 defer e.mu.Unlock()
131
132 ep, ok := e.epfd2ep[epfd]
133 if !ok {
134
135 return EBADF
136 }
137
138 switch op {
139 case EPOLL_CTL_ADD:
140 // TODO(neeilan): When we make epfds and fds disjoint, detect epoll
141 // loops here (instances watching each other) and return ELOOP.
142 if _, ok := ep.fds[fd]; ok {
143 return EEXIST
144 }
145 ep.fds[fd] = event
146 case EPOLL_CTL_MOD:
147 if _, ok := ep.fds[fd]; !ok {
148 return ENOENT
149 }
150 ep.fds[fd] = event
151 case EPOLL_CTL_DEL:
152 if _, ok := ep.fds[fd]; !ok {
153 return ENOENT
154 }
155 delete(ep.fds, fd)
156
157 }
158 return nil
159}
160
161// Must be called while holding ep.mu
162func (ep *eventPoll) getFds() []int {
163 fds := make([]int, len(ep.fds))
164 for fd := range ep.fds {
165 fds = append(fds, fd)
166 }
167 return fds
168}
169
170func (e *epollImpl) epollwait(epfd int, events []EpollEvent, msec int) (n int, err error) {
171 e.mu.Lock() // in [rare] case of concurrent epollcreate + epollwait
172 ep, ok := e.epfd2ep[epfd]
173
174 if !ok {
175 e.mu.Unlock()
176 return 0, EBADF
177 }
178
179 pollfds := make([]PollFd, 4)
180 for fd, epollevt := range ep.fds {
181 pollfds = append(pollfds, PollFd{Fd: int32(fd), Events: epToPollEvt(epollevt.Events)})
182 }
183 e.mu.Unlock()
184
185 n, err = Poll(pollfds, msec)
186 if err != nil {
187 return n, err
188 }
189
190 i := 0
191 for _, pFd := range pollfds {
192 if pFd.Revents != 0 {
193 events[i] = EpollEvent{Fd: pFd.Fd, Events: pToEpollEvt(pFd.Revents)}
194 i++
195 }
196
197 if i == n {
198 break
199 }
200 }
201
202 return n, nil
203}
204
205func EpollCreate(size int) (fd int, err error) {
206 return impl.epollcreate(size)
207}
208
209func EpollCreate1(flag int) (fd int, err error) {
210 return impl.epollcreate1(flag)
211}
212
213func EpollCtl(epfd int, op int, fd int, event *EpollEvent) (err error) {
214 return impl.epollctl(epfd, op, fd, event)
215}
216
217// Because EpollWait mutates events, the caller is expected to coordinate
218// concurrent access if calling with the same epfd from multiple goroutines.
219func EpollWait(epfd int, events []EpollEvent, msec int) (n int, err error) {
220 return impl.epollwait(epfd, events, msec)
221}