Skip to content

Commit 1dbd54d

Browse files
committed
multi: reduce Win32 API calls to improve performance
1. Consolidate pre-checks into a single Curl_poll call: This is an attempt to restructure the code in Curl_multi_wait in such a way that less syscalls are made by removing individual calls to Curl_socket_check via SOCKET_READABLE/SOCKET_WRITABLE. 2. Avoid resetting the WinSock event multiple times: We finally call WSAResetEvent anyway, so specifying it as an optional parameter to WSAEnumNetworkEvents is redundant. 3. Wakeup directly in case no sockets are being monitoring: Fix the WinSock based implementation to skip extra waiting by not sleeping in case no sockets are to be waited on and just the WinSock event is being monitored for wakeup functionality. Assisted-by: Tommy Odom Assisted-by: Jay Satiro Bug: curl#6146 Part of curl#6245
1 parent 1346d66 commit 1dbd54d

File tree

1 file changed

+45
-75
lines changed

1 file changed

+45
-75
lines changed

lib/multi.c

+45-75
Original file line numberDiff line numberDiff line change
@@ -1086,12 +1086,10 @@ static CURLMcode multi_wait(struct Curl_multi *multi,
10861086
unsigned int curlfds;
10871087
long timeout_internal;
10881088
int retcode = 0;
1089-
#ifndef USE_WINSOCK
10901089
struct pollfd a_few_on_stack[NUM_POLLS_ON_STACK];
10911090
struct pollfd *ufds = &a_few_on_stack[0];
10921091
bool ufds_malloc = FALSE;
1093-
#else
1094-
struct pollfd pre_poll;
1092+
#ifdef USE_WINSOCK
10951093
WSANETWORKEVENTS wsa_events;
10961094
DEBUGASSERT(multi->wsa_event != WSA_INVALID_EVENT);
10971095
#endif
@@ -1149,7 +1147,6 @@ static CURLMcode multi_wait(struct Curl_multi *multi,
11491147
}
11501148
#endif
11511149

1152-
#ifndef USE_WINSOCK
11531150
if(nfds > NUM_POLLS_ON_STACK) {
11541151
/* 'nfds' is a 32 bit value and 'struct pollfd' is typically 8 bytes
11551152
big, so at 2^29 sockets this value might wrap. When a process gets
@@ -1160,9 +1157,7 @@ static CURLMcode multi_wait(struct Curl_multi *multi,
11601157
return CURLM_OUT_OF_MEMORY;
11611158
ufds_malloc = TRUE;
11621159
}
1163-
11641160
nfds = 0;
1165-
#endif
11661161

11671162
/* only do the second loop if we found descriptors in the first stage run
11681163
above */
@@ -1180,34 +1175,31 @@ static CURLMcode multi_wait(struct Curl_multi *multi,
11801175
#endif
11811176
if(bitmap & GETSOCK_READSOCK(i)) {
11821177
#ifdef USE_WINSOCK
1183-
if(timeout_ms && SOCKET_READABLE(sockbunch[i], 0) > 0)
1184-
timeout_ms = 0;
11851178
mask |= FD_READ|FD_ACCEPT|FD_CLOSE;
1186-
#else
1179+
#endif
11871180
ufds[nfds].fd = sockbunch[i];
11881181
ufds[nfds].events = POLLIN;
11891182
++nfds;
1190-
#endif
11911183
s = sockbunch[i];
11921184
}
11931185
if(bitmap & GETSOCK_WRITESOCK(i)) {
11941186
#ifdef USE_WINSOCK
1195-
if(timeout_ms && SOCKET_WRITABLE(sockbunch[i], 0) > 0)
1196-
timeout_ms = 0;
11971187
mask |= FD_WRITE|FD_CONNECT|FD_CLOSE;
1198-
#else
1188+
#endif
11991189
ufds[nfds].fd = sockbunch[i];
12001190
ufds[nfds].events = POLLOUT;
12011191
++nfds;
1202-
#endif
12031192
s = sockbunch[i];
12041193
}
12051194
if(s == CURL_SOCKET_BAD) {
12061195
break;
12071196
}
12081197
#ifdef USE_WINSOCK
1209-
if(WSAEventSelect(s, multi->wsa_event, mask) != 0)
1198+
if(WSAEventSelect(s, multi->wsa_event, mask) != 0) {
1199+
if(ufds_malloc)
1200+
free(ufds);
12101201
return CURLM_INTERNAL_ERROR;
1202+
}
12111203
#endif
12121204
}
12131205

@@ -1219,35 +1211,18 @@ static CURLMcode multi_wait(struct Curl_multi *multi,
12191211
for(i = 0; i < extra_nfds; i++) {
12201212
#ifdef USE_WINSOCK
12211213
long mask = 0;
1222-
extra_fds[i].revents = 0;
1223-
pre_poll.fd = extra_fds[i].fd;
1224-
pre_poll.events = 0;
1225-
pre_poll.revents = 0;
1226-
if(extra_fds[i].events & CURL_WAIT_POLLIN) {
1214+
if(extra_fds[i].events & CURL_WAIT_POLLIN)
12271215
mask |= FD_READ|FD_ACCEPT|FD_CLOSE;
1228-
pre_poll.events |= POLLIN;
1229-
}
1230-
if(extra_fds[i].events & CURL_WAIT_POLLPRI) {
1216+
if(extra_fds[i].events & CURL_WAIT_POLLPRI)
12311217
mask |= FD_OOB;
1232-
pre_poll.events |= POLLPRI;
1233-
}
1234-
if(extra_fds[i].events & CURL_WAIT_POLLOUT) {
1218+
if(extra_fds[i].events & CURL_WAIT_POLLOUT)
12351219
mask |= FD_WRITE|FD_CONNECT|FD_CLOSE;
1236-
pre_poll.events |= POLLOUT;
1237-
}
1238-
if(Curl_poll(&pre_poll, 1, 0) > 0) {
1239-
if(pre_poll.revents & POLLIN)
1240-
extra_fds[i].revents |= CURL_WAIT_POLLIN;
1241-
if(pre_poll.revents & POLLPRI)
1242-
extra_fds[i].revents |= CURL_WAIT_POLLPRI;
1243-
if(pre_poll.revents & POLLOUT)
1244-
extra_fds[i].revents |= CURL_WAIT_POLLOUT;
1245-
if(extra_fds[i].revents)
1246-
timeout_ms = 0;
1247-
}
1248-
if(WSAEventSelect(extra_fds[i].fd, multi->wsa_event, mask) != 0)
1220+
if(WSAEventSelect(extra_fds[i].fd, multi->wsa_event, mask) != 0) {
1221+
if(ufds_malloc)
1222+
free(ufds);
12491223
return CURLM_INTERNAL_ERROR;
1250-
#else
1224+
}
1225+
#endif
12511226
ufds[nfds].fd = extra_fds[i].fd;
12521227
ufds[nfds].events = 0;
12531228
if(extra_fds[i].events & CURL_WAIT_POLLIN)
@@ -1257,7 +1232,6 @@ static CURLMcode multi_wait(struct Curl_multi *multi,
12571232
if(extra_fds[i].events & CURL_WAIT_POLLOUT)
12581233
ufds[nfds].events |= POLLOUT;
12591234
++nfds;
1260-
#endif
12611235
}
12621236

12631237
#ifdef ENABLE_WAKEUP
@@ -1270,53 +1244,59 @@ static CURLMcode multi_wait(struct Curl_multi *multi,
12701244
#endif
12711245
#endif
12721246

1247+
#if defined(ENABLE_WAKEUP) && defined(USE_WINSOCK)
1248+
if(nfds || use_wakeup) {
1249+
#else
12731250
if(nfds) {
1274-
/* wait... */
1251+
#endif
1252+
int pollrc;
12751253
#ifdef USE_WINSOCK
1276-
WSAWaitForMultipleEvents(1, &multi->wsa_event, FALSE, timeout_ms, FALSE);
1254+
if(nfds)
1255+
pollrc = Curl_poll(ufds, nfds, 0); /* just pre-check with WinSock */
1256+
else
1257+
pollrc = 0;
1258+
if(pollrc <= 0) /* now wait... if not ready during the pre-check above */
1259+
WSAWaitForMultipleEvents(1, &multi->wsa_event, FALSE, timeout_ms, FALSE);
12771260
#else
1278-
int pollrc = Curl_poll(ufds, nfds, timeout_ms);
1261+
pollrc = Curl_poll(ufds, nfds, timeout_ms); /* wait... */
12791262
#endif
12801263

1281-
#ifdef USE_WINSOCK
1282-
/* With Winsock, we have to run this unconditionally to call
1283-
WSAEventSelect(fd, event, 0) on all the sockets */
1284-
{
1285-
retcode = 0;
1286-
#else
12871264
if(pollrc > 0) {
12881265
retcode = pollrc;
1266+
#ifdef USE_WINSOCK
1267+
}
1268+
/* With WinSock, we have to run the following section unconditionally
1269+
to call WSAEventSelect(fd, event, 0) on all the sockets */
1270+
{
12891271
#endif
12901272
/* copy revents results from the poll to the curl_multi_wait poll
12911273
struct, the bit values of the actual underlying poll() implementation
12921274
may not be the same as the ones in the public libcurl API! */
12931275
for(i = 0; i < extra_nfds; i++) {
1276+
unsigned r = ufds[curlfds + i].revents;
12941277
unsigned short mask = 0;
12951278
#ifdef USE_WINSOCK
12961279
wsa_events.lNetworkEvents = 0;
1297-
mask = extra_fds[i].revents;
1298-
if(WSAEnumNetworkEvents(extra_fds[i].fd, multi->wsa_event,
1299-
&wsa_events) == 0) {
1280+
if(WSAEnumNetworkEvents(extra_fds[i].fd, NULL, &wsa_events) == 0) {
13001281
if(wsa_events.lNetworkEvents & (FD_READ|FD_ACCEPT|FD_CLOSE))
13011282
mask |= CURL_WAIT_POLLIN;
13021283
if(wsa_events.lNetworkEvents & (FD_WRITE|FD_CONNECT|FD_CLOSE))
13031284
mask |= CURL_WAIT_POLLOUT;
13041285
if(wsa_events.lNetworkEvents & FD_OOB)
13051286
mask |= CURL_WAIT_POLLPRI;
1306-
if(ret && wsa_events.lNetworkEvents != 0)
1287+
if(ret && pollrc <= 0 && wsa_events.lNetworkEvents != 0)
13071288
retcode++;
13081289
}
13091290
WSAEventSelect(extra_fds[i].fd, multi->wsa_event, 0);
1310-
#else
1311-
unsigned r = ufds[curlfds + i].revents;
1312-
1291+
if(pollrc <= 0)
1292+
continue;
1293+
#endif
13131294
if(r & POLLIN)
13141295
mask |= CURL_WAIT_POLLIN;
13151296
if(r & POLLOUT)
13161297
mask |= CURL_WAIT_POLLOUT;
13171298
if(r & POLLPRI)
13181299
mask |= CURL_WAIT_POLLPRI;
1319-
#endif
13201300
extra_fds[i].revents = mask;
13211301
}
13221302

@@ -1331,17 +1311,8 @@ static CURLMcode multi_wait(struct Curl_multi *multi,
13311311
for(i = 0; i < MAX_SOCKSPEREASYHANDLE; i++) {
13321312
if(bitmap & (GETSOCK_READSOCK(i) | GETSOCK_WRITESOCK(i))) {
13331313
wsa_events.lNetworkEvents = 0;
1334-
if(WSAEnumNetworkEvents(sockbunch[i], multi->wsa_event,
1335-
&wsa_events) == 0) {
1336-
if(ret && wsa_events.lNetworkEvents != 0)
1337-
retcode++;
1338-
}
1339-
if(ret && !timeout_ms && wsa_events.lNetworkEvents == 0) {
1340-
if((bitmap & GETSOCK_READSOCK(i)) &&
1341-
SOCKET_READABLE(sockbunch[i], 0) > 0)
1342-
retcode++;
1343-
else if((bitmap & GETSOCK_WRITESOCK(i)) &&
1344-
SOCKET_WRITABLE(sockbunch[i], 0) > 0)
1314+
if(WSAEnumNetworkEvents(sockbunch[i], NULL, &wsa_events) == 0) {
1315+
if(ret && pollrc <= 0 && wsa_events.lNetworkEvents != 0)
13451316
retcode++;
13461317
}
13471318
WSAEventSelect(sockbunch[i], multi->wsa_event, 0);
@@ -1382,16 +1353,15 @@ static CURLMcode multi_wait(struct Curl_multi *multi,
13821353
}
13831354
}
13841355

1385-
#ifndef USE_WINSOCK
13861356
if(ufds_malloc)
13871357
free(ufds);
1388-
#endif
13891358
if(ret)
13901359
*ret = retcode;
1391-
if(!extrawait || nfds)
1392-
/* if any socket was checked */
1393-
;
1394-
else {
1360+
#if defined(ENABLE_WAKEUP) && defined(USE_WINSOCK)
1361+
if(extrawait && !nfds && !use_wakeup) {
1362+
#else
1363+
if(extrawait && !nfds) {
1364+
#endif
13951365
long sleep_ms = 0;
13961366

13971367
/* Avoid busy-looping when there's nothing particular to wait for */

0 commit comments

Comments
 (0)