diff --git a/configure.in b/configure.in index 4d26034579..7b2b531675 100644 --- a/configure.in +++ b/configure.in @@ -1425,7 +1425,7 @@ PGAC_FUNC_WCSTOMBS_L LIBS_including_readline="$LIBS" LIBS=`echo "$LIBS" | sed -e 's/-ledit//g' -e 's/-lreadline//g'` -AC_CHECK_FUNCS([cbrt clock_gettime dlopen fdatasync getifaddrs getpeerucred getrlimit mbstowcs_l memmove poll posix_fallocate pstat pthread_is_threaded_np readlink setproctitle setsid shm_open symlink sync_file_range utime utimes wcstombs_l]) +AC_CHECK_FUNCS([cbrt clock_gettime dlopen fdatasync getifaddrs getpeerucred getrlimit mbstowcs_l memmove poll posix_fallocate ppoll pstat pthread_is_threaded_np readlink setproctitle setsid shm_open symlink sync_file_range utime utimes wcstombs_l]) AC_REPLACE_FUNCS(fseeko) case $host_os in diff --git a/src/bin/pgbench/pgbench.c b/src/bin/pgbench/pgbench.c index 31ea6ca06e..fb100abaaa 100644 --- a/src/bin/pgbench/pgbench.c +++ b/src/bin/pgbench/pgbench.c @@ -44,9 +44,13 @@ #include #include #include +#ifdef HAVE_PPOLL +#include +#else #ifdef HAVE_SYS_SELECT_H #include #endif +#endif #ifdef HAVE_SYS_RESOURCE_H #include /* for getrlimit */ @@ -83,12 +87,19 @@ static int pthread_join(pthread_t th, void **thread_return); /******************************************************************** * some configurable parameters */ -/* max number of clients allowed */ +#ifdef HAVE_PPOLL /* using ppoll(2) */ +#define SOCKET_WAIT_METHOD "ppoll" +typedef struct pollfd socket_set; +#define MAXCLIENTS -1 /* unlimited number of clients */ +#else /* using select(2) */ +#define SOCKET_WAIT_METHOD "select" +typedef fd_set socket_set; #ifdef FD_SETSIZE -#define MAXCLIENTS (FD_SETSIZE - 10) +#define MAXCLIENTS (FD_SETSIZE - 10) /* system limited max number of clients allowed */ #else -#define MAXCLIENTS 1024 +#define MAXCLIENTS 1024 /* max number of clients allowed */ #endif +#endif /* HAVE_PPOLL */ #define DEFAULT_INIT_STEPS "dtgvp" /* default -I setting */ @@ -502,6 +513,13 @@ static void 
pgbench_error(const char *fmt,...) pg_attribute_printf(1, 2); static void addScript(ParsedScript script); static void *threadRun(void *arg); static void setalarm(int seconds); +static socket_set *alloc_socket_set(int count); +static int error_on_socket(socket_set *sa, int idx, PGconn *con); +static void free_socket_set(socket_set *sa); +static int ignore_socket(socket_set *sa, int idx, PGconn *con); +static void clear_socket_set(socket_set *sa, int count); +static void set_socket(socket_set *sa, int fd, int idx); +static int wait_on_socket_set(socket_set *sa, int nstate, int maxsock, int64 usec); /* callback functions for our flex lexer */ @@ -1071,6 +1089,7 @@ doConnect(void) !have_password) { PQfinish(conn); + conn = NULL; simple_prompt("Password: ", password, sizeof(password), false); have_password = true; new_pass = true; @@ -2704,6 +2723,7 @@ doCustom(TState *thread, CState *st, StatsData *agg) if (INSTR_TIME_IS_ZERO(now)) INSTR_TIME_SET_CURRENT(now); start = now; + if ((st->con = doConnect()) == NULL) { fprintf(stderr, "client %d aborted while establishing connection\n", @@ -4507,7 +4527,7 @@ main(int argc, char **argv) case 'c': benchmarking_option_set = true; nclients = atoi(optarg); - if (nclients <= 0 || nclients > MAXCLIENTS) + if (nclients <= 0 || (MAXCLIENTS != -1 && nclients > MAXCLIENTS)) { fprintf(stderr, "invalid number of clients: \"%s\"\n", optarg); @@ -5189,6 +5209,7 @@ threadRun(void *arg) int64 next_report = last_report + (int64) progress * 1000000; StatsData last, aggs; + socket_set *sockets = alloc_socket_set(nstate); /* * Initialize throttling rate target for all of the thread's clients. 
It @@ -5232,6 +5253,7 @@ threadRun(void *arg) { if ((state[i].con = doConnect()) == NULL) goto done; + set_socket(sockets, PQsocket(state[i].con), i); } } @@ -5248,13 +5270,13 @@ threadRun(void *arg) /* loop till all clients have terminated */ while (remains > 0) { - fd_set input_mask; int maxsock; /* max socket number to be waited for */ int64 min_usec; int64 now_usec = 0; /* set this only if needed */ /* identify which client sockets should be checked for input */ - FD_ZERO(&input_mask); + clear_socket_set(sockets, nstate); + maxsock = -1; min_usec = PG_INT64_MAX; for (i = 0; i < nstate; i++) @@ -5304,7 +5326,7 @@ threadRun(void *arg) goto done; } - FD_SET(sock, &input_mask); + set_socket(sockets, sock, i); if (maxsock < sock) maxsock = sock; } @@ -5341,7 +5363,7 @@ threadRun(void *arg) /* * If no clients are ready to execute actions, sleep until we receive * data from the server, or a nap-time specified in the script ends, - * or it's time to print a progress report. Update input_mask to show + * or it's time to print a progress report. Update sockets to show * which client(s) received data. 
*/ if (min_usec > 0) @@ -5352,11 +5374,7 @@ threadRun(void *arg) { if (maxsock != -1) { - struct timeval timeout; - - timeout.tv_sec = min_usec / 1000000; - timeout.tv_usec = min_usec % 1000000; - nsocks = select(maxsock + 1, &input_mask, NULL, NULL, &timeout); + nsocks = wait_on_socket_set(sockets, nstate, maxsock, min_usec); } else /* nothing active, simple sleep */ { @@ -5365,7 +5383,7 @@ threadRun(void *arg) } else /* no explicit delay, select without timeout */ { - nsocks = select(maxsock + 1, &input_mask, NULL, NULL, NULL); + nsocks = wait_on_socket_set(sockets, nstate, maxsock, 0); } if (nsocks < 0) @@ -5376,7 +5394,7 @@ threadRun(void *arg) continue; } /* must be something wrong */ - fprintf(stderr, "select() failed: %s\n", strerror(errno)); + fprintf(stderr, "%s() failed: %s\n", SOCKET_WAIT_METHOD, strerror(errno)); goto done; } } @@ -5385,7 +5403,7 @@ threadRun(void *arg) /* min_usec == 0, i.e. something needs to be executed */ /* If we didn't call select(), don't try to read any data */ - FD_ZERO(&input_mask); + clear_socket_set(sockets, nstate); } /* ok, advance the state machine of each connection */ @@ -5396,16 +5414,11 @@ threadRun(void *arg) if (st->state == CSTATE_WAIT_RESULT) { /* don't call doCustom unless data is available */ - int sock = PQsocket(st->con); - if (sock < 0) - { - fprintf(stderr, "invalid socket: %s", - PQerrorMessage(st->con)); + if (error_on_socket(sockets, i, st->con)) goto done; - } - if (!FD_ISSET(sock, &input_mask)) + if (ignore_socket(sockets, i, st->con)) continue; } else if (st->state == CSTATE_FINISHED || @@ -5543,9 +5556,118 @@ done: fclose(thread->logfile); thread->logfile = NULL; } + free_socket_set(sockets); + sockets = NULL; return NULL; } +static socket_set * +alloc_socket_set(int count) +{ + return (socket_set *) pg_malloc0(sizeof(socket_set) * ((MAXCLIENTS > 0) ? 
1 : count));
+}
+
+static void
+free_socket_set(socket_set *sa)
+{
+	pg_free(sa);
+}
+
+#ifdef HAVE_PPOLL /* ppoll(2) based socket polling */
+#define POLL_EVENTS (POLLRDHUP|POLLIN|POLLPRI)
+#define POLL_ISSUES (POLLRDHUP|POLLERR|POLLHUP|POLLNVAL)
+
+static int
+error_on_socket(socket_set *sa, int idx, PGconn *con)
+{
+	if (sa[idx].fd == -1 || (PQsocket(con) >= 0 && !(sa[idx].revents & POLL_ISSUES)))
+		return 0;
+	fprintf(stderr, "ppoll() fail - errno: %d, idx: %d, events: %x, %s\n",
+			errno, idx, (sa[idx].revents & POLL_ISSUES),
+			PQerrorMessage(con));
+	return 1;
+}
+
+static int
+ignore_socket(socket_set *sa, int idx, PGconn *con)
+{
+	return (sa[idx].fd != -1 && !sa[idx].revents) ? 1 : 0;
+}
+
+static void
+clear_socket_set(socket_set *sa, int count)
+{
+	int i = 0;
+	for (i = 0; i < count; i++)
+		set_socket(sa, -1, i);	/* fd -1 makes ppoll() skip the slot */
+}
+
+static void
+set_socket(socket_set *sa, int fd, int idx)
+{
+	sa[idx].fd = fd;
+	sa[idx].events = POLL_EVENTS;
+	sa[idx].revents = 0;
+}
+
+static int
+wait_on_socket_set(socket_set *sa, int nstate, int maxsock, int64 usec)
+{
+	struct timespec timeout;
+
+	/* usec == 0 means "no timeout": block until a socket is ready */
+	if (usec <= 0)
+		return ppoll(sa, nstate, NULL, NULL);
+
+	/* split microseconds into whole seconds plus nanoseconds */
+	timeout.tv_sec = usec / 1000000;
+	timeout.tv_nsec = (usec % 1000000) * 1000;
+	return ppoll(sa, nstate, &timeout, NULL);
+}
+#else /* select(2) based socket polling */
+static int
+error_on_socket(socket_set *sa, int idx, PGconn *con)
+{
+	if (PQsocket(con) >= 0) return 0;
+	fprintf(stderr, "invalid socket: %s", PQerrorMessage(con));
+	return 1;	/* invalid socket: tell the caller to give up */
+}
+
+static int
+ignore_socket(socket_set *sa, int idx, PGconn *con)
+{
+	return (!FD_ISSET(PQsocket(con), sa)) ? 1 : 0;
+}
+
+static void
+clear_socket_set(socket_set *sa, int count)
+{
+	FD_ZERO(sa);
+}
+
+static void
+set_socket(socket_set *sa, int fd, int idx)
+{
+	FD_SET(fd, sa);
+}
+
+static int
+wait_on_socket_set(socket_set *sa, int nstate, int maxsock, int64 usec)
+{
+	struct timeval timeout;
+
+	/* usec == 0 means "no timeout": block until a socket is ready */
+	if (usec <= 0)
+		return select(maxsock + 1, sa, NULL, NULL, NULL);
+
+	/* split microseconds into whole seconds plus leftover microseconds */
+	timeout.tv_sec = usec / 1000000;
+	timeout.tv_usec = usec % 1000000;
+
+	return select(maxsock + 1, sa, NULL, NULL, &timeout);
+}
+#endif /* HAVE_PPOLL */
+
 /*
  * Support for duration option: set timer_exceeded after so many seconds.
  */
diff --git a/src/include/pg_config.h.in b/src/include/pg_config.h.in
index f98f773ff0..63207e13fd 100644
--- a/src/include/pg_config.h.in
+++ b/src/include/pg_config.h.in
@@ -409,6 +409,9 @@
 /* Define to 1 if the assembler supports PPC's LWARX mutex hint bit. */
 #undef HAVE_PPC_LWARX_MUTEX_HINT
 
+/* Define to 1 if you have the `ppoll' function. */
+#undef HAVE_PPOLL
+
 /* Define to 1 if you have the `pstat' function. */
 #undef HAVE_PSTAT
 