/* * ODISSEY. * * PostgreSQL connection pooler and request router. */ #include #include #include #include #include #include #include #include #include #include "od_macro.h" #include "od_version.h" #include "od_list.h" #include "od_pid.h" #include "od_id.h" #include "od_syslog.h" #include "od_log.h" #include "od_daemon.h" #include "od_scheme.h" #include "od_lex.h" #include "od_config.h" #include "od_msg.h" #include "od_system.h" #include "od_instance.h" #include "od_server.h" #include "od_server_pool.h" #include "od_client.h" #include "od_client_pool.h" #include "od_route_id.h" #include "od_route.h" #include "od_route_pool.h" #include "od_io.h" #include "od_router.h" #include "od_pooler.h" #include "od_relay.h" #include "od_frontend.h" #include "od_backend.h" #include "od_auth.h" #include "od_tls.h" #include "od_cancel.h" void od_backend_close(od_server_t *server) { assert(server->route == NULL); if (server->io) { machine_close(server->io); machine_io_free(server->io); server->io = NULL; } if (server->tls) { machine_tls_free(server->tls); server->tls = NULL; } server->is_transaction = 0; server->idle_time = 0; so_keyinit(&server->key); so_keyinit(&server->key_client); od_server_free(server); } int od_backend_terminate(od_server_t *server) { int rc; so_stream_t *stream = &server->stream; so_stream_reset(stream); rc = so_fewrite_terminate(stream); if (rc == -1) return -1; rc = od_write(server->io, stream); if (rc == -1) return -1; server->count_request++; return 0; } void od_backend_error(od_server_t *server, char *state, uint8_t *data, int size) { od_instance_t *instance = server->system->instance; so_feerror_t error; int rc; rc = so_feread_error(&error, data, size); if (rc == -1) { od_error_server(&instance->log, &server->id, state, "failed to parse error message from server"); return; } od_error_server(&instance->log, &server->id, state, "%s %s %s", error.severity, error.code, error.message); if (error.detail) { od_error_server(&instance->log, &server->id, state, "DETAIL: %s", error.detail); } if (error.hint) { od_error_server(&instance->log, &server->id, state, "HINT: %s", error.hint); } } int od_backend_ready(od_server_t *server, uint8_t *data, int size) { int status; int rc; rc = so_feread_ready(&status, data, size); if (rc == -1) return -1; if (status == 'I') { /* no active transaction */ server->is_transaction = 0; } else if (status == 'T' || status == 'E') { /* in active transaction or in interrupted * transaction block */ server->is_transaction = 1; } server->count_reply++; return 0; } static inline int od_backend_ready_wait(od_server_t *server, char *context, int time_ms) { od_instance_t *instance = server->system->instance; so_stream_t *stream = &server->stream; /* wait for response */ while (1) { so_stream_reset(stream); int rc; rc = od_read(server->io, stream, time_ms); if (rc == -1) { if (! machine_timedout()) { od_error_server(&instance->log, &server->id, context, "read error: %s", machine_error(server->io)); } return -1; } int offset = rc; uint8_t type = stream->s[offset]; od_debug_server(&instance->log, &server->id, context, "%c", type); /* ErrorResponse */ if (type == 'E') { od_backend_error(server, context, stream->s, so_stream_used(stream)); } /* ReadyForQuery */ if (type == 'Z') { od_backend_ready(server, stream->s + offset, so_stream_used(stream) - offset); break; } } return 0; } static inline int od_backend_startup(od_server_t *server) { od_instance_t *instance = server->system->instance; od_route_t *route = server->route; so_stream_t *stream = &server->stream; so_stream_reset(stream); so_fearg_t argv[] = { { "user", 5 }, { route->id.user, route->id.user_len }, { "database", 9 }, { route->id.database, route->id.database_len } }; int rc; rc = so_fewrite_startup_message(stream, 4, argv); if (rc == -1) return -1; rc = od_write(server->io, stream); if (rc == -1) { od_error_server(&instance->log, &server->id, "startup", "write error: %s", machine_error(server->io)); return -1; } server->count_request++; while (1) { so_stream_reset(stream); int rc; rc = od_read(server->io, &server->stream, UINT32_MAX); if (rc == -1) { od_error_server(&instance->log, &server->id, "startup", "read error: %s", machine_error(server->io)); return -1; } uint8_t type = *server->stream.s; od_debug_server(&instance->log, &server->id, "startup", "%c", type); switch (type) { /* ReadyForQuery */ case 'Z': od_backend_ready(server, stream->s, so_stream_used(stream)); return 0; /* Authentication */ case 'R': rc = od_auth_backend(server); if (rc == -1) return -1; break; /* BackendKeyData */ case 'K': rc = so_feread_key(&server->key, stream->s, so_stream_used(stream)); if (rc == -1) { od_error_server(&instance->log, &server->id, "startup", "failed to parse BackendKeyData message"); return -1; } break; /* ParameterStatus */ case 'S': break; /* NoticeResponse */ case 'N': break; /* ErrorResponse */ case 'E': od_backend_error(server, "startup", stream->s, so_stream_used(stream)); return -1; default: od_debug_server(&instance->log, &server->id, "startup", "unknown packet: %c", type); return -1; } } return 0; } static int od_backend_connect_to(od_server_t *server, od_schemestorage_t *server_scheme, char *context) { od_instance_t *instance = server->system->instance; assert(server->io == NULL); /* create io handle */ server->io = machine_io_create(); if (server->io == NULL) return -1; /* set network options */ machine_set_nodelay(server->io, instance->scheme.nodelay); if (instance->scheme.keepalive > 0) machine_set_keepalive(server->io, 1, instance->scheme.keepalive); int rc; rc = machine_set_readahead(server->io, instance->scheme.readahead); if (rc == -1) { od_error_server(&instance->log, &server->id, context, "failed to set readahead"); return -1; } /* set tls options */ if (server_scheme->tls_verify != OD_TDISABLE) { server->tls = od_tls_backend(server_scheme); if (server->tls == NULL) return -1; } /* resolve server address */ char port[16]; snprintf(port, sizeof(port), "%d", server_scheme->port); struct addrinfo *ai = NULL; rc = machine_getaddrinfo(server_scheme->host, port, NULL, &ai, 0); if (rc != 0) { od_error_server(&instance->log, &server->id, context, "failed to resolve %s:%d", server_scheme->host, server_scheme->port); return -1; } assert(ai != NULL); /* connect to server */ rc = machine_connect(server->io, ai->ai_addr, UINT32_MAX); freeaddrinfo(ai); if (rc == -1) { od_error_server(&instance->log, &server->id, context, "failed to connect to %s:%d", server_scheme->host, server_scheme->port); return -1; } /* do tls handshake */ if (server_scheme->tls_verify != OD_TDISABLE) { rc = od_tls_backend_connect(server, &instance->log, server_scheme); if (rc == -1) return -1; } return 0; } int od_backend_connect(od_server_t *server) { od_instance_t *instance = server->system->instance; od_route_t *route = server->route; assert(route != NULL); od_schemestorage_t *server_scheme; server_scheme = route->scheme->storage; /* connect to server */ int rc; rc = od_backend_connect_to(server, server_scheme, NULL); if (rc == -1) return -1; /* log server connection */ if (instance->scheme.log_session) { od_log_server(&instance->log, &server->id, NULL, "new server connection %s:%d", server_scheme->host, server_scheme->port); } /* send startup and do initial configuration */ rc = od_backend_startup(server); if (rc == -1) return -1; return 0; } int od_backend_connect_cancel(od_server_t *server, od_schemestorage_t *server_scheme, so_key_t *key) { od_instance_t *instance = server->system->instance; /* connect to server */ int rc; rc = od_backend_connect_to(server, server_scheme, "cancel"); if (rc == -1) return -1; /* send cancel request */ so_stream_reset(&server->stream); rc = so_fewrite_cancel(&server->stream, key->key_pid, key->key); if (rc == -1) return -1; rc = od_write(server->io, &server->stream); if (rc == -1) od_error_server(&instance->log, 0, "cancel", "write error: %s", machine_error(server->io)); return 0; } static inline int od_backend_query(od_server_t *server, char *context, char *query, int len) { od_instance_t *instance = server->system->instance; int rc; so_stream_t *stream = &server->stream; so_stream_reset(stream); rc = so_fewrite_query(stream, query, len); if (rc == -1) return -1; rc = od_write(server->io, stream); if (rc == -1) { od_error_server(&instance->log, &server->id, context, "write error: %s", machine_error(server->io)); return -1; } server->count_request++; rc = od_backend_ready_wait(server, context, UINT32_MAX); if (rc == -1) return -1; return 0; } int od_backend_configure(od_server_t *server, so_bestartup_t *startup) { od_instance_t *instance = server->system->instance; char query_configure[1024]; int size = 0; so_parameter_t *param; so_parameter_t *end; param = (so_parameter_t*)startup->params.buf.s; end = (so_parameter_t*)startup->params.buf.p; for (; param < end; param = so_parameter_next(param)) { if (param == startup->user || param == startup->database) continue; size += snprintf(query_configure + size, sizeof(query_configure) - size, "SET %s=%s;", so_parameter_name(param), so_parameter_value(param)); } if (size == 0) return 0; od_debug_server(&instance->log, &server->id, "configure", "%s", query_configure); int rc; rc = od_backend_query(server, "configure", query_configure, size + 1); return rc; } int od_backend_reset(od_server_t *server) { od_instance_t *instance = server->system->instance; od_route_t *route = server->route; /* server left in copy mode */ if (server->is_copy) { od_debug_server(&instance->log, &server->id, "reset", "in copy, closing"); goto drop; } /* support route rollback off */ if (! route->scheme->rollback) { if (server->is_transaction) { od_debug_server(&instance->log, &server->id, "reset", "in active transaction, closing"); goto drop; } } /* support route cancel off */ if (! route->scheme->cancel) { if (! od_server_is_sync(server)) { od_debug_server(&instance->log, &server->id, "reset", "not synchronized, closing"); goto drop; } } /* Server is not synchronized. * * Number of queries sent to server is not equal * to the number of received replies. Do the following * logic until server becomes synchronized: * * 1. Wait each ReadyForQuery until we receive all * replies with 1 sec timeout. * * 2. Send Cancel in other connection. * * It is possible that client could previously * pipeline server with requests. Each request * may stall database on its own way and may require * additional Cancel request. * * 3. Continue with (1) */ int wait_timeout = 1000; int wait_try = 0; int wait_try_cancel = 0; int wait_cancel_limit = 1; int rc = 0; for (;;) { while (! od_server_is_sync(server)) { od_debug_server(&instance->log, &server->id, "reset", "not synchronized, wait for %d msec (#%d)", wait_timeout, wait_try); wait_try++; rc = od_backend_ready_wait(server, "reset", wait_timeout); if (rc == -1) break; } if (rc == -1) { if (! machine_timedout()) goto error; if (wait_try_cancel == wait_cancel_limit) { od_debug_server(&instance->log, &server->id, "reset", "server cancel limit reached, closing"); goto error; } od_debug_server(&instance->log, &server->id, "reset", "not responded, cancel (#%d)", wait_try_cancel); wait_try_cancel++; rc = od_cancel(server->system, route->scheme->storage, &server->key, &server->id); if (rc == -1) goto error; continue; } assert(od_server_is_sync(server)); break; } od_debug_server(&instance->log, &server->id, "reset", "synchronized"); /* send rollback in case server has an active * transaction running */ if (route->scheme->rollback) { if (server->is_transaction) { char query_rlb[] = "ROLLBACK"; rc = od_backend_query(server, "reset rollback", query_rlb, sizeof(query_rlb)); if (rc == -1) goto error; assert(! server->is_transaction); } } /* ready to use (yet maybe discard is required) */ return 1; drop: return 0; error: return -1; } int od_backend_discard(od_server_t *server) { od_instance_t *instance = server->system->instance; char query_discard[] = "DISCARD ALL"; od_debug_server(&instance->log, &server->id, "discard", "%s", query_discard); return od_backend_query(server, "reset", query_discard, sizeof(query_discard)); }