mirror of https://github.com/yandex/odyssey.git
539 lines
14 KiB
C
539 lines
14 KiB
C
|
|
/*
|
|
* Odyssey.
|
|
*
|
|
* Scalable PostgreSQL connection pooler.
|
|
*/
|
|
|
|
#include <stdlib.h>
|
|
#include <stdarg.h>
|
|
#include <stdint.h>
|
|
#include <stdio.h>
|
|
#include <string.h>
|
|
#include <ctype.h>
|
|
#include <inttypes.h>
|
|
#include <assert.h>
|
|
#include <arpa/inet.h>
|
|
|
|
#include <machinarium.h>
|
|
#include <kiwi.h>
|
|
#include <odyssey.h>
|
|
|
|
void
|
|
od_backend_close(od_server_t *server)
|
|
{
|
|
assert(server->route == NULL);
|
|
assert(server->io.io == NULL);
|
|
assert(server->tls == NULL);
|
|
server->is_transaction = 0;
|
|
server->idle_time = 0;
|
|
kiwi_key_init(&server->key);
|
|
kiwi_key_init(&server->key_client);
|
|
od_relay_free(&server->relay);
|
|
od_io_free(&server->io);
|
|
od_server_free(server);
|
|
}
|
|
|
|
static inline int
|
|
od_backend_terminate(od_server_t *server)
|
|
{
|
|
machine_msg_t *msg;
|
|
msg = kiwi_fe_write_terminate(NULL);
|
|
if (msg == NULL)
|
|
return -1;
|
|
return od_write(&server->io, msg);
|
|
}
|
|
|
|
void
|
|
od_backend_close_connection(od_server_t *server)
|
|
{
|
|
if (machine_connected(server->io.io))
|
|
od_backend_terminate(server);
|
|
|
|
od_io_close(&server->io);
|
|
|
|
if (server->error_connect) {
|
|
machine_msg_free(server->error_connect);
|
|
server->error_connect = NULL;
|
|
}
|
|
|
|
if (server->tls) {
|
|
machine_tls_free(server->tls);
|
|
server->tls = NULL;
|
|
}
|
|
}
|
|
|
|
void
|
|
od_backend_error(od_server_t *server, char *context,
|
|
char *data, uint32_t size)
|
|
{
|
|
od_instance_t *instance = server->global->instance;
|
|
kiwi_fe_error_t error;
|
|
int rc;
|
|
rc = kiwi_fe_read_error(data, size, &error);
|
|
if (rc == -1) {
|
|
od_error(&instance->logger, context, server->client, server,
|
|
"failed to parse error message from server");
|
|
return;
|
|
}
|
|
od_error(&instance->logger, context, server->client, server,
|
|
"%s %s %s",
|
|
error.severity,
|
|
error.code,
|
|
error.message);
|
|
if (error.detail) {
|
|
od_error(&instance->logger, context, server->client, server,
|
|
"DETAIL: %s", error.detail);
|
|
}
|
|
if (error.hint) {
|
|
od_error(&instance->logger, context, server->client, server,
|
|
"HINT: %s", error.hint);
|
|
}
|
|
}
|
|
|
|
int
|
|
od_backend_ready(od_server_t *server, char *data, uint32_t size)
|
|
{
|
|
int status;
|
|
int rc;
|
|
rc = kiwi_fe_read_ready(data, size, &status);
|
|
if (rc == -1)
|
|
return -1;
|
|
if (status == 'I') {
|
|
/* no active transaction */
|
|
server->is_transaction = 0;
|
|
} else
|
|
if (status == 'T' || status == 'E') {
|
|
/* in active transaction or in interrupted
|
|
* transaction block */
|
|
server->is_transaction = 1;
|
|
}
|
|
|
|
/* update server sync reply state */
|
|
od_server_sync_reply(server);
|
|
return 0;
|
|
}
|
|
|
|
static inline int
|
|
od_backend_startup(od_server_t *server, kiwi_params_t *route_params)
|
|
{
|
|
od_instance_t *instance = server->global->instance;
|
|
od_route_t *route = server->route;
|
|
kiwi_fe_arg_t argv[] = {
|
|
{ "user", 5 }, { route->id.user, route->id.user_len },
|
|
{ "database", 9 }, { route->id.database, route->id.database_len },
|
|
{ "replication", 12}, { NULL, 0 }
|
|
};
|
|
int argc = 4;
|
|
if (route->rule->storage->storage_type == OD_RULE_STORAGE_REPLICATION ||
|
|
route->id.physical_rep) {
|
|
argc = 6;
|
|
argv[5].name = "on";
|
|
argv[5].len = 3;
|
|
} else
|
|
if (route->rule->storage->storage_type == OD_RULE_STORAGE_REPLICATION_LOGICAL) {
|
|
argc = 6;
|
|
argv[5].name = "database";
|
|
argv[5].len = 9;
|
|
}
|
|
|
|
machine_msg_t *msg;
|
|
msg = kiwi_fe_write_startup_message(NULL, argc, argv);
|
|
if (msg == NULL)
|
|
return -1;
|
|
int rc;
|
|
rc = od_write(&server->io, msg);
|
|
if (rc == -1) {
|
|
od_error(&instance->logger, "startup", NULL, server,
|
|
"write error: %s",
|
|
od_io_error(&server->io));
|
|
return -1;
|
|
}
|
|
|
|
/* update request count and sync state */
|
|
od_server_sync_request(server, 1);
|
|
|
|
while (1)
|
|
{
|
|
msg = od_read(&server->io, UINT32_MAX);
|
|
if (msg == NULL) {
|
|
od_error(&instance->logger, "startup", NULL, server,
|
|
"read error: %s",
|
|
od_io_error(&server->io));
|
|
return -1;
|
|
}
|
|
kiwi_be_type_t type = *(char*)machine_msg_data(msg);
|
|
od_debug(&instance->logger, "startup", NULL, server, "%s",
|
|
kiwi_be_type_to_string(type));
|
|
|
|
switch (type) {
|
|
case KIWI_BE_READY_FOR_QUERY:
|
|
od_backend_ready(server, machine_msg_data(msg), machine_msg_size(msg));
|
|
machine_msg_free(msg);
|
|
return 0;
|
|
case KIWI_BE_AUTHENTICATION:
|
|
rc = od_auth_backend(server, msg);
|
|
machine_msg_free(msg);
|
|
if (rc == -1)
|
|
return -1;
|
|
break;
|
|
case KIWI_BE_BACKEND_KEY_DATA:
|
|
rc = kiwi_fe_read_key(machine_msg_data(msg),
|
|
machine_msg_size(msg), &server->key);
|
|
machine_msg_free(msg);
|
|
if (rc == -1) {
|
|
od_error(&instance->logger, "startup", NULL, server,
|
|
"failed to parse BackendKeyData message");
|
|
return -1;
|
|
}
|
|
break;
|
|
case KIWI_BE_PARAMETER_STATUS:
|
|
{
|
|
char *name;
|
|
uint32_t name_len;
|
|
char *value;
|
|
uint32_t value_len;
|
|
rc = kiwi_fe_read_parameter(machine_msg_data(msg),
|
|
machine_msg_size(msg), &name, &name_len,
|
|
&value, &value_len);
|
|
if (rc == -1) {
|
|
machine_msg_free(msg);
|
|
od_error(&instance->logger, "startup", NULL, server,
|
|
"failed to parse ParameterStatus message");
|
|
return -1;
|
|
}
|
|
|
|
/* set server parameters */
|
|
kiwi_vars_update(&server->vars, name, name_len, value, value_len);
|
|
|
|
if (route_params) {
|
|
kiwi_param_t *param;
|
|
param = kiwi_param_allocate(name, name_len, value, value_len);
|
|
if (param)
|
|
kiwi_params_add(route_params, param);
|
|
}
|
|
|
|
machine_msg_free(msg);
|
|
break;
|
|
}
|
|
case KIWI_BE_NOTICE_RESPONSE:
|
|
machine_msg_free(msg);
|
|
break;
|
|
case KIWI_BE_ERROR_RESPONSE:
|
|
od_backend_error(server, "startup",
|
|
machine_msg_data(msg),
|
|
machine_msg_size(msg));
|
|
server->error_connect = msg;
|
|
return -1;
|
|
default:
|
|
machine_msg_free(msg);
|
|
od_debug(&instance->logger, "startup", NULL, server,
|
|
"unexpected message: %s",
|
|
kiwi_be_type_to_string(type));
|
|
return -1;
|
|
}
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static inline int
|
|
od_backend_connect_to(od_server_t *server, char *context,
|
|
od_rule_storage_t *storage)
|
|
{
|
|
od_instance_t *instance = server->global->instance;
|
|
assert(server->io.io == NULL);
|
|
|
|
/* create io handle */
|
|
machine_io_t *io;
|
|
io = machine_io_create();
|
|
if (io == NULL)
|
|
return -1;
|
|
|
|
/* set network options */
|
|
machine_set_nodelay(io, instance->config.nodelay);
|
|
if (instance->config.keepalive > 0)
|
|
machine_set_keepalive(io, 1, instance->config.keepalive);
|
|
int rc;
|
|
rc = od_io_prepare(&server->io, io, instance->config.readahead);
|
|
if (rc == -1) {
|
|
od_error(&instance->logger, context, NULL, server,
|
|
"failed to set server io");
|
|
machine_close(io);
|
|
machine_io_free(io);
|
|
return -1;
|
|
}
|
|
|
|
/* set tls options */
|
|
if (storage->tls_mode != OD_RULE_TLS_DISABLE) {
|
|
server->tls = od_tls_backend(storage);
|
|
if (server->tls == NULL)
|
|
return -1;
|
|
}
|
|
|
|
uint64_t time_connect_start = 0;
|
|
if (instance->config.log_session)
|
|
time_connect_start = machine_time_us();
|
|
|
|
struct sockaddr_un saddr_un;
|
|
struct sockaddr_in saddr_v4;
|
|
struct sockaddr_in6 saddr_v6;
|
|
struct sockaddr *saddr;
|
|
struct addrinfo *ai = NULL;
|
|
|
|
/* resolve server address */
|
|
if (storage->host)
|
|
{
|
|
/* assume IPv6 or IPv4 is specified */
|
|
int rc_resolve = -1;
|
|
if (strchr(storage->host, ':')) {
|
|
/* v6 */
|
|
memset(&saddr_v6, 0, sizeof(saddr_v6));
|
|
saddr_v6.sin6_family = AF_INET6;
|
|
saddr_v6.sin6_port = htons(storage->port);
|
|
rc_resolve = inet_pton(AF_INET6, storage->host, &saddr_v6.sin6_addr);
|
|
saddr = (struct sockaddr*)&saddr_v6;
|
|
} else {
|
|
/* v4 or hostname */
|
|
memset(&saddr_v4, 0, sizeof(saddr_v4));
|
|
saddr_v4.sin_family = AF_INET;
|
|
saddr_v4.sin_port = htons(storage->port);
|
|
rc_resolve = inet_pton(AF_INET, storage->host, &saddr_v4.sin_addr);
|
|
saddr = (struct sockaddr*)&saddr_v4;
|
|
}
|
|
|
|
/* schedule getaddrinfo() execution */
|
|
if (rc_resolve != 1) {
|
|
char port[16];
|
|
od_snprintf(port, sizeof(port), "%d", storage->port);
|
|
|
|
rc = machine_getaddrinfo(storage->host, port, NULL, &ai, 0);
|
|
if (rc != 0) {
|
|
od_error(&instance->logger, context, NULL, server,
|
|
"failed to resolve %s:%d",
|
|
storage->host,
|
|
storage->port);
|
|
return -1;
|
|
}
|
|
assert(ai != NULL);
|
|
saddr = ai->ai_addr;
|
|
}
|
|
} else {
|
|
/* set unix socket path */
|
|
memset(&saddr_un, 0, sizeof(saddr_un));
|
|
saddr_un.sun_family = AF_UNIX;
|
|
saddr = (struct sockaddr*)&saddr_un;
|
|
od_snprintf(saddr_un.sun_path, sizeof(saddr_un.sun_path),
|
|
"%s/.s.PGSQL.%d",
|
|
instance->config.unix_socket_dir,
|
|
storage->port);
|
|
}
|
|
|
|
uint64_t time_resolve = 0;
|
|
if (instance->config.log_session)
|
|
time_resolve = machine_time_us() - time_connect_start;
|
|
|
|
/* connect to server */
|
|
rc = machine_connect(server->io.io, saddr, UINT32_MAX);
|
|
if (ai)
|
|
freeaddrinfo(ai);
|
|
if (rc == -1) {
|
|
if (storage->host) {
|
|
od_error(&instance->logger, context, server->client, server,
|
|
"failed to connect to %s:%d", storage->host,
|
|
storage->port);
|
|
} else {
|
|
od_error(&instance->logger, context, server->client, server,
|
|
"failed to connect to %s", saddr_un.sun_path);
|
|
}
|
|
return -1;
|
|
}
|
|
|
|
/* do tls handshake */
|
|
if (storage->tls_mode != OD_RULE_TLS_DISABLE) {
|
|
rc = od_tls_backend_connect(server, &instance->logger, storage);
|
|
if (rc == -1)
|
|
return -1;
|
|
}
|
|
|
|
uint64_t time_connect = 0;
|
|
if (instance->config.log_session)
|
|
time_connect = machine_time_us() - time_connect_start;
|
|
|
|
/* log server connection */
|
|
if (instance->config.log_session) {
|
|
if (storage->host) {
|
|
od_log(&instance->logger, context, server->client, server,
|
|
"new server connection %s:%d (connect time: %d usec, resolve time: %d usec)",
|
|
storage->host,
|
|
storage->port,
|
|
(int)time_connect,
|
|
(int)time_resolve);
|
|
} else {
|
|
od_log(&instance->logger, context, server->client, server,
|
|
"new server connection %s (connect time: %d usec, resolve time: %d usec)",
|
|
saddr_un.sun_path,
|
|
(int)time_connect,
|
|
(int)time_resolve);
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
int
|
|
od_backend_connect(od_server_t *server, char *context, kiwi_params_t *route_params)
|
|
{
|
|
od_route_t *route = server->route;
|
|
assert(route != NULL);
|
|
|
|
od_rule_storage_t *storage;
|
|
storage = route->rule->storage;
|
|
|
|
/* connect to server */
|
|
int rc;
|
|
rc = od_backend_connect_to(server, context, storage);
|
|
if (rc == -1)
|
|
return -1;
|
|
|
|
/* send startup and do initial configuration */
|
|
rc = od_backend_startup(server, route_params);
|
|
return rc;
|
|
}
|
|
|
|
int
|
|
od_backend_connect_cancel(od_server_t *server, od_rule_storage_t *storage,
|
|
kiwi_key_t *key)
|
|
{
|
|
od_instance_t *instance = server->global->instance;
|
|
/* connect to server */
|
|
int rc;
|
|
rc = od_backend_connect_to(server, "cancel", storage);
|
|
if (rc == -1)
|
|
return -1;
|
|
/* send cancel request */
|
|
machine_msg_t *msg;
|
|
msg = kiwi_fe_write_cancel(NULL, key->key_pid, key->key);
|
|
if (msg == NULL)
|
|
return -1;
|
|
rc = od_write(&server->io, msg);
|
|
if (rc == -1) {
|
|
od_error(&instance->logger, "cancel", NULL, NULL,
|
|
"write error: %s",
|
|
od_io_error(&server->io));
|
|
return -1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
int
|
|
od_backend_update_parameter(od_server_t *server, char *context,
|
|
char *data, uint32_t size,
|
|
int server_only)
|
|
{
|
|
od_instance_t *instance = server->global->instance;
|
|
od_client_t *client = server->client;
|
|
|
|
char *name;
|
|
uint32_t name_len;
|
|
char *value;
|
|
uint32_t value_len;
|
|
int rc;
|
|
rc = kiwi_fe_read_parameter(data, size, &name, &name_len,
|
|
&value, &value_len);
|
|
if (rc == -1) {
|
|
od_error(&instance->logger, context, NULL, server,
|
|
"failed to parse ParameterStatus message");
|
|
return -1;
|
|
}
|
|
|
|
/* update server only or client and server parameter */
|
|
od_debug(&instance->logger, context, client, server,
|
|
"%.*s = %.*s",
|
|
name_len, name, value_len, value);
|
|
|
|
if (server_only)
|
|
kiwi_vars_update(&server->vars, name, name_len, value, value_len);
|
|
else
|
|
kiwi_vars_update_both(&client->vars, &server->vars, name, name_len,
|
|
value, value_len);
|
|
return 0;
|
|
}
|
|
|
|
|
|
int
|
|
od_backend_ready_wait(od_server_t *server, char *context, int count,
|
|
uint32_t time_ms)
|
|
{
|
|
od_instance_t *instance = server->global->instance;
|
|
int ready = 0;
|
|
for (;;)
|
|
{
|
|
machine_msg_t *msg;
|
|
msg = od_read(&server->io, time_ms);
|
|
if (msg == NULL) {
|
|
if (! machine_timedout()) {
|
|
od_error(&instance->logger, context, server->client, server,
|
|
"read error: %s",
|
|
od_io_error(&server->io));
|
|
}
|
|
return -1;
|
|
}
|
|
kiwi_be_type_t type = *(char*)machine_msg_data(msg);
|
|
od_debug(&instance->logger, context, server->client, server, "%s",
|
|
kiwi_be_type_to_string(type));
|
|
|
|
if (type == KIWI_BE_PARAMETER_STATUS) {
|
|
/* update server parameter */
|
|
int rc;
|
|
rc = od_backend_update_parameter(server, context,
|
|
machine_msg_data(msg),
|
|
machine_msg_size(msg), 1);
|
|
if (rc == -1) {
|
|
machine_msg_free(msg);
|
|
return -1;
|
|
}
|
|
} else
|
|
if (type == KIWI_BE_ERROR_RESPONSE) {
|
|
od_backend_error(server, context, machine_msg_data(msg),
|
|
machine_msg_size(msg));
|
|
machine_msg_free(msg);
|
|
continue;
|
|
} else
|
|
if (type == KIWI_BE_READY_FOR_QUERY) {
|
|
od_backend_ready(server, machine_msg_data(msg), machine_msg_size(msg));
|
|
ready++;
|
|
if (ready == count) {
|
|
machine_msg_free(msg);
|
|
break;
|
|
}
|
|
}
|
|
machine_msg_free(msg);
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
int
|
|
od_backend_query(od_server_t *server, char *context, char *query, int len)
|
|
{
|
|
od_instance_t *instance = server->global->instance;
|
|
|
|
machine_msg_t *msg;
|
|
msg = kiwi_fe_write_query(NULL, query, len);
|
|
if (msg == NULL)
|
|
return -1;
|
|
int rc;
|
|
rc = od_write(&server->io, msg);
|
|
if (rc == -1) {
|
|
od_error(&instance->logger, context, server->client, server,
|
|
"write error: %s",
|
|
od_io_error(&server->io));
|
|
return -1;
|
|
}
|
|
|
|
/* update server sync state */
|
|
od_server_sync_request(server, 1);
|
|
|
|
rc = od_backend_ready_wait(server, context, 1, UINT32_MAX);
|
|
return rc;
|
|
}
|