blob: 8e1226ba8ea1e4e8a6b9b3057a0d96f33084c529 [file] [log] [blame]
// SPDX-License-Identifier: LGPL-2.1
/*
* trace-msg.c : define message protocol for communication between clients and
* a server
*
* Copyright (C) 2013 Hitachi, Ltd.
* Created by Yoshihiro YUNOMAE <yoshihiro.yunomae.ez@hitachi.com>
*
*/
#include <errno.h>
#include <poll.h>
#include <fcntl.h>
#include <limits.h>
#include <stddef.h>
#include <stdio.h>
#include <stdlib.h>
#include <stdarg.h>
#include <unistd.h>
#include <arpa/inet.h>
#include <sys/types.h>
#include <linux/types.h>
#include "trace-cmd-local.h"
#include "trace-local.h"
#include "trace-msg.h"
typedef __u32 u32;
typedef __be32 be32;
static inline void dprint(const char *fmt, ...)
{
va_list ap;
if (!debug)
return;
va_start(ap, fmt);
vprintf(fmt, ap);
va_end(ap);
}
/* Two (4k) pages is the max transfer for now */
#define MSG_MAX_LEN 8192
#define MSG_HDR_LEN sizeof(struct tracecmd_msg_header)
#define MSG_DATA_LEN (MSG_MAX_LEN - MSG_HDR_LEN)
/* - header size for error msg */
#define MSG_META_MAX_LEN (MSG_MAX_LEN - MIN_META_SIZE)
#define MIN_TINIT_SIZE (sizeof(struct tracecmd_msg_header) + \
sizeof(struct tracecmd_msg_tinit))
/* Not really the minimum, but I couldn't think of a better name */
#define MIN_RINIT_SIZE (sizeof(struct tracecmd_msg_header) + \
sizeof(struct tracecmd_msg_rinit))
#define MIN_META_SIZE (sizeof(struct tracecmd_msg_header) + \
sizeof(struct tracecmd_msg_meta))
unsigned int page_size;
struct tracecmd_msg_server {
struct tracecmd_msg_handle handle;
int done;
};
static struct tracecmd_msg_server *
make_server(struct tracecmd_msg_handle *msg_handle)
{
if (!(msg_handle->flags & TRACECMD_MSG_FL_SERVER)) {
plog("Message handle not of type server\n");
return NULL;
}
return (struct tracecmd_msg_server *)msg_handle;
}
struct tracecmd_msg_opt {
be32 size;
be32 opt_cmd;
be32 padding; /* for backward compatibility */
};
struct tracecmd_msg_tinit {
be32 cpus;
be32 page_size;
be32 opt_num;
} __attribute__((packed));
struct tracecmd_msg_rinit {
be32 cpus;
} __attribute__((packed));
struct tracecmd_msg_meta {
be32 size;
} __attribute__((packed));
struct tracecmd_msg_header {
be32 size;
be32 cmd;
} __attribute__((packed));
#define MSG_MAP \
C(UNUSED_0, 0, -1), \
C(CLOSE, 1, 0), \
C(USUSED_2, 2, -1), \
C(UNUSED_3, 3, -1), \
C(TINIT, 4, MIN_TINIT_SIZE), \
C(RINIT, 5, MIN_RINIT_SIZE), \
C(SENDMETA, 6, MIN_META_SIZE), \
C(FINMETA, 7, 0),
#undef C
#define C(a,b,c) MSG_##a = b
enum tracecmd_msg_cmd {
MSG_MAP
};
#undef C
#define C(a,b,c) c
static be32 msg_min_sizes[] = { MSG_MAP };
#undef C
#define C(a,b,c) #a
static const char *msg_names[] = { MSG_MAP };
static const char *cmd_to_name(int cmd)
{
if (cmd <= MSG_FINMETA)
return msg_names[cmd];
return "Unkown";
}
struct tracecmd_msg {
struct tracecmd_msg_header hdr;
union {
struct tracecmd_msg_tinit tinit;
struct tracecmd_msg_rinit rinit;
struct tracecmd_msg_meta meta;
};
union {
struct tracecmd_msg_opt *opt;
be32 *port_array;
void *buf;
};
} __attribute__((packed));
struct tracecmd_msg *errmsg;
static int msg_write(int fd, struct tracecmd_msg *msg)
{
int cmd = ntohl(msg->hdr.cmd);
int size;
int ret;
if (cmd > MSG_FINMETA)
return -EINVAL;
dprint("msg send: %d (%s)\n", cmd, cmd_to_name(cmd));
size = msg_min_sizes[cmd];
if (!size)
size = ntohl(msg->hdr.size);
ret = __do_write_check(fd, msg, size);
if (ret < 0)
return ret;
if (ntohl(msg->hdr.size) <= size)
return 0;
return __do_write_check(fd, msg->buf, ntohl(msg->hdr.size) - size);
}
enum msg_opt_command {
MSGOPT_USETCP = 1,
};
static int make_tinit(struct tracecmd_msg_handle *msg_handle,
struct tracecmd_msg *msg)
{
struct tracecmd_msg_opt *opt;
int cpu_count = msg_handle->cpu_count;
int opt_num = 0;
int size = MIN_TINIT_SIZE;
if (msg_handle->flags & TRACECMD_MSG_FL_USE_TCP) {
opt_num++;
opt = malloc(sizeof(*opt));
if (!opt)
return -ENOMEM;
opt->size = htonl(sizeof(*opt));
opt->opt_cmd = htonl(MSGOPT_USETCP);
msg->opt = opt;
size += sizeof(*opt);
}
msg->tinit.cpus = htonl(cpu_count);
msg->tinit.page_size = htonl(page_size);
msg->tinit.opt_num = htonl(opt_num);
msg->hdr.size = htonl(size);
return 0;
}
static int make_rinit(struct tracecmd_msg *msg, int total_cpus, int *ports)
{
int size = MIN_RINIT_SIZE;
be32 *ptr;
be32 port;
int i;
msg->rinit.cpus = htonl(total_cpus);
msg->port_array = malloc(sizeof(*ports) * total_cpus);
if (!msg->port_array)
return -ENOMEM;
size += sizeof(*ports) * total_cpus;
ptr = msg->port_array;
for (i = 0; i < total_cpus; i++) {
/* + rrqports->cpus or rrqports->port_array[i] */
port = htonl(ports[i]);
*ptr = port;
ptr++;
}
msg->hdr.size = htonl(size);
return 0;
}
static void tracecmd_msg_init(u32 cmd, struct tracecmd_msg *msg)
{
memset(msg, 0, sizeof(*msg));
msg->hdr.cmd = htonl(cmd);
if (!msg_min_sizes[cmd])
msg->hdr.size = htonl(MSG_HDR_LEN);
else
msg->hdr.size = htonl(msg_min_sizes[cmd]);
}
static void msg_free(struct tracecmd_msg *msg)
{
int cmd = ntohl(msg->hdr.cmd);
/* If a min size is defined, then the buf needs to be freed */
if (cmd < MSG_FINMETA && (msg_min_sizes[cmd] > 0))
free(msg->buf);
memset(msg, 0, sizeof(*msg));
}
static int tracecmd_msg_send(int fd, struct tracecmd_msg *msg)
{
int ret = 0;
ret = msg_write(fd, msg);
if (ret < 0)
ret = -ECOMM;
msg_free(msg);
return ret;
}
static int msg_read(int fd, void *buf, u32 size, int *n)
{
ssize_t r;
while (size) {
r = read(fd, buf + *n, size);
if (r < 0) {
if (errno == EINTR)
continue;
return -errno;
} else if (!r)
return -ENOTCONN;
size -= r;
*n += r;
}
return 0;
}
static int msg_read_extra(int fd, struct tracecmd_msg *msg,
int *n, int size)
{
u32 cmd;
int rsize;
int ret;
cmd = ntohl(msg->hdr.cmd);
if (cmd > MSG_FINMETA)
return -EINVAL;
rsize = msg_min_sizes[cmd] - *n;
if (rsize <= 0)
return 0;
ret = msg_read(fd, msg, rsize, n);
if (ret < 0)
return ret;
if (size > *n) {
size -= *n;
msg->buf = malloc(size);
if (!msg->buf)
return -ENOMEM;
*n = 0;
return msg_read(fd, msg->buf, size, n);
}
return 0;
}
/*
* Read header information of msg first, then read all data
*/
static int tracecmd_msg_recv(int fd, struct tracecmd_msg *msg)
{
u32 size = 0;
int n = 0;
int ret;
ret = msg_read(fd, msg, MSG_HDR_LEN, &n);
if (ret < 0)
return ret;
dprint("msg received: %d (%s)\n",
ntohl(msg->hdr.cmd), cmd_to_name(ntohl(msg->hdr.cmd)));
size = ntohl(msg->hdr.size);
if (size > MSG_MAX_LEN)
/* too big */
goto error;
else if (size < MSG_HDR_LEN)
/* too small */
goto error;
else if (size > MSG_HDR_LEN)
return msg_read_extra(fd, msg, &n, size);
return 0;
error:
plog("Receive an invalid message(size=%d)\n", size);
return -ENOMSG;
}
#define MSG_WAIT_MSEC 5000
static int msg_wait_to = MSG_WAIT_MSEC;
bool tracecmd_msg_done(struct tracecmd_msg_handle *msg_handle)
{
struct tracecmd_msg_server *msg_server = make_server(msg_handle);
return (volatile int)msg_server->done;
}
void tracecmd_msg_set_done(struct tracecmd_msg_handle *msg_handle)
{
struct tracecmd_msg_server *msg_server = make_server(msg_handle);
msg_server->done = true;
}
/*
* A return value of 0 indicates time-out
*/
static int tracecmd_msg_recv_wait(int fd, struct tracecmd_msg *msg)
{
struct pollfd pfd;
int ret;
pfd.fd = fd;
pfd.events = POLLIN;
ret = poll(&pfd, 1, debug ? -1 : msg_wait_to);
if (ret < 0)
return -errno;
else if (ret == 0)
return -ETIMEDOUT;
return tracecmd_msg_recv(fd, msg);
}
static int tracecmd_msg_wait_for_msg(int fd, struct tracecmd_msg *msg)
{
u32 cmd;
int ret;
ret = tracecmd_msg_recv_wait(fd, msg);
if (ret < 0) {
if (ret == -ETIMEDOUT)
warning("Connection timed out\n");
return ret;
}
cmd = ntohl(msg->hdr.cmd);
if (cmd == MSG_CLOSE)
return -ECONNABORTED;
return 0;
}
int tracecmd_msg_send_init_data(struct tracecmd_msg_handle *msg_handle,
int **client_ports)
{
struct tracecmd_msg send_msg;
struct tracecmd_msg recv_msg;
int fd = msg_handle->fd;
int *ports;
int i, cpus;
int ret;
*client_ports = NULL;
tracecmd_msg_init(MSG_TINIT, &send_msg);
ret = make_tinit(msg_handle, &send_msg);
if (ret < 0)
return ret;
ret = tracecmd_msg_send(fd, &send_msg);
if (ret < 0)
return ret;
ret = tracecmd_msg_wait_for_msg(fd, &recv_msg);
if (ret < 0)
return ret;
if (ntohl(recv_msg.hdr.cmd) != MSG_RINIT)
return -EINVAL;
cpus = ntohl(recv_msg.rinit.cpus);
ports = malloc_or_die(sizeof(int) * cpus);
for (i = 0; i < cpus; i++)
ports[i] = ntohl(recv_msg.port_array[i]);
*client_ports = ports;
return 0;
}
static bool process_option(struct tracecmd_msg_handle *msg_handle,
struct tracecmd_msg_opt *opt)
{
/* currently the only option we have is to us TCP */
if (ntohl(opt->opt_cmd) == MSGOPT_USETCP) {
msg_handle->flags |= TRACECMD_MSG_FL_USE_TCP;
return true;
}
return false;
}
static void error_operation_for_server(struct tracecmd_msg *msg)
{
u32 cmd;
cmd = ntohl(msg->hdr.cmd);
warning("Message: cmd=%d size=%d\n", cmd, ntohl(msg->hdr.size));
}
struct tracecmd_msg_handle *
tracecmd_msg_handle_alloc(int fd, unsigned long flags)
{
struct tracecmd_msg_handle *handle;
int size;
if (flags == TRACECMD_MSG_FL_SERVER)
size = sizeof(struct tracecmd_msg_server);
else
size = sizeof(struct tracecmd_msg_handle);
handle = calloc(1, size);
if (!handle)
return NULL;
handle->fd = fd;
handle->flags = flags;
return handle;
}
void tracecmd_msg_handle_close(struct tracecmd_msg_handle *msg_handle)
{
close(msg_handle->fd);
free(msg_handle);
}
#define MAX_OPTION_SIZE 4096
int tracecmd_msg_initial_setting(struct tracecmd_msg_handle *msg_handle)
{
struct tracecmd_msg_opt *opt;
struct tracecmd_msg msg;
int pagesize;
int options, i, s;
int cpus;
int ret;
int offset = 0;
u32 size = MIN_TINIT_SIZE;
u32 cmd;
ret = tracecmd_msg_recv_wait(msg_handle->fd, &msg);
if (ret < 0) {
if (ret == -ETIMEDOUT)
warning("Connection timed out\n");
return ret;
}
cmd = ntohl(msg.hdr.cmd);
if (cmd != MSG_TINIT) {
ret = -EINVAL;
goto error;
}
cpus = ntohl(msg.tinit.cpus);
plog("cpus=%d\n", cpus);
if (cpus < 0) {
ret = -EINVAL;
goto error;
}
msg_handle->cpu_count = cpus;
pagesize = ntohl(msg.tinit.page_size);
plog("pagesize=%d\n", pagesize);
if (pagesize <= 0) {
ret = -EINVAL;
goto error;
}
options = ntohl(msg.tinit.opt_num);
for (i = 0; i < options; i++) {
if (size + sizeof(*opt) > ntohl(msg.hdr.size)) {
plog("Not enough message for options\n");
ret = -EINVAL;
goto error;
}
opt = (void *)msg.opt + offset;
offset += ntohl(opt->size);
size += ntohl(opt->size);
if (ntohl(msg.hdr.size) < size) {
plog("Not enough message for options\n");
ret = -EINVAL;
goto error;
}
/* prevent a client from killing us */
if (ntohl(opt->size) > MAX_OPTION_SIZE) {
plog("Exceed MAX_OPTION_SIZE\n");
ret = -EINVAL;
goto error;
}
s = process_option(msg_handle, opt);
/* do we understand this option? */
if (!s) {
plog("Cannot understand(%d:%d:%d)\n",
i, ntohl(opt->size), ntohl(opt->opt_cmd));
ret = -EINVAL;
goto error;
}
}
return pagesize;
error:
error_operation_for_server(&msg);
return ret;
}
int tracecmd_msg_send_port_array(struct tracecmd_msg_handle *msg_handle,
int *ports)
{
struct tracecmd_msg msg;
int ret;
tracecmd_msg_init(MSG_RINIT, &msg);
ret = make_rinit(&msg, msg_handle->cpu_count, ports);
if (ret < 0)
return ret;
ret = tracecmd_msg_send(msg_handle->fd, &msg);
if (ret < 0)
return ret;
return 0;
}
void tracecmd_msg_send_close_msg(struct tracecmd_msg_handle *msg_handle)
{
struct tracecmd_msg msg;
tracecmd_msg_init(MSG_CLOSE, &msg);
tracecmd_msg_send(msg_handle->fd, &msg);
}
int tracecmd_msg_metadata_send(struct tracecmd_msg_handle *msg_handle,
const char *buf, int size)
{
struct tracecmd_msg msg;
int fd = msg_handle->fd;
int n;
int ret;
int count = 0;
tracecmd_msg_init(MSG_SENDMETA, &msg);
msg.buf = malloc(MSG_META_MAX_LEN);
if (!msg.buf)
return -ENOMEM;
msg.meta.size = htonl(MSG_META_MAX_LEN);
msg.hdr.size = htonl(MIN_META_SIZE + MSG_META_MAX_LEN);
n = size;
do {
if (n > MSG_META_MAX_LEN) {
memcpy(msg.buf, buf+count, MSG_META_MAX_LEN);
n -= MSG_META_MAX_LEN;
count += MSG_META_MAX_LEN;
} else {
msg.hdr.size = htonl(MIN_META_SIZE + n);
msg.meta.size = htonl(n);
memcpy(msg.buf, buf+count, n);
n = 0;
}
ret = msg_write(fd, &msg);
if (ret < 0)
break;
} while (n);
msg_free(&msg);
return ret;
}
int tracecmd_msg_finish_sending_metadata(struct tracecmd_msg_handle *msg_handle)
{
struct tracecmd_msg msg;
int ret;
tracecmd_msg_init(MSG_FINMETA, &msg);
ret = tracecmd_msg_send(msg_handle->fd, &msg);
if (ret < 0)
return ret;
return 0;
}
int tracecmd_msg_collect_metadata(struct tracecmd_msg_handle *msg_handle, int ofd)
{
struct tracecmd_msg msg;
u32 t, n, cmd;
ssize_t s;
int ret;
do {
ret = tracecmd_msg_recv_wait(msg_handle->fd, &msg);
if (ret < 0) {
if (ret == -ETIMEDOUT)
warning("Connection timed out\n");
else
warning("reading client");
return ret;
}
cmd = ntohl(msg.hdr.cmd);
if (cmd == MSG_FINMETA) {
/* Finish receiving meta data */
break;
} else if (cmd != MSG_SENDMETA)
goto error;
n = ntohl(msg.meta.size);
t = n;
s = 0;
do {
s = write(ofd, msg.buf+s, t);
if (s < 0) {
if (errno == EINTR)
continue;
warning("writing to file");
return -errno;
}
t -= s;
s = n - t;
} while (t);
} while (cmd == MSG_SENDMETA);
/* check the finish message of the client */
while (!tracecmd_msg_done(msg_handle)) {
ret = tracecmd_msg_recv(msg_handle->fd, &msg);
if (ret < 0) {
warning("reading client");
return ret;
}
cmd = ntohl(msg.hdr.cmd);
if (cmd == MSG_CLOSE)
/* Finish this connection */
break;
else {
warning("Not accept the message %d", ntohl(msg.hdr.cmd));
ret = -EINVAL;
goto error;
}
}
return 0;
error:
error_operation_for_server(&msg);
return ret;
}