On 4/13/21 12:00 AM, Ilya Maximets wrote:
> For debugging purposes it is useful to be able to record all the
> incoming transactions and commands and replay them locally under
> debugger or with additional logging enabled. This patch introduces
> ability to record all the incoming stream data and replay it via new
> stream provider named 'stream-replay'. During the record phase all
> the incoming stream data written to special replay_* files in the
> application rundir. On replay phase instead of opening real streams
> application will open replay_* files and read all the incoming data
> directly from them.
>
> If enabled for ovsdb-server, for example, this allows to record all
> the connections and transactions from the big setup and replay them
> locally afterwards to debug the behaviour or test performance.
>
> To start application in recording mode there is a --replay-record
> cmdline option. --replay is to replay previously recorded streams.
>
> Current version doesn't work well with time-based stream events like
> inactivity probes or any other events generated internally. This is
> a point for further improvement.
>
> Signed-off-by: Ilya Maximets <[email protected]>
> ---
> lib/automake.mk | 1 +
> lib/stream-provider.h | 5 +
> lib/stream-replay.c | 459 ++++++++++++++++++++++++++++++++++++++++++
> lib/stream.c | 35 +++-
> lib/stream.h | 12 ++
> 5 files changed, 506 insertions(+), 6 deletions(-)
> create mode 100644 lib/stream-replay.c
>
> diff --git a/lib/automake.mk b/lib/automake.mk
> index b558692c6..db9017591 100644
> --- a/lib/automake.mk
> +++ b/lib/automake.mk
> @@ -312,6 +312,7 @@ lib_libopenvswitch_la_SOURCES = \
> lib/stream-fd.c \
> lib/stream-fd.h \
> lib/stream-provider.h \
> + lib/stream-replay.c \
> lib/stream-ssl.h \
> lib/stream-tcp.c \
> lib/stream.c \
> diff --git a/lib/stream-provider.h b/lib/stream-provider.h
> index 75f4f059b..44e3c6431 100644
> --- a/lib/stream-provider.h
> +++ b/lib/stream-provider.h
> @@ -18,6 +18,7 @@
> #define STREAM_PROVIDER_H 1
>
> #include <sys/types.h>
> +#include "ovs-replay.h"
> #include "stream.h"
>
> /* Active stream connection. */
> @@ -29,6 +30,7 @@ struct stream {
> const struct stream_class *class;
> int state;
> int error;
> + replay_file_t replay_wfd;
> char *name;
> char *peer_id;
> };
> @@ -133,6 +135,7 @@ struct pstream {
> const struct pstream_class *class;
> char *name;
> ovs_be16 bound_port;
> + replay_file_t replay_wfd;
> };
>
> void pstream_init(struct pstream *, const struct pstream_class *, char
> *name);
> @@ -200,5 +203,7 @@ extern const struct pstream_class pwindows_pstream_class;
> extern const struct stream_class ssl_stream_class;
> extern const struct pstream_class pssl_pstream_class;
> #endif
> +extern const struct stream_class replay_stream_class;
> +extern const struct pstream_class preplay_pstream_class;
>
> #endif /* stream-provider.h */
> diff --git a/lib/stream-replay.c b/lib/stream-replay.c
> new file mode 100644
> index 000000000..ef591b920
> --- /dev/null
> +++ b/lib/stream-replay.c
> @@ -0,0 +1,459 @@
> +/*
> + * Copyright (c) 2021, Red Hat, Inc.
> + *
> + * Licensed under the Apache License, Version 2.0 (the "License");
> + * you may not use this file except in compliance with the License.
> + * You may obtain a copy of the License at:
> + *
> + * http://www.apache.org/licenses/LICENSE-2.0
> + *
> + * Unless required by applicable law or agreed to in writing, software
> + * distributed under the License is distributed on an "AS IS" BASIS,
> + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
> + * See the License for the specific language governing permissions and
> + * limitations under the License.
> + */
> +
> +#include <config.h>
> +#include <ctype.h>
> +#include <errno.h>
> +#include <poll.h>
> +#include <stdlib.h>
> +#include <string.h>
> +#include <sys/socket.h>
> +#include <sys/types.h>
> +#include <unistd.h>
> +#include "ovs-atomic.h"
> +#include "ovs-replay.h"
> +#include "util.h"
> +#include "stream-provider.h"
> +#include "stream.h"
> +#include "openvswitch/poll-loop.h"
> +#include "openvswitch/vlog.h"
> +
> +VLOG_DEFINE_THIS_MODULE(stream_replay);
> +
> +/* Active replay stream. */
> +
> +struct stream_replay
> +{
Nit: Curly brace on the line above, please.
> + struct stream stream;
> + replay_file_t f;
> + int seqno;
> +};
> +
> +const struct stream_class replay_stream_class;
> +
> +/* Creates a new stream named 'name' that will emulate sending and receiving
> + * data using replay file and stores a pointer to the stream in '*streamp'.
> + *
> + * Takes ownership of 'name'.
> + *
> + * Returns 0 if successful, otherwise a positive errno value. */
> +static int
> +new_replay_stream(char *name, struct stream **streamp)
> +{
> + struct stream_replay *s;
> + int seqno = 0, error = 0, open_result;
> + replay_file_t f;
> +
> + ovs_replay_lock();
> + error = ovs_replay_file_open(name, &f, &seqno);
> + if (error) {
> + VLOG_ERR("%s: failed to open stream.", name);
> + goto unlock;
I didn't try this out but don't we leak 'name' here?
> + }
> +
> + error = ovs_replay_read(f, NULL, 0, &open_result, &seqno, true);
> + if (error) {
> + VLOG_ERR("%s: failed to read 'open' record.", name);
> + ovs_replay_file_close(f);
> + goto unlock;
Same here.
> + }
> +
> + if (open_result) {
> + error = -open_result;
> + ovs_replay_file_close(f);
> + goto unlock;
Here too.
> + }
> +
> + s = xmalloc(sizeof *s);
> + stream_init(&s->stream, &replay_stream_class, 0, name);
> + s->f = f;
> + s->seqno = seqno;
> + *streamp = &s->stream;
> +unlock:
> + ovs_replay_unlock();
> + return error;
> +}
> +
> +static struct stream_replay *
> +stream_replay_cast(struct stream *stream)
> +{
> + stream_assert_class(stream, &replay_stream_class);
> + return CONTAINER_OF(stream, struct stream_replay, stream);
> +}
> +
> +void
> +stream_replay_open_wfd(struct stream *s, int open_result, const char *name)
> +{
> + int state = ovs_replay_get_state();
> + int error = 0;
> + replay_file_t f;
> +
> + if (OVS_LIKELY(state != OVS_REPLAY_WRITE)) {
> + return;
> + }
> +
> + ovs_replay_lock();
> + error = ovs_replay_file_open(name, &f, NULL);
> + if (error) {
> + VLOG_ERR("%s: failed to open replay file for stream.", name);
> + ovs_replay_unlock();
> + return;
> + }
> + ovs_replay_unlock();
> +
> + if (ovs_replay_write(f, NULL, -open_result, true)) {
> + VLOG_ERR("%s: failed to write 'open' failure: %d",
> + s->name, open_result);
> + }
> + if (open_result) {
> + /* We recorded failure to open the stream. */
> + ovs_replay_file_close(f);
> + } else {
> + s->replay_wfd = f;
> + }
> +}
> +
> +void
> +stream_replay_write(struct stream *s, const void *buffer, int n, bool
> is_read)
> +{
> + int state = ovs_replay_get_state();
> +
> + if (OVS_LIKELY(state != OVS_REPLAY_WRITE)) {
> + return;
> + }
> +
> + if (ovs_replay_write(s->replay_wfd, buffer, n, is_read)) {
> + VLOG_ERR("%s: failed to write buffer.", s->name);
ovs_replay_write() rate limits error logs, should we do that here too?
AFAICT this applies to all VLOG_ERR() calls in this file.
> + }
> +}
> +
> +void
> +stream_replay_close_wfd(struct stream *s)
> +{
> + if (s->replay_wfd) {
> + ovs_replay_file_close(s->replay_wfd);
> + }
> +}
> +
> +static int
> +stream_replay_open(const char *name, char *suffix OVS_UNUSED,
> + struct stream **streamp, uint8_t dscp OVS_UNUSED)
> +{
> + return new_replay_stream(xstrdup(name), streamp);
> +}
> +
> +static void
> +stream_replay_close(struct stream *stream)
> +{
> + struct stream_replay *s = stream_replay_cast(stream);
> + ovs_replay_file_close(s->f);
> + free(s);
> +}
> +
> +static ssize_t
> +stream_replay_recv(struct stream *stream, void *buffer, size_t n)
> +{
> + struct stream_replay *s = stream_replay_cast(stream);
> + int norm_seqno = ovs_replay_normalized_seqno(s->seqno);
> + int error, len;
> +
> + ovs_replay_lock();
> + ovs_assert(norm_seqno >= ovs_replay_seqno());
> +
> + if (norm_seqno != ovs_replay_seqno()
> + || !ovs_replay_seqno_is_read(s->seqno)) {
> + error = EAGAIN;
> + goto unlock;
> + }
> +
> + error = ovs_replay_read(s->f, buffer, n, &len, &s->seqno, true);
> + if (error) {
> + VLOG_ERR("%s: failed to read from replay file.", stream->name);
> + goto unlock;
> + }
> +
> +unlock:
> + ovs_replay_unlock();
> + return error ? -error : len;
> +}
> +
> +static ssize_t
> +stream_replay_send(struct stream *stream OVS_UNUSED,
> + const void *buffer OVS_UNUSED, size_t n)
> +{
> + struct stream_replay *s = stream_replay_cast(stream);
> + int norm_seqno = ovs_replay_normalized_seqno(s->seqno);
> + int error, len;
> +
> + ovs_replay_lock();
> + ovs_assert(norm_seqno >= ovs_replay_seqno());
> +
> + if (norm_seqno != ovs_replay_seqno()
> + || ovs_replay_seqno_is_read(s->seqno)) {
> + error = EAGAIN;
> + goto unlock;
> + }
> +
> + error = ovs_replay_read(s->f, NULL, 0, &len, &s->seqno, false);
> + if (error) {
> + VLOG_ERR("%s: failed to read from replay file.", stream->name);
> + goto unlock;
> + }
> + ovs_assert(len < 0 || len <= n);
> +
> +unlock:
> + ovs_replay_unlock();
> + return error ? -error : len;
> +}
> +
> +static void
> +stream_replay_wait(struct stream *stream, enum stream_wait_type wait)
> +{
> + struct stream_replay *s = stream_replay_cast(stream);
> + switch (wait) {
> + case STREAM_CONNECT:
> + /* Connect does nothing and always available. */
> + poll_immediate_wake();
> + break;
> +
> + case STREAM_SEND:
> + if (s->seqno != INT_MAX && !ovs_replay_seqno_is_read(s->seqno)) {
> + /* Stream waits for write. */
> + poll_immediate_wake();
> + }
> + break;
> +
> + case STREAM_RECV:
> + if (s->seqno != INT_MAX && ovs_replay_seqno_is_read(s->seqno)) {
> + /* We still have something to read. */
> + poll_immediate_wake();
> + }
> + break;
> +
> + default:
> + OVS_NOT_REACHED();
> + }
> +}
> +
> +const struct stream_class replay_stream_class = {
> + "replay", /* name */
> + false, /* needs_probes */
> + stream_replay_open, /* open */
> + stream_replay_close, /* close */
> + NULL, /* connect */
> + stream_replay_recv, /* recv */
> + stream_replay_send, /* send */
> + NULL, /* run */
> + NULL, /* run_wait */
> + stream_replay_wait, /* wait */
> +};
> +
> +/* Passive replay stream. */
> +
> +struct replay_pstream
> +{
> + struct pstream pstream;
> + replay_file_t f;
> + int seqno;
> +};
> +
> +const struct pstream_class preplay_pstream_class;
> +
> +static struct replay_pstream *
> +replay_pstream_cast(struct pstream *pstream)
> +{
> + pstream_assert_class(pstream, &preplay_pstream_class);
> + return CONTAINER_OF(pstream, struct replay_pstream, pstream);
> +}
> +
> +/* Creates a new pstream named 'name' that will accept new replay connections
> + * reading them from the replay file and stores a pointer to the stream in
> + * '*pstreamp'.
> + *
> + * Takes ownership of 'name'.
> + *
> + * Returns 0 if successful, otherwise a positive errno value. */
> +static int
> +pstream_replay_listen(const char *name, char *suffix OVS_UNUSED,
> + struct pstream **pstreamp, uint8_t dscp OVS_UNUSED)
> +{
> + int seqno = 0, error = 0, listen_result;
> + replay_file_t f;
> +
> + ovs_replay_lock();
> + error = ovs_replay_file_open(name, &f, &seqno);
> + if (error) {
> + VLOG_ERR("%s: failed to open pstream.", name);> + goto unlock;
'name' is leaked here.
> + }
> +
> + error = ovs_replay_read(f, NULL, 0, &listen_result, &seqno, true);
> + if (error) {
> + VLOG_ERR("%s: failed to read 'listen' record.", name);
> + ovs_replay_file_close(f);
> + goto unlock;
Same here.
> + }
> +
> + if (listen_result) {
> + error = -listen_result;
> + ovs_replay_file_close(f);
> + goto unlock;
Here too.
> + }
> +
> + struct replay_pstream *ps = xmalloc(sizeof *ps);
> + pstream_init(&ps->pstream, &preplay_pstream_class, xstrdup(name));
I guess the xstrdup(name) is not needed, otherwise we don't really take
ownership of 'name' and we actually leak it.
> + ps->f = f;
> + ps->seqno = seqno;
> + *pstreamp = &ps->pstream;
> +unlock:
> + ovs_replay_unlock();
> + return error;
> +}
> +
> +void
> +pstream_replay_open_wfd(struct pstream *ps, int listen_result,
> + const char *name)
> +{
> + int state = ovs_replay_get_state();
> + int error = 0;
> + replay_file_t f;
> +
> + if (OVS_LIKELY(state != OVS_REPLAY_WRITE)) {
> + return;
> + }
> +
> + ovs_replay_lock();
> + error = ovs_replay_file_open(name, &f, NULL);
> + if (error) {
> + VLOG_ERR("%s: failed to open replay file for pstream.", name);
> + ovs_replay_unlock();
> + return;
> + }
> + ovs_replay_unlock();
> +
> + if (ovs_replay_write(f, NULL, -listen_result, true)) {
> + VLOG_ERR("%s: failed to write 'listen' result: %d",
> + ps->name, listen_result);
> + }
> +
> + if (listen_result) {
> + /* We recorded failure to open the stream. */
> + ovs_replay_file_close(f);
> + } else {
> + ps->replay_wfd = f;
> + }
> +}
> +
> +
> +void
> +pstream_replay_write_accept(struct pstream *ps, const struct stream *s,
> + int accept_result)
> +{
> + int state = ovs_replay_get_state();
> + int len;
> +
> + if (OVS_LIKELY(state != OVS_REPLAY_WRITE)) {
> + return;
> + }
> +
> + if (!accept_result) {
> + len = strlen(s->name);
> + if (ovs_replay_write(ps->replay_wfd, s->name, len, true)) {
> + VLOG_ERR("%s: failed to write accept name: %s", ps->name,
> s->name);
> + }
> + } else if (ovs_replay_write(ps->replay_wfd, NULL, -accept_result, true))
> {
> + VLOG_ERR("%s: failed to write 'accept' failure: %d",
> + ps->name, accept_result);
> + }
> +}
> +
> +void
> +pstream_replay_close_wfd(struct pstream *ps)
> +{
> + if (ps->replay_wfd) {
> + ovs_replay_file_close(ps->replay_wfd);
> + }
> +}
> +
> +
Nit: I'd remove the second newline.
Thanks,
Dumitru
_______________________________________________
dev mailing list
[email protected]
https://mail.openvswitch.org/mailman/listinfo/ovs-dev