On 2/4/06, Ian McDonald <[EMAIL PROTECTED]> wrote:
> Initial implementation of transmit buffering. Tested using netem with
> delay and loss also.
>
> Signed off by: Ian McDonald <[EMAIL PROTECTED]>
> ----
> diff --git a/include/linux/dccp.h b/include/linux/dccp.h
> index 088529f..4a2f845 100644
> --- a/include/linux/dccp.h
> +++ b/include/linux/dccp.h
> @@ -411,6 +411,8 @@ struct dccp_ackvec;
> * @dccps_role - Role of this sock, one of %dccp_role
> * @dccps_ndp_count - number of Non Data Packets since last data packet
> * @dccps_hc_rx_ackvec - rx half connection ack vector
> + * @dccps_xmit_timer - timer for when CCID is not ready to send
> + * @dccps_xmit_lock - lock for transmitting
> */
> struct dccp_sock {
> /* inet_connection_sock has to be the first member of dccp_sock */
> @@ -443,6 +445,8 @@ struct dccp_sock {
> enum dccp_role dccps_role:2;
> __u8 dccps_hc_rx_insert_options:1;
> __u8 dccps_hc_tx_insert_options:1;
> + struct timer_list dccps_xmit_timer;
> + spinlock_t dccps_xmit_lock;
See the comments below, I guess we don't need yet another lock :-)
> };
>
> static inline struct dccp_sock *dccp_sk(const struct sock *sk)
> diff --git a/net/dccp/dccp.h b/net/dccp/dccp.h
> index 93f26dd..82431c0 100644
> --- a/net/dccp/dccp.h
> +++ b/net/dccp/dccp.h
> @@ -5,7 +5,7 @@
> *
> * An implementation of the DCCP protocol
> * Copyright (c) 2005 Arnaldo Carvalho de Melo <[EMAIL PROTECTED]>
> - * Copyright (c) 2005 Ian McDonald <[EMAIL PROTECTED]>
> + * Copyright (c) 2005-6 Ian McDonald <[EMAIL PROTECTED]>
> *
> * This program is free software; you can redistribute it and/or modify
> it
> * under the terms of the GNU General Public License version 2 as
> @@ -126,7 +126,7 @@ extern void dccp_send_delayed_ack(struct
> extern void dccp_send_sync(struct sock *sk, const u64 seq,
> const enum dccp_pkt_type pkt_type);
>
> -extern int dccp_write_xmit(struct sock *sk, struct sk_buff *skb, long
> *timeo);
> +void dccp_write_xmit(struct sock *sk, int block);
> extern void dccp_write_space(struct sock *sk);
Please leave the "extern"
> extern void dccp_init_xmit_timers(struct sock *sk);
> diff --git a/net/dccp/output.c b/net/dccp/output.c
> index efd7ffb..90b802d 100644
> --- a/net/dccp/output.c
> +++ b/net/dccp/output.c
> @@ -2,7 +2,8 @@
> * net/dccp/output.c
> *
> * An implementation of the DCCP protocol
> - * Arnaldo Carvalho de Melo <[EMAIL PROTECTED]>
> + * Copyright (c) 2005 Arnaldo Carvalho de Melo <[EMAIL PROTECTED]>
> + * Copyright (c) 2006 Ian McDonald <[EMAIL PROTECTED]>
> *
> * This program is free software; you can redistribute it and/or
> * modify it under the terms of the GNU General Public License
> @@ -191,7 +192,7 @@ static int dccp_wait_for_ccid(struct soc
> while (1) {
> prepare_to_wait(sk->sk_sleep, &wait, TASK_INTERRUPTIBLE);
>
> - if (sk->sk_err || (sk->sk_shutdown & SEND_SHUTDOWN))
> + if (sk->sk_err)
Humm, have to check this one...
> goto do_error;
> if (!*timeo)
> goto do_nonblock;
> @@ -207,9 +208,11 @@ static int dccp_wait_for_ccid(struct soc
> goto do_nonblock;
>
> sk->sk_write_pending++;
> + spin_unlock(&dp->dccps_xmit_lock);
> release_sock(sk);
See? two locks being released...
> *timeo -= schedule_timeout(delay);
> lock_sock(sk);
> + spin_lock(&dp->dccps_xmit_lock);
and being grabbed again...
> sk->sk_write_pending--;
> }
> out:
> @@ -227,37 +230,56 @@ do_interrupted:
> goto out;
> }
>
> -int dccp_write_xmit(struct sock *sk, struct sk_buff *skb, long *timeo)
> -{
> - const struct dccp_sock *dp = dccp_sk(sk);
> - int err = ccid_hc_tx_send_packet(dp->dccps_hc_tx_ccid, sk, skb,
> - skb->len);
> +static void dccp_write_xmit_timer(unsigned long sk) {
> + dccp_write_xmit((struct sock *)sk,0);
> +}
I guess we don't need this lock, but instead use bh_lock_sock, check if
there are users, look at ccid3_hc_tx_no_feedback_timer & ccid2_hc_tx_rto_expire
(I left a comment even having fixed the problem, duh will fix).
> - if (err > 0)
> - err = dccp_wait_for_ccid(sk, skb, timeo);
> +void dccp_write_xmit(struct sock *sk, int block)
> +{
> + struct dccp_sock *dp = dccp_sk(sk);
> + struct sk_buff *skb;
> + long timeo = 2000; /* FIXME imcdnzl - 2 second default */
>
> - if (err == 0) {
> - struct dccp_skb_cb *dcb = DCCP_SKB_CB(skb);
> - const int len = skb->len;
> + spin_lock(&dp->dccps_xmit_lock);
We're already protected by lock_sock() and the timer will just use bh_lock_sock
> +
> + while ((skb = skb_peek(&sk->sk_write_queue))) {
> + int err = ccid_hc_tx_send_packet(dp->dccps_hc_tx_ccid, sk,
> skb,
> + skb->len);
> +
> + if (err > 0) {
> + if (likely(!block)) {
> + mod_timer(&dp->dccps_xmit_timer,
> +
> msecs_to_jiffies(err)+jiffies);
sk_reset_timer() please, so that we make sure we have a reference count
for the sock as its going to be on a timer
> + goto xmit_out;
> + } else {
> + err = dccp_wait_for_ccid(sk, skb, &timeo);
> + }
No need for the {}, just one statement
> + }
>
> - if (sk->sk_state == DCCP_PARTOPEN) {
> - /* See 8.1.5. Handshake Completion */
> - inet_csk_schedule_ack(sk);
> - inet_csk_reset_xmit_timer(sk, ICSK_TIME_DACK,
> + skb_dequeue(&sk->sk_write_queue);
sk_eat_skb() later?
> + if (err == 0) {
> + struct dccp_skb_cb *dcb = DCCP_SKB_CB(skb);
> + const int len = skb->len;
> +
> + if (sk->sk_state == DCCP_PARTOPEN) {
> + /* See 8.1.5. Handshake Completion */
> + inet_csk_schedule_ack(sk);
> + inet_csk_reset_xmit_timer(sk, ICSK_TIME_DACK,
> inet_csk(sk)->icsk_rto,
> DCCP_RTO_MAX);
> - dcb->dccpd_type = DCCP_PKT_DATAACK;
> - } else if (dccp_ack_pending(sk))
> - dcb->dccpd_type = DCCP_PKT_DATAACK;
> - else
> - dcb->dccpd_type = DCCP_PKT_DATA;
> -
> - err = dccp_transmit_skb(sk, skb);
> - ccid_hc_tx_packet_sent(dp->dccps_hc_tx_ccid, sk, 0, len);
> - } else
> - kfree_skb(skb);
> -
> - return err;
> + dcb->dccpd_type = DCCP_PKT_DATAACK;
> + } else if (dccp_ack_pending(sk))
> + dcb->dccpd_type = DCCP_PKT_DATAACK;
> + else
> + dcb->dccpd_type = DCCP_PKT_DATA;
> +
> + err = dccp_transmit_skb(sk, skb);
> + ccid_hc_tx_packet_sent(dp->dccps_hc_tx_ccid, sk, 0,
> len);
> + } else
> + kfree(skb);
Like at the end, i.e. we dequeue and free (sk_eat_skb())
> + }
> +xmit_out:
> + spin_unlock(&dp->dccps_xmit_lock);
> }
>
> int dccp_retransmit_skb(struct sock *sk, struct sk_buff *skb)
> @@ -396,6 +418,10 @@ static inline void dccp_connect_init(str
> dccp_set_seqno(&dp->dccps_awl, max48(dp->dccps_awl, dp->dccps_iss));
>
> icsk->icsk_retransmits = 0;
> + init_timer(&dp->dccps_xmit_timer);
> + dp->dccps_xmit_timer.data = (unsigned long)sk;
> + dp->dccps_xmit_timer.function = dccp_write_xmit_timer;
Perhaps we use one of icsk timers? Have to check
> + dp->dccps_xmit_lock = SPIN_LOCK_UNLOCKED;
Not needed
> }
>
> int dccp_connect(struct sock *sk)
> @@ -527,8 +553,11 @@ void dccp_send_close(struct sock *sk, co
> DCCP_PKT_CLOSE : DCCP_PKT_CLOSEREQ;
>
> if (active) {
> + dccp_write_xmit(sk, 1);
> dccp_skb_entail(sk, skb);
> dccp_transmit_skb(sk, skb_clone(skb, prio));
> - } else
> + /* FIXME do we need a retransmit timer here? */
> + } else {
> dccp_transmit_skb(sk, skb);
> + }
No need for {}, just one statement
> }
> diff --git a/net/dccp/proto.c b/net/dccp/proto.c
> index 65b11ea..119ecc5 100644
> --- a/net/dccp/proto.c
> +++ b/net/dccp/proto.c
> @@ -385,6 +385,7 @@ int dccp_sendmsg(struct kiocb *iocb, str
>
> lock_sock(sk);
> timeo = sock_sndtimeo(sk, noblock);
> + /* FIXME imcdnzl - we should be using timeo for memory allocation */
>
> /*
> * We have to use sk_stream_wait_connect here to set sk_write_pending,
> @@ -407,19 +408,13 @@ int dccp_sendmsg(struct kiocb *iocb, str
> if (rc != 0)
> goto out_discard;
>
> - rc = dccp_write_xmit(sk, skb, &timeo);
> - /*
> - * XXX we don't use sk_write_queue, so just discard the packet.
> - * Current plan however is to _use_ sk_write_queue with
> - * an algorith similar to tcp_sendmsg, where the main difference
> - * is that in DCCP we have to respect packet boundaries, so
> - * no coalescing of skbs.
> - *
> - * This bug was _quickly_ found & fixed by just looking at an
> OSTRA
> - * generated callgraph 8) -acme
> - */
> + skb_queue_tail(&sk->sk_write_queue, skb);
> + release_sock(sk);
> + dccp_write_xmit(sk,0);
> + goto out_end;
> out_release:
> release_sock(sk);
> +out_end:
> return rc ? : len;
> out_discard:
> kfree_skb(skb);
> @@ -591,6 +586,7 @@ static int dccp_close_state(struct sock
>
> void dccp_close(struct sock *sk, long timeout)
> {
> + struct dccp_sock *dp = dccp_sk(sk);
> struct sk_buff *skb;
>
> lock_sock(sk);
> @@ -606,6 +602,8 @@ void dccp_close(struct sock *sk, long ti
> goto adjudge_to_death;
> }
>
> + del_timer_sync(&dp->dccps_xmit_timer);
> +
sk_stop_timer please, to drop the refcount we grabbed with sk_reset_timer()
elsewhere.
- Arnaldo
-
To unsubscribe from this list: send the line "unsubscribe dccp" in
the body of a message to [EMAIL PROTECTED]
More majordomo info at http://vger.kernel.org/majordomo-info.html