netperf-2.4.5/src/nettest_bsd.c - nest-learning-thermostat/5.0.1/netperf - Git at Google

 /* identification string compiled into the object unless "lint" is
    defined.  the leading "@(#)" looks like the SCCS what(1) marker
    convention -- TODO confirm that is the intent. */
 #ifndef lint
 char	nettest_id[]="\
 @(#)nettest_bsd.c (c) Copyright 1993-2008 Hewlett-Packard Co. Version 2.4.5";
 #endif /* lint */


 /****************************************************************/
 /*								*/
 /*	nettest_bsd.c						*/
 /*								*/
 /*      the BSD sockets parsing routine...                      */
 /*       ...with the addition of Windows NT, this is now also   */
 /*          a Winsock test... sigh :)                           */
 /*                                                              */
 /*      scan_sockets_args()                                     */
 /*                                                              */
 /*	the actual test routines...				*/
 /*								*/
 /*	send_tcp_stream()	perform a tcp stream test	*/
 /*	recv_tcp_stream()					*/
 /*      send_tcp_maerts()       perform a tcp stream test       */
 /*      recv_tcp_maerts()       in the other direction          */
 /*	send_tcp_rr()		perform a tcp request/response	*/
 /*	recv_tcp_rr()						*/
 /*      send_tcp_conn_rr()      an RR test including connect    */
 /*      recv_tcp_conn_rr()                                      */
 /*      send_tcp_cc()           a connect/disconnect test with  */
 /*      recv_tcp_cc()           no RR                           */
 /*      send_tcp_mss()          just report the mss             */
 /*	send_udp_stream()	perform a udp stream test	*/
 /*	recv_udp_stream()					*/
 /*	send_udp_rr()		perform a udp request/response	*/
 /*	recv_udp_rr()						*/
 /*	loc_cpu_rate()		determine the local cpu maxrate */
 /*	rem_cpu_rate()		find the remote cpu maxrate	*/
 /*								*/
 /****************************************************************/

 #ifdef HAVE_CONFIG_H
 #include <config.h>
 #endif

 #include <stdio.h>
 #if HAVE_SYS_TYPES_H
 # include <sys/types.h>
 #endif
 #if HAVE_SYS_STAT_H
 # include <sys/stat.h>
 #endif
 #if STDC_HEADERS
 # include <stdlib.h>
 # include <stddef.h>
 #else
 # if HAVE_STDLIB_H
 #  include <stdlib.h>
 # endif
 #endif
 #if HAVE_STRING_H
 # if !STDC_HEADERS && HAVE_MEMORY_H
 #  include <memory.h>
 # endif
 # include <string.h>
 #endif
 #if HAVE_STRINGS_H
 # include <strings.h>
 #endif
 #if HAVE_INTTYPES_H
 # include <inttypes.h>
 #else
 # if HAVE_STDINT_H
 #  include <stdint.h>
 # endif
 #endif
 #if HAVE_UNISTD_H
 # include <unistd.h>
 #endif

 #include <fcntl.h>
 #ifndef WIN32
 #include <errno.h>
 #include <signal.h>
 #endif

 #if TIME_WITH_SYS_TIME
 # include <sys/time.h>
 # include <time.h>
 #else
 # if HAVE_SYS_TIME_H
 #  include <sys/time.h>
 # else
 #  include <time.h>
 # endif
 #endif

 #ifdef NOSTDLIBH
 #include <malloc.h>
 #endif /* NOSTDLIBH */

 #ifdef WANT_SCTP
 #include <netinet/sctp.h>
 #endif

 #ifndef WIN32
 #if !defined(__VMS) && !defined(MSDOS)
 #include <sys/ipc.h>
 #endif /* !__VMS && !MSDOS */
 #include <sys/socket.h>
 #include <netinet/in.h>
 #include <netinet/tcp.h>
 #include <arpa/inet.h>
 #include <netdb.h>
 #else /* WIN32 */
 #include <process.h>
 #define netperf_socklen_t socklen_t
 #include <winsock2.h>

 /* while it is unlikely that anyone running Windows 2000 or NT 4 is
    going to be trying to compile this, if they are they will want to
    define DONT_IPV6 in the sources file */
 #ifndef DONT_IPV6
 #include <ws2tcpip.h>
 #endif
 #include <windows.h>

 #define sleep(x) Sleep((x)*1000)

 #define __func__ __FUNCTION__
 #endif /* WIN32 */

 /* We don't want to use bare constants in the shutdown() call.  In the
    extremely unlikely event that SHUT_WR isn't defined, we will define
    it to the value we used to be passing to shutdown() anyway.  raj
    2007-02-08 */
 #if !defined(SHUT_WR)
 #define SHUT_WR 1
 #endif

 #if !defined(HAVE_GETADDRINFO) || !defined(HAVE_GETNAMEINFO)
 # include "missing/getaddrinfo.h"
 #endif

 #include "netlib.h"
 #include "netsh.h"
 #include "nettest_bsd.h"

 #if defined(WANT_HISTOGRAM) || defined(WANT_DEMO)
 #include "hist.h"
 #endif /* WANT_HISTOGRAM */


 /* first_burst_size is defined in every build so that the TCP_RR
    transaction latency calculation can always refer to it.  the
    default value depends on the build so that "omni" output shows
    whether WANT_FIRST_BURST was enabled: 0 when it was, -1 when it
    was not. */
 #if !defined(WANT_FIRST_BURST)
 int first_burst_size = -1;
 #else
 int first_burst_size = 0;
 #endif

 #if defined(HAVE_SENDFILE) && (defined(__linux) || defined(__sun))
 #include <sys/sendfile.h>
 #endif /* HAVE_SENDFILE && (__linux || __sun) */


 /* state belonging to the BSD sockets tests.  other files may use
  * these as well; they are declared extern in nettest_bsd.h
  */

 int socket_type;          /* used initially by the "omni" tests */

 /* remote socket buffer sizes */
 int rss_size_req = -1;    /* requested remote socket send buffer size */
 int rsr_size_req = -1;    /* requested remote socket recv buffer size */
 int rss_size;             /* initial remote socket send buffer size */
 int rsr_size;             /* initial remote socket recv buffer size */
 int rss_size_end = -1;    /* final remote socket send buffer size */
 int rsr_size_end = -1;    /* final remote socket recv buffer size */

 /* local socket buffer sizes */
 int lss_size_req = -1;    /* requested local socket send buffer size */
 int lsr_size_req = -1;    /* requested local socket recv buffer size */
 int lss_size;             /* local socket send buffer size */
 int lsr_size;             /* local socket recv buffer size */
 int lss_size_end = -1;    /* final local socket send buffer size */
 int lsr_size_end = -1;    /* final local socket recv buffer size */

 /* message sizes */
 int req_size = 1;         /* request size */
 int rsp_size = 1;         /* response size */
 int send_size;            /* how big are individual sends */
 int recv_size;            /* how big are individual receives */

 /* file-local bookkeeping; all three start out zero-initialized */
 static int confidence_iteration;
 static char local_cpu_method;
 static char remote_cpu_method;

 /* lower and upper bounds on the client port numbers we try to use
    in the TCP_CRR and/or TCP_TRR tests. raj 3/95 */
 static int client_port_min = 5000;
 static int client_port_max = 65535;

  /* assorted per-socket option switches */

 int loc_nodelay;          /* don't/do use NODELAY locally */
 int rem_nodelay;          /* don't/do use NODELAY remotely */

 /* the TCP_CORK switches default to -1 when the platform does not
    define TCP_CORK at all */
 #ifdef TCP_CORK
 int loc_tcpcork = 0;      /* don't/do use TCP_CORK locally */
 int rem_tcpcork = 0;      /* don't/do use TCP_CORK remotely */
 #else
 int loc_tcpcork = -1;
 int rem_tcpcork = -1;
 #endif /* TCP_CORK */

 int loc_sndavoid;         /* avoid send copies locally */
 int loc_rcvavoid;         /* avoid recv copies locally */
 int rem_sndavoid;         /* avoid send copies remotely */
 int rem_rcvavoid;         /* avoid recv copies remotely */

 int local_connected = 0;  /* local socket type, connected/non-connected */
 int remote_connected = 0; /* remote socket type, connected/non-connected */

 /* histogram support: a pair of timestamps plus the histogram itself.
    the timestamp type is picked per platform: hrtime_t when
    HAVE_GETHRTIME is defined, hrt_t (from hrt.h) when HAVE_GET_HRT is
    set, LARGE_INTEGER on WIN32, and struct timeval otherwise.
    presumably time_one/time_two bracket the operation being timed --
    confirm against the test routines that use them. */
 #ifdef WANT_HISTOGRAM
 #ifdef HAVE_GETHRTIME
 static hrtime_t time_one;
 static hrtime_t time_two;
 #elif HAVE_GET_HRT
 #include "hrt.h"
 static hrt_t time_one;
 static hrt_t time_two;
 #elif defined(WIN32)
 static LARGE_INTEGER time_one;
 static LARGE_INTEGER time_two;
 #else
 static struct timeval time_one;
 static struct timeval time_two;
 #endif /* HAVE_GETHRTIME */
 /* the histogram handle itself (HIST is declared outside this file) */
 static HIST time_hist;
 #endif /* WANT_HISTOGRAM */

 #ifdef WANT_INTERVALS
 /* count-down of sends left in the current burst; it is reloaded from
    interval_burst by the macros below */
 int interval_count;
 #ifndef WANT_SPIN
 /* signal mask captured by INTERVALS_INIT() and handed to sigsuspend()
    by INTERVALS_WAIT() */
 sigset_t signal_set;

 /* INTERVALS_INIT: when interval_burst is non-zero, start the interval
    timer with start_itimer(interval_wate).  then load interval_count
    and fetch the current signal mask into signal_set; if that fails a
    message is written to "where" and the process exits with status 1.
    the expansion is a bare statement sequence, not a single
    statement. */
 #define INTERVALS_INIT() \
     if (interval_burst) { \
       /* zero means that we never pause, so we never should need the \
          interval timer. we used to use it for demo mode, but we deal \
          with that with a variant on watching the clock rather than \
          waiting for a timer. raj 2006-02-06 */ \
       start_itimer(interval_wate); \
     } \
     interval_count = interval_burst; \
     /* get the signal set for the call to sigsuspend */ \
     if (sigprocmask(SIG_BLOCK, (sigset_t *)NULL, &signal_set) != 0) { \
       fprintf(where, \
               "%s: unable to get sigmask errno %d\n", \
               __func__, \
               errno); \
       fflush(where); \
       exit(1); \
     }

 /* INTERVALS_WAIT: count one send against the burst and, once the
    burst is used up, block in sigsuspend() until a signal arrives.
    sigsuspend() always returns -1 and reports the reason through
    errno, so the fault check has to look at errno rather than at the
    return value. */
 #define INTERVALS_WAIT() \
       /* in this case, the interval count is the count-down counter \
          to decide to sleep for a little bit */ \
       if ((interval_burst) && (--interval_count == 0)) { \
         /* call sigsuspend and wait for the interval timer to get us \
            out */ \
         if (debug > 1) { \
           fprintf(where,"about to suspend\n"); \
           fflush(where); \
         } \
         if ((sigsuspend(&signal_set) == -1) && (errno == EFAULT)) { \
           fprintf(where, \
                   "%s: fault with sigsuspend.\n", \
                   __func__); \
           fflush(where); \
           exit(1); \
         } \
         interval_count = interval_burst; \
       }
 #else
 /* spin variant: rather than sleeping on a timer we poll the clock.
    intvl_one_ptr refers to the timestamp taken at the start of the
    current interval and intvl_two_ptr to the most recent sample; the
    two pointers are swapped at the end of every interval. */
 #ifdef HAVE_GETHRTIME
 static hrtime_t intvl_one;
 static hrtime_t intvl_two;
 static hrtime_t *intvl_one_ptr = &intvl_one;
 static hrtime_t *intvl_two_ptr = &intvl_two;
 static hrtime_t *temp_intvl_ptr = &intvl_one;
 #elif defined(WIN32)
 static LARGE_INTEGER intvl_one;
 static LARGE_INTEGER intvl_two;
 static LARGE_INTEGER *intvl_one_ptr = &intvl_one;
 static LARGE_INTEGER *intvl_two_ptr = &intvl_two;
 static LARGE_INTEGER *temp_intvl_ptr = &intvl_one;
 #else
 static struct timeval intvl_one;
 static struct timeval intvl_two;
 static struct timeval *intvl_one_ptr = &intvl_one;
 static struct timeval *intvl_two_ptr = &intvl_two;
 static struct timeval *temp_intvl_ptr = &intvl_one;
 #endif

 /* INTERVALS_INIT (spin): take the first timestamp when bursts are in
    use and load the burst count-down */
 #define INTERVALS_INIT() \
       if (interval_burst) { \
         HIST_timestamp(intvl_one_ptr); \
       } \
       interval_count = interval_burst;

 /* INTERVALS_WAIT (spin): count one send against the burst and, once
    the burst is used up, re-sample the clock until delta_micro() of
    the two timestamps reaches interval_usecs */
 #define INTERVALS_WAIT() \
       /* in this case, the interval count is the count-down counter \
          to decide to spin for a little bit */ \
       if ((interval_burst) && (--interval_count == 0)) { \
         /* busy-wait, re-reading the clock, until the interval has \
            elapsed */ \
         if (debug > 1) { \
           fprintf(where,"about to spin suspend\n"); \
           fflush(where); \
         } \
         HIST_timestamp(intvl_two_ptr); \
         while(delta_micro(intvl_one_ptr,intvl_two_ptr) < interval_usecs) { \
           HIST_timestamp(intvl_two_ptr); \
         } \
         /* the latest sample becomes the start of the next interval */ \
         temp_intvl_ptr = intvl_one_ptr; \
         intvl_one_ptr = intvl_two_ptr; \
         intvl_two_ptr = temp_intvl_ptr; \
         interval_count = interval_burst; \
       }
 #endif
 #endif

 #ifdef WANT_DEMO
 /* demo-mode timestamps.  demo_one_ptr refers to the start of the
    current reporting interval and demo_two_ptr to the latest sample;
    DEMO_INTERVAL() swaps them each time an interim result is
    emitted.  the timestamp type is selected per platform. */
 #ifdef HAVE_GETHRTIME
 static hrtime_t demo_one;
 static hrtime_t demo_two;
 static hrtime_t *demo_one_ptr = &demo_one;
 static hrtime_t *demo_two_ptr = &demo_two;
 static hrtime_t *temp_demo_ptr = &demo_one;
 #elif defined(WIN32)
 static LARGE_INTEGER demo_one;
 static LARGE_INTEGER demo_two;
 static LARGE_INTEGER *demo_one_ptr = &demo_one;
 static LARGE_INTEGER *demo_two_ptr = &demo_two;
 static LARGE_INTEGER *temp_demo_ptr = &demo_one;
 #else
 static struct timeval demo_one;
 static struct timeval demo_two;
 static struct timeval *demo_one_ptr = &demo_one;
 static struct timeval *demo_two_ptr = &demo_two;
 static struct timeval *temp_demo_ptr = &demo_one;
 #endif

 /* for a _STREAM test, "a" should be lss_size and "b" should be
    rsr_size. for a _MAERTS test, "a" should be lsr_size and "b" should
    be rss_size. raj 2005-04-06
    the arguments are parenthesized in the expansion so that passing
    an expression still yields twice the larger value; each argument
    may be evaluated more than once. */
 #define DEMO_STREAM_SETUP(a,b) \
     if ((demo_mode) && (demo_units == 0)) { \
       /* take our default value of demo_units to be the larger of \
          twice "a" or twice "b" */ \
       if ((a) > (b)) { \
         demo_units = 2*(a); \
       } \
       else { \
         demo_units = 2*(b); \
       } \
     }

 /* now that calc_thruput_interval knows about transactions as a format
    we can merge DEMO_STREAM_INTERVAL and DEMO_RR_INTERVAL since they
    are the same */

 /* DEMO_INTERVAL: add "units" to the running total for this tick and,
    once the total reaches demo_units, re-tune demo_units from the
    measured interval and possibly print an interim result */
 #define DEMO_INTERVAL(units) \
       if (demo_mode) { \
         double actual_interval; \
         units_this_tick += (units); \
         if (units_this_tick >= demo_units) { \
           /* time to possibly update demo_units and maybe output an \
              interim result */ \
           HIST_timestamp(demo_two_ptr); \
           actual_interval = delta_micro(demo_one_ptr,demo_two_ptr); \
           /* we always want to fine-tune demo_units here whether we \
              emit an interim result or not.  if we are short, this \
              will lengthen demo_units.  if we are long, this will \
              shorten it */ \
           demo_units = demo_units * (demo_interval / actual_interval); \
           if (actual_interval >= demo_interval) { \
             /* time to emit an interim result */ \
             fprintf(where, \
                     "Interim result: %.2f %s/s over %.2f seconds\n", \
                     calc_thruput_interval(units_this_tick, \
                                           actual_interval/1000000.0), \
                     format_units(), \
                     actual_interval/1000000.0); \
             units_this_tick = 0.0; \
             /* the sample just taken becomes the new starting \
                timestamp; swap the pointers rather than taking \
                another timestamp */ \
             temp_demo_ptr = demo_one_ptr; \
             demo_one_ptr = demo_two_ptr; \
             demo_two_ptr = temp_demo_ptr; \
           } \
         } \
       }

 #define DEMO_STREAM_INTERVAL(units) DEMO_INTERVAL(units)

 /* DEMO_RR_SETUP: when demo mode is on and demo_units has not been set
    yet, use the caller's value as is */
 #define DEMO_RR_SETUP(a) \
     if ((demo_mode) && (demo_units == 0)) { \
       /* take whatever we are given */ \
       demo_units = (a); \
     }

 #define DEMO_RR_INTERVAL(units) DEMO_INTERVAL(units)

 #endif

 /* help text describing the test-specific options of the BSD sockets
    tests, i.e. those given after the "--" on the netperf command
    line.  the text is one string literal spliced together with
    backslash-newline continuations. */
 char sockets_usage[] = "\n\
 Usage: netperf [global options] -- [test options] \n\
 \n\
 TCP/UDP BSD Sockets Test Options:\n\
     -b number         Send number requests at start of _RR tests\n\
     -C                Set TCP_CORK when available\n\
     -D [L][,R]        Set TCP_NODELAY locally and/or remotely (TCP_*)\n\
     -h                Display this text\n\
     -H name,fam       Use name (or IP) and family as target of data connection\n\
     -L name,fam       Use name (or IP) and family as source of data connection\n\
     -m bytes          Set the send size (TCP_STREAM, UDP_STREAM)\n\
     -M bytes          Set the recv size (TCP_STREAM, UDP_STREAM)\n\
     -n                Use the connected socket for UDP locally\n\
     -N                Use the connected socket for UDP remotely\n\
     -p min[,max]      Set the min/max port numbers for TCP_CRR, TCP_TRR\n\
     -P local[,remote] Set the local/remote port for the data socket\n\
     -r req,[rsp]      Set request/response sizes (TCP_RR, UDP_RR)\n\
     -s send[,recv]    Set local socket send/recv buffer sizes\n\
     -S send[,recv]    Set remote socket send/recv buffer sizes\n\
     -4                Use AF_INET (eg IPv4) on both ends of the data conn\n\
     -6                Use AF_INET6 (eg IPv6) on both ends of the data conn\n\
 \n\
 For those options taking two parms, at least one must be specified;\n\
 specifying one value without a comma will set both parms to that\n\
 value, specifying a value with a leading comma will set just the second\n\
 parm, a value with a trailing comma will set just the first. To set\n\
 each parm to unique values, specify both and separate them with a\n\
 comma.\n";


 /* these routines convert between the AF address space and the NF
    address space since the numeric values of AF_mumble are not the
    same across the platforms. raj 2005-02-08 */

 /* translate a netperf NF_* family value into this host's AF_* value.
    anything we do not recognize, and NF_INET6 on a host without
    AF_INET6, comes back as AF_UNSPEC. */
 int
 nf_to_af(int nf) {
   if (NF_INET == nf) {
     return AF_INET;
   }
 #if defined(AF_INET6)
   if (NF_INET6 == nf) {
     return AF_INET6;
   }
 #endif
   /* NF_UNSPEC and everything else */
   return AF_UNSPEC;
 }

 /* translate this host's AF_* family value into the netperf NF_*
    value.  unrecognized families come back as NF_UNSPEC. */
 int
 af_to_nf(int af) {
   if (AF_INET == af) {
     return NF_INET;
   }
 #if defined(AF_INET6)
   if (AF_INET6 == af) {
     return NF_INET6;
   }
 #endif
   /* AF_UNSPEC and everything else */
   return NF_UNSPEC;
 }


 /* these routines will convert between the hosts' socket types and
    those netperf uses.  we need this because different platforms can
    have different values for SOCK_STREAM, SOCK_DGRAM and the
    like... */

 /* translate a netperf NST_* socket type into the host's SOCK_* value;
    returns -1 for a type the host does not define or we do not know */
 int
 nst_to_hst(int nst) {
   int host_type = -1;

 #ifdef SOCK_STREAM
   if (NST_STREAM == nst) {
     host_type = SOCK_STREAM;
   }
 #endif
 #ifdef SOCK_DGRAM
   if (NST_DGRAM == nst) {
     host_type = SOCK_DGRAM;
   }
 #endif
 #ifdef SOCK_DCCP
   if (NST_DCCP == nst) {
     host_type = SOCK_DCCP;
   }
 #endif

   return host_type;
 }

 /* translate the host's SOCK_* socket type into the netperf NST_*
    value; returns NST_UNKN for anything unrecognized */
 int
 hst_to_nst(int hst) {
   int netperf_type = NST_UNKN;

 #ifdef SOCK_STREAM
   if (SOCK_STREAM == hst) {
     netperf_type = NST_STREAM;
   }
 #endif
 #ifdef SOCK_DGRAM
   if (SOCK_DGRAM == hst) {
     netperf_type = NST_DGRAM;
   }
 #endif
 #ifdef SOCK_DCCP
   if (SOCK_DCCP == hst) {
     netperf_type = NST_DCCP;
   }
 #endif

   return netperf_type;
 }
 /* give back a printable name for the host's SOCK_* socket type, or
    "Unknown" when the type is not one we recognize.  the result
    points at a string literal and must not be modified or freed. */
 char *
 hst_to_str(int hst) {
   char *label = "Unknown";

 #ifdef SOCK_STREAM
   if (SOCK_STREAM == hst) {
     label = "Stream";
   }
 #endif
 #ifdef SOCK_DGRAM
   if (SOCK_DGRAM == hst) {
     label = "Datagram";
   }
 #endif
 #ifdef SOCK_DCCP
   if (SOCK_DCCP == hst) {
     label = "DCCP";
   }
 #endif

   return label;
 }

 /* give back a printable name for an IPPROTO_* value, or "Unknown
    Protocol" when it is not one this build knows about.  the result
    points at a string literal and must not be modified or freed. */
 char *
 protocol_to_str(int protocol) {
   char *label = "Unknown Protocol";

 #ifdef IPPROTO_TCP
   if (IPPROTO_TCP == protocol) {
     label = "TCP";
   }
 #endif
 #ifdef IPPROTO_UDP
   if (IPPROTO_UDP == protocol) {
     label = "UDP";
   }
 #endif
 #ifdef IPPROTO_SCTP
   if (IPPROTO_SCTP == protocol) {
     label = "SCTP";
   }
 #endif
 #ifdef IPPROTO_DCCP
   if (IPPROTO_DCCP == protocol) {
     label = "DCCP";
   }
 #endif
 #ifdef IPPROTO_SDP
   if (IPPROTO_SDP == protocol) {
     label = "SDP";
   }
 #endif

   return label;
 }


  /* This routine retrieves interesting aspects of tcp for the data
     connection; for now that is just the maximum segment size.  it is
     called during the timing of the test, so anything added here must
     be quick to retrieve - slower queries belong in a second routine
     called outside of the timing loop.

     socket  the data socket to query
     mss     receives the TCP_MAXSEG value, or -1 when the platform has
             no TCP_MAXSEG or the lookup fails (a message is written
             to "where" in the failure cases) */
 static
 void
 get_tcp_info(SOCKET socket, int *mss)
 {

 #ifdef TCP_MAXSEG
   struct protoent *tcp_proto;
   netperf_socklen_t sock_opt_len;

   /* getprotobyname() returns NULL when the protocols database has no
      "tcp" entry; do not dereference it blindly */
   tcp_proto = getprotobyname("tcp");
   if (NULL == tcp_proto) {
     fprintf(where,
             "netperf: get_tcp_info: getprotobyname could not find tcp\n");
     fflush(where);
     *mss = -1;
     return;
   }

   /* the length handed to getsockopt describes the buffer receiving
      the option value, which is the caller's int */
   sock_opt_len = sizeof(*mss);
   if (getsockopt(socket,
                  tcp_proto->p_proto,
                  TCP_MAXSEG,
                  (char *)mss,
                  &sock_opt_len) == SOCKET_ERROR) {
     fprintf(where,
             "netperf: get_tcp_info: getsockopt TCP_MAXSEG: errno %d\n",
             errno);
     fflush(where);
     *mss = -1;
   }
 #else
   *mss = -1;
 #endif /* TCP_MAXSEG */
 }


 /* return a pointer to a completed addrinfo chain - prefer
    data_address to controlhost and utilize the specified address
    family.

    controlhost   name to resolve when data_address is NULL
    data_address  name/address to resolve; takes precedence when set
    port          service/port string handed to getaddrinfo()
    family, type, protocol
                  become the ai_family, ai_socktype and ai_protocol
                  hints
    flags         ai_flags hint; AI_CANONNAME is always OR'ed in

    getaddrinfo() is retried, sleeping a second each time, while it
    reports EAI_AGAIN, for a bounded number of attempts.  when it
    rejects the hints (EAI_SOCKTYPE or EAI_BADHINTS) and we asked for
    SCTP or DCCP, the offending hint is dropped and the call repeated
    without counting the attempt; that uncounted retry happens only
    when a hint was actually changed, so a rejection we cannot work
    around ends the loop instead of spinning forever.

    if resolution fails a message is written to "where" and the
    process exits with -1.  every entry in the returned chain has its
    ai_socktype and ai_protocol forced to the requested non-zero
    values; warnings about platform getaddrinfo() quirks are printed
    once per process. */

 struct addrinfo *
 complete_addrinfo(char *controlhost, char *data_address, char *port, int family, int type, int protocol, int flags)
 {
   struct addrinfo hints;
   struct addrinfo *res = NULL;
   struct addrinfo *temp_res;

 #define CHANGED_SOCK_TYPE  0x1
 #define CHANGED_PROTOCOL   0x2
 #define CHANGED_SCTP       0x4
 #define CHANGED_DCCP       0x8
 #define CHANGED_DCCP_SOCK  0x10

   int    change_info = 0;
   /* remembers which warnings were already shown by earlier calls */
   static int change_warning_displayed = 0;

   int count = 0;
   int error = 0;

   char *hostname;

   /* take data-address over controlhost */
   if (data_address)
     hostname = data_address;
   else
     hostname = controlhost;

   if (debug) {
     fprintf(where,
             "complete_addrinfo using hostname %s port %s family %s type %s prot %s flags 0x%x\n",
             hostname,
             port,
             inet_ftos(family),
             inet_ttos(type),
             inet_ptos(protocol),
             flags);
     fflush(where);
   }

   memset(&hints, 0, sizeof(hints));
   hints.ai_family = family;
   hints.ai_socktype = type;
   hints.ai_protocol = protocol;
   hints.ai_flags = flags|AI_CANONNAME;

   count = 0;
   do {
     error = getaddrinfo((char *)hostname,
                         (char *)port,
                         &hints,
                         &res);
     count += 1;
     if (error == EAI_AGAIN) {
       if (debug) {
         fprintf(where,"Sleeping on getaddrinfo EAI_AGAIN\n");
         fflush(where);
       }
       sleep(1);
     }
     /* while you see this kludge first, it is actually the second, the
        first being the one for Solaris below. The need for this kludge
        came after implementing the Solaris broken getaddrinfo kludge -
        now we see a kludge in Linux getaddrinfo where if it is given
        SOCK_STREAM and IPPROTO_SCTP it barfs with a -7
        EAI_SOCKTYPE. so, we check if the error was EAI_SOCKTYPE and if
        we were asking for IPPROTO_SCTP and if so, kludge, again... raj
        200?-10-13 and of course, requiring the kludge for SCTP, it is
        no surprise that linux needs a kludge for DCCP...actually not
        only does it need the ai_protocol kludge, it needs an
        ai_socktype kludge too... sigh raj 2008-02-01 */
 #if defined(IPPROTO_SCTP) || defined (IPPROTO_DCCP)
     if (EAI_SOCKTYPE == error
 #ifdef EAI_BADHINTS
         || EAI_BADHINTS == error
 #endif
         ) {
       /* set when one of the kludges below really altered the hints */
       int hints_kludged = 0;

       /* we ass-u-me this is the Linux getaddrinfo bug, clear the
          hints.ai_protocol field, and set some state "remembering"
          that we did this so the code for the Solaris kludge can do
          the fix-up for us. */
 #if defined(IPPROTO_DCCP)
       /* only tweak on this one the second time around, after we've
          kludged the ai_protocol field */
       if ((hints.ai_socktype == SOCK_DCCP) &&
           (hints.ai_protocol == 0)) {
         change_info |= CHANGED_DCCP_SOCK;
         hints.ai_socktype = 0;
         /* we need to give it some sort of IPPROTO or it gets unhappy,
            so for now, pick one from deep within the colon and use
            IPPROTO_TCP */
         hints.ai_protocol = IPPROTO_TCP;
         hints_kludged = 1;
       }

       if (hints.ai_protocol == IPPROTO_DCCP) {
         change_info |= CHANGED_DCCP;
         hints.ai_protocol = 0;
         hints_kludged = 1;
       }

 #endif
 #if defined(IPPROTO_SCTP)
       if (hints.ai_protocol == IPPROTO_SCTP) {
         change_info |= CHANGED_SCTP;
         hints.ai_protocol = 0;
         hints_kludged = 1;
       }
 #endif

       /* flip error over to EAI_AGAIN and make sure we don't "count"
          this time around the loop - but only when the hints were
          really changed.  retrying with identical hints would fail
          the same way every time and never leave the loop. */
       if (hints_kludged) {
         error = EAI_AGAIN;
         count -= 1;
       }
     }
 #endif
   } while ((error == EAI_AGAIN) && (count <= 5));

   if (error) {
     fprintf(where,
             "complete_addrinfo: could not resolve '%s' port '%s' af %d",
             hostname,
             port,
             family);
     fprintf(where,
             "\n\tgetaddrinfo returned %d %s\n",
             error,
             gai_strerror(error));
     fflush(where);
     exit(-1);
   }

   /* there exists at least one platform - Solaris 10 - that does not
      seem to completely honor the ai_protocol and/or ai_socktype one
      sets in the hints parm to the getaddrinfo call.  so, we need to
      walk the list of entries returned and if either of those do not
      match what we asked for, we need to go ahead and set them
      "correctly" this is based in part on some earlier SCTP-only code
      from previous revisions.  raj 2006-10-09 */

   temp_res = res;

   while (temp_res) {

     if ((type)  &&
         (temp_res->ai_socktype != type)) {
       change_info |= CHANGED_SOCK_TYPE;
       if (debug) {
         fprintf(where,
                 "WARNING! Changed bogus getaddrinfo socket type %d to %d\n",
                 temp_res->ai_socktype,
                 type);
         fflush(where);
       }
       temp_res->ai_socktype = type;
     }

     if ((protocol) &&
         (temp_res->ai_protocol != protocol)) {
       change_info |= CHANGED_PROTOCOL;
       if (debug) {
         fprintf(where,
                 "WARNING! Changed bogus getaddrinfo protocol %d to %d\n",
                 temp_res->ai_protocol,
                 protocol);
         fflush(where);
       }
       temp_res->ai_protocol = protocol;
     }
     temp_res = temp_res->ai_next;
   }

   if ((change_info & CHANGED_SOCK_TYPE) &&
       !(change_warning_displayed & CHANGED_SOCK_TYPE)) {
     change_warning_displayed |= CHANGED_SOCK_TYPE;
     fprintf(where,
             "WARNING! getaddrinfo returned a socket type which did not\n");
     fprintf(where,
             "match the requested type.  Please contact your vendor for\n");
     fprintf(where,
             "a fix to this bug in getaddrinfo()\n");
     fflush(where);
   }

   /* if we dropped the protocol hint, it would be for a protocol that
      getaddrinfo() wasn't supporting yet, not for the bug that it took
      our hint and still returned zero. raj 2006-10-16 */
   /* as there is now an open bug against (Open)Solaris (id 6847733) on
      this behaviour we will only emit this warning if debug is set
      under Solaris and will continue to emit it under any circumstance
      on other platforms should it arise. raj 2009-06-03 */
   if ((change_info & CHANGED_PROTOCOL) &&
       !(change_warning_displayed & CHANGED_PROTOCOL) &&
 #ifdef __sun
       (debug) &&
 #endif
       (hints.ai_protocol != 0)) {
     change_warning_displayed |= CHANGED_PROTOCOL;
     fprintf(where,
             "WARNING! getaddrinfo returned a protocol other than the\n");
     fprintf(where,
             "requested protocol.  Please contact your vendor for\n");
     fprintf(where,
             "a fix to this bug in getaddrinfo()\n");
     fflush(where);
   }

   if ((change_info & CHANGED_SCTP) &&
       !(change_warning_displayed & CHANGED_SCTP)) {
     change_warning_displayed |= CHANGED_SCTP;
     fprintf(where,
             "WARNING! getaddrinfo on this platform does not accept IPPROTO_SCTP!\n");
     fprintf(where,
             "Please contact your vendor for a fix to this bug in getaddrinfo().\n");
     fflush(where);
   }

   if ((change_info & CHANGED_DCCP) &&
       !(change_warning_displayed & CHANGED_DCCP)) {
     change_warning_displayed |= CHANGED_DCCP;
     fprintf(where,
             "WARNING! getaddrinfo on this platform does not accept IPPROTO_DCCP!\n");
     fprintf(where,
             "Please contact your vendor for a fix to this bug in getaddrinfo().\n");
     fflush(where);
   }


   if (debug) {
     dump_addrinfo(where, res, hostname, port, family);
   }

   return(res);
 }

 /* fill in the addrinfo chains for both ends of the data connection.

    remote       receives the chain for the remote data endpoint
    local        receives the chain for the local data endpoint,
                 resolved with AI_PASSIVE added to flags
    remote_host  control-connection host, used for the remote when no
                 remote_data_address was given
    type, protocol, flags
                 passed through to complete_addrinfo()

    side effects: when local_data_address is NULL a HOSTNAMESIZE
    buffer is allocated for it and filled in (it is not freed here);
    when remote_data_address is NULL it is pointed at remote_host.  an
    allocation failure is reported on "where" and the process exits
    with -1. */
 void
 complete_addrinfos(struct addrinfo **remote,struct addrinfo **local, char remote_host[], int type, int protocol, int flags) {

   *remote = complete_addrinfo(remote_host,
                               remote_data_address,
                               remote_data_port,
                               remote_data_family,
                               type,
                               protocol,
                               flags);

   /* OK, if the user has not specified a local data endpoint address
      (test-specific -L), pick the local data endpoint address based on
      the remote data family info (test-specific -H or -4 or -6
      option).  if the user has not specified remote data addressing
      info (test-specific -H, -4 -6) pick something based on the local
      control connection address (ie the global -L option). */

   if (NULL == local_data_address) {
     local_data_address = malloc(HOSTNAMESIZE);
     if (NULL == local_data_address) {
       fprintf(where,
               "complete_addrinfos: could not allocate local_data_address\n");
       fflush(where);
       exit(-1);
     }
     if (NULL == remote_data_address) {
       if (debug) {
         fprintf(where,
                 "local_data_address not set, using local_host_name of '%s'\n",
                 local_host_name);
         fflush(where);
       }
       /* bound the copy to the buffer we just allocated and make sure
          the result is terminated even if the name gets truncated */
       strncpy(local_data_address,local_host_name,HOSTNAMESIZE - 1);
       local_data_address[HOSTNAMESIZE - 1] = '\0';
     }
     else {
       if (debug) {
         fprintf(where,
                 "local_data_address not set, using address family info\n");
         fflush(where);
       }
       /* by default, use 0.0.0.0 - assume IPv4 */
       strcpy(local_data_address,"0.0.0.0");
 #if defined(AF_INET6)
       if ((AF_INET6 == local_data_family) ||
           ((AF_UNSPEC == local_data_family) &&
            (AF_INET6 == remote_data_family)) ||
           ((AF_UNSPEC == local_data_family) &&
            (AF_INET6 == (*remote)->ai_family))) {
         strcpy(local_data_address,"::0");
       }
 #endif
     }
   }

   /* local_data_address is never NULL by now, so the first argument
      is only a placeholder that complete_addrinfo() will not use */
   *local = complete_addrinfo("what to put here?",
                              local_data_address,
                              local_data_port,
                              local_data_family,
                              type,
                              protocol,
                              flags|AI_PASSIVE);

   /* OK, at this point, if remote_data_address is NULL, we know that
      we used the value of remote_host (the control connection) for the
      remote, which means we can/should set remote_data_address to
      remote_host so the "omni" output routines can use that global
      variable. at least i think I can get away with that :) I'm sure
      that at some point I'll find-out that I need to allocate
      something for it rather than mess with the pointers, but that can
      wait.  famous last words of raj 2008-01-25 */
   if (remote_data_address == NULL)
     remote_data_address = remote_host;
 }

 /* write the wildcard address for the given family into hostname
    ("::0" for AF_INET6 when the platform has it, "0.0.0.0" for
    anything else) and the decimal port number into portstr.  both
    buffers are supplied by the caller and must be big enough; no
    lengths are checked here. */
 void
 set_hostname_and_port(char *hostname, char *portstr, int family, int port)
 {
   static const char any_v4[] = "0.0.0.0";

   /* start with the IPv4 wildcard, terminator included */
   memcpy(hostname, any_v4, sizeof(any_v4));
 #if defined AF_INET6
   if (AF_INET6 == family) {
     static const char any_v6[] = "::0";

     memcpy(hostname, any_v6, sizeof(any_v6));
   }
 #endif

   sprintf(portstr, "%u", (unsigned int)port);

 }

 /* return, in host byte order, the port number held in the sockaddr
    of the first entry of res.  only AF_INET and (where available)
    AF_INET6 are understood; any other family is reported on "where"
    and the process exits with -1. */
 static unsigned short
 get_port_number(struct addrinfo *res)
 {
   if (AF_INET == res->ai_family) {
     struct sockaddr_in *v4 = (struct sockaddr_in *)res->ai_addr;
     return(ntohs(v4->sin_port));
   }
 #if defined(AF_INET6)
   if (AF_INET6 == res->ai_family) {
     struct sockaddr_in6 *v6 = (struct sockaddr_in6 *)res->ai_addr;
     return(ntohs(v6->sin6_port));
   }
 #endif

   fprintf(where,
           "Given Unexpected Address Family of %u\n",res->ai_family);
   fflush(where);
   exit(-1);
 }

 /* copy the raw address and port out of the sockaddr of the first
    entry of res.  at most len bytes of the address are copied into
    addr, and *port receives the port field exactly as stored in the
    sockaddr (no byte-order conversion is done here).  for an
    unrecognized family *port is set to 0xDEADBEEF and the text "UNKN
    FAMILY" is strncpy'd into addr. */
 static void
 extract_inet_address_and_port(struct addrinfo *res, void *addr, int len, int *port)
 {
   if (AF_INET == res->ai_family) {
     struct sockaddr_in *v4 = (struct sockaddr_in *)res->ai_addr;

     *port = v4->sin_port;
     memcpy(addr,&(v4->sin_addr),min(len,sizeof(v4->sin_addr)));
     return;
   }
 #if defined(AF_INET6)
   if (AF_INET6 == res->ai_family) {
     struct sockaddr_in6 *v6 = (struct sockaddr_in6 *)res->ai_addr;

     *port = v6->sin6_port;
     memcpy(addr,&(v6->sin6_addr),min(len,sizeof(v6->sin6_addr)));
     return;
   }
 #endif

   /* not a family we know how to pick apart */
   *port = 0xDEADBEEF;
   strncpy(addr,"UNKN FAMILY",len);
 }

 /* store port, converted to network byte order, into the sockaddr of
    the first entry of res according to its address family.  a family
    other than AF_INET or (where available) AF_INET6 is reported on
    "where" and the process exits with -1. */
 void
 set_port_number(struct addrinfo *res, unsigned short port)
 {
   if (AF_INET == res->ai_family) {
     struct sockaddr_in *v4 = (struct sockaddr_in *)res->ai_addr;
     v4->sin_port = htons(port);
     return;
   }
 #if defined(AF_INET6)
   if (AF_INET6 == res->ai_family) {
     struct sockaddr_in6 *v6 = (struct sockaddr_in6 *)res->ai_addr;
     v6->sin6_port = htons(port);
     return;
   }
 #endif

   fprintf(where,
           "set_port_number Unexpected Address Family of %u\n",res->ai_family);
   fflush(where);
   exit(-1);
 }

 /* stuff the address family, port number and address into a
    sockaddr. for now, we will go ahead and zero-out the sockaddr
    first.

    sockaddr  storage to fill in; cleared before use
    family    AF_INET or (where available) AF_INET6; anything else is
              reported on "where" and the process exits with -1
    addr      the address: 4 bytes for AF_INET, 16 for AF_INET6.  the
              bytes are copied into the sockaddr as given, and after
              the copy the caller's buffer is rewritten with each
              int-sized word passed through htonl()
    port      port number in host order; stored with htons()

    NOTE(review): the htonl() pass touches the caller's buffer rather
    than the sockaddr - that is how the code has always behaved and it
    is kept here; confirm with the callers whether it is intended. */
 void
 set_sockaddr_family_addr_port(struct sockaddr_storage *sockaddr, int family, void *addr, int port) {

   memset(sockaddr,0,sizeof(struct sockaddr_storage));

   switch (family) {
   case AF_INET: {
     struct sockaddr_in *foo = (struct sockaddr_in *)sockaddr;
     foo->sin_port = htons((unsigned short) port);
     foo->sin_family = (unsigned short) family;
     memcpy(&(foo->sin_addr),addr,sizeof(foo->sin_addr));
     *(int *)addr = htonl(*(int *)addr);
     break;
   }
 #if defined(AF_INET6)
   case AF_INET6: {
     struct sockaddr_in6 *foo = (struct sockaddr_in6 *)sockaddr;
     int *bar;
     int i;
     foo->sin6_port = htons((unsigned short) port);
     foo->sin6_family = (unsigned short) family;
     memcpy(&(foo->sin6_addr),addr,sizeof(foo->sin6_addr));
     /* how to put this into "host" order? */
     /* walk words 0 .. n-1 of the address.  counting down from n to 1
        would touch the word just past the end of the address and
        never reach word 0 */
     bar = addr;
     for (i = 0; i < (int)(sizeof(foo->sin6_addr)/sizeof(int)); i++) {
       bar[i] = htonl(bar[i]);
     }
     break;
   }
 #endif
   default:
     fprintf(where,
             "set_sockaddr_family_addr_port Unexpected Address Family of %u\n",family);
     fflush(where);
     exit(-1);
   }
 }

 /* pull the port and address out of the sockaddr in host format

    sockaddr  the socket address to pick apart
    family    the family the caller expects to find in it
    addr      receives the address with each int-sized word passed
              through ntohl(): 4 bytes for AF_INET, 16 for AF_INET6
    port      receives the port number in host order

    returns -1 (after a message on "where") when the family stored in
    the sockaddr differs from "family".  otherwise, for AF_INET the
    result is 1 when the address equals INADDR_ANY and 0 when it does
    not; for AF_INET6 the result is 1 when any word of the address is
    non-zero and 0 when all are zero.  a family that is neither of
    those is reported on "where" and the process exits with -1.

    NOTE(review): the two families use opposite senses for a return
    of 1 - confirm with the callers which one is intended. */
 int
 get_sockaddr_family_addr_port(struct sockaddr_storage *sockaddr, int family, void *addr, int *port)
 {
   struct sockaddr_in *sin = (struct sockaddr_in *)sockaddr;

   int ret = 0;
   if (sin->sin_family != family) {
     fprintf(where,
             "get_sockaddr_family_addr_port family mismatch %d vs %d\n",
             sin->sin_family,
             family);
     fflush(where);
     return -1;
   }

   switch(family) {
   case  AF_INET: {
     *port = ntohs(sin->sin_port);
     memcpy(addr,&(sin->sin_addr),sizeof(sin->sin_addr));
     if (*(int *)addr == INADDR_ANY) ret = 1;
     *(int *)addr = ntohl(*(int *)addr);
     break;
   }
 #ifdef AF_INET6
   case AF_INET6: {
     int *foo;
     int i;
     struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)sockaddr;
     ret = 0;
     *port = ntohs(sin6->sin6_port);
     memcpy(addr,&(sin6->sin6_addr), sizeof(sin6->sin6_addr));
     /* how to put this into "host" order? */
     /* walk words 0 .. n-1 of the address.  counting down from n to 1
        would read and write the word just past the end of the address
        and never look at word 0 */
     foo = addr;
     for (i = 0; i < (int)(sizeof(sin6->sin6_addr)/sizeof(int)); i++) {
       if (foo[i] != 0) ret = 1;
       foo[i] = ntohl(foo[i]);
     }
     break;
   }
 #endif
   default:
     fprintf(where,
             "get_sockaddr_family_addr_port: Unexpected Address Family of %u\n",family);
     fflush(where);
     exit(-1);
   }
   return ret;
 }


  /* This routine will create a data (listen) socket with the
    appropriate options set and return it to the caller. this replaces
    all the duplicate code in each of the test routines and should help
    make things a little easier to understand. since this routine can be
    called by either the netperf or netserver programs, all output
    should be directed towards "where." family is generally AF_INET and
    type will be either SOCK_STREAM or SOCK_DGRAM.  This routine will
    also be used by the "SCTP" tests, hence the slightly strange-looking
    SCTP stuff in the classic bsd sockets test file... vlad/raj
    2005-03-15

    res supplies the family, socket type and protocol for socket() as
    well as the local address handed to bind().

    Returns the new socket. A socket() failure is reported on "where"
    and ends the process with exit(1); a TCP_CORK failure is reported
    with perror() and also exits. Failures of the copy-avoidance,
    nodelay and SO_REUSEADDR setsockopt() calls are reported and
    otherwise ignored, and a bind() failure is only reported when
    debug is set. */

 SOCKET
 create_data_socket(struct addrinfo *res)
 {

   SOCKET temp_socket;
   int one;
   int    on  = 1;
   /* level used for the SO_REUSEADDR setsockopt() further down */
   int    reuse_level = SOL_SOCKET;


   /*set up the data socket                        */
   temp_socket = socket(res->ai_family,
                        res->ai_socktype,
                        res->ai_protocol);

   if (temp_socket == INVALID_SOCKET){
     fprintf(where,
             "netperf: create_data_socket: socket: errno %d fam %s type %s prot %s errmsg %s\n",
             errno,
             inet_ftos(res->ai_family),
             inet_ttos(res->ai_socktype),
             inet_ptos(res->ai_protocol),
             strerror(errno));
     fflush(where);
     exit(1);
   }

   if (debug) {
     fprintf(where,"create_data_socket: socket %d obtained...\n",temp_socket);
     fflush(where);
   }

   /* Modify the local socket size. The reason we alter the send buffer
    size here rather than when the connection is made is to take care
    of decreases in buffer size. Decreasing the window size after
    connection establishment is a TCP no-no. Also, by setting the
    buffer (window) size before the connection is established, we can
    control the TCP MSS (segment size). The MSS is never (well, should
    never be) more that 1/2 the minimum receive buffer size at each
    half of the connection.  This is why we are altering the receive
    buffer size on the sending side of a unidirectional transfer. If
    the user has not requested that the socket buffers be altered, we
    will try to find-out what their values are. If we cannot touch the
    socket buffer in any way, we will set the values to -1 to indicate
    that.  */

   /* all the oogy nitty gritty stuff moved from here into the routine
      being called below, per patches from davidm to workaround the bug
      in Linux getsockopt().  raj 2004-06-15 */
   set_sock_buffer (temp_socket, SEND_BUFFER, lss_size_req, &lss_size);
   set_sock_buffer (temp_socket, RECV_BUFFER, lsr_size_req, &lsr_size);

   /* now, we may wish to enable the copy avoidance features on the */
   /* local system. of course, this may not be possible... */

 #ifdef SO_RCV_COPYAVOID
   if (loc_rcvavoid) {
     if (setsockopt(temp_socket,
                    SOL_SOCKET,
                    SO_RCV_COPYAVOID,
                    (const char *)&loc_rcvavoid,
                    sizeof(int)) == SOCKET_ERROR) {
       fprintf(where,
               "netperf: create_data_socket: Could not enable receive copy avoidance");
       fflush(where);
       loc_rcvavoid = 0;
     }
   }
 #else
   /* it wasn't compiled in... */
   loc_rcvavoid = 0;
 #endif /* SO_RCV_COPYAVOID */

 #ifdef SO_SND_COPYAVOID
   if (loc_sndavoid) {
     if (setsockopt(temp_socket,
                    SOL_SOCKET,
                    SO_SND_COPYAVOID,
                    (const char *)&loc_sndavoid,
                    sizeof(int)) == SOCKET_ERROR) {
       fprintf(where,
               "netperf: create_data_socket: Could not enable send copy avoidance");
       fflush(where);
       loc_sndavoid = 0;
     }
   }
 #else
   /* it was not compiled in... */
   loc_sndavoid = 0;
 #endif

   /* Now, we will see about setting the TCP_NODELAY flag on the local */
   /* socket. We will only do this for those systems that actually */
   /* support the option. If it fails, note the fact, but keep going. */
   /* If the user tries to enable TCP_NODELAY on a UDP socket, this */
   /* will cause an error to be displayed */

   /* well..... long ago and far away that would have happened, in
      particular because we would always use IPPROTO_TCP here.
      however, now we are using res->ai_protocol, which will be
      IPPROTO_UDP, and while HP-UX, and I suspect no-one else on the
      planet has a UDP_mumble option that overlaps with TCP_NODELAY,
      sure as knuth made little green programs, linux has a UDP_CORK
      option that is defined as a value of 1, which is the same as
      TCP_NODELAY under Linux.  So, when asking for -D and
      "TCP_NODELAY" under Linux, we are actually setting UDP_CORK
      instead of getting an error like every other OS on the
      planet. joy and rupture. this stops a UDP_RR test cold sooo we
      have to make sure that res->ai_protocol actually makes sense for
      a _NODELAY setsockopt() or a UDP_RR test on Linux where someone
      mistakenly sets -D will hang.  raj 2005-04-21 */

 #if defined(TCP_NODELAY) || defined(SCTP_NODELAY)
   if ((loc_nodelay) && (res->ai_protocol != IPPROTO_UDP)) {

     /* strictly speaking, since the if defined above is an OR, we
        should probably check against TCP_NODELAY being defined here.
        however, the likelihood of SCTP_NODELAY being defined and
        TCP_NODELAY _NOT_ being defined is, probably :), epsilon.  raj
        2005-03-15 */

     int option = TCP_NODELAY;

     /* I suspect that WANT_SCTP would suffice here since that is the
        only time we would have called getaddrinfo with a hints asking
        for SCTP, but just in case there is an SCTP implementation out
        there _without_ SCTP_NODELAY... raj 2005-03-15 */
     /* change this to IPPROTO_SCTP rather than WANT_SCTP to better fit
        with the modus operandi of the new "omni" tests. raj
        2008-02-04 */
 #if defined(IPPROTO_SCTP) && defined(SCTP_NODELAY)
     if (IPPROTO_SCTP == res->ai_protocol) {
       option = SCTP_NODELAY;
     }
 #endif

     one = 1;
     if(setsockopt(temp_socket,
                   res->ai_protocol,
                   option,
                   (char *)&one,
                   sizeof(one)) == SOCKET_ERROR) {
       fprintf(where,
               "netperf: create_data_socket: nodelay: errno %d\n",
               errno);
       fflush(where);
     }

     if (debug > 1) {
       fprintf(where,
               "netperf: create_data_socket: [TCP|SCTP]_NODELAY requested...\n");
       fflush(where);
     }
   }
 #else /* TCP_NODELAY */

   loc_nodelay = 0;

 #endif /* TCP_NODELAY */

 #if defined(TCP_CORK)

   if (loc_tcpcork > 0) {
     /* the user wishes for us to set TCP_CORK on the socket. the
        option level is given as IPPROTO_TCP directly: looking it up
        with getprotobyname("tcp") returns a null pointer when the
        protocols database cannot be read, and dereferencing that
        would crash */
     one = 1;
     if (setsockopt(temp_socket,
                    IPPROTO_TCP,
                    TCP_CORK,
                    (char *)&one,
                    sizeof(one)) == SOCKET_ERROR) {
       perror("netperf: create_data_socket: tcp_cork");
       exit(1);
     }
     if (debug) {
       fprintf(where,"create_data_socket: tcp_cork...\n");
     }
   }

 #endif /* TCP_CORK */

   /* since some of the UDP tests do not do anything to cause an
      implicit bind() call, we need to be rather explicit about our
      bind() call here. even if the address and/or the port are zero
      (INADDR_ANY etc). raj 2004-07-20 */

   /* it is REALLY SILLY THAT THIS SHOULD BE NEEDED!! I should be able
      to use SOL_SOCKET for this just like TCP and SCTP */
   /* IT IS EVEN SILLIER THAT THERE COULD BE SYSTEMS WITH IPPROTO_DCCP
      and no SOL_DCCP - on those we simply stay with SOL_SOCKET */
 #if defined(IPPROTO_DCCP) && defined(SOL_DCCP)
   if (res->ai_protocol == IPPROTO_DCCP) {
     reuse_level = SOL_DCCP;
   }
 #endif

   if (setsockopt(temp_socket,
                  reuse_level,
                  SO_REUSEADDR,
                  (const char *)&on,
                  sizeof(on)) < 0) {
     fprintf(where,
             "netperf: create_data_socket: SO_REUSEADDR failed %d\n",
             errno);
     fflush(where);
   }

   if (bind(temp_socket,
            res->ai_addr,
            res->ai_addrlen) < 0) {
     /* a failed bind() is only mentioned when debugging; the socket
        is still returned to the caller */
     if (debug) {
       fprintf(where,
               "netperf: create_data_socket: data socket bind failed errno %d\n",
               errno);
       fprintf(where," port: %d\n",get_port_number(res));
       fflush(where);
     }
   }


   return(temp_socket);

 }

 #ifdef KLUDGE_SOCKET_OPTIONS


  /* This routine is for those BROKEN systems which do not correctly */
  /* pass socket attributes through calls such as accept(). It should */
  /* only be called for those broken systems. I *really* don't want to */
  /* have this, but even broken systems must be measured. raj 11/95 */
  /* temp_socket is the socket to fix up: its send and receive buffer */
  /* sizes are set again and, when loc_nodelay is set, so is */
  /* TCP_NODELAY. */
 void
 kludge_socket_options(int temp_socket)
 {

 #ifdef TCP_NODELAY
   /* option value handed to the TCP_NODELAY setsockopt() below */
   int one = 1;
 #endif

   set_sock_buffer(temp_socket, SEND_BUFFER, lss_size_req, &lss_size);
   set_sock_buffer(temp_socket, RECV_BUFFER, lsr_size_req, &lsr_size);

   /* now, we may wish to enable the copy avoidance features on the */
   /* local system. of course, this may not be possible... */
   /* those calls were only valid for HP-UX, and I know that HP-UX is */
   /* written correctly, and so we do not need to include those calls */
   /* in this kludgy routine. raj 11/95 */


   /* Now, we will see about setting the TCP_NODELAY flag on the local */
   /* socket. We will only do this for those systems that actually */
   /* support the option. If it fails, note the fact, but keep going. */
   /* If the user tries to enable TCP_NODELAY on a UDP socket, this */
   /* will cause an error to be displayed */

 #ifdef TCP_NODELAY
   if (loc_nodelay) {
     /* the option level is given as IPPROTO_TCP directly: looking it */
     /* up with getprotobyname("tcp") returns a null pointer when the */
     /* protocols database cannot be read, and dereferencing that */
     /* would crash */
     if(setsockopt(temp_socket,
                   IPPROTO_TCP,
                   TCP_NODELAY,
                   (char *)&one,
                   sizeof(one)) == SOCKET_ERROR) {
       fprintf(where,"netperf: kludge_socket_options: nodelay: errno %d\n",
               errno);
       fflush(where);
     }

     if (debug > 1) {
       fprintf(where,
               "netperf: kludge_socket_options: TCP_NODELAY requested...\n");
       fflush(where);
     }
   }
 #else /* TCP_NODELAY */

   loc_nodelay = 0;

 #endif /* TCP_NODELAY */

 }

 #endif /* KLUDGE_SOCKET_OPTIONS */


 /* hand back a pointer to the raw address stored inside info->ai_addr:
    the sin_addr member for AF_INET, the sin6_addr member for AF_INET6
    (where that family is defined). any other family is reported on
    stderr and ends the process with exit(-1). */
 static void *
 get_address_address(struct addrinfo *info)
 {
   if (info->ai_family == AF_INET) {
     struct sockaddr_in *v4 = (struct sockaddr_in *)info->ai_addr;
     return &(v4->sin_addr);
   }

 #if defined(AF_INET6)
   if (info->ai_family == AF_INET6) {
     struct sockaddr_in6 *v6 = (struct sockaddr_in6 *)info->ai_addr;
     return &(v6->sin6_addr);
   }
 #endif

   /* neither family we know how to pick apart */
   fprintf(stderr,"we never expected to get here in get_address_address\n");
   fflush(stderr);
   exit(-1);
 }

 #if defined(WIN32)
 #if !defined(InetNtop)
 /* +*+ Why isn't this in the winsock headers yet? */
 /* declaration only: on WIN32 builds where the InetNtop macro is not
    defined, give inet_ntop() a prototype here. no definition of it
    appears in this part of the file. */
 const char *
 inet_ntop(int af, const void *src, char *dst, size_t size);
 #endif
 #endif

 /* This routine is a generic test header printer for the topmost header.

    test_name    title of the test; written out verbatim
    source       local endpoint; its canonical name, numeric address,
                 port and address family are printed after " from"
    destination  remote endpoint; printed the same way after " to"

    Everything goes to "where" as a single line. After the endpoints
    come optional " : ..." tags driven by the global settings and the
    compile-time options checked below, then a newline. */
 void
 print_top_test_header(char test_name[], struct addrinfo *source, struct addrinfo *destination)
 {

 #if defined(AF_INET6)
   char address_buf[INET6_ADDRSTRLEN];
 #else
   char address_buf[16]; /* magic constant */
 #endif

   /* we want to have some additional, interesting information in */
   /* the headers. we know some of it here, but not all, so we will */
   /* only print the test title here and will print the results */
   /* titles after the test is finished */

   /* the title is data, not a format: go through "%s" so that a '%' */
   /* in the name can never be taken as a conversion specification */
   fprintf(where,"%s",test_name);

   /* start from an empty string so that something printable is left */
   /* in the buffer should inet_ntop() fail */
   address_buf[0] = '\0';
   inet_ntop(source->ai_family,get_address_address(source),address_buf,sizeof(address_buf));
   /* ai_canonname can be a null pointer, and handing that to %s is */
   /* undefined, so substitute a fixed string */
   fprintf(where,
           " from %s (%s) port %u %s",
           source->ai_canonname ? source->ai_canonname : "(null)",
           address_buf,
           get_port_number(source),
           inet_ftos(source->ai_family));
   address_buf[0] = '\0';
   inet_ntop(destination->ai_family,get_address_address(destination),address_buf,sizeof(address_buf));
   fprintf(where,
           " to %s (%s) port %u %s",
           destination->ai_canonname ? destination->ai_canonname : "(null)",
           address_buf,
           get_port_number(destination),
           inet_ftos(destination->ai_family));

   if (iteration_max > 1) {
     fprintf(where,
             " : +/-%.3f%% @ %2d%% conf. %s",
             interval/0.02,
             confidence_level,
             result_confidence_only ? " on result only" : "");
   }
   if ((loc_nodelay > 0) || (rem_nodelay > 0)) {
     fprintf(where," : nodelay");
   }
   if ((loc_sndavoid > 0) ||
       (loc_rcvavoid > 0) ||
       (rem_sndavoid > 0) ||
       (rem_rcvavoid > 0)) {
     fprintf(where," : copy avoidance");
   }

   if (no_control) {
     fprintf(where," : no control");
   }

 #ifdef WANT_HISTOGRAM
   fprintf(where," : histogram");
 #endif /* WANT_HISTOGRAM */

 #ifdef WANT_INTERVALS
 #ifndef WANT_SPIN
   fprintf(where," : interval");
 #else
   fprintf(where," : spin interval");
 #endif
 #endif /* WANT_INTERVALS */

 #ifdef DIRTY
   fprintf(where," : dirty data");
 #endif /* DIRTY */
 #ifdef WANT_DEMO
   fprintf(where," : demo");
 #endif
 #ifdef WANT_FIRST_BURST
   /* a little hokey perhaps, but we really only want this to be
      emitted for tests where it actually is used, which means a
      "REQUEST/RESPONSE" test. raj 2005-11-10 */
   if (strstr(test_name,"REQUEST/RESPONSE")) {
     fprintf(where," : first burst %d",first_burst_size);
   }
 #endif
   if (cpu_binding_requested) {
     fprintf(where," : cpu bind");
   }
   fprintf(where,"\n");

 }


 /* This routine implements the TCP unidirectional data transfer test */
 /* (a.k.a. stream) for the sockets interface. It receives its */
 /* parameters via global variables from the shell and writes its */
 /* output to the standard output. */


 void
 send_tcp_stream(char remote_host[])
 {

   char *tput_title = "\
 Recv   Send    Send                          \n\
 Socket Socket  Message  Elapsed              \n\
 Size   Size    Size     Time     Throughput  \n\
 bytes  bytes   bytes    secs.    %s/sec  \n\n";

   char *tput_fmt_0 =
     "%7.2f %s\n";

   char *tput_fmt_1 =
     "%6d %6d %6d    %-6.2f   %7.2f   %s\n";

   char *cpu_title = "\
 Recv   Send    Send                          Utilization       Service Demand\n\
 Socket Socket  Message  Elapsed              Send     Recv     Send    Recv\n\
 Size   Size    Size     Time     Throughput  local    remote   local   remote\n\
 bytes  bytes   bytes    secs.    %-8.8s/s  %% %c      %% %c      us/KB   us/KB\n\n";

   char *cpu_fmt_0 =
     "%6.3f %c %s\n";

   char *cpu_fmt_1 =
     "%6d %6d %6d    %-6.2f     %7.2f   %-6.2f   %-6.2f   %-6.3f  %-6.3f %s\n";

   char *ksink_fmt = "\n\
 Alignment      Offset         %-8.8s %-8.8s    Sends   %-8.8s Recvs\n\
 Local  Remote  Local  Remote  Xfered   Per                 Per\n\
 Send   Recv    Send   Recv             Send (avg)          Recv (avg)\n\
 %5d   %5d  %5d   %5d %6.4g  %6.2f    %6d   %6.2f %6d\n";

   char *ksink_fmt2 = "\n\
 Maximum\n\
 Segment\n\
 Size (bytes)\n\
 %6d\n";


   float			elapsed_time;

   /* what we want is to have a buffer space that is at least one */
   /* send-size greater than our send window. this will insure that we */
   /* are never trying to re-use a buffer that may still be in the hands */
   /* of the transport. This buffer will be malloc'd after we have found */
   /* the size of the local senc socket buffer. We will want to deal */
   /* with alignment and offset concerns as well. */

   struct ring_elt *send_ring;

   int len;
   unsigned int nummessages = 0;
   SOCKET send_socket;
   int bytes_remaining;
   int tcp_mss = -1;  /* possibly uninitialized on printf far below */

   /* with links like fddi, one can send > 32 bits worth of bytes */
   /* during a test... ;-) at some point, this should probably become a */
   /* 64bit integral type, but those are not entirely common yet */

   unsigned long long local_bytes_sent = 0;
   double	bytes_sent = 0.0;

   float	local_cpu_utilization;
   float	local_service_demand;
   float	remote_cpu_utilization;
   float	remote_service_demand;

   double	thruput;

   struct addrinfo *remote_res;
   struct addrinfo *local_res;

   struct	tcp_stream_request_struct	*tcp_stream_request;
   struct	tcp_stream_response_struct	*tcp_stream_response;
   struct	tcp_stream_results_struct	*tcp_stream_result;

   tcp_stream_request  =
     (struct tcp_stream_request_struct *)netperf_request.content.test_specific_data;
   tcp_stream_response =
     (struct tcp_stream_response_struct *)netperf_response.content.test_specific_data;
   tcp_stream_result   =
     (struct tcp_stream_results_struct *)netperf_response.content.test_specific_data;

 #ifdef WANT_HISTOGRAM
   if (verbosity > 1) {
     time_hist = HIST_new();
   }
 #endif /* WANT_HISTOGRAM */
   /* since we are now disconnected from the code that established the */
   /* control socket, and since we want to be able to use different */
   /* protocols and such, we are passed the name of the remote host and */
   /* must turn that into the test specific addressing information. */

   /* complete_addrinfos will either succede or exit the process */
   complete_addrinfos(&remote_res,
 		     &local_res,
 		     remote_host,
 		     SOCK_STREAM,
 		     IPPROTO_TCP,
 		     0);

   if ( print_headers ) {
     print_top_test_header("TCP STREAM TEST",local_res,remote_res);
   }

   send_ring = NULL;
   confidence_iteration = 1;
   init_stat();

   /* we have a great-big while loop which controls the number of times */
   /* we run a particular test. this is for the calculation of a */
   /* confidence interval (I really should have stayed awake during */
   /* probstats :). If the user did not request confidence measurement */
   /* (no confidence is the default) then we will only go though the */
   /* loop once. the confidence stuff originates from the folks at IBM */

   while (((confidence < 0) && (confidence_iteration < iteration_max)) ||
 	 (confidence_iteration <= iteration_min)) {

     /* initialize a few counters. we have to remember that we might be */
     /* going through the loop more than once. */

     nummessages    =	0;
     bytes_sent     =	0.0;
     times_up       = 	0;

     /*set up the data socket                        */
     send_socket = create_data_socket(local_res);

     if (send_socket == INVALID_SOCKET){
       perror("netperf: send_tcp_stream: tcp stream data socket");
       exit(1);
     }

     if (debug) {
       fprintf(where,"send_tcp_stream: send_socket obtained...\n");
     }

     /* at this point, we have either retrieved the socket buffer sizes, */
     /* or have tried to set them, so now, we may want to set the send */
     /* size based on that (because the user either did not use a -m */
     /* option, or used one with an argument of 0). If the socket buffer */
     /* size is not available, we will set the send size to 4KB - no */
     /* particular reason, just arbitrary... */
     if (send_size == 0) {
       if (lss_size > 0) {
 	send_size = lss_size;
       }
       else {
 	send_size = 4096;
       }
     }

     /* set-up the data buffer ring with the requested alignment and offset. */
     /* note also that we have allocated a quantity */
     /* of memory that is at least one send-size greater than our socket */
     /* buffer size. We want to be sure that there are at least two */
     /* buffers allocated - this can be a bit of a problem when the */
     /* send_size is bigger than the socket size, so we must check... the */
     /* user may have wanted to explicitly set the "width" of our send */
     /* buffers, we should respect that wish... */
     if (send_width == 0) {
       send_width = (lss_size/send_size) + 1;
       if (send_width == 1) send_width++;
     }

     if (send_ring == NULL) {
       /* only allocate the send ring once. this is a networking test, */
       /* not a memory allocation test. this way, we do not need a */
       /* deallocate_buffer_ring() routine, and I don't feel like */
       /* writing one anyway :) raj 11/94 */
       send_ring = allocate_buffer_ring(send_width,
 				       send_size,
 				       local_send_align,
 				       local_send_offset);
     }

     /* If the user has requested cpu utilization measurements, we must */
     /* calibrate the cpu(s). We will perform this task within the tests */
     /* themselves. If the user has specified the cpu rate, then */
     /* calibrate_local_cpu will return rather quickly as it will have */
     /* nothing to do. If local_cpu_rate is zero, then we will go through */
     /* all the "normal" calibration stuff and return the rate back. */

     if (local_cpu_usage) {
       local_cpu_rate = calibrate_local_cpu(local_cpu_rate);
     }

     if (!no_control) {
       /* Tell the remote end to do a listen. The server alters the
 	 socket paramters on the other side at this point, hence the
 	 reason for all the values being passed in the setup
 	 message. If the user did not specify any of the parameters,
 	 they will be passed as 0, which will indicate to the remote
 	 that no changes beyond the system's default should be
 	 used. Alignment is the exception, it will default to 1, which
 	 will be no alignment alterations. */

       netperf_request.content.request_type =	DO_TCP_STREAM;
       tcp_stream_request->send_buf_size	=	rss_size_req;
       tcp_stream_request->recv_buf_size	=	rsr_size_req;
       tcp_stream_request->receive_size	=	recv_size;
       tcp_stream_request->no_delay	=	rem_nodelay;
       tcp_stream_request->recv_alignment	=	remote_recv_align;
       tcp_stream_request->recv_offset	=	remote_recv_offset;
       tcp_stream_request->measure_cpu	=	remote_cpu_usage;
       tcp_stream_request->cpu_rate	=	remote_cpu_rate;
       if (test_time) {
 	tcp_stream_request->test_length	=	test_time;
       }
       else {
 	tcp_stream_request->test_length	=	test_bytes;
       }
       tcp_stream_request->so_rcvavoid	=	rem_rcvavoid;
       tcp_stream_request->so_sndavoid	=	rem_sndavoid;
 #ifdef DIRTY
       tcp_stream_request->dirty_count     =       rem_dirty_count;
       tcp_stream_request->clean_count     =       rem_clean_count;
 #endif /* DIRTY */
       tcp_stream_request->port            =    atoi(remote_data_port);
       tcp_stream_request->ipfamily = af_to_nf(remote_res->ai_family);
       if (debug > 1) {
 	fprintf(where,
 		"netperf: send_tcp_stream: requesting TCP stream test\n");
       }

       send_request();

       /* The response from the remote will contain all of the relevant
          socket parameters for this test type. We will put them back
          into the variables here so they can be displayed if desired.
          The remote will have calibrated CPU if necessary, and will
          have done all the needed set-up we will have calibrated the
          cpu locally before sending the request, and will grab the
          counter value right after the connect returns. The remote
          will grab the counter right after the accept call. This saves
          the hassle of extra messages being sent for the TCP
          tests.  */

       recv_response();

       if (!netperf_response.content.serv_errno) {
 	if (debug)
 	  fprintf(where,"remote listen done.\n");
 	rsr_size	      =	tcp_stream_response->recv_buf_size;
 	rss_size	      =	tcp_stream_response->send_buf_size;
 	rem_nodelay     =	tcp_stream_response->no_delay;
 	remote_cpu_usage=	tcp_stream_response->measure_cpu;
 	remote_cpu_rate = tcp_stream_response->cpu_rate;

 	/* we have to make sure that the server port number is in
 	   network order */
 	set_port_number(remote_res,
 			(short)tcp_stream_response->data_port_number);

 	rem_rcvavoid	= tcp_stream_response->so_rcvavoid;
 	rem_sndavoid	= tcp_stream_response->so_sndavoid;
       }
       else {
 	Set_errno(netperf_response.content.serv_errno);
 	fprintf(where,
 		"netperf: remote error %d",
 		netperf_response.content.serv_errno);
 	perror("");
 	fflush(where);

 	exit(1);
       }
     }

 #ifdef WANT_DEMO
     DEMO_STREAM_SETUP(lss_size,rsr_size)
 #endif

     /*Connect up to the remote port on the data socket  */
     if (connect(send_socket,
 		remote_res->ai_addr,
 		remote_res->ai_addrlen) == INVALID_SOCKET){
       perror("netperf: send_tcp_stream: data socket connect failed");
       exit(1);
     }

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR with the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
   win_kludge_socket = send_socket;
 #endif /* WIN32 */

     /* Data Socket set-up is finished. If there were problems, either */
     /* the connect would have failed, or the previous response would */
     /* have indicated a problem. I failed to see the value of the */
     /* extra  message after the accept on the remote. If it failed, */
     /* we'll see it here. If it didn't, we might as well start pumping */
     /* data. */

     /* Set-up the test end conditions. For a stream test, they can be */
     /* either time or byte-count based. */

     if (test_time) {
       /* The user wanted to end the test after a period of time. */
       times_up = 0;
       bytes_remaining = 0;
       /* in previous revisions, we had the same code repeated throught */
       /* all the test suites. this was unnecessary, and meant more */
       /* work for me when I wanted to switch to POSIX signals, so I */
       /* have abstracted this out into a routine in netlib.c. if you */
       /* are experiencing signal problems, you might want to look */
       /* there. raj 11/94 */
       start_timer(test_time);
     }
     else {
       /* The tester wanted to send a number of bytes. */
       bytes_remaining = test_bytes;
       times_up = 1;
     }

     /* The cpu_start routine will grab the current time and possibly */
     /* value of the idle counter for later use in measuring cpu */
     /* utilization and/or service demand and thruput. */

     cpu_start(local_cpu_usage);

     /* we only start the interval timer if we are using the
        timer-timed intervals rather than the sit and spin ones. raj
        2006-02-06 */
 #if defined(WANT_INTERVALS)
     INTERVALS_INIT();
 #endif /* WANT_INTERVALS */

     /* before we start, initialize a few variables */

 #ifdef WANT_DEMO
       if (demo_mode) {
 	HIST_timestamp(demo_one_ptr);
       }
 #endif


     /* We use an "OR" to control test execution. When the test is */
     /* controlled by time, the byte count check will always return false. */
     /* When the test is controlled by byte count, the time test will */
     /* always return false. When the test is finished, the whole */
     /* expression will go false and we will stop sending data. */

     while ((!times_up) || (bytes_remaining > 0)) {

 #ifdef DIRTY
       access_buffer(send_ring->buffer_ptr,
 		    send_size,
 		    loc_dirty_count,
 		    loc_clean_count);
 #endif /* DIRTY */

 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
 	/* timestamp just before we go into send and then again just
 	 after we come out raj 8/94 */
 	/* but lets only do this if there is going to be a histogram
 	   displayed */
 	HIST_timestamp(&time_one);
       }
 #endif /* WANT_HISTOGRAM */

       if((len=send(send_socket,
 		   send_ring->buffer_ptr,
 		   send_size,
 		   0)) != send_size) {
       if ((len >=0) || SOCKET_EINTR(len)) {
 	    /* the test was interrupted, must be the end of test */
 	    break;
 	  }
 	perror("netperf: data send error");
 	printf("len was %d\n",len);
 	exit(1);
       }

       local_bytes_sent += send_size;

 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
 	/* timestamp the exit from the send call and update the histogram */
 	HIST_timestamp(&time_two);
 	HIST_add(time_hist,delta_micro(&time_one,&time_two));
       }
 #endif /* WANT_HISTOGRAM */

 #ifdef WANT_DEMO
       DEMO_STREAM_INTERVAL(send_size)
 #endif

 #if defined(WANT_INTERVALS)
       INTERVALS_WAIT();
 #endif /* WANT_INTERVALS */

       /* now we want to move our pointer to the next position in the */
       /* data buffer...we may also want to wrap back to the "beginning" */
       /* of the bufferspace, so we will mod the number of messages sent */
       /* by the send width, and use that to calculate the offset to add */
       /* to the base pointer. */
       nummessages++;
       send_ring = send_ring->next;
       if (bytes_remaining) {
 	bytes_remaining -= send_size;
       }
     }

     /* The test is over. Flush the buffers to the remote end. We do a */
     /* graceful release to insure that all data has been taken by the */
     /* remote. */

     /* but first, if the verbosity is greater than 1, find-out what */
     /* the TCP maximum segment_size was (if possible) */
     if (verbosity > 1) {
       tcp_mss = -1;
       get_tcp_info(send_socket,&tcp_mss);
     }

     if (shutdown(send_socket,SHUT_WR) == SOCKET_ERROR) {
       perror("netperf: cannot shutdown tcp stream socket");
       exit(1);
     }

     /* hang a recv() off the socket to block until the remote has */
     /* brought all the data up into the application. it will do a */
     /* shutdown to cause a FIN to be sent our way. We will assume that */
     /* any exit from the recv() call is good... raj 4/93 */

     recv(send_socket, send_ring->buffer_ptr, send_size, 0);

     /* this call will always give us the elapsed time for the test, and */
     /* will also store-away the necessaries for cpu utilization */

     cpu_stop(local_cpu_usage,&elapsed_time);	/* was cpu being */
 						/* measured and how */
 						/* long did we really */
 						/* run? */

     /* we are finished with the socket, so close it to prevent hitting */
     /* the limit on maximum open files. */

     close(send_socket);

     if (!no_control) {
       /* Get the statistics from the remote end. The remote will have
 	 calculated service demand and all those interesting
 	 things. If it wasn't supposed to care, it will return obvious
 	 values. */

       recv_response();
       if (!netperf_response.content.serv_errno) {
 	if (debug)
 	  fprintf(where,
 		  "remote reporting results for %.2f seconds\n",
 		  tcp_stream_result->elapsed_time);
       }
       else {
 	Set_errno(netperf_response.content.serv_errno);
 	fprintf(where,
 		"netperf: remote error %d",
 		netperf_response.content.serv_errno);
 	perror("");
 	fflush(where);

 	exit(1);
       }

       /* We now calculate what our thruput was for the test. In the
 	 future, we may want to include a calculation of the thruput
 	 measured by the remote, but it should be the case that for a
 	 TCP stream test, that the two numbers should be *very*
 	 close... We calculate bytes_sent regardless of the way the
 	 test length was controlled.  If it was time, we needed to,
 	 and if it was by bytes, the user may have specified a number
 	 of bytes that wasn't a multiple of the send_size, so we
 	 really didn't send what he asked for ;-) */

       bytes_sent	= ntohd(tcp_stream_result->bytes_received);
     }
     else {
       bytes_sent = (double)local_bytes_sent;
     }

     thruput	= calc_thruput(bytes_sent);

     if (local_cpu_usage || remote_cpu_usage) {
       /* We must now do a little math for service demand and cpu */
       /* utilization for the system(s) */
       /* Of course, some of the information might be bogus because */
       /* there was no idle counter in the kernel(s). We need to make */
       /* a note of this for the user's benefit...*/
       if (local_cpu_usage) {

 	local_cpu_utilization	= calc_cpu_util(0.0);
 	local_service_demand	= calc_service_demand(bytes_sent,
 						      0.0,
 						      0.0,
 						      0);
       }
       else {
 	local_cpu_utilization	= (float) -1.0;
 	local_service_demand	= (float) -1.0;
       }

       if (remote_cpu_usage) {

 	remote_cpu_utilization	= tcp_stream_result->cpu_util;
 	remote_service_demand	= calc_service_demand(bytes_sent,
 						      0.0,
 						      remote_cpu_utilization,
 						      tcp_stream_result->num_cpus);
       }
       else {
 	remote_cpu_utilization = (float) -1.0;
 	remote_service_demand  = (float) -1.0;
       }
     }
     else {
       /* we were not measuring cpu, for the confidence stuff, we */
       /* should make it -1.0 */
       local_cpu_utilization	= (float) -1.0;
       local_service_demand	= (float) -1.0;
       remote_cpu_utilization = (float) -1.0;
       remote_service_demand  = (float) -1.0;
     }

     /* at this point, we want to calculate the confidence information. */
     /* if debugging is on, calculate_confidence will print-out the */
     /* parameters we pass it */

     calculate_confidence(confidence_iteration,
 			 elapsed_time,
 			 thruput,
 			 local_cpu_utilization,
 			 remote_cpu_utilization,
 			 local_service_demand,
 			 remote_service_demand);


     confidence_iteration++;
   }

   /* at this point, we have finished making all the runs that we */
   /* will be making. so, we should extract what the calculated values */
   /* are for all the confidence stuff. we could make the values */
   /* global, but that seemed a little messy, and it did not seem worth */
   /* all the mucking with header files. so, we create a routine much */
   /* like calculate_confidence, which just returns the mean values. */
   /* raj 11/94 */

   retrieve_confident_values(&elapsed_time,
 			    &thruput,
 			    &local_cpu_utilization,
 			    &remote_cpu_utilization,
 			    &local_service_demand,
 			    &remote_service_demand);

   /* We are now ready to print all the information. If the user */
   /* has specified zero-level verbosity, we will just print the */
   /* local service demand, or the remote service demand. If the */
   /* user has requested verbosity level 1, he will get the basic */
   /* "streamperf" numbers. If the user has specified a verbosity */
   /* of greater than 1, we will display a veritable plethora of */
   /* background information from outside of this block as it is */
   /* not cpu_measurement specific...  */

   if (confidence < 0) {
     /* we did not hit confidence, but were we asked to look for it? */
     if (iteration_max > 1) {
       display_confidence();
     }
   }

   if (local_cpu_usage || remote_cpu_usage) {
     local_cpu_method = format_cpu_method(cpu_method);
     remote_cpu_method = format_cpu_method(tcp_stream_result->cpu_method);

     switch (verbosity) {
     case 0:
       if (local_cpu_usage) {
 	fprintf(where,
 		cpu_fmt_0,
 		local_service_demand,
 		local_cpu_method,
 		((print_headers) ||
 		 (result_brand == NULL)) ? "" : result_brand);
       }
       else {
 	fprintf(where,
 		cpu_fmt_0,
 		remote_service_demand,
 		remote_cpu_method,
 		((print_headers) ||
 		 (result_brand == NULL)) ? "" : result_brand);
       }
       break;
     case 1:
     case 2:
       if (print_headers) {
 		fprintf(where,
 		cpu_title,
 		format_units(),
 		local_cpu_method,
 		remote_cpu_method);
       }

       fprintf(where,
 	      cpu_fmt_1,		/* the format string */
 	      rsr_size,		        /* remote recvbuf size */
 	      lss_size,		        /* local sendbuf size */
 	      send_size,		/* how large were the sends */
 	      elapsed_time,		/* how long was the test */
 	      thruput, 		        /* what was the xfer rate */
 	      local_cpu_utilization,	/* local cpu */
 	      remote_cpu_utilization,	/* remote cpu */
 	      local_service_demand,	/* local service demand */
 	      remote_service_demand,	/* remote service demand */
 	      ((print_headers) ||
 	       (result_brand == NULL)) ? "" : result_brand);
       break;
     }
   }
   else {
     /* The tester did not wish to measure service demand. */

     switch (verbosity) {
     case 0:
       fprintf(where,
 	      tput_fmt_0,
 	      thruput,
 	      ((print_headers) ||
 	       (result_brand == NULL)) ? "" : result_brand);
       break;
     case 1:
     case 2:
       if (print_headers) {
 		fprintf(where,tput_title,format_units());
       }
       fprintf(where,
 	      tput_fmt_1,		/* the format string */
 	      rsr_size, 		/* remote recvbuf size */
 	      lss_size, 		/* local sendbuf size */
 	      send_size,		/* how large were the sends */
 	      elapsed_time, 		/* how long did it take */
 	      thruput,                  /* how fast did it go */
 	      ((print_headers) ||
 	       (result_brand == NULL)) ? "" : result_brand);
       break;
     }
   }

   /* it would be a good thing to include information about some of the */
   /* other parameters that may have been set for this test, but at the */
   /* moment, I do not wish to figure-out all the  formatting, so I will */
   /* just put this comment here to help remind me that it is something */
   /* that should be done at a later time. */

   if (verbosity > 1) {
     /* The user wanted to know it all, so we will give it to him. */
     /* This information will include as much as we can find about */
     /* TCP statistics, the alignments of the sends and receives */
     /* and all that sort of rot... */

     /* this stuff needs to be worked-out in the presence of confidence */
     /* intervals and multiple iterations of the test... raj 11/94 */

     fprintf(where,
 	    ksink_fmt,
 	    "Bytes",
 	    "Bytes",
 	    "Bytes",
 	    local_send_align,
 	    remote_recv_align,
 	    local_send_offset,
 	    remote_recv_offset,
 	    bytes_sent,
 	    bytes_sent / (double)nummessages,
 	    nummessages,
 	    bytes_sent / (double)tcp_stream_result->recv_calls,
 	    tcp_stream_result->recv_calls);
     fprintf(where,
 	    ksink_fmt2,
 	    tcp_mss);
     fflush(where);
 #ifdef WANT_HISTOGRAM
     fprintf(where,"\n\nHistogram of time spent in send() call.\n");
     fflush(where);
     HIST_report(time_hist);
 #endif /* WANT_HISTOGRAM */
   }

 }


 /* This routine implements the netperf-side TCP unidirectional data
    transfer test (a.k.a. stream) for the sockets interface where the
    data flow is from the netserver to the netperf.  It receives its
    parameters via global variables from the shell and writes its
    output to the standard output.

    remote_host - name of the remote system; it is handed to
                  complete_addrinfos() to build the addressing
                  information for the data connection.

    For every confidence iteration the routine creates a data socket,
    (unless no_control is set) sends a DO_TCP_MAERTS request over the
    control connection and reads the response, connects the data
    socket, and then recv()s until either a recv() returns <= 0 or the
    timer sets times_up.  The per-iteration numbers are fed to
    calculate_confidence() and the final values are printed to
    "where" according to verbosity.

    The test must be time-based (test_time != 0); a byte-count based
    request prints a message and exits.  Any set-up, connect, recv
    (when a control connection is in use) or shutdown failure also
    terminates the process with exit(1). */


 void
 send_tcp_maerts(char remote_host[])
 {

   /* headers and result formats used when cpu is not being measured */
   char *tput_title = "\
 Recv   Send    Send                          \n\
 Socket Socket  Message  Elapsed              \n\
 Size   Size    Size     Time     Throughput  \n\
 bytes  bytes   bytes    secs.    %s/sec  \n\n";

   char *tput_fmt_0 =
     "%7.2f %s\n";

   char *tput_fmt_1 =
     "%6d %6d %6d    %-6.2f   %7.2f   %s\n";

   /* headers and result formats used when cpu is being measured */
   char *cpu_title = "\
 Recv   Send    Send                          Utilization       Service Demand\n\
 Socket Socket  Message  Elapsed              Recv     Send     Recv    Send\n\
 Size   Size    Size     Time     Throughput  local    remote   local   remote\n\
 bytes  bytes   bytes    secs.    %-8.8s/s  %% %c      %% %c      us/KB   us/KB\n\n";

   char *cpu_fmt_0 =
     "%6.3f %c %s\n";

   char *cpu_fmt_1 =
     "%6d %6d %6d    %-6.2f     %7.2f   %-6.2f   %-6.2f   %-6.3f  %-6.3f %s\n";

   /* extra detail printed when verbosity > 1 */
   char *ksink_fmt = "\n\
 Alignment      Offset         %-8.8s %-8.8s    Recvs   %-8.8s Sends\n\
 Local  Remote  Local  Remote  Xfered   Per                 Per\n\
 Recv   Send    Recv   Send             Recv (avg)          Send (avg)\n\
 %5d   %5d  %5d   %5d %6.4g  %6.2f    %6d   %6.2f %6d\n";

   char *ksink_fmt2 = "\n\
 Maximum\n\
 Segment\n\
 Size (bytes)\n\
 %6d\n";


   float elapsed_time;

   /* what we want is to have a buffer space that is at least one */
   /* recv-size greater than our recv window. this will insure that we */
   /* are never trying to re-use a buffer that may still be in the hands */
   /* of the transport. This buffer will be malloc'd after we have found */
   /* the size of the local recv socket buffer. We will want to deal */
   /* with alignment and offset concerns as well. */

   struct ring_elt *recv_ring;

   int len = 0;
   unsigned int nummessages = 0;
   SOCKET recv_socket;
   int bytes_remaining;
   int tcp_mss = -1;  /* possibly uninitialized on printf far below */

   /* with links like fddi, one can recv > 32 bits worth of bytes */
   /* during a test... ;-) at some point, this should probably become a */
   /* 64bit integral type, but those are not entirely common yet */
   double bytes_sent = 0.0;
   unsigned long long local_bytes_recvd = 0;

   float local_cpu_utilization;
   float local_service_demand;
   float remote_cpu_utilization;
   float remote_service_demand;

   double thruput;

   struct addrinfo *remote_res;
   struct addrinfo *local_res;

   /* the request goes out in netperf_request; the setup response and */
   /* the final results both arrive in netperf_response, so those two */
   /* pointers alias the same test_specific_data area. */
   struct tcp_maerts_request_struct  *tcp_maerts_request;
   struct tcp_maerts_response_struct *tcp_maerts_response;
   struct tcp_maerts_results_struct  *tcp_maerts_result;

   tcp_maerts_request  =
     (struct tcp_maerts_request_struct *)netperf_request.content.test_specific_data;
   tcp_maerts_response =
     (struct tcp_maerts_response_struct *)netperf_response.content.test_specific_data;
   tcp_maerts_result   =
     (struct tcp_maerts_results_struct *)netperf_response.content.test_specific_data;

 #ifdef WANT_HISTOGRAM
   if (verbosity > 1) {
     time_hist = HIST_new();
   }
 #endif /* WANT_HISTOGRAM */
   /* since we are now disconnected from the code that established the */
   /* control socket, and since we want to be able to use different */
   /* protocols and such, we are passed the name of the remote host and */
   /* must turn that into the test specific addressing information. */

   complete_addrinfos(&remote_res,
                      &local_res,
                      remote_host,
                      SOCK_STREAM,
                      IPPROTO_TCP,
                      0);

   if ( print_headers ) {
     print_top_test_header("TCP MAERTS TEST",local_res,remote_res);
   }

   recv_ring = NULL;
   confidence_iteration = 1;
   init_stat();

   /* we have a great-big while loop which controls the number of times */
   /* we run a particular test. this is for the calculation of a */
   /* confidence interval (I really should have stayed awake during */
   /* probstats :). If the user did not request confidence measurement */
   /* (no confidence is the default) then we will only go through the */
   /* loop once. the confidence stuff originates from the folks at IBM */

   while (((confidence < 0) && (confidence_iteration < iteration_max)) ||
          (confidence_iteration <= iteration_min)) {

     /* initialize a few counters. we have to remember that we might be */
     /* going through the loop more than once, so everything that is */
     /* accumulated during a single run has to start from zero again - */
     /* that includes the local byte count which is what gets reported */
     /* when there is no control connection. */

     nummessages       = 0;
     bytes_sent        = 0.0;
     times_up          = 0;
     local_bytes_recvd = 0;
     len               = 0;

     /*set up the data socket                        */
     recv_socket = create_data_socket(local_res);

     if (recv_socket == INVALID_SOCKET){
       perror("netperf: send_tcp_maerts: tcp stream data socket");
       exit(1);
     }

     if (debug) {
       fprintf(where,"send_tcp_maerts: recv_socket obtained...\n");
     }

     /* at this point, we have either retrieved the socket buffer sizes, */
     /* or have tried to set them, so now, we may want to set the recv */
     /* size based on that (because the user either did not use a -m */
     /* option, or used one with an argument of 0). If the socket buffer */
     /* size is not available, we will set the recv size to 4KB - no */
     /* particular reason, just arbitrary... */
     if (recv_size == 0) {
       if (lsr_size > 0) {
         recv_size = lsr_size;
       }
       else {
         recv_size = 4096;
       }
     }

     /* set-up the data buffer ring with the requested alignment and offset. */
     /* note also that we have allocated a quantity */
     /* of memory that is at least one recv-size greater than our socket */
     /* buffer size. We want to be sure that there are at least two */
     /* buffers allocated - this can be a bit of a problem when the */
     /* recv_size is bigger than the socket size, so we must check... the */
     /* user may have wanted to explicitly set the "width" of our recv */
     /* buffers, we should respect that wish... */
     if (recv_width == 0) {
       recv_width = (lsr_size/recv_size) + 1;
       if (recv_width == 1) recv_width++;
     }

     if (recv_ring == NULL) {
       /* only allocate the recv ring once. this is a networking test, */
       /* not a memory allocation test. this way, we do not need a */
       /* deallocate_buffer_ring() routine, and I don't feel like */
       /* writing one anyway :) raj 11/94 */
       recv_ring = allocate_buffer_ring(recv_width,
                                        recv_size,
                                        local_recv_align,
                                        local_recv_offset);
     }

     /* If the user has requested cpu utilization measurements, we must */
     /* calibrate the cpu(s). We will perform this task within the tests */
     /* themselves. If the user has specified the cpu rate, then */
     /* calibrate_local_cpu will return rather quickly as it will have */
     /* nothing to do. If local_cpu_rate is zero, then we will go through */
     /* all the "normal" calibration stuff and return the rate back. */

     if (local_cpu_usage) {
       local_cpu_rate = calibrate_local_cpu(local_cpu_rate);
     }

     if (!no_control) {
       /* Tell the remote end to do a listen. The server alters the
          socket parameters on the other side at this point, hence the
          reason for all the values being passed in the setup
          message. If the user did not specify any of the parameters,
          they will be passed as 0, which will indicate to the remote
          that no changes beyond the system's default should be
          used. Alignment is the exception, it will default to 1, which
          will be no alignment alterations. */

       netperf_request.content.request_type = DO_TCP_MAERTS;
       tcp_maerts_request->send_buf_size    = rss_size_req;
       tcp_maerts_request->recv_buf_size    = rsr_size_req;
       tcp_maerts_request->send_size        = send_size;
       tcp_maerts_request->no_delay         = rem_nodelay;
       tcp_maerts_request->send_alignment   = remote_send_align;
       tcp_maerts_request->send_offset      = remote_send_offset;
       tcp_maerts_request->measure_cpu      = remote_cpu_usage;
       tcp_maerts_request->cpu_rate         = remote_cpu_rate;
       if (test_time) {
         tcp_maerts_request->test_length    = test_time;
       }
       else {
         tcp_maerts_request->test_length    = test_bytes;
       }
       tcp_maerts_request->so_rcvavoid      = rem_rcvavoid;
       tcp_maerts_request->so_sndavoid      = rem_sndavoid;
 #ifdef DIRTY
       tcp_maerts_request->dirty_count      = rem_dirty_count;
       tcp_maerts_request->clean_count      = rem_clean_count;
 #endif /* DIRTY */
       tcp_maerts_request->port             = atoi(remote_data_port);
       tcp_maerts_request->ipfamily         = af_to_nf(remote_res->ai_family);
       if (debug > 1) {
         fprintf(where,
                 "netperf: send_tcp_maerts: requesting TCP maerts test\n");
       }

       send_request();

       /* The response from the remote will contain all of the relevant
          socket parameters for this test type. We will put them back
          into the variables here so they can be displayed if desired.
          The remote will have calibrated CPU if necessary, and will
          have done all the needed set-up we will have calibrated the
          cpu locally before sending the request, and will grab the
          counter value right after the connect returns. The remote
          will grab the counter right after the accept call. This saves
          the hassle of extra messages being sent for the TCP
          tests.  */

       recv_response();

       if (!netperf_response.content.serv_errno) {
         if (debug)
           fprintf(where,"remote listen done.\n");
         rsr_size         = tcp_maerts_response->recv_buf_size;
         rss_size         = tcp_maerts_response->send_buf_size;
         rem_nodelay      = tcp_maerts_response->no_delay;
         remote_cpu_usage = tcp_maerts_response->measure_cpu;
         remote_cpu_rate  = tcp_maerts_response->cpu_rate;
         send_size        = tcp_maerts_response->send_size;

         /* we have to make sure that the server port number is in
            network order */
         set_port_number(remote_res,
                         (short)tcp_maerts_response->data_port_number);
         rem_rcvavoid     = tcp_maerts_response->so_rcvavoid;
         rem_sndavoid     = tcp_maerts_response->so_sndavoid;
       }
       else {
         Set_errno(netperf_response.content.serv_errno);
         fprintf(where,
                 "netperf: remote error %d",
                 netperf_response.content.serv_errno);
         perror("");
         fflush(where);

         exit(1);
       }
     }

 #ifdef WANT_DEMO
     DEMO_STREAM_SETUP(lsr_size,rss_size)
 #endif

     /* Connect up to the remote port on the data socket. connect() */
     /* hands back a status rather than a socket, so the failure value */
     /* to look for is SOCKET_ERROR, just as for shutdown() below. */
     if (connect(recv_socket,
                 remote_res->ai_addr,
                 remote_res->ai_addrlen) == SOCKET_ERROR){
       perror("netperf: send_tcp_maerts: data socket connect failed");
       exit(1);
     }

 #ifdef WIN32
     /* this is used so the timer thread can close the socket out from */
     /* under us, which to date is the easiest/cleanest/least */
     /* Windows-specific way I can find to force the winsock calls to */
     /* return WSAEINTR when the test is over. anything that will run on */
     /* 95 and NT and is closer to what netperf expects from Unix signals */
     /* and such would be appreciated raj 1/96 */
     win_kludge_socket = recv_socket;
 #endif /* WIN32 */

     /* Data Socket set-up is finished. If there were problems, either */
     /* the connect would have failed, or the previous response would */
     /* have indicated a problem. I failed to see the value of the */
     /* extra  message after the accept on the remote. If it failed, */
     /* we'll see it here. If it didn't, we might as well start pumping */
     /* data. */

     /* Set-up the test end conditions. A maerts test can only be */
     /* time based; a byte-count request is rejected below. */

     if (test_time) {
       /* The user wanted to end the test after a period of time. */
       times_up = 0;
       bytes_remaining = 0;
       /* in previous revisions, we had the same code repeated throughout */
       /* all the test suites. this was unnecessary, and meant more */
       /* work for me when I wanted to switch to POSIX signals, so I */
       /* have abstracted this out into a routine in netlib.c. if you */
       /* are experiencing signal problems, you might want to look */
       /* there. raj 11/94 */
       if (!no_control) {
         /* this is a netperf to netserver test, netserver will close
            to tell us the test is over, so use PAD_TIME to avoid
            causing the netserver fits. */
         start_timer(test_time + PAD_TIME);
       }
       else {
         /* this is a netperf to data source test, no PAD_TIME */
         start_timer(test_time);
       }
     }
     else {
       /* The tester wanted to recv a number of bytes. we don't do that
          in a TCP_MAERTS test. sorry. raj 2002-06-21 */
       printf("netperf: send_tcp_maerts: test must be timed\n");
       exit(1);
     }

     /* The cpu_start routine will grab the current time and possibly */
     /* value of the idle counter for later use in measuring cpu */
     /* utilization and/or service demand and thruput. */

     cpu_start(local_cpu_usage);

 #ifdef WANT_INTERVALS
     INTERVALS_INIT();
 #endif /* WANT_INTERVALS */

     /* before we start, initialize a few variables */

 #ifdef WANT_DEMO
     if (demo_mode) {
       HIST_timestamp(demo_one_ptr);
     }
 #endif

     /* the test will continue until we either get a zero-byte recv()
        on the socket or our failsafe timer expires. most of the time
        we trust that we get a zero-byte receive from the socket. raj
        2002-06-21 */

 #ifdef WANT_HISTOGRAM
     if (verbosity > 1) {
       /* timestamp just before we go into recv and then again just
          after we come out raj 8/94 */
       /* but only if we are actually going to display a histogram. raj
          2006-02-07 */
       HIST_timestamp(&time_one);
     }
 #endif /* WANT_HISTOGRAM */

     while ((!times_up) && (len=recv(recv_socket,
                                     recv_ring->buffer_ptr,
                                     recv_size,
                                     0)) > 0 ) {

 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
         /* timestamp the exit from the recv call and update the histogram */
         HIST_timestamp(&time_two);
         HIST_add(time_hist,delta_micro(&time_one,&time_two));
       }
 #endif /* WANT_HISTOGRAM */

 #ifdef DIRTY
       access_buffer(recv_ring->buffer_ptr,
                     recv_size,
                     loc_dirty_count,
                     loc_clean_count);
 #endif /* DIRTY */

 #ifdef WANT_DEMO
       DEMO_STREAM_INTERVAL(len);
 #endif

 #ifdef WANT_INTERVALS
       INTERVALS_WAIT();
 #endif /* WANT_INTERVALS */

       /* count the message and step to the next buffer in the ring so */
       /* the following recv() lands in a different buffer. */
       nummessages++;
       recv_ring = recv_ring->next;
       if (bytes_remaining) {
         bytes_remaining -= len;
       }

       local_bytes_recvd += len;

 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
         /* make sure we timestamp just before we go into recv  */
         /* raj 2004-06-15 */
         HIST_timestamp(&time_one);
       }
 #endif /* WANT_HISTOGRAM */

     }

     /* an EINTR is to be expected when this is a no_control test */
     if (((len < 0) || SOCKET_EINTR(len)) && (!no_control)) {
       perror("send_tcp_maerts: data recv error");
       printf("len was %d\n",len);
       exit(1);
     }

     /* if we get here, it must mean we had a recv return of 0 before
        the watchdog timer expired, or the watchdog timer expired and
        this was a no_control test */

     /* The test is over. Flush the buffers to the remote end. We do a
        graceful release to tell the  remote we have all the data. */

     /* but first, if the verbosity is greater than 1, find-out what */
     /* the TCP maximum segment_size was (if possible) */
     if (verbosity > 1) {
       tcp_mss = -1;
       get_tcp_info(recv_socket,&tcp_mss);
     }

     if (shutdown(recv_socket,SHUT_WR) == SOCKET_ERROR) {
       perror("netperf: cannot shutdown tcp maerts socket");
       exit(1);
     }

     stop_timer();

     /* this call will always give us the local elapsed time for the
        test, and will also store-away the necessaries for cpu
        utilization */

     cpu_stop(local_cpu_usage,&elapsed_time);  /* was cpu being */
                                               /* measured and how */
                                               /* long did we really */
                                               /* run? */

     /* we are finished with the socket, so close it to prevent hitting */
     /* the limit on maximum open files. */

     close(recv_socket);

     if (!no_control) {
       /* Get the statistics from the remote end. The remote will have
          calculated service demand and all those interesting
          things. If it wasn't supposed to care, it will return obvious
          values. */

       recv_response();
       if (!netperf_response.content.serv_errno) {
         if (debug)
           fprintf(where,"remote results obtained\n");
       }
       else {
         Set_errno(netperf_response.content.serv_errno);
         fprintf(where,
                 "netperf: remote error %d",
                 netperf_response.content.serv_errno);
         perror("");
         fflush(where);

         exit(1);
       }

       /* We now calculate what our thruput was for the test, using
          the byte count reported by the remote (the sender). In the
          future, we may want to include a calculation of the thruput
          measured locally, but it should be the case that for a TCP
          maerts test, that the two numbers should be *very*
          close... */

       bytes_sent = ntohd(tcp_maerts_result->bytes_sent);
     }
     else {
       /* no control connection, so all we have is what we counted */
       bytes_sent = (double)local_bytes_recvd;
     }


     thruput = calc_thruput(bytes_sent);

     if (local_cpu_usage || remote_cpu_usage) {
       /* We must now do a little math for service demand and cpu */
       /* utilization for the system(s) */
       /* Of course, some of the information might be bogus because */
       /* there was no idle counter in the kernel(s). We need to make */
       /* a note of this for the user's benefit...*/
       if (local_cpu_usage) {

         local_cpu_utilization = calc_cpu_util(0.0);
         local_service_demand  = calc_service_demand(bytes_sent,
                                                     0.0,
                                                     0.0,
                                                     0);
       }
       else {
         local_cpu_utilization = (float) -1.0;
         local_service_demand  = (float) -1.0;
       }

       if (remote_cpu_usage) {

         remote_cpu_utilization = tcp_maerts_result->cpu_util;
         remote_service_demand  = calc_service_demand(bytes_sent,
                                                      0.0,
                                                      remote_cpu_utilization,
                                                      tcp_maerts_result->num_cpus);
       }
       else {
         remote_cpu_utilization = (float) -1.0;
         remote_service_demand  = (float) -1.0;
       }
     }
     else {
       /* we were not measuring cpu, for the confidence stuff, we */
       /* should make it -1.0 */
       local_cpu_utilization  = (float) -1.0;
       local_service_demand   = (float) -1.0;
       remote_cpu_utilization = (float) -1.0;
       remote_service_demand  = (float) -1.0;
     }

     /* at this point, we want to calculate the confidence information. */
     /* if debugging is on, calculate_confidence will print-out the */
     /* parameters we pass it */

     calculate_confidence(confidence_iteration,
                          elapsed_time,
                          thruput,
                          local_cpu_utilization,
                          remote_cpu_utilization,
                          local_service_demand,
                          remote_service_demand);


     confidence_iteration++;
   }

   /* at this point, we have finished making all the runs that we */
   /* will be making. so, we should extract what the calculated values */
   /* are for all the confidence stuff. we could make the values */
   /* global, but that seemed a little messy, and it did not seem worth */
   /* all the mucking with header files. so, we create a routine much */
   /* like calculate_confidence, which just returns the mean values. */
   /* raj 11/94 */

   retrieve_confident_values(&elapsed_time,
                             &thruput,
                             &local_cpu_utilization,
                             &remote_cpu_utilization,
                             &local_service_demand,
                             &remote_service_demand);

   /* We are now ready to print all the information. If the user */
   /* has specified zero-level verbosity, we will just print the */
   /* local service demand, or the remote service demand. If the */
   /* user has requested verbosity level 1, he will get the basic */
   /* "streamperf" numbers. If the user has specified a verbosity */
   /* of greater than 1, we will display a veritable plethora of */
   /* background information from outside of this block as it is */
   /* not cpu_measurement specific...  */

   if (confidence < 0) {
     /* we did not hit confidence, but were we asked to look for it? */
     if (iteration_max > 1) {
       display_confidence();
     }
   }

   if (local_cpu_usage || remote_cpu_usage) {
     /* NOTE(review): with no_control set no results message is ever */
     /* received, so the tcp_maerts_result fields read here and in the */
     /* verbose section below hold whatever was already in the */
     /* response buffer - confirm whether that combination matters. */
     local_cpu_method = format_cpu_method(cpu_method);
     remote_cpu_method = format_cpu_method(tcp_maerts_result->cpu_method);

     switch (verbosity) {
     case 0:
       if (local_cpu_usage) {
         fprintf(where,
                 cpu_fmt_0,
                 local_service_demand,
                 local_cpu_method,
                 ((print_headers) ||
                  (result_brand == NULL)) ? "" : result_brand);
       }
       else {
         fprintf(where,
                 cpu_fmt_0,
                 remote_service_demand,
                 remote_cpu_method,
                 ((print_headers) ||
                  (result_brand == NULL)) ? "" : result_brand);
       }
       break;
     case 1:
     case 2:
       if (print_headers) {
         fprintf(where,
                 cpu_title,
                 format_units(),
                 local_cpu_method,
                 remote_cpu_method);
       }

       /* in a maerts test we are the receiver and the remote is the */
       /* sender, so the "Recv Socket Size" column is our recv buffer */
       /* and the "Send Socket Size" column is the remote's send */
       /* buffer - the same pair the non-cpu report prints. */
       fprintf(where,
               cpu_fmt_1,               /* the format string */
               lsr_size,                /* local recvbuf size */
               rss_size,                /* remote sendbuf size */
               send_size,               /* how large were the sends */
               elapsed_time,            /* how long was the test */
               thruput,                 /* what was the xfer rate */
               local_cpu_utilization,   /* local cpu */
               remote_cpu_utilization,  /* remote cpu */
               local_service_demand,    /* local service demand */
               remote_service_demand,   /* remote service demand */
               ((print_headers) ||
                (result_brand == NULL)) ? "" : result_brand);
       break;
     }
   }
   else {
     /* The tester did not wish to measure service demand. */

     switch (verbosity) {
     case 0:
       fprintf(where,
               tput_fmt_0,
               thruput,
               ((print_headers) ||
                (result_brand == NULL)) ? "" : result_brand);
       break;
     case 1:
     case 2:
       if (print_headers) {
         fprintf(where,tput_title,format_units());
       }
       fprintf(where,
               tput_fmt_1,              /* the format string */
               lsr_size,                /* local recvbuf size */
               rss_size,                /* remote sendbuf size */
               send_size,               /* how large were the sends */
               elapsed_time,            /* how long did it take */
               thruput,                 /* how fast did it go */
               ((print_headers) ||
                (result_brand == NULL)) ? "" : result_brand);
       break;
     }
   }

   /* it would be a good thing to include information about some of the */
   /* other parameters that may have been set for this test, but at the */
   /* moment, I do not wish to figure-out all the  formatting, so I will */
   /* just put this comment here to help remind me that it is something */
   /* that should be done at a later time. */

   if (verbosity > 1) {
     /* The user wanted to know it all, so we will give it to him. */
     /* This information will include as much as we can find about */
     /* TCP statistics, the alignments of the sends and receives */
     /* and all that sort of rot... */

     /* this stuff needs to be worked-out in the presence of confidence */
     /* intervals and multiple iterations of the test... raj 11/94 */

     /* the "Remote Send" columns report the send alignment and offset */
     /* that were passed to the remote in the test request. */
     fprintf(where,
             ksink_fmt,
             "Bytes",
             "Bytes",
             "Bytes",
             local_recv_align,
             remote_send_align,
             local_recv_offset,
             remote_send_offset,
             bytes_sent,
             bytes_sent / (double)nummessages,
             nummessages,
             bytes_sent / (double)tcp_maerts_result->send_calls,
             tcp_maerts_result->send_calls);
     fprintf(where,
             ksink_fmt2,
             tcp_mss);
     fflush(where);
 #ifdef WANT_HISTOGRAM
     fprintf(where,"\n\nHistogram of time spent in recv() call.\n");
     fflush(where);
     HIST_report(time_hist);
 #endif /* WANT_HISTOGRAM */
   }

 }


 /* this routine implements the TCP_MSS test.  All it does is pretend
    to be a TCP_STREAM test and report the TCP_MSS for the data
    connection.  No actual data is transferred. raj 2007-11-07
 */
 void
 send_tcp_mss(char remote_host[])
 {

   char *mss_title = "\
 Maximum\n\
 Segment\n\
 Size (bytes)\n\n";

   char *mss_fmt_0 =
     "%d %s\n";

   SOCKET send_socket;
   int tcp_mss = -1;  /* possibly uninitialized on printf far below */

   struct addrinfo *remote_res;
   struct addrinfo *local_res;

   struct	tcp_stream_request_struct	*tcp_stream_request;
   struct	tcp_stream_response_struct	*tcp_stream_response;
   struct	tcp_stream_results_struct	*tcp_stream_result;

   tcp_stream_request  =
     (struct tcp_stream_request_struct *)netperf_request.content.test_specific_data;
   tcp_stream_response =
     (struct tcp_stream_response_struct *)netperf_response.content.test_specific_data;
   tcp_stream_result   =
     (struct tcp_stream_results_struct *)netperf_response.content.test_specific_data;

   /* since we are now disconnected from the code that established the */
   /* control socket, and since we want to be able to use different */
   /* protocols and such, we are passed the name of the remote host and */
   /* must turn that into the test specific addressing information. */

   /* complete_addrinfos will either succede or exit the process */
   complete_addrinfos(&remote_res,
 		     &local_res,
 		     remote_host,
 		     SOCK_STREAM,
 		     IPPROTO_TCP,
 		     0);

   if ( print_headers ) {
     print_top_test_header("TCP MSS TEST",local_res,remote_res);
   }

   /*set up the data socket                        */
   send_socket = create_data_socket(local_res);

   if (send_socket == INVALID_SOCKET){
     perror("netperf: send_tcp_stream: tcp stream data socket");
     exit(1);
   }

   if (debug) {
     fprintf(where,"send_tcp_stream: send_socket obtained...\n");
   }


   if (!no_control) {
     /* Tell the remote end to do a listen. The server alters the
        socket paramters on the other side at this point, hence the
        reason for all the values being passed in the setup
        message. If the user did not specify any of the parameters,
        they will be passed as 0, which will indicate to the remote
        that no changes beyond the system's default should be
        used. Alignment is the exception, it will default to 1, which
        will be no alignment alterations. */

     netperf_request.content.request_type =	DO_TCP_STREAM;
     tcp_stream_request->send_buf_size	=	rss_size_req;
     tcp_stream_request->recv_buf_size	=	rsr_size_req;
     tcp_stream_request->receive_size	=	recv_size;
     tcp_stream_request->no_delay	=	rem_nodelay;
     tcp_stream_request->recv_alignment	=	remote_recv_align;
     tcp_stream_request->recv_offset	=	remote_recv_offset;
     tcp_stream_request->measure_cpu	=	remote_cpu_usage;
     tcp_stream_request->cpu_rate	=	remote_cpu_rate;
     if (test_time) {
       tcp_stream_request->test_length	=	test_time;
     }
     else {
       tcp_stream_request->test_length	=	test_bytes;
     }
     tcp_stream_request->so_rcvavoid	=	rem_rcvavoid;
     tcp_stream_request->so_sndavoid	=	rem_sndavoid;
 #ifdef DIRTY
     tcp_stream_request->dirty_count     =       rem_dirty_count;
     tcp_stream_request->clean_count     =       rem_clean_count;
 #endif /* DIRTY */
     tcp_stream_request->port            =    atoi(remote_data_port);
     tcp_stream_request->ipfamily = af_to_nf(remote_res->ai_family);
     if (debug > 1) {
       fprintf(where,
 	      "netperf: send_tcp_mss: requesting TCP stream test\n");
     }

     send_request();

     /* The response from the remote will contain all of the relevant
        socket parameters for this test type. We will put them back
        into the variables here so they can be displayed if desired.
        The remote will have calibrated CPU if necessary, and will
        have done all the needed set-up we will have calibrated the
        cpu locally before sending the request, and will grab the
        counter value right after the connect returns. The remote
        will grab the counter right after the accept call. This saves
        the hassle of extra messages being sent for the TCP
        tests.  */

     recv_response();

     if (!netperf_response.content.serv_errno) {
       if (debug)
 	fprintf(where,"remote listen done.\n");
       rsr_size	      =	tcp_stream_response->recv_buf_size;
       rss_size	      =	tcp_stream_response->send_buf_size;
       rem_nodelay     =	tcp_stream_response->no_delay;
       remote_cpu_usage=	tcp_stream_response->measure_cpu;
       remote_cpu_rate = tcp_stream_response->cpu_rate;

       /* we have to make sure that the server port number is in
 	 network order */
       set_port_number(remote_res,
 		      (short)tcp_stream_response->data_port_number);

       rem_rcvavoid	= tcp_stream_response->so_rcvavoid;
       rem_sndavoid	= tcp_stream_response->so_sndavoid;
     }
     else {
       Set_errno(netperf_response.content.serv_errno);
       fprintf(where,
 	      "netperf: remote error %d",
 	      netperf_response.content.serv_errno);
       perror("");
       fflush(where);

       exit(1);
     }
   }

   /*Connect up to the remote port on the data socket  */
   if (connect(send_socket,
 	      remote_res->ai_addr,
 	      remote_res->ai_addrlen) == INVALID_SOCKET){
     perror("netperf: send_tcp_mss: data socket connect failed");
     exit(1);
     }


   /* find-out what the TCP maximum segment_size was (if possible) */
   tcp_mss = -1;
   get_tcp_info(send_socket,&tcp_mss);

   /* just go ahead and close the socket, the remote should figure it
      out */
   close(send_socket);

   /* statistics? we don't need no stinking statistics */


     switch (verbosity) {
     case 0:
       fprintf(where,
 	      mss_fmt_0,
 	      tcp_mss,
 	      ((print_headers) ||
 	       (result_brand == NULL)) ? "" : result_brand);
       break;
     case 1:
     case 2:
       if (print_headers) {
 		fprintf(where,mss_title);
       }
       fprintf(where,
 	      mss_fmt_0,		/* the format string */
 	      tcp_mss,
 	      ((print_headers) ||
 	       (result_brand == NULL)) ? "" : result_brand);
       break;
     }


 }


 #ifdef HAVE_ICSC_EXS

 #include <sys/exs.h>


 /* This routine implements the TCP unidirectional data transfer test */
 /* (a.k.a. stream) for the sockets interface. It receives its */
 /* parameters via global variables from the shell and writes its */
 /* output to the standard output. */

 void
 send_exs_tcp_stream(char remote_host[])
 {

     char *tput_title = "\
 Recv   Send    Send                          \n\
 Socket Socket  Message  Elapsed              \n\
 Size   Size    Size     Time     Throughput  \n\
 bytes  bytes   bytes    secs.    %s/sec  \n\n";

     char *tput_fmt_0 =
         "%7.2f\n";

     char *tput_fmt_1 =
         "%6d %6d %6d    %-6.2f   %7.2f   \n";

     char *cpu_title = "\
 Recv   Send    Send                          Utilization       Service Demand\n\
 Socket Socket  Message  Elapsed              Send     Recv     Send    Recv\n\
 Size   Size    Size     Time     Throughput  local    remote   local   remote\n\
 bytes  bytes   bytes    secs.    %-8.8s/s  %% %c      %% %c      us/KB   us/KB\n\n";

     char *cpu_fmt_0 =
         "%6.3f %c\n";

     char *cpu_fmt_1 =
         "%6d %6d %6d    %-6.2f     %7.2f   %-6.2f   %-6.2f   %-6.3f  %-6.3f\n";

     char *ksink_fmt = "\n\
 Alignment      Offset         %-8.8s %-8.8s    Sends   %-8.8s Recvs\n\
 Local  Remote  Local  Remote  Xfered   Per                 Per\n\
 Send   Recv    Send   Recv             Send (avg)          Recv (avg)\n\
 %5d   %5d  %5d   %5d %6.4g  %6.2f    %6d   %6.2f %6d\n";

     char *ksink_fmt2 = "\n\
 Maximum\n\
 Segment\n\
 Size (bytes)\n\
 %6d\n";


     float         elapsed_time;

     /* what we want is to have a buffer space that is at least one */
     /* send-size greater than our send window. this will insure that we */
     /* are never trying to re-use a buffer that may still be in the hands */
     /* of the transport. This buffer will be malloc'd after we have found */
     /* the size of the local send socket buffer. We will want to deal */
     /* with alignment and offset concerns as well. */

     struct ring_elt *send_ring;

     int len;
     unsigned int nummessages = 0;
     SOCKET send_socket;
     int bytes_remaining;
     int tcp_mss = -1;  /* possibly uninitialized on printf far below */

     exs_mhandle_t exs_mhandle;
     exs_qhandle_t exs_qhandle;
 #define NETPERF_EXS_PENDING  16
     int exs_aio_pending;
     int exs_aio_eagain;
     int exs_aio_dequeued;
     int exs_aio_dequeuecnt;
     int exs_evtcnt;
 #define NETPERF_EXS_QSIZE    128
     exs_event_t exs_evtvec[NETPERF_EXS_QSIZE];

     /* with links like fddi, one can send > 32 bits worth of bytes */
     /* during a test... ;-) at some point, this should probably become a */
     /* 64bit integral type, but those are not entirely common yet */

     double   bytes_sent = 0.0;

     float   local_cpu_utilization;
     float   local_service_demand;
     float   remote_cpu_utilization;
     float   remote_service_demand;

     double   thruput;

     struct addrinfo *remote_res;
     struct addrinfo *local_res;

     struct   tcp_stream_request_struct   *tcp_stream_request;
     struct   tcp_stream_response_struct   *tcp_stream_response;
     struct   tcp_stream_results_struct   *tcp_stream_result;

     tcp_stream_request  =
         (struct tcp_stream_request_struct *)netperf_request.content.test_specific_data;
     tcp_stream_response =
         (struct tcp_stream_response_struct *)netperf_response.content.test_specific_data;
     tcp_stream_result   =
         (struct tcp_stream_results_struct *)netperf_response.content.test_specific_data;

 #if 0 /* def WANT_HISTOGRAM */
     time_hist = HIST_new();
 #endif /* WANT_HISTOGRAM */
     /* since we are now disconnected from the code that established the */
     /* control socket, and since we want to be able to use different */
     /* protocols and such, we are passed the name of the remote host and */
     /* must turn that into the test specific addressing information. */

     /* complete_addrinfos will either succeed or exit the process */
     complete_addrinfos(&remote_res,
                        &local_res,
                        remote_host,
                        SOCK_STREAM,
                        IPPROTO_TCP,
                        0);

     if ( print_headers ) {
         print_top_test_header("EXS TCP STREAM TEST",local_res,remote_res);
     }

     send_ring = NULL;
     confidence_iteration = 1;
     init_stat();

     /* initialize EXS API and create event queue */
     if (exs_init (EXS_VERSION) == -1) {
         perror ("netperf: send_exs_tcp_stream: exs_init failed");
         exit (1);
     }

     if ((exs_qhandle = exs_qcreate (NETPERF_EXS_QSIZE)) == EXS_QHANDLE_INVALID) {
         perror ("netperf: send_exs_tcp_stream: exs_qcreate failed");
         exit (1);
     }
     if (debug) {
         fprintf (where, "send_exs_tcp_stream: qhandle=%d\n", exs_qhandle);
     }

     /* we have a great-big while loop which controls the number of times */
     /* we run a particular test. this is for the calculation of a */
     /* confidence interval (I really should have stayed awake during */
     /* probstats :). If the user did not request confidence measurement */
     /* (no confidence is the default) then we will only go though the */
     /* loop once. the confidence stuff originates from the folks at IBM */

     while (((confidence < 0) && (confidence_iteration < iteration_max)) ||
            (confidence_iteration <= iteration_min)) {

         /* initialize a few counters. we have to remember that we might be */
         /* going through the loop more than once. */

         nummessages    =   0;
         bytes_sent     =   0.0;
         times_up       =    0;

         /*set up the data socket                        */
         send_socket = create_data_socket(local_res);

         if (send_socket == INVALID_SOCKET){
             perror("netperf: send_tcp_stream: tcp stream data socket");
             exit(1);
         }

         if (debug) {
             fprintf(where,"send_tcp_stream: send_socket obtained...\n");
         }

         /* at this point, we have either retrieved the socket buffer sizes, */
         /* or have tried to set them, so now, we may want to set the send */
         /* size based on that (because the user either did not use a -m */
         /* option, or used one with an argument of 0). If the socket buffer */
         /* size is not available, we will set the send size to 4KB - no */
         /* particular reason, just arbitrary... */
         if (send_size == 0) {
             if (lss_size > 0) {
                 send_size = lss_size;
             }
             else {
                 send_size = 4096;
             }
         }

         /* set-up the data buffer ring with the requested alignment and offset. */
         /* note also that we have allocated a quantity */
         /* of memory that is at least one send-size greater than our socket */
         /* buffer size. We want to be sure that there are at least two */
         /* buffers allocated - this can be a bit of a problem when the */
         /* send_size is bigger than the socket size, so we must check... the */
         /* user may have wanted to explicitly set the "width" of our send */
         /* buffers, we should respect that wish... */
         if (send_width == 0) {
             send_width = (lss_size/send_size) + 1;
             if (send_width == 1) send_width++;
         }

         if (send_ring == NULL) {
             /* only allocate the send ring once. this is a networking test, */
             /* not a memory allocation test. this way, we do not need a */
             /* deallocate_buffer_ring() routine, and I don't feel like */
             /* writing one anyway :) raj 11/94 */
             send_ring = allocate_exs_buffer_ring(send_width,
                                                  send_size,
                                                  local_send_align,
                                                  local_send_offset,
                                                  &exs_mhandle);
         }

         /* If the user has requested cpu utilization measurements, we must */
         /* calibrate the cpu(s). We will perform this task within the tests */
         /* themselves. If the user has specified the cpu rate, then */
         /* calibrate_local_cpu will return rather quickly as it will have */
         /* nothing to do. If local_cpu_rate is zero, then we will go through */
         /* all the "normal" calibration stuff and return the rate back. */

         if (local_cpu_usage) {
             local_cpu_rate = calibrate_local_cpu(local_cpu_rate);
         }

         /* Tell the remote end to do a listen. The server alters the socket */
         /* parameters on the other side at this point, hence the reason for */
         /* all the values being passed in the setup message. If the user did */
         /* not specify any of the parameters, they will be passed as 0, which */
         /* will indicate to the remote that no changes beyond the system's */
         /* default should be used. Alignment is the exception, it will */
         /* default to 1, which will be no alignment alterations. */

         netperf_request.content.request_type =   DO_TCP_STREAM;
         tcp_stream_request->send_buf_size   =   rss_size_req;
         tcp_stream_request->recv_buf_size   =   rsr_size_req;
         tcp_stream_request->receive_size   =   recv_size;
         tcp_stream_request->no_delay   =   rem_nodelay;
         tcp_stream_request->recv_alignment   =   remote_recv_align;
         tcp_stream_request->recv_offset   =   remote_recv_offset;
         tcp_stream_request->measure_cpu   =   remote_cpu_usage;
         tcp_stream_request->cpu_rate   =   remote_cpu_rate;
         if (test_time) {
             tcp_stream_request->test_length   =   test_time;
         }
         else {
             tcp_stream_request->test_length   =   test_bytes;
         }
         tcp_stream_request->so_rcvavoid   =   rem_rcvavoid;
         tcp_stream_request->so_sndavoid   =   rem_sndavoid;
 #ifdef DIRTY
         tcp_stream_request->dirty_count     =       rem_dirty_count;
         tcp_stream_request->clean_count     =       rem_clean_count;
 #endif /* DIRTY */
         tcp_stream_request->port            =    atoi(remote_data_port);
         tcp_stream_request->ipfamily = af_to_nf(remote_res->ai_family);
         if (debug > 1) {
             fprintf(where,
                     "netperf: send_tcp_stream: requesting TCP stream test\n");
         }

         send_request();

         /* The response from the remote will contain all of the relevant    */
         /* socket parameters for this test type. We will put them back into */
         /* the variables here so they can be displayed if desired.  The   */
         /* remote will have calibrated CPU if necessary, and will have done   */
         /* all the needed set-up we will have calibrated the cpu locally   */
         /* before sending the request, and will grab the counter value right*/
         /* after the connect returns. The remote will grab the counter right*/
         /* after the accept call. This saves the hassle of extra messages   */
         /* being sent for the TCP tests.               */

         recv_response();

         if (!netperf_response.content.serv_errno) {
             if (debug)
                 fprintf(where,"remote listen done.\n");
             rsr_size         =   tcp_stream_response->recv_buf_size;
             rss_size         =   tcp_stream_response->send_buf_size;
             rem_nodelay     =   tcp_stream_response->no_delay;
             remote_cpu_usage=   tcp_stream_response->measure_cpu;
             remote_cpu_rate = tcp_stream_response->cpu_rate;

             /* we have to make sure that the server port number is in */
             /* network order */
             set_port_number(remote_res,(short)tcp_stream_response->data_port_number);

             rem_rcvavoid   = tcp_stream_response->so_rcvavoid;
             rem_sndavoid   = tcp_stream_response->so_sndavoid;
         }
         else {
             Set_errno(netperf_response.content.serv_errno);
             fprintf(where,
                     "netperf: remote error %d",
                     netperf_response.content.serv_errno);
             perror("");
             fflush(where);

             exit(1);
         }

 #if 0 /* def WANT_DEMO */
         DEMO_STREAM_SETUP(lss_size,rsr_size)
 #endif

             /*Connect up to the remote port on the data socket  */
             if (connect(send_socket,
                         remote_res->ai_addr,
                         remote_res->ai_addrlen) == INVALID_SOCKET){
                 perror("netperf: send_tcp_stream: data socket connect failed");
                 exit(1);
             }

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR when the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
   win_kludge_socket = send_socket;
 #endif /* WIN32 */

         /* Data Socket set-up is finished. If there were problems, either */
         /* the connect would have failed, or the previous response would */
         /* have indicated a problem. I failed to see the value of the */
         /* extra  message after the accept on the remote. If it failed, */
         /* we'll see it here. If it didn't, we might as well start pumping */
         /* data. */

         /* Set-up the test end conditions. For a stream test, they can be */
         /* either time or byte-count based. */

         if (test_time) {
             /* The user wanted to end the test after a period of time. */
             times_up = 0;
             bytes_remaining = 0;
             /* in previous revisions, we had the same code repeated throughout */
             /* all the test suites. this was unnecessary, and meant more */
             /* work for me when I wanted to switch to POSIX signals, so I */
             /* have abstracted this out into a routine in netlib.c. if you */
             /* are experiencing signal problems, you might want to look */
             /* there. raj 11/94 */
             start_timer(test_time);
         }
         else {
             /* The tester wanted to send a number of bytes. */
             bytes_remaining = test_bytes;
             times_up = 1;
         }

         /* The cpu_start routine will grab the current time and possibly */
         /* value of the idle counter for later use in measuring cpu */
         /* utilization and/or service demand and thruput. */

         cpu_start(local_cpu_usage);

 #if 0 /* def WANT_INTERVALS */
 	INTERVALS_INIT();
 #endif /* WANT_INTERVALS */

         /* before we start, initialize a few variables */

 #if 0 /* def WANT_DEMO */
         if (demo_mode) {
             HIST_timestamp(demo_one_ptr);
         }
 #endif


         /* We use an "OR" to control test execution. When the test is */
         /* controlled by time, the byte count check will always return false. */
         /* When the test is controlled by byte count, the time test will */
         /* always return false. When the test is finished, the whole */
         /* expression will go false and we will stop sending data. */

         exs_aio_pending = 0;
         exs_aio_eagain = 0;
         exs_aio_dequeuecnt = 0;

         while ((!times_up) || (bytes_remaining > 0)) {

 #ifdef DIRTY
 	  access_buffer(send_ring->buffer_ptr,
 			send_size,
 			loc_dirty_count,
 			loc_clean_count);
 #endif /* DIRTY */

 #if 0 /* def WANT_HISTOGRAM */
             /* timestamp just before we go into send and then again just after */
             /* we come out raj 8/94 */
             HIST_timestamp(&time_one);
 #endif /* WANT_HISTOGRAM */


             /* post up to NETPERF_EXS_PENDING I/Os  */
             while ((exs_aio_pending < NETPERF_EXS_PENDING) &&
                    (exs_send (send_socket, send_ring->buffer_ptr, send_size,
                               0, exs_qhandle, (exs_ahandle_t)-1, exs_mhandle) == 0)) {
                 exs_aio_pending++;

                 /* now we want to move our pointer to the next
 		   position in the data buffer...we may also want to
 		   wrap back to the "beginning" of the bufferspace, so
 		   we will mod the number of messages sent by the send
 		   width, and use that to calculate the offset to add
 		   to the base pointer. */

                 nummessages++;
                 send_ring = send_ring->next;
                 if (bytes_remaining) {
                     bytes_remaining -= send_size;
                 }
             }

             /* check exs_send result */
             if (exs_aio_pending < NETPERF_EXS_PENDING) {
                /* standard flow control case */
                 if (errno == EAGAIN)
                     exs_aio_eagain++;
                 /* case of times_up */
                 else if (errno == EINTR)
                     break;
                 /* strange, let's stop */
                 else {
                     perror ("netperf: exs_send error");
                     exit (1);
                 }
             }

             /* dequeue events with "threshold" on 1/2 posted */
             exs_aio_dequeued =
                 exs_qdequeue (exs_qhandle, exs_evtvec,
                               -(exs_aio_pending>>1), NULL);
             exs_aio_dequeuecnt++;

             /* check exs_dequeue result */
             if (exs_aio_dequeued < 0) {
                 /* case of times_up */
                 if (errno == EINTR)
                     break;
                 /* strange, let's stop */
                 else {
                     perror ("netperf: exs_send error");
                     exit (1);
                 }
             }
             /* update number of pending I/Os */
             else {
                 exs_aio_pending -= exs_aio_dequeued;
             }


 #if 0 /* def WANT_HISTOGRAM */
             /* timestamp the exit from the send call and update the histogram */
             HIST_timestamp(&time_two);
             HIST_add(time_hist,delta_micro(&time_one,&time_two));
 #endif /* WANT_HISTOGRAM */

 #if 0 /* def WANT_DEMO */
             DEMO_STREAM_INTERVAL(send_size);
 #endif

 #if 0 /* def WANT_INTERVALS */
 	    INTERVALS_WAIT();
 #endif /* WANT_INTERVALS */

         }

         /* Collect the last completion events */
         exs_aio_dequeued =
             exs_qdequeue (exs_qhandle, exs_evtvec, -exs_aio_pending, NULL);
         exs_aio_dequeuecnt++;
         /* check exs_dequeue result and update number of pending I/Os */
         if (exs_aio_dequeued < 0) {
             perror ("netperf: exs_send error");
             exit (1);
         }
         exs_aio_pending -= exs_aio_dequeued;

         /* Display some async I/O debug info */
         if (debug) {
             fprintf (where, "send_exs_tcp_stream: "
                      "aio sent=%d eagain=%d dequeue=%d pending=%d\n",
                      nummessages, exs_aio_eagain, exs_aio_dequeuecnt, exs_aio_pending);
         }

         /* The test is over. Flush the buffers to the remote end. We do a */
         /* graceful release to insure that all data has been taken by the */
         /* remote. */

         /* but first, if the verbosity is greater than 1, find-out what */
         /* the TCP maximum segment_size was (if possible) */
         if (verbosity > 1) {
             tcp_mss = -1;
             get_tcp_info(send_socket,&tcp_mss);
         }

         if (shutdown(send_socket,SHUT_WR) == SOCKET_ERROR) {
             perror("netperf: cannot shutdown tcp stream socket");
             exit(1);
         }

         /* hang a recv() off the socket to block until the remote has */
         /* brought all the data up into the application. it will do a */
         /* shutdown to cause a FIN to be sent our way. We will assume that */
         /* any exit from the recv() call is good... raj 4/93 */

         recv(send_socket, send_ring->buffer_ptr, send_size, 0);

         /* this call will always give us the elapsed time for the test, and */
         /* will also store-away the necessaries for cpu utilization */

         cpu_stop(local_cpu_usage,&elapsed_time);   /* was cpu being */
         /* measured and how */
         /* long did we really */
         /* run? */

         /* we are finished with the socket, so close it to prevent hitting */
         /* the limit on maximum open files. */

         close(send_socket);

         /* Get the statistics from the remote end. The remote will have */
         /* calculated service demand and all those interesting things. If it */
         /* wasn't supposed to care, it will return obvious values. */

         recv_response();
         if (!netperf_response.content.serv_errno) {
             if (debug)
                 fprintf(where,"remote results obtained\n");
         }
         else {
             Set_errno(netperf_response.content.serv_errno);
             fprintf(where,
                     "netperf: remote error %d",
                     netperf_response.content.serv_errno);
             perror("");
             fflush(where);

             exit(1);
         }

         /* We now calculate what our thruput was for the test. In the future, */
         /* we may want to include a calculation of the thruput measured by */
         /* the remote, but it should be the case that for a TCP stream test, */
         /* that the two numbers should be *very* close... We calculate */
         /* bytes_sent regardless of the way the test length was controlled. */
         /* If it was time, we needed to, and if it was by bytes, the user may */
         /* have specified a number of bytes that wasn't a multiple of the */
         /* send_size, so we really didn't send what he asked for ;-) */

         bytes_sent   = ntohd(tcp_stream_result->bytes_received);

         thruput   = calc_thruput(bytes_sent);

         if (local_cpu_usage || remote_cpu_usage) {
             /* We must now do a little math for service demand and cpu */
             /* utilization for the system(s) */
             /* Of course, some of the information might be bogus because */
             /* there was no idle counter in the kernel(s). We need to make */
             /* a note of this for the user's benefit...*/
             if (local_cpu_usage) {

                 local_cpu_utilization   = calc_cpu_util(0.0);
                 local_service_demand   = calc_service_demand(bytes_sent,
                                                              0.0,
                                                              0.0,
                                                              0);
             }
             else {
                 local_cpu_utilization   = (float) -1.0;
                 local_service_demand   = (float) -1.0;
             }

             if (remote_cpu_usage) {

                 remote_cpu_utilization   = tcp_stream_result->cpu_util;
                 remote_service_demand   = calc_service_demand(bytes_sent,
                                                               0.0,
                                                               remote_cpu_utilization,
                                                               tcp_stream_result->num_cpus);
             }
             else {
                 remote_cpu_utilization = (float) -1.0;
                 remote_service_demand  = (float) -1.0;
             }
         }
         else {
             /* we were not measuring cpu, for the confidence stuff, we */
             /* should make it -1.0 */
             local_cpu_utilization   = (float) -1.0;
             local_service_demand   = (float) -1.0;
             remote_cpu_utilization = (float) -1.0;
             remote_service_demand  = (float) -1.0;
         }

         /* at this point, we want to calculate the confidence information. */
         /* if debugging is on, calculate_confidence will print-out the */
         /* parameters we pass it */

         calculate_confidence(confidence_iteration,
                              elapsed_time,
                              thruput,
                              local_cpu_utilization,
                              remote_cpu_utilization,
                              local_service_demand,
                              remote_service_demand);


         confidence_iteration++;
     }

     /* at this point, we have finished making all the runs that we */
     /* will be making. so, we should extract what the calculated values */
     /* are for all the confidence stuff. we could make the values */
     /* global, but that seemed a little messy, and it did not seem worth */
     /* all the mucking with header files. so, we create a routine much */
     /* like calculate_confidence, which just returns the mean values. */
     /* raj 11/94 */

     retrieve_confident_values(&elapsed_time,
                               &thruput,
                               &local_cpu_utilization,
                               &remote_cpu_utilization,
                               &local_service_demand,
                               &remote_service_demand);

     /* We are now ready to print all the information. If the user */
     /* has specified zero-level verbosity, we will just print the */
     /* local service demand, or the remote service demand. If the */
     /* user has requested verbosity level 1, he will get the basic */
     /* "streamperf" numbers. If the user has specified a verbosity */
     /* of greater than 1, we will display a veritable plethora of */
     /* background information from outside of this block as it is */
     /* not cpu_measurement specific...  */

     if (confidence < 0) {
         /* we did not hit confidence, but were we asked to look for it? */
         if (iteration_max > 1) {
             display_confidence();
         }
     }

     if (local_cpu_usage || remote_cpu_usage) {
         local_cpu_method = format_cpu_method(cpu_method);
         remote_cpu_method = format_cpu_method(tcp_stream_result->cpu_method);

         switch (verbosity) {
             case 0:
                 if (local_cpu_usage) {
                     fprintf(where,
                             cpu_fmt_0,
                             local_service_demand,
                             local_cpu_method);
                 }
                 else {
                     fprintf(where,
                             cpu_fmt_0,
                             remote_service_demand,
                             remote_cpu_method);
                 }
                 break;
             case 1:
             case 2:
                 if (print_headers) {
                     fprintf(where,
                             cpu_title,
                             format_units(),
                             local_cpu_method,
                             remote_cpu_method);
                 }

                 fprintf(where,
                         cpu_fmt_1,      /* the format string */
                         rsr_size,              /* remote recvbuf size */
                         lss_size,              /* local sendbuf size */
                         send_size,      /* how large were the sends */
                         elapsed_time,      /* how long was the test */
                         thruput,               /* what was the xfer rate */
                         local_cpu_utilization,   /* local cpu */
                         remote_cpu_utilization,   /* remote cpu */
                         local_service_demand,   /* local service demand */
                         remote_service_demand);   /* remote service demand */
                 break;
         }
     }
     else {
         /* The tester did not wish to measure service demand. */

         switch (verbosity) {
             case 0:
                 fprintf(where,
                         tput_fmt_0,
                         thruput);
                 break;
             case 1:
             case 2:
                 if (print_headers) {
                     fprintf(where,tput_title,format_units());
                 }
                 fprintf(where,
                         tput_fmt_1,      /* the format string */
                         rsr_size,       /* remote recvbuf size */
                         lss_size,       /* local sendbuf size */
                         send_size,      /* how large were the sends */
                         elapsed_time,       /* how long did it take */
                         thruput);/* how fast did it go */
                 break;
         }
     }

     /* it would be a good thing to include information about some of the */
     /* other parameters that may have been set for this test, but at the */
     /* moment, I do not wish to figure-out all the  formatting, so I will */
     /* just put this comment here to help remind me that it is something */
     /* that should be done at a later time. */

     if (verbosity > 1) {
         /* The user wanted to know it all, so we will give it to him. */
         /* This information will include as much as we can find about */
         /* TCP statistics, the alignments of the sends and receives */
         /* and all that sort of rot... */

         /* this stuff needs to be worked-out in the presence of confidence */
         /* intervals and multiple iterations of the test... raj 11/94 */

         fprintf(where,
                 ksink_fmt,
                 "Bytes",
                 "Bytes",
                 "Bytes",
                 local_send_align,
                 remote_recv_align,
                 local_send_offset,
                 remote_recv_offset,
                 bytes_sent,
                 bytes_sent / (double)nummessages,
                 nummessages,
                 bytes_sent / (double)tcp_stream_result->recv_calls,
                 tcp_stream_result->recv_calls);
         fprintf(where,
                 ksink_fmt2,
                 tcp_mss);
         fflush(where);
 #if 0 /* def WANT_HISTOGRAM */
         fprintf(where,"\n\nHistogram of time spent in send() call.\n");
         fflush(where);
         HIST_report(time_hist);
 #endif /* WANT_HISTOGRAM */
     }

 }

 #endif /* HAVE_ICSC_EXS */


 #if defined(HAVE_SENDFILE)

 #if defined(QUICK_SENDPATH)

 /*
  * a temporary stub for the sendpath() system call
  * which is defined & implemented in the kernel
  * but which has no libc stub.
  */
 #include <sys/types.h>
 #include <sys/scall_define.h>
 #include <sys/uio.h>

 ssize_t
 sendpath(int s, char *path, off_t offset, size_t nbytes,
          const struct iovec *hdtrl, int flags)
 {
   /* libc offers no wrapper for this call, so hand every argument,
      unchanged and in order, to the generic syscall() entry point
      and give the caller back whatever it reports. */
   ssize_t result;

   result = syscall(SYS_sendpath, s, path, offset, nbytes, hdtrl, flags);

   return result;
 }
 #endif /* QUICK_SENDPATH */

 /* This routine implements the TCP unidirectional data transfer test
    (a.k.a. stream) for the sockets interface using the sendfile()
    system call - TCP_SENDFILE.  It receives its  parameters via global
    variables from the shell and writes its  output to the standard
    output. Basically,  this is the same test as the send_tcp_stream()
    logic and we even tell the remote to do a TCP_STREAM test since for
    all it knows, nothig is different. */

 void
 sendfile_tcp_stream(remote_host)
      char	remote_host[];
 {

   char *tput_title = "\
 Recv   Send    Send                          \n\
 Socket Socket  Message  Elapsed              \n\
 Size   Size    Size     Time     Throughput  \n\
 bytes  bytes   bytes    secs.    %s/sec  \n\n";

   char *tput_fmt_0 =
     "%7.2f %s\n";

   char *tput_fmt_1 =
     "%6d %6d %6d    %-6.2f   %7.2f   %s\n";

   char *cpu_title = "\
 Recv   Send    Send                          Utilization       Service Demand\n\
 Socket Socket  Message  Elapsed              Send     Recv     Send    Recv\n\
 Size   Size    Size     Time     Throughput  local    remote   local   remote\n\
 bytes  bytes   bytes    secs.    %-8.8s/s  %% %c      %% %c      us/KB   us/KB\n\n";

   char *cpu_fmt_0 =
     "%6.3f %c %s\n";
   char *cpu_fmt_1 =
     "%6d %6d %6d    %-6.2f     %7.2f   %-6.2f   %-6.2f   %-6.3f  %-6.3f %s\n";

   char *ksink_fmt = "\n\
 Alignment      Offset         %-8.8s %-8.8s    Sends   %-8.8s Recvs\n\
 Local  Remote  Local  Remote  Xfered   Per                 Per\n\
 Send   Recv    Send   Recv             Send (avg)          Recv (avg)\n\
 %5d   %5d  %5d   %5d %6.4g  %6.2f    %6d   %6.2f %6d\n";

 char *ksink_fmt2 = "\n\
 Maximum\n\
 Segment\n\
 Size (bytes)\n\
 %6d\n";

   float			elapsed_time;

   /* what we want is to have a buffer space that is at least one */
   /* send-size greater than our send window. this will insure that we */
   /* are never trying to re-use a buffer that may still be in the hands */
   /* of the transport. This buffer will be malloc'd after we have found */
   /* the size of the local senc socket buffer. We will want to deal */
   /* with alignment and offset concerns as well. */

   struct sendfile_ring_elt *send_ring;

   int len;
   unsigned int nummessages = 0;
   SOCKET send_socket;
   int bytes_remaining;
   int tcp_mss = -1;  /* possibly uninitialized on printf far below */

   /* with links like fddi, one can send > 32 bits worth of bytes */
   /* during a test... ;-) at some point, this should probably become a */
   /* 64bit integral type, but those are not entirely common yet */
   double	bytes_sent = 0.0;

   float	local_cpu_utilization;
   float	local_service_demand;
   float	remote_cpu_utilization;
   float	remote_service_demand;

   double	thruput;

   struct  addrinfo *remote_res;
   struct  addrinfo *local_res;
   struct	sockaddr_in	server;

 #if defined(__linux) || defined(__sun)
   off_t     scratch_offset;   /* the linux sendfile() call will update
 				 the offset variable, which is
 				 something we do _not_ want to happen
 				 to the value in the send_ring! so, we
 				 have to use a scratch variable. */
 #endif /* __linux  || defined(__sun) */
 #if defined (USE_OSX)
    off_t    scratch_len;  /* Darwin 9.x need a value-result parameter  */
 #endif
 #if defined (__sun)
    size_t  scratch_len;	/* the sun sendfilev() needs a place to
 			   tell us how many bytes were written,
 			   even though it also returns the value */
    sendfilevec_t sv;
 #endif /* __sun */

   struct	tcp_stream_request_struct	*tcp_stream_request;
   struct	tcp_stream_response_struct	*tcp_stream_response;
   struct	tcp_stream_results_struct	*tcp_stream_result;

   tcp_stream_request  =
     (struct tcp_stream_request_struct *)netperf_request.content.test_specific_data;
   tcp_stream_response =
     (struct tcp_stream_response_struct *)netperf_response.content.test_specific_data;
   tcp_stream_result   =
     (struct tcp_stream_results_struct *)netperf_response.content.test_specific_data;

 #ifdef WANT_HISTOGRAM
   if (verbosity > 1) {
     time_hist = HIST_new();
   }
 #endif /* WANT_HISTOGRAM */

   /* since we are now disconnected from the code that established the */
   /* control socket, and since we want to be able to use different */
   /* protocols and such, we are passed the name of the remote host and */
   /* must turn that into the test specific addressing information. */

   bzero((char *)&server,
 	sizeof(server));

   complete_addrinfos(&remote_res,
 		     &local_res,
 		     remote_host,
 		     SOCK_STREAM,
 		     IPPROTO_TCP,
 		     0);

   if ( print_headers ) {
     /* we want to have some additional, interesting information in */
     /* the headers. we know some of it here, but not all, so we will */
     /* only print the test title here and will print the results */
     /* titles after the test is finished */
 #ifdef QUICK_SENDPATH
     print_top_test_header("TCP SENDPATH TEST",local_res,remote_res);
 #else
     print_top_test_header("TCP SENDFILE TEST",local_res,remote_res);
 #endif /* QUICK_SENDPATH */
   }
   send_ring = NULL;
   confidence_iteration = 1;
   init_stat();

   /* we have a great-big while loop which controls the number of times */
   /* we run a particular test. this is for the calculation of a */
   /* confidence interval (I really should have stayed awake during */
   /* probstats :). If the user did not request confidence measurement */
   /* (no confidence is the default) then we will only go though the */
   /* loop once. the confidence stuff originates from the folks at IBM */

   while (((confidence < 0) && (confidence_iteration < iteration_max)) ||
 	 (confidence_iteration <= iteration_min)) {

     /* initialize a few counters. we have to remember that we might be */
     /* going through the loop more than once. */

     nummessages    =	0;
     bytes_sent     =	0.0;
     times_up       = 	0;

     /* set up the data socket */
     send_socket = create_data_socket(local_res);

     if (send_socket == INVALID_SOCKET){
       perror("netperf: sendfile_tcp_stream: tcp stream data socket");
       exit(1);
     }

     if (debug) {
       fprintf(where,"sendfile_tcp_stream: send_socket obtained...\n");
     }

 #if defined(TCP_CORK)
     /* should this even be here?!? */
     if (loc_tcpcork > 0) {
       /* the user wishes for us to set TCP_CORK on the socket */
       int one = 1;
       if (setsockopt(send_socket,
 		     getprotobyname("tcp")->p_proto,
 		     TCP_CORK,
 		     (char *)&one,
 		     sizeof(one)) == SOCKET_ERROR) {
 	perror("netperf: sendfile_tcp_stream: tcp_cork");
 	exit(1);
       }
       if (debug) {
 	fprintf(where,"sendfile_tcp_stream: tcp_cork...\n");
       }
     }

 #endif /* TCP_CORK */

     /* at this point, we have either retrieved the socket buffer sizes, */
     /* or have tried to set them, so now, we may want to set the send */
     /* size based on that (because the user either did not use a -m */
     /* option, or used one with an argument of 0). If the socket buffer */
     /* size is not available, we will set the send size to 4KB - no */
     /* particular reason, just arbitrary... */

     /*check for file size/ min file size here?  create file here/ back out???*/

     if (send_size == 0) {
       if (lss_size > 0) {
 	send_size = lss_size;
       }
       else {
 	send_size = 4096;
       }
     }

     /* set-up the data buffer ring with the requested alignment and
        offset. note also that we have allocated a quantity  of memory
        that is at least one send-size greater than our socket  buffer
        size. We want to be sure that there are at least two  buffers
        allocated - this can be a bit of a problem when the  send_size
        is bigger than the socket size, so we must check... the  user
        may have wanted to explicitly set the "width" of our send
        buffers, we should respect that wish... */

     /*sendring -> an offset index that will shift the starting point of the*/
     /*section of the file sent throughout the file*/

     if (send_width == 0) {
       send_width = (lss_size/send_size) + 1;
       if (send_width == 1) send_width++;
     }

     if (send_ring == NULL) {

       /* only allocate the send ring once. this is a networking test,
 	 not a memory allocation test. this way, we do not need a
 	 deallocate_buffer_ring() routine, and I don't feel like
 	 writing one anyway :) raj 11/94 */

       send_ring = alloc_sendfile_buf_ring(send_width,
 					  send_size,
 					  local_send_align,
 					  local_send_offset);
     }

     /* If the user has requested cpu utilization measurements, we must
        calibrate the cpu(s). We will perform this task within the
        tests  themselves. If the user has specified the cpu rate, then
        calibrate_local_cpu will return rather quickly as it will have
        nothing to do. If local_cpu_rate is zero, then we will go
        through  all the "normal" calibration stuff and return the rate
        back. */

     if (local_cpu_usage) {
       local_cpu_rate = calibrate_local_cpu(local_cpu_rate);
     }

     /* Tell the remote end to do a listen. The server alters the
        socket  paramters on the other side at this point, hence the
        reason for  all the values being passed in the setup
        message. If the user did  not specify any of the parameters,
        they will be passed as 0, which  will indicate to the remote
        that no changes beyond the system's  default should be
        used. Alignment is the exception, it will  default to 1, which
        will be no alignment alterations. */

     netperf_request.content.request_type =	DO_TCP_STREAM;
     tcp_stream_request->send_buf_size	=	rss_size_req;
     tcp_stream_request->recv_buf_size	=	rsr_size_req;
     tcp_stream_request->receive_size	=	recv_size;
     tcp_stream_request->no_delay	=	rem_nodelay;
     tcp_stream_request->recv_alignment	=	remote_recv_align;
     tcp_stream_request->recv_offset	=	remote_recv_offset;
     tcp_stream_request->measure_cpu	=	remote_cpu_usage;
     tcp_stream_request->cpu_rate	=	remote_cpu_rate;

     if (test_time) {
       tcp_stream_request->test_length	=	test_time;
     }
     else {
       tcp_stream_request->test_length	=	test_bytes;
     }

     tcp_stream_request->so_rcvavoid	=	rem_rcvavoid;
     tcp_stream_request->so_sndavoid	=	rem_sndavoid;

 #ifdef DIRTY
     tcp_stream_request->dirty_count       =       rem_dirty_count;
     tcp_stream_request->clean_count       =       rem_clean_count;
 #endif /* DIRTY */
     tcp_stream_request->port     = atoi(remote_data_port);
     tcp_stream_request->ipfamily = af_to_nf(remote_res->ai_family);

     if (debug > 1) {
       fprintf(where,
 	      "netperf: send_tcp_stream: requesting TCP stream test\n");
     }

     send_request();

     /* The response from the remote will contain all of the relevant
        socket parameters for this test type. We will put them back
        into the variables here so they can be displayed if desired.
        The remote will have calibrated CPU if necessary, and will have
        done all the needed set-up we will have calibrated the cpu
        locally before sending the request, and will grab the counter
        value right after the connect returns. The remote will grab the
        counter right after the accept call. This saves the hassle of
        extra messages being sent for the TCP tests.  */

     recv_response();

     if (!netperf_response.content.serv_errno) {
       if (debug)
 	fprintf(where,"remote listen done.\n");
       rsr_size	      =	tcp_stream_response->recv_buf_size;
       rss_size	      =	tcp_stream_response->send_buf_size;
       rem_nodelay     =	tcp_stream_response->no_delay;
       remote_cpu_usage=	tcp_stream_response->measure_cpu;
       remote_cpu_rate = tcp_stream_response->cpu_rate;

       /* we have to make sure that the server port number is in */
       /* network order */
       set_port_number(remote_res,(short)tcp_stream_response->data_port_number);
       rem_rcvavoid	= tcp_stream_response->so_rcvavoid;
       rem_sndavoid	= tcp_stream_response->so_sndavoid;
     }
     else {
       Set_errno(netperf_response.content.serv_errno);
       fprintf(where,
 	      "netperf: remote error %d",
 	      netperf_response.content.serv_errno);
       perror("");
       fflush(where);

       exit(1);
     }

 #ifdef WANT_DEMO
     DEMO_STREAM_SETUP(lss_size,rsr_size)
 #endif

     /*Connect up to the remote port on the data socket  */
     if (connect(send_socket,
 		remote_res->ai_addr,
 		remote_res->ai_addrlen) == INVALID_SOCKET){
       perror("netperf: send_tcp_stream: data socket connect failed");
       printf(" port: %d\n",ntohs(server.sin_port));
       exit(1);
     }

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR with the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
   win_kludge_socket = send_socket;
 #endif /* WIN32 */

     /* Data Socket set-up is finished. If there were problems, either
        the connect would have failed, or the previous response would
        have indicated a problem. I failed to see the value of the
        extra message after the accept on the remote. If it failed,
        we'll see it here. If it didn't, we might as well start pumping
        data. */

     /* Set-up the test end conditions. For a stream test, they can be */
     /* either time or byte-count based. */

     if (test_time) {
       /* The user wanted to end the test after a period of time. */
       times_up = 0;
       bytes_remaining = 0;

       /* in previous revisions, we had the same code repeated throught
          all the test suites. this was unnecessary, and meant more
          work for me when I wanted to switch to POSIX signals, so I
          have abstracted this out into a routine in netlib.c. if you
          are experiencing signal problems, you might want to look
          there. raj 11/94 */

       start_timer(test_time);
     }
     else {
       /* The tester wanted to send a number of bytes. */
       bytes_remaining = test_bytes;
       times_up = 1;
     }

     /* The cpu_start routine will grab the current time and possibly */
     /* value of the idle counter for later use in measuring cpu */
     /* utilization and/or service demand and thruput. */

     cpu_start(local_cpu_usage);

 #ifdef WANT_INTERVALS
     INTERVALS_INIT();
 #endif /* WANT_INTERVALS */


     /* before we start, initialize a few variables */

 #ifdef WANT_DEMO
     if (demo_mode) {
       HIST_timestamp(demo_one_ptr);
     }
 #endif

     /* We use an "OR" to control test execution. When the test is
        controlled by time, the byte count check will always return
        false. When the test is controlled by byte count, the time test
        will always return false. When the test is finished, the whole
        expression will go false and we will stop sending data. */

     while ((!times_up) || (bytes_remaining > 0)) {

       /* the sendfile_tcp_stream test does not support making the buffers
 	 dirty. 08/2000 */

 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
 	/* timestamp just before we go into sendfile() and then again
          just after we come out raj 08/2000 */
 	/* but only if we are actually going to display a histogram */
 	HIST_timestamp(&time_one);
       }
 #endif /* WANT_HISTOGRAM */

       /* you can look at netlib.h for a description of the fields we
 	 are passing to sendfile(). 08/2000 */
 #ifdef QUICK_SENDPATH
       if ((len=sendpath(send_socket,
 			fill_file,
 			send_ring->offset,
 			send_ring->length,
 			send_ring->hdtrl,
 			send_ring->flags)) != send_size)
 #elif defined(__linux)
 	scratch_offset = send_ring->offset;
       if ((len=sendfile(send_socket,
 			send_ring->fildes,
 			&scratch_offset,   /* modified after the call! */
 			send_ring->length)) != send_size)
 #elif defined (__sun)
       /* We must call with SFV_NOWAIT and a large file size (>= 16MB) to
 	 get zero-copy, as well as compiling with  -D_LARGEFILE_SOURCE
 	  -D_FILE_OFFSET_BITS=64 */
       sv.sfv_fd = send_ring->fildes;
       sv.sfv_flag = SFV_NOWAIT;
       sv.sfv_off = send_ring->offset;
       sv.sfv_len =  send_ring->length;
       if ((len = sendfilev(send_socket, &sv, 1, &scratch_len)) != send_size)
 #elif defined(__FreeBSD__)
 	/* so close to HP-UX and yet so far away... :) */
 	if ((sendfile(send_ring->fildes,
 		      send_socket,
 		      send_ring->offset,
 		      send_ring->length,
 		      NULL,
 		      (off_t *)&len,
 		      send_ring->flags) != 0) ||
 	    (len != send_size))
 #elif defined(USE_OSX)
     scratch_len = send_ring->length;
     if ((sendfile(send_ring->fildes,
               send_socket,
               send_ring->offset,
               (off_t *)&scratch_len,
               NULL,
               send_ring->flags) != 0) ||
         (scratch_len != send_size))
 #else /* original sendile HP-UX */
 	  if ((len=sendfile(send_socket,
 			    send_ring->fildes,
 			    send_ring->offset,
 			    send_ring->length,
 			    send_ring->hdtrl,
 			    send_ring->flags)) != send_size)
 #endif /* QUICK_SENDPATH */
 	    {
 	      /* the test was interrupted, must be the end of test. the
 		 send_tcp_stream code has some WIN32 ifdefs that we do not
 		 need here. */
 	      if ((len >=0) || SOCKET_EINTR(len)) {
 		break;
 	      }
 	      perror("netperf: data send error: sendfile");
 	      fprintf(stderr,
 		      "len was %d send_size was %d\n",
 		      len,
 		      send_size);
 	      fflush(stderr);
 	      exit(1);
 	    }

       /*	offset += len;*/

 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
 	/* timestamp the exit from the send call and update the
 	   histogram */

 	HIST_timestamp(&time_two);
 	HIST_add(time_hist,delta_micro(&time_one,&time_two));
       }
 #endif /* WANT_HISTOGRAM */

 #ifdef WANT_DEMO
       DEMO_STREAM_INTERVAL(send_size);
 #endif

 #ifdef WANT_INTERVALS
       INTERVALS_WAIT();
 #endif /* WANT_INTERVALS */

       /* now we want to move our pointer to the next position in the */
       /* data buffer...we may also want to wrap back to the "beginning" */
       /* of the bufferspace, so we will mod the number of messages sent */
       /* by the send width, and use that to calculate the offset to add */
       /* to the base pointer. */

       nummessages++;
       send_ring = send_ring->next;
       if (bytes_remaining) {
 	bytes_remaining -= send_size;
       }
     }

     /* The test is over. Flush the buffers to the remote end. We do a
        graceful release to insure that all data has been taken by the
        remote. */

     /* but first, if the verbosity is greater than 1, find-out what */
     /* the TCP maximum segment_size was (if possible) */
     if (verbosity > 1) {
       tcp_mss = -1;
       get_tcp_info(send_socket,&tcp_mss);
     }

     if (shutdown(send_socket,SHUT_WR) == SOCKET_ERROR) {
       perror("netperf: cannot shutdown tcp stream socket");
       exit(1);
     }

     /* hang a recv() off the socket to block until the remote has */
     /* brought all the data up into the application. it will do a */
     /* shutdown to cause a FIN to be sent our way. We will assume that */
     /* any exit from the recv() call is good... raj 4/93 */

     /* since we are using sendfile() instead of send, we have no
        scratch buffer from the send_ring to use for the
        receive. however, since we "know" that the recv should be
        returning zero bytes (not that we are making the checks we
        should) we can pass the address of the flags field. raj 08/2000
     */

     recv(send_socket,
 	 &(send_ring->flags),
 	 sizeof(send_ring->flags),
 	 0);

     /* this call will always give us the elapsed time for the test, and */
     /* will also store-away the necessaries for cpu utilization */

     cpu_stop(local_cpu_usage,&elapsed_time);	/* was cpu being */
 						/* measured and how */
 						/* long did we really */
 						/* run? */

     /* we are finished with the socket, so close it to prevent hitting */
     /* the limit on maximum open files. */

     close(send_socket);

     /* Get the statistics from the remote end. The remote will have */
     /* calculated service demand and all those interesting things. If it */
     /* wasn't supposed to care, it will return obvious values. */

     recv_response();

     if (!netperf_response.content.serv_errno) {
       if (debug)
 	fprintf(where,"remote results obtained\n");
     }

     else {
       Set_errno(netperf_response.content.serv_errno);
       fprintf(where,
 	      "netperf: remote error %d",
 	      netperf_response.content.serv_errno);
       perror("");
       fflush(where);

       exit(1);
     }

     /* We now calculate what our thruput was for the test. In the future, */
     /* we may want to include a calculation of the thruput measured by */
     /* the remote, but it should be the case that for a TCP stream test, */
     /* that the two numbers should be *very* close... We calculate */
     /* bytes_sent regardless of the way the test length was controlled. */
     /* If it was time, we needed to, and if it was by bytes, the user may */
     /* have specified a number of bytes that wasn't a multiple of the */
     /* send_size, so we really didn't send what he asked for ;-) */

     bytes_sent	= ntohd(tcp_stream_result->bytes_received);

     thruput	= calc_thruput(bytes_sent);

     if (local_cpu_usage || remote_cpu_usage) {

       /* We must now do a little math for service demand and cpu */
       /* utilization for the system(s) */
       /* Of course, some of the information might be bogus because */
       /* there was no idle counter in the kernel(s). We need to make */
       /* a note of this for the user's benefit...*/
       if (local_cpu_usage) {

 	local_cpu_utilization	= calc_cpu_util(0.0);
 	local_service_demand	= calc_service_demand(bytes_sent,
 						      0.0,
 						      0.0,
 						      0);
       }
       else {
 	local_cpu_utilization	= (float) -1.0;
 	local_service_demand	= (float) -1.0;
       }

       if (remote_cpu_usage) {

 	remote_cpu_utilization	= tcp_stream_result->cpu_util;
 	remote_service_demand	= calc_service_demand(bytes_sent,
 						      0.0,
 						      remote_cpu_utilization,
 						      tcp_stream_result->num_cpus);
       }
       else {
 	remote_cpu_utilization = (float) -1.0;
 	remote_service_demand  = (float) -1.0;
       }
     }
     else {
       /* we were not measuring cpu, for the confidence stuff, we */
       /* should make it -1.0 */
       local_cpu_utilization	= (float) -1.0;
       local_service_demand	= (float) -1.0;
       remote_cpu_utilization = (float) -1.0;
       remote_service_demand  = (float) -1.0;
     }

     /* at this point, we want to calculate the confidence information. */
     /* if debugging is on, calculate_confidence will print-out the */
     /* parameters we pass it */

     calculate_confidence(confidence_iteration,
 			 elapsed_time,
 			 thruput,
 			 local_cpu_utilization,
 			 remote_cpu_utilization,
 			 local_service_demand,
 			 remote_service_demand);

     confidence_iteration++;
   }

   /* at this point, we have finished making all the runs that we */
   /* will be making. so, we should extract what the calcuated values */
   /* are for all the confidence stuff. we could make the values */
   /* global, but that seemed a little messy, and it did not seem worth */
   /* all the mucking with header files. so, we create a routine much */
   /* like calcualte_confidence, which just returns the mean values. */
   /* raj 11/94 */

   retrieve_confident_values(&elapsed_time,
 			    &thruput,
 			    &local_cpu_utilization,
 			    &remote_cpu_utilization,
 			    &local_service_demand,
 			    &remote_service_demand);

   /* We are now ready to print all the information. If the user */
   /* has specified zero-level verbosity, we will just print the */
   /* local service demand, or the remote service demand. If the */
   /* user has requested verbosity level 1, he will get the basic */
   /* "streamperf" numbers. If the user has specified a verbosity */
   /* of greater than 1, we will display a veritable plethora of */
   /* background information from outside of this block as it it */
   /* not cpu_measurement specific...  */

   if (confidence < 0) {
     /* we did not hit confidence, but were we asked to look for it? */
     if (iteration_max > 1) {
       display_confidence();
     }
   }

   if (local_cpu_usage || remote_cpu_usage) {
     local_cpu_method = format_cpu_method(cpu_method);
     remote_cpu_method = format_cpu_method(tcp_stream_result->cpu_method);

     switch (verbosity) {
     case 0:

     if (local_cpu_usage) {
 	fprintf(where,
 		cpu_fmt_0,
 		local_service_demand,
 		local_cpu_method,
 		((print_headers) ||
 		 (result_brand == NULL)) ? "" : result_brand);
       }

       else {
 	fprintf(where,
 		cpu_fmt_0,
 		remote_service_demand,
 		remote_cpu_method,
 		((print_headers) ||
 		 (result_brand == NULL)) ? "" : result_brand);
       }

       break;

     case 1:
     case 2:
       if (print_headers) {
 	fprintf(where,
 		cpu_title,
 		format_units(),
 		local_cpu_method,
 		remote_cpu_method);
       }

       fprintf(where,
 	      cpu_fmt_1,		/* the format string */
 	      rsr_size,		        /* remote recvbuf size */
 	      lss_size,		        /* local sendbuf size */
 	      send_size,		/* how large were the sends */
 	      elapsed_time,		/* how long was the test */
 	      thruput, 		        /* what was the xfer rate */
 	      local_cpu_utilization,	/* local cpu */
 	      remote_cpu_utilization,	/* remote cpu */
 	      local_service_demand,	/* local service demand */
 	      remote_service_demand,	/* remote service demand */
 	      ((print_headers) ||
 	       (result_brand == NULL)) ? "" : result_brand);
       break;
     }

   }

   else {
     /* The tester did not wish to measure service demand. */

     switch (verbosity) {

     case 0:

       fprintf(where,
 	      tput_fmt_0,
 	      thruput,
 	      ((print_headers) ||
 	       (result_brand == NULL)) ? "" : result_brand);
       break;

     case 1:
     case 2:

       if (print_headers) {
 	fprintf(where,tput_title,format_units());
       }

       fprintf(where,
 	      tput_fmt_1,		/* the format string */
 	      rsr_size, 		/* remote recvbuf size */
 	      lss_size, 		/* local sendbuf size */
 	      send_size,		/* how large were the sends */
 	      elapsed_time, 		/* how long did it take */
 	      thruput,                  /* how fast did it go */
 	      ((print_headers) ||
 	       (result_brand == NULL)) ? "" : result_brand);
       break;
     }
   }

   /* it would be a good thing to include information about some of the */
   /* other parameters that may have been set for this test, but at the */
   /* moment, I do not wish to figure-out all the  formatting, so I will */
   /* just put this comment here to help remind me that it is something */
   /* that should be done at a later time. */

     if (verbosity > 1) {

     /* The user wanted to know it all, so we will give it to him. */
     /* This information will include as much as we can find about */
     /* TCP statistics, the alignments of the sends and receives */
     /* and all that sort of rot... */

     /* this stuff needs to be worked-out in the presence of confidence */
     /* intervals and multiple iterations of the test... raj 11/94 */

     fprintf(where,
 	    ksink_fmt,
 	    "Bytes",
 	    "Bytes",
 	    "Bytes",
 	    local_send_align,
 	    remote_recv_align,
 	    local_send_offset,
 	    remote_recv_offset,
 	    bytes_sent,
 	    bytes_sent / (double)nummessages,
 	    nummessages,
 	    bytes_sent / (double)tcp_stream_result->recv_calls,
 	    tcp_stream_result->recv_calls);

     fprintf(where,
 	    ksink_fmt2,
 	    tcp_mss);

     fflush(where);

 #ifdef WANT_HISTOGRAM

     fprintf(where,"\n\nHistogram of time spent in send() call.\n");
     fflush(where);
     HIST_report(time_hist);
 #endif /* WANT_HISTOGRAM */
   }
 }

 #endif /* HAVE_SENDFILE */

 /* recv_tcp_stream() - netserver (receiving) side of the TCP_STREAM test.
  *
  * Takes no arguments and returns nothing: the test parameters are read
  * from the request held in the global netperf_request, and both
  * replies are built in the global netperf_response.
  *
  * The routine runs in three phases:
  *   1. create the listen socket as the request asks, size the receive
  *      ring, and send a TCP_STREAM_RESPONSE carrying the data port
  *      number and the socket settings found in the globals afterwards;
  *   2. accept() the data connection, start a timer of test_length +
  *      PAD_TIME, and recv() until the peer shuts down (recv() returns
  *      zero) or times_up becomes non-zero;
  *   3. shut down our sending side, stop the CPU measurement, and send
  *      the byte count, recv() call count, elapsed time and (when
  *      requested) CPU utilization back as the results.
  *
  * Errors are reported by storing errno in serv_errno, sending the
  * response and calling exit(1).  A failed accept() exits without
  * sending anything. */

 void
 recv_tcp_stream()
 {

   struct sockaddr_storage myaddr_in, peeraddr_in;
   SOCKET s_listen,s_data;
   netperf_socklen_t addrlen;
   int    len = 0;
   unsigned int   receive_calls;
   float  elapsed_time;
   double bytes_received;

   struct ring_elt *recv_ring;

   struct addrinfo *local_res;
   char local_name[BUFSIZ];
   char port_buffer[PORTBUFSIZE];

 #ifdef DO_SELECT
   fd_set readfds;
   struct timeval timeout;
 #endif /* DO_SELECT */

   struct tcp_stream_request_struct   *tcp_stream_request;
   struct tcp_stream_response_struct  *tcp_stream_response;
   struct tcp_stream_results_struct   *tcp_stream_results;

 #ifdef DO_SELECT
   FD_ZERO(&readfds);
   timeout.tv_sec = 1;
   timeout.tv_usec = 0;
 #endif /* DO_SELECT */

   /* The request, the setup response and the final results are all */
   /* views onto the test-specific area of the control messages. Note */
   /* that the response and the results share the same storage. */
   tcp_stream_request =
     (struct tcp_stream_request_struct *)netperf_request.content.test_specific_data;
   tcp_stream_response =
     (struct tcp_stream_response_struct *)netperf_response.content.test_specific_data;
   tcp_stream_results =
     (struct tcp_stream_results_struct *)netperf_response.content.test_specific_data;

   if (debug) {
     fprintf(where,"netserver: recv_tcp_stream: entered...\n");
     fflush(where);
   }

   /* We want to set-up the listen socket with all the desired */
   /* parameters and then let the initiator know that all is ready. If */
   /* socket size defaults are to be used, then the initiator will have */
   /* sent us 0's. If the socket sizes cannot be changed, then we will */
   /* send-back what they are. If that information cannot be determined, */
   /* then we send-back -1's for the sizes. */

   /* The response type is set first so that, if anything goes wrong, */
   /* the error the remote reports to the user is the one we actually */
   /* hit rather than an "unexpected response type" message. */

   if (debug) {
     fprintf(where,"recv_tcp_stream: setting the response type...\n");
     fflush(where);
   }

   netperf_response.content.response_type = TCP_STREAM_RESPONSE;

   if (debug) {
     fprintf(where,"recv_tcp_stream: the response type is set...\n");
     fflush(where);
   }

   if (debug) {
     fprintf(where,"recv_tcp_stream: requested alignment of %d\n",
             tcp_stream_request->recv_alignment);
     fflush(where);
   }

   /* create_data_socket expects to find some things in the global */
   /* variables, so set the globals based on the values in the request. */
   /* once the socket has been created, we will set the response values */
   /* based on the updated value of those globals. raj 7/94 */
   lss_size_req = tcp_stream_request->send_buf_size;
   lsr_size_req = tcp_stream_request->recv_buf_size;
   loc_nodelay  = tcp_stream_request->no_delay;
   loc_rcvavoid = tcp_stream_request->so_rcvavoid;
   loc_sndavoid = tcp_stream_request->so_sndavoid;

   set_hostname_and_port(local_name,
                         port_buffer,
                         nf_to_af(tcp_stream_request->ipfamily),
                         tcp_stream_request->port);

   local_res = complete_addrinfo(local_name,
                                 local_name,
                                 port_buffer,
                                 nf_to_af(tcp_stream_request->ipfamily),
                                 SOCK_STREAM,
                                 IPPROTO_TCP,
                                 0);

   s_listen = create_data_socket(local_res);

   if (s_listen == INVALID_SOCKET) {
     netperf_response.content.serv_errno = errno;
     send_response();
     exit(1);
   }

 #ifdef WIN32
   /* The test timer can fire during operations on the listening socket,
      so to make the start_timer below work we have to move
      it to close s_listen while we are blocked on accept. */
   win_kludge_socket2 = s_listen;
 #endif

   /* what sort of sizes did we end-up with? a requested receive size */
   /* of zero means "use the socket buffer size", falling back to 4096 */
   /* when that size is not positive. */
   if (tcp_stream_request->receive_size == 0) {
     if (lsr_size > 0) {
       recv_size = lsr_size;
     }
     else {
       recv_size = 4096;
     }
   }
   else {
     recv_size = tcp_stream_request->receive_size;
   }

   /* we want to set-up our recv_ring in a manner analogous to what we */
   /* do on the sending side. this is more for the sake of symmetry */
   /* than for the needs of say copy avoidance, but it might also be */
   /* more realistic - this way one could conceivably go with a */
   /* double-buffering scheme when taking the data and putting it into */
   /* the filesystem or something like that. raj 7/94 */

   if (recv_width == 0) {
     recv_width = (lsr_size/recv_size) + 1;
     if (recv_width == 1) recv_width++;
   }

   recv_ring = allocate_buffer_ring(recv_width,
                                    recv_size,
                                    tcp_stream_request->recv_alignment,
                                    tcp_stream_request->recv_offset);

   if (debug) {
     fprintf(where,"recv_tcp_stream: receive alignment and offset set...\n");
     fflush(where);
   }

   /* Now, let's set-up the socket to listen for connections */
   if (listen(s_listen, 5) == SOCKET_ERROR) {
     /* errno is captured before close() gets a chance to change it */
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();

     exit(1);
   }


   /* now get the port number assigned by the system  */
   addrlen = sizeof(myaddr_in);
   if (getsockname(s_listen,
                   (struct sockaddr *)&myaddr_in,
                   &addrlen) == SOCKET_ERROR){
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();

     exit(1);
   }

   /* Now myaddr_in contains the port and the internet address. The */
   /* port is returned to the sender, also implicitly telling the */
   /* sender that the socket buffer sizing has been done. */

   tcp_stream_response->data_port_number =
     (int) ntohs(((struct sockaddr_in *)&myaddr_in)->sin_port);
   netperf_response.content.serv_errno   = 0;

   /* But wait, there's more. If the initiator wanted cpu measurements, */
   /* then we must call the calibrate routine, which will return the max */
   /* rate back to the initiator. If the CPU was not to be measured the */
   /* rate reported stays at 0.0. */

   tcp_stream_response->cpu_rate = (float)0.0; 	/* assume no cpu */
   if (tcp_stream_request->measure_cpu) {
     tcp_stream_response->measure_cpu = 1;
     tcp_stream_response->cpu_rate =
       calibrate_local_cpu(tcp_stream_request->cpu_rate);
   }
   else {
     tcp_stream_response->measure_cpu = 0;
   }

   /* before we send the response back to the initiator, pull some of */
   /* the socket parms from the globals */
   tcp_stream_response->send_buf_size = lss_size;
   tcp_stream_response->recv_buf_size = lsr_size;
   tcp_stream_response->no_delay = loc_nodelay;
   tcp_stream_response->so_rcvavoid = loc_rcvavoid;
   tcp_stream_response->so_sndavoid = loc_sndavoid;
   tcp_stream_response->receive_size = recv_size;

   send_response();

   addrlen = sizeof(peeraddr_in);

   if ((s_data=accept(s_listen,
                      (struct sockaddr *)&peeraddr_in,
                      &addrlen)) == INVALID_SOCKET) {
     /* Let's just punt. No response is sent from here. */
     close(s_listen);
     exit(1);
   }

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR when the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
   win_kludge_socket = s_data;
   win_kludge_socket2 = INVALID_SOCKET;
 #endif /* WIN32 */

   times_up = 0;

   /* the timer runs PAD_TIME longer than the requested test length */
   start_timer(tcp_stream_request->test_length + PAD_TIME);

 #ifdef KLUDGE_SOCKET_OPTIONS
   /* this is for those systems which *INCORRECTLY* fail to pass */
   /* attributes across an accept() call. Including this goes against */
   /* my better judgement :( raj 11/95 */

   kludge_socket_options(s_data);

 #endif /* KLUDGE_SOCKET_OPTIONS */

   /* Now it's time to start receiving data on the connection. We will */
   /* first grab the appropriate counters and then start grabbing. */

   cpu_start(tcp_stream_request->measure_cpu);

   /* The loop will exit when the sender does a shutdown, which will */
   /* return a length of zero, or once times_up has been set. */

   /* there used to be an #ifdef DIRTY call to access_buffer() here,
      but we have switched from accessing the buffer before the recv()
      call to accessing the buffer after the recv() call.  The
      accessing before was, IIRC, related to having dirty data when
      doing page-flipping copy avoidance. */

   bytes_received = 0;
   receive_calls  = 0;

   while (!times_up && ((len = recv(s_data, recv_ring->buffer_ptr, recv_size, 0)) != 0)) {
     if (len == SOCKET_ERROR) {
       if (times_up) {
         /* the recv() failed because the end-of-test timer went off */
         /* while we were blocked in it. that is the end of the test, */
         /* not a socket failure, so stop receiving and report what */
         /* was collected instead of sending an error and exiting. */
         break;
       }
       netperf_response.content.serv_errno = errno;
       send_response();
       exit(1);
     }
     bytes_received += len;
     receive_calls++;

 #ifdef DIRTY
     /* we access the buffer after the recv() call now, rather than before */
     access_buffer(recv_ring->buffer_ptr,
                   recv_size,
                   tcp_stream_request->dirty_count,
                   tcp_stream_request->clean_count);
 #endif /* DIRTY */


     /* move to the next buffer in the recv_ring */
     recv_ring = recv_ring->next;

 #ifdef PAUSE
     sleep(1);
 #endif /* PAUSE */

 #ifdef DO_SELECT
     FD_SET(s_data,&readfds);
     select(s_data+1,&readfds,NULL,NULL,&timeout);
 #endif /* DO_SELECT */

   }

   /* perform a shutdown to signal the sender that */
   /* we have received all the data sent. raj 4/93 */

   if (shutdown(s_data,SHUT_WR) == SOCKET_ERROR) {
     netperf_response.content.serv_errno = errno;
     send_response();
     exit(1);
   }

   cpu_stop(tcp_stream_request->measure_cpu,&elapsed_time);

   /* send the results to the sender */

   if (debug) {
     fprintf(where,
             "recv_tcp_stream: got %g bytes\n",
             bytes_received);
     /* receive_calls is unsigned, hence %u */
     fprintf(where,
             "recv_tcp_stream: got %u recvs\n",
             receive_calls);
     fflush(where);
   }

   tcp_stream_results->bytes_received = htond(bytes_received);
   tcp_stream_results->elapsed_time   = elapsed_time;
   tcp_stream_results->recv_calls     = receive_calls;

   tcp_stream_results->cpu_method = cpu_method;
   tcp_stream_results->num_cpus   = lib_num_loc_cpus;

   if (tcp_stream_request->measure_cpu) {
     tcp_stream_results->cpu_util = calc_cpu_util(0.0);
   }

   if (debug) {
     fprintf(where,
             "recv_tcp_stream: test complete, sending results.\n");
     fprintf(where,
             "                 bytes_received %g receive_calls %u\n",
             bytes_received,
             receive_calls);
     fprintf(where,
             "                 len %d\n",
             len);
     fflush(where);
   }

   send_response();

   /* we are now done with the sockets */
   close(s_data);
   close(s_listen);

 }

 /* recv_tcp_maerts() - netserver side of the TCP_MAERTS test, in which
    the netserver is the side that sends the data.

    Takes no arguments and returns nothing: the test parameters are
    read from the request held in the global netperf_request, and both
    replies are built in the global netperf_response.

    The routine runs in three phases:
      1. create the listen socket as the request asks, size the send
         ring, and send a TCP_MAERTS_RESPONSE carrying the data port
         number and the socket settings found in the globals afterwards;
      2. start the timer and the CPU measurement, accept() the data
         connection, and send() until times_up becomes non-zero or a
         send() comes back short or interrupted;
      3. shut down our sending side, wait in recv() for the remote to
         finish, stop the CPU measurement, and send the byte count,
         send() call count, elapsed time and (when requested) CPU
         utilization back as the results.

    Errors are reported by storing errno in serv_errno, sending the
    response and calling exit(1).  A failed accept() exits without
    sending anything. */

 void
 recv_tcp_maerts()
 {

   struct sockaddr_storage myaddr_in, peeraddr_in;
   struct addrinfo *local_res;
   char  local_name[BUFSIZ];
   char  port_buffer[PORTBUFSIZE];

   SOCKET s_listen,s_data;
   netperf_socklen_t addrlen;
   int    len;
   unsigned int   send_calls;
   float  elapsed_time;
   double bytes_sent = 0.0 ;

   struct ring_elt *send_ring;

   struct tcp_maerts_request_struct   *tcp_maerts_request;
   struct tcp_maerts_response_struct  *tcp_maerts_response;
   struct tcp_maerts_results_struct   *tcp_maerts_results;

   /* The request, the setup response and the final results are all
      views onto the test-specific area of the control messages. Note
      that the response and the results share the same storage. */
   tcp_maerts_request =
     (struct tcp_maerts_request_struct *)netperf_request.content.test_specific_data;
   tcp_maerts_response =
     (struct tcp_maerts_response_struct *)netperf_response.content.test_specific_data;
   tcp_maerts_results =
     (struct tcp_maerts_results_struct *)netperf_response.content.test_specific_data;

   if (debug) {
     fprintf(where,"netserver: recv_tcp_maerts: entered...\n");
     fflush(where);
   }

   /* We want to set-up the listen socket with all the desired
      parameters and then let the initiator know that all is ready. If
      socket size defaults are to be used, then the initiator will have
      sent us 0's. If the socket sizes cannot be changed, then we will
      send-back what they are. If that information cannot be
      determined, then we send-back -1's for the sizes. */

   /* The response type is set first so that, if anything goes wrong,
      the error the remote reports to the user is the one we actually
      hit rather than an "unexpected response type" message. */

   if (debug) {
     fprintf(where,"recv_tcp_maerts: setting the response type...\n");
     fflush(where);
   }

   netperf_response.content.response_type = TCP_MAERTS_RESPONSE;

   if (debug) {
     fprintf(where,"recv_tcp_maerts: the response type is set...\n");
     fflush(where);
   }

   if (debug) {
     fprintf(where,"recv_tcp_maerts: requested alignment of %d\n",
             tcp_maerts_request->send_alignment);
     fflush(where);
   }

   /* Grab a socket to listen on, and then listen on it. */

   if (debug) {
     fprintf(where,"recv_tcp_maerts: grabbing a socket...\n");
     fflush(where);
   }

   /* create_data_socket expects to find some things in the global */
   /* variables, so set the globals based on the values in the request. */
   /* once the socket has been created, we will set the response values */
   /* based on the updated value of those globals. raj 7/94 */
   lss_size_req = tcp_maerts_request->send_buf_size;
   lsr_size_req = tcp_maerts_request->recv_buf_size;
   loc_nodelay = tcp_maerts_request->no_delay;
   loc_rcvavoid = tcp_maerts_request->so_rcvavoid;
   loc_sndavoid = tcp_maerts_request->so_sndavoid;

   set_hostname_and_port(local_name,
                         port_buffer,
                         nf_to_af(tcp_maerts_request->ipfamily),
                         tcp_maerts_request->port);

   local_res = complete_addrinfo(local_name,
                                 local_name,
                                 port_buffer,
                                 nf_to_af(tcp_maerts_request->ipfamily),
                                 SOCK_STREAM,
                                 IPPROTO_TCP,
                                 0);

   s_listen = create_data_socket(local_res);

   if (s_listen == INVALID_SOCKET) {
     netperf_response.content.serv_errno = errno;
     send_response();
     exit(1);
   }

 #ifdef WIN32
   /* The test timer can fire during operations on the listening socket,
      so to make the start_timer below work we have to move
      it to close s_listen while we are blocked on accept. */
   win_kludge_socket2 = s_listen;
 #endif


   /* what sort of sizes did we end-up with? a requested send size of */
   /* zero means "use the socket buffer size", falling back to 4096 */
   /* when that size is not positive. */
   if (tcp_maerts_request->send_size == 0) {
     if (lss_size > 0) {
       send_size = lss_size;
     }
     else {
       send_size = 4096;
     }
   }
   else {
     send_size = tcp_maerts_request->send_size;
   }

   /* we are the sending side in this test, so the width of the */
   /* send_ring is derived from the send socket buffer size (lss_size), */
   /* matching the default send_size chosen just above. it always ends */
   /* up being at least two buffers wide. */

   if (send_width == 0) {
     send_width = (lss_size/send_size) + 1;
     if (send_width == 1) send_width++;
   }

   send_ring = allocate_buffer_ring(send_width,
                                    send_size,
                                    tcp_maerts_request->send_alignment,
                                    tcp_maerts_request->send_offset);

   if (debug) {
     fprintf(where,"recv_tcp_maerts: send alignment and offset set...\n");
     fflush(where);
   }

   /* Now, let's set-up the socket to listen for connections */
   if (listen(s_listen, 5) == SOCKET_ERROR) {
     /* errno is captured before close() gets a chance to change it */
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();

     exit(1);
   }


   /* now get the port number assigned by the system  */
   addrlen = sizeof(myaddr_in);
   if (getsockname(s_listen,
                   (struct sockaddr *)&myaddr_in,
                   &addrlen) == SOCKET_ERROR){
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();

     exit(1);
   }

   /* Now myaddr_in contains the port and the internet address. The */
   /* port is returned to the initiator, also implicitly telling it */
   /* that the socket buffer sizing has been done. */

   tcp_maerts_response->data_port_number =
     (int) ntohs(((struct sockaddr_in *)&myaddr_in)->sin_port);
   netperf_response.content.serv_errno   = 0;

   /* But wait, there's more. If the initiator wanted cpu measurements, */
   /* then we must call the calibrate routine, which will return the max */
   /* rate back to the initiator. If the CPU was not to be measured the */
   /* rate reported stays at 0.0. */

   tcp_maerts_response->cpu_rate = (float)0.0; 	/* assume no cpu */
   if (tcp_maerts_request->measure_cpu) {
     tcp_maerts_response->measure_cpu = 1;
     tcp_maerts_response->cpu_rate =
       calibrate_local_cpu(tcp_maerts_request->cpu_rate);
   }
   else {
     tcp_maerts_response->measure_cpu = 0;
   }

   /* before we send the response back to the initiator, pull some of */
   /* the socket parms from the globals */
   tcp_maerts_response->send_buf_size = lss_size;
   tcp_maerts_response->recv_buf_size = lsr_size;
   tcp_maerts_response->no_delay = loc_nodelay;
   tcp_maerts_response->so_rcvavoid = loc_rcvavoid;
   tcp_maerts_response->so_sndavoid = loc_sndavoid;
   tcp_maerts_response->send_size = send_size;

   send_response();

   addrlen = sizeof(peeraddr_in);

   /* we will start the timer before the accept() to be somewhat
      analogous to the starting of the timer before the connect() call
      in the TCP_STREAM test. raj 2002-06-21 */

   start_timer(tcp_maerts_request->test_length);

   /* Now it's time to start sending data on the connection. We will
      first grab the appropriate counters and then start sending. */

   cpu_start(tcp_maerts_request->measure_cpu);


   if ((s_data=accept(s_listen,
                      (struct sockaddr *)&peeraddr_in,
                      &addrlen)) == INVALID_SOCKET) {
     /* Let's just punt. No response is sent from here. */
     close(s_listen);
     exit(1);
   }

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR when the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
   win_kludge_socket = s_data;
   win_kludge_socket2 = INVALID_SOCKET;
 #endif /* WIN32 */

 #ifdef KLUDGE_SOCKET_OPTIONS

   /* this is for those systems which *INCORRECTLY* fail to pass
      attributes across an accept() call. Including this goes against
      my better judgement :( raj 11/95 */

   kludge_socket_options(s_data);

 #endif /* KLUDGE_SOCKET_OPTIONS */

   /* The loop will exit once times_up has been set, or when a send() */
   /* comes back short or interrupted. */

   bytes_sent = 0.0;
   send_calls  = 0;

   len = 0;   /* nt-lint; len is not initialized (printf far below) if
                 times_up initially true.*/
   times_up = 0; /* must remember to initialize this little beauty */
   while (!times_up) {

 #ifdef DIRTY
     /* we want to dirty some number of consecutive integers in the buffer */
     /* we are about to send. we may also want to bring some number of */
     /* them cleanly into the cache. The clean ones will follow any dirty */
     /* ones into the cache. */

     access_buffer(send_ring->buffer_ptr,
                   send_size,
                   tcp_maerts_request->dirty_count,
                   tcp_maerts_request->clean_count);

 #endif /* DIRTY */

     if((len=send(s_data,
                  send_ring->buffer_ptr,
                  send_size,
                  0)) != send_size) {
       if ((len >=0) || SOCKET_EINTR(len)) {
         /* the test was interrupted, must be the end of test */
         break;
       }
       netperf_response.content.serv_errno = errno;
       send_response();
       exit(1);
     }

     bytes_sent += len;
     send_calls++;

     /* move to the next buffer in the send_ring */
     send_ring = send_ring->next;

   }

   /* perform a shutdown to signal the remote that */
   /* we have finished sending data. */

   if (shutdown(s_data,SHUT_WR) == SOCKET_ERROR) {
     netperf_response.content.serv_errno = errno;
     send_response();
     exit(1);
   }

   /* hang a recv() off the socket to block until the remote has
      brought all the data up into the application. it will do a
      shutdown to cause a FIN to be sent our way. We will assume that
      any exit from the recv() call is good... raj 4/93 */

   recv(s_data, send_ring->buffer_ptr, send_size, 0);


   cpu_stop(tcp_maerts_request->measure_cpu,&elapsed_time);

   /* send the results to the initiator */

   if (debug) {
     fprintf(where,
             "recv_tcp_maerts: sent %g bytes\n",
             bytes_sent);
     /* send_calls is unsigned, hence %u */
     fprintf(where,
             "recv_tcp_maerts: did %u sends\n",
             send_calls);
     fflush(where);
   }

   tcp_maerts_results->bytes_sent   = htond(bytes_sent);
   tcp_maerts_results->elapsed_time = elapsed_time;
   tcp_maerts_results->send_calls   = send_calls;

   if (tcp_maerts_request->measure_cpu) {
     tcp_maerts_results->cpu_util = calc_cpu_util(0.0);
   }

   if (debug) {
     fprintf(where,
             "recv_tcp_maerts: test complete, sending results.\n");
     fprintf(where,
             "                 bytes_sent %g send_calls %u\n",
             bytes_sent,
             send_calls);
     fprintf(where,
             "                 len %d\n",
             len);
     fflush(where);
   }

   tcp_maerts_results->cpu_method = cpu_method;
   tcp_maerts_results->num_cpus   = lib_num_loc_cpus;
   send_response();

   /* we are now done with the sockets */
   close(s_data);
   close(s_listen);

 }


  /* this routine implements the sending (netperf) side of the TCP_RR */
  /* test. */

 void
 send_tcp_rr(char remote_host[])
 {

   char *tput_title = "\
 Local /Remote\n\
 Socket Size   Request  Resp.   Elapsed  Trans.\n\
 Send   Recv   Size     Size    Time     Rate         \n\
 bytes  Bytes  bytes    bytes   secs.    per sec   \n\n";

   char *tput_title_band = "\
 Local /Remote\n\
 Socket Size   Request  Resp.   Elapsed  \n\
 Send   Recv   Size     Size    Time     Throughput \n\
 bytes  Bytes  bytes    bytes   secs.    %s/sec   \n\n";

   char *tput_fmt_0 =
     "%7.2f %s\n";

   char *tput_fmt_1_line_1 = "\
 %-6d %-6d %-6d   %-6d  %-6.2f   %7.2f   %s\n";
   char *tput_fmt_1_line_2 = "\
 %-6d %-6d\n";

   char *cpu_title = "\
 Local /Remote\n\
 Socket Size   Request Resp.  Elapsed Trans.   CPU    CPU    S.dem   S.dem\n\
 Send   Recv   Size    Size   Time    Rate     local  remote local   remote\n\
 bytes  bytes  bytes   bytes  secs.   per sec  %% %c    %% %c    us/Tr   us/Tr\n\n";

   char *cpu_title_tput = "\
 Local /Remote\n\
 Socket Size   Request Resp.  Elapsed Tput     CPU    CPU    S.dem   S.dem\n\
 Send   Recv   Size    Size   Time    %-8.8s local  remote local   remote\n\
 bytes  bytes  bytes   bytes  secs.   per sec  %% %c    %% %c    us/Tr   us/Tr\n\n";

   char *cpu_title_latency = "\
 Local /Remote\n\
 Socket Size   Request Resp.  Elapsed Latency  CPU    CPU    S.dem   S.dem\n\
 Send   Recv   Size    Size   Time    usecs    local  remote local   remote\n\
 bytes  bytes  bytes   bytes  secs.   per tran %% %c    %% %c    us/Tr   us/Tr\n\n";

   char *cpu_fmt_0 =
     "%6.3f %c %s\n";

   char *cpu_fmt_1_line_1 = "\
 %-6d %-6d %-6d  %-6d %-6.2f  %-6.2f  %-6.2f %-6.2f %-6.3f  %-6.3f %s\n";

   char *cpu_fmt_1_line_2 = "\
 %-6d %-6d\n";

   char *ksink_fmt = "\
 Alignment      Offset         RoundTrip  Trans    Throughput\n\
 Local  Remote  Local  Remote  Latency    Rate     %-8.8s/s\n\
 Send   Recv    Send   Recv    usec/Tran  per sec  Outbound   Inbound\n\
 %5d  %5d   %5d  %5d   %-6.3f   %-6.3f %-6.3f    %-6.3f\n";


   int			timed_out = 0;
   float			elapsed_time;

   int	len;
   char	*temp_message_ptr;
   int	nummessages;
   SOCKET	send_socket;
   int	trans_remaining;
   double	bytes_xferd;

   struct ring_elt *send_ring;
   struct ring_elt *recv_ring;

   int	rsp_bytes_left;
   int	rsp_bytes_recvd;

   float	local_cpu_utilization;
   float	local_service_demand;
   float	remote_cpu_utilization;
   float	remote_service_demand;
   double	thruput;

   struct addrinfo *local_res;
   struct addrinfo *remote_res;

   struct	tcp_rr_request_struct	*tcp_rr_request;
   struct	tcp_rr_response_struct	*tcp_rr_response;
   struct	tcp_rr_results_struct	*tcp_rr_result;

 #ifdef WANT_FIRST_BURST
 #define REQUEST_CWND_INITIAL 2
   /* "in the beginning..." the WANT_FIRST_BURST stuff was like both
       Unix and the state of New Jersey - both were simple and unspoiled.
      then it was realized that some stacks are quite picky about
      initial congestion windows and a non-trivial initial burst of
      requests would not be individual segments even with TCP_NODELAY
      set. so, we have to start tracking a poor-man's congestion window
      up here in window space because we want to try to make something
      happen that frankly, we cannot guarantee with the specification
      of TCP.  ain't that grand?-)  raj 2006-01-30 */
   int requests_outstanding = 0;
   int request_cwnd = REQUEST_CWND_INITIAL;  /* we ass-u-me that having
 					       three requests
 					       outstanding at the
 					       beginning of the test
 					       is ok with TCP stacks
 					       of interest. the first
 					       two will come from our
 					       first_burst loop, and
 					       the third from our
 					       regularly scheduled
 					       send */
 #endif

   tcp_rr_request =
     (struct tcp_rr_request_struct *)netperf_request.content.test_specific_data;
   tcp_rr_response=
     (struct tcp_rr_response_struct *)netperf_response.content.test_specific_data;
   tcp_rr_result	=
     (struct tcp_rr_results_struct *)netperf_response.content.test_specific_data;

 #ifdef WANT_HISTOGRAM
   if (verbosity > 1) {
     time_hist = HIST_new();
   }
 #endif /* WANT_HISTOGRAM */

   /* since we are now disconnected from the code that established the */
   /* control socket, and since we want to be able to use different */
   /* protocols and such, we are passed the name of the remote host and */
   /* must turn that into the test specific addressing information. */

   complete_addrinfos(&remote_res,
 		     &local_res,
 		     remote_host,
 		     SOCK_STREAM,
 		     IPPROTO_TCP,
 		     0);

   if ( print_headers ) {
     print_top_test_header("TCP REQUEST/RESPONSE TEST",local_res,remote_res);
   }

   /* initialize a few counters */

   send_ring = NULL;
   recv_ring = NULL;
   confidence_iteration = 1;
   init_stat();

   /* we have a great-big while loop which controls the number of times */
   /* we run a particular test. this is for the calculation of a */
   /* confidence interval (I really should have stayed awake during */
   /* probstats :). If the user did not request confidence measurement */
   /* (no confidence is the default) then we will only go though the */
   /* loop once. the confidence stuff originates from the folks at IBM */

   while (((confidence < 0) && (confidence_iteration < iteration_max)) ||
 	 (confidence_iteration <= iteration_min)) {

     /* initialize a few counters. we have to remember that we might be */
     /* going through the loop more than once. */

     nummessages     = 0;
     bytes_xferd     = 0.0;
     times_up        = 0;
     timed_out       = 0;
     trans_remaining = 0;

 #ifdef WANT_FIRST_BURST
     /* we have to remember to reset the number of transactions
        outstanding and the "congestion window for each new
        iteration. raj 2006-01-31 */
     requests_outstanding = 0;
     request_cwnd = REQUEST_CWND_INITIAL;
 #endif


     /* set-up the data buffers with the requested alignment and offset. */
     /* since this is a request/response test, default the send_width and */
     /* recv_width to 1 and not two raj 7/94 */

     if (send_width == 0) send_width = 1;
     if (recv_width == 0) recv_width = 1;

     if (send_ring == NULL) {
       send_ring = allocate_buffer_ring(send_width,
 				       req_size,
 				       local_send_align,
 				       local_send_offset);
     }

     if (recv_ring == NULL) {
       recv_ring = allocate_buffer_ring(recv_width,
 				       rsp_size,
 				       local_recv_align,
 				       local_recv_offset);
     }

     /*set up the data socket                        */
     send_socket = create_data_socket(local_res);

     if (send_socket == INVALID_SOCKET){
       perror("netperf: send_tcp_rr: tcp stream data socket");
       exit(1);
     }

     if (debug) {
       fprintf(where,"send_tcp_rr: send_socket obtained...\n");
     }

     /* If the user has requested cpu utilization measurements, we must */
     /* calibrate the cpu(s). We will perform this task within the tests */
     /* themselves. If the user has specified the cpu rate, then */
     /* calibrate_local_cpu will return rather quickly as it will have */
     /* nothing to do. If local_cpu_rate is zero, then we will go through */
     /* all the "normal" calibration stuff and return the rate back.*/

     if (local_cpu_usage) {
       local_cpu_rate = calibrate_local_cpu(local_cpu_rate);
     }

     if (!no_control) {
       /* Tell the remote end to do a listen. The server alters the
 	 socket parameters on the other side at this point, hence the
 	 reason for all the values being passed in the setup
 	 message. If the user did not specify any of the parameters,
 	 they will be passed as 0, which will indicate to the remote
 	 that no changes beyond the system's default should be
 	 used. Alignment is the exception, it will default to 8, which
 	 will be no alignment alterations. */

       netperf_request.content.request_type	=	DO_TCP_RR;
       tcp_rr_request->recv_buf_size	=	rsr_size_req;
       tcp_rr_request->send_buf_size	=	rss_size_req;
       tcp_rr_request->recv_alignment    =	remote_recv_align;
       tcp_rr_request->recv_offset	=	remote_recv_offset;
       tcp_rr_request->send_alignment    =	remote_send_align;
       tcp_rr_request->send_offset	=	remote_send_offset;
       tcp_rr_request->request_size	=	req_size;
       tcp_rr_request->response_size	=	rsp_size;
       tcp_rr_request->no_delay	        =	rem_nodelay;
       tcp_rr_request->measure_cpu	=	remote_cpu_usage;
       tcp_rr_request->cpu_rate	        =	remote_cpu_rate;
       tcp_rr_request->so_rcvavoid	=	rem_rcvavoid;
       tcp_rr_request->so_sndavoid	=	rem_sndavoid;
       if (test_time) {
 	tcp_rr_request->test_length	=	test_time;
       }
       else {
 	tcp_rr_request->test_length	=	test_trans * -1;
       }
       tcp_rr_request->port              =      atoi(remote_data_port);
       tcp_rr_request->ipfamily = af_to_nf(remote_res->ai_family);

       if (debug > 1) {
 	fprintf(where,"netperf: send_tcp_rr: requesting TCP rr test\n");
       }

       send_request();

       /* The response from the remote will contain all of the relevant
 	 socket parameters for this test type. We will put them back
 	 into the variables here so they can be displayed if desired.
 	 The remote will have calibrated CPU if necessary, and will
 	 have done all the needed set-up. We will have calibrated the
 	 cpu locally before sending the request, and will grab the
 	 counter value right after the connect returns. The remote
 	 will grab the counter right after the accept call. This saves
 	 the hassle of extra messages being sent for the TCP
 	 tests.  */

       recv_response();

       if (!netperf_response.content.serv_errno) {
 	if (debug)
 	  fprintf(where,"remote listen done.\n");
 	rsr_size          = tcp_rr_response->recv_buf_size;
 	rss_size          = tcp_rr_response->send_buf_size;
 	rem_nodelay       = tcp_rr_response->no_delay;
 	remote_cpu_usage  = tcp_rr_response->measure_cpu;
 	remote_cpu_rate   = tcp_rr_response->cpu_rate;
 	/* make sure that port numbers are in network order */
 	set_port_number(remote_res,(short)tcp_rr_response->data_port_number);
       }
       else {
 	Set_errno(netperf_response.content.serv_errno);
 	fprintf(where,
 		"netperf: remote error %d",
 		netperf_response.content.serv_errno);
 	perror("");
 	fflush(where);

 	exit(1);
       }
     }

 #ifdef WANT_DEMO
     DEMO_RR_SETUP(1000)
 #endif

     /*Connect up to the remote port on the data socket  */
     if (connect(send_socket,
 		remote_res->ai_addr,
 		remote_res->ai_addrlen) == INVALID_SOCKET){
       perror("netperf: data socket connect failed");

       exit(1);
     }

 #ifdef WIN32
     /* this is used so the timer thread can close the socket out from */
     /* under us, which to date is the easiest/cleanest/least */
     /* Windows-specific way I can find to force the winsock calls to */
     /* return WSAEINTR when the test is over. anything that will run on */
     /* 95 and NT and is closer to what netperf expects from Unix signals */
     /* and such would be appreciated raj 1/96 */
     win_kludge_socket = send_socket;
 #endif /* WIN32 */

     /* Data Socket set-up is finished. If there were problems, either the */
     /* connect would have failed, or the previous response would have */
     /* indicated a problem. I failed to see the value of the extra */
     /* message after the accept on the remote. If it failed, we'll see it */
     /* here. If it didn't, we might as well start pumping data. */

     /* Set-up the test end conditions. For a request/response test, they */
     /* can be either time or transaction based. */

     if (test_time) {
       /* The user wanted to end the test after a period of time. */
       times_up = 0;
       trans_remaining = 0;
       start_timer(test_time);
     }
     else {
       /* The tester wanted to run a number of transactions. */
       trans_remaining = test_bytes;
       times_up = 1;
     }

     /* The cpu_start routine will grab the current time and possibly */
     /* value of the idle counter for later use in measuring cpu */
     /* utilization and/or service demand and thruput. */

     cpu_start(local_cpu_usage);

 #ifdef WANT_INTERVALS
     INTERVALS_INIT();
 #endif /* WANT_INTERVALS */

     /* We use an "OR" to control test execution. When the test is */
     /* controlled by time, the byte count check will always return false. */
     /* When the test is controlled by byte count, the time test will */
     /* always return false. When the test is finished, the whole */
     /* expression will go false and we will stop sending data. I think I */
     /* just arbitrarily decrement trans_remaining for the timed test, but */
     /* will not do that just yet... One other question is whether or not */
     /* the send buffer and the receive buffer should be the same buffer. */

 #ifdef WANT_DEMO
       if (demo_mode) {
 	HIST_timestamp(demo_one_ptr);
       }
 #endif

     while ((!times_up) || (trans_remaining > 0)) {
       /* send the request. we assume that if we use a blocking socket, */
       /* the request will be sent at one shot. */

 #ifdef WANT_FIRST_BURST
       /* we can inject no more than request_cwnd, which will grow with
 	 time, and no more than first_burst_size.  we don't use <= to
 	 account for the "regularly scheduled" send call.  of course
 	 that makes it more a "max_outstanding" than a
 	 "first_burst_size" but for now we won't fix the names. also,
 	 I suspect the extra check against < first_burst_size is
 	 redundant since later I expect to make sure that request_cwnd
 	 can never get larger than first_burst_size, but just at the
 	 moment I'm feeling like a belt and suspenders kind of
 	 programmer. raj 2006-01-30 */
       while ((first_burst_size > 0) &&
 	     (requests_outstanding < request_cwnd) &&
 	     (requests_outstanding < first_burst_size)) {
 	if (debug) {
 	  fprintf(where,
 		  "injecting, req_outstndng %d req_cwnd %d burst %d\n",
 		  requests_outstanding,
 		  request_cwnd,
 		  first_burst_size);
 	}
 	if ((len = send(send_socket,
 			send_ring->buffer_ptr,
 			req_size,
 			0)) != req_size) {
 	  /* we should never hit the end of the test in the first burst */
 	  perror("send_tcp_rr: initial burst data send error");
 	  exit(-1);
 	}
 	requests_outstanding += 1;
       }

 #endif /* WANT_FIRST_BURST */

 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
 	/* timestamp just before our call to send, and then again just
 	   after the receive raj 8/94 */
 	/* but only if we are actually going to display one. raj
 	   2007-02-07 */

 	HIST_timestamp(&time_one);
       }
 #endif /* WANT_HISTOGRAM */

       if ((len = send(send_socket,
 		      send_ring->buffer_ptr,
 		      req_size,
 		      0)) != req_size) {
 	if (SOCKET_EINTR(len) || (errno == 0)) {
 	  /* we hit the end of a */
 	  /* timed test. */
 	  timed_out = 1;
 	  break;
 	}
 	perror("send_tcp_rr: data send error");
 	exit(1);
       }
       send_ring = send_ring->next;

 #ifdef WANT_FIRST_BURST
       requests_outstanding += 1;
 #endif

       /* receive the response */
       rsp_bytes_left = rsp_size;
       temp_message_ptr  = recv_ring->buffer_ptr;
       while(rsp_bytes_left > 0) {
 	if((rsp_bytes_recvd=recv(send_socket,
 				 temp_message_ptr,
 				 rsp_bytes_left,
 				 0)) == SOCKET_ERROR || rsp_bytes_recvd == 0) {
 		if ( SOCKET_EINTR(rsp_bytes_recvd) ) {
 		    /* We hit the end of a timed test. */
 			timed_out = 1;
 			break;
 		}
 	  perror("send_tcp_rr: data recv error");
 	  exit(1);
 	}
 	rsp_bytes_left -= rsp_bytes_recvd;
 	temp_message_ptr  += rsp_bytes_recvd;
       }
       recv_ring = recv_ring->next;

 #ifdef WANT_FIRST_BURST
       /* so, since we've gotten a response back, update the
 	 bookkeeping accordingly.  there is one less request
 	 outstanding and we can put one more out there than before. */
       requests_outstanding -= 1;
       if (request_cwnd < first_burst_size) {
 	request_cwnd += 1;
 	if (debug) {
 	  fprintf(where,
 		  "incr req_cwnd to %d first_burst %d reqs_outstndng %d\n",
 		  request_cwnd,
 		  first_burst_size,
 		  requests_outstanding);
 	}
       }
 #endif
       if (timed_out) {
 	/* we may have been in a nested while loop - we need */
 	/* another call to break. */
 	break;
       }

 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
 	HIST_timestamp(&time_two);
 	HIST_add(time_hist,delta_micro(&time_one,&time_two));
       }
 #endif /* WANT_HISTOGRAM */

 #ifdef WANT_DEMO
       DEMO_RR_INTERVAL(1);
 #endif

 #ifdef WANT_INTERVALS
       INTERVALS_WAIT();
 #endif /* WANT_INTERVALS */

       nummessages++;
       if (trans_remaining) {
 	trans_remaining--;
       }

       if (debug > 3) {
 	if ((nummessages % 100) == 0) {
 	  fprintf(where,
 		  "Transaction %d completed\n",
 		  nummessages);
 	  fflush(where);
 	}
       }
     }

     /* At this point we used to call shutdown on the data socket to be
        sure all the data was delivered, but this was not germane in a
        request/response test, and it was causing the tests to "hang"
        when they were being controlled by time. So, I have replaced
        this shutdown call with a call to close that can be found later
        in the procedure. */

     /* this call will always give us the elapsed time for the test,
        and will also store-away the necessaries for cpu utilization */

     cpu_stop(local_cpu_usage,&elapsed_time);	/* was cpu being */
 						/* measured? how long */
 						/* did we really run? */

     if (!no_control) {
       /* Get the statistics from the remote end. The remote will have
 	 calculated CPU utilization. If it wasn't supposed to care, it
 	 will return obvious values. */

       recv_response();
       if (!netperf_response.content.serv_errno) {
 	if (debug)
 	  fprintf(where,"remote results obtained\n");
       }
       else {
 	Set_errno(netperf_response.content.serv_errno);
 	fprintf(where,"netperf: remote error %d",
 		netperf_response.content.serv_errno);
 	perror("");
 	fflush(where);
 	exit(1);
       }
     }

     /* We now calculate what our "throughput" was for the test. */

     bytes_xferd	= (req_size * nummessages) + (rsp_size * nummessages);
     thruput	= nummessages/elapsed_time;

     if (local_cpu_usage || remote_cpu_usage) {
       /* We must now do a little math for service demand and cpu
        utilization for the system(s). Of course, some of the
        information might be bogus because there was no idle counter in
        the kernel(s). We need to make a note of this for the user's
        benefit... */
       if (local_cpu_usage) {
 	local_cpu_utilization = calc_cpu_util(0.0);
  	/* since calc_service demand is doing ms/Kunit we will
 	   multiply the number of transaction by 1024 to get "good"
 	   numbers */
 	local_service_demand  = calc_service_demand((double) nummessages*1024,
 						    0.0,
 						    0.0,
 						    0);
       }
       else {
 	local_cpu_utilization	= (float) -1.0;
 	local_service_demand	= (float) -1.0;
       }

       if (remote_cpu_usage) {
 	remote_cpu_utilization = tcp_rr_result->cpu_util;
 	/* since calc_service demand is doing ms/Kunit we will
 	   multiply the number of transaction by 1024 to get "good"
 	   numbers */
 	remote_service_demand = calc_service_demand((double) nummessages*1024,
 						    0.0,
 						    remote_cpu_utilization,
 						    tcp_rr_result->num_cpus);
       }
       else {
 	remote_cpu_utilization = (float) -1.0;
 	remote_service_demand  = (float) -1.0;
       }

     }
     else {
       /* we were not measuring cpu, for the confidence stuff, we */
       /* should make it -1.0 */
       local_cpu_utilization	= (float) -1.0;
       local_service_demand	= (float) -1.0;
       remote_cpu_utilization = (float) -1.0;
       remote_service_demand  = (float) -1.0;
     }

     /* at this point, we want to calculate the confidence information.
        if debugging is on, calculate_confidence will print-out the
        parameters we pass it */

     calculate_confidence(confidence_iteration,
 			 elapsed_time,
 			 thruput,
 			 local_cpu_utilization,
 			 remote_cpu_utilization,
 			 local_service_demand,
 			 remote_service_demand);


     confidence_iteration++;

     /* we are now done with the socket, so close it */
     close(send_socket);

   }

   retrieve_confident_values(&elapsed_time,
 			    &thruput,
 			    &local_cpu_utilization,
 			    &remote_cpu_utilization,
 			    &local_service_demand,
 			    &remote_service_demand);

   /* We are now ready to print all the information. If the user has
      specified zero-level verbosity, we will just print the local
      service demand, or the remote service demand. If the user has
      requested verbosity level 1, he will get the basic "streamperf"
      numbers. If the user has specified a verbosity of greater than 1,
      we will display a veritable plethora of background information
      from outside of this block as it is not cpu_measurement
      specific...  */

   if (confidence < 0) {
     /* we did not hit confidence, but were we asked to look for it? */
     if (iteration_max > 1) {
       display_confidence();
     }
   }

   if (local_cpu_usage || remote_cpu_usage) {
     local_cpu_method = format_cpu_method(cpu_method);
     remote_cpu_method = format_cpu_method(tcp_rr_result->cpu_method);

     switch (verbosity) {
     case 0:
       if (local_cpu_usage) {
 	fprintf(where,
 		cpu_fmt_0,
 		local_service_demand,
 		local_cpu_method,
 		((print_headers) ||
 		 (result_brand == NULL)) ? "" : result_brand);
       }
       else {
 	fprintf(where,
 		cpu_fmt_0,
 		remote_service_demand,
 		remote_cpu_method,
 		((print_headers) ||
 		 (result_brand == NULL)) ? "" : result_brand);
       }
       break;
     case 1:
     case 2:
       if (print_headers) {
 	if ('x' == libfmt) {
 	  fprintf(where,
 		  cpu_title,
 		  local_cpu_method,
 		  remote_cpu_method);
 	}
 	else {
 	  fprintf(where,
 		  cpu_title_tput,
 		  format_units(),
 		  local_cpu_method,
 		  remote_cpu_method);
 	}
       }

       fprintf(where,
 	      cpu_fmt_1_line_1,		/* the format string */
 	      lss_size,		/* local sendbuf size */
 	      lsr_size,
 	      req_size,		/* how large were the requests */
 	      rsp_size,		/* guess */
 	      elapsed_time,		/* how long was the test */
 	      ('x' == libfmt) ? thruput :
 	      calc_thruput_interval_omni(thruput * (req_size+rsp_size),
 					 1.0),
 	      local_cpu_utilization,	/* local cpu */
 	      remote_cpu_utilization,	/* remote cpu */
 	      local_service_demand,	/* local service demand */
 	      remote_service_demand,	/* remote service demand */
 	      ((print_headers) ||
 	       (result_brand == NULL)) ? "" : result_brand);
       fprintf(where,
 	      cpu_fmt_1_line_2,
 	      rss_size,
 	      rsr_size);
       break;
     }
   }
   else {
     /* The tester did not wish to measure service demand. */

     switch (verbosity) {
     case 0:
       fprintf(where,
 	      tput_fmt_0,
 	      ('x' == libfmt) ? thruput :
 	      calc_thruput_interval_omni(thruput * (req_size+rsp_size),
 					 1.0),
 	      ((print_headers) ||
 	       (result_brand == NULL)) ? "" : result_brand);
       break;
     case 1:
     case 2:
       if (print_headers) {
 	fprintf(where,
 		('x' == libfmt) ? tput_title : tput_title_band,
 		format_units());
       }

       fprintf(where,
 	      tput_fmt_1_line_1,	/* the format string */
 	      lss_size,
 	      lsr_size,
 	      req_size,		/* how large were the requests */
 	      rsp_size,		/* how large were the responses */
 	      elapsed_time, 		/* how long did it take */
 	      /* are we trans or do we need to convert to bytes then
 		 bits? at this point, thruput is in our "confident"
 		 transactions per second. we can convert to a
 		 bidirectional bitrate by multiplying that by the sum
 		 of the req_size and rsp_size.  we pass that to
 		 calc_thruput_interval_omni with an elapsed time of
 		 1.0 s to get it converted to [kmg]bits/s or
 		 [KMG]Bytes/s */
 	      ('x' == libfmt) ?  thruput :
 	      calc_thruput_interval_omni(thruput * (req_size+rsp_size),
 					 1.0),
 	      ((print_headers) ||
 	       (result_brand == NULL)) ? "" : result_brand);
       fprintf(where,
 	      tput_fmt_1_line_2,
 	      rss_size, 		/* remote recvbuf size */
 	      rsr_size);

       break;
     }
   }

   /* it would be a good thing to include information about some of the */
   /* other parameters that may have been set for this test, but at the */
   /* moment, I do not wish to figure-out all the  formatting, so I will */
   /* just put this comment here to help remind me that it is something */
   /* that should be done at a later time. */

   /* how to handle the verbose information in the presence of */
   /* confidence intervals is yet to be determined... raj 11/94 */
   if (verbosity > 1) {
     /* The user wanted to know it all, so we will give it to him. */
     /* This information will include as much as we can find about */
     /* TCP statistics, the alignments of the sends and receives */
     /* and all that sort of rot... */

     /* normally, you might think that if we were messing about with
        the value of libfmt we would need to put it back again, but
        since this is basically the last thing we are going to do with
        it, it does not matter.  so there :) raj 2007-06-08 */
     /* if the user was asking for transactions, then we report
        megabits per second for the unidirectional throughput,
        otherwise we use the desired units. */
     if ('x' == libfmt) {
       libfmt = 'm';
     }

     fprintf(where,
 	    ksink_fmt,
 	    format_units(),
 	    local_send_align,
 	    remote_recv_offset,
 	    local_send_offset,
 	    remote_recv_offset,
 	    /* if the user has enabled burst mode, we have to remember
 	       to account for that in the number of transactions
 	       outstanding at any one time. otherwise we will
 	       underreport the latency of individual
 	       transactions. learned from saf by raj 2007-06-08  */
 	    (((double)1.0/thruput)*(double)1000000.0) *
 	    (double) (1 + ((first_burst_size > 0) ? first_burst_size : 0)),
 	    thruput,
 	    calc_thruput_interval_omni(thruput * (double)req_size,1.0),
 	    calc_thruput_interval_omni(thruput * (double)rsp_size,1.0));

 #ifdef WANT_HISTOGRAM
     fprintf(where,"\nHistogram of request/response times\n");
     fflush(where);
     HIST_report(time_hist);
 #endif /* WANT_HISTOGRAM */

   }

 }

 void
 send_udp_stream(char remote_host[])
 {
   /**********************************************************************/
   /*									*/
   /*               	UDP Unidirectional Send Test                    */
   /*									*/
   /**********************************************************************/

 #define UDP_LENGTH_MAX 0XFFFF - 28

   char *tput_title = "\
 Socket  Message  Elapsed      Messages                \n\
 Size    Size     Time         Okay Errors   Throughput\n\
 bytes   bytes    secs            #      #   %s/sec\n\n";

   char *tput_fmt_0 =
     "%7.2f\n";

   char *tput_fmt_1 = "\
 %6d  %6d   %-7.2f   %7d %6d    %7.2f\n\
 %6d           %-7.2f   %7d           %7.2f\n\n";


   char *cpu_title = "\
 Socket  Message  Elapsed      Messages                   CPU      Service\n\
 Size    Size     Time         Okay Errors   Throughput   Util     Demand\n\
 bytes   bytes    secs            #      #   %s/sec %% %c%c     us/KB\n\n";

   char *cpu_fmt_0 =
     "%6.2f %c\n";

   char *cpu_fmt_1 = "\
 %6d  %6d   %-7.2f   %7d %6d    %7.1f     %-6.2f   %-6.3f\n\
 %6d           %-7.2f   %7d           %7.1f     %-6.2f   %-6.3f\n\n";

   unsigned int	messages_recvd;
   unsigned int 	messages_sent;
   unsigned int	failed_sends;

   float	elapsed_time,
         local_cpu_utilization,
         remote_cpu_utilization;

   float	 local_service_demand, remote_service_demand;
   double local_thruput, remote_thruput;
   double bytes_sent;
   double bytes_recvd;


   int	len;
   struct ring_elt *send_ring;
   SOCKET 	data_socket;

   unsigned int sum_messages_sent;
   unsigned int sum_messages_recvd;
   unsigned int sum_failed_sends;
   double sum_local_thruput;

   struct addrinfo *local_res;
   struct addrinfo *remote_res;

   struct	udp_stream_request_struct	*udp_stream_request;
   struct	udp_stream_response_struct	*udp_stream_response;
   struct	udp_stream_results_struct	*udp_stream_results;

   udp_stream_request	=
     (struct udp_stream_request_struct *)netperf_request.content.test_specific_data;
   udp_stream_response	=
     (struct udp_stream_response_struct *)netperf_response.content.test_specific_data;
   udp_stream_results	=
     (struct udp_stream_results_struct *)netperf_response.content.test_specific_data;

 #ifdef WANT_HISTOGRAM
   if (verbosity > 1) {
     time_hist = HIST_new();
   }
 #endif /* WANT_HISTOGRAM */

   /* since we are now disconnected from the code that established the */
   /* control socket, and since we want to be able to use different */
   /* protocols and such, we are passed the name of the remote host and */
   /* must turn that into the test specific addressing information. */

   complete_addrinfos(&remote_res,
 		     &local_res,
 		     remote_host,
 		     SOCK_DGRAM,
 		     IPPROTO_UDP,
 		     0);

   if ( print_headers ) {
     print_top_test_header("UDP UNIDIRECTIONAL SEND TEST",local_res,remote_res);
   }

   send_ring            = NULL;
   confidence_iteration = 1;
   init_stat();
   sum_messages_sent    = 0;
   sum_messages_recvd   = 0;
   sum_failed_sends     = 0;
   sum_local_thruput    = 0.0;

   /* we have a great-big while loop which controls the number of times */
   /* we run a particular test. this is for the calculation of a */
   /* confidence interval (I really should have stayed awake during */
   /* probstats :). If the user did not request confidence measurement */
   /* (no confidence is the default) then we will only go through the */
   /* loop once. the confidence stuff originates from the folks at IBM */

   while (((confidence < 0) && (confidence_iteration < iteration_max)) ||
 	 (confidence_iteration <= iteration_min)) {

     /* initialize a few counters. we have to remember that we might be */
     /* going through the loop more than once. */
     messages_sent  = 0;
     messages_recvd = 0;
     failed_sends   = 0;
     times_up       = 0;

     /*set up the data socket			*/
     data_socket = create_data_socket(local_res);

     if (data_socket == INVALID_SOCKET){
       perror("udp_send: data socket");
       exit(1);
     }

     /* now, we want to see if we need to set the send_size */
     if (send_size == 0) {
       if (lss_size > 0) {
 	send_size = (lss_size < UDP_LENGTH_MAX ? lss_size : UDP_LENGTH_MAX);
       }
       else {
 	send_size = 4096;
       }
     }


     /* set-up the data buffer with the requested alignment and offset, */
     /* most of the numbers here are just a hack to pick something nice */
     /* and big in an attempt to never try to send a buffer a second time */
     /* before it leaves the node...unless the user set the width */
     /* explicitly. */
     if (send_width == 0) send_width = 32;

     if (send_ring == NULL ) {
       send_ring = allocate_buffer_ring(send_width,
 				       send_size,
 				       local_send_align,
 				       local_send_offset);
     }


     /* if the user supplied a cpu rate, this call will complete rather */
     /* quickly, otherwise, the cpu rate will be returned to us for */
     /* possible display. The Library will keep its own copy of this data */
     /* for use elsewhere. We will only display it. (Does that make it */
     /* "opaque" to us?) */

     if (local_cpu_usage)
       local_cpu_rate = calibrate_local_cpu(local_cpu_rate);

     if (!no_control) {
       /* Tell the remote end to set up the data connection. The server
          sends back the port number and alters the socket parameters
          there.  Of course this is a datagram service so no connection
          is actually set up, the server just sets up the socket and
          binds it. */

       netperf_request.content.request_type      = DO_UDP_STREAM;
       udp_stream_request->recv_buf_size  = rsr_size_req;
       udp_stream_request->message_size   = send_size;
       udp_stream_request->recv_connected = remote_connected;
       udp_stream_request->recv_alignment = remote_recv_align;
       udp_stream_request->recv_offset    = remote_recv_offset;
       udp_stream_request->measure_cpu    = remote_cpu_usage;
       udp_stream_request->cpu_rate       = remote_cpu_rate;
       udp_stream_request->test_length    = test_time;
       udp_stream_request->so_rcvavoid    = rem_rcvavoid;
       udp_stream_request->so_sndavoid    = rem_sndavoid;
       udp_stream_request->port           = atoi(remote_data_port);
       udp_stream_request->ipfamily = af_to_nf(remote_res->ai_family);

       send_request();

       recv_response();

       if (!netperf_response.content.serv_errno) {
 	if (debug)
 	  fprintf(where,"send_udp_stream: remote data connection done.\n");
       }
       else {
 	Set_errno(netperf_response.content.serv_errno);
 	perror("send_udp_stream: error on remote");
 	exit(1);
       }

       /* Place the port number returned by the remote into the sockaddr */
       /* structure so our sends can be sent to the correct place. Also get */
       /* some of the returned socket buffer information for user display. */

       /* make sure that port numbers are in the proper order */
       set_port_number(remote_res,(short)udp_stream_response->data_port_number);

       rsr_size        = udp_stream_response->recv_buf_size;
       rss_size        = udp_stream_response->send_buf_size;
       remote_cpu_rate = udp_stream_response->cpu_rate;
     }

 #ifdef WANT_DEMO
     DEMO_STREAM_SETUP(lss_size,rsr_size)
 #endif

     /* We "connect" up to the remote port to allow us to use the send */
     /* call instead of the sendto call. Presumably, this is a little */
     /* simpler, and a little more efficient. I think that it also means */
     /* that we can be informed of certain things, but am not sure */
     /* yet...also, this is the way I would expect a client to behave */
     /* when talking to a server */
     if (local_connected) {
        if (connect(data_socket,
       		   remote_res->ai_addr,
 		   remote_res->ai_addrlen) == INVALID_SOCKET){
           perror("send_udp_stream: data socket connect failed");
           exit(1);
        } else if (debug) {
           fprintf(where,"send_udp_stream: connected data socket.\n");
           fflush(where);
        }
     }

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR when the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
     win_kludge_socket = data_socket;
 #endif /* WIN32 */

     /* set up the timer to call us after test_time. one of these days, */
     /* it might be nice to figure-out a nice reliable way to have the */
     /* test controlled by a byte count as well, but since UDP is not */
     /* reliable, that could prove difficult. so, in the meantime, we */
     /* only allow a UDP_STREAM test to be a timed test. */

     if (test_time) {
       times_up = 0;
       start_timer(test_time);
     }
     else {
       fprintf(where,"Sorry, UDP_STREAM tests must be timed.\n");
       fflush(where);
     }

     /* Get the start count for the idle counter and the start time */

     cpu_start(local_cpu_usage);

 #ifdef WANT_INTERVALS
     INTERVALS_INIT();
 #endif /* WANT_INTERVALS */

 #ifdef WANT_DEMO
     if (demo_mode) {
       HIST_timestamp(demo_one_ptr);
     }
 #endif

     /* Send datagrams like there was no tomorrow. at some point it might */
     /* be nice to set this up so that a quantity of bytes could be sent, */
     /* but we still need some sort of end of test trigger on the receive */
     /* side. that could be a select with a one second timeout, but then */
     /* if there is a test where none of the data arrives for a while and */
     /* then starts again, we would end the test too soon. something to */
     /* think about... */
     while (!times_up) {

 #ifdef DIRTY
       /* we want to dirty some number of consecutive integers in the buffer */
       /* we are about to send. we may also want to bring some number of */
       /* them cleanly into the cache. The clean ones will follow any dirty */
       /* ones into the cache. */

       access_buffer(send_ring->buffer_ptr,
 		    send_size,
 		    loc_dirty_count,
 		    loc_clean_count);
 #endif /* DIRTY */

 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
 	HIST_timestamp(&time_one);
       }
 #endif /* WANT_HISTOGRAM */

       if (local_connected) {
          len = send(data_socket,
 	  	    send_ring->buffer_ptr,
 		    send_size,
 		    0);
       } else {
          len = sendto(data_socket,
 		      send_ring->buffer_ptr,
 		      send_size,
 		      0,
 		      remote_res->ai_addr,
 		      remote_res->ai_addrlen);
       }

       if (len != send_size) {
 	if ((len >= 0) ||
 	    SOCKET_EINTR(len))
 	  break;
 	if (errno == ENOBUFS) {
 	  failed_sends++;
 	  continue;
 	}
 	perror("udp_send: data send error");
 	exit(1);
       }
       messages_sent++;

       /* now we want to move our pointer to the next position in the */
       /* data buffer... */

       send_ring = send_ring->next;


 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
 	/* get the second timestamp */
 	HIST_timestamp(&time_two);
 	HIST_add(time_hist,delta_micro(&time_one,&time_two));
       }
 #endif /* WANT_HISTOGRAM */

 #ifdef WANT_DEMO
       DEMO_STREAM_INTERVAL(send_size)
 #endif

 #ifdef WANT_INTERVALS
       INTERVALS_WAIT();
 #endif /* WANT_INTERVALS */

     }

     /* This is a timed test, so the remote will be returning to us after */
     /* a time. We should not need to send any "strange" messages to tell */
     /* the remote that the test is completed, unless we decide to add a */
     /* number of messages to the test. */

     /* the test is over, so get stats and stuff */
     cpu_stop(local_cpu_usage,
 	     &elapsed_time);

     if (!no_control) {
       /* Get the statistics from the remote end	*/
       recv_response();
       if (!netperf_response.content.serv_errno) {
 	if (debug)
 	  fprintf(where,"send_udp_stream: remote results obtained\n");
       }
       else {
 	Set_errno(netperf_response.content.serv_errno);
 	perror("send_udp_stream: error on remote");
 	exit(1);
       }
       messages_recvd = udp_stream_results->messages_recvd;
       bytes_recvd    = (double) send_size * (double) messages_recvd;
     }
     else {
       /* since there was no control connection, we've no idea what was
 	 actually received. raj 2007-02-08 */
       messages_recvd = -1;
       bytes_recvd = -1.0;
     }

     bytes_sent    = (double) send_size * (double) messages_sent;
     local_thruput = calc_thruput(bytes_sent);


     /* we assume that the remote ran for as long as we did */

     remote_thruput = calc_thruput(bytes_recvd);

     /* print the results for this socket and message size */

     if (local_cpu_usage || remote_cpu_usage) {
       /* We must now do a little math for service demand and cpu */
       /* utilization for the system(s). We pass zeros for the local */
       /* cpu utilization and elapsed time to tell the routine to use */
       /* the library's own values for those. */
       if (local_cpu_usage) {
 	local_cpu_utilization	= calc_cpu_util(0.0);
 	/* shouldn't this really be based on bytes_recvd, since that is */
 	/* the effective throughput of the test? I think that it should, */
 	/* so will make the change raj 11/94 */
 	local_service_demand	= calc_service_demand(bytes_recvd,
 						      0.0,
 						      0.0,
 						      0);
       }
       else {
 	local_cpu_utilization	= (float) -1.0;
 	local_service_demand	= (float) -1.0;
       }

       /* The local calculations could use variables being kept by */
       /* the local netlib routines. The remote calculations need to */
       /* have a few things passed to them. */
       if (remote_cpu_usage) {
 	remote_cpu_utilization	= udp_stream_results->cpu_util;
 	remote_service_demand	= calc_service_demand(bytes_recvd,
 						      0.0,
 						      remote_cpu_utilization,
 						      udp_stream_results->num_cpus);
       }
       else {
 	remote_cpu_utilization	= (float) -1.0;
 	remote_service_demand	= (float) -1.0;
       }
     }
     else {
       /* we were not measuring cpu, for the confidence stuff, we */
       /* should make it -1.0 */
       local_cpu_utilization  = (float) -1.0;
       local_service_demand   = (float) -1.0;
       remote_cpu_utilization = (float) -1.0;
       remote_service_demand  = (float) -1.0;
     }

     /* at this point, we want to calculate the confidence information. */
     /* if debugging is on, calculate_confidence will print-out the */
     /* parameters we pass it */

     calculate_confidence(confidence_iteration,
 			 elapsed_time,
 			 remote_thruput,
 			 local_cpu_utilization,
 			 remote_cpu_utilization,
 			 local_service_demand,
 			 remote_service_demand);

     /* since the routine calculate_confidence is rather generic, and */
     /* we have a few other parms of interest, we will do a little work */
     /* here to calculate their average. */
     sum_messages_sent  += messages_sent;
     sum_messages_recvd += messages_recvd;
     sum_failed_sends   += failed_sends;
     sum_local_thruput  += local_thruput;

     confidence_iteration++;

     /* this datapoint is done, so we don't need the socket any longer */
     close(data_socket);

   }

   /* we should reach this point once the test is finished */

   retrieve_confident_values(&elapsed_time,
 			    &remote_thruput,
 			    &local_cpu_utilization,
 			    &remote_cpu_utilization,
 			    &local_service_demand,
 			    &remote_service_demand);

   /* some of the interesting values aren't covered by the generic */
   /* confidence routine */
   messages_sent    = sum_messages_sent / (confidence_iteration -1);
   messages_recvd   = sum_messages_recvd / (confidence_iteration -1);
   failed_sends     = sum_failed_sends / (confidence_iteration -1);
   local_thruput    = sum_local_thruput / (confidence_iteration -1);

   /* We are now ready to print all the information. If the user */
   /* has specified zero-level verbosity, we will just print the */
   /* local service demand, or the remote service demand. If the */
   /* user has requested verbosity level 1, he will get the basic */
   /* "streamperf" numbers. If the user has specified a verbosity */
   /* of greater than 1, we will display a veritable plethora of */
   /* background information from outside of this block as it is */
   /* not cpu_measurement specific...  */


   if (confidence < 0) {
     /* we did not hit confidence, but were we asked to look for it? */
     if (iteration_max > 1) {
       display_confidence();
     }
   }

   if (local_cpu_usage || remote_cpu_usage) {
     local_cpu_method = format_cpu_method(cpu_method);
     remote_cpu_method = format_cpu_method(udp_stream_results->cpu_method);

     switch (verbosity) {
     case 0:
       if (local_cpu_usage) {
 	fprintf(where,
 		cpu_fmt_0,
 		local_service_demand,
 		local_cpu_method);
       }
       else {
 	fprintf(where,
 		cpu_fmt_0,
 		remote_service_demand,
 		local_cpu_method);
       }
       break;
     case 1:
     case 2:
       if (print_headers) {
 	fprintf(where,
 		cpu_title,
 		format_units(),
 		local_cpu_method,
 		remote_cpu_method);
       }

       fprintf(where,
 	      cpu_fmt_1,		/* the format string */
 	      lss_size,		        /* local sendbuf size */
 	      send_size,		/* how large were the sends */
 	      elapsed_time,		/* how long was the test */
 	      messages_sent,
 	      failed_sends,
 	      local_thruput, 		/* what was the xfer rate */
 	      local_cpu_utilization,	/* local cpu */
 	      local_service_demand,	/* local service demand */
 	      rsr_size,
 	      elapsed_time,
 	      messages_recvd,
 	      remote_thruput,
 	      remote_cpu_utilization,	/* remote cpu */
 	      remote_service_demand);	/* remote service demand */
       break;
     }
   }
   else {
     /* The tester did not wish to measure service demand. */
     switch (verbosity) {
     case 0:
       fprintf(where,
 	      tput_fmt_0,
 	      local_thruput);
       break;
     case 1:
     case 2:
       if (print_headers) {
 	fprintf(where,tput_title,format_units());
       }
       fprintf(where,
 	      tput_fmt_1,		/* the format string */
 	      lss_size, 		/* local sendbuf size */
 	      send_size,		/* how large were the sends */
 	      elapsed_time, 		/* how long did it take */
 	      messages_sent,
 	      failed_sends,
 	      local_thruput,
 	      rsr_size, 		/* remote recvbuf size */
 	      elapsed_time,
 	      messages_recvd,
 	      remote_thruput);
       break;
     }
   }

   fflush(where);
 #ifdef WANT_HISTOGRAM
   if (verbosity > 1) {
     fprintf(where,"\nHistogram of time spent in send() call\n");
     fflush(where);
     HIST_report(time_hist);
   }
 #endif /* WANT_HISTOGRAM */

 }


  /* recv_udp_stream() implements the receive side (netserver) of the */
  /* UDP_STREAM performance test. */
  /* */
  /* The routine takes no arguments and returns nothing; everything it */
  /* needs arrives in the global netperf_request, and everything it */
  /* reports leaves through the global netperf_response. The sequence */
  /* is: */
  /*   1. allocate the receive buffer ring and create the data socket */
  /*      from the parameters found in the request */
  /*   2. send a UDP_STREAM_RESPONSE carrying the data port number, */
  /*      the socket buffer sizes and (optionally) the calibrated cpu */
  /*      rate */
  /*   3. receive datagrams until the timer pops or a datagram of */
  /*      other than message_size bytes is seen */
  /*   4. send a UDP_STREAM_RESULTS response with the message count, */
  /*      byte count, elapsed time and cpu utilization */
  /* */
  /* Any unrecoverable socket error is reported to the initiator via */
  /* serv_errno in the response, after which the process calls */
  /* exit(1). */

 void
 recv_udp_stream()
 {
   struct ring_elt *recv_ring;
   struct addrinfo *local_res;
   char local_name[BUFSIZ];
   char port_buffer[PORTBUFSIZE];

   struct sockaddr_storage myaddr_in;
   SOCKET	s_data;
   netperf_socklen_t 	addrlen;
   struct sockaddr_storage remote_addr;
   netperf_socklen_t remote_addrlen;

   int	len = 0;
   unsigned int	bytes_received = 0;
   float	elapsed_time;

   int	message_size;
   unsigned int	messages_recvd = 0;

   /* set when the initial receive of the "connected" mode is */
   /* interrupted before any datagram arrived; the main receive loop */
   /* is then skipped altogether */
   int	interrupted = 0;

   struct	udp_stream_request_struct	*udp_stream_request;
   struct	udp_stream_response_struct	*udp_stream_response;
   struct	udp_stream_results_struct	*udp_stream_results;

   /* the response and the results structures are two views of the */
   /* same test_specific_data area of netperf_response - the first is */
   /* used for the set-up reply, the second for the final results */
   udp_stream_request  =
     (struct udp_stream_request_struct *)netperf_request.content.test_specific_data;
   udp_stream_response =
     (struct udp_stream_response_struct *)netperf_response.content.test_specific_data;
   udp_stream_results  =
     (struct udp_stream_results_struct *)netperf_response.content.test_specific_data;

   if (debug) {
     fprintf(where,"netserver: recv_udp_stream: entered...\n");
     fflush(where);
   }

   /* We want to set-up the listen socket with all the desired */
   /* parameters and then let the initiator know that all is ready. If */
   /* socket size defaults are to be used, then the initiator will have */
   /* sent us 0's. If the socket sizes cannot be changed, then we will */
   /* send-back what they are. If that information cannot be determined, */
   /* then we send-back -1's for the sizes. If things go wrong for any */
   /* reason, we will drop back ten yards and punt. */

   /* If anything goes wrong, we want the remote to know about it. It */
   /* would be best if the error that the remote reports to the user is */
   /* the actual error we encountered, rather than some bogus unexpected */
   /* response type message. */

   if (debug > 1) {
     fprintf(where,"recv_udp_stream: setting the response type...\n");
     fflush(where);
   }

   netperf_response.content.response_type = UDP_STREAM_RESPONSE;

   if (debug > 2) {
     fprintf(where,"recv_udp_stream: the response type is set...\n");
     fflush(where);
   }

   /* We now allocate the receive buffers at the desired alignment */
   /* with the desired offset. */

   if (debug > 1) {
     fprintf(where,"recv_udp_stream: requested alignment of %d\n",
             udp_stream_request->recv_alignment);
     fflush(where);
   }

   /* a ring of zero buffers makes no sense, so use at least one */
   if (recv_width == 0) recv_width = 1;

   recv_ring = allocate_buffer_ring(recv_width,
                                    udp_stream_request->message_size,
                                    udp_stream_request->recv_alignment,
                                    udp_stream_request->recv_offset);

   if (debug > 1) {
     fprintf(where,"recv_udp_stream: receive alignment and offset set...\n");
     fflush(where);
   }

   /* Grab a socket to listen on, and then listen on it. */

   if (debug > 1) {
     fprintf(where,"recv_udp_stream: grabbing a socket...\n");
     fflush(where);
   }

   /* create_data_socket expects to find some things in the global */
   /* variables, so set the globals based on the values in the request. */
   /* once the socket has been created, we will set the response values */
   /* based on the updated value of those globals. raj 7/94 */
   lsr_size_req = udp_stream_request->recv_buf_size;
   loc_rcvavoid = udp_stream_request->so_rcvavoid;
   loc_sndavoid = udp_stream_request->so_sndavoid;
   local_connected = udp_stream_request->recv_connected;

   set_hostname_and_port(local_name,
                         port_buffer,
                         nf_to_af(udp_stream_request->ipfamily),
                         udp_stream_request->port);

   local_res = complete_addrinfo(local_name,
                                 local_name,
                                 port_buffer,
                                 nf_to_af(udp_stream_request->ipfamily),
                                 SOCK_DGRAM,
                                 IPPROTO_UDP,
                                 0);

   s_data = create_data_socket(local_res);

   if (s_data == INVALID_SOCKET) {
     netperf_response.content.serv_errno = errno;
     send_response();
     exit(1);
   }

   udp_stream_response->test_length = udp_stream_request->test_length;

   /* now get the port number assigned by the system  */
   addrlen = sizeof(myaddr_in);
   if (getsockname(s_data,
                   (struct sockaddr *)&myaddr_in,
                   &addrlen) == SOCKET_ERROR){
     /* errno is saved before close() gets a chance to overwrite it */
     netperf_response.content.serv_errno = errno;
     close(s_data);
     send_response();

     exit(1);
   }

   /* Now myaddr_in contains the port and the internet address this is */
   /* returned to the sender also implicitly telling the sender that the */
   /* socket buffer sizing has been done. */

   /* NOTE(review): the port is read through a sockaddr_in view of the */
   /* sockaddr_storage whatever the address family of the request was; */
   /* presumably this relies on the port field living at the same */
   /* offset in the other sockaddr flavours - confirm. */
   udp_stream_response->data_port_number =
     (int) ntohs(((struct sockaddr_in *)&myaddr_in)->sin_port);
   netperf_response.content.serv_errno   = 0;

   /* But wait, there's more. If the initiator wanted cpu measurements, */
   /* then we must call the calibrate routine, which will return the max */
   /* rate back to the initiator. If the CPU was not to be measured, or */
   /* something went wrong with the calibration, we will return a -1 to */
   /* the initiator. */

   udp_stream_response->cpu_rate    = (float)0.0; /* assume no cpu */
   udp_stream_response->measure_cpu = 0;
   if (udp_stream_request->measure_cpu) {
     /* We will pass the rate into the calibration routine. If the */
     /* user did not specify one, it will be 0.0, and we will do a */
     /* "real" calibration. Otherwise, all it will really do is */
     /* store it away... */
     udp_stream_response->measure_cpu = 1;
     udp_stream_response->cpu_rate =
       calibrate_local_cpu(udp_stream_request->cpu_rate);
   }

   message_size	= udp_stream_request->message_size;
   test_time	= udp_stream_request->test_length;

   /* before we send the response back to the initiator, pull some of */
   /* the socket parms from the globals */
   udp_stream_response->send_buf_size = lss_size;
   udp_stream_response->recv_buf_size = lsr_size;
   udp_stream_response->so_rcvavoid = loc_rcvavoid;
   udp_stream_response->so_sndavoid = loc_sndavoid;

   send_response();

   /* Now it's time to start receiving data on the connection. We will */
   /* first grab the appropriate counters and then start grabbing. */

   cpu_start(udp_stream_request->measure_cpu);

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR with the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
   win_kludge_socket = s_data;
 #endif /* WIN32 */

   /* The loop will exit when the timer pops, or if we happen to recv a */
   /* message of less than send_size bytes... */

   times_up = 0;

   /* the receiver runs PAD_TIME longer than the requested test */
   /* length; the pad is subtracted again from elapsed_time below */
   start_timer(test_time + PAD_TIME);

   if (debug) {
     fprintf(where,"recv_udp_stream: about to enter inner sanctum.\n");
     fflush(where);
   }

   /* We "connect" up to the remote port to allow us to use the recv */
   /* call instead of the recvfrom call. Presumably, this is a little */
   /* simpler, and a little more efficient. */

   if (local_connected) {

     /* Receive the first message using recvfrom to find the remote address */
     remote_addrlen = sizeof(remote_addr);
     len = recvfrom(s_data, recv_ring->buffer_ptr,
                    message_size, 0,
                    (struct sockaddr*)&remote_addr, &remote_addrlen);

     if (len == SOCKET_ERROR) {
       if (!SOCKET_EINTR(len)) {
         netperf_response.content.serv_errno = errno;
         send_response();
         exit(1);
       }
       /* The receive was interrupted before a single datagram showed */
       /* up. There is no message to count and remote_addr has not */
       /* been filled in, so we must neither bump the message count */
       /* nor try to connect to it - we simply go report what we */
       /* have, which is nothing. */
       interrupted = 1;
     }
     else {
       messages_recvd++;
       recv_ring = recv_ring->next;

       /* Now connect with the remote socket address. connect() */
       /* returns an int status, hence the check against SOCKET_ERROR */
       /* just like the getsockname() call above. */
       if (connect(s_data,
                   (struct sockaddr*)&remote_addr,
                   remote_addrlen) == SOCKET_ERROR) {
         netperf_response.content.serv_errno = errno;
         close(s_data);
         send_response();
         exit(1);
       }

       if (debug) {
         fprintf(where,"recv_udp_stream: connected data socket\n");
         fflush(where);
       }
     }
   }

   while (!interrupted && !times_up) {
     if(local_connected) {
       len = recv(s_data,
                  recv_ring->buffer_ptr,
                  message_size,
                  0);
     } else {
       len = recvfrom(s_data,
                      recv_ring->buffer_ptr,
                      message_size,
                      0,0,0);
     }

     if (len != message_size) {
       /* anything but an interrupted call is a genuine error to be */
       /* reported; an interrupted call or a short message simply */
       /* ends the test */
       if ((len == SOCKET_ERROR) && !SOCKET_EINTR(len)) {
         netperf_response.content.serv_errno = errno;
         send_response();
         exit(1);
       }
       break;
     }
     messages_recvd++;
     recv_ring = recv_ring->next;
   }

   if (debug) {
     fprintf(where,"recv_udp_stream: got %u messages.\n",messages_recvd);
     fflush(where);
   }


   /* The loop now exits due to the timer or < send_size bytes */
   /* received. in reality, we only really support a timed UDP_STREAM */
   /* test. raj 12/95 */

   cpu_stop(udp_stream_request->measure_cpu,&elapsed_time);

   if (times_up) {
     /* we ended on a timer, subtract the PAD_TIME */
     elapsed_time -= (float)PAD_TIME;
   }
   else {
     stop_timer();
   }

   if (debug) {
     fprintf(where,"recv_udp_stream: test ended in %f seconds.\n",elapsed_time);
     fflush(where);
   }


   /* We will count the "off" message that got us out of the loop, */
   /* but only when there really was one: a len of SOCKET_ERROR is */
   /* not a byte count, and a len equal to message_size has already */
   /* been accounted for in messages_recvd. */
   bytes_received = messages_recvd * message_size;
   if ((len > 0) && (len != message_size)) {
     bytes_received += len;
   }

   /* send the results to the sender			*/

   if (debug) {
     fprintf(where,
             "recv_udp_stream: got %u bytes\n",
             bytes_received);
     fflush(where);
   }

   netperf_response.content.response_type	= UDP_STREAM_RESULTS;
   /* NOTE(review): bytes_received is the only field passed through */
   /* htonl() here, the others are stored as they are - confirm */
   /* against whatever byte-order handling send_response() performs. */
   udp_stream_results->bytes_received	= htonl(bytes_received);
   udp_stream_results->messages_recvd	= messages_recvd;
   udp_stream_results->elapsed_time	= elapsed_time;
   udp_stream_results->cpu_method        = cpu_method;
   udp_stream_results->num_cpus          = lib_num_loc_cpus;
   if (udp_stream_request->measure_cpu) {
     udp_stream_results->cpu_util	= calc_cpu_util(elapsed_time);
   }
   else {
     /* -1.0 tells the initiator that cpu was not measured */
     udp_stream_results->cpu_util	= (float) -1.0;
   }

   if (debug > 1) {
     fprintf(where,
             "recv_udp_stream: test complete, sending results.\n");
     fflush(where);
   }

   send_response();

   close(s_data);

 }

 void
 send_udp_rr(char remote_host[])
 {

   char *tput_title = "\
 Local /Remote\n\
 Socket Size   Request  Resp.   Elapsed  Trans.\n\
 Send   Recv   Size     Size    Time     Rate         \n\
 bytes  Bytes  bytes    bytes   secs.    per sec   \n\n";

   char *tput_title_band = "\
 Local /Remote\n\
 Socket Size   Request  Resp.   Elapsed  \n\
 Send   Recv   Size     Size    Time     Throughput \n\
 bytes  Bytes  bytes    bytes   secs.    %s/sec   \n\n";

   char *tput_fmt_0 =
     "%7.2f %s\n";

   char *tput_fmt_1_line_1 = "\
 %-6d %-6d %-6d   %-6d  %-6.2f   %7.2f   %s\n";

   char *tput_fmt_1_line_2 = "\
 %-6d %-6d\n";

   char *cpu_title = "\
 Local /Remote\n\
 Socket Size   Request Resp.  Elapsed Trans.   CPU    CPU    S.dem   S.dem\n\
 Send   Recv   Size    Size   Time    Rate     local  remote local   remote\n\
 bytes  bytes  bytes   bytes  secs.   per sec  %% %c    %% %c    us/Tr   us/Tr\n\n";

   char *cpu_title_tput = "\
 Local /Remote\n\
 Socket Size   Request Resp.  Elapsed Tput     CPU    CPU    S.dem   S.dem\n\
 Send   Recv   Size    Size   Time    %-8.8s local  remote local   remote\n\
 bytes  bytes  bytes   bytes  secs.   per sec  %% %c    %% %c    us/Tr   us/Tr\n\n";

   char *cpu_fmt_0 =
     "%6.3f %c %s\n";

   char *cpu_fmt_1_line_1 = "\
 %-6d %-6d %-6d  %-6d %-6.2f  %-6.2f   %-6.2f %-6.2f %-6.3f  %-6.3f %s\n";

   char *cpu_fmt_1_line_2 = "\
 %-6d %-6d\n";

   float			elapsed_time;

   struct ring_elt *send_ring;
   struct ring_elt *recv_ring;

   int	len;
   int	nummessages;
   SOCKET	send_socket;
   int	trans_remaining;
   int	bytes_xferd;

   int	rsp_bytes_recvd;

   float	local_cpu_utilization;
   float	local_service_demand;
   float	remote_cpu_utilization;
   float	remote_service_demand;
   double	thruput;

   struct addrinfo *local_res;
   struct addrinfo *remote_res;

   struct	udp_rr_request_struct	*udp_rr_request;
   struct	udp_rr_response_struct	*udp_rr_response;
   struct	udp_rr_results_struct	*udp_rr_result;

   udp_rr_request  =
     (struct udp_rr_request_struct *)netperf_request.content.test_specific_data;
   udp_rr_response =
     (struct udp_rr_response_struct *)netperf_response.content.test_specific_data;
   udp_rr_result	 =
     (struct udp_rr_results_struct *)netperf_response.content.test_specific_data;

 #ifdef WANT_HISTOGRAM
   if (verbosity > 1) {
     time_hist = HIST_new();
   }
 #endif

   /* since we are now disconnected from the code that established the */
   /* control socket, and since we want to be able to use different */
   /* protocols and such, we are passed the name of the remote host and */
   /* must turn that into the test specific addressing information. */

   complete_addrinfos(&remote_res,
 		     &local_res,
 		     remote_host,
 		     SOCK_DGRAM,
 		     IPPROTO_UDP,
 		     0);

   if ( print_headers ) {
     print_top_test_header("UDP REQUEST/RESPONSE TEST",local_res,remote_res);
   }

   /* initialize a few counters */

   send_ring     = NULL;
   recv_ring     = NULL;
   nummessages	= 0;
   bytes_xferd	= 0;
   times_up 	= 0;
   confidence_iteration = 1;
   init_stat();

   /* we have a great-big while loop which controls the number of times */
   /* we run a particular test. this is for the calculation of a */
   /* confidence interval (I really should have stayed awake during */
   /* probstats :). If the user did not request confidence measurement */
   /* (no confidence is the default) then we will only go though the */
   /* loop once. the confidence stuff originates from the folks at IBM */

   while (((confidence < 0) && (confidence_iteration < iteration_max)) ||
 	 (confidence_iteration <= iteration_min)) {

     nummessages     = 0;
     bytes_xferd     = 0;
     times_up        = 0;
     trans_remaining = 0;

     /* set-up the data buffers with the requested alignment and offset */

     if (send_width == 0) send_width = 1;
     if (recv_width == 0) recv_width = 1;

     if (send_ring == NULL) {
       send_ring = allocate_buffer_ring(send_width,
 				       req_size,
 				       local_send_align,
 				       local_send_offset);
     }

     if (recv_ring == NULL) {
       recv_ring = allocate_buffer_ring(recv_width,
 				       rsp_size,
 				       local_recv_align,
 				       local_recv_offset);
     }

     /*set up the data socket                        */
     send_socket = create_data_socket(local_res);

     if (send_socket == INVALID_SOCKET){
       perror("netperf: send_udp_rr: udp rr data socket");
       exit(1);
     }

     if (debug) {
       fprintf(where,"send_udp_rr: send_socket obtained...\n");
     }

     /* If the user has requested cpu utilization measurements, we must */
     /* calibrate the cpu(s). We will perform this task within the tests */
     /* themselves. If the user has specified the cpu rate, then */
     /* calibrate_local_cpu will return rather quickly as it will have */
     /* nothing to do. If local_cpu_rate is zero, then we will go through */
     /* all the "normal" calibration stuff and return the rate back. If */
     /* there is no idle counter in the kernel idle loop, the */
     /* local_cpu_rate will be set to -1. */

     if (local_cpu_usage) {
       local_cpu_rate = calibrate_local_cpu(local_cpu_rate);
     }

     if (!no_control) {
       /* Tell the remote end to do a listen. The server alters the
 	 socket parameters on the other side at this point, hence the
 	 reason for all the values being passed in the setup
 	 message. If the user did not specify any of the parameters,
 	 they will be passed as 0, which will indicate to the remote
 	 that no changes beyond the system's default should be
 	 used. Alignment is the exception, it will default to 8, which
 	 will be no alignment alterations. */

       netperf_request.content.request_type	= DO_UDP_RR;
       udp_rr_request->recv_buf_size	= rsr_size_req;
       udp_rr_request->send_buf_size	= rss_size_req;
       udp_rr_request->recv_alignment      = remote_recv_align;
       udp_rr_request->recv_offset	        = remote_recv_offset;
       udp_rr_request->send_alignment      = remote_send_align;
       udp_rr_request->send_offset	        = remote_send_offset;
       udp_rr_request->request_size	= req_size;
       udp_rr_request->response_size	= rsp_size;
       udp_rr_request->measure_cpu	        = remote_cpu_usage;
       udp_rr_request->cpu_rate	        = remote_cpu_rate;
       udp_rr_request->so_rcvavoid	        = rem_rcvavoid;
       udp_rr_request->so_sndavoid	        = rem_sndavoid;
       if (test_time) {
 	udp_rr_request->test_length	= test_time;
       }
       else {
 	udp_rr_request->test_length	= test_trans * -1;
       }
       udp_rr_request->port                = atoi(remote_data_port);
       udp_rr_request->ipfamily = af_to_nf(remote_res->ai_family);

       if (debug > 1) {
 	fprintf(where,"netperf: send_udp_rr: requesting UDP r/r test\n");
       }

       send_request();

       /* The response from the remote will contain all of the relevant
 	 socket parameters for this test type. We will put them back
 	 into the variables here so they can be displayed if desired.
 	 The remote will have calibrated CPU if necessary, and will
 	 have done all the needed set-up we will have calibrated the
 	 cpu locally before sending the request, and will grab the
 	 counter value right after the connect returns. The remote
 	 will grab the counter right after the accept call. This saves
 	 the hassle of extra messages being sent for the UDP
 	 tests.  */

       recv_response();

       if (!netperf_response.content.serv_errno) {
 	if (debug)
 	  fprintf(where,"remote listen done.\n");
 	rsr_size	       =	udp_rr_response->recv_buf_size;
 	rss_size	       =	udp_rr_response->send_buf_size;
 	remote_cpu_usage =	udp_rr_response->measure_cpu;
 	remote_cpu_rate  = 	udp_rr_response->cpu_rate;
 	/* port numbers in proper order */
 	set_port_number(remote_res,(short)udp_rr_response->data_port_number);
       }
       else {
 	Set_errno(netperf_response.content.serv_errno);
 	fprintf(where,
 		"netperf: remote error %d",
 		netperf_response.content.serv_errno);
 	perror("");
 	fflush(where);
 	exit(1);
       }
     }

 #ifdef WANT_DEMO
     DEMO_RR_SETUP(100)
 #endif

     /* Connect up to the remote port on the data socket. This will set */
     /* the default destination address on this socket. With UDP, this */
     /* does make a performance difference as we may not have to do as */
     /* many routing lookups, however, I expect that a client would */
     /* behave this way. raj 1/94 */

     if ( connect(send_socket,
 		 remote_res->ai_addr,
 		 remote_res->ai_addrlen) == INVALID_SOCKET ) {
       perror("netperf: data socket connect failed");
       exit(1);
     }

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR with the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
   win_kludge_socket = send_socket;
 #endif /* WIN32 */

     /* Data Socket set-up is finished. If there were problems, either the */
     /* connect would have failed, or the previous response would have */
     /* indicated a problem. I failed to see the value of the extra */
     /* message after the accept on the remote. If it failed, we'll see it */
     /* here. If it didn't, we might as well start pumping data. */

     /* Set-up the test end conditions. For a request/response test, they */
     /* can be either time or transaction based. */

     if (test_time) {
       /* The user wanted to end the test after a period of time. */
       times_up = 0;
       trans_remaining = 0;
       start_timer(test_time);
     }
     else {
       /* The tester wanted to send a number of bytes. */
       trans_remaining = test_bytes;
       times_up = 1;
     }

     /* The cpu_start routine will grab the current time and possibly */
     /* value of the idle counter for later use in measuring cpu */
     /* utilization and/or service demand and thruput. */

     cpu_start(local_cpu_usage);

 #ifdef WANT_DEMO
     if (demo_mode) {
       HIST_timestamp(demo_one_ptr);
     }
 #endif

 #ifdef WANT_INTERVALS
     INTERVALS_INIT();
 #endif /* WANT_INTERVALS */

     /* We use an "OR" to control test execution. When the test is */
     /* controlled by time, the byte count check will always return */
     /* false. When the test is controlled by byte count, the time test */
     /* will always return false. When the test is finished, the whole */
     /* expression will go false and we will stop sending data. I think */
     /* I just arbitrarily decrement trans_remaining for the timed */
     /* test, but will not do that just yet... One other question is */
     /* whether or not the send buffer and the receive buffer should be */
     /* the same buffer. */

 #ifdef WANT_FIRST_BURST
     {
       int i;
       for (i = 0; i < first_burst_size; i++) {
 	if((len=send(send_socket,
 		     send_ring->buffer_ptr,
 		     req_size,
 		     0)) != req_size) {
 	  /* we should never hit the end of the test in the first burst */
 	  perror("send_udp_rr: initial burst data send error");
 	  exit(-1);
 	}
       }
     }
 #endif /* WANT_FIRST_BURST */

     while ((!times_up) || (trans_remaining > 0)) {
       /* send the request */
 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
 	HIST_timestamp(&time_one);
       }
 #endif
       if((len=send(send_socket,
 		   send_ring->buffer_ptr,
 		   req_size,
 		   0)) != req_size) {
         if (SOCKET_EINTR(len)) {
 	      /* We likely hit */
 	      /* test-end time. */
 	      break;
 		}
 	    perror("send_udp_rr: data send error");
 	    exit(1);
 	  }
       send_ring = send_ring->next;

       /* receive the response. with UDP we will get it all, or nothing */

       if((rsp_bytes_recvd=recv(send_socket,
 			       recv_ring->buffer_ptr,
 			       rsp_size,
 			       0)) != rsp_size) {
 	    if (SOCKET_EINTR(rsp_bytes_recvd))
 		{
     	  /* Again, we have likely hit test-end time */
 	      break;
 		}
 	    perror("send_udp_rr: data recv error");
 	    exit(1);
       }
       recv_ring = recv_ring->next;

 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
 	HIST_timestamp(&time_two);
 	HIST_add(time_hist,delta_micro(&time_one,&time_two));
       }

 #endif

       /* at this point, we may wish to sleep for some period of */
       /* time, so we see how long that last transaction just took, */
       /* and sleep for the difference of that and the interval. We */
       /* will not sleep if the time would be less than a */
       /* millisecond.  */

 #ifdef WANT_DEMO
       DEMO_RR_INTERVAL(1);
 #endif

 #ifdef WANT_INTERVALS
       INTERVALS_WAIT();
 #endif /* WANT_INTERVALS */

       nummessages++;
       if (trans_remaining) {
 	trans_remaining--;
       }

       if (debug > 3) {
 	if ((nummessages % 100) == 0) {
 	  fprintf(where,"Transaction %d completed\n",nummessages);
 	  fflush(where);
 	}
       }

     }

     /* for some strange reason, I used to call shutdown on the UDP */
     /* data socket here. I'm not sure why, because it would not have */
     /* any effect... raj 11/94 */

     /* this call will always give us the elapsed time for the test, and */
     /* will also store-away the necessaries for cpu utilization */

     cpu_stop(local_cpu_usage,&elapsed_time);	/* was cpu being */
 						/* measured? how long */
 						/* did we really run? */

     if (!no_control) {
       /* Get the statistics from the remote end. The remote will have
 	 calculated service demand and all those interesting
 	 things. If it wasn't supposed to care, it will return obvious
 	 values. */

       recv_response();
       if (!netperf_response.content.serv_errno) {
 	if (debug)
 	  fprintf(where,"remote results obtained\n");
       }
       else {
 	Set_errno(netperf_response.content.serv_errno);
 	fprintf(where,
 		"netperf: remote error %d",
 		netperf_response.content.serv_errno);
 	perror("");
 	fflush(where);
 	exit(1);
       }
     }

     /* We now calculate what our thruput was for the test. In the */
     /* future, we may want to include a calculation of the thruput */
     /* measured by the remote, but it should be the case that for a */
     /* UDP rr test, that the two numbers should be *very* close... */
     /* We calculate bytes_sent regardless of the way the test length */
     /* was controlled.  */

     bytes_xferd	= (req_size * nummessages) + (rsp_size * nummessages);
     thruput	= nummessages / elapsed_time;

     if (local_cpu_usage || remote_cpu_usage) {

       /* We must now do a little math for service demand and cpu */
       /* utilization for the system(s) Of course, some of the */
       /* information might be bogus because there was no idle counter */
       /* in the kernel(s). We need to make a note of this for the */
       /* user's benefit by placing a code for the method used in the */
       /* test banner */

       if (local_cpu_usage) {
 	local_cpu_utilization = calc_cpu_util(0.0);

 	/* since calc_service demand is doing ms/Kunit we will */
 	/* multiply the number of transaction by 1024 to get */
 	/* "good" numbers */

 	local_service_demand  = calc_service_demand((double) nummessages*1024,
 						    0.0,
 						    0.0,
 						    0);
       }
       else {
 	local_cpu_utilization	= (float) -1.0;
 	local_service_demand	= (float) -1.0;
       }

       if (remote_cpu_usage) {
 	remote_cpu_utilization = udp_rr_result->cpu_util;

 	/* since calc_service demand is doing ms/Kunit we will */
 	/* multiply the number of transaction by 1024 to get */
 	/* "good" numbers */

 	remote_service_demand  = calc_service_demand((double) nummessages*1024,
 						     0.0,
 						     remote_cpu_utilization,
 						     udp_rr_result->num_cpus);
       }
       else {
 	remote_cpu_utilization = (float) -1.0;
 	remote_service_demand  = (float) -1.0;
       }
     }
     else {
       /* we were not measuring cpu, for the confidence stuff, we */
       /* should make it -1.0 */
       local_cpu_utilization	= (float) -1.0;
       local_service_demand	= (float) -1.0;
       remote_cpu_utilization = (float) -1.0;
       remote_service_demand  = (float) -1.0;
     }

     /* at this point, we want to calculate the confidence information. */
     /* if debugging is on, calculate_confidence will print-out the */
     /* parameters we pass it */

     calculate_confidence(confidence_iteration,
 			 elapsed_time,
 			 thruput,
 			 local_cpu_utilization,
 			 remote_cpu_utilization,
 			 local_service_demand,
 			 remote_service_demand);


     confidence_iteration++;

     /* we are done with the socket */
     close(send_socket);
   }

   /* at this point, we have made all the iterations we are going to */
   /* make. */
   retrieve_confident_values(&elapsed_time,
 			    &thruput,
 			    &local_cpu_utilization,
 			    &remote_cpu_utilization,
 			    &local_service_demand,
 			    &remote_service_demand);

   /* We are now ready to print all the information. If the user */
   /* has specified zero-level verbosity, we will just print the */
   /* local service demand, or the remote service demand. If the */
   /* user has requested verbosity level 1, he will get the basic */
   /* "streamperf" numbers. If the user has specified a verbosity */
   /* of greater than 1, we will display a veritable plethora of */
   /* background information from outside of this block as it it */
   /* not cpu_measurement specific...  */

   if (confidence < 0) {
     /* we did not hit confidence, but were we asked to look for it? */
     if (iteration_max > 1) {
       display_confidence();
     }
   }

   if (local_cpu_usage || remote_cpu_usage) {
     local_cpu_method = format_cpu_method(cpu_method);
     remote_cpu_method = format_cpu_method(udp_rr_result->cpu_method);

     switch (verbosity) {
     case 0:
       if (local_cpu_usage) {
 	fprintf(where,
 		cpu_fmt_0,
 		local_service_demand,
 		local_cpu_method,
                 ((print_headers) ||
                  (result_brand == NULL)) ? "" : result_brand);

       }
       else {
 	fprintf(where,
 		cpu_fmt_0,
 		remote_service_demand,
 		remote_cpu_method,
                 ((print_headers) ||
                  (result_brand == NULL)) ? "" : result_brand);

       }
       break;
     case 1:
     case 2:
       if (print_headers) {
         if ('x' == libfmt) {
           fprintf(where,
                   cpu_title,
                   local_cpu_method,
                   remote_cpu_method);
         }
         else {
           fprintf(where,
                   cpu_title_tput,
                   format_units(),
                   local_cpu_method,
                   remote_cpu_method);
         }
       }

       fprintf(where,
 	      cpu_fmt_1_line_1,		/* the format string */
 	      lss_size,		/* local sendbuf size */
 	      lsr_size,
 	      req_size,		/* how large were the requests */
 	      rsp_size,		/* guess */
 	      elapsed_time,		/* how long was the test */
 	      ('x' == libfmt) ? thruput :
 	      calc_thruput_interval_omni(thruput * (req_size+rsp_size),
 									 1.0),
 	      local_cpu_utilization,	/* local cpu */
 	      remote_cpu_utilization,	/* remote cpu */
 	      local_service_demand,	/* local service demand */
 	      remote_service_demand,	/* remote service demand */
 	      ((print_headers) ||
 	       (result_brand == NULL)) ? "" : result_brand);
       fprintf(where,
 	      cpu_fmt_1_line_2,
 	      rss_size,
 	      rsr_size);
       break;
     }
   }
   else {
     /* The tester did not wish to measure service demand. */
     switch (verbosity) {
     case 0:
       fprintf(where,
 	      tput_fmt_0,
 	      ('x' == libfmt) ? thruput :
 	      calc_thruput_interval_omni(thruput * (req_size+rsp_size),
 					 1.0),
 	      ((print_headers) ||
 	       (result_brand == NULL)) ? "" : result_brand);
       break;
     case 1:
     case 2:
       if (print_headers) {
 	fprintf(where,
 		('x' == libfmt) ? tput_title : tput_title_band,
 		format_units());
       }

       fprintf(where,
 	      tput_fmt_1_line_1,	/* the format string */
 	      lss_size,
 	      lsr_size,
 	      req_size,		/* how large were the requests */
 	      rsp_size,		/* how large were the responses */
 	      elapsed_time, 		/* how long did it take */
 	      ('x' == libfmt) ?  thruput :
 	      calc_thruput_interval_omni(thruput * (req_size+rsp_size),
 					 1.0),
 	      ((print_headers) ||
 	       (result_brand == NULL)) ? "" : result_brand);
       fprintf(where,
 	      tput_fmt_1_line_2,
 	      rss_size, 		/* remote recvbuf size */
 	      rsr_size);

       break;
     }
   }
   fflush(where);

   /* it would be a good thing to include information about some of the */
   /* other parameters that may have been set for this test, but at the */
   /* moment, I do not wish to figure-out all the  formatting, so I will */
   /* just put this comment here to help remind me that it is something */
   /* that should be done at a later time. */

   /* how to handle the verbose information in the presence of */
   /* confidence intervals is yet to be determined... raj 11/94 */

   if (verbosity > 1) {
     /* The user wanted to know it all, so we will give it to him. */
     /* This information will include as much as we can find about */
     /* UDP statistics, the alignments of the sends and receives */
     /* and all that sort of rot... */

 #ifdef WANT_HISTOGRAM
     fprintf(where,"\nHistogram of request/reponse times.\n");
     fflush(where);
     HIST_report(time_hist);
 #endif /* WANT_HISTOGRAM */
   }
 }

  /* this routine implements the receive side (netserver) of a UDP_RR */
  /* test. The test parameters are taken from netperf_request. A UDP */
  /* data socket is created and its port number, socket buffer sizes */
  /* and (optionally) the calibrated cpu rate are sent back in */
  /* netperf_response. Each request of request_size bytes received on */
  /* the data socket is then answered with a response of response_size */
  /* bytes, until either times_up is set (test_length > 0) or the */
  /* requested number of transactions has been served (test_length <= */
  /* 0). Finally the transaction count, elapsed time and cpu */
  /* utilization (when measured) are sent to the initiator. On a set-up */
  /* or I/O failure errno is reported via serv_errno and the process */
  /* exits with status 1. */
 void
 recv_udp_rr()
 {

   struct ring_elt *recv_ring;
   struct ring_elt *send_ring;

   struct addrinfo *local_res;
   char local_name[BUFSIZ];
   char port_buffer[PORTBUFSIZE];

   struct sockaddr_storage myaddr_in;
   struct sockaddr_storage peeraddr;
   SOCKET s_data;
   netperf_socklen_t addrlen;
   int trans_received;
   int trans_remaining;
   int request_bytes_recvd;
   int response_bytes_sent;
   int timed_test = 0;   /* non-zero when the run is bounded by time */
   float elapsed_time;

   struct udp_rr_request_struct  *udp_rr_request;
   struct udp_rr_response_struct *udp_rr_response;
   struct udp_rr_results_struct  *udp_rr_results;

   /* the response and the results overlay the same area of the */
   /* response message; the request lives in the request message */
   udp_rr_request  =
     (struct udp_rr_request_struct *)netperf_request.content.test_specific_data;
   udp_rr_response =
     (struct udp_rr_response_struct *)netperf_response.content.test_specific_data;
   udp_rr_results  =
     (struct udp_rr_results_struct *)netperf_response.content.test_specific_data;

   if (debug) {
     fprintf(where,"netserver: recv_udp_rr: entered...\n");
     fflush(where);
   }

   /* We want to set-up the listen socket with all the desired */
   /* parameters and then let the initiator know that all is ready. If */
   /* socket size defaults are to be used, then the initiator will have */
   /* sent us 0's. If the socket sizes cannot be changed, then we will */
   /* send-back what they are. If that information cannot be determined, */
   /* then we send-back -1's for the sizes. If things go wrong for any */
   /* reason, we will drop back ten yards and punt. */

   /* If anything goes wrong, we want the remote to know about it. It */
   /* would be best if the error that the remote reports to the user is */
   /* the actual error we encountered, rather than some bogus unexpected */
   /* response type message. */

   if (debug) {
     fprintf(where,"recv_udp_rr: setting the response type...\n");
     fflush(where);
   }

   netperf_response.content.response_type = UDP_RR_RESPONSE;

   if (debug) {
     fprintf(where,"recv_udp_rr: the response type is set...\n");
     fflush(where);
   }

   /* We now alter the message_ptr variables to be at the desired */
   /* alignments with the desired offsets. */

   if (debug) {
     fprintf(where,"recv_udp_rr: requested recv alignment of %d offset %d\n",
             udp_rr_request->recv_alignment,
             udp_rr_request->recv_offset);
     fprintf(where,"recv_udp_rr: requested send alignment of %d offset %d\n",
             udp_rr_request->send_alignment,
             udp_rr_request->send_offset);
     fflush(where);
   }

   /* a width of zero means "not set"; use a ring of one buffer */
   if (send_width == 0) send_width = 1;
   if (recv_width == 0) recv_width = 1;

   recv_ring = allocate_buffer_ring(recv_width,
                                    udp_rr_request->request_size,
                                    udp_rr_request->recv_alignment,
                                    udp_rr_request->recv_offset);

   send_ring = allocate_buffer_ring(send_width,
                                    udp_rr_request->response_size,
                                    udp_rr_request->send_alignment,
                                    udp_rr_request->send_offset);

   if (debug) {
     fprintf(where,"recv_udp_rr: receive alignment and offset set...\n");
     fflush(where);
   }

   /* Grab a socket to listen on, and then listen on it. */

   if (debug) {
     fprintf(where,"recv_udp_rr: grabbing a socket...\n");
     fflush(where);
   }

   /* create_data_socket expects to find some things in the global */
   /* variables, so set the globals based on the values in the request. */
   /* once the socket has been created, we will set the response values */
   /* based on the updated value of those globals. raj 7/94 */
   lss_size_req = udp_rr_request->send_buf_size;
   lsr_size_req = udp_rr_request->recv_buf_size;
   loc_rcvavoid = udp_rr_request->so_rcvavoid;
   loc_sndavoid = udp_rr_request->so_sndavoid;

   set_hostname_and_port(local_name,
                         port_buffer,
                         nf_to_af(udp_rr_request->ipfamily),
                         udp_rr_request->port);

   local_res = complete_addrinfo(local_name,
                                 local_name,
                                 port_buffer,
                                 nf_to_af(udp_rr_request->ipfamily),
                                 SOCK_DGRAM,
                                 IPPROTO_UDP,
                                 0);

   s_data = create_data_socket(local_res);

   if (s_data == INVALID_SOCKET) {
     netperf_response.content.serv_errno = errno;
     send_response();

     exit(1);
   }

   /* now get the port number assigned by the system  */
   addrlen = sizeof(myaddr_in);
   if (getsockname(s_data,
                   (struct sockaddr *)&myaddr_in,
                   &addrlen) == SOCKET_ERROR) {
     /* errno is captured before close() gets a chance to change it */
     netperf_response.content.serv_errno = errno;
     close(s_data);
     send_response();

     exit(1);
   }

   /* Now myaddr_in contains the port and the internet address this is */
   /* returned to the sender also implicitly telling the sender that the */
   /* socket buffer sizing has been done. */

   udp_rr_response->data_port_number =
     (int) ntohs(((struct sockaddr_in *)&myaddr_in)->sin_port);
   netperf_response.content.serv_errno   = 0;

   if (debug) {
     /* show the port in host byte order, i.e. the same value that is */
     /* reported to the initiator, not the raw network-order field */
     fprintf(where,
             "recv port number %d\n",
             (int) ntohs(((struct sockaddr_in *)&myaddr_in)->sin_port));
     fflush(where);
   }

   /* But wait, there's more. If the initiator wanted cpu measurements, */
   /* then we must call the calibrate routine, which will return the max */
   /* rate back to the initiator. If the CPU was not to be measured, or */
   /* something went wrong with the calibration, we will return a 0.0 to */
   /* the initiator. */

   udp_rr_response->cpu_rate    = (float)0.0;   /* assume no cpu */
   udp_rr_response->measure_cpu = 0;
   if (udp_rr_request->measure_cpu) {
     udp_rr_response->measure_cpu = 1;
     udp_rr_response->cpu_rate = calibrate_local_cpu(udp_rr_request->cpu_rate);
   }

   /* before we send the response back to the initiator, pull some of */
   /* the socket parms from the globals */
   udp_rr_response->send_buf_size = lss_size;
   udp_rr_response->recv_buf_size = lsr_size;
   udp_rr_response->so_rcvavoid   = loc_rcvavoid;
   udp_rr_response->so_sndavoid   = loc_sndavoid;

   send_response();

   /* Now it's time to start receiving data on the connection. We will */
   /* first grab the apropriate counters and then start grabbing. */

   cpu_start(udp_rr_request->measure_cpu);

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR with the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
   win_kludge_socket = s_data;
 #endif /* WIN32 */

   if (udp_rr_request->test_length > 0) {
     /* time-bound run: loop until times_up gets set */
     timed_test = 1;
     times_up = 0;
     trans_remaining = 0;
     start_timer(udp_rr_request->test_length + PAD_TIME);
   }
   else {
     /* count-bound run: times_up is forced on so that only the */
     /* transaction count keeps the loop going */
     timed_test = 0;
     times_up = 1;
     trans_remaining = udp_rr_request->test_length * -1;
   }

   addrlen = sizeof(peeraddr);
   bzero((char *)&peeraddr, addrlen);

   trans_received = 0;

   while ((!times_up) || (trans_remaining > 0)) {

     /* recvfrom() uses addrlen as a value-result argument, so restore */
     /* the full size of the address buffer before every call */
     addrlen = sizeof(peeraddr);

     /* receive the request from the other side */
     request_bytes_recvd = recvfrom(s_data,
                                    recv_ring->buffer_ptr,
                                    udp_rr_request->request_size,
                                    0,
                                    (struct sockaddr *)&peeraddr,
                                    &addrlen);
     if (request_bytes_recvd != udp_rr_request->request_size) {
       if ( SOCKET_EINTR(request_bytes_recvd) ) {
         /* we must have hit the end of test time. */
         break;
       }
       netperf_response.content.serv_errno = errno;
       send_response();
       exit(1);
     }
     recv_ring = recv_ring->next;

     /* Now, send the response to the remote; addrlen holds the length */
     /* of the peer address filled in by the recvfrom() above */
     response_bytes_sent = sendto(s_data,
                                  send_ring->buffer_ptr,
                                  udp_rr_request->response_size,
                                  0,
                                  (struct sockaddr *)&peeraddr,
                                  addrlen);
     if (response_bytes_sent != udp_rr_request->response_size) {
       if ( SOCKET_EINTR(response_bytes_sent) ) {
         /* we have hit end of test time. */
         break;
       }
       netperf_response.content.serv_errno = errno;
       send_response();
       exit(1);
     }
     send_ring = send_ring->next;

     trans_received++;
     if (trans_remaining) {
       trans_remaining--;
     }

     if (debug) {
       fprintf(where,
               "recv_udp_rr: Transaction %d complete.\n",
               trans_received);
       fflush(where);
     }

   }

   /* The loop now exits due to timeout or transaction count being */
   /* reached */

   cpu_stop(udp_rr_request->measure_cpu,&elapsed_time);

   if (timed_test && times_up) {
     /* we ended the test by time, and the timer was armed for */
     /* PAD_TIME longer than the requested test length, so subtract */
     /* PAD_TIME from the elapsed_time. A count-bound run also has */
     /* times_up set, but it never waited for the timer, so it must */
     /* not be adjusted. */
     elapsed_time -= PAD_TIME;
   }

   /* send the results to the sender */

   if (debug) {
     fprintf(where,
             "recv_udp_rr: got %d transactions\n",
             trans_received);
     fflush(where);
   }

   udp_rr_results->bytes_received = (trans_received *
                                     (udp_rr_request->request_size +
                                      udp_rr_request->response_size));
   udp_rr_results->trans_received = trans_received;
   udp_rr_results->elapsed_time   = elapsed_time;
   udp_rr_results->cpu_method     = cpu_method;
   udp_rr_results->num_cpus       = lib_num_loc_cpus;
   if (udp_rr_request->measure_cpu) {
     udp_rr_results->cpu_util = calc_cpu_util(elapsed_time);
   }

   if (debug) {
     fprintf(where,
             "recv_udp_rr: test complete, sending results.\n");
     fflush(where);
   }

   send_response();

   /* we are done with the socket now */
   close(s_data);

 }


  /* this routine implements the receive (netserver) side of a TCP_RR */
  /* test */
 void
 recv_tcp_rr()
 {

   struct ring_elt *send_ring;
   struct ring_elt *recv_ring;

   struct addrinfo *local_res;
   char local_name[BUFSIZ];
   char port_buffer[PORTBUFSIZE];

   struct	sockaddr_storage        myaddr_in,
   peeraddr_in;
   SOCKET	s_listen,s_data;
   netperf_socklen_t 	addrlen;
   char	*temp_message_ptr;
   int	trans_received;
   int	trans_remaining;
   int	bytes_sent;
   int	request_bytes_recvd;
   int	request_bytes_remaining;
   int	timed_out = 0;
   int   sock_closed = 0;
   float	elapsed_time;

   struct	tcp_rr_request_struct	*tcp_rr_request;
   struct	tcp_rr_response_struct	*tcp_rr_response;
   struct	tcp_rr_results_struct	*tcp_rr_results;

   tcp_rr_request =
     (struct tcp_rr_request_struct *)netperf_request.content.test_specific_data;
   tcp_rr_response =
     (struct tcp_rr_response_struct *)netperf_response.content.test_specific_data;
   tcp_rr_results =
     (struct tcp_rr_results_struct *)netperf_response.content.test_specific_data;

   if (debug) {
     fprintf(where,"netserver: recv_tcp_rr: entered...\n");
     fflush(where);
   }

   /* We want to set-up the listen socket with all the desired */
   /* parameters and then let the initiator know that all is ready. If */
   /* socket size defaults are to be used, then the initiator will have */
   /* sent us 0's. If the socket sizes cannot be changed, then we will */
   /* send-back what they are. If that information cannot be determined, */
   /* then we send-back -1's for the sizes. If things go wrong for any */
   /* reason, we will drop back ten yards and punt. */

   /* If anything goes wrong, we want the remote to know about it. It */
   /* would be best if the error that the remote reports to the user is */
   /* the actual error we encountered, rather than some bogus unexpected */
   /* response type message. */

   if (debug) {
     fprintf(where,"recv_tcp_rr: setting the response type...\n");
     fflush(where);
   }

   netperf_response.content.response_type = TCP_RR_RESPONSE;

   if (debug) {
     fprintf(where,"recv_tcp_rr: the response type is set...\n");
     fflush(where);
   }

   /* allocate the recv and send rings with the requested alignments */
   /* and offsets. raj 7/94 */
   if (debug) {
     fprintf(where,"recv_tcp_rr: requested recv alignment of %d offset %d\n",
 	    tcp_rr_request->recv_alignment,
 	    tcp_rr_request->recv_offset);
     fprintf(where,"recv_tcp_rr: requested send alignment of %d offset %d\n",
 	    tcp_rr_request->send_alignment,
 	    tcp_rr_request->send_offset);
     fflush(where);
   }

   /* at some point, these need to come to us from the remote system */
   if (send_width == 0) send_width = 1;
   if (recv_width == 0) recv_width = 1;

   send_ring = allocate_buffer_ring(send_width,
 				   tcp_rr_request->response_size,
 				   tcp_rr_request->send_alignment,
 				   tcp_rr_request->send_offset);

   recv_ring = allocate_buffer_ring(recv_width,
 				   tcp_rr_request->request_size,
 				   tcp_rr_request->recv_alignment,
 				   tcp_rr_request->recv_offset);


   /* Grab a socket to listen on, and then listen on it. */

   if (debug) {
     fprintf(where,"recv_tcp_rr: grabbing a socket...\n");
     fflush(where);
   }

   /* create_data_socket expects to find some things in the global */
   /* variables, so set the globals based on the values in the request. */
   /* once the socket has been created, we will set the response values */
   /* based on the updated value of those globals. raj 7/94 */
   lss_size_req = tcp_rr_request->send_buf_size;
   lsr_size_req = tcp_rr_request->recv_buf_size;
   loc_nodelay = tcp_rr_request->no_delay;
   loc_rcvavoid = tcp_rr_request->so_rcvavoid;
   loc_sndavoid = tcp_rr_request->so_sndavoid;

   set_hostname_and_port(local_name,
 			port_buffer,
 			nf_to_af(tcp_rr_request->ipfamily),
 			tcp_rr_request->port);

   local_res = complete_addrinfo(local_name,
 				local_name,
 				port_buffer,
 				nf_to_af(tcp_rr_request->ipfamily),
 				SOCK_STREAM,
 				IPPROTO_TCP,
 				0);

   s_listen = create_data_socket(local_res);

   if (s_listen == INVALID_SOCKET) {
     netperf_response.content.serv_errno = errno;
     send_response();

     exit(1);
   }


 #ifdef WIN32
   /* The test timer can fire during operations on the listening socket,
      so to make the start_timer below work we have to move
      it to close s_listen while we are blocked on accept. */
   win_kludge_socket2 = s_listen;
 #endif


   /* Now, let's set-up the socket to listen for connections */
   if (listen(s_listen, 5) == SOCKET_ERROR) {
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();

     exit(1);
   }


   /* now get the port number assigned by the system  */
   addrlen = sizeof(myaddr_in);
   if (getsockname(s_listen,
 		  (struct sockaddr *)&myaddr_in,
 		  &addrlen) == SOCKET_ERROR) {
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();

     exit(1);
   }

   /* Now myaddr_in contains the port and the internet address this is */
   /* returned to the sender also implicitly telling the sender that the */
   /* socket buffer sizing has been done. */

   tcp_rr_response->data_port_number =
     (int) ntohs(((struct sockaddr_in *)&myaddr_in)->sin_port);
   netperf_response.content.serv_errno   = 0;

   /* But wait, there's more. If the initiator wanted cpu measurements, */
   /* then we must call the calibrate routine, which will return the max */
   /* rate back to the initiator. If the CPU was not to be measured, or */
   /* something went wrong with the calibration, we will return a 0.0 to */
   /* the initiator. */

   tcp_rr_response->cpu_rate = (float)0.0; 	/* assume no cpu */
   tcp_rr_response->measure_cpu = 0;

   if (tcp_rr_request->measure_cpu) {
     tcp_rr_response->measure_cpu = 1;
     tcp_rr_response->cpu_rate = calibrate_local_cpu(tcp_rr_request->cpu_rate);
   }


   /* before we send the response back to the initiator, pull some of */
   /* the socket parms from the globals */
   tcp_rr_response->send_buf_size = lss_size;
   tcp_rr_response->recv_buf_size = lsr_size;
   tcp_rr_response->no_delay = loc_nodelay;
   tcp_rr_response->so_rcvavoid = loc_rcvavoid;
   tcp_rr_response->so_sndavoid = loc_sndavoid;
   tcp_rr_response->test_length = tcp_rr_request->test_length;
   send_response();

   addrlen = sizeof(peeraddr_in);

   if ((s_data = accept(s_listen,
 		       (struct sockaddr *)&peeraddr_in,
 		       &addrlen)) == INVALID_SOCKET) {
     /* Let's just punt. The remote will be given some information */
     close(s_listen);

     exit(1);
   }

 #ifdef KLUDGE_SOCKET_OPTIONS
   /* this is for those systems which *INCORRECTLY* fail to pass */
   /* attributes across an accept() call. Including this goes against */
   /* my better judgement :( raj 11/95 */

   kludge_socket_options(s_data);

 #endif /* KLUDGE_SOCKET_OPTIONS */

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR with the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
   win_kludge_socket = s_data;
   win_kludge_socket2 = INVALID_SOCKET;
 #endif /* WIN32 */

   if (debug) {
     fprintf(where,"recv_tcp_rr: accept completes on the data connection.\n");
     fflush(where);
   }

   /* Now it's time to start receiving data on the connection. We will */
   /* first grab the apropriate counters and then start grabbing. */

   cpu_start(tcp_rr_request->measure_cpu);

   /* The loop will exit when we hit the end of the test time, or when */
   /* we have exchanged the requested number of transactions. */

   if (tcp_rr_request->test_length > 0) {
     times_up = 0;
     trans_remaining = 0;
     start_timer(tcp_rr_request->test_length + PAD_TIME);
   }
   else {
     times_up = 1;
     trans_remaining = tcp_rr_request->test_length * -1;
   }

   trans_received = 0;

   while ((!times_up) || (trans_remaining > 0)) {
     temp_message_ptr = recv_ring->buffer_ptr;
     request_bytes_remaining	= tcp_rr_request->request_size;
     while(request_bytes_remaining > 0) {
       if((request_bytes_recvd=recv(s_data,
 				   temp_message_ptr,
 				   request_bytes_remaining,
 				   0)) == SOCKET_ERROR) {
 	if (SOCKET_EINTR(request_bytes_recvd))
 	{
 	  timed_out = 1;
 	  break;
 	}

 	netperf_response.content.serv_errno = errno;
 	send_response();
 	exit(1);
       }
       else if( request_bytes_recvd == 0 ) {
 	if (debug) {
 	  fprintf(where,"zero is my hero\n");
 	  fflush(where);
 	}
 	sock_closed = 1;
 	break;
       }
       else {
 	request_bytes_remaining -= request_bytes_recvd;
 	temp_message_ptr  += request_bytes_recvd;
       }
     }

     recv_ring = recv_ring->next;

     if ((timed_out) || (sock_closed)) {
       /* we hit the end of the test based on time - or the socket
 	 closed on us along the way.  bail out of here now... */
       if (debug) {
 	fprintf(where,"yo5\n");
 	fflush(where);
       }
       break;
     }

     /* Now, send the response to the remote */
     if((bytes_sent=send(s_data,
 			send_ring->buffer_ptr,
 			tcp_rr_request->response_size,
 			0)) == SOCKET_ERROR) {
       if (SOCKET_EINTR(bytes_sent)) {
 	/* the test timer has popped */
 	timed_out = 1;
 	fprintf(where,"yo6\n");
 	fflush(where);
 	break;
       }
       netperf_response.content.serv_errno = 992;
       send_response();
       exit(1);
     }

     send_ring = send_ring->next;

     trans_received++;
     if (trans_remaining) {
       trans_remaining--;
     }
   }


   /* The loop now exits due to timeout or transaction count being */
   /* reached */

   cpu_stop(tcp_rr_request->measure_cpu,&elapsed_time);

   stop_timer();

   if (timed_out) {
     /* we ended the test by time, which was at least 2 seconds */
     /* longer than we wanted to run. so, we want to subtract */
     /* PAD_TIME from the elapsed_time. */
     elapsed_time -= PAD_TIME;
   }

   /* send the results to the sender			*/

   if (debug) {
     fprintf(where,
 	    "recv_tcp_rr: got %d transactions\n",
 	    trans_received);
     fflush(where);
   }

   tcp_rr_results->bytes_received = (trans_received *
 				    (tcp_rr_request->request_size +
 				     tcp_rr_request->response_size));
   tcp_rr_results->trans_received = trans_received;
   tcp_rr_results->elapsed_time   = elapsed_time;
   tcp_rr_results->cpu_method     = cpu_method;
   tcp_rr_results->num_cpus       = lib_num_loc_cpus;
   if (tcp_rr_request->measure_cpu) {
     tcp_rr_results->cpu_util	= calc_cpu_util(elapsed_time);
   }

   if (debug) {
     fprintf(where,
 	    "recv_tcp_rr: test complete, sending results.\n");
     fflush(where);
   }

   /* we are now done with the sockets */
   close(s_data);
   close(s_listen);

   send_response();

 }


 /* loc_cpu_rate() calibrates the local cpu and writes the resulting */
 /* rate to "where" with a "%g" format and no header or trailing */
 /* newline, so that the output can be captured and fed to other */
 /* tests. Any rate given by the user is ignored: the calibration is */
 /* always asked for with a rate of 0.0. With a verbosity above 1 the */
 /* number of local cpus is printed as well. */
 void
 loc_cpu_rate()
 {
 #if defined(USE_LOOPER)
   float ignored_elapsed;
 #endif

   fprintf(where, "%g", calibrate_local_cpu(0.0));

   if (verbosity > 1) {
     /* pick singular or plural wording to match the cpu count */
     const char *verb = "is";
     const char *noun = "cpu";

     if (lib_num_loc_cpus > 1) {
       verb = "are";
       noun = "cpus";
     }

     fprintf(where,
             "\nThere %s %d local %s\n",
             verb,
             lib_num_loc_cpus,
             noun);
   }

 #if defined(USE_LOOPER)
   /* in the looper case a cpu_start/cpu_stop pair is needed to kill */
   /* the child processes. raj 4/95 */
   cpu_start(1);
   cpu_stop(1, &ignored_elapsed);
 #endif /* USE_LOOPER */

 }

 /* rem_cpu_rate() is the remote counterpart of loc_cpu_rate(): it */
 /* writes the rate returned by calibrate_remote_cpu() to "where" */
 /* with a "%g" format and no header or trailing newline. Since it */
 /* works against the remote system, the '-H' command line argument */
 /* is honoured. With a verbosity above 1 the number of remote cpus */
 /* is printed as well. */
 void
 rem_cpu_rate()
 {

   fprintf(where, "%g", calibrate_remote_cpu());

   if (verbosity > 1) {
     /* pick singular or plural wording to match the cpu count */
     const char *verb = "is";
     const char *noun = "cpu";

     if (lib_num_rem_cpus > 1) {
       verb = "are";
       noun = "cpus";
     }

     fprintf(where,
             "\nThere %s %d remote %s\n",
             verb,
             lib_num_rem_cpus,
             noun);
   }

 }


  /* this test is intended to test the performance of establishing a
     connection, exchanging a request/response pair, and repeating. it
     is expected that this would be a good starting-point for
     comparison of T/TCP with classic TCP for transactional workloads.
     it will also look (can look) much like the communication pattern
     of http for www access. */

 void
 send_tcp_conn_rr(char remote_host[])
 {

   char *tput_title = "\
 Local /Remote\n\
 Socket Size   Request  Resp.   Elapsed  Trans.\n\
 Send   Recv   Size     Size    Time     Rate         \n\
 bytes  Bytes  bytes    bytes   secs.    per sec   \n\n";

   char *tput_fmt_0 =
     "%7.2f\n";

   char *tput_fmt_1_line_1 = "\
 %-6d %-6d %-6d   %-6d  %-6.2f   %7.2f   \n";
   char *tput_fmt_1_line_2 = "\
 %-6d %-6d\n";

   char *cpu_title = "\
 Local /Remote\n\
 Socket Size   Request Resp.  Elapsed Trans.   CPU    CPU    S.dem   S.dem\n\
 Send   Recv   Size    Size   Time    Rate     local  remote local   remote\n\
 bytes  bytes  bytes   bytes  secs.   per sec  %%      %%      us/Tr   us/Tr\n\n";

   char *cpu_fmt_0 =
     "%6.3f\n";

   char *cpu_fmt_1_line_1 = "\
 %-6d %-6d %-6d  %-6d %-6.2f  %-6.2f   %-6.2f %-6.2f %-6.3f  %-6.3f\n";

   char *cpu_fmt_1_line_2 = "\
 %-6d %-6d\n";

   char *ksink_fmt = "\n\
 Alignment      Offset\n\
 Local  Remote  Local  Remote\n\
 Send   Recv    Send   Recv\n\
 %5d  %5d   %5d  %5d\n";


   int			timed_out = 0;
   float			elapsed_time;

   int	len;
   struct ring_elt *send_ring;
   struct ring_elt *recv_ring;
   char	*temp_message_ptr;
   int	nummessages;
   SOCKET	send_socket;
   int	trans_remaining;
   double	bytes_xferd;
   int	rsp_bytes_left;
   int	rsp_bytes_recvd;

   float	local_cpu_utilization;
   float	local_service_demand;
   float	remote_cpu_utilization;
   float	remote_service_demand;
   double	thruput;

   struct addrinfo *local_res;
   struct addrinfo *remote_res;

   int                           myport;
   int                           ret;

   struct	tcp_conn_rr_request_struct	*tcp_conn_rr_request;
   struct	tcp_conn_rr_response_struct	*tcp_conn_rr_response;
   struct	tcp_conn_rr_results_struct	*tcp_conn_rr_result;

   tcp_conn_rr_request =
     (struct tcp_conn_rr_request_struct *)netperf_request.content.test_specific_data;
   tcp_conn_rr_response =
     (struct tcp_conn_rr_response_struct *)netperf_response.content.test_specific_data;
   tcp_conn_rr_result =
     (struct tcp_conn_rr_results_struct *)netperf_response.content.test_specific_data;


 #ifdef WANT_HISTOGRAM
   if (verbosity > 1) {
     time_hist = HIST_new();
   }
 #endif /* WANT_HISTOGRAM */

   /* since we are now disconnected from the code that established the */
   /* control socket, and since we want to be able to use different */
   /* protocols and such, we are passed the name of the remote host and */
   /* must turn that into the test specific addressing information. */

   complete_addrinfos(&remote_res,
 		     &local_res,
 		     remote_host,
 		     SOCK_STREAM,
 		     IPPROTO_TCP,
 		     0);

   if ( print_headers ) {
     print_top_test_header("TCP Connect/Request/Response TEST",local_res,remote_res);
   }

   /* initialize a few counters */

   nummessages	=	0;
   bytes_xferd	=	0.0;
   times_up 	= 	0;

   /* set-up the data buffers with the requested alignment and offset */
   if (send_width == 0) send_width = 1;
   if (recv_width == 0) recv_width = 1;

   send_ring = allocate_buffer_ring(send_width,
 				   req_size,
 				   local_send_align,
 				   local_send_offset);

   recv_ring = allocate_buffer_ring(recv_width,
 				   rsp_size,
 				   local_recv_align,
 				   local_recv_offset);


   if (debug) {
     fprintf(where,"send_tcp_conn_rr: send_socket obtained...\n");
   }

   /* If the user has requested cpu utilization measurements, we must */
   /* calibrate the cpu(s). We will perform this task within the tests */
   /* themselves. If the user has specified the cpu rate, then */
   /* calibrate_local_cpu will return rather quickly as it will have */
   /* nothing to do. If local_cpu_rate is zero, then we will go through */
   /* all the "normal" calibration stuff and return the rate back.*/

   if (local_cpu_usage) {
     local_cpu_rate = calibrate_local_cpu(local_cpu_rate);
   }

   if (!no_control) {

     /* Tell the remote end to do a listen. The server alters the
        socket paramters on the other side at this point, hence the
        reason for all the values being passed in the setup message. If
        the user did not specify any of the parameters, they will be
        passed as 0, which will indicate to the remote that no changes
        beyond the system's default should be used. Alignment is the
        exception, it will default to 8, which will be no alignment
        alterations. */

     netperf_request.content.request_type =	DO_TCP_CRR;
     tcp_conn_rr_request->recv_buf_size	=	rsr_size_req;
     tcp_conn_rr_request->send_buf_size	=	rss_size_req;
     tcp_conn_rr_request->recv_alignment	=	remote_recv_align;
     tcp_conn_rr_request->recv_offset	=	remote_recv_offset;
     tcp_conn_rr_request->send_alignment	=	remote_send_align;
     tcp_conn_rr_request->send_offset	=	remote_send_offset;
     tcp_conn_rr_request->request_size	=	req_size;
     tcp_conn_rr_request->response_size	=	rsp_size;
     tcp_conn_rr_request->no_delay	=	rem_nodelay;
     tcp_conn_rr_request->measure_cpu	=	remote_cpu_usage;
     tcp_conn_rr_request->cpu_rate	=	remote_cpu_rate;
     tcp_conn_rr_request->so_rcvavoid	=	rem_rcvavoid;
     tcp_conn_rr_request->so_sndavoid	=	rem_sndavoid;
     if (test_time) {
       tcp_conn_rr_request->test_length	=	test_time;
     }
     else {
       tcp_conn_rr_request->test_length	=	test_trans * -1;
     }
     tcp_conn_rr_request->port           = atoi(remote_data_port);
     tcp_conn_rr_request->ipfamily       = af_to_nf(remote_res->ai_family);

     if (debug > 1) {
       fprintf(where,"netperf: send_tcp_conn_rr: requesting TCP crr test\n");
     }

     send_request();

     /* The response from the remote will contain all of the relevant
        socket parameters for this test type. We will put them back
        into the variables here so they can be displayed if desired.
        The remote will have calibrated CPU if necessary, and will have
        done all the needed set-up we will have calibrated the cpu
        locally before sending the request, and will grab the counter
        value right after the connect returns. The remote will grab the
        counter right after the accept call. This saves the hassle of
        extra messages being sent for the TCP tests.  */

     recv_response();

     if (!netperf_response.content.serv_errno) {
       rsr_size	       =	tcp_conn_rr_response->recv_buf_size;
       rss_size	       =	tcp_conn_rr_response->send_buf_size;
       rem_nodelay      =	tcp_conn_rr_response->no_delay;
       remote_cpu_usage =	tcp_conn_rr_response->measure_cpu;
       remote_cpu_rate  = 	tcp_conn_rr_response->cpu_rate;
       /* make sure that port numbers are in network order */
       set_port_number(remote_res,
 		      (unsigned short)tcp_conn_rr_response->data_port_number);

       if (debug) {
 	fprintf(where,"remote listen done.\n");
 	fprintf(where,"remote port is %u\n",get_port_number(remote_res));
 	fflush(where);
       }
     }
     else {
       Set_errno(netperf_response.content.serv_errno);
       fprintf(where,
 	      "netperf: remote error %d",
 	      netperf_response.content.serv_errno);
       perror("");
       fflush(where);
       exit(1);
     }
   }
 #ifdef WANT_DEMO
   DEMO_RR_SETUP(100)
 #endif

   /* pick a nice random spot between client_port_min and */
   /* client_port_max for our initial port number */
   srand(getpid());
   if (client_port_max - client_port_min) {
     myport = client_port_min +
       (rand() % (client_port_max - client_port_min));
   }
   else {
     myport = client_port_min;
   }
   /* there will be a ++ before the first call to bind, so subtract one */
   myport--;
   /* Set-up the test end conditions. For a request/response test, they */
   /* can be either time or transaction based. */

   if (test_time) {
     /* The user wanted to end the test after a period of time. */
     times_up = 0;
     trans_remaining = 0;
     start_timer(test_time);
   }
   else {
     /* The tester wanted to send a number of bytes. */
     trans_remaining = test_bytes;
     times_up = 1;
   }

   /* The cpu_start routine will grab the current time and possibly */
   /* value of the idle counter for later use in measuring cpu */
   /* utilization and/or service demand and thruput. */


   cpu_start(local_cpu_usage);

 #ifdef WANT_DEMO
       if (demo_mode) {
 	HIST_timestamp(demo_one_ptr);
       }
 #endif

   /* We use an "OR" to control test execution. When the test is */
   /* controlled by time, the byte count check will always return false. */
   /* When the test is controlled by byte count, the time test will */
   /* always return false. When the test is finished, the whole */
   /* expression will go false and we will stop sending data. I think I */
   /* just arbitrarily decrement trans_remaining for the timed test, but */
   /* will not do that just yet... One other question is whether or not */
   /* the send buffer and the receive buffer should be the same buffer. */

   while ((!times_up) || (trans_remaining > 0)) {

 #ifdef WANT_HISTOGRAM
     if (verbosity > 1) {
       /* timestamp just before our call to create the socket, and then */
       /* again just after the receive raj 3/95 */
       HIST_timestamp(&time_one);
     }
 #endif /* WANT_HISTOGRAM */

 newport:
     /* pick a new port number */
     myport++;

     /* wrap the port number when we get to client_port_max. NOTE, some */
     /* broken TCP's might treat the port number as a signed 16 bit */
     /* quantity.  we aren't interested in testing such broken */
     /* implementations :) so we won't make sure that it is below 32767 */
     /* raj 8/94  */
     if (myport >= client_port_max) {
       myport = client_port_min;
     }

     /* we do not want to use the port number that the server is */
     /* sitting at - this would cause us to fail in a loopback test. we */
     /* could just rely on the failure of the bind to get us past this, */
     /* but I'm guessing that in this one case at least, it is much */
     /* faster, given that we *know* that port number is already in use */
     /* (or rather would be in a loopback test) */

     if (myport == get_port_number(remote_res)) myport++;

     if (debug) {
       if ((nummessages % 100) == 0) {
 	printf("port %d\n",myport);
       }
     }

     /* set up the data socket */
     set_port_number(local_res, (unsigned short)myport);
     send_socket = create_data_socket(local_res);

     if (send_socket == INVALID_SOCKET) {
       perror("netperf: send_tcp_conn_rr: tcp stream data socket");
       exit(1);
     }


     /* we used to call bind here, but that is now taken-care-of by the
        create_data_socket routine. */

     /* Connect up to the remote port on the data socket  */
     if ((ret = connect(send_socket,
 		       remote_res->ai_addr,
 		       remote_res->ai_addrlen)) == INVALID_SOCKET){
       if (SOCKET_EINTR(ret))
 	  {
 	    /* we hit the end of a */
 	    /* timed test. */
 	    timed_out = 1;
 	    break;
       }
       if ((SOCKET_EADDRINUSE(ret)) || SOCKET_EADDRNOTAVAIL(ret)) {
 	/* likely something our explicit bind() would have caught in
            the past, so go get another port, via create_data_socket.
            yes, this is a bit more overhead than before, but the
            condition should be rather rare.  raj 2005-02-08 */
 	close(send_socket);
 	goto newport;
       }
       perror("netperf: data socket connect failed");
       printf("\tattempted to connect on socket %d to port %d",
 	     send_socket,
 	     get_port_number(remote_res));
       printf(" from port %d \n",get_port_number(local_res));
       exit(1);
     }


     /* send the request */
     if((len=send(send_socket,
 		 send_ring->buffer_ptr,
 		 req_size,
 		 0)) != req_size) {
       if (SOCKET_EINTR(len))
 	  {
 	    /* we hit the end of a */
 	    /* timed test. */
 	    timed_out = 1;
 	    break;
       }
       perror("send_tcp_conn_rr: data send error");
       exit(1);
     }
     send_ring = send_ring->next;

     /* receive the response */
     rsp_bytes_left = rsp_size;
     temp_message_ptr  = recv_ring->buffer_ptr;


     do {
       rsp_bytes_recvd = recv(send_socket,
 			     temp_message_ptr,
 			     rsp_bytes_left,
 			     0);
       if (rsp_bytes_recvd > 0) {
 	rsp_bytes_left -= rsp_bytes_recvd;
 	temp_message_ptr += rsp_bytes_recvd;
       }
       else {
 	break;
       }
     } while (rsp_bytes_left);


     /* OK, we are out of the loop - now what? */
     if (rsp_bytes_recvd < 0) {
       /* did the timer hit, or was there an error? */
       if (SOCKET_EINTR(rsp_bytes_recvd))
 	  {
 	    /* We hit the end of a timed test. */
 	    timed_out = 1;
 	    break;
 	  }
 	  perror("send_tcp_conn_rr: data recv error");
 	  exit(1);
     }

     /* if this is a no_control test, we initiate connection close,
        otherwise the remote netserver does it to remain just like
        previous behaviour. raj 2007-27-08 */
     if (!no_control) {
       shutdown(send_socket,SHUT_WR);
     }

     /* we are expecting to get either a return of zero indicating
        connection close, or an error.  */
     rsp_bytes_recvd = recv(send_socket,
 			   temp_message_ptr,
 			   1,
 			   0);

     /* our exit from the while loop should generally be when */
    /* rsp_bytes_recvd is equal to zero, which implies the connection */
     /* has been closed by the server side. By waiting until we get the */
     /* zero return we can avoid race conditions that stick us with the */
     /* TIME_WAIT connection and not the server. raj 8/96 */

 #ifdef VMWARE_UW
     /* why this should be for VMware I'm not sure, but it was given as
        part of the patches, so we include it here, but put it under an
        ifdef VMWARE_UW. raj 2008-07-25 */
     if (sp_bytes_recvd < 0 && errno == ECONNRESET) {
       rsp_bytes_recvd = 0;
     }
 #endif /* VMWARE_UW */

     if (rsp_bytes_recvd == 0) {
       /* connection close, call close. we assume that the requisite */
       /* number of bytes have been received */
       recv_ring = recv_ring->next;

 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
 	HIST_timestamp(&time_two);
 	HIST_add(time_hist,delta_micro(&time_one,&time_two));
       }
 #endif /* WANT_HISTOGRAM */

 #ifdef WANT_DEMO
       DEMO_RR_INTERVAL(1)
 #endif

       nummessages++;
       if (trans_remaining) {
 	trans_remaining--;
       }

       if (debug > 3) {
 	fprintf(where,
 		"Transaction %d completed on local port %d\n",
 		nummessages,
 		get_port_number(local_res));
 	fflush(where);
       }

       close(send_socket);

     }
     else {
      /* it was less than zero - an error occurred */
       if (SOCKET_EINTR(rsp_bytes_recvd))
 	  {
 	    /* We hit the end of a timed test. */
 	    timed_out = 1;
 	    break;
 	  }
 	  perror("send_tcp_conn_rr: data recv error");
 	  exit(1);
     }

   }


   /* this call will always give us the elapsed time for the test, and */
   /* will also store-away the necessaries for cpu utilization */

   cpu_stop(local_cpu_usage,&elapsed_time);	/* was cpu being measured? */
   /* how long did we really run? */

   if (!no_control) {
     /* Get the statistics from the remote end. The remote will have
        calculated service demand and all those interesting things. If
        it wasn't supposed to care, it will return obvious values. */

     recv_response();
     if (!netperf_response.content.serv_errno) {
       if (debug)
 	fprintf(where,"remote results obtained\n");
     }
     else {
       Set_errno(netperf_response.content.serv_errno);
       fprintf(where,
 	      "netperf: remote error %d",
 	      netperf_response.content.serv_errno);
       perror("");
       fflush(where);

       exit(1);
     }
   }

   /* We now calculate what our thruput was for the test. In the future, */
   /* we may want to include a calculation of the thruput measured by */
   /* the remote, but it should be the case that for a TCP stream test, */
   /* that the two numbers should be *very* close... We calculate */
   /* bytes_sent regardless of the way the test length was controlled. */
   /* If it was time, we needed to, and if it was by bytes, the user may */
   /* have specified a number of bytes that wasn't a multiple of the */
   /* send_size, so we really didn't send what he asked for ;-) We use */
   /* Kbytes/s as the units of thruput for a TCP stream test, where K = */
   /* 1024. A future enhancement *might* be to choose from a couple of */
   /* unit selections. */

   bytes_xferd	= (req_size * nummessages) + (rsp_size * nummessages);
   thruput	= calc_thruput(bytes_xferd);

   if (local_cpu_usage || remote_cpu_usage) {
     /* We must now do a little math for service demand and cpu */
     /* utilization for the system(s) */
     /* Of course, some of the information might be bogus because */
     /* there was no idle counter in the kernel(s). We need to make */
     /* a note of this for the user's benefit...*/
     if (local_cpu_usage) {
       if (local_cpu_rate == 0.0) {
 	fprintf(where,
 		"WARNING WARNING WARNING  WARNING WARNING WARNING  WARNING!\n");
 	fprintf(where,
 		"Local CPU usage numbers based on process information only!\n");
 	fflush(where);
       }
       local_cpu_utilization = calc_cpu_util(0.0);
       /* since calc_service demand is doing ms/Kunit we will */
       /* multiply the number of transaction by 1024 to get */
       /* "good" numbers */
       local_service_demand  = calc_service_demand((double) nummessages*1024,
 						  0.0,
 						  0.0,
 						  0);
     }
     else {
       local_cpu_utilization	= (float) -1.0;
       local_service_demand	= (float) -1.0;
     }

     if (remote_cpu_usage) {
       if (remote_cpu_rate == 0.0) {
 	fprintf(where,
 		"DANGER  DANGER  DANGER    DANGER  DANGER  DANGER    DANGER!\n");
 	fprintf(where,
 		"Remote CPU usage numbers based on process information only!\n");
 	fflush(where);
       }
       remote_cpu_utilization = tcp_conn_rr_result->cpu_util;
       /* since calc_service demand is doing ms/Kunit we will */
       /* multiply the number of transaction by 1024 to get */
       /* "good" numbers */
       remote_service_demand = calc_service_demand((double) nummessages*1024,
 						  0.0,
 						  remote_cpu_utilization,
 						  tcp_conn_rr_result->num_cpus);
     }
     else {
       remote_cpu_utilization = (float) -1.0;
       remote_service_demand  = (float) -1.0;
     }

     /* We are now ready to print all the information. If the user */
     /* has specified zero-level verbosity, we will just print the */
     /* local service demand, or the remote service demand. If the */
     /* user has requested verbosity level 1, he will get the basic */
     /* "streamperf" numbers. If the user has specified a verbosity */
     /* of greater than 1, we will display a veritable plethora of */
     /* background information from outside of this block as it it */
     /* not cpu_measurement specific...  */

     switch (verbosity) {
     case 0:
       if (local_cpu_usage) {
 	fprintf(where,
 		cpu_fmt_0,
 		local_service_demand);
       }
       else {
 	fprintf(where,
 		cpu_fmt_0,
 		remote_service_demand);
       }
       break;
     case 1:
     case 2:

       if (print_headers) {
 	fprintf(where,
 		cpu_title,
 		local_cpu_method,
 		remote_cpu_method);
       }

       fprintf(where,
 	      cpu_fmt_1_line_1,		/* the format string */
 	      lss_size,		/* local sendbuf size */
 	      lsr_size,
 	      req_size,		/* how large were the requests */
 	      rsp_size,		/* guess */
 	      elapsed_time,		/* how long was the test */
 	      nummessages/elapsed_time,
 	      local_cpu_utilization,	/* local cpu */
 	      remote_cpu_utilization,	/* remote cpu */
 	      local_service_demand,	/* local service demand */
 	      remote_service_demand);	/* remote service demand */
       fprintf(where,
 	      cpu_fmt_1_line_2,
 	      rss_size,
 	      rsr_size);
       break;
     }
   }
   else {
     /* The tester did not wish to measure service demand. */
     switch (verbosity) {
     case 0:
       fprintf(where,
 	      tput_fmt_0,
 	      nummessages/elapsed_time);
       break;
     case 1:
     case 2:
       if (print_headers) {
 	fprintf(where,tput_title,format_units());
       }

       fprintf(where,
 	      tput_fmt_1_line_1,	/* the format string */
 	      lss_size,
 	      lsr_size,
 	      req_size,		/* how large were the requests */
 	      rsp_size,		/* how large were the responses */
 	      elapsed_time, 		/* how long did it take */
 	      nummessages/elapsed_time);
       fprintf(where,
 	      tput_fmt_1_line_2,
 	      rss_size, 		/* remote recvbuf size */
 	      rsr_size);

       break;
     }
   }

   /* it would be a good thing to include information about some of the */
   /* other parameters that may have been set for this test, but at the */
   /* moment, I do not wish to figure-out all the  formatting, so I will */
   /* just put this comment here to help remind me that it is something */
   /* that should be done at a later time. */

   if (verbosity > 1) {
     /* The user wanted to know it all, so we will give it to him. */
     /* This information will include as much as we can find about */
     /* TCP statistics, the alignments of the sends and receives */
     /* and all that sort of rot... */

     fprintf(where,
 	    ksink_fmt,
 	    local_send_align,
 	    remote_recv_offset,
 	    local_send_offset,
 	    remote_recv_offset);

 #ifdef WANT_HISTOGRAM
     fprintf(where,"\nHistogram of request/response times\n");
     fflush(where);
     HIST_report(time_hist);
 #endif /* WANT_HISTOGRAM */

   }

 }


 void
 recv_tcp_conn_rr()
 {

   char  *message;
   struct addrinfo *local_res;
   char local_name[BUFSIZ];
   char port_buffer[PORTBUFSIZE];

   struct	sockaddr_storage        myaddr_in, peeraddr_in;
   SOCKET	s_listen,s_data;
   netperf_socklen_t 	addrlen;
   char	*recv_message_ptr;
   char	*send_message_ptr;
   char	*temp_message_ptr;
   int	trans_received;
   int	trans_remaining;
   int	bytes_sent;
   int	request_bytes_recvd;
   int	request_bytes_remaining;
   int	timed_out = 0;
   float	elapsed_time;

   struct	tcp_conn_rr_request_struct	*tcp_conn_rr_request;
   struct	tcp_conn_rr_response_struct	*tcp_conn_rr_response;
   struct	tcp_conn_rr_results_struct	*tcp_conn_rr_results;

   tcp_conn_rr_request =
     (struct tcp_conn_rr_request_struct *)netperf_request.content.test_specific_data;
   tcp_conn_rr_response =
     (struct tcp_conn_rr_response_struct *)netperf_response.content.test_specific_data;
   tcp_conn_rr_results =
     (struct tcp_conn_rr_results_struct *)netperf_response.content.test_specific_data;

   if (debug) {
     fprintf(where,"netserver: recv_tcp_conn_rr: entered...\n");
     fflush(where);
   }

   /* We want to set-up the listen socket with all the desired */
   /* parameters and then let the initiator know that all is ready. If */
   /* socket size defaults are to be used, then the initiator will have */
   /* sent us 0's. If the socket sizes cannot be changed, then we will */
   /* send-back what they are. If that information cannot be determined, */
   /* then we send-back -1's for the sizes. If things go wrong for any */
   /* reason, we will drop back ten yards and punt. */

   /* If anything goes wrong, we want the remote to know about it. It */
   /* would be best if the error that the remote reports to the user is */
   /* the actual error we encountered, rather than some bogus unexpected */
   /* response type message. */

   if (debug) {
     fprintf(where,"recv_tcp_conn_rr: setting the response type...\n");
     fflush(where);
   }

   netperf_response.content.response_type = TCP_CRR_RESPONSE;

   if (debug) {
     fprintf(where,"recv_tcp_conn_rr: the response type is set...\n");
     fflush(where);
   }

   /* set-up the data buffer with the requested alignment and offset */
   message = (char *)malloc(DATABUFFERLEN);
   if (message == NULL) {
     printf("malloc(%d) failed!\n", DATABUFFERLEN);
     exit(1);
   }

   /* We now alter the message_ptr variables to be at the desired */
   /* alignments with the desired offsets. */

   if (debug) {
     fprintf(where,
 	    "recv_tcp_conn_rr: requested recv alignment of %d offset %d\n",
 	    tcp_conn_rr_request->recv_alignment,
 	    tcp_conn_rr_request->recv_offset);
     fprintf(where,
 	    "recv_tcp_conn_rr: requested send alignment of %d offset %d\n",
 	    tcp_conn_rr_request->send_alignment,
 	    tcp_conn_rr_request->send_offset);
     fflush(where);
   }

   recv_message_ptr = ALIGN_BUFFER(message, tcp_conn_rr_request->recv_alignment, tcp_conn_rr_request->recv_offset);

   send_message_ptr = ALIGN_BUFFER(message, tcp_conn_rr_request->send_alignment, tcp_conn_rr_request->send_offset);

   if (debug) {
     fprintf(where,"recv_tcp_conn_rr: receive alignment and offset set...\n");
     fflush(where);
   }

   /* Grab a socket to listen on, and then listen on it. */

   if (debug) {
     fprintf(where,"recv_tcp_conn_rr: grabbing a socket...\n");
     fflush(where);
   }

   /* create_data_socket expects to find some things in the global */
   /* variables, so set the globals based on the values in the request. */
   /* once the socket has been created, we will set the response values */
   /* based on the updated value of those globals. raj 7/94 */
   lss_size_req = tcp_conn_rr_request->send_buf_size;
   lsr_size_req = tcp_conn_rr_request->recv_buf_size;
   loc_nodelay = tcp_conn_rr_request->no_delay;
   loc_rcvavoid = tcp_conn_rr_request->so_rcvavoid;
   loc_sndavoid = tcp_conn_rr_request->so_sndavoid;

   set_hostname_and_port(local_name,
 			port_buffer,
 			nf_to_af(tcp_conn_rr_request->ipfamily),
 			tcp_conn_rr_request->port);

   local_res = complete_addrinfo(local_name,
 				local_name,
 				port_buffer,
 				nf_to_af(tcp_conn_rr_request->ipfamily),
 				SOCK_STREAM,
 				IPPROTO_TCP,
 				0);

   s_listen = create_data_socket(local_res);

   if (s_listen == INVALID_SOCKET) {
     netperf_response.content.serv_errno = errno;
     send_response();
     if (debug) {
       fprintf(where,"could not create data socket\n");
       fflush(where);
     }
     exit(1);
   }

 #ifdef WIN32
     /* The test timer can fire during operations on the listening socket,
        so to make the start_timer below work we have to move
        it to close s_listen while we are blocked on accept. */
     win_kludge_socket2 = s_listen;
 #endif


   /* Now, let's set-up the socket to listen for connections */
   if (listen(s_listen, 5) == SOCKET_ERROR) {
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();
     if (debug) {
       fprintf(where,"could not listen\n");
       fflush(where);
     }
     exit(1);
   }

   /* now get the port number assigned by the system  */
   addrlen = sizeof(myaddr_in);
   if (getsockname(s_listen,
 		  (struct sockaddr *)&myaddr_in,
 		  &addrlen) == SOCKET_ERROR){
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();
     if (debug) {
       fprintf(where,"could not getsockname\n");
       fflush(where);
     }
     exit(1);
   }

   /* Now myaddr_in contains the port and the internet address this is */
   /* returned to the sender also implicitly telling the sender that the */
   /* socket buffer sizing has been done. */

   tcp_conn_rr_response->data_port_number =
     (int) ntohs(((struct sockaddr_in *)&myaddr_in)->sin_port);
   if (debug) {
     fprintf(where,"telling the remote to call me at %d\n",
 	    tcp_conn_rr_response->data_port_number);
     fflush(where);
   }
   netperf_response.content.serv_errno   = 0;

   /* But wait, there's more. If the initiator wanted cpu measurements, */
   /* then we must call the calibrate routine, which will return the max */
   /* rate back to the initiator. If the CPU was not to be measured, or */
   /* something went wrong with the calibration, we will return a 0.0 to */
   /* the initiator. */

   tcp_conn_rr_response->cpu_rate = (float)0.0; 	/* assume no cpu */
   if (tcp_conn_rr_request->measure_cpu) {
     tcp_conn_rr_response->measure_cpu = 1;
     tcp_conn_rr_response->cpu_rate =
       calibrate_local_cpu(tcp_conn_rr_request->cpu_rate);
   }


   /* before we send the response back to the initiator, pull some of */
   /* the socket parms from the globals */
   tcp_conn_rr_response->send_buf_size = lss_size;
   tcp_conn_rr_response->recv_buf_size = lsr_size;
   tcp_conn_rr_response->no_delay = loc_nodelay;
   tcp_conn_rr_response->so_rcvavoid = loc_rcvavoid;
   tcp_conn_rr_response->so_sndavoid = loc_sndavoid;

   send_response();

   addrlen = sizeof(peeraddr_in);

   /* Now it's time to start receiving data on the connection. We will */
   /* first grab the apropriate counters and then start grabbing. */

   cpu_start(tcp_conn_rr_request->measure_cpu);

   /* The loop will exit when the sender does a shutdown, which will */
   /* return a length of zero   */

   if (tcp_conn_rr_request->test_length > 0) {
     times_up = 0;
     trans_remaining = 0;
     start_timer(tcp_conn_rr_request->test_length + PAD_TIME);
   }
   else {
     times_up = 1;
     trans_remaining = tcp_conn_rr_request->test_length * -1;
   }

   trans_received = 0;

   while ((!times_up) || (trans_remaining > 0)) {

     /* accept a connection from the remote */
 #ifdef WIN32
     /* The test timer will probably fire during this accept,
        so to make the start_timer above work we have to move
        it to close s_listen while we are blocked on accept. */
     win_kludge_socket = s_listen;
 #endif
     if ((s_data=accept(s_listen,
 		       (struct sockaddr *)&peeraddr_in,
 		       &addrlen)) == INVALID_SOCKET) {
       if (errno == EINTR) {
 	/* the timer popped */
 	timed_out = 1;
 	break;
       }
       fprintf(where,"recv_tcp_conn_rr: accept: errno = %d\n",errno);
       fflush(where);
       close(s_listen);

       exit(1);
     }

     if (debug) {
       fprintf(where,"recv_tcp_conn_rr: accepted data connection.\n");
       fflush(where);
     }

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR with the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
   win_kludge_socket = s_data;
 #endif /* WIN32 */

 #ifdef KLUDGE_SOCKET_OPTIONS
     /* this is for those systems which *INCORRECTLY* fail to pass */
     /* attributes across an accept() call. Including this goes against */
     /* my better judgement :( raj 11/95 */

     kludge_socket_options(s_data);

 #endif /* KLUDGE_SOCKET_OPTIONS */

     temp_message_ptr	= recv_message_ptr;
     request_bytes_remaining	= tcp_conn_rr_request->request_size;

     /* receive the request from the other side */
     while (!times_up && (request_bytes_remaining > 0)) {
       if((request_bytes_recvd=recv(s_data,
 				   temp_message_ptr,
 				   request_bytes_remaining,
 				   0)) == SOCKET_ERROR) {
 	if (SOCKET_EINTR(request_bytes_recvd))
 	{
 	  /* the timer popped */
 	  timed_out = 1;
 	  break;
 	}
 	netperf_response.content.serv_errno = errno;
 	send_response();
 	exit(1);
       }
       else {
 	request_bytes_remaining -= request_bytes_recvd;
 	temp_message_ptr  += request_bytes_recvd;
       }
     }

     if (timed_out) {
       /* we hit the end of the test based on time - lets */
       /* bail out of here now... */
       fprintf(where,"yo5\n");
       fflush(where);
       break;
     }

     /* Now, send the response to the remote */
     if((bytes_sent=send(s_data,
 			send_message_ptr,
 			tcp_conn_rr_request->response_size,
 			0)) == SOCKET_ERROR) {
       if (errno == EINTR) {
 	/* the test timer has popped */
 	timed_out = 1;
 	fprintf(where,"yo6\n");
 	fflush(where);
 	break;
       }
       netperf_response.content.serv_errno = 99;
       send_response();
       exit(1);
     }

     trans_received++;
     if (trans_remaining) {
       trans_remaining--;
     }

     if (debug) {
       fprintf(where,
 	      "recv_tcp_conn_rr: Transaction %d complete\n",
 	      trans_received);
       fflush(where);
     }

     /* close the connection. the server will likely do a graceful */
     /* close of the connection, insuring that all data has arrived at */
     /* the client. for this it will call shutdown(), and then recv() and */
     /* then close(). I'm reasonably confident that this is the */
     /* appropriate sequence of calls - I would like to hear of */
     /* examples in web servers to the contrary. raj 10/95*/
 #ifdef TCP_CRR_SHUTDOWN
     shutdown(s_data,SHUT_WR);
     recv(s_data,
 	 recv_message_ptr,
 	 1,
 	 0);
     close(s_data);
 #else
     close(s_data);
 #endif /* TCP_CRR_SHUTDOWN */

   }


   /* The loop now exits due to timeout or transaction count being */
   /* reached */

   cpu_stop(tcp_conn_rr_request->measure_cpu,&elapsed_time);

   if (timed_out) {
     /* we ended the test by time, which was at least 2 seconds */
     /* longer than we wanted to run. so, we want to subtract */
     /* PAD_TIME from the elapsed_time. */
     elapsed_time -= PAD_TIME;
   }
   /* send the results to the sender			*/

   if (debug) {
     fprintf(where,
 	    "recv_tcp_conn_rr: got %d transactions\n",
 	    trans_received);
     fflush(where);
   }

   tcp_conn_rr_results->bytes_received	= (trans_received *
 					   (tcp_conn_rr_request->request_size +
 					    tcp_conn_rr_request->response_size));
   tcp_conn_rr_results->trans_received	= trans_received;
   tcp_conn_rr_results->elapsed_time	= elapsed_time;
   if (tcp_conn_rr_request->measure_cpu) {
     tcp_conn_rr_results->cpu_util	= calc_cpu_util(elapsed_time);
   }

   if (debug) {
     fprintf(where,
 	    "recv_tcp_conn_rr: test complete, sending results.\n");
     fflush(where);
   }

   send_response();

 }


 #ifdef DO_1644

  /* this test is intended to test the performance of establishing a */
  /* connection, exchanging a request/response pair, and repeating. it */
  /* is expected that this would be a good starting-point for */
  /* comparison of T/TCP with classic TCP for transactional workloads. */
  /* it will also look (can look) much like the communication pattern */
  /* of http for www access. */

 int
 send_tcp_tran_rr(char remote_host[])
 {

   char *tput_title = "\
 Local /Remote\n\
 Socket Size   Request  Resp.   Elapsed  Trans.\n\
 Send   Recv   Size     Size    Time     Rate         \n\
 bytes  Bytes  bytes    bytes   secs.    per sec   \n\n";

   char *tput_fmt_0 =
     "%7.2f\n";

   char *tput_fmt_1_line_1 = "\
 %-6d %-6d %-6d   %-6d  %-6.2f   %7.2f   \n";
   char *tput_fmt_1_line_2 = "\
 %-6d %-6d\n";

   char *cpu_title = "\
 Local /Remote\n\
 Socket Size   Request Resp.  Elapsed Trans.   CPU    CPU    S.dem   S.dem\n\
 Send   Recv   Size    Size   Time    Rate     local  remote local   remote\n\
 bytes  bytes  bytes   bytes  secs.   per sec  %%      %%      us/Tr   us/Tr\n\n";

   char *cpu_fmt_0 =
     "%6.3f\n";

   char *cpu_fmt_1_line_1 = "\
 %-6d %-6d %-6d  %-6d %-6.2f  %-6.2f   %-6.2f %-6.2f %-6.3f  %-6.3f\n";

   char *cpu_fmt_1_line_2 = "\
 %-6d %-6d\n";

   char *ksink_fmt = "\n\
 Alignment      Offset\n\
 Local  Remote  Local  Remote\n\
 Send   Recv    Send   Recv\n\
 %5d  %5d   %5d  %5d\n";


   int 			one = 1;
   int			timed_out = 0;
   float			elapsed_time;

   int	len;
   struct ring_elt *send_ring;
   struct ring_elt *recv_ring;
   char	*temp_message_ptr;
   int	nummessages;
   SOCKET	send_socket;
   int	trans_remaining;
   double	bytes_xferd;
   int	sock_opt_len = sizeof(int);
   int	rsp_bytes_left;
   int	rsp_bytes_recvd;

   float	local_cpu_utilization;
   float	local_service_demand;
   float	remote_cpu_utilization;
   float	remote_service_demand;
   double	thruput;

   struct	hostent	        *hp;
   struct	sockaddr_in	server;
   struct        sockaddr_in     *myaddr;
   unsigned      int             addr;
   int                           myport;

   struct	tcp_tran_rr_request_struct	*tcp_tran_rr_request;
   struct	tcp_tran_rr_response_struct	*tcp_tran_rr_response;
   struct	tcp_tran_rr_results_struct	*tcp_tran_rr_result;

   tcp_tran_rr_request =
     (struct tcp_tran_rr_request_struct *)netperf_request.content.test_specific_data;
   tcp_tran_rr_response =
     (struct tcp_tran_rr_response_struct *)netperf_response.content.test_specific_data;
   tcp_tran_rr_result =
     (struct tcp_tran_rr_results_struct *)netperf_response.content.test_specific_data;


 #ifdef WANT_HISTOGRAM
   if (verbosity > 1) {
     time_hist = HIST_new();
   }
 #endif /* WANT_HISTOGRAM */

   /* since we are now disconnected from the code that established the */
   /* control socket, and since we want to be able to use different */
   /* protocols and such, we are passed the name of the remote host and */
   /* must turn that into the test specific addressing information. */

   myaddr = (struct sockaddr_storage *)malloc(sizeof(struct sockaddr_storage));
   if (myaddr == NULL) {
     printf("malloc(%d) failed!\n", sizeof(struct sockaddr_storage));
     exit(1);
   }

   bzero((char *)&server,
 	sizeof(server));
   bzero((char *)myaddr,
 	sizeof(struct sockaddr_storage));
   myaddr->sin_family = AF_INET;

   complete_addrinfos(&remote_res,
 		     &local_res,
 		     remote_host,
 		     SOCK_STREAM,
 		     IPPROTO_TCP,
 		     0);

   if ( print_headers ) {
     print_top_test_header("TCP Transactional/Request/Response TEST",local_res,remote_res);
   }

   /* initialize a few counters */

   nummessages	=	0;
   bytes_xferd	=	0.0;
   times_up 	= 	0;

   /* set-up the data buffers with the requested alignment and offset */
   if (send_width == 0) send_width = 1;
   if (recv_width == 0) recv_width = 1;

   send_ring = allocate_buffer_ring(send_width,
 				   req_size,
 				   local_send_align,
 				   local_send_offset);

   recv_ring = allocate_buffer_ring(recv_width,
 				   rsp_size,
 				   local_recv_align,
 				   local_recv_offset);


   if (debug) {
     fprintf(where,"send_tcp_tran_rr: send_socket obtained...\n");
   }

   /* If the user has requested cpu utilization measurements, we must */
   /* calibrate the cpu(s). We will perform this task within the tests */
   /* themselves. If the user has specified the cpu rate, then */
   /* calibrate_local_cpu will return rather quickly as it will have */
   /* nothing to do. If local_cpu_rate is zero, then we will go through */
   /* all the "normal" calibration stuff and return the rate back.*/

   if (local_cpu_usage) {
     local_cpu_rate = calibrate_local_cpu(local_cpu_rate);
   }

   /* Tell the remote end to do a listen. The server alters the socket */
   /* parameters on the other side at this point, hence the reason for */
   /* all the values being passed in the setup message. If the user did */
   /* not specify any of the parameters, they will be passed as 0, which */
   /* will indicate to the remote that no changes beyond the system's */
   /* default should be used. Alignment is the exception, it will */
   /* default to 8, which will be no alignment alterations. */

   netperf_request.content.request_type	        =	DO_TCP_TRR;
   tcp_tran_rr_request->recv_buf_size	=	rsr_size_req;
   tcp_tran_rr_request->send_buf_size	=	rss_size_req;
   tcp_tran_rr_request->recv_alignment	=	remote_recv_align;
   tcp_tran_rr_request->recv_offset	=	remote_recv_offset;
   tcp_tran_rr_request->send_alignment	=	remote_send_align;
   tcp_tran_rr_request->send_offset	=	remote_send_offset;
   tcp_tran_rr_request->request_size	=	req_size;
   tcp_tran_rr_request->response_size	=	rsp_size;
   tcp_tran_rr_request->no_delay	        =	rem_nodelay;
   tcp_tran_rr_request->measure_cpu	=	remote_cpu_usage;
   tcp_tran_rr_request->cpu_rate	        =	remote_cpu_rate;
   tcp_tran_rr_request->so_rcvavoid	=	rem_rcvavoid;
   tcp_tran_rr_request->so_sndavoid	=	rem_sndavoid;
   if (test_time) {
     tcp_tran_rr_request->test_length	=	test_time;
   }
   else {
     tcp_tran_rr_request->test_length	=	test_trans * -1;
   }
   tcp_tran_rr_request->port             =       atoi(remote_data_port);
   tcp_tran_rr_request->ipfamily        =       af_to_nf(remote_res->ai_family);

   if (debug > 1) {
     fprintf(where,"netperf: send_tcp_tran_rr: requesting TCP_TRR test\n");
   }

   send_request();

   /* The response from the remote will contain all of the relevant 	*/
   /* socket parameters for this test type. We will put them back into 	*/
   /* the variables here so they can be displayed if desired.  The	*/
   /* remote will have calibrated CPU if necessary, and will have done	*/
   /* all the needed set-up we will have calibrated the cpu locally	*/
   /* before sending the request, and will grab the counter value right	*/
   /* after the connect returns. The remote will grab the counter right	*/
   /* after the accept call. This saves the hassle of extra messages	*/
   /* being sent for the TCP tests.					*/

   recv_response();

   if (!netperf_response.content.serv_errno) {
     rsr_size	=	tcp_tran_rr_response->recv_buf_size;
     rss_size	=	tcp_tran_rr_response->send_buf_size;
     rem_nodelay	=	tcp_tran_rr_response->no_delay;
     remote_cpu_usage=	tcp_tran_rr_response->measure_cpu;
     remote_cpu_rate = 	tcp_tran_rr_response->cpu_rate;
     /* make sure that port numbers are in network order */
     server.sin_port	=	tcp_tran_rr_response->data_port_number;
     server.sin_port =	htons(server.sin_port);
     if (debug) {
       fprintf(where,"remote listen done.\n");
       fprintf(where,"remote port is %d\n",ntohs(server.sin_port));
       fflush(where);
     }
   }
   else {
     Set_errno(netperf_response.content.serv_errno);
     fprintf(where,
 	    "netperf: remote error %d",
 	    netperf_response.content.serv_errno);
     perror("");
     fflush(where);
     exit(1);
   }

   /* pick a nice random spot between client_port_min and */
   /* client_port_max for our initial port number. if they are the */
   /* same, then just set to _min */
   if (client_port_max - client_port_min) {
     srand(getpid());
     myport = client_port_min +
       (rand() % (client_port_max - client_port_min));
   }
   else {
     myport = client_port_min;
   }

   /* there will be a ++ before the first call to bind, so subtract one */
   myport--;
   myaddr->sin_port = htons((unsigned short)myport);

   /* Set-up the test end conditions. For a request/response test, they */
   /* can be either time or transaction based. */

   if (test_time) {
     /* The user wanted to end the test after a period of time. */
     times_up = 0;
     trans_remaining = 0;
     start_timer(test_time);
   }
   else {
     /* The tester wanted to send a number of bytes. */
     trans_remaining = test_bytes;
     times_up = 1;
   }

   /* The cpu_start routine will grab the current time and possibly */
   /* value of the idle counter for later use in measuring cpu */
   /* utilization and/or service demand and thruput. */

   cpu_start(local_cpu_usage);

   /* We use an "OR" to control test execution. When the test is */
   /* controlled by time, the byte count check will always return false. */
   /* When the test is controlled by byte count, the time test will */
   /* always return false. When the test is finished, the whole */
   /* expression will go false and we will stop sending data. I think I */
   /* just arbitrarily decrement trans_remaining for the timed test, but */
   /* will not do that just yet... One other question is whether or not */
   /* the send buffer and the receive buffer should be the same buffer. */

   while ((!times_up) || (trans_remaining > 0)) {

 #ifdef WANT_HISTOGRAM
     if (verbosity > 1) {
       /* timestamp just before our call to create the socket, and then */
       /* again just after the receive raj 3/95 */
       HIST_timestamp(&time_one);
     }
 #endif /* WANT_HISTOGRAM */

     /* set up the data socket - is this really necessary or can I just */
     /* re-use the same socket and move this call out of the while loop. */
     /* it does introduce a *boatload* of system calls. I guess that it */
     /* all depends on "reality of programming." keeping it this way is */
     /* a bit more conservative I imagine - raj 3/95 */
     send_socket = create_data_socket(local_res);

     if (send_socket == INVALID_SOCKET) {
       perror("netperf: send_tcp_tran_rr: tcp stream data socket");
       exit(1);
     }

     /* we set SO_REUSEADDR on the premise that no unreserved port */
     /* number on the local system is going to be already connected to */
     /* the remote netserver's port number. One thing that I might */
     /* try later is to have the remote actually allocate a couple of */
     /* port numbers and cycle through those as well. depends on if we */
     /* can get through all the unreserved port numbers in less than */
     /* the length of the TIME_WAIT state raj 8/94 */
     one = 1;
     if(setsockopt(send_socket, SOL_SOCKET, SO_REUSEADDR,
 		  (char *)&one, sock_opt_len) == SOCKET_ERROR) {
       perror("netperf: send_tcp_tran_rr: so_reuseaddr");
       exit(1);
     }

 newport:
     /* pick a new port number */
     myport = ntohs(myaddr->sin_port);
     myport++;

     /* we do not want to use the port number that the server is */
     /* sitting at - this would cause us to fail in a loopback test. we */
     /* could just rely on the failure of the bind to get us past this, */
     /* but I'm guessing that in this one case at least, it is much */
     /* faster, given that we *know* that port number is already in use */
     /* (or rather would be in a loopback test) */

     if (myport == ntohs(server.sin_port)) myport++;

     /* wrap the port number when we get to 65535. NOTE, some broken */
     /* TCP's might treat the port number as a signed 16 bit quantity. */
     /* we aren't interested in testing such broken implementations :) */
     /* raj 8/94  */
     if (myport >= client_port_max) {
       myport = client_port_min;
     }
     myaddr->sin_port = htons((unsigned short)myport);

     if (debug) {
       if ((nummessages % 100) == 0) {
 	printf("port %d\n",myport);
       }
     }

     /* we want to bind our socket to a particular port number. */
     if (bind(send_socket,
 	     (struct sockaddr *)myaddr,
 	     sizeof(struct sockaddr_storage)) == SOCKET_ERROR) {
       /* if the bind failed, someone else must have that port number */
       /* - perhaps in the listen state. since we can't use it, skip to */
       /* the next port number. we may have to do this again later, but */
       /* that's just too bad :) */
       if (debug > 1) {
 	fprintf(where,
 		"send_tcp_tran_rr: tried to bind to port %d errno %d\n",
 		ntohs(myaddr->sin_port),
 		errno);
 	fflush(where);
       }
 	/* yes, goto's are supposed to be evil, but they do have their */
 	/* uses from time to time. the real world doesn't always have */
 	/* to code to get the A in CS 101 :) raj 3/95 */
 	goto newport;
     }

     /* Connect up to the remote port on the data socket. Since this is */
     /* a test for RFC_1644-style transactional TCP, we can use the */
     /* sendto() call instead of calling connect and then send() */

     /* send the request */
     if((len=sendto(send_socket,
 		   send_ring->buffer_ptr,
 		   req_size,
 		   MSG_EOF,
 		   (struct sockaddr *)&server,
 		   sizeof(server))) != req_size) {
       if (SOCKET_EINTR(len))
 	  {
 	    /* we hit the end of a */
 	    /* timed test. */
 	    timed_out = 1;
 	    break;
       }
       perror("send_tcp_tran_rr: data send error");
       exit(1);
     }
     send_ring = send_ring->next;

     /* receive the response */
     rsp_bytes_left = rsp_size;
     temp_message_ptr  = recv_ring->buffer_ptr;
     while(rsp_bytes_left > 0) {
       if((rsp_bytes_recvd=recv(send_socket,
 			       temp_message_ptr,
 			       rsp_bytes_left,
 			       0)) == SOCKET_ERROR) {
 	    if (SOCKET_EINTR(rsp_bytes_recvd))
 		{
 	      /* We hit the end of a timed test. */
 	      timed_out = 1;
 	      break;
 		}
 	    perror("send_tcp_tran_rr: data recv error");
 	    exit(1);
       }
       rsp_bytes_left -= rsp_bytes_recvd;
       temp_message_ptr  += rsp_bytes_recvd;
     }
     recv_ring = recv_ring->next;

     if (timed_out) {
       /* we may have been in a nested while loop - we need */
       /* another call to break. */
       break;
     }

     close(send_socket);

 #ifdef WANT_HISTOGRAM
     if (verbosity > 1) {
       HIST_timestamp(&time_two);
       HIST_add(time_hist,delta_micro(&time_one,&time_two));
     }
 #endif /* WANT_HISTOGRAM */

     nummessages++;
     if (trans_remaining) {
       trans_remaining--;
     }

     if (debug > 3) {
       fprintf(where,
 	      "Transaction %d completed on local port %d\n",
 	      nummessages,
 	      ntohs(myaddr->sin_port));
       fflush(where);
     }


   }

   /* this call will always give us the elapsed time for the test, and */
   /* will also store-away the necessaries for cpu utilization */

   cpu_stop(local_cpu_usage,&elapsed_time);	/* was cpu being measured? */
   /* how long did we really run? */

   /* Get the statistics from the remote end. The remote will have */
   /* calculated service demand and all those interesting things. If it */
   /* wasn't supposed to care, it will return obvious values. */

   recv_response();
   if (!netperf_response.content.serv_errno) {
     if (debug)
       fprintf(where,"remote results obtained\n");
   }
   else {
     Set_errno(netperf_response.content.serv_errno);
     fprintf(where,
 	    "netperf: remote error %d",
 	    netperf_response.content.serv_errno);
     perror("");
     fflush(where);
     exit(1);
   }

   /* We now calculate what our thruput was for the test. In the future, */
   /* we may want to include a calculation of the thruput measured by */
   /* the remote, but it should be the case that for a TCP stream test, */
   /* that the two numbers should be *very* close... We calculate */
   /* bytes_sent regardless of the way the test length was controlled. */
   /* If it was time, we needed to, and if it was by bytes, the user may */
   /* have specified a number of bytes that wasn't a multiple of the */
   /* send_size, so we really didn't send what he asked for ;-) We use */
   /* Kbytes/s as the units of thruput for a TCP stream test, where K = */
   /* 1024. A future enhancement *might* be to choose from a couple of */
   /* unit selections. */

   bytes_xferd	= (req_size * nummessages) + (rsp_size * nummessages);
   thruput	= calc_thruput(bytes_xferd);

   if (local_cpu_usage || remote_cpu_usage) {
     /* We must now do a little math for service demand and cpu */
     /* utilization for the system(s) */
     /* Of course, some of the information might be bogus because */
     /* there was no idle counter in the kernel(s). We need to make */
     /* a note of this for the user's benefit...*/
     if (local_cpu_usage) {
       if (local_cpu_rate == 0.0) {
 	fprintf(where,"WARNING WARNING WARNING  WARNING WARNING WARNING  WARNING!\n");
 	fprintf(where,"Local CPU usage numbers based on process information only!\n");
 	fflush(where);
       }
       local_cpu_utilization = calc_cpu_util(0.0);
       /* since calc_service demand is doing ms/Kunit we will */
       /* multiply the number of transaction by 1024 to get */
       /* "good" numbers */
       local_service_demand  = calc_service_demand((double) nummessages*1024,
 						  0.0,
 						  0.0,
 						  0);
     }
     else {
       local_cpu_utilization	= (float) -1.0;
       local_service_demand	= (float) -1.0;
     }

     if (remote_cpu_usage) {
       if (remote_cpu_rate == 0.0) {
 	fprintf(where,"DANGER  DANGER  DANGER    DANGER  DANGER  DANGER    DANGER!\n");
 	fprintf(where,"Remote CPU usage numbers based on process information only!\n");
 	fflush(where);
       }
       remote_cpu_utilization = tcp_tran_rr_result->cpu_util;
       /* since calc_service demand is doing ms/Kunit we will */
       /* multiply the number of transaction by 1024 to get */
       /* "good" numbers */
       remote_service_demand = calc_service_demand((double) nummessages*1024,
 						  0.0,
 						  remote_cpu_utilization,
 						  tcp_tran_rr_result->num_cpus);
     }
     else {
       remote_cpu_utilization = (float) -1.0;
       remote_service_demand  = (float) -1.0;
     }

     /* We are now ready to print all the information. If the user */
     /* has specified zero-level verbosity, we will just print the */
     /* local service demand, or the remote service demand. If the */
     /* user has requested verbosity level 1, he will get the basic */
     /* "streamperf" numbers. If the user has specified a verbosity */
     /* of greater than 1, we will display a veritable plethora of */
     /* background information from outside of this block as it it */
     /* not cpu_measurement specific...  */

     switch (verbosity) {
     case 0:
       if (local_cpu_usage) {
 	fprintf(where,
 		cpu_fmt_0,
 		local_service_demand);
       }
       else {
 	fprintf(where,
 		cpu_fmt_0,
 		remote_service_demand);
       }
       break;
     case 1:
     case 2:

       if (print_headers) {
 	fprintf(where,
 		cpu_title,
 		local_cpu_method,
 		remote_cpu_method);
       }

       fprintf(where,
 	      cpu_fmt_1_line_1,		/* the format string */
 	      lss_size,		/* local sendbuf size */
 	      lsr_size,
 	      req_size,		/* how large were the requests */
 	      rsp_size,		/* guess */
 	      elapsed_time,		/* how long was the test */
 	      nummessages/elapsed_time,
 	      local_cpu_utilization,	/* local cpu */
 	      remote_cpu_utilization,	/* remote cpu */
 	      local_service_demand,	/* local service demand */
 	      remote_service_demand);	/* remote service demand */
       fprintf(where,
 	      cpu_fmt_1_line_2,
 	      rss_size,
 	      rsr_size);
       break;
     }
   }
   else {
     /* The tester did not wish to measure service demand. */
     switch (verbosity) {
     case 0:
       fprintf(where,
 	      tput_fmt_0,
 	      nummessages/elapsed_time);
       break;
     case 1:
     case 2:
       if (print_headers) {
 	fprintf(where,tput_title,format_units());
       }

       fprintf(where,
 	      tput_fmt_1_line_1,	/* the format string */
 	      lss_size,
 	      lsr_size,
 	      req_size,		/* how large were the requests */
 	      rsp_size,		/* how large were the responses */
 	      elapsed_time, 		/* how long did it take */
 	      nummessages/elapsed_time);
       fprintf(where,
 	      tput_fmt_1_line_2,
 	      rss_size, 		/* remote recvbuf size */
 	      rsr_size);

       break;
     }
   }

   /* it would be a good thing to include information about some of the */
   /* other parameters that may have been set for this test, but at the */
   /* moment, I do not wish to figure-out all the  formatting, so I will */
   /* just put this comment here to help remind me that it is something */
   /* that should be done at a later time. */

   if (verbosity > 1) {
     /* The user wanted to know it all, so we will give it to him. */
     /* This information will include as much as we can find about */
     /* TCP statistics, the alignments of the sends and receives */
     /* and all that sort of rot... */

     fprintf(where,
 	    ksink_fmt,
 	    local_send_align,
 	    remote_recv_offset,
 	    local_send_offset,
 	    remote_recv_offset);

 #ifdef WANT_HISTOGRAM
     fprintf(where,"\nHistogram of request/response times\n");
     fflush(where);
     HIST_report(time_hist);
 #endif /* WANT_HISTOGRAM */

   }

 }


 /* recv_tcp_tran_rr() is the netserver (receiving) side of the TCP_TRR */
 /* test. It reads its instructions from the global netperf_request, */
 /* creates and binds a listen socket on the requested port, sets */
 /* TCP_NOPUSH on it, and reports the resulting socket parameters to */
 /* the initiator via the global netperf_response. It then loops: */
 /* accept a connection, receive request_size bytes, answer with */
 /* response_size bytes using sendto() with MSG_EOF, and close the */
 /* connection. The loop ends when the test timer pops, when the */
 /* requested number of transactions has been served, or when the */
 /* remote closes a connection before a full request has arrived. */
 /* Finally the transaction count, elapsed time and (optionally) cpu */
 /* utilization are sent back to the initiator. */
 /* */
 /* Any failure while setting-up the listen socket is reported to the */
 /* initiator through serv_errno and the process exits. On normal */
 /* completion the routine returns 0. */
 int
 recv_tcp_tran_rr()
 {

   char  *message;
   struct sockaddr_in myaddr_in, peeraddr_in;
   SOCKET s_listen, s_data;
   netperf_socklen_t addrlen;
   int   NoPush = 1;
   int   saved_errno;

   char  *recv_message_ptr;
   char  *send_message_ptr;
   char  *temp_message_ptr;
   int   trans_received;
   int   trans_remaining;
   int   bytes_sent;
   int   request_bytes_recvd;
   int   request_bytes_remaining;
   int   timed_out = 0;
   int   peer_closed = 0;
   float elapsed_time;

   struct tcp_tran_rr_request_struct  *tcp_tran_rr_request;
   struct tcp_tran_rr_response_struct *tcp_tran_rr_response;
   struct tcp_tran_rr_results_struct  *tcp_tran_rr_results;

   /* the request, the response and the results all live in the */
   /* test_specific_data area of the control messages */
   tcp_tran_rr_request =
     (struct tcp_tran_rr_request_struct *)netperf_request.content.test_specific_data;
   tcp_tran_rr_response =
     (struct tcp_tran_rr_response_struct *)netperf_response.content.test_specific_data;
   tcp_tran_rr_results =
     (struct tcp_tran_rr_results_struct *)netperf_response.content.test_specific_data;

   if (debug) {
     fprintf(where,"netserver: recv_tcp_tran_rr: entered...\n");
     fflush(where);
   }

   /* We want to set-up the listen socket with all the desired */
   /* parameters and then let the initiator know that all is ready. If */
   /* socket size defaults are to be used, then the initiator will have */
   /* sent us 0's. If the socket sizes cannot be changed, then we will */
   /* send-back what they are. If that information cannot be determined, */
   /* then we send-back -1's for the sizes. If things go wrong for any */
   /* reason, we will drop back ten yards and punt. */

   /* If anything goes wrong, we want the remote to know about it. It */
   /* would be best if the error that the remote reports to the user is */
   /* the actual error we encountered, rather than some bogus unexpected */
   /* response type message. */

   if (debug) {
     fprintf(where,"recv_tcp_tran_rr: setting the response type...\n");
     fflush(where);
   }

   netperf_response.content.response_type = TCP_TRR_RESPONSE;

   if (debug) {
     fprintf(where,"recv_tcp_tran_rr: the response type is set...\n");
     fflush(where);
   }

   /* set-up the data buffer with the requested alignment and offset */
   message = (char *)malloc(DATABUFFERLEN);
   if (message == NULL) {
     printf("malloc(%d) failed!\n", DATABUFFERLEN);
     exit(1);
   }

   /* We now alter the message_ptr variables to be at the desired */
   /* alignments with the desired offsets. */

   if (debug) {
     fprintf(where,
             "recv_tcp_tran_rr: requested recv alignment of %d offset %d\n",
             tcp_tran_rr_request->recv_alignment,
             tcp_tran_rr_request->recv_offset);
     fprintf(where,
             "recv_tcp_tran_rr: requested send alignment of %d offset %d\n",
             tcp_tran_rr_request->send_alignment,
             tcp_tran_rr_request->send_offset);
     fflush(where);
   }

   /* both pointers are carved out of the one "message" allocation */
   recv_message_ptr = ALIGN_BUFFER(message, tcp_tran_rr_request->recv_alignment, tcp_tran_rr_request->recv_offset);

   send_message_ptr = ALIGN_BUFFER(message, tcp_tran_rr_request->send_alignment, tcp_tran_rr_request->send_offset);

   if (debug) {
     fprintf(where,"recv_tcp_tran_rr: receive alignment and offset set...\n");
     fflush(where);
   }

   /* Let's clear-out our sockaddr for the sake of cleanliness. Then we */
   /* can put in OUR values !-) At some point, we may want to nail this */
   /* socket to a particular network-level address, but for now, */
   /* INADDR_ANY should be just fine. */

   bzero((char *)&myaddr_in,
         sizeof(myaddr_in));
   myaddr_in.sin_family      = AF_INET;
   myaddr_in.sin_addr.s_addr = INADDR_ANY;
   myaddr_in.sin_port        = htons((unsigned short)tcp_tran_rr_request->port);

   /* Grab a socket to listen on, and then listen on it. */

   if (debug) {
     fprintf(where,"recv_tcp_tran_rr: grabbing a socket...\n");
     fflush(where);
   }

   /* create_data_socket expects to find some things in the global */
   /* variables, so set the globals based on the values in the request. */
   /* once the socket has been created, we will set the response values */
   /* based on the updated value of those globals. raj 7/94 */
   lss_size_req = tcp_tran_rr_request->send_buf_size;
   lsr_size_req = tcp_tran_rr_request->recv_buf_size;
   loc_nodelay = tcp_tran_rr_request->no_delay;
   loc_rcvavoid = tcp_tran_rr_request->so_rcvavoid;
   loc_sndavoid = tcp_tran_rr_request->so_sndavoid;

   set_hostname_and_port(local_name,
                         port_buffer,
                         nf_to_af(tcp_tran_rr_request->ipfamily),
                         tcp_tran_rr_request->port);

   local_res = complete_addrinfo(local_name,
                                 local_name,
                                 port_buffer,
                                 nf_to_af(tcp_tran_rr_request->ipfamily),
                                 SOCK_STREAM,
                                 IPPROTO_TCP,
                                 0);

   s_listen = create_data_socket(local_res);

   if (s_listen == INVALID_SOCKET) {
     netperf_response.content.serv_errno = errno;
     send_response();
     if (debug) {
       fprintf(where,"could not create data socket\n");
       fflush(where);
     }
     exit(1);
   }

 #ifdef WIN32
   /* The test timer can fire during operations on the listening socket,
      so to make the start_timer below work we have to move
      it to close s_listen while we are blocked on accept. */
   win_kludge_socket2 = s_listen;
 #endif


   /* Let's get an address assigned to this socket so we can tell the */
   /* initiator how to reach the data socket. There may be a desire to */
   /* nail this socket to a specific IP address in a multi-homed, */
   /* multi-connection situation, but for now, we'll ignore the issue */
   /* and concentrate on single connection testing. */

   if (bind(s_listen,
            (struct sockaddr *)&myaddr_in,
            sizeof(myaddr_in)) == SOCKET_ERROR) {
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();
     if (debug) {
       fprintf(where,"could not bind\n");
       fflush(where);
     }
     exit(1);
   }

   /* we want to disable the implicit PUSH on all sends. at some point, */
   /* this might want to be a parm to the test raj 3/95 */
   if (setsockopt(s_listen,
                  IPPROTO_TCP,
                  TCP_NOPUSH,
                  (const char *)&NoPush,
                  sizeof(int)) == SOCKET_ERROR) {
     /* grab errno before calling anything else - the stdio calls */
     /* below are allowed to change it */
     saved_errno = errno;
     fprintf(where,
             "recv_tcp_tran_rr: could not set TCP_NOPUSH errno %d\n",
             saved_errno);
     fflush(where);
     netperf_response.content.serv_errno = saved_errno;
     close(s_listen);
     send_response();
     /* the listen socket is closed and the initiator has been told */
     /* about the failure, so there is nothing left to do here. */
     /* carrying on would only listen() on a closed socket and send a */
     /* second, unexpected, error response. */
     exit(1);
   }

   /* Now, let's set-up the socket to listen for connections */
   if (listen(s_listen, 5) == SOCKET_ERROR) {
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();
     if (debug) {
       fprintf(where,"could not listen\n");
       fflush(where);
     }
     exit(1);
   }

   /* now get the port number assigned by the system  */
   addrlen = sizeof(myaddr_in);
   if (getsockname(s_listen,
                   (struct sockaddr *)&myaddr_in,
                   &addrlen) == SOCKET_ERROR){
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();
     if (debug) {
       fprintf(where,"could not geetsockname\n");
       fflush(where);
     }
     exit(1);
   }

   /* Now myaddr_in contains the port and the internet address this is */
   /* returned to the sender also implicitly telling the sender that the */
   /* socket buffer sizing has been done. */

   tcp_tran_rr_response->data_port_number = (int) ntohs(myaddr_in.sin_port);
   if (debug) {
     fprintf(where,"telling the remote to call me at %d\n",
             tcp_tran_rr_response->data_port_number);
     fflush(where);
   }
   netperf_response.content.serv_errno   = 0;

   /* But wait, there's more. If the initiator wanted cpu measurements, */
   /* then we must call the calibrate routine, which will return the max */
   /* rate back to the initiator. If the CPU was not to be measured, or */
   /* something went wrong with the calibration, we will return a 0.0 to */
   /* the initiator. */

   tcp_tran_rr_response->cpu_rate = 0.0;  /* assume no cpu */
   if (tcp_tran_rr_request->measure_cpu) {
     tcp_tran_rr_response->measure_cpu = 1;
     tcp_tran_rr_response->cpu_rate =
       calibrate_local_cpu(tcp_tran_rr_request->cpu_rate);
   }


   /* before we send the response back to the initiator, pull some of */
   /* the socket parms from the globals */
   tcp_tran_rr_response->send_buf_size = lss_size;
   tcp_tran_rr_response->recv_buf_size = lsr_size;
   tcp_tran_rr_response->no_delay = loc_nodelay;
   tcp_tran_rr_response->so_rcvavoid = loc_rcvavoid;
   tcp_tran_rr_response->so_sndavoid = loc_sndavoid;

   send_response();

   /* Now it's time to start receiving data on the connection. We will */
   /* first grab the appropriate counters and then start grabbing. */

   cpu_start(tcp_tran_rr_request->measure_cpu);

   /* A positive test_length is a run time in seconds; otherwise its */
   /* negation is the number of transactions to serve. In the timed */
   /* case we run PAD_TIME longer than the initiator asked for. */

   if (tcp_tran_rr_request->test_length > 0) {
     times_up = 0;
     trans_remaining = 0;
     start_timer(tcp_tran_rr_request->test_length + PAD_TIME);
   }
   else {
     times_up = 1;
     trans_remaining = tcp_tran_rr_request->test_length * -1;
   }

   trans_received = 0;

   while ((!times_up) || (trans_remaining > 0)) {

     /* addrlen is a value-result parameter - accept() overwrites it */
     /* with the size of the address it stored, so it has to be reset */
     /* to the size of our buffer before every call. */
     addrlen = sizeof(peeraddr_in);

     /* accept a connection from the remote */
     if ((s_data=accept(s_listen,
                        (struct sockaddr *)&peeraddr_in,
                        &addrlen)) == INVALID_SOCKET) {
       if (errno == EINTR) {
         /* the timer popped */
         timed_out = 1;
         break;
       }
       fprintf(where,"recv_tcp_tran_rr: accept: errno = %d\n",errno);
       fflush(where);
       close(s_listen);

       exit(1);
     }

     if (debug) {
       fprintf(where,"recv_tcp_tran_rr: accepted data connection.\n");
       fflush(where);
     }

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR with the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
   win_kludge_socket = s_data;
 #endif /* WIN32 */

 #ifdef KLUDGE_SOCKET_OPTIONS
   /* this is for those systems which *INCORRECTLY* fail to pass */
   /* attributes across an accept() call. Including this goes against */
   /* my better judgement :( raj 11/95 */

   kludge_socket_options(s_data);

 #endif /* KLUDGE_SOCKET_OPTIONS */

     temp_message_ptr        = recv_message_ptr;
     request_bytes_remaining = tcp_tran_rr_request->request_size;

     /* receive the request from the other side. we can just receive */
     /* until we get zero bytes, but that would be a slight structure */
     /* change in the code, with minimal performance effects. If */
     /* however, I had variable-length messages, I would want to do */
     /* this to avoid needing "double reads" - one for the message */
     /* length, and one for the rest of the message raj 3/95 */
     while(request_bytes_remaining > 0) {
       request_bytes_recvd = recv(s_data,
                                  temp_message_ptr,
                                  request_bytes_remaining,
                                  0);
       if (request_bytes_recvd == SOCKET_ERROR) {
         if ( SOCKET_EINTR(request_bytes_recvd) ) {
           /* the timer popped */
           timed_out = 1;
           break;
         }
         netperf_response.content.serv_errno = errno;
         send_response();
         exit(1);
       }
       if (request_bytes_recvd == 0) {
         /* a length of zero means the sender has shut the connection */
         /* down. no more data will ever arrive on it, so looping */
         /* again would just spin forever. */
         peer_closed = 1;
         break;
       }
       request_bytes_remaining -= request_bytes_recvd;
       temp_message_ptr        += request_bytes_recvd;
     }

     if (timed_out) {
       /* we hit the end of the test based on time - lets */
       /* bail out of here now... */
       fprintf(where,"yo5\n");
       fflush(where);
       break;
     }

     if (peer_closed) {
       /* the sender went away in the middle of a request. there is */
       /* nobody to answer, so drop the connection and finish the */
       /* test with the transactions completed so far. */
       if (debug) {
         fprintf(where,
                 "recv_tcp_tran_rr: remote closed the connection early\n");
         fflush(where);
       }
       close(s_data);
       break;
     }

     /* Now, send the response to the remote we can use sendto here to */
     /* help remind people that this is an rfc 1644 style of test. the */
     /* address length is the one accept() reported for peeraddr_in - */
     /* peeraddr_in is a sockaddr_in, so claiming it to be the size of */
     /* a sockaddr_storage would describe memory past its end. */
     if((bytes_sent=sendto(s_data,
                           send_message_ptr,
                           tcp_tran_rr_request->response_size,
                           MSG_EOF,
                           (struct sockaddr *)&peeraddr_in,
                           addrlen)) == SOCKET_ERROR) {
       if (SOCKET_EINTR(bytes_sent)) {
         /* the test timer has popped */
         timed_out = 1;
         fprintf(where,"yo6\n");
         fflush(where);
         break;
       }
       netperf_response.content.serv_errno = 99;
       send_response();
       exit(1);
     }

     trans_received++;
     if (trans_remaining) {
       trans_remaining--;
     }

     if (debug) {
       fprintf(where,
               "recv_tcp_tran_rr: Transaction %d complete\n",
               trans_received);
       fflush(where);
     }

     /* close the connection. since we have disabled PUSH on sends, the */
     /* FIN should be tacked-onto our last send instead of being */
     /* standalone */
     close(s_data);

   }


   /* The loop now exits due to timeout, transaction count being */
   /* reached, or the remote closing a connection early */

   cpu_stop(tcp_tran_rr_request->measure_cpu,&elapsed_time);

   if (timed_out) {
     /* we ended the test by time, which was PAD_TIME seconds longer */
     /* than the initiator wanted to run. so, we want to subtract */
     /* PAD_TIME from the elapsed_time. */
     elapsed_time -= PAD_TIME;
   }
   /* send the results to the sender */

   if (debug) {
     fprintf(where,
             "recv_tcp_tran_rr: got %d transactions\n",
             trans_received);
     fflush(where);
   }

   tcp_tran_rr_results->bytes_received = (trans_received *
                                          (tcp_tran_rr_request->request_size +
                                           tcp_tran_rr_request->response_size));
   tcp_tran_rr_results->trans_received = trans_received;
   tcp_tran_rr_results->elapsed_time   = elapsed_time;
   if (tcp_tran_rr_request->measure_cpu) {
     tcp_tran_rr_results->cpu_util = calc_cpu_util(elapsed_time);
   }

   if (debug) {
     fprintf(where,
             "recv_tcp_tran_rr: test complete, sending results.\n");
     fflush(where);
   }

   send_response();

   /* the routine is declared int, so hand back a defined value */
   return 0;

 }
 #endif /* DO_1644 */

 #ifdef DO_NBRR
  /* this routine implements the sending (netperf) side of the TCP_RR */
  /* test using POSIX-style non-blocking sockets. remote_host is the */
  /* name of the system on which the remote side of the test runs. */
  /* for each confidence iteration the routine creates a data socket, */
  /* sends a DO_TCP_NBRR request over the control connection, connects */
  /* to the data port named in the response, marks the socket */
  /* non-blocking and then exchanges req_size byte requests for */
  /* rsp_size byte responses until either the test timer expires or */
  /* the requested number of transactions has completed. the results */
  /* are written to "where" in a format selected by verbosity. any */
  /* failure is reported and the process exits with status 1. */

 void
 send_tcp_nbrr(char remote_host[])
 {

   char *tput_title = "\
 Local /Remote\n\
 Socket Size   Request  Resp.   Elapsed  Trans.\n\
 Send   Recv   Size     Size    Time     Rate         \n\
 bytes  Bytes  bytes    bytes   secs.    per sec   \n\n";

   char *tput_fmt_0 =
     "%7.2f\n";

   char *tput_fmt_1_line_1 = "\
 %-6d %-6d %-6d   %-6d  %-6.2f   %7.2f   \n";
   char *tput_fmt_1_line_2 = "\
 %-6d %-6d\n";

   char *cpu_title = "\
 Local /Remote\n\
 Socket Size   Request Resp.  Elapsed Trans.   CPU    CPU    S.dem   S.dem\n\
 Send   Recv   Size    Size   Time    Rate     local  remote local   remote\n\
 bytes  bytes  bytes   bytes  secs.   per sec  %% %c    %% %c    us/Tr   us/Tr\n\n";

   char *cpu_fmt_0 =
     "%6.3f %c\n";

   char *cpu_fmt_1_line_1 = "\
 %-6d %-6d %-6d  %-6d %-6.2f  %-6.2f  %-6.2f %-6.2f %-6.3f  %-6.3f\n";

   char *cpu_fmt_1_line_2 = "\
 %-6d %-6d\n";

   char *ksink_fmt = "\
 Alignment      Offset\n\
 Local  Remote  Local  Remote\n\
 Send   Recv    Send   Recv\n\
 %5d  %5d   %5d  %5d\n";


   int			timed_out = 0;
   float			elapsed_time;

   int	len;
   char	*temp_message_ptr;
   int	nummessages;
   SOCKET	send_socket;
   int	trans_remaining;
   double	bytes_xferd;

   struct ring_elt *send_ring;
   struct ring_elt *recv_ring;

   int	rsp_bytes_left;
   int	rsp_bytes_recvd;

   float	local_cpu_utilization;
   float	local_service_demand;
   float	remote_cpu_utilization;
   float	remote_service_demand;
   double	thruput;

   /* the request, the setup response and the final results all live */
   /* in the test_specific_data area of the control messages. note */
   /* that the response and the result overlay the same storage. */
   struct	tcp_rr_request_struct	*tcp_rr_request;
   struct	tcp_rr_response_struct	*tcp_rr_response;
   struct	tcp_rr_results_struct	*tcp_rr_result;

   struct addrinfo *remote_res;
   struct addrinfo *local_res;

   tcp_rr_request =
     (struct tcp_rr_request_struct *)netperf_request.content.test_specific_data;
   tcp_rr_response=
     (struct tcp_rr_response_struct *)netperf_response.content.test_specific_data;
   tcp_rr_result	=
     (struct tcp_rr_results_struct *)netperf_response.content.test_specific_data;

 #ifdef WANT_HISTOGRAM
   if (verbosity > 1) {
     time_hist = HIST_new();
   }
 #endif /* WANT_HISTOGRAM */

   /* since we are now disconnected from the code that established the */
   /* control socket, and since we want to be able to use different */
   /* protocols and such, we are passed the name of the remote host and */
   /* must turn that into the test specific addressing information. */

   complete_addrinfos(&remote_res,
 		     &local_res,
 		     remote_host,
 		     SOCK_STREAM,
 		     IPPROTO_TCP,
 		     0);

   if ( print_headers ) {
     print_top_test_header("TCP Non-Blocking REQUEST/RESPONSE TEST",local_res,remote_res);
   }

   /* initialize a few counters */

   send_ring = NULL;
   recv_ring = NULL;
   confidence_iteration = 1;
   init_stat();

   /* we have a great-big while loop which controls the number of times */
   /* we run a particular test. this is for the calculation of a */
   /* confidence interval (I really should have stayed awake during */
   /* probstats :). If the user did not request confidence measurement */
   /* (no confidence is the default) then we will only go though the */
   /* loop once. the confidence stuff originates from the folks at IBM */

   while (((confidence < 0) && (confidence_iteration < iteration_max)) ||
 	 (confidence_iteration <= iteration_min)) {

     /* initialize a few counters. we have to remember that we might be */
     /* going through the loop more than once. */

     nummessages     = 0;
     bytes_xferd     = 0.0;
     times_up        = 0;
     timed_out       = 0;
     trans_remaining = 0;

     /* set-up the data buffers with the requested alignment and offset. */
     /* since this is a request/response test, default the send_width and */
     /* recv_width to 1 and not two raj 7/94 */

     if (send_width == 0) send_width = 1;
     if (recv_width == 0) recv_width = 1;

     /* the rings are allocated once and re-used by later iterations */
     if (send_ring == NULL) {
       send_ring = allocate_buffer_ring(send_width,
 				       req_size,
 				       local_send_align,
 				       local_send_offset);
     }

     if (recv_ring == NULL) {
       recv_ring = allocate_buffer_ring(recv_width,
 				       rsp_size,
 				       local_recv_align,
 				       local_recv_offset);
     }

     /*set up the data socket                        */
     send_socket = create_data_socket(local_res);

     if (send_socket == INVALID_SOCKET){
       perror("netperf: send_tcp_nbrr: tcp stream data socket");
       exit(1);
     }

     if (debug) {
       fprintf(where,"send_tcp_nbrr: send_socket obtained...\n");
     }

     /* If the user has requested cpu utilization measurements, we must */
     /* calibrate the cpu(s). We will perform this task within the tests */
     /* themselves. If the user has specified the cpu rate, then */
     /* calibrate_local_cpu will return rather quickly as it will have */
     /* nothing to do. If local_cpu_rate is zero, then we will go through */
     /* all the "normal" calibration stuff and return the rate back.*/

     if (local_cpu_usage) {
       local_cpu_rate = calibrate_local_cpu(local_cpu_rate);
     }

     /* Tell the remote end to do a listen. The server alters the socket */
     /* paramters on the other side at this point, hence the reason for */
     /* all the values being passed in the setup message. If the user did */
     /* not specify any of the parameters, they will be passed as 0, which */
     /* will indicate to the remote that no changes beyond the system's */
     /* default should be used. Alignment is the exception, it will */
     /* default to 8, which will be no alignment alterations. */

     netperf_request.content.request_type	=	DO_TCP_NBRR;
     tcp_rr_request->recv_buf_size	=	rsr_size_req;
     tcp_rr_request->send_buf_size	=	rss_size_req;
     tcp_rr_request->recv_alignment      =	remote_recv_align;
     tcp_rr_request->recv_offset	        =	remote_recv_offset;
     tcp_rr_request->send_alignment      =	remote_send_align;
     tcp_rr_request->send_offset	        =	remote_send_offset;
     tcp_rr_request->request_size	=	req_size;
     tcp_rr_request->response_size	=	rsp_size;
     tcp_rr_request->no_delay	        =	rem_nodelay;
     tcp_rr_request->measure_cpu	        =	remote_cpu_usage;
     tcp_rr_request->cpu_rate	        =	remote_cpu_rate;
     tcp_rr_request->so_rcvavoid	        =	rem_rcvavoid;
     tcp_rr_request->so_sndavoid	        =	rem_sndavoid;
     /* a positive test_length is a duration, a negative one is a */
     /* transaction count */
     if (test_time) {
       tcp_rr_request->test_length	=	test_time;
     }
     else {
       tcp_rr_request->test_length	=	test_trans * -1;
     }

     if (debug > 1) {
       fprintf(where,"netperf: send_tcp_nbrr: requesting TCP rr test\n");
     }

     send_request();

     /* The response from the remote will contain all of the relevant 	*/
     /* socket parameters for this test type. We will put them back into */
     /* the variables here so they can be displayed if desired.  The	*/
     /* remote will have calibrated CPU if necessary, and will have done	*/
     /* all the needed set-up we will have calibrated the cpu locally	*/
     /* before sending the request, and will grab the counter value right*/
     /* after the connect returns. The remote will grab the counter right*/
     /* after the accept call. This saves the hassle of extra messages	*/
     /* being sent for the TCP tests.					*/

     recv_response();

     if (!netperf_response.content.serv_errno) {
       if (debug) {
 	fprintf(where,"remote listen done.\n");
       }
       rsr_size          = tcp_rr_response->recv_buf_size;
       rss_size          = tcp_rr_response->send_buf_size;
       rem_nodelay       = tcp_rr_response->no_delay;
       remote_cpu_usage  = tcp_rr_response->measure_cpu;
       remote_cpu_rate   = tcp_rr_response->cpu_rate;
       /* aim the data connection at the port on which the remote is */
       /* listening. the port has to be stored in remote_res because */
       /* that is the address handed to connect() below. */
       /* NOTE(review): relies on set_port_number() from netlib doing */
       /* the conversion to network byte order - confirm. */
       set_port_number(remote_res,
 		      (unsigned short)tcp_rr_response->data_port_number);
     }
     else {
       Set_errno(netperf_response.content.serv_errno);
       fprintf(where,
 	      "netperf: remote error %d",
 	      netperf_response.content.serv_errno);
       perror("");
       fflush(where);
       exit(1);
     }

     /*Connect up to the remote port on the data socket  */
     if (connect(send_socket,
 		remote_res->ai_addr,
 		remote_res->ai_addrlen) == INVALID_SOCKET){
       perror("netperf: data socket connect failed");

       exit(1);
     }

     /* now that we are connected, mark the socket as non-blocking */
     if (!set_nonblock(send_socket)) {
       perror("netperf: set_nonblock");
       exit(1);
     }

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR with the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
   win_kludge_socket = send_socket;
 #endif /* WIN32 */

     /* Data Socket set-up is finished. If there were problems, either the */
     /* connect would have failed, or the previous response would have */
     /* indicated a problem. I failed to see the value of the extra */
     /* message after the accept on the remote. If it failed, we'll see it */
     /* here. If it didn't, we might as well start pumping data. */

     /* Set-up the test end conditions. For a request/response test, they */
     /* can be either time or transaction based. */

     if (test_time) {
       /* The user wanted to end the test after a period of time. */
       times_up = 0;
       trans_remaining = 0;
       start_timer(test_time);
     }
     else {
       /* The tester wanted to send a number of bytes. */
       trans_remaining = test_bytes;
       times_up = 1;
     }

     /* The cpu_start routine will grab the current time and possibly */
     /* value of the idle counter for later use in measuring cpu */
     /* utilization and/or service demand and thruput. */

     cpu_start(local_cpu_usage);

 #ifdef WANT_INTERVALS
     INTERVALS_INIT();
 #endif /* WANT_INTERVALS */

     /* We use an "OR" to control test execution. When the test is */
     /* controlled by time, the byte count check will always return false. */
     /* When the test is controlled by byte count, the time test will */
     /* always return false. When the test is finished, the whole */
     /* expression will go false and we will stop sending data. I think I */
     /* just arbitrarily decrement trans_remaining for the timed test, but */
     /* will not do that just yet... One other question is whether or not */
     /* the send buffer and the receive buffer should be the same buffer. */

     while ((!times_up) || (trans_remaining > 0)) {
       /* send the request. we assume that if we use a blocking socket, */
       /* the request will be sent at one shot. */

 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
 	/* timestamp just before our call to send, and then again just */
 	/* after the receive raj 8/94 */
 	HIST_timestamp(&time_one);
       }
 #endif /* WANT_HISTOGRAM */

       /* even though this is a non-blocking socket, we will assume for */
       /* the time being that we will be able to send an entire request */
       /* without getting an EAGAIN */
       if((len=send(send_socket,
 		   send_ring->buffer_ptr,
 		   req_size,
 		   0)) != req_size) {
 	if (SOCKET_EINTR(len)) {
 	  /* we hit the end of a */
 	  /* timed test. */
 	  timed_out = 1;
 	  break;
 	}
 	perror("send_tcp_nbrr: data send error");
 	exit(1);
       }
       send_ring = send_ring->next;

       /* receive the response. since we are using non-blocking I/O, we */
       /* will "spin" on the recvs */
       /* NOTE(review): a recv() return of 0 (connection closed by the */
       /* remote) makes no progress here and is not treated as an */
       /* error, so this loop would keep spinning - confirm whether */
       /* that case needs handling. */
       rsp_bytes_left = rsp_size;
       temp_message_ptr  = recv_ring->buffer_ptr;
       while(rsp_bytes_left > 0) {
 	if((rsp_bytes_recvd=recv(send_socket,
 				 temp_message_ptr,
 				 rsp_bytes_left,
 				 0)) == SOCKET_ERROR) {
 	  if (SOCKET_EINTR(rsp_bytes_recvd))
 	  {
 	    /* We hit the end of a timed test. */
 	    timed_out = 1;
 	    break;
 	  }
 #ifndef WIN32  // But what does WinNT indicate in this situation...
 	  else if (errno == EAGAIN) {
 	    /* nothing has arrived yet - go around again */
 	    Set_errno(0);
 	    continue;
 	  }
 #endif
 	  else {
 	    perror("send_tcp_nbrr: data recv error");
 	    exit(1);
 	  }
 	}
 	rsp_bytes_left -= rsp_bytes_recvd;
 	temp_message_ptr  += rsp_bytes_recvd;
       }
       recv_ring = recv_ring->next;

       if (timed_out) {
 	/* we may have been in a nested while loop - we need */
 	/* another call to break. */
 	break;
       }

 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
 	HIST_timestamp(&time_two);
 	HIST_add(time_hist,delta_micro(&time_one,&time_two));
       }
 #endif /* WANT_HISTOGRAM */
 #ifdef WANT_INTERVALS
       INTERVALS_WAIT();
 #endif /* WANT_INTERVALS */

       nummessages++;
       if (trans_remaining) {
 	trans_remaining--;
       }

       if (debug > 3) {
 	if ((nummessages % 100) == 0) {
 	  fprintf(where,
 		  "Transaction %d completed\n",
 		  nummessages);
 	  fflush(where);
 	}
       }
     }

     /* At this point we used to call shutdown on the data socket to be */
     /* sure all the data was delivered, but this was not germane in a */
     /* request/response test, and it was causing the tests to "hang" when */
     /* they were being controlled by time. So, I have replaced this */
     /* shutdown call with a call to close that can be found later in the */
     /* procedure. */

     /* this call will always give us the elapsed time for the test, and */
     /* will also store-away the necessaries for cpu utilization */

     cpu_stop(local_cpu_usage,&elapsed_time);	/* was cpu being */
 						/* measured? how long */
 						/* did we really run? */

     /* Get the statistics from the remote end. The remote will have */
     /* calculated service demand and all those interesting things. If it */
     /* wasn't supposed to care, it will return obvious values. */

     recv_response();
     if (!netperf_response.content.serv_errno) {
       if (debug) {
 	fprintf(where,"remote results obtained\n");
       }
     }
     else {
       Set_errno(netperf_response.content.serv_errno);
       fprintf(where,
 	      "netperf: remote error %d",
 	      netperf_response.content.serv_errno);
       perror("");
       fflush(where);

       exit(1);
     }

     /* We now calculate what our thruput was for the test. */

     bytes_xferd	= (req_size * nummessages) + (rsp_size * nummessages);
     thruput	= nummessages/elapsed_time;

     if (local_cpu_usage || remote_cpu_usage) {
       /* We must now do a little math for service demand and cpu */
       /* utilization for the system(s) */
       /* Of course, some of the information might be bogus because */
       /* there was no idle counter in the kernel(s). We need to make */
       /* a note of this for the user's benefit...*/
       if (local_cpu_usage) {
 	local_cpu_utilization = calc_cpu_util(0.0);
 	/* since calc_service demand is doing ms/Kunit we will */
 	/* multiply the number of transaction by 1024 to get */
 	/* "good" numbers */
 	local_service_demand  = calc_service_demand((double) nummessages*1024,
 						    0.0,
 						    0.0,
 						    0);
       }
       else {
 	local_cpu_utilization	= (float) -1.0;
 	local_service_demand	= (float) -1.0;
       }

       if (remote_cpu_usage) {
 	remote_cpu_utilization = tcp_rr_result->cpu_util;
 	/* since calc_service demand is doing ms/Kunit we will */
 	/* multiply the number of transaction by 1024 to get */
 	/* "good" numbers */
 	remote_service_demand = calc_service_demand((double) nummessages*1024,
 						    0.0,
 						    remote_cpu_utilization,
 						    tcp_rr_result->num_cpus);
       }
       else {
 	remote_cpu_utilization = (float) -1.0;
 	remote_service_demand  = (float) -1.0;
       }

     }
     else {
       /* we were not measuring cpu, for the confidence stuff, we */
       /* should make it -1.0 */
       local_cpu_utilization	= (float) -1.0;
       local_service_demand	= (float) -1.0;
       remote_cpu_utilization = (float) -1.0;
       remote_service_demand  = (float) -1.0;
     }

     /* at this point, we want to calculate the confidence information. */
     /* if debugging is on, calculate_confidence will print-out the */
     /* parameters we pass it */

     calculate_confidence(confidence_iteration,
 			 elapsed_time,
 			 thruput,
 			 local_cpu_utilization,
 			 remote_cpu_utilization,
 			 local_service_demand,
 			 remote_service_demand);


     confidence_iteration++;

     /* we are now done with the socket, so close it */
     close(send_socket);

   }

   retrieve_confident_values(&elapsed_time,
 			    &thruput,
 			    &local_cpu_utilization,
 			    &remote_cpu_utilization,
 			    &local_service_demand,
 			    &remote_service_demand);

   /* We are now ready to print all the information. If the user */
   /* has specified zero-level verbosity, we will just print the */
   /* local service demand, or the remote service demand. If the */
   /* user has requested verbosity level 1, he will get the basic */
   /* "streamperf" numbers. If the user has specified a verbosity */
   /* of greater than 1, we will display a veritable plethora of */
   /* background information from outside of this block as it it */
   /* not cpu_measurement specific...  */

   if (confidence < 0) {
     /* we did not hit confidence, but were we asked to look for it? */
     if (iteration_max > 1) {
       display_confidence();
     }
   }

   if (local_cpu_usage || remote_cpu_usage) {
     local_cpu_method = format_cpu_method(cpu_method);
     remote_cpu_method = format_cpu_method(tcp_rr_result->cpu_method);

     switch (verbosity) {
     case 0:
       if (local_cpu_usage) {
 	fprintf(where,
 		cpu_fmt_0,
 		local_service_demand,
 		local_cpu_method);
       }
       else {
 	fprintf(where,
 		cpu_fmt_0,
 		remote_service_demand,
 		remote_cpu_method);
       }
       break;
     case 1:
     case 2:
       if (print_headers) {
 	fprintf(where,
 		cpu_title,
 		local_cpu_method,
 		remote_cpu_method);
       }

       fprintf(where,
 	      cpu_fmt_1_line_1,		/* the format string */
 	      lss_size,		/* local sendbuf size */
 	      lsr_size,
 	      req_size,		/* how large were the requests */
 	      rsp_size,		/* guess */
 	      elapsed_time,		/* how long was the test */
 	      thruput,
 	      local_cpu_utilization,	/* local cpu */
 	      remote_cpu_utilization,	/* remote cpu */
 	      local_service_demand,	/* local service demand */
 	      remote_service_demand);	/* remote service demand */
       fprintf(where,
 	      cpu_fmt_1_line_2,
 	      rss_size,
 	      rsr_size);
       break;
     }
   }
   else {
     /* The tester did not wish to measure service demand. */

     switch (verbosity) {
     case 0:
       fprintf(where,
 	      tput_fmt_0,
 	      thruput);
       break;
     case 1:
     case 2:
       if (print_headers) {
 	fprintf(where,tput_title,format_units());
       }

       fprintf(where,
 	      tput_fmt_1_line_1,	/* the format string */
 	      lss_size,
 	      lsr_size,
 	      req_size,		/* how large were the requests */
 	      rsp_size,		/* how large were the responses */
 	      elapsed_time, 		/* how long did it take */
 	      thruput);
       fprintf(where,
 	      tput_fmt_1_line_2,
 	      rss_size, 		/* remote recvbuf size */
 	      rsr_size);

       break;
     }
   }

   /* it would be a good thing to include information about some of the */
   /* other parameters that may have been set for this test, but at the */
   /* moment, I do not wish to figure-out all the  formatting, so I will */
   /* just put this comment here to help remind me that it is something */
   /* that should be done at a later time. */

   /* how to handle the verbose information in the presence of */
   /* confidence intervals is yet to be determined... raj 11/94 */
   if (verbosity > 1) {
     /* The user wanted to know it all, so we will give it to him. */
     /* This information will include as much as we can find about */
     /* TCP statistics, the alignments of the sends and receives */
     /* and all that sort of rot... */

     /* the columns are local/remote alignment and then local/remote */
     /* offset, so the second value is the remote receive alignment */
     fprintf(where,
 	    ksink_fmt,
 	    local_send_align,
 	    remote_recv_align,
 	    local_send_offset,
 	    remote_recv_offset);

 #ifdef WANT_HISTOGRAM
     fprintf(where,"\nHistogram of request/response times\n");
     fflush(where);
     HIST_report(time_hist);
 #endif /* WANT_HISTOGRAM */

   }

 }

  /* this routine implements the receive (netserver) side of a TCP_RR */
  /* test using non-blocking sockets. it takes its parameters from the */
  /* tcp_rr_request held in netperf_request, creates a listen socket, */
  /* reports the data port and socket settings back to the initiator */
  /* with send_response(), accepts the data connection and marks it */
  /* non-blocking. it then receives request_size byte requests and */
  /* answers each with a response_size byte response until the timer */
  /* expires, the requested transaction count is reached or the */
  /* initiator closes the connection. finally the transaction count, */
  /* elapsed time and cpu figures are returned with a second */
  /* send_response(). set-up and I/O failures end the process with */
  /* exit(1), in most cases after reporting serv_errno. */
 void
 recv_tcp_nbrr()
 {

   struct ring_elt *send_ring;
   struct ring_elt *recv_ring;

   struct	sockaddr_in        myaddr_in,
   peeraddr_in;
   SOCKET	s_listen,s_data;
   netperf_socklen_t 	addrlen;
   char	*temp_message_ptr;
   int	trans_received;
   int	trans_remaining;
   int	bytes_sent;
   int	request_bytes_recvd;
   int	request_bytes_remaining;
   int	timed_out = 0;
   int	sock_closed = 0;	/* set when recv() reports end-of-file */
   float	elapsed_time;

   struct addrinfo *local_res;
   char local_name[BUFSIZ];
   char port_buffer[PORTBUFSIZE];

   /* the setup response and the final results overlay the same */
   /* storage in netperf_response */
   struct	tcp_rr_request_struct	*tcp_rr_request;
   struct	tcp_rr_response_struct	*tcp_rr_response;
   struct	tcp_rr_results_struct	*tcp_rr_results;

   tcp_rr_request =
     (struct tcp_rr_request_struct *)netperf_request.content.test_specific_data;
   tcp_rr_response =
     (struct tcp_rr_response_struct *)netperf_response.content.test_specific_data;
   tcp_rr_results =
     (struct tcp_rr_results_struct *)netperf_response.content.test_specific_data;

   if (debug) {
     fprintf(where,"netserver: recv_tcp_nbrr: entered...\n");
     fflush(where);
   }

   /* We want to set-up the listen socket with all the desired */
   /* parameters and then let the initiator know that all is ready. If */
   /* socket size defaults are to be used, then the initiator will have */
   /* sent us 0's. If the socket sizes cannot be changed, then we will */
   /* send-back what they are. If that information cannot be determined, */
   /* then we send-back -1's for the sizes. If things go wrong for any */
   /* reason, we will drop back ten yards and punt. */

   /* If anything goes wrong, we want the remote to know about it. It */
   /* would be best if the error that the remote reports to the user is */
   /* the actual error we encountered, rather than some bogus unexpected */
   /* response type message. */

   if (debug) {
     fprintf(where,"recv_tcp_nbrr: setting the response type...\n");
     fflush(where);
   }

   netperf_response.content.response_type = TCP_RR_RESPONSE;

   if (debug) {
     fprintf(where,"recv_tcp_nbrr: the response type is set...\n");
     fflush(where);
   }

   /* allocate the recv and send rings with the requested alignments */
   /* and offsets. raj 7/94 */
   if (debug) {
     fprintf(where,"recv_tcp_nbrr: requested recv alignment of %d offset %d\n",
 	    tcp_rr_request->recv_alignment,
 	    tcp_rr_request->recv_offset);
     fprintf(where,"recv_tcp_nbrr: requested send alignment of %d offset %d\n",
 	    tcp_rr_request->send_alignment,
 	    tcp_rr_request->send_offset);
     fflush(where);
   }

   /* at some point, these need to come to us from the remote system */
   if (send_width == 0) send_width = 1;
   if (recv_width == 0) recv_width = 1;

   send_ring = allocate_buffer_ring(send_width,
 				   tcp_rr_request->response_size,
 				   tcp_rr_request->send_alignment,
 				   tcp_rr_request->send_offset);

   recv_ring = allocate_buffer_ring(recv_width,
 				   tcp_rr_request->request_size,
 				   tcp_rr_request->recv_alignment,
 				   tcp_rr_request->recv_offset);


   /* Let's clear-out our sockaddr for the sake of cleanlines. Then we */
   /* can put in OUR values !-) At some point, we may want to nail this */
   /* socket to a particular network-level address, but for now, */
   /* INADDR_ANY should be just fine. */

   bzero((char *)&myaddr_in,
 	sizeof(myaddr_in));
   myaddr_in.sin_family      = AF_INET;
   myaddr_in.sin_addr.s_addr = INADDR_ANY;
   myaddr_in.sin_port        = htons((unsigned short)tcp_rr_request->port);

   /* Grab a socket to listen on, and then listen on it. */

   if (debug) {
     fprintf(where,"recv_tcp_nbrr: grabbing a socket...\n");
     fflush(where);
   }

   /* create_data_socket expects to find some things in the global */
   /* variables, so set the globals based on the values in the request. */
   /* once the socket has been created, we will set the response values */
   /* based on the updated value of those globals. raj 7/94 */
   lss_size_req = tcp_rr_request->send_buf_size;
   lsr_size_req = tcp_rr_request->recv_buf_size;
   loc_nodelay = tcp_rr_request->no_delay;
   loc_rcvavoid = tcp_rr_request->so_rcvavoid;
   loc_sndavoid = tcp_rr_request->so_sndavoid;

   set_hostname_and_port(local_name,
 			port_buffer,
 			nf_to_af(tcp_rr_request->ipfamily),
 			tcp_rr_request->port);

   local_res = complete_addrinfo(local_name,
 				local_name,
 				port_buffer,
 				nf_to_af(tcp_rr_request->ipfamily),
 				SOCK_STREAM,
 				IPPROTO_TCP,
 				0);

   s_listen = create_data_socket(local_res);

   if (s_listen == INVALID_SOCKET) {
     netperf_response.content.serv_errno = errno;
     send_response();

     exit(1);
   }

   /* Let's get an address assigned to this socket so we can tell the */
   /* initiator how to reach the data socket. There may be a desire to */
   /* nail this socket to a specific IP address in a multi-homed, */
   /* multi-connection situation, but for now, we'll ignore the issue */
   /* and concentrate on single connection testing. */

   /* NOTE(review): the address bound here is hard-coded AF_INET while */
   /* the socket was created from local_res, whose family comes from */
   /* tcp_rr_request->ipfamily - confirm this is right for families */
   /* other than IPv4, and that create_data_socket() has not already */
   /* bound the socket. */
   if (bind(s_listen,
 	   (struct sockaddr *)&myaddr_in,
 	   sizeof(myaddr_in)) == SOCKET_ERROR) {
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();

     exit(1);
   }

   /* Now, let's set-up the socket to listen for connections */
   if (listen(s_listen, 5) == SOCKET_ERROR) {
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();

     exit(1);
   }


   /* now get the port number assigned by the system  */
   addrlen = sizeof(myaddr_in);
   if (getsockname(s_listen,
 		  (struct sockaddr *)&myaddr_in, &addrlen) == SOCKET_ERROR){
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();

     exit(1);
   }

   /* Now myaddr_in contains the port and the internet address this is */
   /* returned to the sender also implicitly telling the sender that the */
   /* socket buffer sizing has been done. */

   tcp_rr_response->data_port_number = (int) ntohs(myaddr_in.sin_port);
   netperf_response.content.serv_errno   = 0;

   /* But wait, there's more. If the initiator wanted cpu measurements, */
   /* then we must call the calibrate routine, which will return the max */
   /* rate back to the initiator. If the CPU was not to be measured, or */
   /* something went wrong with the calibration, we will return a 0.0 to */
   /* the initiator. */

   tcp_rr_response->cpu_rate = 0.0; 	/* assume no cpu */
   tcp_rr_response->measure_cpu = 0;

   if (tcp_rr_request->measure_cpu) {
     tcp_rr_response->measure_cpu = 1;
     tcp_rr_response->cpu_rate = calibrate_local_cpu(tcp_rr_request->cpu_rate);
   }


   /* before we send the response back to the initiator, pull some of */
   /* the socket parms from the globals */
   tcp_rr_response->send_buf_size = lss_size;
   tcp_rr_response->recv_buf_size = lsr_size;
   tcp_rr_response->no_delay = loc_nodelay;
   tcp_rr_response->so_rcvavoid = loc_rcvavoid;
   tcp_rr_response->so_sndavoid = loc_sndavoid;
   tcp_rr_response->test_length = tcp_rr_request->test_length;
   send_response();

   addrlen = sizeof(peeraddr_in);

   if ((s_data = accept(s_listen,
 		       (struct sockaddr *)&peeraddr_in,
 		       &addrlen)) == INVALID_SOCKET) {
     /* Let's just punt. The remote will be given some information */
     close(s_listen);
     exit(1);
   }

   if (debug) {
     fprintf(where,"recv_tcp_nbrr: accept completes on the data connection.\n");
     fflush(where);
   }

 #ifdef KLUDGE_SOCKET_OPTIONS
   /* this is for those systems which *INCORRECTLY* fail to pass */
   /* attributes across an accept() call. Including this goes against */
   /* my better judgement :( raj 11/95 */

   kludge_socket_options(s_data);

 #endif /* KLUDGE_SOCKET_OPTIONS */

   /* now that we are connected, mark the socket as non-blocking */
   if (!set_nonblock(s_data)) {
     close(s_data);
     exit(1);
   }


   /* Now it's time to start receiving data on the connection. We will */
   /* first grab the apropriate counters and then start grabbing. */

   cpu_start(tcp_rr_request->measure_cpu);

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR with the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
   win_kludge_socket = s_data;
 #endif /* WIN32 */

   /* a positive test_length is a run time in seconds, to which we add */
   /* PAD_TIME. otherwise its negation is the number of transactions */
   /* to perform and times_up is preset so that only the transaction */
   /* count keeps the loop going. */

   if (tcp_rr_request->test_length > 0) {
     times_up = 0;
     trans_remaining = 0;
     start_timer(tcp_rr_request->test_length + PAD_TIME);
   }
   else {
     times_up = 1;
     trans_remaining = tcp_rr_request->test_length * -1;
   }

   trans_received = 0;

   while ((!times_up) || (trans_remaining > 0)) {
     temp_message_ptr = recv_ring->buffer_ptr;
     request_bytes_remaining	= tcp_rr_request->request_size;
     while(request_bytes_remaining > 0) {
       if((request_bytes_recvd=recv(s_data,
 				   temp_message_ptr,
 				   request_bytes_remaining,
 				   0)) == SOCKET_ERROR) {
 	    if ( SOCKET_EINTR(request_bytes_recvd))
 		{
 	      /* the timer popped */
 	      timed_out = 1;
 	      break;
 		}
 #ifndef WIN32  // But what does WinNT indicate in this situation...
 	    else if (errno == EAGAIN) {
 	      Set_errno(0);
 	      /* nothing to read yet. times_up only signals the end of */
 	      /* the test when the test is time-bounded - for a */
 	      /* transaction-count test it was preset to 1 above and */
 	      /* must not cut the test short. */
 	      if (times_up && (tcp_rr_request->test_length > 0)) {
 	        timed_out = 1;
 	        break;
 		  }
 	      continue;
 		}
 #endif
 	    else {
 	      netperf_response.content.serv_errno = errno;
 	      send_response();
 	      exit(1);
 		}
       }
       else if (request_bytes_recvd == 0) {
 	/* the initiator closed the data connection. no more requests */
 	/* will arrive, so stop here rather than spin on recv() */
 	sock_closed = 1;
 	break;
       }
       else {
 	request_bytes_remaining -= request_bytes_recvd;
 	temp_message_ptr  += request_bytes_recvd;
       }
     }

     recv_ring = recv_ring->next;

     if (sock_closed) {
       /* the partial transaction is not counted */
       break;
     }

     if (timed_out) {
       /* we hit the end of the test based on time - lets */
       /* bail out of here now... */
       if (debug) {
 	fprintf(where,"yo5\n");
 	fflush(where);
       }
       break;
     }

     /* Now, send the response to the remote */
     if((bytes_sent=send(s_data,
 			send_ring->buffer_ptr,
 			tcp_rr_request->response_size,
 			0)) == SOCKET_ERROR) {
       if (SOCKET_EINTR(bytes_sent)) {
 	/* the test timer has popped */
 	timed_out = 1;
 	if (debug) {
 	  fprintf(where,"yo6\n");
 	  fflush(where);
 	}
 	break;
       }
       netperf_response.content.serv_errno = 992;
       send_response();
       exit(1);
     }

     send_ring = send_ring->next;

     trans_received++;
     if (trans_remaining) {
       trans_remaining--;
     }
   }


   /* The loop now exits due to timeout, the transaction count being */
   /* reached or the data connection being closed by the initiator */

   cpu_stop(tcp_rr_request->measure_cpu,&elapsed_time);

   stop_timer();

   if (timed_out) {
     /* we ended the test by time, which was at least 2 seconds */
     /* longer than we wanted to run. so, we want to subtract */
     /* PAD_TIME from the elapsed_time. */
     elapsed_time -= PAD_TIME;
   }

   /* send the results to the sender			*/

   if (debug) {
     fprintf(where,
 	    "recv_tcp_nbrr: got %d transactions\n",
 	    trans_received);
     fflush(where);
   }

   tcp_rr_results->bytes_received = (trans_received *
 				    (tcp_rr_request->request_size +
 				     tcp_rr_request->response_size));
   tcp_rr_results->trans_received = trans_received;
   tcp_rr_results->elapsed_time   = elapsed_time;
   tcp_rr_results->cpu_method     = cpu_method;
   tcp_rr_results->num_cpus       = lib_num_loc_cpus;
   if (tcp_rr_request->measure_cpu) {
     tcp_rr_results->cpu_util	= calc_cpu_util(elapsed_time);
   }

   if (debug) {
     fprintf(where,
 	    "recv_tcp_nbrr: test complete, sending results.\n");
     fflush(where);
   }

   /* we are done with the sockets, free them. the listen socket has */
   /* to go too, otherwise one is left open for every test served */
   close(s_data);
   close(s_listen);

   send_response();

 }

 #endif /* DO_NBRR */


  /* this test is intended to test the performance of establishing a */
  /* connection, and then closing it again. this test is of somewhat */
  /* arcane interest since no packets are exchanged between the */
  /* user-space processes, but it will show the raw overhead of */
  /* establishing a TCP connection. that service demand could then be */
  /* compared with the sum of the service demands of a TCP_CRR and */
  /* TCP_RR test - presumeably, they would all relate */

 void
 send_tcp_cc(char remote_host[])
 {

   char *tput_title = "\
 Local /Remote\n\
 Socket Size   Request  Resp.   Elapsed  Trans.\n\
 Send   Recv   Size     Size    Time     Rate         \n\
 bytes  Bytes  bytes    bytes   secs.    per sec   \n\n";

   char *tput_fmt_0 =
     "%7.2f\n";

   char *tput_fmt_1_line_1 = "\
 %-6d %-6d %-6d   %-6d  %-6.2f   %7.2f   \n";
   char *tput_fmt_1_line_2 = "\
 %-6d %-6d\n";

   char *cpu_title = "\
 Local /Remote\n\
 Socket Size   Request Resp.  Elapsed Trans.   CPU    CPU    S.dem   S.dem\n\
 Send   Recv   Size    Size   Time    Rate     local  remote local   remote\n\
 bytes  bytes  bytes   bytes  secs.   per sec  %%      %%      us/Tr   us/Tr\n\n";

   char *cpu_fmt_0 =
     "%6.3f\n";

   char *cpu_fmt_1_line_1 = "\
 %-6d %-6d %-6d  %-6d %-6.2f  %-6.2f   %-6.2f %-6.2f %-6.3f  %-6.3f\n";

   char *cpu_fmt_1_line_2 = "\
 %-6d %-6d\n";

   char *ksink_fmt = "\n\
 Alignment      Offset\n\
 Local  Remote  Local  Remote\n\
 Send   Recv    Send   Recv\n\
 %5d  %5d   %5d  %5d\n";


   int			timed_out = 0;
   float			elapsed_time;

   char	temp_message_ptr[1];
   int	nummessages;
   SOCKET	send_socket;
   int	trans_remaining;
   double	bytes_xferd;
   int	rsp_bytes_left = 1;
   int	rsp_bytes_recvd;

   float	local_cpu_utilization;
   float	local_service_demand;
   float	remote_cpu_utilization;
   float	remote_service_demand;
   double	thruput;

   struct addrinfo *local_res;
   struct addrinfo *remote_res;

   int                           myport;
   int                           ret;

   struct	tcp_cc_request_struct	*tcp_cc_request;
   struct	tcp_cc_response_struct	*tcp_cc_response;
   struct	tcp_cc_results_struct	*tcp_cc_result;

   tcp_cc_request =
     (struct tcp_cc_request_struct *)netperf_request.content.test_specific_data;
   tcp_cc_response =
     (struct tcp_cc_response_struct *)netperf_response.content.test_specific_data;
   tcp_cc_result =
     (struct tcp_cc_results_struct *)netperf_response.content.test_specific_data;


 #ifdef WANT_HISTOGRAM
   if (verbosity > 1) {
     time_hist = HIST_new();
   }
 #endif /* WANT_HISTOGRAM */

   /* since we are now disconnected from the code that established the */
   /* control socket, and since we want to be able to use different */
   /* protocols and such, we are passed the name of the remote host and */
   /* must turn that into the test specific addressing information. */

   complete_addrinfos(&remote_res,
 		     &local_res,
 		     remote_host,
 		     SOCK_STREAM,
 		     IPPROTO_TCP,
 		     0);

   if ( print_headers ) {
     print_top_test_header("TCP Connect/Close TEST",local_res,remote_res);
   }

   /* initialize a few counters */

   nummessages	=	0;
   bytes_xferd	=	0.0;
   times_up 	= 	0;

   /* since there are no data buffers in this test, we need no send or */
   /* recv rings */

   if (debug) {
     fprintf(where,"send_tcp_cc: send_socket obtained...\n");
   }

   /* If the user has requested cpu utilization measurements, we must */
   /* calibrate the cpu(s). We will perform this task within the tests */
   /* themselves. If the user has specified the cpu rate, then */
   /* calibrate_local_cpu will return rather quickly as it will have */
   /* nothing to do. If local_cpu_rate is zero, then we will go through */
   /* all the "normal" calibration stuff and return the rate back.*/

   if (local_cpu_usage) {
     local_cpu_rate = calibrate_local_cpu(local_cpu_rate);
   }

   /* Tell the remote end to do a listen. The server alters the socket */
   /* paramters on the other side at this point, hence the reason for */
   /* all the values being passed in the setup message. If the user did */
   /* not specify any of the parameters, they will be passed as 0, which */
   /* will indicate to the remote that no changes beyond the system's */
   /* default should be used. Alignment is the exception, it will */
   /* default to 8, which will be no alignment alterations. */

   netperf_request.content.request_type	=	DO_TCP_CC;
   tcp_cc_request->recv_buf_size	        =	rsr_size_req;
   tcp_cc_request->send_buf_size	        =	rss_size_req;
   tcp_cc_request->recv_alignment	=	remote_recv_align;
   tcp_cc_request->recv_offset	        =	remote_recv_offset;
   tcp_cc_request->send_alignment	=	remote_send_align;
   tcp_cc_request->send_offset	        =	remote_send_offset;
   tcp_cc_request->request_size	        =	req_size;
   tcp_cc_request->response_size	        =	rsp_size;
   tcp_cc_request->no_delay	        =	rem_nodelay;
   tcp_cc_request->measure_cpu	        =	remote_cpu_usage;
   tcp_cc_request->cpu_rate	        =	remote_cpu_rate;
   tcp_cc_request->so_rcvavoid	=	rem_rcvavoid;
   tcp_cc_request->so_sndavoid	=	rem_sndavoid;
   if (test_time) {
     tcp_cc_request->test_length	=	test_time;
   }
   else {
     tcp_cc_request->test_length	=	test_trans * -1;
   }
   tcp_cc_request->port          = atoi(remote_data_port);
   tcp_cc_request->ipfamily  = af_to_nf(remote_res->ai_family);

   if (debug > 1) {
     fprintf(where,"netperf: send_tcp_cc: requesting TCP crr test\n");
   }

   send_request();

   /* The response from the remote will contain all of the relevant 	*/
   /* socket parameters for this test type. We will put them back into 	*/
   /* the variables here so they can be displayed if desired.  The	*/
   /* remote will have calibrated CPU if necessary, and will have done	*/
   /* all the needed set-up we will have calibrated the cpu locally	*/
   /* before sending the request, and will grab the counter value right	*/
   /* after the connect returns. The remote will grab the counter right	*/
   /* after the accept call. This saves the hassle of extra messages	*/
   /* being sent for the TCP tests.					*/

   recv_response();

   if (!netperf_response.content.serv_errno) {
     rsr_size	=	tcp_cc_response->recv_buf_size;
     rss_size	=	tcp_cc_response->send_buf_size;
     rem_nodelay	=	tcp_cc_response->no_delay;
     remote_cpu_usage=	tcp_cc_response->measure_cpu;
     remote_cpu_rate = 	tcp_cc_response->cpu_rate;
     /* make sure that port numbers are in network order */
     set_port_number(remote_res,(unsigned short)tcp_cc_response->data_port_number);

     if (debug) {
       fprintf(where,"remote listen done.\n");
       fprintf(where,"remote port is %d\n",get_port_number(remote_res));
       fflush(where);
     }
   }
   else {
     Set_errno(netperf_response.content.serv_errno);
     fprintf(where,
 	    "netperf: remote error %d",
 	    netperf_response.content.serv_errno);
     perror("");
     fflush(where);
     exit(1);
   }

 #ifdef WANT_DEMO
   DEMO_RR_SETUP(100)
 #endif

   /* pick a nice random spot between client_port_min and */
   /* client_port_max for our initial port number */
   srand(getpid());
   if (client_port_max - client_port_min) {
     myport = client_port_min +
       (rand() % (client_port_max - client_port_min));
   }
   else {
     myport = client_port_min;
   }
   /* there will be a ++ before the first call to bind, so subtract one */
   myport--;

   /* Set-up the test end conditions. For a request/response test, they */
   /* can be either time or transaction based. */

   if (test_time) {
     /* The user wanted to end the test after a period of time. */
     times_up = 0;
     trans_remaining = 0;
     start_timer(test_time);
   }
   else {
     /* The tester wanted to send a number of bytes. */
     trans_remaining = test_bytes;
     times_up = 1;
   }

   /* The cpu_start routine will grab the current time and possibly */
   /* value of the idle counter for later use in measuring cpu */
   /* utilization and/or service demand and thruput. */

   cpu_start(local_cpu_usage);

 #ifdef WANT_DEMO
   if (demo_mode) {
     HIST_timestamp(demo_one_ptr);
   }
 #endif

   /* We use an "OR" to control test execution. When the test is */
   /* controlled by time, the byte count check will always return false. */
   /* When the test is controlled by byte count, the time test will */
   /* always return false. When the test is finished, the whole */
   /* expression will go false and we will stop sending data. I think I */
   /* just arbitrarily decrement trans_remaining for the timed test, but */
   /* will not do that just yet... One other question is whether or not */
   /* the send buffer and the receive buffer should be the same buffer. */

   while ((!times_up) || (trans_remaining > 0)) {

 #ifdef WANT_HISTOGRAM
     if (verbosity > 1) {
       /* timestamp just before our call to create the socket, and then */
       /* again just after the receive raj 3/95 */
       HIST_timestamp(&time_one);
     }
 #endif /* WANT_HISTOGRAM */

     /* set up the data socket */
     /* newport: is this label really required any longer? */
     /* pick a new port number */
     myport++;

     /* wrap the port number when we get to client_port_max. NOTE, some */
     /* broken TCP's might treat the port number as a signed 16 bit */
     /* quantity.  we aren't interested in testing such broken */
     /* implementations :) so we won't make sure that it is below 32767 */
     /* raj 8/94  */
     if (myport >= client_port_max) {
       myport = client_port_min;
     }

     /* we do not want to use the port number that the server is */
     /* sitting at - this would cause us to fail in a loopback test. we */
     /* could just rely on the failure of the bind to get us past this, */
     /* but I'm guessing that in this one case at least, it is much */
     /* faster, given that we *know* that port number is already in use */
     /* (or rather would be in a loopback test) */

     if (myport == get_port_number(remote_res)) myport++;

     if (debug) {
       if ((nummessages % 100) == 0) {
 	printf("port %d\n",myport);
       }
     }
     set_port_number(local_res, (unsigned short)myport);
     send_socket = create_data_socket(local_res);

     if (send_socket == INVALID_SOCKET) {
       perror("netperf: send_tcp_cc: tcp stream data socket");
       exit(1);
     }

 #ifdef WIN32
     /* this is used so the timer thread can close the socket out from */
     /* under us, which to date is the easiest/cleanest/least */
     /* Windows-specific way I can find to force the winsock calls to */
     /* return WSAEINTR with the test is over. anything that will run on */
     /* 95 and NT and is closer to what netperf expects from Unix signals */
     /* and such would be appreciated raj 1/96 */
     win_kludge_socket = send_socket;
 #endif /* WIN32 */

     /* we used to have a call to bind() here, but that is being
        taken care of by create_data_socket(). raj 2005-02-08 */

     /* Connect up to the remote port on the data socket  */
     if ((ret = connect(send_socket,
 		       remote_res->ai_addr,
 		       remote_res->ai_addrlen)) == INVALID_SOCKET){
       if (SOCKET_EINTR(ret))
 	  {
 	    /* we hit the end of a */
 	    /* timed test. */
 	    timed_out = 1;
 	    break;
       }
       perror("netperf: data socket connect failed");
       printf("\tattempted to connect on socket %d to port %d",
 	     send_socket,
 	     get_port_number(remote_res));
       printf(" from port %u \n",get_port_number(local_res));
       exit(1);
     }

     /* we hang in a recv() to get the remote's close indication */

     rsp_bytes_recvd=recv(send_socket,
 			 temp_message_ptr,
 			 rsp_bytes_left,
 			 0);


     if (rsp_bytes_recvd == 0) {
       /* connection close, call close. we assume that the requisite */
       /* number of bytes have been received */

 #ifdef WANT_HISTOGRAM
       if (verbosity > 1) {
 	HIST_timestamp(&time_two);
 	HIST_add(time_hist,delta_micro(&time_one,&time_two));
       }
 #endif /* WANT_HISTOGRAM */

 #ifdef WANT_DEMO
       DEMO_RR_INTERVAL(1)
 #endif

       nummessages++;
       if (trans_remaining) {
 	trans_remaining--;
       }

       if (debug > 3) {
 	fprintf(where,
 		"Transaction %d completed on local port %u\n",
 		nummessages,
 		get_port_number(local_res));
 	fflush(where);
       }

       close(send_socket);

     }
     else {
       /* it was less than zero - an error occured */
       if (SOCKET_EINTR(rsp_bytes_recvd))
 	  {
 	    /* We hit the end of a timed test. */
 	    timed_out = 1;
 	    break;
 	  }
 	  perror("send_tcp_cc: data recv error");
 	  exit(1);
     }

   }


   /* this call will always give us the elapsed time for the test, and */
   /* will also store-away the necessaries for cpu utilization */

   cpu_stop(local_cpu_usage,&elapsed_time);	/* was cpu being measured? */
   /* how long did we really run? */

   /* Get the statistics from the remote end. The remote will have */
   /* calculated service demand and all those interesting things. If it */
   /* wasn't supposed to care, it will return obvious values. */

   recv_response();
   if (!netperf_response.content.serv_errno) {
     if (debug)
       fprintf(where,"remote results obtained\n");
   }
   else {
     Set_errno(netperf_response.content.serv_errno);
     fprintf(where,
 	    "netperf: remote error %d",
 	     netperf_response.content.serv_errno);
     perror("");
     fflush(where);

     exit(1);
   }

   /* We now calculate what our thruput was for the test. In the future, */
   /* we may want to include a calculation of the thruput measured by */
   /* the remote, but it should be the case that for a TCP stream test, */
   /* that the two numbers should be *very* close... We calculate */
   /* bytes_sent regardless of the way the test length was controlled. */
   /* If it was time, we needed to, and if it was by bytes, the user may */
   /* have specified a number of bytes that wasn't a multiple of the */
   /* send_size, so we really didn't send what he asked for ;-) We use */
   /* Kbytes/s as the units of thruput for a TCP stream test, where K = */
   /* 1024. A future enhancement *might* be to choose from a couple of */
   /* unit selections. */

   bytes_xferd	= (req_size * nummessages) + (rsp_size * nummessages);
   thruput	= calc_thruput(bytes_xferd);

   if (local_cpu_usage || remote_cpu_usage) {
     /* We must now do a little math for service demand and cpu */
     /* utilization for the system(s) */
     /* Of course, some of the information might be bogus because */
     /* there was no idle counter in the kernel(s). We need to make */
     /* a note of this for the user's benefit...*/
     if (local_cpu_usage) {
       if (local_cpu_rate == 0.0) {
 	fprintf(where,"WARNING WARNING WARNING  WARNING WARNING WARNING  WARNING!\n");
 	fprintf(where,"Local CPU usage numbers based on process information only!\n");
 	fflush(where);
       }
       local_cpu_utilization = calc_cpu_util(0.0);
       /* since calc_service demand is doing ms/Kunit we will */
       /* multiply the number of transaction by 1024 to get */
       /* "good" numbers */
       local_service_demand  = calc_service_demand((double) nummessages*1024,
 						  0.0,
 						  0.0,
 						  0);
     }
     else {
       local_cpu_utilization	= (float) -1.0;
       local_service_demand	= (float) -1.0;
     }

     if (remote_cpu_usage) {
       if (remote_cpu_rate == 0.0) {
 	fprintf(where,"DANGER  DANGER  DANGER    DANGER  DANGER  DANGER    DANGER!\n");
 	fprintf(where,"Remote CPU usage numbers based on process information only!\n");
 	fflush(where);
       }
       remote_cpu_utilization = tcp_cc_result->cpu_util;
       /* since calc_service demand is doing ms/Kunit we will */
       /* multiply the number of transaction by 1024 to get */
       /* "good" numbers */
       remote_service_demand = calc_service_demand((double) nummessages*1024,
 						  0.0,
 						  remote_cpu_utilization,
 						  tcp_cc_result->num_cpus);
     }
     else {
       remote_cpu_utilization = (float) -1.0;
       remote_service_demand  = (float) -1.0;
     }

     /* We are now ready to print all the information. If the user */
     /* has specified zero-level verbosity, we will just print the */
     /* local service demand, or the remote service demand. If the */
     /* user has requested verbosity level 1, he will get the basic */
     /* "streamperf" numbers. If the user has specified a verbosity */
     /* of greater than 1, we will display a veritable plethora of */
     /* background information from outside of this block as it it */
     /* not cpu_measurement specific...  */

     switch (verbosity) {
     case 0:
       if (local_cpu_usage) {
 	fprintf(where,
 		cpu_fmt_0,
 		local_service_demand);
       }
       else {
 	fprintf(where,
 		cpu_fmt_0,
 		remote_service_demand);
       }
       break;
     case 1:
     case 2:

       if (print_headers) {
 	fprintf(where,
 		cpu_title,
 		local_cpu_method,
 		remote_cpu_method);
       }

       fprintf(where,
 	      cpu_fmt_1_line_1,		/* the format string */
 	      lss_size,		/* local sendbuf size */
 	      lsr_size,
 	      req_size,		/* how large were the requests */
 	      rsp_size,		/* guess */
 	      elapsed_time,		/* how long was the test */
 	      nummessages/elapsed_time,
 	      local_cpu_utilization,	/* local cpu */
 	      remote_cpu_utilization,	/* remote cpu */
 	      local_service_demand,	/* local service demand */
 	      remote_service_demand);	/* remote service demand */
       fprintf(where,
 	      cpu_fmt_1_line_2,
 	      rss_size,
 	      rsr_size);
       break;
     }
   }
   else {
     /* The tester did not wish to measure service demand. */
     switch (verbosity) {
     case 0:
       fprintf(where,
 	      tput_fmt_0,
 	      nummessages/elapsed_time);
       break;
     case 1:
     case 2:
       if (print_headers) {
 	fprintf(where,tput_title,format_units());
       }

       fprintf(where,
 	      tput_fmt_1_line_1,	/* the format string */
 	      lss_size,
 	      lsr_size,
 	      req_size,		/* how large were the requests */
 	      rsp_size,		/* how large were the responses */
 	      elapsed_time, 		/* how long did it take */
 	      nummessages/elapsed_time);
       fprintf(where,
 	      tput_fmt_1_line_2,
 	      rss_size, 		/* remote recvbuf size */
 	      rsr_size);

       break;
     }
   }

   /* it would be a good thing to include information about some of the */
   /* other parameters that may have been set for this test, but at the */
   /* moment, I do not wish to figure-out all the  formatting, so I will */
   /* just put this comment here to help remind me that it is something */
   /* that should be done at a later time. */

   if (verbosity > 1) {
     /* The user wanted to know it all, so we will give it to him. */
     /* This information will include as much as we can find about */
     /* TCP statistics, the alignments of the sends and receives */
     /* and all that sort of rot... */

     fprintf(where,
 	    ksink_fmt,
 	    local_send_align,
 	    remote_recv_offset,
 	    local_send_offset,
 	    remote_recv_offset);

 #ifdef WANT_HISTOGRAM
     fprintf(where,"\nHistogram of request/response times\n");
     fflush(where);
     HIST_report(time_hist);
 #endif /* WANT_HISTOGRAM */

   }

 }


 void
 recv_tcp_cc()
 {

   char  *message;

   struct addrinfo *local_res;
   char local_name[BUFSIZ];
   char port_buffer[PORTBUFSIZE];

   struct	sockaddr_storage        myaddr_in,  peeraddr_in;
   SOCKET	s_listen,s_data;
   netperf_socklen_t 	addrlen;
   char	*recv_message_ptr;
   char	*send_message_ptr;
   int	trans_received;
   int	trans_remaining;
   int	timed_out = 0;
   float	elapsed_time;

   struct	tcp_cc_request_struct	*tcp_cc_request;
   struct	tcp_cc_response_struct	*tcp_cc_response;
   struct	tcp_cc_results_struct	*tcp_cc_results;

   tcp_cc_request =
     (struct tcp_cc_request_struct *)netperf_request.content.test_specific_data;
   tcp_cc_response =
     (struct tcp_cc_response_struct *)netperf_response.content.test_specific_data;
   tcp_cc_results =
     (struct tcp_cc_results_struct *)netperf_response.content.test_specific_data;

   if (debug) {
     fprintf(where,"netserver: recv_tcp_cc: entered...\n");
     fflush(where);
   }

   /* We want to set-up the listen socket with all the desired */
   /* parameters and then let the initiator know that all is ready. If */
   /* socket size defaults are to be used, then the initiator will have */
   /* sent us 0's. If the socket sizes cannot be changed, then we will */
   /* send-back what they are. If that information cannot be determined, */
   /* then we send-back -1's for the sizes. If things go wrong for any */
   /* reason, we will drop back ten yards and punt. */

   /* If anything goes wrong, we want the remote to know about it. It */
   /* would be best if the error that the remote reports to the user is */
   /* the actual error we encountered, rather than some bogus unexpected */
   /* response type message. */

   if (debug) {
     fprintf(where,"recv_tcp_cc: setting the response type...\n");
     fflush(where);
   }

   netperf_response.content.response_type = TCP_CC_RESPONSE;

   if (debug) {
     fprintf(where,"recv_tcp_cc: the response type is set...\n");
     fflush(where);
   }

   /* set-up the data buffer with the requested alignment and offset */
   message = (char *)malloc(DATABUFFERLEN);
   if (message == NULL) {
     printf("malloc(%d) failed!\n", DATABUFFERLEN);
     exit(1);
   }

   /* We now alter the message_ptr variables to be at the desired */
   /* alignments with the desired offsets. */

   if (debug) {
     fprintf(where,
 	    "recv_tcp_cc: requested recv alignment of %d offset %d\n",
 	    tcp_cc_request->recv_alignment,
 	    tcp_cc_request->recv_offset);
     fprintf(where,
 	    "recv_tcp_cc: requested send alignment of %d offset %d\n",
 	    tcp_cc_request->send_alignment,
 	    tcp_cc_request->send_offset);
     fflush(where);
   }

   recv_message_ptr = ALIGN_BUFFER(message, tcp_cc_request->recv_alignment, tcp_cc_request->recv_offset);

   send_message_ptr = ALIGN_BUFFER(message, tcp_cc_request->send_alignment, tcp_cc_request->send_offset);

   if (debug) {
     fprintf(where,"recv_tcp_cc: receive alignment and offset set...\n");
     fflush(where);
   }

   /* Grab a socket to listen on, and then listen on it. */

   if (debug) {
     fprintf(where,"recv_tcp_cc: grabbing a socket...\n");
     fflush(where);
   }

   /* create_data_socket expects to find some things in the global */
   /* variables, so set the globals based on the values in the request. */
   /* once the socket has been created, we will set the response values */
   /* based on the updated value of those globals. raj 7/94 */
   lss_size_req = tcp_cc_request->send_buf_size;
   lsr_size_req = tcp_cc_request->recv_buf_size;
   loc_nodelay = tcp_cc_request->no_delay;
   loc_rcvavoid = tcp_cc_request->so_rcvavoid;
   loc_sndavoid = tcp_cc_request->so_sndavoid;

   set_hostname_and_port(local_name,
 			port_buffer,
 			nf_to_af(tcp_cc_request->ipfamily),
 			tcp_cc_request->port);

   local_res = complete_addrinfo(local_name,
 				local_name,
 				port_buffer,
 				nf_to_af(tcp_cc_request->ipfamily),
 				SOCK_STREAM,
 				IPPROTO_TCP,
 				0);

   s_listen = create_data_socket(local_res);

   if (s_listen == INVALID_SOCKET) {
     netperf_response.content.serv_errno = errno;
     send_response();
     if (debug) {
       fprintf(where,"could not create data socket\n");
       fflush(where);
     }
     exit(1);
   }

 #ifdef WIN32
   /* The test timer can fire during operations on the listening socket,
      so to make the start_timer below work we have to move
      it to close s_listen while we are blocked on accept. */
   win_kludge_socket2 = s_listen;
 #endif


   /* Now, let's set-up the socket to listen for connections */
   if (listen(s_listen, 5) == SOCKET_ERROR) {
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();
     if (debug) {
       fprintf(where,"could not listen\n");
       fflush(where);
     }
     exit(1);
   }

   /* now get the port number assigned by the system  */
   addrlen = sizeof(myaddr_in);
   if (getsockname(s_listen,
 		  (struct sockaddr *)&myaddr_in,
 		  &addrlen) == SOCKET_ERROR){
     netperf_response.content.serv_errno = errno;
     close(s_listen);
     send_response();
     if (debug) {
       fprintf(where,"could not geetsockname\n");
       fflush(where);
     }
     exit(1);
   }

   /* Now myaddr_in contains the port and the internet address this is */
   /* returned to the sender also implicitly telling the sender that the */
   /* socket buffer sizing has been done. */

   tcp_cc_response->data_port_number =
     (int) ntohs(((struct sockaddr_in *)&myaddr_in)->sin_port);
   if (debug) {
     fprintf(where,"telling the remote to call me at %d\n",
 	    tcp_cc_response->data_port_number);
     fflush(where);
   }
   netperf_response.content.serv_errno   = 0;

   /* But wait, there's more. If the initiator wanted cpu measurements, */
   /* then we must call the calibrate routine, which will return the max */
   /* rate back to the initiator. If the CPU was not to be measured, or */
   /* something went wrong with the calibration, we will return a 0.0 to */
   /* the initiator. */

   tcp_cc_response->cpu_rate = (float)0.0; 	/* assume no cpu */
   if (tcp_cc_request->measure_cpu) {
     tcp_cc_response->measure_cpu = 1;
     tcp_cc_response->cpu_rate =
       calibrate_local_cpu(tcp_cc_request->cpu_rate);
   }


   /* before we send the response back to the initiator, pull some of */
   /* the socket parms from the globals */
   tcp_cc_response->send_buf_size = lss_size;
   tcp_cc_response->recv_buf_size = lsr_size;
   tcp_cc_response->no_delay = loc_nodelay;
   tcp_cc_response->so_rcvavoid = loc_rcvavoid;
   tcp_cc_response->so_sndavoid = loc_sndavoid;

   send_response();

   addrlen = sizeof(peeraddr_in);

   /* Now it's time to start receiving data on the connection. We will */
   /* first grab the apropriate counters and then start grabbing. */

   cpu_start(tcp_cc_request->measure_cpu);

   /* The loop will exit when the sender does a shutdown, which will */
   /* return a length of zero   */

   if (tcp_cc_request->test_length > 0) {
     times_up = 0;
     trans_remaining = 0;
     start_timer(tcp_cc_request->test_length + PAD_TIME);
   }
   else {
     times_up = 1;
     trans_remaining = tcp_cc_request->test_length * -1;
   }

   trans_received = 0;

   while ((!times_up) || (trans_remaining > 0)) {
 #ifdef WIN32
     /* The test timer will probably fire during this accept,
        so to make the start_timer above work we have to move
        it to close s_listen while we are blocked on accept. */
     win_kludge_socket = s_listen;
 #endif
     /* accept a connection from the remote */
     if ((s_data=accept(s_listen,
 		       (struct sockaddr *)&peeraddr_in,
 		       &addrlen)) == INVALID_SOCKET) {
       if (errno == EINTR) {
 	/* the timer popped */
 	timed_out = 1;
 	break;
       }
       fprintf(where,"recv_tcp_cc: accept: errno = %d\n",errno);
       fflush(where);
       close(s_listen);

       exit(1);
     }

 #ifdef KLUDGE_SOCKET_OPTIONS
     /* this is for those systems which *INCORRECTLY* fail to pass */
     /* attributes across an accept() call. Including this goes against */
     /* my better judgement :( raj 11/95 */

     kludge_socket_options(s_data);

 #endif /* KLUDGE_SOCKET_OPTIONS */

 #ifdef WIN32
   /* this is used so the timer thread can close the socket out from */
   /* under us, which to date is the easiest/cleanest/least */
   /* Windows-specific way I can find to force the winsock calls to */
   /* return WSAEINTR with the test is over. anything that will run on */
   /* 95 and NT and is closer to what netperf expects from Unix signals */
   /* and such would be appreciated raj 1/96 */
   win_kludge_socket = s_data;
 #endif /* WIN32 */

     if (debug) {
       fprintf(where,"recv_tcp_cc: accepted data connection.\n");
       fflush(where);
     }


     /* close the connection. the server will likely do a graceful */
     /* close of the connection, insuring that all data has arrived at */
     /* the client. for this it will call shutdown(), and then recv() and */
     /* then close(). I'm reasonably confident that this is the */
     /* appropriate sequence of calls - I would like to hear of */
     /* examples in web servers to the contrary. raj 10/95*/
     close(s_data);

     trans_received++;
     if (trans_remaining) {
       trans_remaining--;
     }

     if (debug) {
       fprintf(where,
 	      "recv_tcp_cc: Transaction %d complete\n",
 	      trans_received);
       fflush(where);
     }

   }


   /* The loop now exits due to timeout or transaction count being */
   /* reached */

   cpu_stop(tcp_cc_request->measure_cpu,&elapsed_time);

   if (timed_out) {
     /* we ended the test by time, which was at least 2 seconds */
     /* longer than we wanted to run. so, we want to subtract */
     /* PAD_TIME from the elapsed_time. */
     elapsed_time -= PAD_TIME;
   }
   /* send the results to the sender			*/

   if (debug) {
     fprintf(where,
 	    "recv_tcp_cc: got %d transactions\n",
 	    trans_received);
     fflush(where);
   }

   tcp_cc_results->bytes_received	= (trans_received *
 					   (tcp_cc_request->request_size +
 					    tcp_cc_request->response_size));
   tcp_cc_results->trans_received	= trans_received;
   tcp_cc_results->elapsed_time	= elapsed_time;
   if (tcp_cc_request->measure_cpu) {
     tcp_cc_results->cpu_util	= calc_cpu_util(elapsed_time);
   }

   if (debug) {
     fprintf(where,
 	    "recv_tcp_cc: test complete, sending results.\n");
     fflush(where);
   }

   send_response();

 }

 /* Write the sockets-test usage text (sockets_usage) to stdout and */
 /* terminate the process with exit status 1. Does not return. */
 void
 print_sockets_usage()
 {
   fputs(sockets_usage, stdout);
   exit(1);
 }

 /* Return a freshly malloc'd, NUL-terminated copy of src. If the
    allocation fails, a message is written to stderr and the process
    exits, so the caller never sees a NULL result. */
 static char *
 scan_sockets_dup_arg(const char *src)
 {
   size_t  len = strlen(src) + 1;  /* +1 so the terminator is copied too */
   char   *copy = malloc(len);

   if (copy == NULL) {
     fprintf(stderr,
             "scan_sockets_args: unable to allocate %lu bytes for an address\n",
             (unsigned long)len);
     fflush(stderr);
     exit(-1);
   }

   memcpy(copy, src, len);
   return copy;
 }

 /* Parse the test-specific command-line options with getopt() and
    store the results in the file's global test settings (socket
    sizes, request/response sizes, data addresses, families, ports
    and so on).

    argc, argv - the argument vector handed to getopt().

    For options that take two comma-separated values, giving only the
    first sets both, giving only the second leaves the first
    untouched, and "first," changes only the first (see break_args).

    After the option loop, when no_control is set, the remote data
    port defaults to a well-known service name chosen from test_name
    and the settings that cannot be negotiated with a remote are set
    to -1. The process exits if no default applies to test_name. */
 void
 scan_sockets_args(int argc, char *argv[])

 {

 #define SOCKETS_ARGS "b:CDnNhH:L:m:M:p:P:r:s:S:T:Vw:W:z46"

   extern char	*optarg;	  /* pointer to option string	*/

   int		c;

   char
     arg1[BUFSIZ],  /* argument holders		*/
     arg2[BUFSIZ];

   if (debug) {
     int i;
     printf("%s called with the following argument vector\n",
            __func__);
     for (i = 0; i< argc; i++) {
       printf("%s ",argv[i]);
     }
     printf("\n");
   }

   /* strncpy() zero-pads a short source, so these are terminated */
   strncpy(local_data_port,"0",sizeof(local_data_port));
   strncpy(remote_data_port,"0",sizeof(remote_data_port));

   while ((c= getopt(argc, argv, SOCKETS_ARGS)) != EOF) {
     switch (c) {
     case '?':
       /* NOTE(review): an option getopt() rejects falls through and is
          handled exactly like -4. Kept as-is to preserve behaviour;
          confirm whether this is intentional. */
       /* fallthrough */
     case '4':
       remote_data_family = AF_INET;
       local_data_family = AF_INET;
       break;
     case '6':
 #if defined(AF_INET6)
       remote_data_family = AF_INET6;
       local_data_family = AF_INET6;
 #else
       fprintf(stderr,
               "This netperf was not compiled on an IPv6 capable host!\n");
       fflush(stderr);
       exit(-1);
 #endif
       break;
     case 'h':
       print_sockets_usage();
       exit(1);
     case 'b':
 #ifdef WANT_FIRST_BURST
       first_burst_size = atoi(optarg);
 #else /* WANT_FIRST_BURST */
       printf("Initial request burst functionality not compiled-in!\n");
 #endif /* WANT_FIRST_BURST */
       break;
     case 'C':
 #ifdef TCP_CORK
       /* set TCP_CORK */
       loc_tcpcork = 1;
       rem_tcpcork = 1; /* however, at first, we only have cork affect loc */
 #else
       printf("WARNING: TCP_CORK not available on this platform!\n");
 #endif /* TCP_CORK */
       break;
     case 'D':
       /* set the TCP nodelay flag */
       loc_nodelay = 1;
       rem_nodelay = 1;
       break;
     case 'H':
       /* remote data address and, optionally, its address family */
       break_args_explicit(optarg,arg1,arg2);
       if (arg1[0]) {
         /* the copy must include the terminating NUL; a strncpy()
            bounded by strlen() would leave the string unterminated */
         remote_data_address = scan_sockets_dup_arg(arg1);
       }
       if (arg2[0]) {
         remote_data_family = parse_address_family(arg2);
       }
       break;
     case 'L':
       /* local data address and, optionally, its address family */
       break_args_explicit(optarg,arg1,arg2);
       if (arg1[0]) {
         /* as for -H, copy the terminator along with the text */
         local_data_address = scan_sockets_dup_arg(arg1);
       }
       if (arg2[0]) {
         local_data_family = parse_address_family(arg2);
       }
       break;
     case 's':
       /* set local socket sizes */
       break_args(optarg,arg1,arg2);
       if (arg1[0])
         lss_size_req = convert(arg1);
       if (arg2[0])
         lsr_size_req = convert(arg2);
       break;
     case 'S':
       /* set remote socket sizes */
       break_args(optarg,arg1,arg2);
       if (arg1[0])
         rss_size_req = convert(arg1);
       if (arg2[0])
         rsr_size_req = convert(arg2);
       break;
     case 'r':
       /* set the request/response sizes */
       break_args(optarg,arg1,arg2);
       if (arg1[0])
         req_size = convert(arg1);
       if (arg2[0])
         rsp_size = convert(arg2);
       break;
     case 'm':
       /* set the send size */
       send_size = convert(optarg);
       break;
     case 'M':
       /* set the recv size */
       recv_size = convert(optarg);
       break;
     case 'n':
       /* set the local socket type*/
       local_connected = 1;
       break;
     case 'N':
       /* set the remote socket type*/
       remote_connected = 1;
       break;
     case 'p':
       /* set the min and max port numbers for the TCP_CRR and TCP_TRR */
       /* tests. */
       break_args(optarg,arg1,arg2);
       if (arg1[0])
         client_port_min = atoi(arg1);
       if (arg2[0])
         client_port_max = atoi(arg2);
       break;
     case 'P':
       /* set the local and remote data port numbers for the tests so
          they can be run through firewalls. strncpy() does not
          terminate the destination when the source fills it, so
          terminate explicitly after each copy. */
       break_args(optarg,arg1,arg2);
       if (arg1[0]) {
         strncpy(local_data_port,arg1,sizeof(local_data_port));
         local_data_port[sizeof(local_data_port) - 1] = '\0';
       }
       if (arg2[0]) {
         strncpy(remote_data_port,arg2,sizeof(remote_data_port));
         remote_data_port[sizeof(remote_data_port) - 1] = '\0';
       }
       break;
     case 't':
       /* set the test name */
       /* NOTE(review): 't' is not listed in SOCKETS_ARGS, so getopt()
          never returns it here and this case is currently
          unreachable; the copy is also unbounded. */
       strcpy(test_name,optarg);
       break;
     case 'W':
       /* set the "width" of the user space data */
       /* buffer. This will be the number of */
       /* send_size buffers malloc'd in the */
       /* *_STREAM test. It may be enhanced to set */
       /* both send and receive "widths" but for now */
       /* it is just the sending *_STREAM. */
       send_width = convert(optarg);
       break;
     case 'V' :
       /* we want to do copy avoidance and will set */
       /* it for everything, everywhere, if we really */
       /* can. of course, we don't know anything */
       /* about the remote... */
 #ifdef SO_SND_COPYAVOID
       loc_sndavoid = 1;
 #else
       loc_sndavoid = 0;
       printf("Local send copy avoidance not available.\n");
 #endif
 #ifdef SO_RCV_COPYAVOID
       loc_rcvavoid = 1;
 #else
       loc_rcvavoid = 0;
       printf("Local recv copy avoidance not available.\n");
 #endif
       rem_sndavoid = 1;
       rem_rcvavoid = 1;
       break;
     default:
       /* 'T', 'w' and 'z' are accepted by SOCKETS_ARGS but have no
          handler in this routine; they are silently ignored, as
          before. */
       break;
     }
   }

 #if defined(WANT_FIRST_BURST)
 #if defined(WANT_HISTOGRAM)
   /* if WANT_FIRST_BURST and WANT_HISTOGRAM are defined and the user
      indeed wants a non-zero first burst size, and we would emit a
      histogram, then we should emit a warning that the two are not
      compatible. raj 2006-01-31 */
   if ((first_burst_size > 0) && (verbosity >= 2)) {
     fprintf(stderr,
             "WARNING! Histograms and first bursts are incompatible!\n");
     fflush(stderr);
   }
 #endif
 #endif

   /* we do not want to make remote_data_address non-NULL because if
      the user has not specified a remote data address, we want to
      take it from the hostname in the -H global option. raj
      2005-02-08 */

   /* so, if there is to be no control connection, we want to have some
      different settings for a few things */

   if (no_control) {

     if (strcmp(remote_data_port,"0") == 0) {
       /* we need to select either the discard port, echo port or
          chargen port depending on the test name. raj 2007-02-08 */
       if (strstr(test_name,"STREAM") ||
           strstr(test_name,"SENDFILE")) {
         strncpy(remote_data_port,"discard",sizeof(remote_data_port));
       }
       else if (strstr(test_name,"RR")) {
         strncpy(remote_data_port,"echo",sizeof(remote_data_port));
       }
       else if (strstr(test_name,"MAERTS")) {
         strncpy(remote_data_port,"chargen",sizeof(remote_data_port));
       }
       else {
         printf("No default port known for the %s test, please set one yourself\n",test_name);
         exit(-1);
       }
     }
     remote_data_port[sizeof(remote_data_port) - 1] = '\0';

     /* I go back and forth on whether these should become -1 or if
        they should become 0 for a no_control test. what do you think?
        raj 2006-02-08 */

     rem_rcvavoid = -1;
     rem_sndavoid = -1;
     rss_size_req = -1;
     rsr_size_req = -1;
     rem_nodelay = -1;

     if (strstr(test_name,"STREAM") ||
         strstr(test_name,"SENDFILE")) {
       recv_size = -1;
     }
     else if (strstr(test_name,"RR")) {
       /* I am however _certain_ that for a no control RR test the
          response size must equal the request size since 99 times out
          of ten we will be speaking to the echo service somewhere */
       rsp_size = req_size;
     }
     else if (strstr(test_name,"MAERTS")) {
       send_size = -1;
     }
     else {
       printf("No default port known for the %s test, please set one yourself\n",test_name);
       exit(-1);
     }
   }
 }