pgm_socket.cpp 21.8 KB
Newer Older
malosek's avatar
malosek committed
1
/*
Martin Sustrik's avatar
Martin Sustrik committed
2
    Copyright (c) 2009-2011 250bpm s.r.o.
3 4
    Copyright (c) 2007-2009 iMatix Corporation
    Copyright (c) 2010-2011 Miru Limited
5
    Copyright (c) 2007-2011 Other contributors as noted in the AUTHORS file
malosek's avatar
malosek committed
6 7 8 9

    This file is part of 0MQ.

    0MQ is free software; you can redistribute it and/or modify it under
10
    the terms of the GNU Lesser General Public License as published by
malosek's avatar
malosek committed
11 12 13 14 15 16
    the Free Software Foundation; either version 3 of the License, or
    (at your option) any later version.

    0MQ is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
17
    GNU Lesser General Public License for more details.
malosek's avatar
malosek committed
18

19
    You should have received a copy of the GNU Lesser General Public License
malosek's avatar
malosek committed
20 21 22 23 24
    along with this program.  If not, see <http://www.gnu.org/licenses/>.
*/

#include "platform.hpp"

malosek's avatar
malosek committed
25
#ifdef ZMQ_HAVE_OPENPGM
malosek's avatar
malosek committed
26

27 28 29 30
#ifdef ZMQ_HAVE_WINDOWS
#include "windows.hpp"
#endif

malosek's avatar
malosek committed
31
#ifdef ZMQ_HAVE_LINUX
32
#include <poll.h>
malosek's avatar
malosek committed
33 34
#endif

Martin Sustrik's avatar
Martin Sustrik committed
35
#include <stdlib.h>
36
#include <string.h>
malosek's avatar
malosek committed
37 38 39 40 41 42
#include <string>

#include "options.hpp"
#include "pgm_socket.hpp"
#include "config.hpp"
#include "err.hpp"
43
#include "random.hpp"
Martin Sustrik's avatar
Martin Sustrik committed
44
#include "stdint.hpp"
malosek's avatar
malosek committed
45

46
#ifndef MSG_ERRQUEUE
Martin Sustrik's avatar
Martin Sustrik committed
47
#define MSG_ERRQUEUE 0x2000
48 49
#endif

malosek's avatar
malosek committed
50
zmq::pgm_socket_t::pgm_socket_t (bool receiver_, const options_t &options_) :
Steven McCoy's avatar
Steven McCoy committed
51
    sock (NULL),
malosek's avatar
malosek committed
52 53 54
    options (options_),
    receiver (receiver_),
    pgm_msgv (NULL),
55
    pgm_msgv_len (0),
malosek's avatar
malosek committed
56 57
    nbytes_rec (0),
    nbytes_processed (0),
58
    pgm_msgv_processed (0)
malosek's avatar
malosek committed
59 60 61
{
}

62
//  Resolve PGM socket address.
63 64 65 66
//  network_ of the form <interface & multicast group decls>:<IP port>
//  e.g. eth0;239.192.0.1:7500
//       link-local;224.250.0.1,224.250.0.2;224.250.0.3:8000
//       ;[fe80::1%en0]:7500
67
int zmq::pgm_socket_t::init_address (const char *network_,
Ian Barber's avatar
Ian Barber committed
68
    struct pgm_addrinfo_t **res, uint16_t *port_number)
malosek's avatar
malosek committed
69
{
Steven McCoy's avatar
Steven McCoy committed
70 71
    //  Parse port number, start from end for IPv6
    const char *port_delim = strrchr (network_, ':');
malosek's avatar
malosek committed
72 73 74 75 76
    if (!port_delim) {
        errno = EINVAL;
        return -1;
    }

77
    *port_number = atoi (port_delim + 1);
malosek's avatar
malosek committed
78
  
Martin Sustrik's avatar
Martin Sustrik committed
79
    char network [256];
80
    if (port_delim - network_ >= (int) sizeof (network) - 1) {
malosek's avatar
malosek committed
81 82 83 84
        errno = EINVAL;
        return -1;
    }
    memset (network, '\0', sizeof (network));
85
    memcpy (network, network_, port_delim - network_);
malosek's avatar
malosek committed
86

Steven McCoy's avatar
Steven McCoy committed
87
    pgm_error_t *pgm_error = NULL;
Ian Barber's avatar
Ian Barber committed
88
    struct pgm_addrinfo_t hints;
Steven McCoy's avatar
Steven McCoy committed
89 90 91

    memset (&hints, 0, sizeof (hints));
    hints.ai_family = AF_UNSPEC;
Ian Barber's avatar
Ian Barber committed
92
    if (!pgm_getaddrinfo (network, NULL, res, &pgm_error)) {
93 94

        //  Invalid parameters don't set pgm_error_t.
95
        zmq_assert (pgm_error != NULL);
96
        if (pgm_error->domain == PGM_ERROR_DOMAIN_IF &&
97 98

              //  NB: cannot catch EAI_BADFLAGS.
99 100
            ( pgm_error->code != PGM_ERROR_SERVICE &&
              pgm_error->code != PGM_ERROR_SOCKTNOSUPPORT)) {
101 102

            //  User, host, or network configuration or transient error.
103 104 105 106
            pgm_error_free (pgm_error);
            errno = EINVAL;
            return -1;
        }
Steven McCoy's avatar
Steven McCoy committed
107

108
        //  Fatal OpenPGM internal error.
109
        zmq_assert (false);
malosek's avatar
malosek committed
110
    }
111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134
    return 0;
}

//  Create, bind and connect PGM socket.
int zmq::pgm_socket_t::init (bool udp_encapsulation_, const char *network_)
{
    //  Can not open transport before destroying old one.
    zmq_assert (sock == NULL);
    zmq_assert (options.rate > 0);

    //  Zero counter used in msgrecv.
    nbytes_rec = 0;
    nbytes_processed = 0;
    pgm_msgv_processed = 0;

    uint16_t port_number;
    struct pgm_addrinfo_t *res = NULL;
    sa_family_t sa_family;

    pgm_error_t *pgm_error = NULL;

    if (init_address(network_, &res, &port_number) < 0) {
        goto err_abort;
    }
malosek's avatar
malosek committed
135

136 137
    zmq_assert (res != NULL);

138
    //  Pick up detected IP family.
Steven McCoy's avatar
Steven McCoy committed
139
    sa_family = res->ai_send_addrs[0].gsr_group.ss_family;
malosek's avatar
malosek committed
140

141
    //  Create IP/PGM or UDP/PGM socket.
Martin Sustrik's avatar
Martin Sustrik committed
142
    if (udp_encapsulation_) {
143 144 145 146
        if (!pgm_socket (&sock, sa_family, SOCK_SEQPACKET, IPPROTO_UDP,
              &pgm_error)) {

            //  Invalid parameters don't set pgm_error_t.
147
            zmq_assert (pgm_error != NULL);
Steven McCoy's avatar
Steven McCoy committed
148
            if (pgm_error->domain == PGM_ERROR_DOMAIN_SOCKET && (
149 150 151 152
                  pgm_error->code != PGM_ERROR_BADF &&
                  pgm_error->code != PGM_ERROR_FAULT &&
                  pgm_error->code != PGM_ERROR_NOPROTOOPT &&
                  pgm_error->code != PGM_ERROR_FAILED))
153 154

                //  User, host, or network configuration or transient error.
Steven McCoy's avatar
Steven McCoy committed
155 156
                goto err_abort;

157
            //  Fatal OpenPGM internal error.
Steven McCoy's avatar
Steven McCoy committed
158
            zmq_assert (false);
159 160
        }

Steven McCoy's avatar
Steven McCoy committed
161 162
        //  All options are of data type int
        const int encapsulation_port = port_number;
163
        if (!pgm_setsockopt (sock, IPPROTO_PGM, PGM_UDP_ENCAP_UCAST_PORT,
164 165 166
                &encapsulation_port, sizeof (encapsulation_port)))
            goto err_abort;
        if (!pgm_setsockopt (sock, IPPROTO_PGM, PGM_UDP_ENCAP_MCAST_PORT,
167
                &encapsulation_port, sizeof (encapsulation_port)))
Steven McCoy's avatar
Steven McCoy committed
168
            goto err_abort;
169 170 171 172 173 174
    }
    else {
        if (!pgm_socket (&sock, sa_family, SOCK_SEQPACKET, IPPROTO_PGM,
              &pgm_error)) {

            //  Invalid parameters don't set pgm_error_t.
175
            zmq_assert (pgm_error != NULL);
Steven McCoy's avatar
Steven McCoy committed
176
            if (pgm_error->domain == PGM_ERROR_DOMAIN_SOCKET && (
177 178 179 180
                  pgm_error->code != PGM_ERROR_BADF &&
                  pgm_error->code != PGM_ERROR_FAULT &&
                  pgm_error->code != PGM_ERROR_NOPROTOOPT &&
                  pgm_error->code != PGM_ERROR_FAILED))
181 182

                //  User, host, or network configuration or transient error.
Steven McCoy's avatar
Steven McCoy committed
183 184
                goto err_abort;

185
            //  Fatal OpenPGM internal error.
Steven McCoy's avatar
Steven McCoy committed
186 187
            zmq_assert (false);
        }
malosek's avatar
malosek committed
188 189
    }

Steven McCoy's avatar
Steven McCoy committed
190
    {
191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208
		const int rcvbuf = (int) options.rcvbuf;
		if (rcvbuf) {
		    if (!pgm_setsockopt (sock, SOL_SOCKET, SO_RCVBUF, &rcvbuf,
		          sizeof (rcvbuf)))
		        goto err_abort;
		}

		const int sndbuf = (int) options.sndbuf;
		if (sndbuf) {
		    if (!pgm_setsockopt (sock, SOL_SOCKET, SO_SNDBUF, &sndbuf,
		          sizeof (sndbuf)))
		        goto err_abort;
		}

		const int max_tpdu = (int) pgm_max_tpdu;
		if (!pgm_setsockopt (sock, IPPROTO_PGM, PGM_MTU, &max_tpdu,
		      sizeof (max_tpdu)))
		    goto err_abort;
malosek's avatar
malosek committed
209 210
    }

malosek's avatar
malosek committed
211
    if (receiver) {
Steven McCoy's avatar
Steven McCoy committed
212
        const int recv_only        = 1,
213
                  rxw_max_tpdu     = (int) pgm_max_tpdu,
214
                  rxw_sqns         = compute_sqns (rxw_max_tpdu),
215
                  peer_expiry      = pgm_secs (300),
Steven McCoy's avatar
Steven McCoy committed
216 217 218 219
                  spmr_expiry      = pgm_msecs (25),
                  nak_bo_ivl       = pgm_msecs (50),
                  nak_rpt_ivl      = pgm_msecs (200),
                  nak_rdata_ivl    = pgm_msecs (200),
220 221
                  nak_data_retries = 50,
                  nak_ncf_retries  = 50;
Steven McCoy's avatar
Steven McCoy committed
222

223 224
        if (!pgm_setsockopt (sock, IPPROTO_PGM, PGM_RECV_ONLY, &recv_only,
                sizeof (recv_only)) ||
225 226
            !pgm_setsockopt (sock, IPPROTO_PGM, PGM_RXW_SQNS, &rxw_sqns,
                sizeof (rxw_sqns)) ||
227 228 229 230 231 232 233 234 235 236 237 238 239 240
            !pgm_setsockopt (sock, IPPROTO_PGM, PGM_PEER_EXPIRY, &peer_expiry,
                sizeof (peer_expiry)) ||
            !pgm_setsockopt (sock, IPPROTO_PGM, PGM_SPMR_EXPIRY, &spmr_expiry,
                sizeof (spmr_expiry)) ||
            !pgm_setsockopt (sock, IPPROTO_PGM, PGM_NAK_BO_IVL, &nak_bo_ivl,
                sizeof (nak_bo_ivl)) ||
            !pgm_setsockopt (sock, IPPROTO_PGM, PGM_NAK_RPT_IVL, &nak_rpt_ivl,
                sizeof (nak_rpt_ivl)) ||
            !pgm_setsockopt (sock, IPPROTO_PGM, PGM_NAK_RDATA_IVL,
                &nak_rdata_ivl, sizeof (nak_rdata_ivl)) ||
            !pgm_setsockopt (sock, IPPROTO_PGM, PGM_NAK_DATA_RETRIES,
                &nak_data_retries, sizeof (nak_data_retries)) ||
            !pgm_setsockopt (sock, IPPROTO_PGM, PGM_NAK_NCF_RETRIES,
                &nak_ncf_retries, sizeof (nak_ncf_retries)))
Steven McCoy's avatar
Steven McCoy committed
241
            goto err_abort;
242 243
    }
    else {
Steven McCoy's avatar
Steven McCoy committed
244
        const int send_only        = 1,
Steven McCoy's avatar
Steven McCoy committed
245
                  max_rte      = (int) ((options.rate * 1000) / 8),
246
                  txw_max_tpdu     = (int) pgm_max_tpdu,
247
                  txw_sqns         = compute_sqns (txw_max_tpdu),
248 249 250 251 252 253 254 255 256 257
                  ambient_spm      = pgm_secs (30),
                  heartbeat_spm[]  = { pgm_msecs (100),
                                       pgm_msecs (100),
                                       pgm_msecs (100),
                                       pgm_msecs (100),
                                       pgm_msecs (1300),
                                       pgm_secs  (7),
                                       pgm_secs  (16),
                                       pgm_secs  (25),
                                       pgm_secs  (30) };
Steven McCoy's avatar
Steven McCoy committed
258

259 260
        if (!pgm_setsockopt (sock, IPPROTO_PGM, PGM_SEND_ONLY,
                &send_only, sizeof (send_only)) ||
Steven McCoy's avatar
Steven McCoy committed
261 262
            !pgm_setsockopt (sock, IPPROTO_PGM, PGM_ODATA_MAX_RTE,
                &max_rte, sizeof (max_rte)) ||
263 264
            !pgm_setsockopt (sock, IPPROTO_PGM, PGM_TXW_SQNS,
                &txw_sqns, sizeof (txw_sqns)) ||
265 266 267 268
            !pgm_setsockopt (sock, IPPROTO_PGM, PGM_AMBIENT_SPM,
                &ambient_spm, sizeof (ambient_spm)) ||
            !pgm_setsockopt (sock, IPPROTO_PGM, PGM_HEARTBEAT_SPM,
                &heartbeat_spm, sizeof (heartbeat_spm)))
Steven McCoy's avatar
Steven McCoy committed
269 270
            goto err_abort;
    }
malosek's avatar
malosek committed
271

Steven McCoy's avatar
Steven McCoy committed
272 273
    //  PGM transport GSI.
    struct pgm_sockaddr_t addr;
Martin Sustrik's avatar
Martin Sustrik committed
274

Steven McCoy's avatar
Steven McCoy committed
275 276 277
    memset (&addr, 0, sizeof(addr));
    addr.sa_port = port_number;
    addr.sa_addr.sport = DEFAULT_DATA_SOURCE_PORT;
malosek's avatar
malosek committed
278

279 280 281 282 283 284
    //  Create random GSI.
    uint32_t buf [2];
    buf [0] = generate_random ();
    buf [1] = generate_random ();
    if (!pgm_gsi_create_from_data (&addr.sa_addr.gsi, (uint8_t*) buf, 8))
        goto err_abort;
285

malosek's avatar
malosek committed
286

Steven McCoy's avatar
Steven McCoy committed
287 288 289 290 291 292 293 294 295
    //  Bind a transport to the specified network devices.
    struct pgm_interface_req_t if_req;
    memset (&if_req, 0, sizeof(if_req));
    if_req.ir_interface = res->ai_recv_addrs[0].gsr_interface;
    if_req.ir_scope_id  = 0;
    if (AF_INET6 == sa_family) {
        struct sockaddr_in6 sa6;
        memcpy (&sa6, &res->ai_recv_addrs[0].gsr_group, sizeof (sa6));
        if_req.ir_scope_id = sa6.sin6_scope_id;
malosek's avatar
malosek committed
296
    }
297 298 299 300
    if (!pgm_bind3 (sock, &addr, sizeof (addr), &if_req, sizeof (if_req),
          &if_req, sizeof (if_req), &pgm_error)) {

        //  Invalid parameters don't set pgm_error_t.
301 302 303 304 305 306
        zmq_assert (pgm_error != NULL);
        if ((pgm_error->domain == PGM_ERROR_DOMAIN_SOCKET ||
             pgm_error->domain == PGM_ERROR_DOMAIN_IF) && (
             pgm_error->code != PGM_ERROR_INVAL &&
             pgm_error->code != PGM_ERROR_BADF &&
             pgm_error->code != PGM_ERROR_FAULT))
307 308

            //  User, host, or network configuration or transient error.
Steven McCoy's avatar
Steven McCoy committed
309 310
            goto err_abort;

311
        //  Fatal OpenPGM internal error.
Steven McCoy's avatar
Steven McCoy committed
312
        zmq_assert (false);
malosek's avatar
malosek committed
313 314
    }

315 316 317 318
    //  Join IP multicast groups.
    for (unsigned i = 0; i < res->ai_recv_addrs_len; i++) {
        if (!pgm_setsockopt (sock, IPPROTO_PGM, PGM_JOIN_GROUP,
              &res->ai_recv_addrs [i], sizeof (struct group_req)))
Steven McCoy's avatar
Steven McCoy committed
319 320
            goto err_abort;
    }
321 322
    if (!pgm_setsockopt (sock, IPPROTO_PGM, PGM_SEND_GROUP,
          &res->ai_send_addrs [0], sizeof (struct group_req)))
Steven McCoy's avatar
Steven McCoy committed
323
        goto err_abort;
324

Steven McCoy's avatar
Steven McCoy committed
325
    pgm_freeaddrinfo (res);
326
    res = NULL;
327

328
    //  Set IP level parameters.
Steven McCoy's avatar
Steven McCoy committed
329
    {
Rohan's avatar
Rohan committed
330
		// Multicast loopback disabled by default
331 332 333 334 335 336 337 338 339 340 341
		const int multicast_loop = 0;
		if (!pgm_setsockopt (sock, IPPROTO_PGM, PGM_MULTICAST_LOOP,
		      &multicast_loop, sizeof (multicast_loop)))
		    goto err_abort;

		const int multicast_hops = options.multicast_hops;
		if (!pgm_setsockopt (sock, IPPROTO_PGM, PGM_MULTICAST_HOPS,
		        &multicast_hops, sizeof (multicast_hops)))
		    goto err_abort;

		//  Expedited Forwarding PHB for network elements, no ECN.
Rohan's avatar
Rohan committed
342
		const int dscp = 0x2e << 2;
343 344
		if (AF_INET6 != sa_family && !pgm_setsockopt (sock,
		      IPPROTO_PGM, PGM_TOS, &dscp, sizeof (dscp)))
Rohan's avatar
Rohan committed
345
		    goto err_abort;
346 347 348 349 350

		const int nonblocking = 1;
		if (!pgm_setsockopt (sock, IPPROTO_PGM, PGM_NOBLOCK,
		      &nonblocking, sizeof (nonblocking)))
		    goto err_abort;
351
    }
malosek's avatar
malosek committed
352

353 354
    //  Connect PGM transport to start state machine.
    if (!pgm_connect (sock, &pgm_error)) {
355 356

        //  Invalid parameters don't set pgm_error_t.
357 358 359 360
        zmq_assert (pgm_error != NULL);
        goto err_abort;
    }

Martin Sustrik's avatar
Martin Sustrik committed
361 362 363 364 365 366 367 368 369 370
    //  For receiver transport preallocate pgm_msgv array.
    if (receiver) {
        zmq_assert (in_batch_size > 0);
        size_t max_tsdu_size = get_max_tsdu_size ();
        pgm_msgv_len = (int) in_batch_size / max_tsdu_size;
        if ((int) in_batch_size % max_tsdu_size)
            pgm_msgv_len++;
        zmq_assert (pgm_msgv_len);

        pgm_msgv = (pgm_msgv_t*) malloc (sizeof (pgm_msgv_t) * pgm_msgv_len);
371
        alloc_assert (pgm_msgv);
Martin Sustrik's avatar
Martin Sustrik committed
372 373
    }

malosek's avatar
malosek committed
374
    return 0;
Steven McCoy's avatar
Steven McCoy committed
375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390

err_abort:
    if (sock != NULL) {
        pgm_close (sock, FALSE);
        sock = NULL;
    }
    if (res != NULL) {
        pgm_freeaddrinfo (res);
        res = NULL;
    }
    if (pgm_error != NULL) {
        pgm_error_free (pgm_error);
        pgm_error = NULL;
    }
    errno = EINVAL;
    return -1;
malosek's avatar
malosek committed
391 392 393 394
}

zmq::pgm_socket_t::~pgm_socket_t ()
{
Martin Sustrik's avatar
Martin Sustrik committed
395 396
    if (pgm_msgv)
        free (pgm_msgv);
Steven McCoy's avatar
Steven McCoy committed
397 398
    if (sock) 
        pgm_close (sock, TRUE);
malosek's avatar
malosek committed
399 400
}

401 402
//  Get receiver fds. receive_fd_ is signaled for incoming packets,
//  waiting_pipe_fd_ is signaled for state driven events and data.
403 404
void zmq::pgm_socket_t::get_receiver_fds (fd_t *receive_fd_, 
    fd_t *waiting_pipe_fd_)
malosek's avatar
malosek committed
405
{
Steven McCoy's avatar
Steven McCoy committed
406 407 408
    socklen_t socklen;
    bool rc;

409 410 411
    zmq_assert (receive_fd_);
    zmq_assert (waiting_pipe_fd_);

Steven McCoy's avatar
Steven McCoy committed
412
    socklen = sizeof (*receive_fd_);
413 414
    rc = pgm_getsockopt (sock, IPPROTO_PGM, PGM_RECV_SOCK, receive_fd_,
        &socklen);
Steven McCoy's avatar
Steven McCoy committed
415 416
    zmq_assert (rc);
    zmq_assert (socklen == sizeof (*receive_fd_));
417

Steven McCoy's avatar
Steven McCoy committed
418
    socklen = sizeof (*waiting_pipe_fd_);
419 420
    rc = pgm_getsockopt (sock, IPPROTO_PGM, PGM_PENDING_SOCK, waiting_pipe_fd_,
        &socklen);
Steven McCoy's avatar
Steven McCoy committed
421 422
    zmq_assert (rc);
    zmq_assert (socklen == sizeof (*waiting_pipe_fd_));
malosek's avatar
malosek committed
423 424
}

425
//  Get fds and store them into user allocated memory. 
Steven McCoy's avatar
Steven McCoy committed
426 427 428 429
//  send_fd is for non-blocking send wire notifications.
//  receive_fd_ is for incoming back-channel protocol packets.
//  rdata_notify_fd_ is raised for waiting repair transmissions.
//  pending_notify_fd_ is for state driven events.
430 431
void zmq::pgm_socket_t::get_sender_fds (fd_t *send_fd_, fd_t *receive_fd_, 
    fd_t *rdata_notify_fd_, fd_t *pending_notify_fd_)
malosek's avatar
malosek committed
432
{
Steven McCoy's avatar
Steven McCoy committed
433 434 435
    socklen_t socklen;
    bool rc;

malosek's avatar
malosek committed
436 437
    zmq_assert (send_fd_);
    zmq_assert (receive_fd_);
438
    zmq_assert (rdata_notify_fd_);
439
    zmq_assert (pending_notify_fd_);
440

Steven McCoy's avatar
Steven McCoy committed
441 442 443 444 445 446
    socklen = sizeof (*send_fd_);
    rc = pgm_getsockopt (sock, IPPROTO_PGM, PGM_SEND_SOCK, send_fd_, &socklen);
    zmq_assert (rc);
    zmq_assert (socklen == sizeof (*receive_fd_));

    socklen = sizeof (*receive_fd_);
447 448
    rc = pgm_getsockopt (sock, IPPROTO_PGM, PGM_RECV_SOCK, receive_fd_,
        &socklen);
Steven McCoy's avatar
Steven McCoy committed
449 450 451 452
    zmq_assert (rc);
    zmq_assert (socklen == sizeof (*receive_fd_));

    socklen = sizeof (*rdata_notify_fd_);
453 454
    rc = pgm_getsockopt (sock, IPPROTO_PGM, PGM_REPAIR_SOCK, rdata_notify_fd_,
        &socklen);
Steven McCoy's avatar
Steven McCoy committed
455 456 457 458
    zmq_assert (rc);
    zmq_assert (socklen == sizeof (*rdata_notify_fd_));

    socklen = sizeof (*pending_notify_fd_);
459 460
    rc = pgm_getsockopt (sock, IPPROTO_PGM, PGM_PENDING_SOCK,
        pending_notify_fd_, &socklen);
Steven McCoy's avatar
Steven McCoy committed
461 462
    zmq_assert (rc);
    zmq_assert (socklen == sizeof (*pending_notify_fd_));
malosek's avatar
malosek committed
463 464 465
}

//  Send one APDU, transmit window owned memory.
Steven McCoy's avatar
Steven McCoy committed
466
//  data_len_ must be less than one TPDU.
malosek's avatar
malosek committed
467 468
size_t zmq::pgm_socket_t::send (unsigned char *data_, size_t data_len_)
{
malosek's avatar
malosek committed
469 470
    size_t nbytes = 0;
   
Steven McCoy's avatar
Steven McCoy committed
471
    const int status = pgm_send (sock, data_, data_len_, &nbytes);
malosek's avatar
malosek committed
472

473
    //  We have to write all data as one packet.
474 475
    if (nbytes > 0) {
        zmq_assert (status == PGM_IO_STATUS_NORMAL);
Martin Hurton's avatar
Martin Hurton committed
476
        zmq_assert (nbytes == data_len_);
477 478
    }
    else {
479 480
        zmq_assert (status == PGM_IO_STATUS_RATE_LIMITED ||
            status == PGM_IO_STATUS_WOULD_BLOCK);
481 482 483 484 485 486 487

        if (status == PGM_IO_STATUS_RATE_LIMITED)
            errno = ENOMEM;
        else
            errno = EBUSY;
    }

488
    //  Save return value.
489
    last_tx_status = status;
malosek's avatar
malosek committed
490 491 492 493

    return nbytes;
}

494 495
long zmq::pgm_socket_t::get_rx_timeout ()
{
496 497
    if (last_rx_status != PGM_IO_STATUS_RATE_LIMITED &&
          last_rx_status != PGM_IO_STATUS_TIMER_PENDING)
498 499 500 501
        return -1;

    struct timeval tv;
    socklen_t optlen = sizeof (tv);
502 503 504
    const bool rc = pgm_getsockopt (sock, IPPROTO_PGM,
        last_rx_status == PGM_IO_STATUS_RATE_LIMITED ? PGM_RATE_REMAIN :
        PGM_TIME_REMAIN, &tv, &optlen);
505 506 507 508 509 510 511 512 513 514 515 516 517 518
    zmq_assert (rc);

    const long timeout = (tv.tv_sec * 1000) + (tv.tv_usec / 1000);

    return timeout;
}

long zmq::pgm_socket_t::get_tx_timeout ()
{
    if (last_tx_status != PGM_IO_STATUS_RATE_LIMITED)
        return -1;

    struct timeval tv;
    socklen_t optlen = sizeof (tv);
519 520
    const bool rc = pgm_getsockopt (sock, IPPROTO_PGM, PGM_RATE_REMAIN, &tv,
        &optlen);
521 522 523 524 525 526 527
    zmq_assert (rc);

    const long timeout = (tv.tv_sec * 1000) + (tv.tv_usec / 1000);

    return timeout;
}

malosek's avatar
malosek committed
528
//  Return max TSDU size without fragmentation from current PGM transport.
529
size_t zmq::pgm_socket_t::get_max_tsdu_size ()
malosek's avatar
malosek committed
530
{
Steven McCoy's avatar
Steven McCoy committed
531 532 533 534 535 536 537
    int max_tsdu = 0;
    socklen_t optlen = sizeof (max_tsdu);

    bool rc = pgm_getsockopt (sock, IPPROTO_PGM, PGM_MSS, &max_tsdu, &optlen);
    zmq_assert (rc);
    zmq_assert (optlen == sizeof (max_tsdu));
    return (size_t) max_tsdu;
malosek's avatar
malosek committed
538 539
}

540 541
//  pgm_recvmsgv is called to fill the pgm_msgv array up to  pgm_msgv_len.
//  In subsequent calls data from pgm_msgv structure are returned.
malosek's avatar
malosek committed
542
ssize_t zmq::pgm_socket_t::receive (void **raw_data_, const pgm_tsi_t **tsi_)
malosek's avatar
malosek committed
543
{
malosek's avatar
malosek committed
544 545
    size_t raw_data_len = 0;

malosek's avatar
malosek committed
546 547 548 549 550 551 552 553
    //  We just sent all data from pgm_transport_recvmsgv up 
    //  and have to return 0 that another engine in this thread is scheduled.
    if (nbytes_rec == nbytes_processed && nbytes_rec > 0) {

        //  Reset all the counters.
        nbytes_rec = 0;
        nbytes_processed = 0;
        pgm_msgv_processed = 0;
554
        errno = EAGAIN;
555
        return 0;
malosek's avatar
malosek committed
556 557 558
    }

    //  If we have are going first time or if we have processed all pgm_msgv_t
559
    //  structure previously read from the pgm socket.
malosek's avatar
malosek committed
560 561 562 563 564 565 566 567 568
    if (nbytes_rec == nbytes_processed) {

        //  Check program flow.
        zmq_assert (pgm_msgv_processed == 0);
        zmq_assert (nbytes_processed == 0);
        zmq_assert (nbytes_rec == 0);

        //  Receive a vector of Application Protocol Domain Unit's (APDUs) 
        //  from the transport.
Steven McCoy's avatar
Steven McCoy committed
569
        pgm_error_t *pgm_error = NULL;
malosek's avatar
malosek committed
570

Steven McCoy's avatar
Steven McCoy committed
571 572
        const int status = pgm_recvmsgv (sock, pgm_msgv,
            pgm_msgv_len, MSG_ERRQUEUE, &nbytes_rec, &pgm_error);
573

574
        //  Invalid parameters.
Martin Sustrik's avatar
Martin Sustrik committed
575
        zmq_assert (status != PGM_IO_STATUS_ERROR);
576

577 578
        last_rx_status = status;

malosek's avatar
malosek committed
579
        //  In a case when no ODATA/RDATA fired POLLIN event (SPM...)
Steven McCoy's avatar
Steven McCoy committed
580
        //  pgm_recvmsg returns PGM_IO_STATUS_TIMER_PENDING.
581 582
        if (status == PGM_IO_STATUS_TIMER_PENDING) {

583 584
            zmq_assert (nbytes_rec == 0);

malosek's avatar
malosek committed
585 586 587
            //  In case if no RDATA/ODATA caused POLLIN 0 is 
            //  returned.
            nbytes_rec = 0;
588
            errno = EBUSY;
589
            return 0;
malosek's avatar
malosek committed
590
        }
591

Steven McCoy's avatar
Steven McCoy committed
592 593 594 595 596
        //  Send SPMR, NAK, ACK is rate limited.
        if (status == PGM_IO_STATUS_RATE_LIMITED) {

            zmq_assert (nbytes_rec == 0);

597
            //  In case if no RDATA/ODATA caused POLLIN 0 is returned.
Steven McCoy's avatar
Steven McCoy committed
598
            nbytes_rec = 0;
599 600
            errno = ENOMEM;
            return 0;
Steven McCoy's avatar
Steven McCoy committed
601 602 603 604 605 606 607
        }

        //  No peers and hence no incoming packets.
        if (status == PGM_IO_STATUS_WOULD_BLOCK) {

            zmq_assert (nbytes_rec == 0);

608
            //  In case if no RDATA/ODATA caused POLLIN 0 is returned.
Steven McCoy's avatar
Steven McCoy committed
609
            nbytes_rec = 0;
610
            errno = EAGAIN;
611
            return 0;
Steven McCoy's avatar
Steven McCoy committed
612 613
        }

614 615 616
        //  Data loss.
        if (status == PGM_IO_STATUS_RESET) {

617
            struct pgm_sk_buff_t* skb = pgm_msgv [0].msgv_skb [0];
618 619

            //  Save lost data TSI.
Steven McCoy's avatar
Steven McCoy committed
620
            *tsi_ = &skb->tsi;
621 622 623
            nbytes_rec = 0;

            //  In case of dala loss -1 is returned.
624
            errno = EINVAL;
Steven McCoy's avatar
Steven McCoy committed
625
            pgm_free_skb (skb);
626 627 628
            return -1;
        }

629
        zmq_assert (status == PGM_IO_STATUS_NORMAL);
malosek's avatar
malosek committed
630
    }
631 632 633 634
    else
    {
        zmq_assert (pgm_msgv_processed <= pgm_msgv_len);
    }
malosek's avatar
malosek committed
635

636
    // Zero byte payloads are valid in PGM, but not 0MQ protocol.
malosek's avatar
malosek committed
637 638
    zmq_assert (nbytes_rec > 0);

malosek's avatar
malosek committed
639 640 641 642 643 644 645 646 647 648 649 650
    // Only one APDU per pgm_msgv_t structure is allowed.
    zmq_assert (pgm_msgv [pgm_msgv_processed].msgv_len == 1);
 
    struct pgm_sk_buff_t* skb = 
        pgm_msgv [pgm_msgv_processed].msgv_skb [0];

    //  Take pointers from pgm_msgv_t structure.
    *raw_data_ = skb->data;
    raw_data_len = skb->len;

    //  Save current TSI.
    *tsi_ = &skb->tsi;
malosek's avatar
malosek committed
651 652 653

    //  Move the the next pgm_msgv_t structure.
    pgm_msgv_processed++;
654
    zmq_assert (pgm_msgv_processed <= pgm_msgv_len);
malosek's avatar
malosek committed
655 656 657 658 659
    nbytes_processed +=raw_data_len;

    return raw_data_len;
}

660
void zmq::pgm_socket_t::process_upstream ()
malosek's avatar
malosek committed
661
{
malosek's avatar
malosek committed
662
    pgm_msgv_t dummy_msg;
malosek's avatar
malosek committed
663

malosek's avatar
malosek committed
664
    size_t dummy_bytes = 0;
Steven McCoy's avatar
Steven McCoy committed
665
    pgm_error_t *pgm_error = NULL;
malosek's avatar
malosek committed
666

Steven McCoy's avatar
Steven McCoy committed
667 668
    const int status = pgm_recvmsgv (sock, &dummy_msg,
        1, MSG_ERRQUEUE, &dummy_bytes, &pgm_error);
malosek's avatar
malosek committed
669

670
    //  Invalid parameters.
Martin Sustrik's avatar
Martin Sustrik committed
671
    zmq_assert (status != PGM_IO_STATUS_ERROR);
672

malosek's avatar
malosek committed
673
    //  No data should be returned.
674
    zmq_assert (dummy_bytes == 0 && (status == PGM_IO_STATUS_TIMER_PENDING || 
675 676
        status == PGM_IO_STATUS_RATE_LIMITED ||
        status == PGM_IO_STATUS_WOULD_BLOCK));
677 678 679 680 681

    last_rx_status = status;

    if (status == PGM_IO_STATUS_TIMER_PENDING)
        errno = EBUSY;
682 683
    else
    if (status == PGM_IO_STATUS_RATE_LIMITED)
684 685 686
        errno = ENOMEM;
    else
        errno = EAGAIN;
malosek's avatar
malosek committed
687 688
}

689 690 691
int zmq::pgm_socket_t::compute_sqns (int tpdu_)
{
    //  Convert rate into B/ms.
692
    uint64_t rate = uint64_t (options.rate) / 8;
693 694
        
    //  Compute the size of the buffer in bytes.
695
    uint64_t size = uint64_t (options.recovery_ivl) * rate;
696 697 698 699

    //  Translate the size into number of packets.
    uint64_t sqns = size / tpdu_;

700
    //  Buffer should be able to hold at least one packet.
701 702 703
    if (sqns == 0)
        sqns = 1;

704
    return (int) sqns;
705 706
}

malosek's avatar
malosek committed
707 708
#endif