corosync 3.1.7
totempg.c
1/*
2 * Copyright (c) 2003-2005 MontaVista Software, Inc.
3 * Copyright (c) 2005 OSDL.
4 * Copyright (c) 2006-2012 Red Hat, Inc.
5 *
6 * All rights reserved.
7 *
8 * Author: Steven Dake (sdake@redhat.com)
9 * Author: Mark Haverkamp (markh@osdl.org)
10 *
11 * This software licensed under BSD license, the text of which follows:
12 *
13 * Redistribution and use in source and binary forms, with or without
14 * modification, are permitted provided that the following conditions are met:
15 *
16 * - Redistributions of source code must retain the above copyright notice,
17 * this list of conditions and the following disclaimer.
18 * - Redistributions in binary form must reproduce the above copyright notice,
19 * this list of conditions and the following disclaimer in the documentation
20 * and/or other materials provided with the distribution.
21 * - Neither the name of the MontaVista Software, Inc. nor the names of its
22 * contributors may be used to endorse or promote products derived from this
23 * software without specific prior written permission.
24 *
25 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
26 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
27 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
28 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
29 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
30 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
31 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
32 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
33 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
34 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
35 * THE POSSIBILITY OF SUCH DAMAGE.
36 */
37
38/*
39 * FRAGMENTATION AND PACKING ALGORITHM:
40 *
41 * Assemble the entire message into one buffer
42 * if full fragment
43 * store fragment into lengths list
44 * for each full fragment
45 * multicast fragment
46 * set length and fragment fields of pg message
47 * store remaining multicast into head of fragmentation data and set lens field
48 *
49 * If a message exceeds the maximum packet size allowed by the totem
50 * single ring protocol, the protocol could lose forward progress.
51 * Statically calculating the allowed data amount doesn't work because
52 * the amount of data allowed depends on the number of fragments in
53 * each message. In this implementation, the maximum fragment size
54 * is dynamically calculated for each fragment added to the message.
55
56 * It is possible for a message to be two bytes short of the maximum
57 * packet size. This occurs when a message or collection of
58 * messages + the mcast header + the lens are two bytes short of the
59 * end of the packet. Since another len field consumes two bytes, the
60 * len field would consume the rest of the packet without room for data.
61 *
62 * One optimization would be to forgo the final len field and determine
63 * it from the size of the udp datagram. Then this condition would no
64 * longer occur.
65 */
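/*
 * Worked example of the two-bytes-short condition above (illustrative
 * numbers, assuming no structure padding): with net_mtu = 1500,
 * sizeof (struct totempg_mcast) is 8, leaving 1492 bytes per packet
 * for the len fields plus packed data. If the lens and data packed so
 * far occupy 1490 of those bytes, the next len field (2 bytes) would
 * consume the remainder of the packet with no room left for the data
 * it describes.
 */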
66
67/*
68 * ASSEMBLY AND UNPACKING ALGORITHM:
69 *
70 * copy incoming packet into assembly data buffer indexed by current
71 * location of end of fragment
72 *
73 * if not fragmented
74 * deliver all messages in assembly data buffer
75 * else
76 * if msg_count > 1 and fragmented
77 * deliver all messages except last message in assembly data buffer
78 * copy last fragmented section to start of assembly data buffer
79 * else
80 * if msg_count = 1 and fragmented
81 * do nothing
82 *
83 */
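/*
 * Walkthrough of the above for a message split across two packets:
 * packet one arrives with msg_count = 3 and the fragmented field set,
 * so the two complete messages are delivered and the trailing fragment
 * is copied to the start of the assembly data buffer; packet two
 * arrives with a matching continuation field, its data is appended at
 * the saved index, and the now-complete message is delivered.
 */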
84
85#include <config.h>
86
87#ifdef HAVE_ALLOCA_H
88#include <alloca.h>
89#endif
90#include <sys/types.h>
91#include <sys/socket.h>
92#include <netinet/in.h>
93#include <arpa/inet.h>
94#include <sys/uio.h>
95#include <stdio.h>
96#include <stdlib.h>
97#include <string.h>
98#include <assert.h>
99#include <pthread.h>
100#include <errno.h>
101#include <limits.h>
102
103#include <corosync/swab.h>
104#include <qb/qblist.h>
105#include <qb/qbloop.h>
106#include <qb/qbipcs.h>
108#define LOGSYS_UTILS_ONLY 1
109#include <corosync/logsys.h>
110
111#include "util.h"
112#include "totemsrp.h"
113
114struct totempg_mcast_header {
115 short version;
116 short type;
117};
118
119#if !(defined(__i386__) || defined(__x86_64__))
120/*
121 * Need alignment on architectures other than i386 or x86_64
122 */
123#define TOTEMPG_NEED_ALIGN 1
124#endif
125
126/*
127 * totempg_mcast structure
128 *
129 * header: Identify the mcast.
130 * fragmented: Set if this message continues into next message
131 * continuation: Set if this message is a continuation from last message
132 * msg_count Indicates how many packed messages are contained
133 * in the mcast.
134 * Also, the size of each packed message and the messages themselves are
135 * appended to the end of this structure when sent.
136 */
137struct totempg_mcast {
138 struct totempg_mcast_header header;
139 unsigned char fragmented;
140 unsigned char continuation;
141 unsigned short msg_count;
142 /*
143 * short msg_len[msg_count];
144 */
145 /*
146 * data for messages
147 */
148};
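/*
 * Resulting on-the-wire layout of one multicast, as parsed by
 * totempg_deliver_fn () below:
 *
 * struct totempg_mcast header, fragmented, continuation, msg_count
 * unsigned short lens[msg_count] size of each packed message
 * packed message data lens[0] + ... + lens[msg_count - 1] bytes
 */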
149
150/*
151 * Maximum packet size for totem pg messages
152 */
153#define TOTEMPG_PACKET_SIZE (totempg_totem_config->net_mtu - \
154 sizeof (struct totempg_mcast))
155
156/*
157 * Local variables used for packing small messages
158 */
159static unsigned short mcast_packed_msg_lens[FRAME_SIZE_MAX];
160
161static int mcast_packed_msg_count = 0;
162
163static int totempg_reserved = 1;
164
165static unsigned int totempg_size_limit;
166
167static totem_queue_level_changed_fn totem_queue_level_changed = NULL;
168
169static uint32_t totempg_threaded_mode = 0;
170
171static void *totemsrp_context;
172
173/*
174 * Function and data used to log messages
175 */
176static int totempg_log_level_security;
177static int totempg_log_level_error;
178static int totempg_log_level_warning;
179static int totempg_log_level_notice;
180static int totempg_log_level_debug;
181static int totempg_subsys_id;
182static void (*totempg_log_printf) (
183 int level,
184 int subsys,
185 const char *function,
186 const char *file,
187 int line,
188 const char *format, ...) __attribute__((format(printf, 6, 7)));
189
190static struct totem_config *totempg_totem_config;
191
192static totempg_stats_t totempg_stats;
193
194enum throw_away_mode {
195 THROW_AWAY_INACTIVE,
196 THROW_AWAY_ACTIVE
197};
198
199struct assembly {
200 unsigned int nodeid;
201 unsigned char data[MESSAGE_SIZE_MAX+KNET_MAX_PACKET_SIZE];
202 int index;
203 unsigned char last_frag_num;
204 enum throw_away_mode throw_away_mode;
205 struct qb_list_head list;
206};
207
208static void assembly_deref (struct assembly *assembly);
209
210static int callback_token_received_fn (enum totem_callback_token_type type,
211 const void *data);
212
213QB_LIST_DECLARE(assembly_list_inuse);
214
215/*
216 * Free list is used both for transitional and operational assemblies
217 */
218QB_LIST_DECLARE(assembly_list_free);
219
220QB_LIST_DECLARE(assembly_list_inuse_trans);
221
222QB_LIST_DECLARE(totempg_groups_list);
223
224/*
225 * Staging buffer for packed messages. Messages are staged in this buffer
226 * before sending. Multiple messages may fit which cuts down on the
227 * number of mcasts sent. If a message doesn't completely fit, then
228 * the mcast header has a fragment bit set that says that there is more
229 * data to follow. fragment_size is an index into the buffer. It indicates
230 * the size of message data and where to place new message data.
231 * fragment_continuation indicates whether the first packed message in
232 * the buffer is a continuation of a previously packed fragment.
233 */
234static unsigned char *fragmentation_data;
235
236static int fragment_size = 0;
237
238static int fragment_continuation = 0;
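/*
 * Example of the staging variables in action: two small messages
 * passed to mcast_msg () that both fit leave their sizes in
 * mcast_packed_msg_lens[], advance fragment_size past both payloads
 * and keep fragment_continuation at 0; the next token arrival
 * (callback_token_received_fn) then sends them in a single mcast.
 */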
239
240static int totempg_waiting_transack = 0;
241
242struct totempg_group_instance {
243 void (*deliver_fn) (
244 unsigned int nodeid,
245 const void *msg,
246 unsigned int msg_len,
247 int endian_conversion_required);
248
249 void (*confchg_fn) (
250 enum totem_configuration_type configuration_type,
251 const unsigned int *member_list, size_t member_list_entries,
252 const unsigned int *left_list, size_t left_list_entries,
253 const unsigned int *joined_list, size_t joined_list_entries,
254 const struct memb_ring_id *ring_id);
255
256 struct totempg_group *groups;
257
258 int groups_cnt;
259 int32_t q_level;
260
261 struct qb_list_head list;
262};
263
264static unsigned char next_fragment = 1;
265
266static pthread_mutex_t totempg_mutex = PTHREAD_MUTEX_INITIALIZER;
267
268static pthread_mutex_t callback_token_mutex = PTHREAD_MUTEX_INITIALIZER;
269
270static pthread_mutex_t mcast_msg_mutex = PTHREAD_MUTEX_INITIALIZER;
271
272#define log_printf(level, format, args...) \
273do { \
274 totempg_log_printf(level, \
275 totempg_subsys_id, \
276 __FUNCTION__, __FILE__, __LINE__, \
277 format, ##args); \
278} while (0);
279
280static int msg_count_send_ok (int msg_count);
281
282static int byte_count_send_ok (int byte_count);
283
284static void totempg_waiting_trans_ack_cb (int waiting_trans_ack)
285{
286 log_printf(LOG_DEBUG, "waiting_trans_ack changed to %u", waiting_trans_ack);
287 totempg_waiting_transack = waiting_trans_ack;
288}
289
290static struct assembly *assembly_ref (unsigned int nodeid)
291{
292 struct assembly *assembly;
293 struct qb_list_head *list;
294 struct qb_list_head *active_assembly_list_inuse;
295
296 if (totempg_waiting_transack) {
297 active_assembly_list_inuse = &assembly_list_inuse_trans;
298 } else {
299 active_assembly_list_inuse = &assembly_list_inuse;
300 }
301
302 /*
303 * Search inuse list for node id and return assembly buffer if found
304 */
305 qb_list_for_each(list, active_assembly_list_inuse) {
306 assembly = qb_list_entry (list, struct assembly, list);
307
308 if (nodeid == assembly->nodeid) {
309 return (assembly);
310 }
311 }
312
313 /*
314 * Nothing found in inuse list get one from free list if available
315 */
316 if (qb_list_empty (&assembly_list_free) == 0) {
317 assembly = qb_list_first_entry (&assembly_list_free, struct assembly, list);
318 qb_list_del (&assembly->list);
319 qb_list_add (&assembly->list, active_assembly_list_inuse);
320 assembly->nodeid = nodeid;
321 assembly->index = 0;
322 assembly->last_frag_num = 0;
323 assembly->throw_away_mode = THROW_AWAY_INACTIVE;
324 return (assembly);
325 }
326
327 /*
328 * Nothing available in inuse or free list, so allocate a new one
329 */
330 assembly = malloc (sizeof (struct assembly));
331 /*
332 * TODO handle memory allocation failure here
333 */
334 assert (assembly);
335 assembly->nodeid = nodeid;
336 assembly->data[0] = 0;
337 assembly->index = 0;
338 assembly->last_frag_num = 0;
339 assembly->throw_away_mode = THROW_AWAY_INACTIVE;
340 qb_list_init (&assembly->list);
341 qb_list_add (&assembly->list, active_assembly_list_inuse);
342
343 return (assembly);
344}
345
346static void assembly_deref (struct assembly *assembly)
347{
348 qb_list_del (&assembly->list);
349 qb_list_add (&assembly->list, &assembly_list_free);
350}
351
352static void assembly_deref_from_normal_and_trans (int nodeid)
353{
354 int j;
355 struct qb_list_head *list, *tmp_iter;
356 struct qb_list_head *active_assembly_list_inuse;
357 struct assembly *assembly;
358
359 for (j = 0; j < 2; j++) {
360 if (j == 0) {
361 active_assembly_list_inuse = &assembly_list_inuse;
362 } else {
363 active_assembly_list_inuse = &assembly_list_inuse_trans;
364 }
365
366 qb_list_for_each_safe(list, tmp_iter, active_assembly_list_inuse) {
367 assembly = qb_list_entry (list, struct assembly, list);
368
369 if (nodeid == assembly->nodeid) {
370 qb_list_del (&assembly->list);
371 qb_list_add (&assembly->list, &assembly_list_free);
372 }
373 }
374 }
375
376}
377
378static inline void app_confchg_fn (
379 enum totem_configuration_type configuration_type,
380 const unsigned int *member_list, size_t member_list_entries,
381 const unsigned int *left_list, size_t left_list_entries,
382 const unsigned int *joined_list, size_t joined_list_entries,
383 const struct memb_ring_id *ring_id)
384{
385 int i;
386 struct totempg_group_instance *instance;
387 struct qb_list_head *list;
388
389 /*
390 * For every leaving processor, add to free list
391 * This also has the side effect of clearing out the dataset
392 * in the leaving processor's assembly buffer.
393 */
394 for (i = 0; i < left_list_entries; i++) {
395 assembly_deref_from_normal_and_trans (left_list[i]);
396 }
397
398 qb_list_for_each(list, &totempg_groups_list) {
399 instance = qb_list_entry (list, struct totempg_group_instance, list);
400
401 if (instance->confchg_fn) {
402 instance->confchg_fn (
403 configuration_type,
404 member_list,
405 member_list_entries,
406 left_list,
407 left_list_entries,
408 joined_list,
409 joined_list_entries,
410 ring_id);
411 }
412 }
413}
414
415static inline void group_endian_convert (
416 void *msg,
417 int msg_len)
418{
419 unsigned short *group_len;
420 int i;
421 char *aligned_msg;
422
423#ifdef TOTEMPG_NEED_ALIGN
424 /*
425 * Align data structure on architectures other than i386 or x86_64
426 */
427 if ((size_t)msg % sizeof(char *) != 0) {
428 aligned_msg = alloca(msg_len);
429 memcpy(aligned_msg, msg, msg_len);
430 } else {
431 aligned_msg = msg;
432 }
433#else
434 aligned_msg = msg;
435#endif
436
437 group_len = (unsigned short *)aligned_msg;
438 group_len[0] = swab16(group_len[0]);
439 for (i = 1; i < group_len[0] + 1; i++) {
440 group_len[i] = swab16(group_len[i]);
441 }
442
443 if (aligned_msg != msg) {
444 memcpy(msg, aligned_msg, msg_len);
445 }
446}
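/*
 * Layout of the group header that group_endian_convert () swaps and
 * group_matches () parses, as built by the mcast_joined/mcast_groups
 * marshalling code below:
 *
 * group_len[0] number of groups in the message
 * group_len[1..n] length of each group name
 * group names concatenated, unpadded
 * application message data follows immediately
 */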
447
448static inline int group_matches (
449 struct iovec *iovec,
450 unsigned int iov_len,
451 struct totempg_group *groups_b,
452 unsigned int group_b_cnt,
453 unsigned int *adjust_iovec)
454{
455 unsigned short *group_len;
456 char *group_name;
457 int i;
458 int j;
459#ifdef TOTEMPG_NEED_ALIGN
460 struct iovec iovec_aligned = { NULL, 0 };
461#endif
462
463 assert (iov_len == 1);
464
465#ifdef TOTEMPG_NEED_ALIGN
466 /*
467 * Align data structure on architectures other than i386 or x86_64
468 */
469 if ((size_t)iovec->iov_base % sizeof(char *) != 0) {
470 iovec_aligned.iov_base = alloca(iovec->iov_len);
471 memcpy(iovec_aligned.iov_base, iovec->iov_base, iovec->iov_len);
472 iovec_aligned.iov_len = iovec->iov_len;
473 iovec = &iovec_aligned;
474 }
475#endif
476
477 group_len = (unsigned short *)iovec->iov_base;
478 group_name = ((char *)iovec->iov_base) +
479 sizeof (unsigned short) * (group_len[0] + 1);
480
481
482 /*
483 * Calculate amount to adjust the iovec by before delivering to app
484 */
485 *adjust_iovec = sizeof (unsigned short) * (group_len[0] + 1);
486 for (i = 1; i < group_len[0] + 1; i++) {
487 *adjust_iovec += group_len[i];
488 }
489
490 /*
491 * Determine if this message should be delivered to this instance
492 */
493 for (i = 1; i < group_len[0] + 1; i++) {
494 for (j = 0; j < group_b_cnt; j++) {
495 if ((group_len[i] == groups_b[j].group_len) &&
496 (memcmp (groups_b[j].group, group_name, group_len[i]) == 0)) {
497 return (1);
498 }
499 }
500 group_name += group_len[i];
501 }
502 return (0);
503}
504
505
506static inline void app_deliver_fn (
507 unsigned int nodeid,
508 void *msg,
509 unsigned int msg_len,
510 int endian_conversion_required)
511{
512 struct totempg_group_instance *instance;
513 struct iovec stripped_iovec;
514 unsigned int adjust_iovec;
515 struct iovec *iovec;
516 struct qb_list_head *list;
517
518 struct iovec aligned_iovec = { NULL, 0 };
519
520 if (endian_conversion_required) {
521 group_endian_convert (msg, msg_len);
522 }
523
524 /*
525 * TODO: segmentation/assembly need to be redesigned to provide aligned access
526 * in all cases to avoid memory copies on non-i386 archs. Probably broke backwards
527 * compatibility
528 */
529
530#ifdef TOTEMPG_NEED_ALIGN
531 /*
532 * Align data structure on architectures other than i386 or x86_64
533 */
534 aligned_iovec.iov_base = alloca(msg_len);
535 aligned_iovec.iov_len = msg_len;
536 memcpy(aligned_iovec.iov_base, msg, msg_len);
537#else
538 aligned_iovec.iov_base = msg;
539 aligned_iovec.iov_len = msg_len;
540#endif
541
542 iovec = &aligned_iovec;
543
544 qb_list_for_each(list, &totempg_groups_list) {
545 instance = qb_list_entry (list, struct totempg_group_instance, list);
546 if (group_matches (iovec, 1, instance->groups, instance->groups_cnt, &adjust_iovec)) {
547 stripped_iovec.iov_len = iovec->iov_len - adjust_iovec;
548 stripped_iovec.iov_base = (char *)iovec->iov_base + adjust_iovec;
549
550#ifdef TOTEMPG_NEED_ALIGN
551 /*
552 * Align data structure on architectures other than i386 or x86_64
553 */
554 if ((uintptr_t)((char *)iovec->iov_base + adjust_iovec) % (sizeof(char *)) != 0) {
555 /*
556 * Deal with misalignment
557 */
558 stripped_iovec.iov_base =
559 alloca (stripped_iovec.iov_len);
560 memcpy (stripped_iovec.iov_base,
561 (char *)iovec->iov_base + adjust_iovec,
562 stripped_iovec.iov_len);
563 }
564#endif
565 instance->deliver_fn (
566 nodeid,
567 stripped_iovec.iov_base,
568 stripped_iovec.iov_len,
569 endian_conversion_required);
570 }
571 }
572}
573
574static void totempg_confchg_fn (
575 enum totem_configuration_type configuration_type,
576 const unsigned int *member_list, size_t member_list_entries,
577 const unsigned int *left_list, size_t left_list_entries,
578 const unsigned int *joined_list, size_t joined_list_entries,
579 const struct memb_ring_id *ring_id)
580{
581// TODO optimize this
582 app_confchg_fn (configuration_type,
583 member_list, member_list_entries,
584 left_list, left_list_entries,
585 joined_list, joined_list_entries,
586 ring_id);
587}
588
589static void totempg_deliver_fn (
590 unsigned int nodeid,
591 const void *msg,
592 unsigned int msg_len,
593 int endian_conversion_required)
594{
595 struct totempg_mcast *mcast;
596 unsigned short *msg_lens;
597 int i;
598 struct assembly *assembly;
599 char header[FRAME_SIZE_MAX];
600 int msg_count;
601 int continuation;
602 int start;
603 const char *data;
604 int datasize;
605 struct iovec iov_delv;
606 size_t expected_msg_len;
607
608 assembly = assembly_ref (nodeid);
609 assert (assembly);
610
611 if (msg_len < sizeof(struct totempg_mcast)) {
612 log_printf(LOG_WARNING,
613 "Message (totempg_mcast) received from node " CS_PRI_NODE_ID " is too short... Ignoring.", nodeid);
614
615 return ;
616 }
617
618 /*
619 * Assemble the header into one block of data and
620 * assemble the packet contents into one block of data to simplify delivery
621 */
622
623 mcast = (struct totempg_mcast *)msg;
624 if (endian_conversion_required) {
625 mcast->msg_count = swab16 (mcast->msg_count);
626 }
627
628 msg_count = mcast->msg_count;
629 datasize = sizeof (struct totempg_mcast) +
630 msg_count * sizeof (unsigned short);
631
632 if (msg_len < datasize) {
633 log_printf(LOG_WARNING,
634 "Message (totempg_mcast datasize) received from node " CS_PRI_NODE_ID
635 " is too short... Ignoring.", nodeid);
636
637 return ;
638 }
639
640 memcpy (header, msg, datasize);
641 data = msg;
642
643 msg_lens = (unsigned short *) (header + sizeof (struct totempg_mcast));
644 expected_msg_len = datasize;
645 for (i = 0; i < mcast->msg_count; i++) {
646 if (endian_conversion_required) {
647 msg_lens[i] = swab16 (msg_lens[i]);
648 }
649
650 expected_msg_len += msg_lens[i];
651 }
652
653 if (msg_len != expected_msg_len) {
654 log_printf(LOG_WARNING,
655 "Message (totempg_mcast) received from node " CS_PRI_NODE_ID
656 " doesn't have expected length of %zu (has %u) bytes... Ignoring.",
657 nodeid, expected_msg_len, msg_len);
658
659 return ;
660 }
661
662 assert((assembly->index+msg_len) < sizeof(assembly->data));
663 memcpy (&assembly->data[assembly->index], &data[datasize],
664 msg_len - datasize);
665
666 /*
667 * If the last message in the buffer is a fragment, then we
668 * can't deliver it. We'll first deliver the full messages
669 * then adjust the assembly buffer so we can add the rest of the
670 * fragment when it arrives.
671 */
672 msg_count = mcast->fragmented ? mcast->msg_count - 1 : mcast->msg_count;
673 continuation = mcast->continuation;
674 iov_delv.iov_base = (void *)&assembly->data[0];
675 iov_delv.iov_len = assembly->index + msg_lens[0];
676
677 /*
678 * Make sure that if this message is a continuation, that it
679 * matches the sequence number of the previous fragment.
680 * Also, if the first packed message is a continuation
681 * of a previous message, but the assembly buffer
682 * is empty, then we need to discard it since we can't
683 * assemble a complete message. Likewise, if this message isn't a
684 * continuation and the assembly buffer is empty, we have to discard
685 * the continued message.
686 */
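/*
 * throw_away_mode implements the discard cases: after a continuation
 * mismatch, THROW_AWAY_ACTIVE drops the leading stale fragment of each
 * subsequent packet until one arrives whose first message starts fresh
 * (fragmented 0 or 1), at which point reassembly resumes.
 */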
687 start = 0;
688
689 if (assembly->throw_away_mode == THROW_AWAY_ACTIVE) {
690 /* Throw away the first msg block */
691 if (mcast->fragmented == 0 || mcast->fragmented == 1) {
692 assembly->throw_away_mode = THROW_AWAY_INACTIVE;
693
694 assembly->index += msg_lens[0];
695 iov_delv.iov_base = (void *)&assembly->data[assembly->index];
696 iov_delv.iov_len = msg_lens[1];
697 start = 1;
698 }
699 } else
700 if (assembly->throw_away_mode == THROW_AWAY_INACTIVE) {
701 if (continuation == assembly->last_frag_num) {
702 assembly->last_frag_num = mcast->fragmented;
703 for (i = start; i < msg_count; i++) {
704 app_deliver_fn(nodeid, iov_delv.iov_base, iov_delv.iov_len,
705 endian_conversion_required);
706 assembly->index += msg_lens[i];
707 iov_delv.iov_base = (void *)&assembly->data[assembly->index];
708 if (i < (msg_count - 1)) {
709 iov_delv.iov_len = msg_lens[i + 1];
710 }
711 }
712 } else {
713 log_printf (LOG_DEBUG, "fragmented continuation %u is not equal to assembly last_frag_num %u",
714 continuation, assembly->last_frag_num);
715 assembly->throw_away_mode = THROW_AWAY_ACTIVE;
716 }
717 }
718
719 if (mcast->fragmented == 0) {
720 /*
721 * End of messages, dereference assembly struct
722 */
723 assembly->last_frag_num = 0;
724 assembly->index = 0;
725 assembly_deref (assembly);
726 } else {
727 /*
728 * Message is fragmented, keep around assembly list
729 */
730 if (mcast->msg_count > 1) {
731 memmove (&assembly->data[0],
732 &assembly->data[assembly->index],
733 msg_lens[msg_count]);
734
735 assembly->index = 0;
736 }
737 assembly->index += msg_lens[msg_count];
738 }
739}
740
741/*
742 * Totem Process Group Abstraction
743 * depends on poll abstraction, POSIX, IPV4
744 */
745
746void *callback_token_received_handle;
747
748int callback_token_received_fn (enum totem_callback_token_type type,
749 const void *data)
750{
751 struct totempg_mcast mcast;
752 struct iovec iovecs[3];
753
754 if (totempg_threaded_mode == 1) {
755 pthread_mutex_lock (&mcast_msg_mutex);
756 }
757 if (mcast_packed_msg_count == 0) {
758 if (totempg_threaded_mode == 1) {
759 pthread_mutex_unlock (&mcast_msg_mutex);
760 }
761 return (0);
762 }
763 if (totemsrp_avail(totemsrp_context) == 0) {
764 if (totempg_threaded_mode == 1) {
765 pthread_mutex_unlock (&mcast_msg_mutex);
766 }
767 return (0);
768 }
769 mcast.header.version = 0;
770 mcast.header.type = 0;
771 mcast.fragmented = 0;
772
773 /*
774 * Was the first message in this buffer a continuation of a
775 * fragmented message?
776 */
777 mcast.continuation = fragment_continuation;
778 fragment_continuation = 0;
779
780 mcast.msg_count = mcast_packed_msg_count;
781
782 iovecs[0].iov_base = (void *)&mcast;
783 iovecs[0].iov_len = sizeof (struct totempg_mcast);
784 iovecs[1].iov_base = (void *)mcast_packed_msg_lens;
785 iovecs[1].iov_len = mcast_packed_msg_count * sizeof (unsigned short);
786 iovecs[2].iov_base = (void *)&fragmentation_data[0];
787 iovecs[2].iov_len = fragment_size;
788 (void)totemsrp_mcast (totemsrp_context, iovecs, 3, 0);
789
790 mcast_packed_msg_count = 0;
791 fragment_size = 0;
792
793 if (totempg_threaded_mode == 1) {
794 pthread_mutex_unlock (&mcast_msg_mutex);
795 }
796 return (0);
797}
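/*
 * The staging buffer is flushed from callback_token_received_fn ()
 * above: messages packed since the last token rotation are sent as one
 * mcast the next time this node sees the token and totemsrp_avail ()
 * reports queue space.
 */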
798
799/*
800 * Initialize the totem process group abstraction
801 */
802int totempg_initialize (
803 qb_loop_t *poll_handle,
804 struct totem_config *totem_config)
805{
806 int res;
807
808 totempg_totem_config = totem_config;
809 totempg_log_level_security = totem_config->totem_logging_configuration.log_level_security;
810 totempg_log_level_error = totem_config->totem_logging_configuration.log_level_error;
811 totempg_log_level_warning = totem_config->totem_logging_configuration.log_level_warning;
812 totempg_log_level_notice = totem_config->totem_logging_configuration.log_level_notice;
813 totempg_log_level_debug = totem_config->totem_logging_configuration.log_level_debug;
814 totempg_log_printf = totem_config->totem_logging_configuration.log_printf;
815 totempg_subsys_id = totem_config->totem_logging_configuration.log_subsys_id;
816
817 fragmentation_data = malloc (TOTEMPG_PACKET_SIZE);
818 if (fragmentation_data == 0) {
819 return (-1);
820 }
821
822 totemsrp_net_mtu_adjust (totem_config);
823
824 res = totemsrp_initialize (
825 poll_handle,
826 &totemsrp_context,
827 totem_config,
828 &totempg_stats,
829 totempg_deliver_fn,
830 totempg_confchg_fn,
831 totempg_waiting_trans_ack_cb);
832
833 if (res == -1) {
834 goto error_exit;
835 }
836
837 totemsrp_callback_token_create (
838 totemsrp_context,
839 &callback_token_received_handle,
840 TOTEM_CALLBACK_TOKEN_RECEIVED,
841 0,
842 callback_token_received_fn,
843 0);
844
845 totempg_size_limit = (totemsrp_avail(totemsrp_context) - 1) *
846 (totempg_totem_config->net_mtu -
847 sizeof (struct totempg_mcast) - 16);
848
849 qb_list_init (&totempg_groups_list);
850
851error_exit:
852 return (res);
853}
854
855void totempg_finalize (void)
856{
857 if (totempg_threaded_mode == 1) {
858 pthread_mutex_lock (&totempg_mutex);
859 }
860 totemsrp_finalize (totemsrp_context);
861 if (totempg_threaded_mode == 1) {
862 pthread_mutex_unlock (&totempg_mutex);
863 }
864}
865
866/*
867 * Multicast a message
868 */
869static int mcast_msg (
870 struct iovec *iovec_in,
871 unsigned int iov_len,
872 int guarantee)
873{
874 int res = 0;
875 struct totempg_mcast mcast;
876 struct iovec iovecs[3];
877 struct iovec iovec[64];
878 int i;
879 int dest, src;
880 int max_packet_size = 0;
881 int copy_len = 0;
882 int copy_base = 0;
883 int total_size = 0;
884
885 if (totempg_threaded_mode == 1) {
886 pthread_mutex_lock (&mcast_msg_mutex);
887 }
888 totemsrp_event_signal (totemsrp_context, TOTEM_EVENT_NEW_MSG, 1);
889
890 /*
891 * Remove zero length iovectors from the list
892 */
893 assert (iov_len < 64);
894 for (dest = 0, src = 0; src < iov_len; src++) {
895 if (iovec_in[src].iov_len) {
896 memcpy (&iovec[dest++], &iovec_in[src],
897 sizeof (struct iovec));
898 }
899 }
900 iov_len = dest;
901
902 max_packet_size = TOTEMPG_PACKET_SIZE -
903 (sizeof (unsigned short) * (mcast_packed_msg_count + 1));
904
905 mcast_packed_msg_lens[mcast_packed_msg_count] = 0;
906
907 /*
908 * Check if we would overwrite new message queue
909 */
910 for (i = 0; i < iov_len; i++) {
911 total_size += iovec[i].iov_len;
912 }
913
914 if (byte_count_send_ok (total_size + sizeof(unsigned short) *
915 (mcast_packed_msg_count)) == 0) {
916
917 if (totempg_threaded_mode == 1) {
918 pthread_mutex_unlock (&mcast_msg_mutex);
919 }
920 return(-1);
921 }
922
923 memset(&mcast, 0, sizeof(mcast));
924
925 mcast.header.version = 0;
926 for (i = 0; i < iov_len; ) {
927 mcast.fragmented = 0;
928 mcast.continuation = fragment_continuation;
929 copy_len = iovec[i].iov_len - copy_base;
930
931 /*
932 * If it all fits with room left over, copy it in.
933 * We need to leave at least sizeof(short) + 1 bytes in the
934 * fragment_buffer on exit so that max_packet_size + fragment_size
935 * doesn't exceed the size of the fragment_buffer on the next call.
936 */
937 if ((iovec[i].iov_len + fragment_size) <
938 (max_packet_size - sizeof (unsigned short))) {
939
940 memcpy (&fragmentation_data[fragment_size],
941 (char *)iovec[i].iov_base + copy_base, copy_len);
942 fragment_size += copy_len;
943 mcast_packed_msg_lens[mcast_packed_msg_count] += copy_len;
944 next_fragment = 1;
945 copy_len = 0;
946 copy_base = 0;
947 i++;
948 continue;
949
950 /*
951 * If it just fits or is too big, then send out what fits.
952 */
953 } else {
954 unsigned char *data_ptr;
955
956 copy_len = min(copy_len, max_packet_size - fragment_size);
957 if( copy_len == max_packet_size )
958 data_ptr = (unsigned char *)iovec[i].iov_base + copy_base;
959 else {
960 data_ptr = fragmentation_data;
961 }
962
963 memcpy (&fragmentation_data[fragment_size],
964 (unsigned char *)iovec[i].iov_base + copy_base, copy_len);
965 mcast_packed_msg_lens[mcast_packed_msg_count] += copy_len;
966
967 /*
968 * if we're not on the last iovec or the iovec is too large to
969 * fit, then indicate a fragment. This also means that the next
970 * message will have the continuation of this one.
971 */
972 if ((i < (iov_len - 1)) ||
973 ((copy_base + copy_len) < iovec[i].iov_len)) {
974 if (!next_fragment) {
975 next_fragment++;
976 }
977 fragment_continuation = next_fragment;
978 mcast.fragmented = next_fragment++;
979 assert(fragment_continuation != 0);
980 assert(mcast.fragmented != 0);
981 } else {
982 fragment_continuation = 0;
983 }
984
985 /*
986 * assemble the message and send it
987 */
988 mcast.msg_count = ++mcast_packed_msg_count;
989 iovecs[0].iov_base = (void *)&mcast;
990 iovecs[0].iov_len = sizeof(struct totempg_mcast);
991 iovecs[1].iov_base = (void *)mcast_packed_msg_lens;
992 iovecs[1].iov_len = mcast_packed_msg_count *
993 sizeof(unsigned short);
994 iovecs[2].iov_base = (void *)data_ptr;
995 iovecs[2].iov_len = fragment_size + copy_len;
996 assert (totemsrp_avail(totemsrp_context) > 0);
997 res = totemsrp_mcast (totemsrp_context, iovecs, 3, guarantee);
998 if (res == -1) {
999 goto error_exit;
1000 }
1001
1002 /*
1003 * Recalculate counts and indexes for the next.
1004 */
1005 mcast_packed_msg_lens[0] = 0;
1006 mcast_packed_msg_count = 0;
1007 fragment_size = 0;
1008 max_packet_size = TOTEMPG_PACKET_SIZE - (sizeof(unsigned short));
1009
1010 /*
1011 * If the iovec all fit, go to the next iovec
1012 */
1013 if ((copy_base + copy_len) == iovec[i].iov_len) {
1014 copy_len = 0;
1015 copy_base = 0;
1016 i++;
1017
1018 /*
1019 * Continue with the rest of the current iovec.
1020 */
1021 } else {
1022 copy_base += copy_len;
1023 }
1024 }
1025 }
1026
1027 /*
1028 * Bump only if we added message data. This may be zero if
1029 * the last buffer just fit into the fragmentation_data buffer
1030 * and we were at the last iovec.
1031 */
1032 if (mcast_packed_msg_lens[mcast_packed_msg_count]) {
1033 mcast_packed_msg_count++;
1034 }
1035
1036error_exit:
1037 if (totempg_threaded_mode == 1) {
1038 pthread_mutex_unlock (&mcast_msg_mutex);
1039 }
1040 return (res);
1041}
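/*
 * Sketch of the fragmentation loop in mcast_msg () above for a message
 * larger than max_packet_size: each full packet is multicast
 * immediately with mcast.fragmented set to next_fragment (an
 * incrementing, wrapping sequence number that skips 0), and the
 * receiver matches that value against the continuation field of the
 * following packet; a final piece that fits with room to spare is left
 * in fragmentation_data to be packed with later messages and flushed
 * by callback_token_received_fn ().
 */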
1042
1043/*
1044 * Determine if msg_count messages could be queued
1045 */
1046static int msg_count_send_ok (
1047 int msg_count)
1048{
1049 int avail = 0;
1050
1051 avail = totemsrp_avail (totemsrp_context);
1052 totempg_stats.msg_queue_avail = avail;
1053
1054 return ((avail - totempg_reserved) > msg_count);
1055}
1056
1057static int byte_count_send_ok (
1058 int byte_count)
1059{
1060 unsigned int msg_count = 0;
1061 int avail = 0;
1062
1063 avail = totemsrp_avail (totemsrp_context);
1064
1065 msg_count = (byte_count / (totempg_totem_config->net_mtu - sizeof (struct totempg_mcast) - 16)) + 1;
1066
1067 return (avail >= msg_count);
1068}
1069
1070static int send_reserve (
1071 int msg_size)
1072{
1073 unsigned int msg_count = 0;
1074
1075 msg_count = (msg_size / (totempg_totem_config->net_mtu - sizeof (struct totempg_mcast) - 16)) + 1;
1076 totempg_reserved += msg_count;
1077 totempg_stats.msg_reserved = totempg_reserved;
1078
1079 return (msg_count);
1080}
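/*
 * Example of the reservation arithmetic in send_reserve () above
 * (illustrative numbers, assuming no structure padding): with
 * net_mtu = 1500 the divisor is 1500 - 8 - 16 = 1476, so reserving a
 * 4000 byte message reserves 4000 / 1476 + 1 = 3 totemsrp messages.
 */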
1081
1082static void send_release (
1083 int msg_count)
1084{
1085 totempg_reserved -= msg_count;
1086 totempg_stats.msg_reserved = totempg_reserved;
1087}
1088
1089#ifndef HAVE_SMALL_MEMORY_FOOTPRINT
1090#undef MESSAGE_QUEUE_MAX
1091#define MESSAGE_QUEUE_MAX ((4 * MESSAGE_SIZE_MAX) / totempg_totem_config->net_mtu)
1092#endif /* HAVE_SMALL_MEMORY_FOOTPRINT */
1093
1094static uint32_t q_level_precent_used(void)
1095{
1096 return (100 - (((totemsrp_avail(totemsrp_context) - totempg_reserved) * 100) / MESSAGE_QUEUE_MAX));
1097}
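/*
 * Example: if totemsrp_avail () minus totempg_reserved leaves half of
 * MESSAGE_QUEUE_MAX free, the function above returns 50 (percent of
 * the new message queue in use).
 */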
1098
1099int totempg_callback_token_create (
1100 void **handle_out,
1101 enum totem_callback_token_type type,
1102 int delete,
1103 int (*callback_fn) (enum totem_callback_token_type type, const void *),
1104 const void *data)
1105{
1106 unsigned int res;
1107 if (totempg_threaded_mode == 1) {
1108 pthread_mutex_lock (&callback_token_mutex);
1109 }
1110 res = totemsrp_callback_token_create (totemsrp_context, handle_out, type, delete,
1111 callback_fn, data);
1112 if (totempg_threaded_mode == 1) {
1113 pthread_mutex_unlock (&callback_token_mutex);
1114 }
1115 return (res);
1116}
1117
1118void totempg_callback_token_destroy (
1119 void *handle_out)
1120{
1121 if (totempg_threaded_mode == 1) {
1122 pthread_mutex_lock (&callback_token_mutex);
1123 }
1124 totemsrp_callback_token_destroy (totemsrp_context, handle_out);
1125 if (totempg_threaded_mode == 1) {
1126 pthread_mutex_unlock (&callback_token_mutex);
1127 }
1128}
1129
1130/*
1131 * vi: set autoindent tabstop=4 shiftwidth=4 :
1132 */
1133
1134int totempg_groups_initialize (
1135 void **totempg_groups_instance,
1136
1137 void (*deliver_fn) (
1138 unsigned int nodeid,
1139 const void *msg,
1140 unsigned int msg_len,
1141 int endian_conversion_required),
1142
1143 void (*confchg_fn) (
1144 enum totem_configuration_type configuration_type,
1145 const unsigned int *member_list, size_t member_list_entries,
1146 const unsigned int *left_list, size_t left_list_entries,
1147 const unsigned int *joined_list, size_t joined_list_entries,
1148 const struct memb_ring_id *ring_id))
1149{
1150 struct totempg_group_instance *instance;
1151
1152 if (totempg_threaded_mode == 1) {
1153 pthread_mutex_lock (&totempg_mutex);
1154 }
1155
1156 instance = malloc (sizeof (struct totempg_group_instance));
1157 if (instance == NULL) {
1158 goto error_exit;
1159 }
1160
1161 instance->deliver_fn = deliver_fn;
1162 instance->confchg_fn = confchg_fn;
1163 instance->groups = 0;
1164 instance->groups_cnt = 0;
1165 instance->q_level = QB_LOOP_MED;
1166 qb_list_init (&instance->list);
1167 qb_list_add (&instance->list, &totempg_groups_list);
1168
1169 if (totempg_threaded_mode == 1) {
1170 pthread_mutex_unlock (&totempg_mutex);
1171 }
1172 *totempg_groups_instance = instance;
1173 return (0);
1174
1175error_exit:
1176 if (totempg_threaded_mode == 1) {
1177 pthread_mutex_unlock (&totempg_mutex);
1178 }
1179 return (-1);
1180}
1181
1182int totempg_groups_join (
1183 void *totempg_groups_instance,
1184 const struct totempg_group *groups,
1185 size_t group_cnt)
1186{
1187 struct totempg_group_instance *instance = (struct totempg_group_instance *)totempg_groups_instance;
1188 struct totempg_group *new_groups;
1189 int res = 0;
1190
1191 if (totempg_threaded_mode == 1) {
1192 pthread_mutex_lock (&totempg_mutex);
1193 }
1194
1195 new_groups = realloc (instance->groups,
1196 sizeof (struct totempg_group) *
1197 (instance->groups_cnt + group_cnt));
1198 if (new_groups == 0) {
1199 res = -1;
1200 goto error_exit;
1201 }
1202 memcpy (&new_groups[instance->groups_cnt],
1203 groups, group_cnt * sizeof (struct totempg_group));
1204 instance->groups = new_groups;
1205 instance->groups_cnt += group_cnt;
1206
1207error_exit:
1208 if (totempg_threaded_mode == 1) {
1209 pthread_mutex_unlock (&totempg_mutex);
1210 }
1211 return (res);
1212}
1213
1214int totempg_groups_leave (
1215 void *totempg_groups_instance,
1216 const struct totempg_group *groups,
1217 size_t group_cnt)
1218{
1219 if (totempg_threaded_mode == 1) {
1220 pthread_mutex_lock (&totempg_mutex);
1221 }
1222
1223 if (totempg_threaded_mode == 1) {
1224 pthread_mutex_unlock (&totempg_mutex);
1225 }
1226 return (0);
1227}
1228
1229#define MAX_IOVECS_FROM_APP 32
1230#define MAX_GROUPS_PER_MSG 32
1231
1232int totempg_groups_mcast_joined (
1233 void *totempg_groups_instance,
1234 const struct iovec *iovec,
1235 unsigned int iov_len,
1236 int guarantee)
1237{
1238 struct totempg_group_instance *instance = (struct totempg_group_instance *)totempg_groups_instance;
1239 unsigned short group_len[MAX_GROUPS_PER_MSG + 1];
1240 struct iovec iovec_mcast[MAX_GROUPS_PER_MSG + 1 + MAX_IOVECS_FROM_APP];
1241 int i;
1242 unsigned int res;
1243
1244 if (totempg_threaded_mode == 1) {
1245 pthread_mutex_lock (&totempg_mutex);
1246 }
1247
1248 /*
1249 * Build group_len structure and the iovec_mcast structure
1250 */
1251 group_len[0] = instance->groups_cnt;
1252 for (i = 0; i < instance->groups_cnt; i++) {
1253 group_len[i + 1] = instance->groups[i].group_len;
1254 iovec_mcast[i + 1].iov_len = instance->groups[i].group_len;
1255 iovec_mcast[i + 1].iov_base = (void *) instance->groups[i].group;
1256 }
1257 iovec_mcast[0].iov_len = (instance->groups_cnt + 1) * sizeof (unsigned short);
1258 iovec_mcast[0].iov_base = group_len;
1259 for (i = 0; i < iov_len; i++) {
1260 iovec_mcast[i + instance->groups_cnt + 1].iov_len = iovec[i].iov_len;
1261 iovec_mcast[i + instance->groups_cnt + 1].iov_base = iovec[i].iov_base;
1262 }
1263
1264 res = mcast_msg (iovec_mcast, iov_len + instance->groups_cnt + 1, guarantee);
1265
1266 if (totempg_threaded_mode == 1) {
1267 pthread_mutex_unlock (&totempg_mutex);
1268 }
1269
1270 return (res);
1271}
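/*
 * Example: an instance joined to groups "a" (len 1) and "bc" (len 2)
 * sending one application iovec builds iovec_mcast in
 * totempg_groups_mcast_joined () above as:
 *
 * [0] group_len[] = { 2, 1, 2 } (6 bytes)
 * [1] "a"
 * [2] "bc"
 * [3] application data
 *
 * which mcast_msg () then packs and, if needed, fragments.
 */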
1272
1273static void check_q_level(
1274 void *totempg_groups_instance)
1275{
1276 struct totempg_group_instance *instance = (struct totempg_group_instance *)totempg_groups_instance;
1277 int32_t old_level = instance->q_level;
1278 int32_t percent_used = q_level_precent_used();
1279
1280 if (percent_used >= 75 && instance->q_level != TOTEM_Q_LEVEL_CRITICAL) {
1281 instance->q_level = TOTEM_Q_LEVEL_CRITICAL;
1282 } else if (percent_used < 30 && instance->q_level != TOTEM_Q_LEVEL_LOW) {
1283 instance->q_level = TOTEM_Q_LEVEL_LOW;
1284 } else if (percent_used > 40 && percent_used < 50 && instance->q_level != TOTEM_Q_LEVEL_GOOD) {
1285 instance->q_level = TOTEM_Q_LEVEL_GOOD;
1286 } else if (percent_used > 60 && percent_used < 70 && instance->q_level != TOTEM_Q_LEVEL_HIGH) {
1287 instance->q_level = TOTEM_Q_LEVEL_HIGH;
1288 }
1289 if (totem_queue_level_changed && old_level != instance->q_level) {
1290 totem_queue_level_changed(instance->q_level);
1291 }
1292}
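/*
 * Note the gaps between the bands in check_q_level () above (30-40,
 * 50-60 and 70-75 percent): a queue hovering around a boundary does
 * not flip levels on every call, and totem_queue_level_changed only
 * fires when the level actually moves.
 */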
1293
1294void totempg_check_q_level(
1295 void *totempg_groups_instance)
1296{
1297 struct totempg_group_instance *instance = (struct totempg_group_instance *)totempg_groups_instance;
1298
1299 check_q_level(instance);
1300}
1301
1302int totempg_groups_joined_reserve (
1303 void *totempg_groups_instance,
1304 const struct iovec *iovec,
1305 unsigned int iov_len)
1306{
1307 struct totempg_group_instance *instance = (struct totempg_group_instance *)totempg_groups_instance;
1308 unsigned int size = 0;
1309 unsigned int i;
1310 unsigned int reserved = 0;
1311
1312 if (totempg_threaded_mode == 1) {
1313 pthread_mutex_lock (&totempg_mutex);
1314 pthread_mutex_lock (&mcast_msg_mutex);
1315 }
1316
1317 for (i = 0; i < instance->groups_cnt; i++) {
1318 size += instance->groups[i].group_len;
1319 }
1320 for (i = 0; i < iov_len; i++) {
1321 size += iovec[i].iov_len;
1322 }
1323
1324 if (size >= totempg_size_limit) {
1325 reserved = -1;
1326 goto error_exit;
1327 }
1328
1329 if (byte_count_send_ok (size)) {
1330 reserved = send_reserve (size);
1331 } else {
1332 reserved = 0;
1333 }
1334
1335error_exit:
1336 check_q_level(instance);
1337
1338 if (totempg_threaded_mode == 1) {
1339 pthread_mutex_unlock (&mcast_msg_mutex);
1340 pthread_mutex_unlock (&totempg_mutex);
1341 }
1342 return (reserved);
1343}
1344
1345
1346int totempg_groups_joined_release (int msg_count)
1347{
1348 if (totempg_threaded_mode == 1) {
1349 pthread_mutex_lock (&totempg_mutex);
1350 pthread_mutex_lock (&mcast_msg_mutex);
1351 }
1352 send_release (msg_count);
1353 if (totempg_threaded_mode == 1) {
1354 pthread_mutex_unlock (&mcast_msg_mutex);
1355 pthread_mutex_unlock (&totempg_mutex);
1356 }
1357 return 0;
1358}
1359
1360int totempg_groups_mcast_groups (
1361 void *totempg_groups_instance,
1362 int guarantee,
1363 const struct totempg_group *groups,
1364 size_t groups_cnt,
1365 const struct iovec *iovec,
1366 unsigned int iov_len)
1367{
1368 unsigned short group_len[MAX_GROUPS_PER_MSG + 1];
1369 struct iovec iovec_mcast[MAX_GROUPS_PER_MSG + 1 + MAX_IOVECS_FROM_APP];
1370 int i;
1371 unsigned int res;
1372
1373 if (totempg_threaded_mode == 1) {
1374 pthread_mutex_lock (&totempg_mutex);
1375 }
1376
1377 /*
1378 * Build group_len structure and the iovec_mcast structure
1379 */
1380 group_len[0] = groups_cnt;
1381 for (i = 0; i < groups_cnt; i++) {
1382 group_len[i + 1] = groups[i].group_len;
1383 iovec_mcast[i + 1].iov_len = groups[i].group_len;
1384 iovec_mcast[i + 1].iov_base = (void *) groups[i].group;
1385 }
1386 iovec_mcast[0].iov_len = (groups_cnt + 1) * sizeof (unsigned short);
1387 iovec_mcast[0].iov_base = group_len;
1388 for (i = 0; i < iov_len; i++) {
1389 iovec_mcast[i + groups_cnt + 1].iov_len = iovec[i].iov_len;
1390 iovec_mcast[i + groups_cnt + 1].iov_base = iovec[i].iov_base;
1391 }
1392
1393 res = mcast_msg (iovec_mcast, iov_len + groups_cnt + 1, guarantee);
1394
1395 if (totempg_threaded_mode == 1) {
1396 pthread_mutex_unlock (&totempg_mutex);
1397 }
1398 return (res);
1399}
1400
1401/*
1402 * Returns -1 if error, 0 if can't send, 1 if can send the message
1403 */
1404int totempg_groups_send_ok_groups (
1405 void *totempg_groups_instance,
1406 const struct totempg_group *groups,
1407 size_t groups_cnt,
1408 const struct iovec *iovec,
1409 unsigned int iov_len)
1410{
1411 unsigned int size = 0;
1412 unsigned int i;
1413 unsigned int res;
1414
1415 if (totempg_threaded_mode == 1) {
1416 pthread_mutex_lock (&totempg_mutex);
1417 }
1418
1419 for (i = 0; i < groups_cnt; i++) {
1420 size += groups[i].group_len;
1421 }
1422 for (i = 0; i < iov_len; i++) {
1423 size += iovec[i].iov_len;
1424 }
1425
1426 res = msg_count_send_ok (size);
1427
1428 if (totempg_threaded_mode == 1) {
1429 pthread_mutex_unlock (&totempg_mutex);
1430 }
1431 return (res);
1432}
1433
1434int totempg_iface_set (
1435 struct totem_ip_address *interface_addr,
1436 unsigned short ip_port,
1437 unsigned int iface_no)
1438{
1439 int res;
1440
1441 res = totemsrp_iface_set (
1442 totemsrp_context,
1443 interface_addr,
1444 ip_port,
1445 iface_no);
1446
1447 return (res);
1448}
1449
1450int totempg_nodestatus_get (unsigned int nodeid,
1451 struct totem_node_status *node_status)
1452{
1453 memset(node_status, 0, sizeof(struct totem_node_status));
1454 return totemsrp_nodestatus_get (totemsrp_context, nodeid, node_status);
1455}
1456
1457int totempg_ifaces_get (
1458 unsigned int nodeid,
1459 unsigned int *interface_id,
1460 struct totem_ip_address *interfaces,
1461 unsigned int interfaces_size,
1462 char ***status,
1463 unsigned int *iface_count)
1464{
1465 int res;
1466
1467 res = totemsrp_ifaces_get (
1468 totemsrp_context,
1469 nodeid,
1470 interface_id,
1471 interfaces,
1472 interfaces_size,
1473 status,
1474 iface_count);
1475
1476 return (res);
1477}
1478
1479void totempg_event_signal (enum totem_event_type type, int value)
1480{
1481 totemsrp_event_signal (totemsrp_context, type, value);
1482}
1483
1484void *totempg_get_stats (void)
1485{
1486 return &totempg_stats;
1487}
1488
1489int totempg_crypto_set (
1490 const char *cipher_type,
1491 const char *hash_type)
1492{
1493 int res;
1494
1495 res = totemsrp_crypto_set (totemsrp_context, cipher_type, hash_type);
1496
1497 return (res);
1498}
1499
1500#define ONE_IFACE_LEN 63
1501const char *totempg_ifaces_print (unsigned int nodeid)
1502{
1503 static char iface_string[256 * INTERFACE_MAX];
1504 char one_iface[ONE_IFACE_LEN+1];
1505 struct totem_ip_address interfaces[INTERFACE_MAX];
1506 unsigned int iface_count;
1507 unsigned int iface_ids[INTERFACE_MAX];
1508 unsigned int i;
1509 int res;
1510
1511 iface_string[0] = '\0';
1512
1513 res = totempg_ifaces_get (nodeid, iface_ids, interfaces, INTERFACE_MAX, NULL, &iface_count);
1514 if (res == -1) {
1515 return ("no interface found for nodeid");
1516 }
1517
1518 res = totempg_ifaces_get (nodeid, iface_ids, interfaces, INTERFACE_MAX, NULL, &iface_count);
1519
1520 for (i = 0; i < iface_count; i++) {
1521 if (!interfaces[i].family) {
1522 continue;
1523 }
1524 snprintf (one_iface, ONE_IFACE_LEN,
1525 "r(%d) ip(%s) ",
1526 i, totemip_print (&interfaces[i]));
1527 strcat (iface_string, one_iface);
1528 }
1529 return (iface_string);
1530}
1531
1532unsigned int totempg_my_nodeid_get (void)
1533{
1534 return (totemsrp_my_nodeid_get(totemsrp_context));
1535}
1536
1537int totempg_my_family_get (void)
1538{
1539 return (totemsrp_my_family_get(totemsrp_context));
1540}
1541void totempg_service_ready_register (
1542 void (*totem_service_ready) (void))
1543{
1544 totemsrp_service_ready_register (totemsrp_context, totem_service_ready);
1545}
1546
1547void totempg_queue_level_register_callback (totem_queue_level_changed_fn fn)
1548{
1549 totem_queue_level_changed = fn;
1550}
1551
1552int totempg_member_add (
1553 const struct totem_ip_address *member,
1554 int ring_no)
1555{
1556 return totemsrp_member_add (totemsrp_context, member, ring_no);
1557}
1558
1559int totempg_member_remove (
1560 const struct totem_ip_address *member,
1561 int ring_no)
1562{
1563 return totemsrp_member_remove (totemsrp_context, member, ring_no);
1564}
1565
1566extern int totempg_reconfigure (void)
1567{
1568 return totemsrp_reconfigure (totemsrp_context, totempg_totem_config);
1569}
1570
1571int totempg_crypto_reconfigure_phase (cfg_message_crypto_reconfig_phase_t phase)
1572{
1573 return totemsrp_crypto_reconfigure_phase (totemsrp_context, totempg_totem_config, phase);
1574}
1575
1576void totempg_stats_clear (int flags)
1577{
1578 if (flags & TOTEMPG_STATS_CLEAR_TOTEM) {
1579 totempg_stats.msg_reserved = 0;
1580 totempg_stats.msg_queue_avail = 0;
1581 }
1582 return totemsrp_stats_clear (totemsrp_context, flags);
1583}
1584
1585void totempg_threaded_mode_enable (void)
1586{
1587 totempg_threaded_mode = 1;
1588 totemsrp_threaded_mode_enable (totemsrp_context);
1589}
1590
1591void totempg_trans_ack (void)
1592{
1593 totemsrp_trans_ack (totemsrp_context);
1594}
1595
1596void totempg_force_gather (void)
1597{
1598 totemsrp_force_gather(totemsrp_context);
1599}
1600
1601/* Assumes ->orig_interfaces is already allocated */
1602void totempg_get_config (struct totem_config *config)
1603{
1604 struct totem_interface *temp_if = config->orig_interfaces;
1605
1606 memcpy(config, totempg_totem_config, sizeof(struct totem_config));
1607 config->orig_interfaces = temp_if;
1609 config->interfaces = NULL;
1610}
1611
1612void totempg_put_config (struct totem_config *config)
1613{
1614 struct totem_interface *temp_if = totempg_totem_config->interfaces;
1615
1616 /* Preserve the existing interfaces[] array as transports might have pointers saved */
1617 memcpy(totempg_totem_config->interfaces, config->interfaces, sizeof(struct totem_interface) * INTERFACE_MAX);
1618 memcpy(totempg_totem_config, config, sizeof(struct totem_config));
1619 totempg_totem_config->interfaces = temp_if;
1620}