diff --git a/core/avl_tree.c b/core/avl_tree.c
index 6b12bd037..468a2afd6 100644
--- a/core/avl_tree.c
+++ b/core/avl_tree.c
@@ -5,6 +5,7 @@
 /* Copied and modified from http://pine.cs.yale.edu/pinewiki/C/AvlTree google cache */
 
 #include "avl_tree.h"
+#include "ross.h"
 
 /* implementation of an AVL tree with explicit heights */
 
@@ -254,7 +255,7 @@ avlDelete(AvlTree *t, tw_event *key)
     AvlTree oldroot;
 
     if (*t == AVL_EMPTY) {
-        tw_error(TW_LOC, "We never look for non-existent events!");
+//        tw_error(TW_LOC, "We never look for non-existent events!");
         return target;
     }
 
diff --git a/core/hole-network-mpi.c b/core/hole-network-mpi.c
new file mode 100644
index 000000000..2e7a64d39
--- /dev/null
+++ b/core/hole-network-mpi.c
@@ -0,0 +1,888 @@
+#include <mpi.h>
+#include <ross.h>
+
+MPI_Comm MPI_COMM_ROSS = MPI_COMM_WORLD;
+int custom_communicator = 0;
+
+/**
+ * @struct act_q
+ * @brief Keeps track of posted send or recv operations.
+ */
+struct act_q
+{
+    const char *name;
+
+    tw_event **event_list;   /**< list of event pointers in this queue */
+    MPI_Request *req_list;   /**< list of MPI request handles */
+    int *idx_list;           /**< indices in this queue of finished operations */
+    MPI_Status *status_list; /**< list of MPI_Status handles */
+    unsigned int cur;        /**< index of first open spot in the queue */
+    int *overflow_anti;      /**< slots deferred because a cancel arrived out of order */
+    unsigned int length;     /**< capacity of this queue */
+};
+
+#define EVENT_TAG 1
+
+#define EVENT_SIZE(e) g_tw_event_msg_sz
+
+static struct act_q posted_sends;
+static struct act_q posted_recvs;
+static tw_eventq outq;
+
+static unsigned int read_buffer = 16;
+static unsigned int send_buffer = 1024;
+static int world_size = 1;
+
+static const tw_optdef mpi_opts[] = {
+    TWOPT_GROUP("ROSS MPI Kernel"),
+    TWOPT_UINT(
+        "read-buffer",
+        read_buffer,
+        "network read buffer size in # of events"),
+    TWOPT_UINT(
+        "send-buffer",
+        send_buffer,
+        "network send buffer size in # of events"),
+    TWOPT_END()
+};
+
+// Forward declarations of functions used in MPI network message processing
+static int recv_begin(tw_pe *me);
+static void recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q * q, int id);
+static int send_begin(tw_pe *me);
+static void send_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q * q, int id);
+static void late_recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q* q, int id);
+
+// Start of implementation of network processing routines/functions
+void tw_comm_set(MPI_Comm comm)
+{
+    MPI_COMM_ROSS = comm;
+    custom_communicator = 1;
+}
+
+const tw_optdef *
+tw_net_init(int *argc, char ***argv)
+{
+    int my_rank;
+    int initialized;
+    MPI_Initialized(&initialized);
+
+    if (!initialized) {
+        if (MPI_Init(argc, argv) != MPI_SUCCESS)
+            tw_error(TW_LOC, "MPI_Init failed.");
+    }
+
+    if (MPI_Comm_rank(MPI_COMM_ROSS, &my_rank) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Cannot get MPI_Comm_rank(MPI_COMM_ROSS)");
+
+    g_tw_masternode = 0;
+    g_tw_mynode = my_rank;
+
+    return mpi_opts;
+}
+
+/**
+ * @brief Initializes queues used for posted sends and receives
+ *
+ * @param[in] q pointer to the queue to be initialized
+ * @param[in] name name of the queue
+ */
+static void
+init_q(struct act_q *q, const char *name)
+{
+    unsigned int n;
+
+    if(q == &posted_sends)
+        n = send_buffer;
+    else
+        n = read_buffer;
+
+    q->name = name;
+    q->event_list = (tw_event **) tw_calloc(TW_LOC, name, sizeof(*q->event_list), n);
+    q->req_list = (MPI_Request *) tw_calloc(TW_LOC, name, sizeof(*q->req_list), n);
+    q->idx_list = (int *) tw_calloc(TW_LOC, name, sizeof(*q->idx_list), n);
+    q->status_list = (MPI_Status *) tw_calloc(TW_LOC,
name, sizeof(*q->status_list), n); + q->overflow_anti = (int *) tw_calloc(TW_LOC, name, sizeof(*q->idx_list), (n/2)+2);// queue, at most (n/2) can be out of order, first element is # of elements in queue + q->overflow_anti[0]=1; + q->length = n; + +} + +void check_b_ind( int * b_index, struct act_q * q) +{ + while(0 <= *b_index && *b_index<=q->length) + { + + if(q->event_list[*b_index]== NULL) + { + *b_index = *b_index-1; + } + else + { + return; + } + + + } + *b_index = 0; + return; + +} + + +unsigned int +tw_nnodes(void) +{ + return world_size; +} + +void +tw_net_start(void) +{ + if (MPI_Comm_size(MPI_COMM_ROSS, &world_size) != MPI_SUCCESS) + tw_error(TW_LOC, "Cannot get MPI_Comm_size(MPI_COMM_ROSS)"); + + if( g_tw_mynode == 0) + { + printf("tw_net_start: Found world size to be %d \n", world_size ); + } + + // Check after tw_nnodes is defined + if(tw_nnodes() == 1) { + // force the setting of SEQUENTIAL protocol + if (g_tw_synchronization_protocol == NO_SYNCH) { + g_tw_synchronization_protocol = SEQUENTIAL; + } else if(g_tw_synchronization_protocol == CONSERVATIVE || g_tw_synchronization_protocol == OPTIMISTIC) { + g_tw_synchronization_protocol = SEQUENTIAL; + fprintf(stderr, "Warning: Defaulting to Sequential Simulation, not enough PEs defined.\n"); + } + } + + tw_pe_init(); + + //If we're in (some variation of) optimistic mode, we need this hash + if (g_tw_synchronization_protocol == OPTIMISTIC || + g_tw_synchronization_protocol == OPTIMISTIC_DEBUG || + g_tw_synchronization_protocol == OPTIMISTIC_REALTIME) { + g_tw_pe->hash_t = tw_hash_create(); + } else { + g_tw_pe->hash_t = NULL; + } + + if (send_buffer < 1) + tw_error(TW_LOC, "network send buffer must be >= 1"); + if (read_buffer < 1) + tw_error(TW_LOC, "network read buffer must be >= 1"); + + init_q(&posted_sends, "MPI send queue"); + init_q(&posted_recvs, "MPI recv queue"); + + g_tw_net_device_size = read_buffer; + + // pre-post all the Irecv operations + recv_begin(g_tw_pe); +} + +void +tw_net_abort(void) +{ + MPI_Abort(MPI_COMM_ROSS, 1); + exit(1); +} + +void +tw_net_stop(void) +{ +#ifdef USE_DAMARIS + if (g_st_damaris_enabled) + st_damaris_ross_finalize(); + else + { + if (!custom_communicator) { + if (MPI_Finalize() != MPI_SUCCESS) + tw_error(TW_LOC, "Failed to finalize MPI"); + } + } +#else + if (!custom_communicator) { + if (MPI_Finalize() != MPI_SUCCESS) + tw_error(TW_LOC, "Failed to finalize MPI"); + } +#endif +} + +void +tw_net_barrier(void) +{ + if (MPI_Barrier(MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Failed to wait for MPI_Barrier"); +} + +tw_stime +tw_net_minimum(void) +{ + tw_stime m = DBL_MAX; + tw_event *e; + unsigned int i; + + e = outq.head; + while (e) { + if (m > e->recv_ts) + m = e->recv_ts; + e = e->next; + } + + for (i = 0; i < posted_sends.cur; i++) { + e = posted_sends.event_list[i]; + if (m > e->recv_ts) + m = e->recv_ts; + } + + return m; +} + +/** + * @brief Calls MPI_Testsome on the provided queue, to check for finished operations. + * + * @param[in] q queue to check + * @param[in] me pointer to the PE + * @param[in] finish pointer to function that will perform the appropriate send/recv + * finish functionality + * + * @return 0 if MPI_Testsome did not return any finished operations, 1 otherwise. 
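+ *
+ * The hole-compaction step at the end of test_q can be pictured in
+ * isolation. A minimal standalone sketch (hypothetical helper, not part of
+ * this patch; `ev` and `req` stand in for event_list/req_list):
+ * @code
+ * static void compact(tw_event **ev, MPI_Request *req, unsigned int *cur,
+ *                     int *idx, int ready)
+ * {
+ *     int tail = (int)*cur - 1;
+ *     for (int i = 0; i < ready; i++) {
+ *         int n = idx[i];
+ *         while (tail >= 0 && ev[tail] == NULL)
+ *             tail--;                 // skip slots that also finished
+ *         if (n < tail) {             // fill the hole from the live tail
+ *             ev[n]  = ev[tail];
+ *             req[n] = req[tail];
+ *             ev[tail--] = NULL;
+ *         }
+ *     }
+ *     *cur -= ready;                  // active requests are again [0, cur)
+ * }
+ * @endcode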
+ */
+// Here test_q is not split into separate send and recv variants;
+// the pick_queue flag selects the behavior instead.
+static int
+test_q(
+    struct act_q * q,
+    tw_pe *me,
+    int pick_queue,
+    void (*finish)(tw_pe *, tw_event *, char *, struct act_q*, int id))
+{
+    int ready, i, n, indicator;
+    q->overflow_anti[0] = 1; // reset the deferred (out-of-order) list to empty
+    indicator = 1;
+
+    if (!q->cur)
+    {
+        return 0;
+    }
+
+    if (MPI_Testsome(
+            q->cur,
+            q->req_list,
+            &ready,
+            q->idx_list,
+            q->status_list) != MPI_SUCCESS) {
+        tw_error(
+            TW_LOC,
+            "MPI_testsome failed with %u items in %s",
+            q->cur,
+            q->name);
+    }
+
+    if (1 > ready)
+        return 0;
+
+    if (pick_queue == 1)
+    {
+        for (i = 0; i < ready; i++)
+        {
+            tw_event *e;
+
+            n = q->idx_list[i];
+            e = q->event_list[n];
+
+            finish(me, e, NULL, q, n);
+
+            if (indicator != q->overflow_anti[0])
+            {
+                // finish() deferred this slot; keep the event for the late pass
+                indicator = q->overflow_anti[0];
+            }
+            else
+            {
+                q->event_list[n] = NULL;
+            }
+        }
+        i = 1;
+        while (i < q->overflow_anti[0]) {
+            tw_event *e;
+            n = q->overflow_anti[i];
+            e = q->event_list[n];
+            late_recv_finish(me, e, NULL, q, n);
+            q->event_list[n] = NULL;
+            i++;
+        }
+    }
+    else
+    {
+        for (i = 0; i < ready; i++)
+        {
+            tw_event *e;
+
+            n = q->idx_list[i];
+            e = q->event_list[n];
+            q->event_list[n] = NULL;
+
+            finish(me, e, NULL, q, n);
+        }
+    }
+
+    i = 0;
+
+    int b_index;
+
+    b_index = q->cur-1;
+
+    while(i < ready)
+    {
+        n = q->idx_list[i];
+
+        check_b_ind(&b_index, q);
+        if (n < b_index)
+        {
+            q->event_list[n] = q->event_list[b_index];
+            memcpy(&q->req_list[n], &q->req_list[b_index], sizeof(q->req_list[0]));
+            b_index--;
+        }
+        i++;
+    }
+    q->cur -= ready;
+
+    return 1;
+}
+
+/**
+ * @brief If there are any openings in the posted_recvs queue, post more Irecvs.
+ *
+ * @param[in] me pointer to the PE
+ * @return 0 if no changes are made to the queue, 1 otherwise.
+ */
+static int
+recv_begin(tw_pe *me)
+{
+    tw_event *e = NULL;
+
+    int changed = 0;
+
+    while (posted_recvs.cur < read_buffer)
+    {
+        unsigned id = posted_recvs.cur;
+
+        if(!(e = tw_event_grab(me)))
+        {
+            if(tw_gvt_inprogress(me))
+                tw_error(TW_LOC, "Out of events in GVT! Consider increasing --extramem");
+            return changed;
+        }
+
+        if( MPI_Irecv(e,
+                (int)EVENT_SIZE(e),
+                MPI_BYTE,
+                MPI_ANY_SOURCE,
+                EVENT_TAG,
+                MPI_COMM_ROSS,
+                &posted_recvs.req_list[id]) != MPI_SUCCESS)
+        {
+            tw_event_free(me, e);
+            return changed;
+        }
+
+        posted_recvs.event_list[id] = e;
+        posted_recvs.cur++;
+        changed = 1;
+    }
+
+    return changed;
+}
+
+/**
+ * @brief Determines how to handle the newly received event.
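+ *
+ * Cancels can complete in the same MPI_Testsome batch as the event they
+ * cancel and be visited first; those are parked in overflow_anti and
+ * replayed by late_recv_finish. The list convention, as a small
+ * illustrative sketch (not part of the patch): slot 0 holds the next free
+ * position, so entries occupy d[1] .. d[d[0]-1].
+ * @code
+ * static void defer(int *d, int id)   { d[d[0]++] = id; }
+ * static void drain(int *d, void (*fn)(int))
+ * {
+ *     for (int i = 1; i < d[0]; i++)
+ *         fn(d[i]);
+ *     d[0] = 1;   // empty again
+ * }
+ * @endcode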
+ * + * @param[in] me pointer to PE + * @param[in] e pointer to event that we just received + * @param[in] buffer not currently used + */ +static void recv_finish(tw_pe *me, tw_event *e, char * buffer,struct act_q * q, int id) +{ + (void) buffer; + tw_pe *dest_pe; + tw_clock start; + + me->stats.s_nread_network++; + me->s_nwhite_recv++; + + // printf("recv_finish: remote event [cancel %u] FROM: LP %lu, PE %lu, TO: LP %lu, PE %lu at TS %lf \n", + // e->state.cancel_q, (tw_lpid)e->src_lp, e->send_pe, (tw_lpid)e->dest_lp, me->id, e->recv_ts); + + e->dest_lp = tw_getlocal_lp((tw_lpid) e->dest_lp); + dest_pe = e->dest_lp->pe; + // instrumentation + e->dest_lp->kp->kp_stats->s_nread_network++; + e->dest_lp->lp_stats->s_nread_network++; + + if(e->send_pe > tw_nnodes()-1) + tw_error(TW_LOC, "bad sendpe_id: %d", e->send_pe); + + + + + if(e->recv_ts < me->GVT) + tw_error(TW_LOC, "%d: Received straggler from %d: %lf (%d)", + me->id, e->send_pe, e->recv_ts, e->state.cancel_q); + + if(tw_gvt_inprogress(me)) + me->trans_msg_ts = ROSS_MIN(me->trans_msg_ts, e->recv_ts); + + // if cancel event, retrieve and flush + // else, store in hash table + if(e->state.cancel_q) + { + tw_event *cancel = tw_hash_remove(me->hash_t, e, e->send_pe); + + // NOTE: it is possible to cancel the event we + // are currently processing at this PE since this + // MPI module lets me read cancel events during + // event sends over the network. + + if(cancel!=NULL) // if correct order, do what is needed + { + + e->cancel_next = NULL; + e->caused_by_me = NULL; + e->cause_next = NULL; + + cancel->state.cancel_q = 1; + cancel->state.remote = 0; + cancel->cancel_next = dest_pe->cancel_q; + dest_pe->cancel_q = cancel; + tw_event_free(me, e); + } + else //if out of order, process later + { + q->overflow_anti[q->overflow_anti[0]] = id; //add id stuff later + q->overflow_anti[0]++; + } + + + return; + } + + e->cancel_next = NULL; + e->caused_by_me = NULL; + e->cause_next = NULL; + + if (g_tw_synchronization_protocol == OPTIMISTIC || + g_tw_synchronization_protocol == OPTIMISTIC_DEBUG || + g_tw_synchronization_protocol == OPTIMISTIC_REALTIME ) { + tw_hash_insert(me->hash_t, e, e->send_pe); + e->state.remote = 1; + } + + /* NOTE: the final check in the if conditional below was added to make sure + * that we do not execute the fast case unless the cancellation queue is + * empty on the destination PE. Otherwise we need to invoke the normal + * scheduling routines to make sure that a forward event doesn't bypass a + * cancellation event with an earlier timestamp. This is helpful for + * stateful models that produce incorrect results when presented with + * duplicate messages with no rollback between them. + */ + if(me == dest_pe && e->dest_lp->kp->last_time <= e->recv_ts && !dest_pe->cancel_q) { + /* Fast case, we are sending to our own PE and + * there is no rollback caused by this send. + */ + start = tw_clock_read(); + tw_pq_enqueue(dest_pe->pq, e); + dest_pe->stats.s_pq += tw_clock_read() - start; + return; + } + + if (me->id == dest_pe->id) { + /* Slower, but still local send, so put into top + * of dest_pe->event_q. + */ + e->state.owner = TW_pe_event_q; + tw_eventq_push(&dest_pe->event_q, e); + return; + } + + /* Never should happen; MPI should have gotten the + * message to the correct node without needing us + * to redirect the message there for it. This is + * probably a serious bug with the event headers + * not being formatted right. 
+ */ + tw_error( + TW_LOC, + "Event recived by PE %u but meant for PE %u", + me->id, + dest_pe->id); +} + + + +static void +late_recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q * q, int id ) +{ + tw_pe *dest_pe; + tw_clock start; + +#if ROSS_MEMORY + tw_memory *memory; + tw_memory *last; + tw_fd mem_fd; + + size_t mem_size; + + unsigned position = 0; + + memcpy(e, buffer, g_tw_event_msg_sz); + position += g_tw_event_msg_sz; +#endif + + dest_pe = e->dest_lp->pe; + if(e->send_pe > tw_nnodes()-1) + tw_error(TW_LOC, "bad sendpe_id: %d", e->send_pe); + + e->cancel_next = NULL; + e->caused_by_me = NULL; + e->cause_next = NULL; + + + if(e->recv_ts < me->GVT) + tw_error(TW_LOC, "%d: Received straggler from %d: %lf (%d)", + me->id, e->send_pe, e->recv_ts, e->state.cancel_q); + + if(tw_gvt_inprogress(me)) + me->trans_msg_ts = ROSS_MIN(me->trans_msg_ts, e->recv_ts); + + // if cancel event, retrieve and flush + // else, store in hash table + + tw_event *cancel = tw_hash_remove(me->hash_t, e, e->send_pe); + g_tw_pe->avl_tree_size++;//needed because tw_hash_remove is called twice, decrementing this var + + // NOTE: it is possible to cancel the event we + // are currently processing at this PE since this + // MPI module lets me read cancel events during + // event sends over the network. + + cancel->state.cancel_q = 1; + cancel->state.remote = 0; + cancel->cancel_next = dest_pe->cancel_q; + dest_pe->cancel_q = cancel; + tw_event_free(me, e); + + return; + +} + +/** + * @brief If there are any openings in the posted_sends queue, start sends + * for events in the outgoing queue. + * + * @param[in] me pointer to the PE + * @return 0 if no changes are made to the posted_sends queue, 1 otherwise. + */ +static int +send_begin(tw_pe *me) +{ + int changed = 0; + + while (posted_sends.cur < send_buffer) + { + tw_event *e = tw_eventq_peek(&outq); + tw_peid dest_pe; + + unsigned id = posted_sends.cur; + + if (!e) + break; + + if(e == me->abort_event) + tw_error(TW_LOC, "Sending abort event!"); + + dest_pe = (*e->src_lp->type->map) ((tw_lpid) e->dest_lp); + + e->send_pe = (tw_peid) g_tw_mynode; + e->send_lp = e->src_lp->gid; + + if (MPI_Isend(e, + (int)EVENT_SIZE(e), + MPI_BYTE, + (int)dest_pe, + EVENT_TAG, + MPI_COMM_ROSS, + &posted_sends.req_list[id]) != MPI_SUCCESS) { + return changed; + } + + tw_eventq_pop(&outq); + e->state.owner = e->state.cancel_q + ? TW_net_acancel + : TW_net_asend; + + posted_sends.event_list[id] = e; + posted_sends.cur++; + me->s_nwhite_sent++; + + changed = 1; + } + return changed; +} + +/** + * @brief Determines how to handle the buffer of event whose send operation + * just finished. + * + * @param[in] me pointer to PE + * @param[in] e pointer to event that we just received + * @param[in] buffer not currently used + */ +static void +send_finish(tw_pe *me, tw_event *e, char * buffer,struct act_q * q, int id) +{ + (void) buffer; + me->stats.s_nsend_network++; + // instrumentation + e->src_lp->kp->kp_stats->s_nsend_network++; + e->src_lp->lp_stats->s_nsend_network++; + + if (e->state.owner == TW_net_asend) { + if (e->state.cancel_asend) { + /* Event was cancelled during transmission. We must + * send another message to pass the cancel flag to + * the other node. + */ + e->state.cancel_asend = 0; + e->state.cancel_q = 1; + tw_eventq_push(&outq, e); + } else { + /* Event finished transmission and was not cancelled. + * Add to our sent event queue so we can retain the + * event in case we need to cancel it later. 
Note it + * is currently in remote format and must be converted + * back to local format for fossil collection. + */ + e->state.owner = TW_pe_sevent_q; + if( g_tw_synchronization_protocol == CONSERVATIVE ) + tw_event_free(me, e); + } + + return; + } + + if (e->state.owner == TW_net_acancel) { + /* We just finished sending the cancellation message + * for this event. We need to free the buffer and + * make it available for reuse. + */ + tw_event_free(me, e); + return; + } + + /* Never should happen, not unless we somehow broke this + * module's other functions related to sending an event. + */ + + tw_error( + TW_LOC, + "Don't know how to finish send of owner=%u, cancel_q=%d", + e->state.owner, + e->state.cancel_q); + +} + +/** + * @brief Start checks for finished operations in send/recv queues, + * and post new sends/recvs if possible. + * @param[in] me pointer to PE + */ +static void +service_queues(tw_pe *me) +{ + int changed; + do { + changed = test_q(&posted_recvs, me,1, recv_finish); + changed |= test_q(&posted_sends, me,0, send_finish); + changed |= recv_begin(me); + changed |= send_begin(me); + } while (changed); +} + +/* + * NOTE: Chris believes that this network layer is too aggressive at + * reading events out of the network.. so we are modifying the algorithm + * to only send events when tw_net_send it called, and only read events + * when tw_net_read is called. + */ +void +tw_net_read(tw_pe *me) +{ + service_queues(me); +} + +void +tw_net_send(tw_event *e) +{ + tw_pe * me = e->src_lp->pe; + int changed = 0; + + e->state.remote = 0; + e->state.owner = TW_net_outq; + tw_eventq_unshift(&outq, e); + + do + { + changed = test_q(&posted_sends, me, 0, send_finish); + changed |= send_begin(me); + } while (changed); +} + +void +tw_net_cancel(tw_event *e) +{ + tw_pe *src_pe = e->src_lp->pe; + + switch (e->state.owner) { + case TW_net_outq: + /* Cancelled before we could transmit it. Do not + * transmit the event and instead just release the + * buffer back into our own free list. + */ + tw_eventq_delete_any(&outq, e); + tw_event_free(src_pe, e); + + return; + + break; + + case TW_net_asend: + /* Too late. We've already let MPI start to send + * this event over the network. We can't pull it + * back now without sending another message to do + * the cancel. + * + * Setting the cancel_q flag will signal us to do + * another message send once the current send of + * this message is completed. + */ + e->state.cancel_asend = 1; + break; + + case TW_pe_sevent_q: + /* Way late; the event was already sent and is in + * our sent event queue. Mark it as a cancel and + * place it at the front of the outq. + */ + e->state.cancel_q = 1; + tw_eventq_unshift(&outq, e); + break; + + default: + /* Huh? Where did you come from? Why are we being + * told about you? We did not send you so we cannot + * cancel you! + */ + tw_error( + TW_LOC, + "Don't know how to cancel event owned by %u", + e->state.owner); + } + + service_queues(src_pe); +} + +/** + * tw_net_statistics + * @brief Function to output the statistics + * @attention Notice that the MPI_Reduce "count" parameter is greater than one. + * We are reducing on multiple variables *simultaneously* so if you change + * this function or the struct tw_statistics, you must update the other. 
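+ *
+ * A reduced sketch of the pattern (hypothetical struct, not ROSS code):
+ * a count of 3 folds three *contiguous*, same-typed members in one call,
+ * which is only valid while the struct keeps them adjacent.
+ * @code
+ * struct stats { unsigned long long a, b, c; };
+ * struct stats local, global;
+ * MPI_Reduce(&local.a, &global.a, 3,
+ *            MPI_UNSIGNED_LONG_LONG, MPI_SUM, 0, MPI_COMM_WORLD);
+ * @endcode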
+ **/
+tw_statistics *
+tw_net_statistics(tw_pe * me, tw_statistics * s)
+{
+    if(MPI_Reduce(&(s->s_max_run_time),
+            &me->stats.s_max_run_time,
+            1,
+            MPI_DOUBLE,
+            MPI_MAX,
+            (int)g_tw_masternode,
+            MPI_COMM_ROSS) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Unable to reduce statistics!");
+
+    if(MPI_Reduce(&(s->s_net_events),
+            &me->stats.s_net_events,
+            17,
+            MPI_UNSIGNED_LONG_LONG,
+            MPI_SUM,
+            (int)g_tw_masternode,
+            MPI_COMM_ROSS) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Unable to reduce statistics!");
+
+    if(MPI_Reduce(&s->s_min_detected_offset,
+            &me->stats.s_min_detected_offset,
+            1,
+            MPI_DOUBLE,
+            MPI_MIN,
+            (int)g_tw_masternode,
+            MPI_COMM_ROSS) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Unable to reduce statistics!");
+
+    if(MPI_Reduce(&(s->s_total),
+            &me->stats.s_total,
+            16,
+            MPI_UNSIGNED_LONG_LONG,
+            MPI_MAX,
+            (int)g_tw_masternode,
+            MPI_COMM_ROSS) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Unable to reduce statistics!");
+
+    if (MPI_Reduce(&s->s_events_past_end,
+            &me->stats.s_events_past_end,
+            3,
+            MPI_UNSIGNED_LONG_LONG,
+            MPI_SUM,
+            (int)g_tw_masternode,
+            MPI_COMM_ROSS) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Unable to reduce statistics!");
+
+#ifdef USE_RIO
+    if (MPI_Reduce(&s->s_rio_load,
+            &me->stats.s_rio_load,
+            1,
+            MPI_UNSIGNED_LONG_LONG,
+            MPI_MAX,
+            (int)g_tw_masternode,
+            MPI_COMM_ROSS) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Unable to reduce statistics!");
+    if (MPI_Reduce(&s->s_rio_lp_init,
+            &me->stats.s_rio_lp_init,
+            1,
+            MPI_UNSIGNED_LONG_LONG,
+            MPI_MAX,
+            (int)g_tw_masternode,
+            MPI_COMM_ROSS) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Unable to reduce statistics!");
+#endif
+
+    return &me->stats;
+}
diff --git a/core/hybrid-mpi-layer.c b/core/hybrid-mpi-layer.c
new file mode 100644
index 000000000..bbd4c8122
--- /dev/null
+++ b/core/hybrid-mpi-layer.c
@@ -0,0 +1,931 @@
+#include <mpi.h>
+#include <ross.h>
+
+MPI_Comm MPI_COMM_ROSS = MPI_COMM_WORLD;
+int custom_communicator = 0;
+
+// This is the hybrid version: the send queue is compacted from the back,
+// while completed recv slots are reused in place via a free-index stack.
+
+/**
+ * @struct act_q
+ * @brief Keeps track of posted send or recv operations.
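+ *
+ * In this version free_idx_list acts as a stack of reusable slot indices:
+ * fr_q_aq pushes by moving `front` down, fr_q_dq pops by reading at `front`
+ * and moving it back up. A minimal sketch of that discipline (illustrative
+ * names only; occupancy is tracked on both operations here, whereas the
+ * code below batches the increment in test_q_recv):
+ * @code
+ * typedef struct { unsigned *slot; unsigned front; int num; } free_stack;
+ * static void push(free_stack *s, unsigned v) { s->slot[--s->front] = v; s->num++; }
+ * static unsigned pop(free_stack *s)          { s->num--; return s->slot[s->front++]; }
+ * @endcode
+ * Pops must stay ahead of pushes (as they do below, since a slot is only
+ * freed after its Irecv was posted); otherwise the unsigned `front` would
+ * wrap below zero.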
+ */ + +struct act_q +{ + const char *name; + + tw_event **event_list; /**< list of event pointers in this queue */ + MPI_Request *req_list; /**< list of MPI request handles */ + int *idx_list; /**< indices in this queue of finished operations */ + MPI_Status *status_list; /**< list of MPI_Status handles */ + unsigned int cur; /**< index of first open spot in the queue */ + + unsigned *free_idx_list;//add, stack of free indices + unsigned *overflow_anti; + unsigned int front;//add, top of stack + int size_of_fr_q;//add, size of stack array + int num_in_fr_q;//add, number of elements on stack + +}; + +#define EVENT_TAG 1 + +#define EVENT_SIZE(e) g_tw_event_msg_sz + +static struct act_q posted_sends; +static struct act_q posted_recvs; +static tw_eventq outq; + +static unsigned int read_buffer = 16; +static unsigned int send_buffer = 1024; +static int world_size = 1; + + +void deal_with_cur(struct act_q *q)// this is for MPI_testsome input +{ + if(q->cur < (q->front)) + { + q->cur++; + return; + } + else + { + return; + } +} + +void fr_q_aq(struct act_q *q, unsigned ele) // free index queue; add to queue +{ + q->front--; + q->free_idx_list[q->front] = ele; + return; +} + +unsigned fr_q_dq(struct act_q *q) // free index queue; dequeue +{ + unsigned rv = q->free_idx_list[q->front]; + q->front++; + q->num_in_fr_q--; + return rv; +} + +void check_b_ind( int * b_index, struct act_q * q) +{ + while((0 <= *b_index) && (*b_index<=q->size_of_fr_q)) + { + + if(q->event_list[*b_index]== NULL) + { + *b_index = *b_index-1; + } + else + { + return; + } + + } + *b_index = 0; + return; + +} + + +static const tw_optdef mpi_opts[] = { + TWOPT_GROUP("ROSS MPI Kernel"), + TWOPT_UINT( + "read-buffer", + read_buffer, + "network read buffer size in # of events"), + TWOPT_UINT( + "send-buffer", + send_buffer, + "network send buffer size in # of events"), + TWOPT_END() +}; + +// Forward declarations of functions used in MPI network message processing +static int recv_begin(tw_pe *me); +static int send_begin(tw_pe *me); +static void send_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q* q, unsigned id); +static void recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q* q, unsigned id); +static void late_recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q* q, unsigned id); + +// Start of implmentation of network processing routines/functions +void tw_comm_set(MPI_Comm comm) +{ + MPI_COMM_ROSS = comm; + custom_communicator = 1; +} + +const tw_optdef * +tw_net_init(int *argc, char ***argv) +{ + int my_rank; + int initialized; + MPI_Initialized(&initialized); + + if (!initialized) { + if (MPI_Init(argc, argv) != MPI_SUCCESS) + tw_error(TW_LOC, "MPI_Init failed."); + } + + if (MPI_Comm_rank(MPI_COMM_ROSS, &my_rank) != MPI_SUCCESS) + tw_error(TW_LOC, "Cannot get MPI_Comm_rank(MPI_COMM_ROSS)"); + + g_tw_masternode = 0; + g_tw_mynode = my_rank; + + return mpi_opts; +} + +/** + * @brief Initializes queues used for posted sends and receives + * + * @param[in] q pointer to the queue to be initialized + * @param[in] name name of the queue + */ + + + +static void +init_q(struct act_q *q, const char *name) +{ + unsigned int n; + + if(q == &posted_sends) + n = send_buffer; + else + n = read_buffer; + + q->name = name; + q->event_list = (tw_event **) tw_calloc(TW_LOC, name, sizeof(*q->event_list), n); + q->req_list = (MPI_Request *) tw_calloc(TW_LOC, name, sizeof(*q->req_list), n); + q->idx_list = (int *) tw_calloc(TW_LOC, name, sizeof(*q->idx_list), n); + q->status_list = (MPI_Status *) 
tw_calloc(TW_LOC, name, sizeof(*q->status_list), n);
+    q->free_idx_list = (unsigned *) tw_calloc(TW_LOC, name, sizeof(*q->free_idx_list), n+1);// stack of free slot indices; n+1 entries so it can never fill completely
+    q->overflow_anti = (unsigned *) tw_calloc(TW_LOC, name, sizeof(*q->overflow_anti), (n/2)+2);// at most n/2 slots can be out of order; element 0 is the next free position (count+1)
+    q->front = 0;// top of the free-index stack
+    q->size_of_fr_q = n+1;// capacity of the free-index array
+    q->num_in_fr_q = 0; // number of elements on the stack
+
+    unsigned i = 0;
+    while(i < n)
+    {
+        q->free_idx_list[i] = i;
+        i++;
+    }
+    q->overflow_anti[0]=1;
+    q->num_in_fr_q = n;
+}
+
+unsigned int
+tw_nnodes(void)
+{
+    return world_size;
+}
+
+void
+tw_net_start(void)
+{
+    if (MPI_Comm_size(MPI_COMM_ROSS, &world_size) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Cannot get MPI_Comm_size(MPI_COMM_ROSS)");
+
+    if( g_tw_mynode == 0)
+    {
+        printf("tw_net_start: Found world size to be %d \n", world_size );
+    }
+
+    // Check after tw_nnodes is defined
+    if(tw_nnodes() == 1) {
+        // force the setting of SEQUENTIAL protocol
+        if (g_tw_synchronization_protocol == NO_SYNCH) {
+            g_tw_synchronization_protocol = SEQUENTIAL;
+        } else if(g_tw_synchronization_protocol == CONSERVATIVE || g_tw_synchronization_protocol == OPTIMISTIC) {
+            g_tw_synchronization_protocol = SEQUENTIAL;
+            fprintf(stderr, "Warning: Defaulting to Sequential Simulation, not enough PEs defined.\n");
+        }
+    }
+
+    tw_pe_init();
+
+    //If we're in (some variation of) optimistic mode, we need this hash
+    if (g_tw_synchronization_protocol == OPTIMISTIC ||
+        g_tw_synchronization_protocol == OPTIMISTIC_DEBUG ||
+        g_tw_synchronization_protocol == OPTIMISTIC_REALTIME) {
+        g_tw_pe->hash_t = tw_hash_create();
+    } else {
+        g_tw_pe->hash_t = NULL;
+    }
+
+    if (send_buffer < 1)
+        tw_error(TW_LOC, "network send buffer must be >= 1");
+    if (read_buffer < 1)
+        tw_error(TW_LOC, "network read buffer must be >= 1");
+
+    init_q(&posted_sends, "MPI send queue");
+    init_q(&posted_recvs, "MPI recv queue");
+
+    g_tw_net_device_size = read_buffer;
+
+    // pre-post all the Irecv operations
+    recv_begin(g_tw_pe);
+}
+
+void
+tw_net_abort(void)
+{
+    MPI_Abort(MPI_COMM_ROSS, 1);
+    exit(1);
+}
+
+void
+tw_net_stop(void)
+{
+#ifdef USE_DAMARIS
+    if (g_st_damaris_enabled)
+        st_damaris_ross_finalize();
+    else
+    {
+        if (!custom_communicator) {
+            if (MPI_Finalize() != MPI_SUCCESS)
+                tw_error(TW_LOC, "Failed to finalize MPI");
+        }
+    }
+#else
+    if (!custom_communicator) {
+        if (MPI_Finalize() != MPI_SUCCESS)
+            tw_error(TW_LOC, "Failed to finalize MPI");
+    }
+#endif
+}
+
+void
+tw_net_barrier(void)
+{
+    if (MPI_Barrier(MPI_COMM_ROSS) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Failed to wait for MPI_Barrier");
+}
+
+tw_stime
+tw_net_minimum(void)
+{
+    tw_stime m = DBL_MAX;
+    tw_event *e;
+    unsigned int i;
+
+    e = outq.head;
+    while (e) {
+        if (m > e->recv_ts)
+            m = e->recv_ts;
+        e = e->next;
+    }
+
+    for (i = 0; i < posted_sends.cur; i++) {
+        e = posted_sends.event_list[i];
+        if (m > e->recv_ts)
+            m = e->recv_ts;
+    }
+
+    return m;
+}
+
+/**
+ * @brief Calls MPI_Testsome on the provided queue, to check for finished operations.
+ *
+ * @param[in] q queue to check
+ * @param[in] me pointer to the PE
+ * @param[in] finish pointer to function that will perform the appropriate send/recv
+ *            finish functionality
+ *
+ * @return 0 if MPI_Testsome did not return any finished operations, 1 otherwise.
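+ *
+ * Unlike the compacting variant, completed recv slots are not moved here:
+ * MPI_Testsome sets finished requests to MPI_REQUEST_NULL and ignores such
+ * entries on later calls, so `cur` can stay at its high-water mark. The
+ * minimal usage pattern, for reference (standalone sketch; `handle` is a
+ * hypothetical callback):
+ * @code
+ * enum { N = 16 };
+ * MPI_Request reqs[N];    // may contain MPI_REQUEST_NULL entries
+ * int ready, idx[N];
+ * MPI_Status st[N];
+ * // ... post some MPI_Irecv/MPI_Isend operations into reqs ...
+ * MPI_Testsome(N, reqs, &ready, idx, st);
+ * for (int i = 0; i < ready; i++)   // ready is 0 (or MPI_UNDEFINED) if none
+ *     handle(idx[i]);               // idx[i] indexes into reqs
+ * @endcode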
+ */
+static int
+test_q_recv(
+    struct act_q * q,
+    tw_pe *me,
+    void (*finish)(tw_pe *, tw_event *, char *, struct act_q*, unsigned id))
+{
+    int ready, i, n, indicator;
+    indicator = 1;
+
+    if( q->num_in_fr_q == ((q->size_of_fr_q)-1) )
+        return 0; // every slot is on the free stack, so nothing is outstanding
+
+    if (MPI_Testsome(
+            q->cur,
+            q->req_list,
+            &ready,
+            q->idx_list,
+            q->status_list) != MPI_SUCCESS) {
+        tw_error(
+            TW_LOC,
+            "MPI_testsome failed with %u items in %s",
+            q->cur,
+            q->name);
+    }
+
+    if (1 > ready)
+        return 0;
+
+    q->overflow_anti[0]=1;
+    q->num_in_fr_q+=ready;
+    i = ready-1;
+    while ( -1 != i)
+    {
+        tw_event *e;
+        n = q->idx_list[i];
+        e = q->event_list[n];
+        fr_q_aq(q, n); //push n onto the free-index stack
+
+        finish(me, e, NULL, q, n);
+
+        if (indicator != q->overflow_anti[0])
+        {
+            // finish() deferred this slot; keep the event for the late pass
+            indicator = q->overflow_anti[0];
+        }
+        else
+        {
+            q->event_list[n] = NULL;
+        }
+        i--;
+    }
+
+    i = 1; // first element of q->overflow_anti is the next free position in the array
+
+    while (i < q->overflow_anti[0])//takes care of out of order messages
+    {
+        tw_event *e;
+        n = q->overflow_anti[i];
+        e = q->event_list[n];
+        q->event_list[n] = NULL;
+        late_recv_finish(me, e, NULL, q, n);
+        //might need an augmented version for ROSS_MEMORY?
+        i++;
+    }
+
+    return 1;
+}
+
+static int
+test_q_send(
+    struct act_q * q,
+    tw_pe *me,
+    void (*finish)(tw_pe *, tw_event *, char *, struct act_q*, unsigned id))
+{
+    int ready, i, n;
+
+    if (!q->cur)
+    {
+        return 0;
+    }
+
+    if (MPI_Testsome(
+            q->cur,
+            q->req_list,
+            &ready,
+            q->idx_list,
+            q->status_list) != MPI_SUCCESS) {
+        tw_error(
+            TW_LOC,
+            "MPI_testsome failed with %u items in %s",
+            q->cur,
+            q->name);
+    }
+
+    if (1 > ready)
+        return 0;
+
+    i = ready-1;
+
+    while(-1 != i)
+    {
+        tw_event *e;
+
+        n = q->idx_list[i];
+        e = q->event_list[n];
+        q->event_list[n] = NULL;
+        i--;
+
+        finish(me, e, NULL, q, n);
+    }
+
+    i = 0;
+
+    int b_index;
+    b_index = q->cur-1;
+
+    while(i < ready)
+    {
+        n = q->idx_list[i];
+
+        check_b_ind(&b_index, q);
+        if (n < b_index)
+        {
+            q->event_list[n] = q->event_list[b_index];
+            memcpy(&q->req_list[n], &q->req_list[b_index], sizeof(q->req_list[0]));
+            b_index--;
+        }
+        i++;
+    }
+
+    q->cur -= ready;
+
+    return 1;
+}
+
+/**
+ * @brief If there are any openings in the posted_recvs queue, post more Irecvs.
+ *
+ * @param[in] me pointer to the PE
+ * @return 0 if no changes are made to the queue, 1 otherwise.
+ */
+static int
+recv_begin(tw_pe *me)
+{
+    tw_event *e = NULL;
+
+    int changed = 0;
+
+    while (0 < posted_recvs.num_in_fr_q)
+    {
+        if(!(e = tw_event_grab(me)))
+        {
+            if(tw_gvt_inprogress(me))
+                tw_error(TW_LOC, "Out of events in GVT! Consider increasing --extramem");
+            return changed;
+        }
+
+        unsigned id = fr_q_dq(&posted_recvs);
+
+        if( MPI_Irecv(e,
+                (int)EVENT_SIZE(e),
+                MPI_BYTE,
+                MPI_ANY_SOURCE,
+                EVENT_TAG,
+                MPI_COMM_ROSS,
+                &posted_recvs.req_list[id]) != MPI_SUCCESS)
+        {
+            tw_event_free(me, e);
+            return changed;
+        }
+
+        posted_recvs.event_list[id] = e;
+        deal_with_cur(&posted_recvs);
+        changed = 1;
+    }
+    return changed;
+}
+
+/**
+ * @brief Determines how to handle the newly received event.
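+ *
+ * For optimistic runs, forward events are inserted into the PE's hash keyed
+ * by sender; a cancel removes its partner. A NULL from tw_hash_remove()
+ * therefore means the cancel was visited before its forward event in this
+ * batch, and its slot id is parked for the late_recv_finish pass, roughly:
+ * @code
+ * tw_event *partner = tw_hash_remove(me->hash_t, e, e->send_pe);
+ * if (partner == NULL)                          // out of order in this batch
+ *     q->overflow_anti[q->overflow_anti[0]++] = id;
+ * @endcode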
+ * + * @param[in] me pointer to PE + * @param[in] e pointer to event that we just received + * @param[in] buffer not currently used + */ + + + +static void +recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q * q, unsigned id ) +{ + (void) buffer; + tw_pe *dest_pe; + tw_clock start; + + me->stats.s_nread_network++; + me->s_nwhite_recv++; + + // printf("recv_finish: remote event [cancel %u] FROM: LP %lu, PE %lu, TO: LP %lu, PE %lu at TS %lf \n", + // e->state.cancel_q, (tw_lpid)e->src_lp, e->send_pe, (tw_lpid)e->dest_lp, me->id, e->recv_ts); + + e->dest_lp = tw_getlocal_lp((tw_lpid) e->dest_lp); + dest_pe = e->dest_lp->pe; + // instrumentation + e->dest_lp->kp->kp_stats->s_nread_network++; + e->dest_lp->lp_stats->s_nread_network++; + + if(e->send_pe > tw_nnodes()-1) + tw_error(TW_LOC, "bad sendpe_id: %d", e->send_pe); + + e->cancel_next = NULL; + e->caused_by_me = NULL; + e->cause_next = NULL; + + + + if(e->recv_ts < me->GVT) + tw_error(TW_LOC, "%d: Received straggler from %d: %lf (%d)", + me->id, e->send_pe, e->recv_ts, e->state.cancel_q); + + if(tw_gvt_inprogress(me)) + me->trans_msg_ts = ROSS_MIN(me->trans_msg_ts, e->recv_ts); + + // if cancel event, retrieve and flush + // else, store in hash table + if(e->state.cancel_q) + { + tw_event *cancel = tw_hash_remove(me->hash_t, e, e->send_pe); + + // NOTE: it is possible to cancel the event we + // are currently processing at this PE since this + // MPI module lets me read cancel events during + // event sends over the network. + + if(cancel!=NULL)//if cancel is not null, then it's not out of order, do expected + { + + cancel->state.cancel_q = 1; + cancel->state.remote = 0; + cancel->cancel_next = dest_pe->cancel_q; + dest_pe->cancel_q = cancel; + tw_event_free(me, e); + } + else // add out of order event to late queue + { + q->overflow_anti[q->overflow_anti[0]] = id; + q->overflow_anti[0]++; + } + + return; + + } + + if (g_tw_synchronization_protocol == OPTIMISTIC || + g_tw_synchronization_protocol == OPTIMISTIC_DEBUG || + g_tw_synchronization_protocol == OPTIMISTIC_REALTIME ) { + tw_hash_insert(me->hash_t, e, e->send_pe); + e->state.remote = 1; + } + + /* NOTE: the final check in the if conditional below was added to make sure + * that we do not execute the fast case unless the cancellation queue is + * empty on the destination PE. Otherwise we need to invoke the normal + * scheduling routines to make sure that a forward event doesn't bypass a + * cancellation event with an earlier timestamp. This is helpful for + * stateful models that produce incorrect results when presented with + * duplicate messages with no rollback between them. + */ + if(me == dest_pe && e->dest_lp->kp->last_time <= e->recv_ts && !dest_pe->cancel_q) { + /* Fast case, we are sending to our own PE and + * there is no rollback caused by this send. + */ + start = tw_clock_read(); + tw_pq_enqueue(dest_pe->pq, e); + dest_pe->stats.s_pq += tw_clock_read() - start; + return; + } + + if (me->id == dest_pe->id) { + /* Slower, but still local send, so put into top + * of dest_pe->event_q. + */ + e->state.owner = TW_pe_event_q; + tw_eventq_push(&dest_pe->event_q, e); + return; + } + + /* Never should happen; MPI should have gotten the + * message to the correct node without needing us + * to redirect the message there for it. This is + * probably a serious bug with the event headers + * not being formatted right. 
+ */ + tw_error( + TW_LOC, + "Event recived by PE %u but meant for PE %u", + me->id, + dest_pe->id); +} + +static void +late_recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q * q, unsigned id ) +{ + + tw_pe *dest_pe; + dest_pe = e->dest_lp->pe; + tw_event *cancel = tw_hash_remove(me->hash_t, e, e->send_pe); + g_tw_pe->avl_tree_size++; + + cancel->state.cancel_q = 1; + cancel->state.remote = 0; + cancel->cancel_next = dest_pe->cancel_q; + dest_pe->cancel_q = cancel; + tw_event_free(me, e); + + return; + +} + +/** + * @brief If there are any openings in the posted_sends queue, start sends + * for events in the outgoing queue. + * + * @param[in] me pointer to the PE + * @return 0 if no changes are made to the posted_sends queue, 1 otherwise. + */ + +static int +send_begin(tw_pe *me) +{ + int changed = 0; + + while (posted_sends.cur < send_buffer) + { + tw_event *e = tw_eventq_peek(&outq); + tw_peid dest_pe; + + unsigned id = posted_sends.cur; + + if (!e) + break; + + if(e == me->abort_event) + tw_error(TW_LOC, "Sending abort event!"); + + dest_pe = (*e->src_lp->type->map) ((tw_lpid) e->dest_lp); + + e->send_pe = (tw_peid) g_tw_mynode; + e->send_lp = e->src_lp->gid; + + if (MPI_Isend(e, + (int)EVENT_SIZE(e), + MPI_BYTE, + (int)dest_pe, + EVENT_TAG, + MPI_COMM_ROSS, + &posted_sends.req_list[id]) != MPI_SUCCESS) { + return changed; + } + + tw_eventq_pop(&outq); + e->state.owner = e->state.cancel_q + ? TW_net_acancel + : TW_net_asend; + + posted_sends.event_list[id] = e; + posted_sends.cur++; + me->s_nwhite_sent++; + + changed = 1; + } + return changed; +} + +/** + * @brief Determines how to handle the buffer of event whose send operation + * just finished. + * + * @param[in] me pointer to PE + * @param[in] e pointer to event that we just received + * @param[in] buffer not currently used + */ +static void +send_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q * q, unsigned id) +{ + (void) buffer; + me->stats.s_nsend_network++; + // instrumentation + e->src_lp->kp->kp_stats->s_nsend_network++; + e->src_lp->lp_stats->s_nsend_network++; + + if (e->state.owner == TW_net_asend) { + if (e->state.cancel_asend) { + /* Event was cancelled during transmission. We must + * send another message to pass the cancel flag to + * the other node. + */ + e->state.cancel_asend = 0; + e->state.cancel_q = 1; + tw_eventq_push(&outq, e); + } else { + /* Event finished transmission and was not cancelled. + * Add to our sent event queue so we can retain the + * event in case we need to cancel it later. Note it + * is currently in remote format and must be converted + * back to local format for fossil collection. + */ + e->state.owner = TW_pe_sevent_q; + if( g_tw_synchronization_protocol == CONSERVATIVE ) + tw_event_free(me, e); + } + + return; + } + + if (e->state.owner == TW_net_acancel) { + /* We just finished sending the cancellation message + * for this event. We need to free the buffer and + * make it available for reuse. + */ + tw_event_free(me, e); + return; + } + + /* Never should happen, not unless we somehow broke this + * module's other functions related to sending an event. + */ + + tw_error( + TW_LOC, + "Don't know how to finish send of owner=%u, cancel_q=%d", + e->state.owner, + e->state.cancel_q); + +} + +/** + * @brief Start checks for finished operations in send/recv queues, + * and post new sends/recvs if possible. 
+ * @param[in] me pointer to PE + */ +static void +service_queues(tw_pe *me) +{ + int changed; + do { + changed = test_q_recv(&posted_recvs, me, recv_finish); + changed |= test_q_send(&posted_sends, me, send_finish); + changed |= recv_begin(me); + changed |= send_begin(me); + } while (changed); +} + +/* + * NOTE: Chris believes that this network layer is too aggressive at + * reading events out of the network.. so we are modifying the algorithm + * to only send events when tw_net_send it called, and only read events + * when tw_net_read is called. + */ +void +tw_net_read(tw_pe *me) +{ + service_queues(me); +} + +void +tw_net_send(tw_event *e) +{ + tw_pe * me = e->src_lp->pe; + int changed = 0; + + e->state.remote = 0; + e->state.owner = TW_net_outq; + tw_eventq_unshift(&outq, e); + + do + { + changed = test_q_send(&posted_sends, me, send_finish); + changed |= send_begin(me); + } while (changed); +} + +void +tw_net_cancel(tw_event *e) +{ + tw_pe *src_pe = e->src_lp->pe; + + switch (e->state.owner) { + case TW_net_outq: + /* Cancelled before we could transmit it. Do not + * transmit the event and instead just release the + * buffer back into our own free list. + */ + tw_eventq_delete_any(&outq, e); + tw_event_free(src_pe, e); + + return; + + break; + + case TW_net_asend: + /* Too late. We've already let MPI start to send + * this event over the network. We can't pull it + * back now without sending another message to do + * the cancel. + * + * Setting the cancel_q flag will signal us to do + * another message send once the current send of + * this message is completed. + */ + e->state.cancel_asend = 1; + break; + + case TW_pe_sevent_q: + /* Way late; the event was already sent and is in + * our sent event queue. Mark it as a cancel and + * place it at the front of the outq. + */ + e->state.cancel_q = 1; + tw_eventq_unshift(&outq, e); + break; + + default: + /* Huh? Where did you come from? Why are we being + * told about you? We did not send you so we cannot + * cancel you! + */ + tw_error( + TW_LOC, + "Don't know how to cancel event owned by %u", + e->state.owner); + } + + service_queues(src_pe); +} + +/** + * tw_net_statistics + * @brief Function to output the statistics + * @attention Notice that the MPI_Reduce "count" parameter is greater than one. + * We are reducing on multiple variables *simultaneously* so if you change + * this function or the struct tw_statistics, you must update the other. 
+ **/ +tw_statistics * +tw_net_statistics(tw_pe * me, tw_statistics * s) +{ + if(MPI_Reduce(&(s->s_max_run_time), + &me->stats.s_max_run_time, + 1, + MPI_DOUBLE, + MPI_MAX, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + + if(MPI_Reduce(&(s->s_net_events), + &me->stats.s_net_events, + 17, + MPI_UNSIGNED_LONG_LONG, + MPI_SUM, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + + if(MPI_Reduce(&s->s_min_detected_offset, + &me->stats.s_min_detected_offset, + 1, + MPI_DOUBLE, + MPI_MIN, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + + if(MPI_Reduce(&(s->s_total), + &me->stats.s_total, + 16, + MPI_UNSIGNED_LONG_LONG, + MPI_MAX, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + + if (MPI_Reduce(&s->s_events_past_end, + &me->stats.s_events_past_end, + 3, + MPI_UNSIGNED_LONG_LONG, + MPI_SUM, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + +#ifdef USE_RIO + if (MPI_Reduce(&s->s_rio_load, + &me->stats.s_rio_load, + 1, + MPI_UNSIGNED_LONG_LONG, + MPI_MAX, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + if (MPI_Reduce(&s->s_rio_lp_init, + &me->stats.s_rio_lp_init, + 1, + MPI_UNSIGNED_LONG_LONG, + MPI_MAX, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); +#endif + + return &me->stats; +} diff --git a/core/network-mpi.c b/core/network-mpi.c index 5ccf0adee..cd74232c6 100644 --- a/core/network-mpi.c +++ b/core/network-mpi.c @@ -1,5 +1,6 @@ #include #include +#include "ross.h" MPI_Comm MPI_COMM_ROSS = MPI_COMM_WORLD; int custom_communicator = 0; @@ -8,17 +9,25 @@ static long id_tmp; struct act_q { - const char *name; + const char *name; + + tw_event **event_list; + MPI_Request *req_list; + int *idx_list; + MPI_Status *status_list; + int *free_idx_list;//add, que of free indices + int *overflow_anti; - tw_event **event_list; - MPI_Request *req_list; - int *idx_list; - MPI_Status *status_list; #if ROSS_MEMORY - char **buffers; + char **buffers; #endif + unsigned int cur; + int front;//add, front of queue + int coda;//add, back of queue but back is already a variable somewhere + int size_of_fr_q;//add, size of queue array + int num_in_fr_q;//add, number of elements in queue + int reset_var;// a variable determining if the queue has been reset lately. - unsigned int cur; }; #define EVENT_TAG 1 @@ -37,74 +46,219 @@ static unsigned int read_buffer = 16; static unsigned int send_buffer = 1024; static int world_size = 1; +void deal_with_cur(struct act_q *q)// this is for MPI_testsome input +{ + if(q->cur < (q->size_of_fr_q-1))//checks to see if + { + q->cur++; + return; + } + else + { //not sure if best placement is here or in fr_q_chq. probably fr_q_chq. 
+ return; + } +} + +void old_fr_q_reset(struct act_q *q)//experimental +{ + if(q->num_in_fr_q == (q->size_of_fr_q-1)) //if the queue is filled with free + { + int i = 0; + while( i < q->cur)//resets all entries in the array so that they are properly ordered from one to cur + { + q->free_idx_list[i] = i; + i++; + } + //resets queue to default positions + q->front = 0; + q->coda = 0; + q->cur = 0; + + return; + } + else + { + return; + } + +} + +void fr_q_reset(struct act_q *q)//experimental +{ + if(q->num_in_fr_q == (q->size_of_fr_q-1))//if the queue is filled with free + { + //resets queue to default positions + q->reset_var = 1; + q->front = 0; + q->coda = 0; + q->cur = 0; + + return; + } + else + { + return; + } + +} + + +void fr_q_chq(struct act_q *q, int *frontOrCoda) //free index queue; check for modulating the front or back index of que +{ + if(*frontOrCoda != q->size_of_fr_q)//don't mess with queue + { + return;// return probably not necessary + } + else//mess with queue + { + q->reset_var = 0; + *frontOrCoda = 0; + return; + } +} + +void fr_q_aq(struct act_q *q, int ele) // free index queue; add to queue +{ + + q->free_idx_list[q->coda] = ele; + q->coda++; + q->num_in_fr_q++; + fr_q_chq(q,&q->coda);//wraps the queue array around + +} + + + +int fr_q_dq(struct act_q *q) // free index queue; dequeue +{ + int rv; + rv = q->free_idx_list[q->front]; + q->front++; + q->num_in_fr_q--;//can we get rid of this here? + fr_q_chq(q, &q->front);// wraps the queue array around + return rv; + +} + +int send_fr_q_dq(struct act_q *q) // free index queue; dequeue +{ + + int rv; + + if(q->reset_var == 0) // if not recently reset, take from front of queue + { + rv =q->free_idx_list[q->front]; + q->front++; + q->num_in_fr_q--; + fr_q_chq(q, &q->front);// wraps the queue array around + } + else //if recently reset, return q->front. 
This works because front will just give the numbers sequentially so we + { //don't need an explicit assignment + + rv = q->front; + q->front++; + q->num_in_fr_q--; + fr_q_chq( q, &q->front );// wraps the queue array around + + } + return rv; + +} + + static const tw_optdef mpi_opts[] = { - TWOPT_GROUP("ROSS MPI Kernel"), - TWOPT_UINT( - "read-buffer", - read_buffer, - "network read buffer size in # of events"), - TWOPT_UINT( - "send-buffer", - send_buffer, - "network send buffer size in # of events"), - TWOPT_END() + TWOPT_GROUP("ROSS MPI Kernel"), + TWOPT_UINT( + "read-buffer", + read_buffer, + "network read buffer size in # of events"), + TWOPT_UINT( + "send-buffer", + send_buffer, + "network send buffer size in # of events"), + TWOPT_END() }; // Forward declarations of functions used in MPI network message processing static int recv_begin(tw_pe *me); -static void recv_finish(tw_pe *me, tw_event *e, char * buffer); +static void recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q* q, int id); +static void late_recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q* q, int id); static int send_begin(tw_pe *me); -static void send_finish(tw_pe *me, tw_event *e, char * buffer); +static void send_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q* q, int id); // Start of implmentation of network processing routines/functions void tw_comm_set(MPI_Comm comm) { - MPI_COMM_ROSS = comm; - custom_communicator = 1; + MPI_COMM_ROSS = comm; + custom_communicator = 1; } const tw_optdef * tw_net_init(int *argc, char ***argv) { - int my_rank; + int my_rank; - int initialized; - MPI_Initialized(&initialized); + int initialized; + MPI_Initialized(&initialized); - if (!initialized) { - if (MPI_Init(argc, argv) != MPI_SUCCESS) - tw_error(TW_LOC, "MPI_Init failed."); - } - if (MPI_Comm_rank(MPI_COMM_ROSS, &my_rank) != MPI_SUCCESS) - tw_error(TW_LOC, "Cannot get MPI_Comm_rank(MPI_COMM_ROSS)"); + if (!initialized) { + if (MPI_Init(argc, argv) != MPI_SUCCESS) + tw_error(TW_LOC, "MPI_Init failed."); + } + if (MPI_Comm_rank(MPI_COMM_ROSS, &my_rank) != MPI_SUCCESS) + tw_error(TW_LOC, "Cannot get MPI_Comm_rank(MPI_COMM_ROSS)"); - g_tw_masternode = 0; - g_tw_mynode = my_rank; + g_tw_masternode = 0; + g_tw_mynode = my_rank; - return mpi_opts; + return mpi_opts; } static void init_q(struct act_q *q, const char *name) { - unsigned int n; + unsigned int n; #if ROSS_MEMORY - unsigned int i; + unsigned int i; #endif - if(q == &posted_sends) - n = send_buffer; - else - n = read_buffer; + if(q == &posted_sends) + { + q->reset_var = 1; + n = send_buffer; + } + else + { + q->reset_var = 0; + + n = read_buffer; + } + q->name = name; + q->event_list = (tw_event **) tw_calloc(TW_LOC, name, sizeof(*q->event_list), n); + q->req_list = (MPI_Request *) tw_calloc(TW_LOC, name, sizeof(*q->req_list), n); + q->idx_list = (int *) tw_calloc(TW_LOC, name, sizeof(*q->idx_list), n); + q->status_list = (MPI_Status *) tw_calloc(TW_LOC, name, sizeof(*q->status_list), n); + //can I shrink this initialization? 
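+    /* Free-index ring layout (sketch): n+1 slots so that front == coda can
+     * only mean "empty", never "full".
+     *
+     *   free_idx_list: [ 0 ][ 1 ] ... [ n-1 ][ spare ]
+     *                    ^front                ^coda, wraps to 0 at size_of_fr_q
+     *
+     * fr_q_aq() writes at coda and advances it; fr_q_dq() reads at front and
+     * advances it; fr_q_chq() performs the wraparound for either index.
+     */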
+    q->free_idx_list = (int *) tw_calloc(TW_LOC, name, sizeof(*q->idx_list), n+1);// ring of free slot indices; n+1 entries so it can never fill completely
+    q->overflow_anti = (int *) tw_calloc(TW_LOC, name, sizeof(*q->idx_list), (n/2)+2);// at most n/2 slots can be out of order; element 0 is the next free position (count+1)
+    q->front = 0;// front of queue
+    q->coda = 0;// end of queue
+    q->size_of_fr_q = n+1;// for wraparound
+    q->reset_var = 1;
+    q->num_in_fr_q = 0; // number of elements in queue
+
+    int i = 0;
+    while(i < n)
+    {
+        fr_q_aq(q, i);
+        i++;
+    }
+    q->overflow_anti[0]=1;
+//    q->num_in_fr_q = n;// number of elements in queue
 
-    q->name = name;
-    q->event_list = (tw_event **) tw_calloc(TW_LOC, name, sizeof(*q->event_list), n);
-    q->req_list = (MPI_Request *) tw_calloc(TW_LOC, name, sizeof(*q->req_list), n);
-    q->idx_list = (int *) tw_calloc(TW_LOC, name, sizeof(*q->idx_list), n);
-    q->status_list = (MPI_Status *) tw_calloc(TW_LOC, name, sizeof(*q->status_list), n);
 #if ROSS_MEMORY
-    q->buffers = tw_calloc(TW_LOC, name, sizeof(*q->buffers), n);
+    q->buffers = tw_calloc(TW_LOC, name, sizeof(*q->buffers), n);
 
     for(i = 0; i < n; i++)
         q->buffers[i] = tw_calloc(TW_LOC, "", TW_MEMORY_BUFFER_SIZE, 1);
@@ -112,210 +266,279 @@ init_q(struct act_q *q, const char *name)
 }
 
 tw_node *
 tw_net_onnode(tw_peid gid)
 {
-    id_tmp = gid;
-    return &id_tmp;
+    id_tmp = gid;
+    return &id_tmp;
 }
 
 unsigned int
 tw_nnodes(void)
 {
-    return world_size;
+    return world_size;
 }
 
 void
 tw_net_start(void)
 {
-    if (MPI_Comm_size(MPI_COMM_ROSS, &world_size) != MPI_SUCCESS)
-        tw_error(TW_LOC, "Cannot get MPI_Comm_size(MPI_COMM_ROSS)");
+    if (MPI_Comm_size(MPI_COMM_ROSS, &world_size) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Cannot get MPI_Comm_size(MPI_COMM_ROSS)");
 
-    if( g_tw_mynode == 0)
+    if( g_tw_mynode == 0)
     {
-        printf("tw_net_start: Found world size to be %d \n", world_size );
+        printf("tw_net_start: Found world size to be %d \n", world_size );
     }
 
-    // Check after tw_nnodes is defined
-    if(tw_nnodes() == 1 && g_tw_npe == 1) {
-        // force the setting of SEQUENTIAL protocol
-        if (g_tw_synchronization_protocol == NO_SYNCH) {
-            g_tw_synchronization_protocol = SEQUENTIAL;
-        } else if(g_tw_synchronization_protocol == CONSERVATIVE || g_tw_synchronization_protocol == OPTIMISTIC) {
-            g_tw_synchronization_protocol = SEQUENTIAL;
-            fprintf(stderr, "Warning: Defaulting to Sequential Simulation, not enought PEs defined.\n");
-        }
-    }
+    // Check after tw_nnodes is defined
+    if(tw_nnodes() == 1 && g_tw_npe == 1) {
+        // force the setting of SEQUENTIAL protocol
+        if (g_tw_synchronization_protocol == NO_SYNCH) {
+            g_tw_synchronization_protocol = SEQUENTIAL;
+        } else if(g_tw_synchronization_protocol == CONSERVATIVE || g_tw_synchronization_protocol == OPTIMISTIC) {
+            g_tw_synchronization_protocol = SEQUENTIAL;
+            fprintf(stderr, "Warning: Defaulting to Sequential Simulation, not enough PEs defined.\n");
+        }
+    }
 
-    tw_pe_create(1);
-    tw_pe_init(0, g_tw_mynode);
+    tw_pe_create(1);
+    tw_pe_init(0, g_tw_mynode);
 
-    //If we're in (some variation of) optimistic mode, we need this hash
-    if (g_tw_synchronization_protocol == OPTIMISTIC ||
-        g_tw_synchronization_protocol == OPTIMISTIC_DEBUG ||
-        g_tw_synchronization_protocol == OPTIMISTIC_REALTIME) {
-        g_tw_pe[0]->hash_t = tw_hash_create();
-    } else {
+    //If we're in (some variation of) optimistic mode, we need this hash
+    if (g_tw_synchronization_protocol == OPTIMISTIC ||
+        g_tw_synchronization_protocol == OPTIMISTIC_DEBUG ||
+        g_tw_synchronization_protocol == OPTIMISTIC_REALTIME) {
+        g_tw_pe[0]->hash_t = tw_hash_create();
+    } else {
+        
g_tw_pe[0]->hash_t = NULL; + } - if (send_buffer < 1) - tw_error(TW_LOC, "network send buffer must be >= 1"); - if (read_buffer < 1) - tw_error(TW_LOC, "network read buffer must be >= 1"); + if (send_buffer < 1) + tw_error(TW_LOC, "network send buffer must be >= 1"); + if (read_buffer < 1) + tw_error(TW_LOC, "network read buffer must be >= 1"); - init_q(&posted_sends, "MPI send queue"); - init_q(&posted_recvs, "MPI recv queue"); + init_q(&posted_sends, "MPI send queue"); + init_q(&posted_recvs, "MPI recv queue"); - g_tw_net_device_size = read_buffer; + g_tw_net_device_size = read_buffer; - // pre-post all the Irecv operations - recv_begin( g_tw_pe[0] ); + // pre-post all the Irecv operations + recv_begin( g_tw_pe[0] ); } void tw_net_abort(void) { - MPI_Abort(MPI_COMM_ROSS, 1); - exit(1); + MPI_Abort(MPI_COMM_ROSS, 1); + exit(1); } void tw_net_stop(void) { - if (!custom_communicator) { - if (MPI_Finalize() != MPI_SUCCESS) - tw_error(TW_LOC, "Failed to finalize MPI"); - } + if (!custom_communicator) { + if (MPI_Finalize() != MPI_SUCCESS) + tw_error(TW_LOC, "Failed to finalize MPI"); + } } void tw_net_barrier(tw_pe * pe) { - if (MPI_Barrier(MPI_COMM_ROSS) != MPI_SUCCESS) - tw_error(TW_LOC, "Failed to wait for MPI_Barrier"); + if (MPI_Barrier(MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Failed to wait for MPI_Barrier"); } tw_stime tw_net_minimum(tw_pe *me) { - tw_stime m = DBL_MAX; - tw_event *e; - int i; - - e = outq.head; - while (e) { - if (m > e->recv_ts) - m = e->recv_ts; - e = e->next; - } - - for (i = 0; i < posted_sends.cur; i++) { - e = posted_sends.event_list[i]; - if (m > e->recv_ts) - m = e->recv_ts; - } - - return m; + tw_stime m = DBL_MAX; + tw_event *e; + int i; + + e = outq.head; + while (e) { + if (m > e->recv_ts) + m = e->recv_ts; + e = e->next; + } + + for (i = 0; i < posted_sends.cur; i++) { //fix this line (?) 
+ e = posted_sends.event_list[i]; + if(e == NULL) + {} + else if(m > e->recv_ts) + m = e->recv_ts; + else + {} + } + + return m; } static int -test_q( - struct act_q *q, - tw_pe *me, - void (*finish)(tw_pe *, tw_event *, char *)) +test_q_recv( + struct act_q * q, + tw_pe *me, + void (*finish)(tw_pe *, tw_event *, char *, struct act_q*, int id)) { - int ready, i, n; + int ready, i=0, n, indicator; + indicator = 1; #if ROSS_MEMORY - char *tmp; + char *tmp; #endif - if (!q->cur) - return 0; - if (MPI_Testsome( - q->cur, - q->req_list, - &ready, - q->idx_list, - q->status_list) != MPI_SUCCESS) { - tw_error( - TW_LOC, - "MPI_testsome failed with %u items in %s", - q->cur, - q->name); - } + if( q->num_in_fr_q == ((q->size_of_fr_q)-1) ) + return 0; + + if (MPI_Testsome( + q->cur, + q->req_list, + &ready, + q->idx_list, + q->status_list) != MPI_SUCCESS) { + tw_error( + TW_LOC, + "MPI_testsome failed with %u items in %s", + q->cur, + q->name); + } + + if (1 > ready) + return 0; - if (1 > ready) - return 0; + q->overflow_anti[0]=1; +// q->num_in_fr_q+=ready; - for (i = 0; i < ready; i++) + while ( i < ready) { - tw_event *e; - n = q->idx_list[i]; - e = q->event_list[n]; - q->event_list[n] = NULL; + tw_event *e; + n = q->idx_list[i]; + e = q->event_list[n]; + fr_q_aq(q, n); //add n onto queue #if ROSS_MEMORY - finish(me, e, q->buffers[n]); + finish(me, e, q->buffers[n], q, n); #else - finish(me, e, NULL); + finish(me, e, NULL, q, n); +#endif + if (indicator != q->overflow_anti[0]) + { + indicator = q->overflow_anti[0]; + } + else + { + q->event_list[n] = NULL; + } + i++; + } + + i = 1; // first element of q->overflow_anti is the number of + + while (i < q->overflow_anti[0])//takes care of out of order messages + { + + tw_event *e; + n = q->overflow_anti[i]; + e = q->event_list[n]; + q->event_list[n] = NULL; + late_recv_finish(me, e, NULL, q, n); + //might need an augmented version for ROSS_MEMORY? + i++; + } + +// V breaks everything. +// fr_q_reset(q); + + + return 1; +} + + +static int +test_q_send( + struct act_q * q, + tw_pe *me, + void (*finish)(tw_pe *, tw_event *, char *, struct act_q*, int id)) +{ + int ready, i=0, n; + +#if ROSS_MEMORY + char *tmp; #endif + + + if( q->num_in_fr_q == ((q->size_of_fr_q)-1) ) + return 0; + + if (MPI_Testsome( + q->cur, + q->req_list, + &ready, + q->idx_list, + q->status_list) != MPI_SUCCESS) { + tw_error( + TW_LOC, + "MPI_testsome failed with %u items in %s", + q->cur, + q->name); } - /* Collapse the lists to remove any holes we left. */ - for (i = 0, n = 0; i < q->cur; i++) - { - if (q->event_list[i]) + if (1 > ready) + return 0; + + + while(i < ready) { - if (i != n) - { - // swap the event pointers - q->event_list[n] = q->event_list[i]; - - // copy the request handles - memcpy( - &q->req_list[n], - &q->req_list[i], - sizeof(q->req_list[0])); - + + tw_event *e; + + n = q->idx_list[i]; + e = q->event_list[n]; + fr_q_aq(q, n);//add n onto queue + q->event_list[n] = NULL; + i++; + #if ROSS_MEMORY - // swap the buffers - tmp = q->buffers[n]; - q->buffers[n] = q->buffers[i]; - q->buffers[i] = tmp; + finish(me, e, q->buffers[n], q, n); +#else + finish(me, e, NULL, q, n); #endif - } // endif (i != n) - n++; - } // endif (q->event_list[i]) - } - q->cur -= ready; + } + + + // q->num_in_fr_q+=ready; +// after all elements are removed from queue, checks if queue is empty and resets ordering if so. 
+    fr_q_reset(q);
-    return 1;
+    return 1;
 }
 
 static int
 recv_begin(tw_pe *me)
 {
-    MPI_Status status;
+    MPI_Status status;
-    tw_event *e = NULL;
+    tw_event *e = NULL;
-    int flag = 0;
-    int changed = 0;
+    int flag = 0;
+    int changed = 0;
-    while (posted_recvs.cur < read_buffer)
+    while (0 < posted_recvs.num_in_fr_q)//fix these lines
     {
-        unsigned id = posted_recvs.cur;
-        if(!(e = tw_event_grab(me)))
-        {
-            if(tw_gvt_inprogress(me))
-                tw_error(TW_LOC, "Out of events in GVT! Consider increasing --extramem");
-            return changed;
-        }
+        if(!(e = tw_event_grab(me)))
+        {
+            if(tw_gvt_inprogress(me))
+                tw_error(TW_LOC, "Out of events in GVT! Consider increasing --extramem");
+            return changed;
+        }
+
+        int id = fr_q_dq(&posted_recvs);
 
 #if ROSS_MEMORY
-        if( MPI_Irecv(posted_recvs.buffers[id],
+        if( MPI_Irecv(posted_recvs.buffers[id],
                EVENT_SIZE(e),
                MPI_BYTE,
                MPI_ANY_SOURCE,
@@ -323,37 +546,35 @@ recv_begin(tw_pe *me)
                MPI_COMM_ROSS,
                &posted_recvs.req_list[id]) != MPI_SUCCESS)
 #else
-        if( MPI_Irecv(e,
-               (int)EVENT_SIZE(e),
-               MPI_BYTE,
-               MPI_ANY_SOURCE,
-               EVENT_TAG,
-               MPI_COMM_ROSS,
-               &posted_recvs.req_list[id]) != MPI_SUCCESS)
+        if( MPI_Irecv(e,
+               (int)EVENT_SIZE(e),
+               MPI_BYTE,
+               MPI_ANY_SOURCE,
+               EVENT_TAG,
+               MPI_COMM_ROSS,
+               &posted_recvs.req_list[id]) != MPI_SUCCESS)
 #endif
-        {
-            tw_event_free(me, e);
-            return changed;
-        }
-
-        posted_recvs.event_list[id] = e;
-        posted_recvs.cur++;
-        changed = 1;
+        {
+            tw_event_free(me, e);
+            return changed;
+        }
+
+        posted_recvs.event_list[id] = e;
+        deal_with_cur(&posted_recvs);
+        changed = 1;
     }
-
-    return changed;
+    posted_recvs.num_in_fr_q = 0;
+    return changed;
 }
+
 static void
-recv_finish(tw_pe *me, tw_event *e, char * buffer)
+late_recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q * q, int id )
 {
-    tw_pe *dest_pe;
-    tw_clock start;
-
+    /*
 #if ROSS_MEMORY
-    tw_memory *memory;
+    tw_memory *memory;
     tw_memory *last;
-    tw_fd mem_fd;
     size_t mem_size;
@@ -363,66 +584,129 @@ recv_finish(tw_pe *me, tw_event *e, char * buffer)
     memcpy(e, buffer, g_tw_event_msg_sz);
     position += g_tw_event_msg_sz;
 #endif
+    */
-    me->stats.s_nread_network++;
-    me->s_nwhite_recv++;
+    /*
+    if(e->send_pe > tw_nnodes()-1)
+        tw_error(TW_LOC, "bad sendpe_id: %d", e->send_pe);
-    // printf("recv_finish: remote event [cancel %u] FROM: LP %lu, PE %lu, TO: LP %lu, PE %lu at TS %lf \n",
-    //    e->state.cancel_q, (tw_lpid)e->src_lp, e->send_pe, (tw_lpid)e->dest_lp, me->id, e->recv_ts);
-    e->dest_lp = tw_getlocal_lp((tw_lpid) e->dest_lp);
-    dest_pe = e->dest_lp->pe;
-    // instrumentation
-    e->dest_lp->kp->kp_stats->s_nread_network++;
-    e->dest_lp->lp_stats->s_nread_network++;
+    if(e->recv_ts < me->GVT)
+        tw_error(TW_LOC, "%d: Received straggler from %d: %lf (%d)",
+            me->id, e->send_pe, e->recv_ts, e->state.cancel_q);
-    if(e->send_pe > tw_nnodes()-1)
-        tw_error(TW_LOC, "bad sendpe_id: %d", e->send_pe);
+    if(tw_gvt_inprogress(me))
+        me->trans_msg_ts = ROSS_MIN(me->trans_msg_ts, e->recv_ts);
-    e->cancel_next = NULL;
-    e->caused_by_me = NULL;
-    e->cause_next = NULL;
+    // if cancel event, retrieve and flush
+    // else, store in hash table
+    */
+    // NOTE: it is possible to cancel the event we
+    // are currently processing at this PE since this
+    // MPI module lets me read cancel events during
+    // event sends over the network.
+ tw_pe *dest_pe; + dest_pe = e->dest_lp->pe; + tw_event *cancel = tw_hash_remove(me->hash_t, e, e->send_pe); + g_tw_pe[0]->avl_tree_size++; - if(e->recv_ts < me->GVT) - tw_error(TW_LOC, "%d: Received straggler from %d: %lf (%d)", - me->id, e->send_pe, e->recv_ts, e->state.cancel_q); + cancel->state.cancel_q = 1; + cancel->state.remote = 0; + cancel->cancel_next = dest_pe->cancel_q; + dest_pe->cancel_q = cancel; + tw_event_free(me, e); - if(tw_gvt_inprogress(me)) - me->trans_msg_ts = ROSS_MIN(me->trans_msg_ts, e->recv_ts); + return; - // if cancel event, retrieve and flush - // else, store in hash table - if(e->state.cancel_q) - { - tw_event *cancel = tw_hash_remove(me->hash_t, e, e->send_pe); +} - // NOTE: it is possible to cancel the event we - // are currently processing at this PE since this - // MPI module lets me read cancel events during - // event sends over the network. +static void +recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q * q, int id ) +{ + tw_pe *dest_pe; + tw_clock start; + +#if ROSS_MEMORY + tw_memory *memory; + tw_memory *last; + tw_fd mem_fd; - cancel->state.cancel_q = 1; - cancel->state.remote = 0; + size_t mem_size; + + unsigned position = 0; - cancel->cancel_next = dest_pe->cancel_q; - dest_pe->cancel_q = cancel; + memcpy(e, buffer, g_tw_event_msg_sz); + position += g_tw_event_msg_sz; +#endif + me->stats.s_nread_network++; + me->s_nwhite_recv++; + e->dest_lp = tw_getlocal_lp((tw_lpid) e->dest_lp); + dest_pe = e->dest_lp->pe; - tw_event_free(me, e); - return; + // instrumentation + e->dest_lp->kp->kp_stats->s_nread_network++; + e->dest_lp->lp_stats->s_nread_network++; + + e->cancel_next = NULL; + e->caused_by_me = NULL; + e->cause_next = NULL; + + if(e->send_pe > tw_nnodes()-1) + tw_error(TW_LOC, "bad sendpe_id: %d", e->send_pe); + + + if(e->recv_ts < me->GVT) + tw_error(TW_LOC, "%d: Received straggler from %d: %lf (%d)", + me->id, e->send_pe, e->recv_ts, e->state.cancel_q); + + if(tw_gvt_inprogress(me)) + me->trans_msg_ts = ROSS_MIN(me->trans_msg_ts, e->recv_ts); + + // if cancel event, retrieve and flush + // else, store in hash table + + if(e->state.cancel_q) + { + + tw_event *cancel = tw_hash_remove(me->hash_t, e, e->send_pe); + + // NOTE: it is possible to cancel the event we + // are currently processing at this PE since this + // MPI module lets me read cancel events during + // event sends over the network. 
+ + if(cancel!=NULL) + { + + cancel->state.cancel_q = 1; + cancel->state.remote = 0; + cancel->cancel_next = dest_pe->cancel_q; + dest_pe->cancel_q = cancel; + tw_event_free(me, e); + } + else + { + q->overflow_anti[q->overflow_anti[0]] = id; //add id stuff later + q->overflow_anti[0]++; + } + + return; } - if (g_tw_synchronization_protocol == OPTIMISTIC || - g_tw_synchronization_protocol == OPTIMISTIC_DEBUG || - g_tw_synchronization_protocol == OPTIMISTIC_REALTIME ) { - tw_hash_insert(me->hash_t, e, e->send_pe); - e->state.remote = 1; - } + + + if (g_tw_synchronization_protocol == OPTIMISTIC || + g_tw_synchronization_protocol == OPTIMISTIC_DEBUG || + g_tw_synchronization_protocol == OPTIMISTIC_REALTIME ) { + tw_hash_insert(me->hash_t, e, e->send_pe); + e->state.remote = 1; + } #if ROSS_MEMORY - mem_size = (size_t) e->memory; + mem_size = (size_t) e->memory; mem_fd = (tw_fd) e->prev; last = NULL; @@ -448,60 +732,58 @@ recv_finish(tw_pe *me, tw_event *e, char * buffer) } #endif - /* NOTE: the final check in the if conditional below was added to make sure - * that we do not execute the fast case unless the cancellation queue is - * empty on the destination PE. Otherwise we need to invoke the normal - * scheduling routines to make sure that a forward event doesn't bypass a - * cancellation event with an earlier timestamp. This is helpful for - * stateful models that produce incorrect results when presented with - * duplicate messages with no rollback between them. - */ - if(me == dest_pe && e->dest_lp->kp->last_time <= e->recv_ts && !dest_pe->cancel_q) { - /* Fast case, we are sending to our own PE and - * there is no rollback caused by this send. + /* NOTE: the final check in the if conditional below was added to make sure + * that we do not execute the fast case unless the cancellation queue is + * empty on the destination PE. Otherwise we need to invoke the normal + * scheduling routines to make sure that a forward event doesn't bypass a + * cancellation event with an earlier timestamp. This is helpful for + * stateful models that produce incorrect results when presented with + * duplicate messages with no rollback between them. */ - start = tw_clock_read(); - tw_pq_enqueue(dest_pe->pq, e); - dest_pe->stats.s_pq += tw_clock_read() - start; - return; - } + if(me == dest_pe && e->dest_lp->kp->last_time <= e->recv_ts && !dest_pe->cancel_q) { + /* Fast case, we are sending to our own PE and + * there is no rollback caused by this send. + */ + start = tw_clock_read(); + tw_pq_enqueue(dest_pe->pq, e); + dest_pe->stats.s_pq += tw_clock_read() - start; + return; + } - if (me->node == dest_pe->node) { - /* Slower, but still local send, so put into top - * of dest_pe->event_q. + if (me->node == dest_pe->node) { + /* Slower, but still local send, so put into top + * of dest_pe->event_q. + */ + e->state.owner = TW_pe_event_q; + tw_eventq_push(&dest_pe->event_q, e); + return; + } + + /* Never should happen; MPI should have gotten the + * message to the correct node without needing us + * to redirect the message there for it. This is + * probably a serious bug with the event headers + * not being formatted right. */ - e->state.owner = TW_pe_event_q; - tw_eventq_push(&dest_pe->event_q, e); - return; - } - - /* Never should happen; MPI should have gotten the - * message to the correct node without needing us - * to redirect the message there for it. This is - * probably a serious bug with the event headers - * not being formatted right. 
- */ - tw_error( - TW_LOC, - "Event recived by PE %u but meant for PE %u", - me->id, - dest_pe->id); + tw_error( + TW_LOC, + "Event received by PE %u but meant for PE %u", + me->id, + dest_pe->id); } static int send_begin(tw_pe *me) { - int changed = 0; + int changed = 0; - while (posted_sends.cur < send_buffer) + while (0 < posted_sends.num_in_fr_q) { - tw_event *e = tw_eventq_peek(&outq); - tw_node *dest_node = NULL; - - unsigned id = posted_sends.cur; + tw_event *e = tw_eventq_peek(&outq);//next event + tw_node *dest_node = NULL; #if ROSS_MEMORY - tw_event *tmp_prev = NULL; + tw_event *tmp_prev = NULL; tw_lp *tmp_lp = NULL; @@ -515,23 +797,24 @@ send_begin(tw_pe *me) unsigned position = 0; #endif - if (!e) - break; + if (!e) + break; - if(e == me->abort_event) - tw_error(TW_LOC, "Sending abort event!"); + if(e == me->abort_event) + tw_error(TW_LOC, "Sending abort event!"); - dest_node = tw_net_onnode((*e->src_lp->type->map) - ((tw_lpid) e->dest_lp)); + int id = send_fr_q_dq(&posted_sends);// fixed, grabs from front of queue, moves front up one element + dest_node = tw_net_onnode((*e->src_lp->type->map) + ((tw_lpid) e->dest_lp)); - //if(!e->state.cancel_q) - //e->event_id = (tw_eventid) ++me->seq_num; + //if(!e->state.cancel_q) + //e->event_id = (tw_eventid) ++me->seq_num; - e->send_pe = (tw_peid) g_tw_mynode; - e->send_lp = e->src_lp->gid; + e->send_pe = (tw_peid) g_tw_mynode; + e->send_lp = e->src_lp->gid; #if ROSS_MEMORY - // pack pointers + // pack pointers tmp_prev = e->prev; tmp_lp = e->src_lp; @@ -592,94 +875,94 @@ send_begin(tw_pe *me) return changed; } #else - if (MPI_Isend(e, - (int)EVENT_SIZE(e), - MPI_BYTE, - (int)*dest_node, - EVENT_TAG, - MPI_COMM_ROSS, - &posted_sends.req_list[id]) != MPI_SUCCESS) { - return changed; - } + if (MPI_Isend(e, + (int)EVENT_SIZE(e), + MPI_BYTE, + (int)*dest_node, + EVENT_TAG, + MPI_COMM_ROSS, + &posted_sends.req_list[id]) != MPI_SUCCESS) { + return changed; + } #endif - tw_eventq_pop(&outq); - e->state.owner = e->state.cancel_q - ? TW_net_acancel - : TW_net_asend; + tw_eventq_pop(&outq); + e->state.owner = e->state.cancel_q + ? TW_net_acancel + : TW_net_asend; - posted_sends.event_list[id] = e; - posted_sends.cur++; - me->s_nwhite_sent++; + posted_sends.event_list[id] = e; + deal_with_cur(&posted_sends); - changed = 1; + me->s_nwhite_sent++; + changed = 1; } - return changed; + return changed; } static void -send_finish(tw_pe *me, tw_event *e, char * buffer) +send_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q * q, int id) { - me->stats.s_nsend_network++; - // instrumentation - e->src_lp->kp->kp_stats->s_nsend_network++; - e->src_lp->lp_stats->s_nsend_network++; - - if (e->state.owner == TW_net_asend) { - if (e->state.cancel_asend) { - /* Event was cancelled during transmission. We must - * send another message to pass the cancel flag to - * the other node. - */ - e->state.cancel_asend = 0; - e->state.cancel_q = 1; - tw_eventq_push(&outq, e); - } else { - /* Event finished transmission and was not cancelled. - * Add to our sent event queue so we can retain the - * event in case we need to cancel it later. Note it - * is currently in remote format and must be converted - * back to local format for fossil collection. 
- */ - e->state.owner = TW_pe_sevent_q; - if( g_tw_synchronization_protocol == CONSERVATIVE ) - tw_event_free(me, e); + me->stats.s_nsend_network++; + // instrumentation + e->src_lp->kp->kp_stats->s_nsend_network++; + e->src_lp->lp_stats->s_nsend_network++; + + if (e->state.owner == TW_net_asend) { + if (e->state.cancel_asend) { + /* Event was cancelled during transmission. We must + * send another message to pass the cancel flag to + * the other node. + */ + e->state.cancel_asend = 0; + e->state.cancel_q = 1; + tw_eventq_push(&outq, e); + } else { + /* Event finished transmission and was not cancelled. + * Add to our sent event queue so we can retain the + * event in case we need to cancel it later. Note it + * is currently in remote format and must be converted + * back to local format for fossil collection. + */ + e->state.owner = TW_pe_sevent_q; + if( g_tw_synchronization_protocol == CONSERVATIVE ) + tw_event_free(me, e); + } + + return; } - return; - } + if (e->state.owner == TW_net_acancel) { + /* We just finished sending the cancellation message + * for this event. We need to free the buffer and + * make it available for reuse. + */ + tw_event_free(me, e); + return; + } - if (e->state.owner == TW_net_acancel) { - /* We just finished sending the cancellation message - * for this event. We need to free the buffer and - * make it available for reuse. + /* Never should happen, not unless we somehow broke this + * module's other functions related to sending an event. */ - tw_event_free(me, e); - return; - } - - /* Never should happen, not unless we somehow broke this - * module's other functions related to sending an event. - */ - tw_error( - TW_LOC, - "Don't know how to finish send of owner=%u, cancel_q=%d", - e->state.owner, - e->state.cancel_q); + tw_error( + TW_LOC, + "Don't know how to finish send of owner=%u, cancel_q=%d", + e->state.owner, + e->state.cancel_q); } static void service_queues(tw_pe *me) { - int changed; - do { - changed = test_q(&posted_recvs, me, recv_finish); - changed |= test_q(&posted_sends, me, send_finish); - changed |= recv_begin(me); - changed |= send_begin(me); - } while (changed); + int changed; + do { + changed = test_q_recv(&posted_recvs, me, recv_finish); + changed |= test_q_send(&posted_sends, me, send_finish); + changed |= recv_begin(me); + changed |= send_begin(me); + } while (changed); } /* @@ -691,78 +974,78 @@ service_queues(tw_pe *me) void tw_net_read(tw_pe *me) { - service_queues(me); + service_queues(me); } void tw_net_send(tw_event *e) { - tw_pe * me = e->src_lp->pe; - int changed = 0; + tw_pe * me = e->src_lp->pe; + int changed = 0; - e->state.remote = 0; - e->state.owner = TW_net_outq; - tw_eventq_unshift(&outq, e); + e->state.remote = 0; + e->state.owner = TW_net_outq; + tw_eventq_unshift(&outq, e); - do + do { - changed = test_q(&posted_sends, me, send_finish); - changed |= send_begin(me); + changed = test_q_send(&posted_sends, me, send_finish); + changed |= send_begin(me); } while (changed); } void tw_net_cancel(tw_event *e) { - tw_pe *src_pe = e->src_lp->pe; - - switch (e->state.owner) { - case TW_net_outq: - /* Cancelled before we could transmit it. Do not - * transmit the event and instead just release the - * buffer back into our own free list. - */ - tw_eventq_delete_any(&outq, e); - tw_event_free(src_pe, e); - - return; - - break; - - case TW_net_asend: - /* Too late. We've already let MPI start to send - * this event over the network. We can't pull it - * back now without sending another message to do - * the cancel. 
- * - * Setting the cancel_q flag will signal us to do - * another message send once the current send of - * this message is completed. - */ - e->state.cancel_asend = 1; - break; - - case TW_pe_sevent_q: - /* Way late; the event was already sent and is in - * our sent event queue. Mark it as a cancel and - * place it at the front of the outq. - */ - e->state.cancel_q = 1; - tw_eventq_unshift(&outq, e); - break; - - default: - /* Huh? Where did you come from? Why are we being - * told about you? We did not send you so we cannot - * cancel you! - */ - tw_error( - TW_LOC, - "Don't know how to cancel event owned by %u", - e->state.owner); - } + tw_pe *src_pe = e->src_lp->pe; + + switch (e->state.owner) { + case TW_net_outq: + /* Cancelled before we could transmit it. Do not + * transmit the event and instead just release the + * buffer back into our own free list. + */ + tw_eventq_delete_any(&outq, e); + tw_event_free(src_pe, e); + + return; + + break; + + case TW_net_asend: + /* Too late. We've already let MPI start to send + * this event over the network. We can't pull it + * back now without sending another message to do + * the cancel. + * + * Setting the cancel_q flag will signal us to do + * another message send once the current send of + * this message is completed. + */ + e->state.cancel_asend = 1; + break; + + case TW_pe_sevent_q: + /* Way late; the event was already sent and is in + * our sent event queue. Mark it as a cancel and + * place it at the front of the outq. + */ + e->state.cancel_q = 1; + tw_eventq_unshift(&outq, e); + break; + + default: + /* Huh? Where did you come from? Why are we being + * told about you? We did not send you so we cannot + * cancel you! + */ + tw_error( + TW_LOC, + "Don't know how to cancel event owned by %u", + e->state.owner); + } - service_queues(src_pe); + service_queues(src_pe); } /** @@ -775,50 +1058,50 @@ tw_net_cancel(tw_event *e) tw_statistics * tw_net_statistics(tw_pe * me, tw_statistics * s) { - if(MPI_Reduce(&(s->s_max_run_time), - &me->stats.s_max_run_time, - 1, - MPI_DOUBLE, - MPI_MAX, - (int)g_tw_masternode, - MPI_COMM_ROSS) != MPI_SUCCESS) - tw_error(TW_LOC, "Unable to reduce statistics!"); - - if(MPI_Reduce(&(s->s_net_events), - &me->stats.s_net_events, - 17, - MPI_UNSIGNED_LONG_LONG, - MPI_SUM, - (int)g_tw_masternode, - MPI_COMM_ROSS) != MPI_SUCCESS) - tw_error(TW_LOC, "Unable to reduce statistics!"); - - if(MPI_Reduce(&s->s_min_detected_offset, - &me->stats.s_min_detected_offset, - 1, - MPI_DOUBLE, - MPI_MIN, - (int)g_tw_masternode, - MPI_COMM_ROSS) != MPI_SUCCESS) - tw_error(TW_LOC, "Unable to reduce statistics!"); - - if(MPI_Reduce(&(s->s_total), - &me->stats.s_total, - 16, - MPI_UNSIGNED_LONG_LONG, - MPI_MAX, - (int)g_tw_masternode, - MPI_COMM_ROSS) != MPI_SUCCESS) - tw_error(TW_LOC, "Unable to reduce statistics!"); + if(MPI_Reduce(&(s->s_max_run_time), + &me->stats.s_max_run_time, + 1, + MPI_DOUBLE, + MPI_MAX, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + + if(MPI_Reduce(&(s->s_net_events), + &me->stats.s_net_events, + 17, + MPI_UNSIGNED_LONG_LONG, + MPI_SUM, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + + if(MPI_Reduce(&s->s_min_detected_offset, + &me->stats.s_min_detected_offset, + 1, + MPI_DOUBLE, + MPI_MIN, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + + if(MPI_Reduce(&(s->s_total), + &me->stats.s_total, + 16, + 
MPI_UNSIGNED_LONG_LONG,
+        MPI_MAX,
+        (int)g_tw_masternode,
+        MPI_COMM_ROSS) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Unable to reduce statistics!");
 
     if (MPI_Reduce(&s->s_events_past_end,
-        &me->stats.s_events_past_end,
-        3,
-        MPI_UNSIGNED_LONG_LONG,
-        MPI_SUM,
-        (int)g_tw_masternode,
-        MPI_COMM_ROSS) != MPI_SUCCESS)
-        tw_error(TW_LOC, "Unable to reduce statistics!");
+        &me->stats.s_events_past_end,
+        3,
+        MPI_UNSIGNED_LONG_LONG,
+        MPI_SUM,
+        (int)g_tw_masternode,
+        MPI_COMM_ROSS) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Unable to reduce statistics!");
 
 #ifdef USE_RIO
     if (MPI_Reduce(&s->s_rio_load,
@@ -839,5 +1122,6 @@ tw_net_statistics(tw_pe * me, tw_statistics * s)
         tw_error(TW_LOC, "Unable to reduce statistics!");
 #endif
 
-    return &me->stats;
+    return &me->stats;
 }
+
diff --git a/core/queue-network-mpi.c b/core/queue-network-mpi.c
new file mode 100644
index 000000000..9ebdb800a
--- /dev/null
+++ b/core/queue-network-mpi.c
@@ -0,0 +1,1055 @@
+#include <mpi.h>
+#include <float.h>
+#include "ross.h"
+
+MPI_Comm MPI_COMM_ROSS = MPI_COMM_WORLD;
+int custom_communicator = 0;
+
+static long id_tmp;
+
+struct act_q
+{
+    const char *name;
+
+    tw_event **event_list;
+    MPI_Request *req_list;
+    int *idx_list;
+    MPI_Status *status_list;
+    int *free_idx_list;//add, queue of free indices
+    int *overflow_anti;
+
+#if ROSS_MEMORY
+    char **buffers;
+#endif
+    unsigned int cur;
+    unsigned int front;//add, front of queue
+    //int coda;//add, back of queue but back is already a variable somewhere
+    int size_of_fr_q;//add, size of queue array
+    int num_in_fr_q;//add, number of elements in queue
+
+};
+
+#define EVENT_TAG 1
+
+#if ROSS_MEMORY
+#define EVENT_SIZE(e) TW_MEMORY_BUFFER_SIZE
+#else
+#define EVENT_SIZE(e) g_tw_event_msg_sz
+#endif
+
+static struct act_q posted_sends;
+static struct act_q posted_recvs;
+static tw_eventq outq;
+
+static unsigned int read_buffer = 16;
+static unsigned int send_buffer = 1024;
+static int world_size = 1;
+
+void deal_with_cur(struct act_q *q)// this is for MPI_testsome input
+{
+//    printf("cur = %d, front %d\n", q->cur,q->front);
+    if(q->cur < (q->front))//(q->front))//checks to see if cur needs to grow to cover the newest posted slot
+    {
+        q->cur++;
+//        printf("%s: CUR IS %d\n",q->name, q->cur);
+
+        return;
+    }
+    else
+    {
+        return;
+    }
+}
+
+
+
+void fr_q_chq(struct act_q *q, int *frontOrCoda) //free index queue; check for modulating the front or back index of queue
+{
+    if(*frontOrCoda != q->size_of_fr_q)//don't mess with queue
+    {
+        return;
+    }
+    else//mess with queue
+    {
+        *frontOrCoda = 0;
+        return;
+    }
+}
+
+void fr_q_aq(struct act_q *q, int ele) // free index queue; add to queue
+{
+    q->front--;
+    q->free_idx_list[q->front] = ele;
+    return;
+}
+
+int fr_q_dq(struct act_q *q) // free index queue; dequeue
+{
+    int rv = q->free_idx_list[q->front];
+    q->front++;
+    q->num_in_fr_q--;
+    return rv;
+}
+
+static const tw_optdef mpi_opts[] = {
+    TWOPT_GROUP("ROSS MPI Kernel"),
+    TWOPT_UINT(
+        "read-buffer",
+        read_buffer,
+        "network read buffer size in # of events"),
+    TWOPT_UINT(
+        "send-buffer",
+        send_buffer,
+        "network send buffer size in # of events"),
+    TWOPT_END()
+};
+
+// Forward declarations of functions used in MPI network message processing
+static int recv_begin(tw_pe *me);
+static void recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q* q, int id);
+static void late_recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q* q, int id);
+static int send_begin(tw_pe *me);
+static void send_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q* q, int id);
+
+// Start of implementation of network processing routines/functions
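The free-index bookkeeping declared above (free_idx_list, front, size_of_fr_q, num_in_fr_q, and the fr_q_aq/fr_q_dq helpers) replaces the hole-collapsing pass that the old test_q ran after every MPI_Testsome: finished slot indices are recycled through a ring of free indices rather than compacting event_list and req_list. The following is a minimal standalone sketch of that idea, not part of the patch; the names idx_pool, pool_take, and pool_give are hypothetical, and unlike fr_q_aq it wraps the front index explicitly instead of relying on a separate helper such as fr_q_chq. The ring is sized n+1 so one slot always stays unused, which keeps a full pool distinguishable from an empty one.

    #include <assert.h>
    #include <stdio.h>
    #include <stdlib.h>

    struct idx_pool {
        int *slots;   /* ring buffer holding the indices that are currently free */
        int front;    /* position of the next index to hand out */
        int size;     /* n + 1: one slot is deliberately never used */
        int count;    /* how many indices are free right now */
    };

    static void pool_init(struct idx_pool *p, int n)
    {
        p->slots = malloc(sizeof(*p->slots) * (n + 1));
        p->size  = n + 1;
        p->front = 0;
        p->count = n;
        for (int i = 0; i < n; i++)   /* every request slot starts out free */
            p->slots[i] = i;
    }

    static int pool_take(struct idx_pool *p)            /* analogue of fr_q_dq() */
    {
        assert(p->count > 0);
        int rv = p->slots[p->front];
        p->front = (p->front + 1) % p->size;            /* wrap explicitly */
        p->count--;
        return rv;
    }

    static void pool_give(struct idx_pool *p, int ele)  /* analogue of fr_q_aq() */
    {
        assert(p->count < p->size - 1);
        p->front = (p->front - 1 + p->size) % p->size;
        p->slots[p->front] = ele;
        p->count++;
    }

    int main(void)
    {
        struct idx_pool p;
        pool_init(&p, 4);
        int a = pool_take(&p);   /* e.g. post an MPI_Irecv into request slot a */
        int b = pool_take(&p);
        pool_give(&p, a);        /* slot a completes and becomes free again */
        printf("took %d and %d; %d slots free\n", a, b, p.count);
        free(p.slots);
        return 0;
    }

Handing a freed index back at the front rather than the back means the most recently completed request slot is reused first, which tends to keep the active slots packed at low indices so that cur, the count passed to MPI_Testsome, stays small.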
+void tw_comm_set(MPI_Comm comm)
+{
+    MPI_COMM_ROSS = comm;
+    custom_communicator = 1;
+}
+
+const tw_optdef *
+tw_net_init(int *argc, char ***argv)
+{
+    int my_rank;
+
+    int initialized;
+    MPI_Initialized(&initialized);
+
+    if (!initialized) {
+        if (MPI_Init(argc, argv) != MPI_SUCCESS)
+            tw_error(TW_LOC, "MPI_Init failed.");
+    }
+    if (MPI_Comm_rank(MPI_COMM_ROSS, &my_rank) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Cannot get MPI_Comm_rank(MPI_COMM_ROSS)");
+
+    g_tw_masternode = 0;
+    g_tw_mynode = my_rank;
+
+    return mpi_opts;
+}
+
+static void
+init_q(struct act_q *q, const char *name)
+{
+    unsigned int n;
+#if ROSS_MEMORY
+    unsigned int i;
+#endif
+
+    if(q == &posted_sends)
+    {
+        n = send_buffer;
+    }
+    else
+    {
+
+        n = read_buffer;
+    }
+    q->name = name;
+    q->event_list = (tw_event **) tw_calloc(TW_LOC, name, sizeof(*q->event_list), n);
+    q->req_list = (MPI_Request *) tw_calloc(TW_LOC, name, sizeof(*q->req_list), n);
+    q->idx_list = (int *) tw_calloc(TW_LOC, name, sizeof(*q->idx_list), n);
+    q->status_list = (MPI_Status *) tw_calloc(TW_LOC, name, sizeof(*q->status_list), n);
+    //can I shrink this initialization?
+    q->free_idx_list = (int *) tw_calloc(TW_LOC, name, sizeof(*q->idx_list), n+1);// queue, n+1 is meant to prevent a full queue
+    q->overflow_anti = (int *) tw_calloc(TW_LOC, name, sizeof(*q->idx_list), (n/2)+2);// queue, at most (n/2) can be out of order, first element is # of elements in queue
+    q->front = 0;// front of queue
+    q->size_of_fr_q = n+1;// for wraparound
+    q->num_in_fr_q = 0; // number of elements in queue
+
+    int i = 0;
+    while(i < n)
+    {
+        q->free_idx_list[i] = i;
+//        fr_q_aq(q,i);
+        i++;
+    }
+//    q->front = 1;
+//    printf("front = %d\n",q->front);
+    q->overflow_anti[0]=1;
+    q->num_in_fr_q = n;// number of elements in queue
+
+
+#if ROSS_MEMORY
+    q->buffers = tw_calloc(TW_LOC, name, sizeof(*q->buffers), n);
+
+    for(i = 0; i < n; i++)
+        q->buffers[i] = tw_calloc(TW_LOC, "", TW_MEMORY_BUFFER_SIZE, 1);
+#endif
+}
+
+tw_node * tw_net_onnode(tw_peid gid) {
+    id_tmp = gid;
+    return &id_tmp;
+}
+
+unsigned int
+tw_nnodes(void)
+{
+    return world_size;
+}
+
+void
+tw_net_start(void)
+{
+    if (MPI_Comm_size(MPI_COMM_ROSS, &world_size) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Cannot get MPI_Comm_size(MPI_COMM_ROSS)");
+
+    if( g_tw_mynode == 0)
+    {
+        printf("tw_net_start: Found world size to be %d \n", world_size );
+    }
+
+    // Check after tw_nnodes is defined
+    if(tw_nnodes() == 1) {
+        // force the setting of SEQUENTIAL protocol
+        if (g_tw_synchronization_protocol == NO_SYNCH) {
+            g_tw_synchronization_protocol = SEQUENTIAL;
+        } else if(g_tw_synchronization_protocol == CONSERVATIVE || g_tw_synchronization_protocol == OPTIMISTIC) {
+            g_tw_synchronization_protocol = SEQUENTIAL;
+            fprintf(stderr, "Warning: Defaulting to Sequential Simulation, not enough PEs defined.\n");
+        }
+    }
+
+//    tw_pe_create(1);
+    tw_pe_init();
+
+    //If we're in (some variation of) optimistic mode, we need this hash
+    if (g_tw_synchronization_protocol == OPTIMISTIC ||
+        g_tw_synchronization_protocol == OPTIMISTIC_DEBUG ||
+        g_tw_synchronization_protocol == OPTIMISTIC_REALTIME) {
+        g_tw_pe->hash_t = tw_hash_create();
+    } else {
+        g_tw_pe->hash_t = NULL;
+    }
+
+    if (send_buffer < 1)
+        tw_error(TW_LOC, "network send buffer must be >= 1");
+    if (read_buffer < 1)
+        tw_error(TW_LOC, "network read buffer must be >= 1");
+
+    init_q(&posted_sends, "MPI send queue");
+    init_q(&posted_recvs, "MPI recv queue");
+
+    g_tw_net_device_size = read_buffer;
+
+    // pre-post all the Irecv operations
+    recv_begin( g_tw_pe );
+}
+
+void
+tw_net_abort(void)
+{
+    MPI_Abort(MPI_COMM_ROSS, 1);
+    exit(1);
+}
+
+void
+tw_net_stop(void)
+{
+    if (!custom_communicator) {
+        if (MPI_Finalize() != MPI_SUCCESS)
+            tw_error(TW_LOC, "Failed to finalize MPI");
+    }
+}
+
+void
+tw_net_barrier(void)
+{
+    if (MPI_Barrier(MPI_COMM_ROSS) != MPI_SUCCESS)
+        tw_error(TW_LOC, "Failed to wait for MPI_Barrier");
+}
+
+tw_stime
+tw_net_minimum(void)
+{
+    tw_stime m = DBL_MAX;
+    tw_event *e;
+    int i;
+
+    e = outq.head;
+    while (e) {
+        if (m > e->recv_ts)
+            m = e->recv_ts;
+        e = e->next;
+    }
+
+    for (i = 0; i < posted_sends.cur; i++) { //fix this line (?)
+        e = posted_sends.event_list[i];
+        if(e == NULL)
+        {}
+        else if(m > e->recv_ts)
+            m = e->recv_ts;
+        else
+        {}
+    }
+
+    return m;
+}
+
+static int
+test_q_recv(
+    struct act_q * q,
+    tw_pe *me,
+    void (*finish)(tw_pe *, tw_event *, char *, struct act_q*, int id))
+{
+    int ready, i, n, indicator;
+    indicator = 1;
+
+#if ROSS_MEMORY
+    char *tmp;
+#endif
+
+
+    if( q->num_in_fr_q == ((q->size_of_fr_q)-1) )
+        return 0;
+
+    if (MPI_Testsome(
+            q->cur,
+            q->req_list,
+            &ready,
+            q->idx_list,
+            q->status_list) != MPI_SUCCESS) {
+        tw_error(
+            TW_LOC,
+            "MPI_testsome failed with %u items in %s",
+            q->cur,
+            q->name);
+    }
+
+    if (1 > ready)
+        return 0;
+
+    q->overflow_anti[0]=1;
+    q->num_in_fr_q+=ready;
+    i = ready-1;
+    while ( -1 != i)
+    {
+
+        tw_event *e;
+        n = q->idx_list[i];
+        e = q->event_list[n];
+        fr_q_aq(q, n); //add n onto queue
+//        cur_reduction(q,n);
+
+
+#if ROSS_MEMORY
+        finish(me, e, q->buffers[n], q, n);
+#else
+        finish(me, e, NULL, q, n);
+#endif
+        if (indicator != q->overflow_anti[0])
+        {
+            indicator = q->overflow_anti[0];
+        }
+        else
+        {
+            q->event_list[n] = NULL;
+        }
+        i--;
+    }
+
+    i = 1; // first element of q->overflow_anti is the number of elements in the queue
+
+    while (i < q->overflow_anti[0])//takes care of out of order messages
+    {
+
+        tw_event *e;
+        n = q->overflow_anti[i];
+        e = q->event_list[n];
+        q->event_list[n] = NULL;
+        late_recv_finish(me, e, NULL, q, n);
+        //might need an augmented version for ROSS_MEMORY?
+        i++;
+    }
+
+// V breaks everything.
+//    alter_cur(q);
+
+    return 1;
+}
+
+
+static int
+test_q_send(
+    struct act_q * q,
+    tw_pe *me,
+    void (*finish)(tw_pe *, tw_event *, char *, struct act_q*, int id))
+{
+    int ready, i, n;
+
+#if ROSS_MEMORY
+    char *tmp;
+#endif
+
+
+    if( q->num_in_fr_q == ((q->size_of_fr_q)-1) )
+        return 0;
+
+    if (MPI_Testsome(
+            q->cur,
+            q->req_list,
+            &ready,
+            q->idx_list,
+            q->status_list) != MPI_SUCCESS) {
+        tw_error(
+            TW_LOC,
+            "MPI_testsome failed with %u items in %s",
+            q->cur,
+            q->name);
+    }
+
+    if (1 > ready)
+        return 0;
+
+    i = ready-1;
+
+    while(-1 != i)
+    {
+
+        tw_event *e;
+
+        n = q->idx_list[i];
+        e = q->event_list[n];
+        fr_q_aq(q, n);//add n onto queue
+//        cur_reduction(q,n);
+        q->event_list[n] = NULL;
+        i--;
+
+#if ROSS_MEMORY
+        finish(me, e, q->buffers[n], q, n);
+#else
+        finish(me, e, NULL, q, n);
+#endif
+    }
+
+
+    q->num_in_fr_q+=ready;
+//    alter_cur(q);
+
+    return 1;
+}
+
+
+
+
+static int
+recv_begin(tw_pe *me)
+{
+    MPI_Status status;
+
+    tw_event *e = NULL;
+
+    int flag = 0;
+    int changed = 0;
+
+    while (0 < posted_recvs.num_in_fr_q)//fix these lines
+    {
+
+        if(!(e = tw_event_grab(me)))
+        {
+            if(tw_gvt_inprogress(me))
+                tw_error(TW_LOC, "Out of events in GVT! Consider increasing --extramem");
+            return changed;
+        }
+
+        int id = fr_q_dq(&posted_recvs);
+
+#if ROSS_MEMORY
+        if( MPI_Irecv(posted_recvs.buffers[id],
+               EVENT_SIZE(e),
+               MPI_BYTE,
+               MPI_ANY_SOURCE,
+               EVENT_TAG,
+               MPI_COMM_ROSS,
+               &posted_recvs.req_list[id]) != MPI_SUCCESS)
+#else
+        if( MPI_Irecv(e,
+               (int)EVENT_SIZE(e),
+               MPI_BYTE,
+               MPI_ANY_SOURCE,
+               EVENT_TAG,
+               MPI_COMM_ROSS,
+               &posted_recvs.req_list[id]) != MPI_SUCCESS)
+#endif
+        {
+            tw_event_free(me, e);
+            return changed;
+        }
+
+        posted_recvs.event_list[id] = e;
+        deal_with_cur(&posted_recvs);
+        changed = 1;
+    }
+    return changed;
+}
+
+
+static void
+late_recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q * q, int id )
+{
+    /*
+#if ROSS_MEMORY
+    tw_memory *memory;
+    tw_memory *last;
+    tw_fd mem_fd;
+
+    size_t mem_size;
+
+    unsigned position = 0;
+
+    memcpy(e, buffer, g_tw_event_msg_sz);
+    position += g_tw_event_msg_sz;
+#endif
+    */
+
+    /*
+    if(e->send_pe > tw_nnodes()-1)
+        tw_error(TW_LOC, "bad sendpe_id: %d", e->send_pe);
+
+
+    if(e->recv_ts < me->GVT)
+        tw_error(TW_LOC, "%d: Received straggler from %d: %lf (%d)",
+            me->id, e->send_pe, e->recv_ts, e->state.cancel_q);
+
+    if(tw_gvt_inprogress(me))
+        me->trans_msg_ts = ROSS_MIN(me->trans_msg_ts, e->recv_ts);
+
+    // if cancel event, retrieve and flush
+    // else, store in hash table
+    */
+
+    // NOTE: it is possible to cancel the event we
+    // are currently processing at this PE since this
+    // MPI module lets me read cancel events during
+    // event sends over the network.
+
+    tw_pe *dest_pe;
+    dest_pe = e->dest_lp->pe;
+    tw_event *cancel = tw_hash_remove(me->hash_t, e, e->send_pe);
+    g_tw_pe->avl_tree_size++;
+
+    cancel->state.cancel_q = 1;
+    cancel->state.remote = 0;
+    cancel->cancel_next = dest_pe->cancel_q;
+    dest_pe->cancel_q = cancel;
+    tw_event_free(me, e);
+
+    return;
+
+}
+
+static void
+recv_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q * q, int id )
+{
+    tw_pe *dest_pe;
+    tw_clock start;
+
+#if ROSS_MEMORY
+    tw_memory *memory;
+    tw_memory *last;
+    tw_fd mem_fd;
+
+    size_t mem_size;
+
+    unsigned position = 0;
+
+    memcpy(e, buffer, g_tw_event_msg_sz);
+    position += g_tw_event_msg_sz;
+#endif
+    me->stats.s_nread_network++;
+    me->s_nwhite_recv++;
+    e->dest_lp = tw_getlocal_lp((tw_lpid) e->dest_lp);
+    dest_pe = e->dest_lp->pe;
+
+
+    // instrumentation
+    e->dest_lp->kp->kp_stats->s_nread_network++;
+    e->dest_lp->lp_stats->s_nread_network++;
+
+    e->cancel_next = NULL;
+    e->caused_by_me = NULL;
+    e->cause_next = NULL;
+
+    if(e->send_pe > tw_nnodes()-1)
+        tw_error(TW_LOC, "bad sendpe_id: %d", e->send_pe);
+
+
+    if(e->recv_ts < me->GVT)
+        tw_error(TW_LOC, "%d: Received straggler from %d: %lf (%d)",
+            me->id, e->send_pe, e->recv_ts, e->state.cancel_q);
+
+    if(tw_gvt_inprogress(me))
+        me->trans_msg_ts = ROSS_MIN(me->trans_msg_ts, e->recv_ts);
+
+    // if cancel event, retrieve and flush
+    // else, store in hash table
+
+    if(e->state.cancel_q)
+    {
+
+        tw_event *cancel = tw_hash_remove(me->hash_t, e, e->send_pe);
+
+        // NOTE: it is possible to cancel the event we
+        // are currently processing at this PE since this
+        // MPI module lets me read cancel events during
+        // event sends over the network.
+ + if(cancel!=NULL) + { + + cancel->state.cancel_q = 1; + cancel->state.remote = 0; + cancel->cancel_next = dest_pe->cancel_q; + dest_pe->cancel_q = cancel; + tw_event_free(me, e); + } + else + { + q->overflow_anti[q->overflow_anti[0]] = id; //add id stuff later + q->overflow_anti[0]++; + } + + return; + } + + + + if (g_tw_synchronization_protocol == OPTIMISTIC || + g_tw_synchronization_protocol == OPTIMISTIC_DEBUG || + g_tw_synchronization_protocol == OPTIMISTIC_REALTIME ) { + tw_hash_insert(me->hash_t, e, e->send_pe); + e->state.remote = 1; + } + +#if ROSS_MEMORY + mem_size = (size_t) e->memory; + mem_fd = (tw_fd) e->prev; + + last = NULL; + while(mem_size) + { + memory = tw_memory_alloc(e->dest_lp, mem_fd); + + if(last) + last->next = memory; + else + e->memory = memory; + + memcpy(memory, &buffer[position], mem_size); + position += mem_size; + + memory->fd = mem_fd; + memory->nrefs = 1; + + mem_size = (size_t) memory->next; + mem_fd = memory->fd; + + last = memory; + } +#endif + + /* NOTE: the final check in the if conditional below was added to make sure + * that we do not execute the fast case unless the cancellation queue is + * empty on the destination PE. Otherwise we need to invoke the normal + * scheduling routines to make sure that a forward event doesn't bypass a + * cancellation event with an earlier timestamp. This is helpful for + * stateful models that produce incorrect results when presented with + * duplicate messages with no rollback between them. + */ + if(me == dest_pe && e->dest_lp->kp->last_time <= e->recv_ts && !dest_pe->cancel_q) { + /* Fast case, we are sending to our own PE and + * there is no rollback caused by this send. + */ + start = tw_clock_read(); + tw_pq_enqueue(dest_pe->pq, e); + dest_pe->stats.s_pq += tw_clock_read() - start; + return; + } + + if (me->id == dest_pe->id) { + /* Slower, but still local send, so put into top + * of dest_pe->event_q. + */ + e->state.owner = TW_pe_event_q; + tw_eventq_push(&dest_pe->event_q, e); + return; + } + + /* Never should happen; MPI should have gotten the + * message to the correct node without needing us + * to redirect the message there for it. This is + * probably a serious bug with the event headers + * not being formatted right. 
+ */ + tw_error( + TW_LOC, + "Event received by PE %u but meant for PE %u", + me->id, + dest_pe->id); +} + +static int +send_begin(tw_pe *me) +{ + int changed = 0; + + while (0 < posted_sends.num_in_fr_q) + { + tw_event *e = tw_eventq_peek(&outq);//next event + tw_node *dest_node = NULL; + +#if ROSS_MEMORY + tw_event *tmp_prev = NULL; + + tw_lp *tmp_lp = NULL; + + tw_memory *memory = NULL; + tw_memory *m = NULL; + + char *buffer = NULL; + + size_t mem_size = 0; + + unsigned position = 0; +#endif + + if (!e) + break; + + if(e == me->abort_event) + tw_error(TW_LOC, "Sending abort event!"); + + int id = fr_q_dq(&posted_sends);// fixed, grabs from front of queue, moves front up one element + dest_node = tw_net_onnode((*e->src_lp->type->map) + ((tw_lpid) e->dest_lp)); + + //if(!e->state.cancel_q) + //e->event_id = (tw_eventid) ++me->seq_num; + + e->send_pe = (tw_peid) g_tw_mynode; + e->send_lp = e->src_lp->gid; + +#if ROSS_MEMORY + // pack pointers + tmp_prev = e->prev; + tmp_lp = e->src_lp; + + // delete when working + e->src_lp = NULL; + + memory = NULL; + if(e->memory) + { + memory = e->memory; + e->memory = (tw_memory *) tw_memory_getsize(me, memory->fd); + e->prev = (tw_event *) memory->fd; + mem_size = (size_t) e->memory; + } + + buffer = posted_sends.buffers[id]; + memcpy(&buffer[position], e, g_tw_event_msg_sz); + position += g_tw_event_msg_sz; + + // restore pointers + e->prev = tmp_prev; + e->src_lp = tmp_lp; + + m = NULL; + while(memory) + { + m = memory->next; + + if(m) + { + memory->next = (tw_memory *) + tw_memory_getsize(me, m->fd); + memory->fd = m->fd; + } + + if(position + mem_size > TW_MEMORY_BUFFER_SIZE) + tw_error(TW_LOC, "Out of buffer space!"); + + memcpy(&buffer[position], memory, mem_size); + position += mem_size; + + memory->nrefs--; + tw_memory_unshift(e->src_lp, memory, memory->fd); + + if(NULL != (memory = m)) + mem_size = tw_memory_getsize(me, memory->fd); + } + + e->memory = NULL; + + if (MPI_Isend(buffer, + EVENT_SIZE(e), + MPI_BYTE, + *dest_node, + EVENT_TAG, + MPI_COMM_ROSS, + &posted_sends.req_list[id]) != MPI_SUCCESS) { + return changed; + } +#else + if (MPI_Isend(e, + (int)EVENT_SIZE(e), + MPI_BYTE, + (int)*dest_node, + EVENT_TAG, + MPI_COMM_ROSS, + &posted_sends.req_list[id]) != MPI_SUCCESS) { + return changed; + } +#endif + + tw_eventq_pop(&outq); + e->state.owner = e->state.cancel_q + ? TW_net_acancel + : TW_net_asend; + + posted_sends.event_list[id] = e; + deal_with_cur(&posted_sends); + + me->s_nwhite_sent++; + changed = 1; + } + return changed; +} + +static void +send_finish(tw_pe *me, tw_event *e, char * buffer, struct act_q * q, int id) +{ + me->stats.s_nsend_network++; + // instrumentation + e->src_lp->kp->kp_stats->s_nsend_network++; + e->src_lp->lp_stats->s_nsend_network++; + + if (e->state.owner == TW_net_asend) { + if (e->state.cancel_asend) { + /* Event was cancelled during transmission. We must + * send another message to pass the cancel flag to + * the other node. + */ + e->state.cancel_asend = 0; + e->state.cancel_q = 1; + tw_eventq_push(&outq, e); + } else { + /* Event finished transmission and was not cancelled. + * Add to our sent event queue so we can retain the + * event in case we need to cancel it later. Note it + * is currently in remote format and must be converted + * back to local format for fossil collection. 
+ */ + e->state.owner = TW_pe_sevent_q; + if( g_tw_synchronization_protocol == CONSERVATIVE ) + tw_event_free(me, e); + } + + return; + } + + if (e->state.owner == TW_net_acancel) { + /* We just finished sending the cancellation message + * for this event. We need to free the buffer and + * make it available for reuse. + */ + tw_event_free(me, e); + return; + } + + /* Never should happen, not unless we somehow broke this + * module's other functions related to sending an event. + */ + + tw_error( + TW_LOC, + "Don't know how to finish send of owner=%u, cancel_q=%d", + e->state.owner, + e->state.cancel_q); + +} + +static void +service_queues(tw_pe *me) +{ + int changed; + do { + changed = test_q_recv(&posted_recvs, me, recv_finish); + changed |= test_q_send(&posted_sends, me, send_finish); + changed |= recv_begin(me); + changed |= send_begin(me); + } while (changed); +} + +/* + * NOTE: Chris believes that this network layer is too aggressive at + * reading events out of the network.. so we are modifying the algorithm + * to only send events when tw_net_send it called, and only read events + * when tw_net_read is called. + */ +void +tw_net_read(tw_pe *me) +{ + service_queues(me); +} + +void +tw_net_send(tw_event *e) +{ + tw_pe * me = e->src_lp->pe; + int changed = 0; + + e->state.remote = 0; + e->state.owner = TW_net_outq; + tw_eventq_unshift(&outq, e); + + do + { + changed = test_q_send(&posted_sends, me, send_finish); + changed |= send_begin(me); + } while (changed); +} + +void +tw_net_cancel(tw_event *e) +{ + tw_pe *src_pe = e->src_lp->pe; + + switch (e->state.owner) { + case TW_net_outq: + /* Cancelled before we could transmit it. Do not + * transmit the event and instead just release the + * buffer back into our own free list. + */ + tw_eventq_delete_any(&outq, e); + tw_event_free(src_pe, e); + + return; + + break; + + case TW_net_asend: + /* Too late. We've already let MPI start to send + * this event over the network. We can't pull it + * back now without sending another message to do + * the cancel. + * + * Setting the cancel_q flag will signal us to do + * another message send once the current send of + * this message is completed. + */ + e->state.cancel_asend = 1; + break; + + case TW_pe_sevent_q: + /* Way late; the event was already sent and is in + * our sent event queue. Mark it as a cancel and + * place it at the front of the outq. + */ + e->state.cancel_q = 1; + tw_eventq_unshift(&outq, e); + break; + + default: + /* Huh? Where did you come from? Why are we being + * told about you? We did not send you so we cannot + * cancel you! + */ + tw_error( + TW_LOC, + "Don't know how to cancel event owned by %u", + e->state.owner); + } + + service_queues(src_pe); +} + +/** + * tw_net_statistics + * @brief Function to output the statistics + * @attention Notice that the MPI_Reduce "count" parameter is greater than one. + * We are reducing on multiple variables *simultaneously* so if you change + * this function or the struct tw_statistics, you must update the other. 
+ **/ +tw_statistics * +tw_net_statistics(tw_pe * me, tw_statistics * s) +{ + if(MPI_Reduce(&(s->s_max_run_time), + &me->stats.s_max_run_time, + 1, + MPI_DOUBLE, + MPI_MAX, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + + if(MPI_Reduce(&(s->s_net_events), + &me->stats.s_net_events, + 17, + MPI_UNSIGNED_LONG_LONG, + MPI_SUM, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + + if(MPI_Reduce(&s->s_min_detected_offset, + &me->stats.s_min_detected_offset, + 1, + MPI_DOUBLE, + MPI_MIN, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + + if(MPI_Reduce(&(s->s_total), + &me->stats.s_total, + 16, + MPI_UNSIGNED_LONG_LONG, + MPI_MAX, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + + if (MPI_Reduce(&s->s_events_past_end, + &me->stats.s_events_past_end, + 3, + MPI_UNSIGNED_LONG_LONG, + MPI_SUM, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + +#ifdef USE_RIO + if (MPI_Reduce(&s->s_rio_load, + &me->stats.s_rio_load, + 1, + MPI_UNSIGNED_LONG_LONG, + MPI_MAX, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); + if (MPI_Reduce(&s->s_rio_lp_init, + &me->stats.s_rio_lp_init, + 1, + MPI_UNSIGNED_LONG_LONG, + MPI_MAX, + (int)g_tw_masternode, + MPI_COMM_ROSS) != MPI_SUCCESS) + tw_error(TW_LOC, "Unable to reduce statistics!"); +#endif + + return &me->stats; +} +
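One pattern in both files deserves a closing illustration: a cancellation can complete in MPI_Testsome before the event it refers to has been inserted into the hash, so recv_finish parks the receive-slot index in q->overflow_anti when tw_hash_remove() returns NULL, and test_q_recv replays the parked slots through late_recv_finish() once the batch has drained. Below is a minimal sketch of that park-and-retry pattern, not part of the patch; try_finish() and BATCH are hypothetical stand-ins, and overflow_anti[0] is modeled the same way as in the patch, as the index of the next free park slot, which is why it resets to 1 rather than 0.

    #include <stdio.h>

    #define BATCH 8

    /* parked[0] is the index of the next free park slot, mirroring
     * q->overflow_anti; at most BATCH/2 completions can be out of order. */
    static int parked[BATCH / 2 + 2];

    static int try_finish(int slot, int attempt)
    {
        /* Hypothetical stand-in for the tw_hash_remove() lookup: pretend
         * every slot misses on the first pass and hits on the retry. */
        (void)slot;
        return attempt > 0;
    }

    int main(void)
    {
        parked[0] = 1;                        /* reset before each Testsome batch */

        for (int slot = 0; slot < 3; slot++)  /* first pass over completions */
            if (!try_finish(slot, 0)) {
                parked[parked[0]] = slot;     /* park the out-of-order slot */
                parked[0]++;
            }

        for (int i = 1; i < parked[0]; i++)   /* late pass, as in late_recv_finish() */
            if (try_finish(parked[i], 1))
                printf("slot %d finished on retry\n", parked[i]);

        return 0;
    }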