initialize array of ptls associated with each proc

This commit was SVN r430.
2004-01-15 19:51:06 +00:00 · 2004-01-15 19:51:06 +00:00 · 1cb615ff63
--- a/src/mca/mpi/pml/pml.h
+++ b/src/mca/mpi/pml/pml.h
@ -128,16 +128,6 @@ typedef int (*mca_pml_base_wait_fn_t)(
    lam_status_public_t* status
 );
 /**
 * PTL->PML Upcall from PTL to PML to add themself to proc array
 */
 typedef int (*mca_ptl_pml_add_proc_fn_t)(
    struct lam_proc_t* proc,
    struct mca_ptl_t* ptl,
    struct mca_ptl_addr_t*
 );
 /**
 *  PML instance interface functions.
@ -161,9 +151,6 @@ struct mca_pml_t {
    mca_pml_base_start_fn_t        pml_start;
    mca_pml_base_test_fn_t         pml_test;
    mca_pml_base_wait_fn_t         pml_wait;
    /* upcalls from PTL to PML */
    mca_ptl_pml_add_proc_fn_t      ptl_pml_add_proc;
 };
 typedef struct mca_pml_t mca_pml_t;
--- a/src/mca/mpi/pml/teg/src/pml_ptl_array.h
+++ b/src/mca/mpi/pml/teg/src/pml_ptl_array.h
@ -55,6 +55,18 @@ static inline mca_ptl_proc_t* mca_ptl_array_insert(mca_ptl_array_t* array)
    return &array->ptl_procs[array->ptl_size++];
 }
 static inline mca_ptl_proc_t* mca_ptl_array_get_index(mca_ptl_array_t* array, size_t index)
 {
 #if LAM_ENABLE_DEBUG
    if(index >= array->ptl_size) {
        lam_output(0, "mca_ptl_array_get_index: invalid array index %d >= %d",
            index, array->ptl_size);
        return 0;
    }
 #endif
    return &array->ptl_procs[index];
 }
 static inline mca_ptl_proc_t* mca_ptl_array_get_next(mca_ptl_array_t* array)
 {
 #if LAM_ENABLE_DEBUG
--- a/src/mca/mpi/pml/teg/src/pml_teg.c
+++ b/src/mca/mpi/pml/teg/src/pml_teg.c
@ -2,6 +2,7 @@
 * $HEADER$
 */
 #include <stdlib.h>
 #include "lam/mem/malloc.h"
 #include "mca/mpi/pml/pml.h"
 #include "mca/mpi/ptl/ptl.h"
@ -35,6 +36,8 @@ int mca_pml_teg_add_comm(lam_communicator_t* comm)
 {
    /* allocate pml specific comm data */
    struct mca_pml_comm_t* pml_comm = (mca_pml_comm_t*)LAM_MALLOC(sizeof(mca_pml_comm_t));
    if(pml_comm == 0)
        return LAM_ERR_OUT_OF_RESOURCE;
    mca_pml_ptl_comm_init(pml_comm, comm->c_remote_group->g_proc_count);
    comm->c_pml_comm = pml_comm;
    return LAM_SUCCESS;
@ -47,21 +50,43 @@ int mca_pml_teg_del_comm(lam_communicator_t* comm)
    return LAM_SUCCESS;
 }
 static int ptl_exclusivity_compare(const void* arg1, const void* arg2)
 {
    mca_ptl_t* ptl1 = *(struct mca_ptl_t**)arg1;
    mca_ptl_t* ptl2 = *(struct mca_ptl_t**)arg2;
    if( ptl1->ptl_exclusivity > ptl2->ptl_exclusivity )
        return 1;
    else if (ptl1->ptl_exclusivity == ptl2->ptl_exclusivity )
        return 0;
    else
        return -1;
 }
 int mca_pml_teg_add_ptls(struct mca_ptl_t** ptls, size_t nptls)
 {
    /* sort the ptls by exclusivity */
    qsort(ptls, nptls, sizeof(struct mca_ptl_t*), ptl_exclusivity_compare);
    mca_pml_teg.teg_ptls = ptls;
    mca_pml_teg.teg_num_ptls = nptls;
    return LAM_SUCCESS;
 }
 /*
 *   For each proc setup a datastructure that indicates the PTLs
 *   that can be used to reach the destination.
 *
 */
 int mca_pml_teg_add_procs(lam_proc_t** procs, size_t nprocs)
 {
    size_t i;
    size_t p;
    for(p=0; p<nprocs; p++) {
        lam_proc_t *proc = procs[p];
        uint64_t total_bandwidth = 0;
        uint32_t latency = 0;
        size_t n_index, p_index; 
        size_t n_size;
        /* initialize each proc */
        mca_pml_proc_t* proc_pml = proc->proc_pml;
@ -83,8 +108,8 @@ int mca_pml_teg_add_procs(lam_proc_t** procs, size_t nprocs)
        }
        /* allow each ptl to register with the proc */
-        for(i=0; i<mca_pml_teg.teg_num_ptls; i++) {
+        for(p_index = 0; p_index < mca_pml_teg.teg_num_ptls; p_index++) {
-            mca_ptl_t* ptl = mca_pml_teg.teg_ptls[i];
+            mca_ptl_t* ptl = mca_pml_teg.teg_ptls[p_index];
            /* if the ptl can reach the destination proc it will return 
             * addressing information that will be cached on the proc
@ -102,35 +127,108 @@ int mca_pml_teg_add_procs(lam_proc_t** procs, size_t nprocs)
                /* if this ptl supports exclusive access then don't allow 
                 * subsequent ptls to register
                 */
-                if(ptl->ptl_exclusive)
+                if(ptl->ptl_exclusivity)
                    break;
            }
        }
-        /* compute a weighting factor for each ptl */
+        /* (1) determine the total bandwidth available across all ptls
-        for(i=0; i<mca_ptl_array_get_size(&proc_pml->proc_ptl_next); i++) {
+         *     note that we need to do this here, as we may already have ptls configured
-            
+         * (2) determine the highest priority ranking for latency
         */
        n_size = mca_ptl_array_get_size(&proc_pml->proc_ptl_next); 
        for(n_index = 0; n_index < n_size; n_index++) {
            struct mca_ptl_proc_t* ptl_proc = mca_ptl_array_get_index(&proc_pml->proc_ptl_next, n_index);
            struct mca_ptl_t* ptl = ptl_proc->ptl;
            total_bandwidth += ptl_proc->ptl->ptl_bandwidth; 
            if(ptl->ptl_latency > latency)
                latency = ptl->ptl_latency;
        }
        /* (1) set the weight of each ptl as a percentage of overall bandwidth
         * (2) copy all ptl instances at the highest priority ranking into the
         *     list of ptls used for first fragments
         */
        for(n_index = 0; n_index < n_size; n_index++) {
            struct mca_ptl_proc_t* ptl_proc = mca_ptl_array_get_index(&proc_pml->proc_ptl_next, n_index);
            struct mca_ptl_t *ptl = ptl_proc->ptl;
            if(ptl->ptl_bandwidth)
                ptl_proc->ptl_weight = total_bandwidth / ptl_proc->ptl->ptl_bandwidth;
            /* check to see if this ptl is already in the array of ptls used for first
             * fragments - if not add it.
             */
            if(ptl->ptl_latency == latency) {
                size_t f_index;
                size_t f_size = mca_ptl_array_get_size(&proc_pml->proc_ptl_first);
                for(f_index=0; f_index < f_size; f_index++) {
                    struct mca_ptl_proc_t* existing_proc = mca_ptl_array_get_index(&proc_pml->proc_ptl_first, f_index);
                    if(existing_proc->ptl == ptl) {
                        *existing_proc = *ptl_proc; /* update existing definition */
                        break;
                    }
                }
                /* not found add a new entry */
                if(f_index == f_size) {
                    struct mca_ptl_proc_t* new_proc = mca_ptl_array_insert(&proc_pml->proc_ptl_first);
                    *new_proc = *ptl_proc;
                }
            }
        }
    }
    return LAM_SUCCESS;
 }
 /*
 * iterate through each proc and notify any PTLs associated
 * with the proc that it is/has gone away
 */
 int mca_pml_teg_del_procs(lam_proc_t** procs, size_t nprocs)
 {
-#if 0
+    size_t p;
-    size_t i;
+    for(p = 0; p < nprocs; p++) {
-    for(i=0; i<nprocs; i++) {
+        lam_proc_t *proc = procs[p];
        lam_proc_t *proc = procs[i];
        mca_pml_proc_t* proc_pml = proc->proc_pml;
        size_t f_index, f_size;
        size_t n_index, n_size;
        /* notify each ptl that the proc is going away */
-        size_t p;
+        f_size = mca_ptl_array_get_size(&proc_pml->proc_ptl_first);
-        for(p=0; p<proc_pml->proc_ptl_first.ptl_size; p++) {
+        for(f_index = 0; f_index < f_size; f_index++) {
-            mca_ptl_info_t* ptl_info = proc_pml->proc_ptl_first.ptl_array[p];
+            mca_ptl_proc_t* ptl_proc = mca_ptl_array_get_index(&proc_pml->proc_ptl_first, f_index);
-            ptl_info->ptl->ptl_del_proc(proc);
+            mca_ptl_t* ptl = ptl_proc->ptl;
            ptl->ptl_del_proc(ptl,proc,ptl_proc->ptl_addr);
            /* remove this from next array so that we dont call it twice w/ 
             * the same address pointer
             */
            f_size = mca_ptl_array_get_size(&proc_pml->proc_ptl_first);
            for(n_index = 0; n_index < n_size; n_index++) {
                mca_ptl_proc_t* next_proc = mca_ptl_array_get_index(&proc_pml->proc_ptl_next, n_index);
                if(next_proc->ptl == ptl) {
                    memset(next_proc, 0, sizeof(mca_ptl_proc_t));
                    break;
                }
            }
        }
        /* notify each ptl that was not in the array of ptls for first fragments */
        n_size = mca_ptl_array_get_size(&proc_pml->proc_ptl_next);
        for(n_index = 0; n_index < n_size; n_index++) {
            mca_ptl_proc_t* ptl_proc = mca_ptl_array_get_index(&proc_pml->proc_ptl_first, n_index);
            mca_ptl_t* ptl = ptl_proc->ptl;
            if (ptl != 0)
                ptl->ptl_del_proc(ptl,proc,ptl_proc->ptl_addr);
        }
        /* do any required cleanup */
        mca_pml_teg_proc_destroy(proc_pml);
        LAM_FREE(proc_pml);
        proc->proc_pml = 0;
    }
 #endif
    return LAM_SUCCESS;
 }
--- a/src/mca/mpi/pml/teg/src/pml_teg_module.c
+++ b/src/mca/mpi/pml/teg/src/pml_teg_module.c
@ -11,9 +11,6 @@
 #include "pml_teg.h"
 #include "pml_teg_proc.h"
 #define mca_pml_teg_param_register_int(n,v) \
    mca_base_param_lookup_int( \
        mca_base_param_register_int("pml","teg",n,0,v))
 mca_pml_base_module_1_0_0_t mca_pml_teg_module = {
--- a/src/mca/mpi/pml/teg/src/pml_teg_sendreq.h
+++ b/src/mca/mpi/pml/teg/src/pml_teg_sendreq.h
@ -55,6 +55,7 @@ static inline int mca_pml_teg_send_request_start(
        THREAD_SCOPED_LOCK(&mca_pml_teg.teg_lock,
            lam_list_append(&mca_pml_teg.teg_incomplete_sends, (lam_list_item_t*)req));
    }
    return LAM_SUCCESS;
 }
--- a/src/mca/mpi/ptl/ptl.h
+++ b/src/mca/mpi/ptl/ptl.h
@ -89,6 +89,20 @@ typedef int (*mca_ptl_base_add_proc_fn_t)(
    struct mca_ptl_addr_t**
 );
 /**
 *  PML->PTL notification of change in the process list.
 *
 *  @param ptl (IN)     
 *  @param procs (IN)   
 *  @param nprocs (IN)  
 *  @return            
 */
 typedef int (*mca_ptl_base_del_proc_fn_t)(
    struct mca_ptl_t* ptl, 
    struct lam_proc_t* proc, 
    struct mca_ptl_addr_t*
 );
 /**
 *  MCA->PTL Clean up any resources held by PTL instance before the module is unloaded.
 *  
@ -127,15 +141,16 @@ struct mca_ptl_t {
    /* PTL common attributes */
    mca_ptl_base_module_t* ptl_module;
    int         ptl_exclusive;         /**< indicates this PTL should be used exclusively */
    size_t      ptl_first_frag_size;   /**< maximum size of first fragment */
    size_t      ptl_min_frag_size;     /**< threshold below which the PTL will not fragment */
    size_t      ptl_max_frag_size;     /**< maximum fragment size supported by the PTL */
-    uint32_t    ptl_latency;           /**< relative/absolute measure of latency */
+    uint32_t    ptl_exclusivity;       /**< indicates this PTL should be used exclusively */
-    uint64_t    ptl_bandwidth;         /**< bandwidth (bytes/sec) supported by each endpoint */
+    uint32_t    ptl_latency;           /**< relative ranking of latency used to prioritize ptls */
    uint32_t    ptl_bandwidth;         /**< bandwidth (Mbytes/sec) supported by each endpoint */
    /* PTL function table */
    mca_ptl_base_add_proc_fn_t       ptl_add_proc;
    mca_ptl_base_del_proc_fn_t       ptl_del_proc;
    mca_ptl_base_fini_fn_t           ptl_fini;
    mca_ptl_base_send_fn_t           ptl_send;
    mca_ptl_base_request_alloc_fn_t  ptl_request_alloc;