Hi,

I am running a MPI program using cluster and tcp communication.

To run I am using:  mpirun --prefix /usr/local/ --mca btl tcp,self --hostfile slaves -np 6 scatter


I am getting following output:

Process 0 on host host1 has elements 0 1 2 3
Process 1 on host host1 has elements 4 5 6 7
Process 2 on host host1 has elements 8 9 10 11
Process 3 on host host1 has elements 12 13 14 15
[slave1][[24708,1],5][btl_tcp_endpoint.c:486:mca_btl_tcp_endpoint_recv_connect_ack] received unexpected process identifier [[24708,1],4]

When trying to communicate with slave1 i get received unexpected process identifier error.

My PATH and LD_LIBRARY_PATH are correctly set in .bashrc file.



Source code -

    
#include <stdlib.h>
#include <stdio.h>
#include "mpi.h"
#define MAXPROC 8    /* Max number of procsses */
#define LENGTH 24    /* length of buffer */
 
int main(int argc, char* argv[]) {
  int i, j, np, me;
  const int nametag  = 40;    /* Tag value for sending name */
  const int datatag  = 45;    /* Tag value for sending data */
  const int root = 0;         /* Root process in scatter */
  MPI_Status status;          /* Status object for receive */
 
  char myname[MPI_MAX_PROCESSOR_NAME];       /* Local host name string */
  char hostname[MAXPROC][MPI_MAX_PROCESSOR_NAME];  /* Received host names */
  int namelen;
 
  int x[LENGTH];        /* Send buffer */
  int y[LENGTH];        /* Receive buffer */
 
  MPI_Init(&argc, &argv);                /* Initialize MPI */
  MPI_Comm_size(MPI_COMM_WORLD, &np);    /* Get nr of processes */
  MPI_Comm_rank(MPI_COMM_WORLD, &me);    /* Get own identifier */
  
  MPI_Get_processor_name(myname, &namelen);  /* Get host name */
  myname[namelen++] = (char)0;               /* Terminating null byte */
 
  /* Check that we have an even number of processes and at most MAXPROC */
  if (np>MAXPROC || np%2 != 0) {
    if (me == 0) {
      printf("You have to use an even number of processes (at most %d)\n", MAXPROC);
    }
    MPI_Finalize();
    exit(0);
  }
 
  if (me == 0) {    /* Process 0 does this */
    
    /* Initialize the array x with values 0 .. LENGTH-1 */
    for (i=0; i<LENGTH; i++) {
      x[i] = i;
    }
 
    printf("Process %d on host %s is distributing array x to all %d processes\n\n",
       me, myname, np);
 
    /* Scatter the array x to all proceses, place it in y */
    MPI_Scatter(x, LENGTH/np, MPI_INT, y, LENGTH/np, MPI_INT, root,
        MPI_COMM_WORLD);
 
    /* Print out own portion of the scattered array */
    printf("Process %d on host %s has elements", me, myname);
    for (i=0; i<LENGTH/np; i++) {
      printf(" %d", y[i]);
    }
    printf("\n");
 
    /* Receive messages with hostname and the scattered data */
    /* from all other processes */
    for (i=1; i<np; i++) {
      MPI_Recv (hostname[i], namelen, MPI_CHAR, i, nametag, MPI_COMM_WORLD,
        &status);
      MPI_Recv (y, LENGTH/np, MPI_INT, i, datatag, MPI_COMM_WORLD, &status);
      printf("Process %d on host %s has elements", i, hostname[i]);
      for (j=0; j<LENGTH/np; j++) {
    printf(" %d", y[j]);
      }
      printf("\n");
    }
    
    printf("Ready\n");
 
 
  } else { /* all other processes do this */
 
    /* Receive the scattered array from process 0, place it in array y */
    MPI_Scatter(x, LENGTH/np, MPI_INT, y, LENGTH/np, MPI_INT, root, \
        MPI_COMM_WORLD);
    /* Send own name back to process 0 */
    MPI_Send (myname, namelen, MPI_CHAR, 0, nametag, MPI_COMM_WORLD);
    /* Send the received array back to process 0 */
    MPI_Send (y, LENGTH/np, MPI_INT, 0, datatag, MPI_COMM_WORLD);
 
  }
 
  MPI_Finalize();
  exit(0);
}

Any idea what could be wrong?


Thanks