Commit b16cfbe

Merge pull request #110 from uvarc/staging
Added new example programs for MPI
2 parents 11bc500 + 324e964 commit b16cfbe

14 files changed: +413 −56 lines

content/courses/fortran-introduction/array_intrinsics.md

+2-1
@@ -38,9 +38,10 @@ SPREAD(SOURCE,DIM,NCOPIES)
 ```
 **Example**
 ```fortran
-!Array and mask are of size NxM
+!Array and mask are of shape NxM
 mask=A<0
 merge(A,0,mask)
+!B of shape MxN
 B=reshape(A,(/M,N/))
 ! for C=1, D=[1,2]
 print *, spread(C, 1, 2) ! "1 1"
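
As an aside, the fenced example in this hunk is fragmentary: `A`, `B`, `C`, `D`, and `mask` are never declared. A self-contained sketch that exercises the same intrinsics is shown below; the program name, shapes, and values are illustrative assumptions rather than part of the course file.

```fortran
! Illustrative sketch only; shapes and values are assumed, not from the course file
program intrinsics_demo
   implicit none
   integer, parameter :: N=2, M=3
   integer :: A(N,M), B(M,N), C, D(2), i
   logical :: mask(N,M)

   A = reshape([(i, i=-3,2)], [N,M])   ! mix of negative and positive values
   mask = A < 0                        ! .true. where A is negative
   print *, merge(A, 0, mask)          ! keep A where mask is .true., else 0
   B = reshape(A, [M,N])               ! B has shape M x N
   print *, shape(B)                   ! 3 2
   C = 1
   D = [1, 2]
   print *, spread(C, 1, 2)            ! "1 1"
   print *, spread(D, 2, 2)            ! copies D along a new second dimension
end program intrinsics_demo
```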
(binary file changed, 17.6 KB; contents not shown)
New file
@@ -0,0 +1,13 @@
+PROGRAM test_sum
+INTEGER, DIMENSION(2) :: S
+INTEGER, DIMENSION(12) :: X
+INTEGER, DIMENSION(4,3):: A
+
+x=[(i,i=1,12)]
+s=[3,4]
+A=RESHAPE(x,(/4,3/))
+print *, SIZE(A),SHAPE(x),SHAPE(A)
+
+END PROGRAM
+
+
(binary file changed; contents not shown)

content/courses/parallel-computing-introduction/codes/mpi_nonblock_halo.cxx

+1-1
@@ -92,8 +92,8 @@ int main (int argc, char *argv[]) {
         }
     }
 
-    MPI_Request requests[4];
     int nrequests=4;
+    MPI_Request requests[nrequests];
 
     MPI_Irecv(&w[nrl+1][1], ncl, MPI_DOUBLE, down, tag, MPI_COMM_WORLD, &requests[0]);
     MPI_Irecv(&w[0][1], ncl, MPI_DOUBLE, up, tag, MPI_COMM_WORLD, &requests[1]);
New file
@@ -0,0 +1,133 @@
+#include <iostream>
+#include <iomanip>
+#include <mpi.h>
+
+using namespace std;
+
+int main (int argc, char *argv[]) {
+
+    int i, j;
+    int N;
+
+    // Added for MPI
+    int nr, nc;
+    int rank, nprocs;
+    int root=0, tag=0;
+    int src, dest;
+
+    //Initialize MPI
+    MPI_Init(&argc, &argv);
+    MPI_Comm_size(MPI_COMM_WORLD,&nprocs);
+    MPI_Comm_rank(MPI_COMM_WORLD,&rank);
+
+    N = nprocs;
+    nr = N+2;
+    nc = N;
+
+    double **w=new double*[nr];
+    double *wptr=new double[(nr)*(nc)];
+
+    for (i=0;i<nr;++i,wptr+=nc) {
+        w[i] = wptr;
+    }
+
+    for ( i = 0; i < nr; i++ ) {
+        for (j = 0; j < nc; j++ ) {
+            w[i][j] = 0.;
+        }
+    }
+
+    double **u=new double*[nr];
+    double *uptr=new double[(nr)*(nc)];
+
+    for (i=0;i<nr;++i,uptr+=nc) {
+        u[i] = uptr;
+    }
+
+    double counter=1.;
+    for ( i = 0; i < nr; i++ ) {
+        for (j = 0; j < nc; j++ ) {
+            u[i][j] = counter;
+            counter++;
+        }
+    }
+
+    //Cyclic sending
+    if (rank == nprocs-1) {
+        src=rank-1;
+        dest=0;
+    }
+    else if (rank==0) {
+        src=nprocs-1;
+        dest=1;
+    }
+    else {
+        src=rank-1;
+        dest=rank+1;
+    }
+
+    //These values pick a total of nr (ncount) items, one item
+    //(blocklength) taken from each group of nc (stride) items
+
+    //The length of the column is the number of rows
+    int ncount=nr;
+    //The number of items picked from each stride is 1
+    int blocklength=1;
+    //The length of the row is the number of columns
+    int stride=nc;
+
+    MPI_Datatype cols;
+    MPI_Type_vector(ncount,blocklength,stride,MPI_DOUBLE,&cols);
+    MPI_Type_commit(&cols);
+
+    int nrequests=2;
+    MPI_Request requests[nrequests];
+
+    if (rank==0) {
+        MPI_Irecv(&w[0][0], 1, cols, src, tag, MPI_COMM_WORLD, &requests[0]);
+        MPI_Isend(&u[0][0], 1, cols, dest, tag, MPI_COMM_WORLD, &requests[1]);
+    }
+    else if (rank==nprocs-1) {
+        MPI_Irecv(&w[0][nprocs-1], 1, cols, src, tag, MPI_COMM_WORLD, &requests[0]);
+        MPI_Isend(&u[0][nprocs-1], 1, cols, dest, tag, MPI_COMM_WORLD, &requests[1]);
+    }
+    else {
+        MPI_Irecv(&w[0][rank], 1, cols, src, tag, MPI_COMM_WORLD, &requests[0]);
+        MPI_Isend(&u[0][rank], 1, cols, dest, tag, MPI_COMM_WORLD, &requests[1]);
+    }
+
+    MPI_Status status_arr[nrequests];
+    MPI_Waitall(nrequests,requests,status_arr);
+
+
+    MPI_Type_free(&cols);
+
+    //Try to print neatly
+
+    //U is the same for each rank in this example
+
+    if (rank==0) {
+        cout<<"U"<<endl;
+        for (i=0;i<nr;i++) {
+            for (j=0;j<nc;j++) {
+                cout<<setprecision(6)<<u[i][j]<<" ";
+            }
+            cout<<endl;
+        }
+    }
+
+    MPI_Barrier(MPI_COMM_WORLD);
+    cout<<endl;
+    MPI_Barrier(MPI_COMM_WORLD);
+    cout<<"W for rank "<<rank<<endl;
+    for (i=0;i<nr;i++) {
+        for (j=0;j<nc;j++) {
+            cout<<setprecision(6)<<w[i][j]<<" ";
+        }
+        cout<<endl;
+    }
+    cout<<endl;
+
+    MPI_Finalize();
+
+}

content/courses/parallel-computing-introduction/codes/mpi_vector_type.f90

+47-32
@@ -7,8 +7,8 @@ program sendrows
 
   integer :: nr, nc
   integer :: rank, nprocs, tag=0
-  integer :: err, errcode
   integer :: ncount, blocklength, stride
+  integer :: nrequests
   type(MPI_Status), dimension(:), allocatable :: mpi_status_arr
   type(MPI_Request), dimension(:), allocatable :: mpi_requests
   type(MPI_Datatype) :: rows
@@ -21,13 +21,17 @@ program sendrows
   call MPI_COMM_SIZE(MPI_COMM_WORLD,nprocs)
   call MPI_COMM_RANK(MPI_COMM_WORLD,rank)
 
-  !We will make the matrix scale with number of processes for simplicity
-  nr=nprocs
-  nc=nprocs
+  N=nprocs
+  nr=N
+  nc=N+2
+
+  nrequests=2
 
   allocate(u(nr,nc),w(nr,nc))
-  allocate(mpi_requests(2*nprocs),mpi_status_arr(2*nprocs))
-  u=0.0d0
+  allocate(mpi_requests(nrequests),mpi_status_arr(nrequests))
+
+  u=reshape([(i,i=1,nr*nc)],(/nr,nc/))
+
   w=0.0d0
 
   !Cyclic sending
@@ -36,51 +40,62 @@
      dest=0
   else if (rank==0) then
      src=nprocs-1
-     dest=rank+1
+     dest=1
   else
      src=rank-1
      dest=rank+1
   endif
 
-  ncount=1
-  blocklength=nc
+  ! These values pick a total of nc (ncount) items, one item
+  ! (blocklength) taken for each nr (stride) items
+
+  ! The length of the row is the number of columns
+  ncount=nc
+  ! The number of items picked from each stride is 1
+  blocklength=1
+  ! The length of the column is the number of rows
   stride=nr
 
   call MPI_Type_vector(ncount,blocklength,stride,MPI_DOUBLE_PRECISION,rows)
 
   call MPI_TYPE_COMMIT(rows)
 
-  do i=0,nprocs-1
-     if (rank==i) then
-        tag=i
-        print *, i,i+1,i+nprocs+1
-        if (i==0) then
-           call MPI_Irecv(w(nprocs,1),1,rows,src,tag,MPI_COMM_WORLD,mpi_requests(i+1))
-           call MPI_Isend(u(i+1,1),1,rows,dest,tag,MPI_COMM_WORLD,mpi_requests(i+nprocs+1))
-        else if (i==nprocs-1) then
-           call MPI_Irecv(w(1,1),1,rows,src,tag,MPI_COMM_WORLD,mpi_requests(i+1))
-           call MPI_Isend(u(nprocs,1),1,rows,dest,tag,MPI_COMM_WORLD,mpi_requests(i+nprocs+1))
-        else
-           call MPI_Irecv(w(i+2,1),1,rows,src,tag,MPI_COMM_WORLD,mpi_requests(i+1))
-           call MPI_Isend(u(i+1,1),1,rows,dest,tag,MPI_COMM_WORLD,mpi_requests(i+nprocs+1))
-        endif
-     endif
-  enddo
+  if (rank==0) then
+     call MPI_Irecv(w(1,1),1,rows,src,tag,MPI_COMM_WORLD,mpi_requests(1))
+     call MPI_Isend(u(1,1),1,rows,dest,tag,MPI_COMM_WORLD,mpi_requests(2))
+  else if (rank==nprocs-1) then
+     call MPI_Irecv(w(nprocs,1),1,rows,src,tag,MPI_COMM_WORLD,mpi_requests(1))
+     call MPI_Isend(u(nprocs,1),1,rows,dest,tag,MPI_COMM_WORLD,mpi_requests(2))
+  else
+     call MPI_Irecv(w(rank+1,1),1,rows,src,tag,MPI_COMM_WORLD,mpi_requests(1))
+     call MPI_Isend(u(rank+1,1),1,rows,dest,tag,MPI_COMM_WORLD,mpi_requests(2))
+  endif
 
   call MPI_Waitall(size(mpi_requests),mpi_requests,mpi_status_arr)
 
-
  call MPI_TYPE_FREE(rows)
 
  !Print neatly
-  do i=1,nr
-     write(*,*) "|",u(i,:),"|"," |",w(i,:),"|"
+
+  ! U is the same for each rank in this example
+  if (rank==0) then
+     write(*,*) "U"
+     do j=1,nr
+        write(*,'(*(g12.6))') u(j,:)
+     enddo
+  endif
+  call MPI_Barrier(MPI_COMM_WORLD)
+  do i=1,nprocs
+     call MPI_Barrier(MPI_COMM_WORLD)
+     if (rank==i-1) then
+        write(*,*)
+        write(*,*) "W for rank ",rank
+        do j=1,nr
+           write(*,'(*(g12.6))') w(j,:)
+        enddo
+     endif
  enddo
 
  call MPI_Finalize()
 
 end program
-
-
-
-
New file
@@ -0,0 +1,83 @@
+import sys
+import numpy as np
+from mpi4py import MPI
+
+comm = MPI.COMM_WORLD
+rank = comm.Get_rank()
+nprocs = comm.Get_size()
+
+N = nprocs
+nr = N+2
+nc = N
+
+u = np.arange(1,nr*nc+1,dtype=np.double).reshape(nr,nc)  # double precision so the buffer matches MPI.DOUBLE below
+
+w = np.zeros_like(u)
+
+#Cyclic sending
+if rank == nprocs-1:
+    src=rank-1
+    dest=0
+elif (rank==0):
+    src=nprocs-1
+    dest=1
+else:
+    src=rank-1
+    dest=rank+1
+
+#These values pick a total of nr (ncount) items, one item
+#(blocklength) taken from each group of nc (stride) items
+
+#The length of the column is the number of rows
+ncount=nr
+#The number of items picked from each stride is 1
+blocklength=1
+#The length of the row is the number of columns
+stride=nc
+
+cols = MPI.DOUBLE.Create_vector(ncount, blocklength, stride)
+cols.Commit()
+
+if rank==0:
+    recv_request=comm.Irecv([np.frombuffer(w.data,np.double,offset=0),1,cols],src)
+    send_request=comm.Isend([np.frombuffer(u.data,np.double,offset=0),1,cols],dest)
+elif rank==nprocs-1:
+    sendcol=nprocs-1
+    recv_request=comm.Irecv([np.frombuffer(w.data,np.double,offset=sendcol*np.dtype('double').itemsize),1,cols],src)
+    send_request=comm.Isend([np.frombuffer(u.data,np.double,offset=sendcol*np.dtype('double').itemsize),1,cols],dest)
+else:
+    sendcol=rank
+    recv_request=comm.Irecv([np.frombuffer(w.data,np.double,offset=sendcol*np.dtype('double').itemsize),1,cols],src)
+    send_request=comm.Isend([np.frombuffer(u.data,np.double,offset=sendcol*np.dtype('double').itemsize),1,cols],dest)
+
+requests=[recv_request,send_request]
+
+MPI.Request.Waitall(requests)
+
+cols.Free()
+
+#Print neatly
+
+#U is the same for each rank in this example
+
+if rank==0:
+    print("U")
+    for i in range(nr):
+        for j in range(nc):
+            print("{:12.6f}".format(u[i,j]),end="")
+        print()
+
+print()
+
+comm.Barrier()
+
+print("W for rank", rank)
+comm.Barrier()
+for i in range(nr):
+    for j in range(nc):
+        print("{:12.6f}".format(w[i,j]),end="")
+    print()
+
+print()
+
+

content/courses/parallel-computing-introduction/distributed_mpi_build_run.md

+1-1
@@ -27,7 +27,7 @@ Each MPI program must include the `mpi.h` header file. If the MPI distribution w
 
 All new Fortran programs should use the `mpi` module provided by the MPI software. If the MPI distribution was installed correctly, the `mpif90` or equivalent will find the module and link to the correct library.
 
-Any recent MPI will also provide an `mpi_f08` module. Its use is recommended, but we will wait till [later](courses/paralll-incomputing-introduction/distributed_mpi_nonblocking_exchange) to introduce it. This new module takes better advantage of modern Fortran features such as types. The compiler used must support at least the Fortran 2008 standard.
+Any recent MPI will also provide an `mpi_f08` module. Its use is recommended, but we will wait till [later](courses/paralll-incomputing-introduction/distributed_mpi_nonblocking_exchange) to introduce it. This new module takes better advantage of modern Fortran features such as types. In addition, the ubiquitous "ierror" parameter at the end of most argument lists becomes an _optional_ argument in the mpi_f08 subroutine definitions. The compiler used must support at least the Fortran 2008 standard.
 
 {{< spoiler text="Fortran" >}}
 {{< code-download file="/courses/parallel-computing-introduction/codes/mpi1.f90" lang="fortran" >}}
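
As a side note on the sentence added above: with `mpi_f08` the error-code argument can simply be omitted. A minimal sketch is shown below; it is an illustrative assumption, not the `mpi1.f90` file that the shortcode downloads.

```fortran
! Minimal mpi_f08 sketch (illustrative; not the course's mpi1.f90)
program hello_f08
   use mpi_f08        ! Fortran 2008 bindings; ierror becomes optional
   implicit none
   integer :: rank, nprocs

   call MPI_Init()                              ! no ierror argument needed
   call MPI_Comm_size(MPI_COMM_WORLD, nprocs)
   call MPI_Comm_rank(MPI_COMM_WORLD, rank)
   print *, "Hello from rank", rank, "of", nprocs
   call MPI_Finalize()
end program hello_f08
```

Compile with `mpif90` (or the vendor's wrapper) and launch with `mpiexec`; as noted above, the compiler must support at least Fortran 2008.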
