forked from moebiusband/NuSiF-Solver
		
	Initial checkin
This commit is contained in:
		
							
								
								
									
										61
									
								
								BasicSolver/2D-mpi/src/affinity.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										61
									
								
								BasicSolver/2D-mpi/src/affinity.c
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,61 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifdef __linux__
 | 
			
		||||
#ifdef _OPENMP
 | 
			
		||||
#include <pthread.h>
 | 
			
		||||
#include <sched.h>
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
#include <sys/syscall.h>
 | 
			
		||||
#include <sys/types.h>
 | 
			
		||||
#include <unistd.h>
 | 
			
		||||
 | 
			
		||||
#define MAX_NUM_THREADS 128
 | 
			
		||||
#define gettid()        syscall(SYS_gettid)
 | 
			
		||||
 | 
			
		||||
static int getProcessorID(cpu_set_t* cpu_set)
 | 
			
		||||
{
 | 
			
		||||
    int processorId;
 | 
			
		||||
 | 
			
		||||
    for (processorId = 0; processorId < MAX_NUM_THREADS; processorId++) {
 | 
			
		||||
        if (CPU_ISSET(processorId, cpu_set)) {
 | 
			
		||||
            break;
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
    return processorId;
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
/*
 * Query the affinity mask of the calling thread (addressed by its kernel
 * thread id) and return the lowest CPU id found in it by getProcessorID().
 *
 * The return code of sched_getaffinity() is not checked; if the call fails
 * the mask stays empty.
 */
int affinity_getProcessorId()
{
    cpu_set_t mask;

    CPU_ZERO(&mask);
    sched_getaffinity(gettid(), sizeof(mask), &mask);

    return getProcessorID(&mask);
}
 | 
			
		||||
 | 
			
		||||
/*
 * Restrict the calling thread to the single CPU processorId.
 *
 * The return code of pthread_setaffinity_np() is not checked.
 */
void affinity_pinThread(int processorId)
{
    cpu_set_t mask;

    CPU_ZERO(&mask);
    CPU_SET(processorId, &mask);
    pthread_setaffinity_np(pthread_self(), sizeof(mask), &mask);
}
 | 
			
		||||
 | 
			
		||||
/*
 * Set the affinity mask of the caller (pid argument 0) to the single CPU
 * processorId.
 *
 * The return code of sched_setaffinity() is not checked.
 */
void affinity_pinProcess(int processorId)
{
    cpu_set_t mask;

    CPU_ZERO(&mask);
    CPU_SET(processorId, &mask);
    sched_setaffinity(0, sizeof(mask), &mask);
}
 | 
			
		||||
#endif /*_OPENMP*/
 | 
			
		||||
#endif /*__linux__*/
 | 
			
		||||
							
								
								
									
										14
									
								
								BasicSolver/2D-mpi/src/affinity.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										14
									
								
								BasicSolver/2D-mpi/src/affinity.h
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,14 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef AFFINITY_H
 | 
			
		||||
#define AFFINITY_H
 | 
			
		||||
 | 
			
		||||
/* Lowest CPU id contained in the affinity mask of the calling thread. */
extern int affinity_getProcessorId();

/* Pin the caller to the single CPU processorId via sched_setaffinity(). */
extern void affinity_pinProcess(int processorId);

/* Pin the calling thread to the single CPU processorId via pthreads. */
extern void affinity_pinThread(int processorId);
 | 
			
		||||
 | 
			
		||||
#endif /*AFFINITY_H*/
 | 
			
		||||
							
								
								
									
										35
									
								
								BasicSolver/2D-mpi/src/allocate.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										35
									
								
								BasicSolver/2D-mpi/src/allocate.c
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,35 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <errno.h>
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
 | 
			
		||||
/*
 * Allocate bytesize bytes whose address is a multiple of alignment, using
 * posix_memalign().
 *
 * alignment must be a positive power of two (posix_memalign additionally
 * requires a multiple of sizeof(void*)).
 *
 * This function never returns NULL: every failure prints a message to stderr
 * and terminates the process with EXIT_FAILURE. Release the memory with
 * free().
 */
void* allocate(int alignment, size_t bytesize)
{
    /* Start from NULL so the pointer is never read while indeterminate. */
    void* ptr = NULL;
    /* A non-positive alignment can never be valid; report it as EINVAL
     * instead of letting it wrap around to a huge size_t. */
    int errorCode = (alignment > 0)
                        ? posix_memalign(&ptr, (size_t)alignment, bytesize)
                        : EINVAL;

    if (errorCode == EINVAL) {
        fprintf(stderr, "Error: Alignment parameter is not a power of two\n");
        exit(EXIT_FAILURE);
    }

    if (errorCode == ENOMEM) {
        fprintf(stderr, "Error: Insufficient memory to fulfill the request\n");
        exit(EXIT_FAILURE);
    }

    /* Any other error code, or a NULL result, is treated as a failure too. */
    if (errorCode != 0 || ptr == NULL) {
        fprintf(stderr, "Error: posix_memalign failed!\n");
        exit(EXIT_FAILURE);
    }

    return ptr;
}
 | 
			
		||||
							
								
								
									
										13
									
								
								BasicSolver/2D-mpi/src/allocate.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										13
									
								
								BasicSolver/2D-mpi/src/allocate.h
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,13 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __ALLOCATE_H_
 | 
			
		||||
#define __ALLOCATE_H_
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
 | 
			
		||||
/*
 * Return bytesize bytes aligned to alignment, obtained from posix_memalign().
 * On the handled error paths the implementation prints a message to stderr
 * and exits instead of returning NULL.
 */
extern void* allocate(int alignment, size_t bytesize);
 | 
			
		||||
 | 
			
		||||
#endif
 | 
			
		||||
							
								
								
									
										326
									
								
								BasicSolver/2D-mpi/src/comm.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										326
									
								
								BasicSolver/2D-mpi/src/comm.c
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,326 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <stddef.h>
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
 | 
			
		||||
#include "comm.h"
 | 
			
		||||
 | 
			
		||||
// subroutines local to this module
 | 
			
		||||
/*
 * Share of N items that falls to position `rank` when they are split into
 * `size` parts: every part gets N / size items and the first N % size
 * positions receive one additional item.
 */
static int sizeOfRank(int rank, int size, int N)
{
    int share = N / size;

    if (rank < N % size) {
        share++;
    }

    return share;
}
 | 
			
		||||
 | 
			
		||||
/*
 * Create and commit the MPI subarray datatype that describes one edge strip
 * of the local (jmaxLocal + 2) x (imaxLocal + 2) array of doubles and store
 * it in the Comm.
 *
 * direction: edge to describe (LEFT, RIGHT, BOTTOM or TOP).
 * layer:     HALO selects the outermost strip and stores the type in
 *            rbufferTypes[direction]; BULK selects the strip one cell further
 *            inside and stores the type in sbufferTypes[direction].
 */
static void setupCommunication(Comm* c, int direction, int layer)
{
    MPI_Datatype stripType;
    const int ni = c->imaxLocal;
    const int nj = c->jmaxLocal;
    /* HALO strips start one cell further out than BULK strips */
    const int shift = (layer == HALO) ? 1 : 0;
    int fullExtent[NDIMS];
    int stripExtent[NDIMS];
    int stripStart[NDIMS];

    fullExtent[JDIM] = nj + 2;
    fullExtent[IDIM] = ni + 2;

    switch (direction) {
    case LEFT:
    case RIGHT:
        /* a single i index spanning all interior j */
        stripExtent[IDIM] = 1;
        stripExtent[JDIM] = nj;
        stripStart[JDIM]  = 1;
        stripStart[IDIM]  = (direction == LEFT) ? 1 - shift : ni + shift;
        break;
    case BOTTOM:
    case TOP:
        /* a single j index spanning all interior i */
        stripExtent[IDIM] = ni;
        stripExtent[JDIM] = 1;
        stripStart[IDIM]  = 1;
        stripStart[JDIM]  = (direction == BOTTOM) ? 1 - shift : nj + shift;
        break;
    }

    MPI_Type_create_subarray(NDIMS,
        fullExtent,
        stripExtent,
        stripStart,
        MPI_ORDER_C,
        MPI_DOUBLE,
        &stripType);
    MPI_Type_commit(&stripType);

    if (layer == HALO) {
        c->rbufferTypes[direction] = stripType;
    } else if (layer == BULK) {
        c->sbufferTypes[direction] = stripType;
    }
}
 | 
			
		||||
 | 
			
		||||
/*
 * Gather one distributed field on rank 0.
 *
 * Every rank sends the interior (without the one-cell border) of its local
 * array src to rank 0. Rank 0 receives the block of rank i directly into the
 * jmax x imax array dst at the position given by offset[i * NDIMS + JDIM/IDIM]
 * with extent jmaxLocal[i] x imaxLocal[i].
 *
 * imaxLocal, jmaxLocal and offset are only read on rank 0.
 * The call returns once all of its sends and receives have completed.
 */
static void assembleResult(Comm* c,
    double* src,
    double* dst,
    int imaxLocal[],
    int jmaxLocal[],
    int offset[],
    int jmax,
    int imax)
{
    /* one send on every rank, plus one receive per rank on rank 0 */
    int numRequests       = (c->rank == 0) ? c->size + 1 : 1;
    MPI_Request* requests = malloc(numRequests * sizeof *requests);

    if (requests == NULL) {
        fprintf(stderr, "Error: Insufficient memory for MPI requests\n");
        exit(EXIT_FAILURE);
    }

    /* all ranks send their bulk array */
    MPI_Datatype bulkType;
    int localSizes[NDIMS]  = { c->jmaxLocal + 2, c->imaxLocal + 2 };
    int bulkSizes[NDIMS]   = { c->jmaxLocal, c->imaxLocal };
    int bulkStarts[NDIMS]  = { 1, 1 };
    MPI_Type_create_subarray(NDIMS,
        localSizes,
        bulkSizes,
        bulkStarts,
        MPI_ORDER_C,
        MPI_DOUBLE,
        &bulkType);
    MPI_Type_commit(&bulkType);

    MPI_Isend(src, 1, bulkType, 0, 0, c->comm, &requests[0]);
    /* Freeing only marks the type for deallocation; the pending send still
     * completes normally. Without this every call leaks a datatype. */
    MPI_Type_free(&bulkType);

    /* rank 0 assembles the subdomains */
    if (c->rank == 0) {
        for (int i = 0; i < c->size; i++) {
            MPI_Datatype domainType;
            int globalSizes[NDIMS] = { jmax, imax };
            int blockSizes[NDIMS]  = { jmaxLocal[i], imaxLocal[i] };
            int blockStarts[NDIMS] = { offset[i * NDIMS + JDIM],
                offset[i * NDIMS + IDIM] };
            MPI_Type_create_subarray(NDIMS,
                globalSizes,
                blockSizes,
                blockStarts,
                MPI_ORDER_C,
                MPI_DOUBLE,
                &domainType);
            MPI_Type_commit(&domainType);

            MPI_Irecv(dst, 1, domainType, i, 0, c->comm, &requests[i + 1]);
            MPI_Type_free(&domainType);
        }
    }

    MPI_Waitall(numRequests, requests, MPI_STATUSES_IGNORE);
    free(requests);
}
 | 
			
		||||
 | 
			
		||||
/*
 * Sum of the first `position` entries of sizes, i.e. sizes[0] up to
 * sizes[position - 1]. Returns 0 when position is zero or negative.
 */
static int sum(int* sizes, int position)
{
    int total = 0;

    for (int k = position - 1; k >= 0; k--) {
        total += sizes[k];
    }

    return total;
}
 | 
			
		||||
 | 
			
		||||
// exported subroutines
 | 
			
		||||
void commReduction(double* v, int op)
 | 
			
		||||
{
 | 
			
		||||
    if (op == MAX) {
 | 
			
		||||
        MPI_Allreduce(MPI_IN_PLACE, v, 1, MPI_DOUBLE, MPI_MAX, MPI_COMM_WORLD);
 | 
			
		||||
    } else if (op == SUM) {
 | 
			
		||||
        MPI_Allreduce(MPI_IN_PLACE, v, 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
/*
 * Return non-zero if this process sits at the edge of the process grid in
 * the given direction, i.e. its coordinate is 0 (LEFT, BOTTOM) or the last
 * one (RIGHT, TOP) along the matching dimension. Unknown directions yield 0.
 */
int commIsBoundary(Comm* c, int direction)
{
    int onBoundary = 0;

    if (direction == LEFT) {
        onBoundary = (c->coords[IDIM] == 0);
    } else if (direction == RIGHT) {
        onBoundary = (c->coords[IDIM] == (c->dims[IDIM] - 1));
    } else if (direction == BOTTOM) {
        onBoundary = (c->coords[JDIM] == 0);
    } else if (direction == TOP) {
        onBoundary = (c->coords[JDIM] == (c->dims[JDIM] - 1));
    }

    return onBoundary;
}
 | 
			
		||||
 | 
			
		||||
/*
 * Exchange the edge strips of grid with all four neighbours in one
 * neighbourhood collective: the BULK strip of every edge is sent and the
 * matching HALO strip is received, using the datatypes prepared in commInit.
 *
 * On a Cartesian communicator MPI_Neighbor_alltoallw orders the neighbours by
 * dimension (0, 1, ...), negative direction before positive direction. The
 * type arrays in Comm are indexed by enum direction instead, so they are
 * permuted into the neighbour order here; passing them unchanged would pair
 * each strip with the wrong neighbour.
 */
void commExchange(Comm* c, double* grid)
{
    int counts[NDIRS]      = { 1, 1, 1, 1 };
    MPI_Aint displs[NDIRS] = { 0, 0, 0, 0 };
    int order[NDIRS];
    MPI_Datatype sendTypes[NDIRS];
    MPI_Datatype recvTypes[NDIRS];

    /* commInit shifts along JDIM for BOTTOM/TOP and along IDIM for
     * LEFT/RIGHT, with the first of each pair in the negative direction. */
    order[2 * JDIM]     = BOTTOM;
    order[2 * JDIM + 1] = TOP;
    order[2 * IDIM]     = LEFT;
    order[2 * IDIM + 1] = RIGHT;

    for (int k = 0; k < NDIRS; k++) {
        sendTypes[k] = c->sbufferTypes[order[k]];
        recvTypes[k] = c->rbufferTypes[order[k]];
    }

    MPI_Neighbor_alltoallw(grid,
        counts,
        displs,
        sendTypes,
        grid,
        counts,
        displs,
        recvTypes,
        c->comm);
}
 | 
			
		||||
 | 
			
		||||
/*
 * One-directional halo shift of f and g:
 *   g: receive the BOTTOM halo strip from the bottom neighbour and send the
 *      TOP bulk strip to the top neighbour (message tag 0);
 *   f: receive the LEFT halo strip from the left neighbour and send the
 *      RIGHT bulk strip to the right neighbour (message tag 1).
 * Returns after all four non-blocking operations have completed.
 */
void commShift(Comm* c, double* f, double* g)
{
    enum { TAG_G = 0, TAG_F = 1, NUM_REQUESTS = 4 };
    MPI_Request pending[NUM_REQUESTS];

    for (int k = 0; k < NUM_REQUESTS; k++) {
        pending[k] = MPI_REQUEST_NULL;
    }

    /* shift G: bottom -> top */
    MPI_Irecv(g,
        1,
        c->rbufferTypes[BOTTOM],
        c->neighbours[BOTTOM],
        TAG_G,
        c->comm,
        &pending[0]);
    MPI_Isend(g,
        1,
        c->sbufferTypes[TOP],
        c->neighbours[TOP],
        TAG_G,
        c->comm,
        &pending[1]);

    /* shift F: left -> right */
    MPI_Irecv(f,
        1,
        c->rbufferTypes[LEFT],
        c->neighbours[LEFT],
        TAG_F,
        c->comm,
        &pending[2]);
    MPI_Isend(f,
        1,
        c->sbufferTypes[RIGHT],
        c->neighbours[RIGHT],
        TAG_F,
        c->comm,
        &pending[3]);

    MPI_Waitall(NUM_REQUESTS, pending, MPI_STATUSES_IGNORE);
}
 | 
			
		||||
 | 
			
		||||
/*
 * Collect the distributed fields u, v and p into the global jmax x imax
 * arrays ug, vg and pg on rank 0.
 *
 * The local sizes of all ranks are gathered on rank 0, which derives the
 * position of every subdomain in the global array, prints one summary line
 * per rank and then assembles the three fields with assembleResult().
 *
 * The offset of a subdomain along one axis is the sum of the subdomain sizes
 * of all process-grid positions that precede it on that axis. The gathered
 * size arrays are indexed by rank, so the sizes along each axis are first
 * looked up through MPI_Cart_rank; summing the first entries of the
 * rank-indexed arrays directly gives wrong offsets as soon as the sizes are
 * not uniform.
 */
void commCollectResult(Comm* c,
    double* ug,
    double* vg,
    double* pg,
    double* u,
    double* v,
    double* p,
    int jmax,
    int imax)
{
    int offset[c->size * NDIMS];
    int imaxLocal[c->size];
    int jmaxLocal[c->size];

    /* Gather on the Cartesian communicator so the array index is the rank
     * that MPI_Cart_coords / MPI_Cart_rank refer to below. */
    MPI_Gather(&c->imaxLocal, 1, MPI_INT, imaxLocal, 1, MPI_INT, 0, c->comm);
    MPI_Gather(&c->jmaxLocal, 1, MPI_INT, jmaxLocal, 1, MPI_INT, 0, c->comm);

    if (c->rank == 0) {
        /* subdomain size at each position along the i and j axis */
        int isize[c->dims[IDIM]];
        int jsize[c->dims[JDIM]];
        int probe[NDIMS];
        int probeRank;

        for (int k = 0; k < c->dims[IDIM]; k++) {
            probe[JDIM] = 0;
            probe[IDIM] = k;
            MPI_Cart_rank(c->comm, probe, &probeRank);
            isize[k] = imaxLocal[probeRank];
        }

        for (int k = 0; k < c->dims[JDIM]; k++) {
            probe[JDIM] = k;
            probe[IDIM] = 0;
            MPI_Cart_rank(c->comm, probe, &probeRank);
            jsize[k] = jmaxLocal[probeRank];
        }

        for (int i = 0; i < c->size; i++) {
            int coords[NDIMS];
            MPI_Cart_coords(c->comm, i, NDIMS, coords);
            offset[i * NDIMS + IDIM] = sum(isize, coords[IDIM]);
            offset[i * NDIMS + JDIM] = sum(jsize, coords[JDIM]);
            printf("Rank: %d, Coords(j,i): %d %d, Size(j,i): %d %d "
                   "Offset(j,i): %d %d\n",
                i,
                coords[JDIM],
                coords[IDIM],
                jmaxLocal[i],
                imaxLocal[i],
                offset[i * NDIMS + JDIM],
                offset[i * NDIMS + IDIM]);
        }
    }

    /* collect P */
    assembleResult(c, p, pg, imaxLocal, jmaxLocal, offset, jmax, imax);

    /* collect U */
    assembleResult(c, u, ug, imaxLocal, jmaxLocal, offset, jmax, imax);

    /* collect V */
    assembleResult(c, v, vg, imaxLocal, jmaxLocal, offset, jmax, imax);
}
 | 
			
		||||
 | 
			
		||||
/*
 * Print the communication setup of every rank to stdout: rank and size, the
 * four neighbour ranks, the process-grid coordinates and the local domain
 * size. The master prints a heading first.
 *
 * The ranks take turns: a barrier after every turn keeps the processes in
 * step so that rank i prints before rank i + 1. How the MPI runtime merges
 * the output streams is outside this function's control, so the ordering is
 * best effort.
 */
void commPrintConfig(Comm* c)
{
    fflush(stdout);
    MPI_Barrier(MPI_COMM_WORLD);
    if (commIsMaster(c)) {
        printf("Communication setup:\n");
    }

    for (int i = 0; i < c->size; i++) {
        if (i == c->rank) {
            printf("\tRank %d of %d\n", c->rank, c->size);
            printf("\tNeighbours (bottom, top, left, right): %d %d, %d, %d\n",
                c->neighbours[BOTTOM],
                c->neighbours[TOP],
                c->neighbours[LEFT],
                c->neighbours[RIGHT]);
            printf("\tCoordinates (j,i) %d %d\n", c->coords[JDIM], c->coords[IDIM]);
            printf("\tLocal domain size (j,i) %dx%d\n", c->jmaxLocal, c->imaxLocal);
            fflush(stdout);
        }
        /* every rank waits here, so turn i ends before turn i + 1 starts */
        MPI_Barrier(MPI_COMM_WORLD);
    }
}
 | 
			
		||||
 | 
			
		||||
/*
 * Initialise the Comm for a global grid of jmax x imax cells.
 *
 * Queries rank and size in MPI_COMM_WORLD, creates a non-periodic
 * two-dimensional Cartesian communicator (no rank reordering) with a process
 * grid chosen by MPI_Dims_create, looks up the four neighbours, the grid
 * dimensions and this process' coordinates, computes the local domain size
 * and creates the send (BULK) and receive (HALO) datatypes for all four
 * directions.
 *
 * The local size along each axis is derived from the process' coordinate on
 * that axis. Using the global rank instead gives inconsistent subdomain sizes
 * whenever imax or jmax is not divisible by the process-grid extent.
 */
void commInit(Comm* c, int jmax, int imax)
{
    /* setup communication */
    MPI_Comm_rank(MPI_COMM_WORLD, &(c->rank));
    MPI_Comm_size(MPI_COMM_WORLD, &(c->size));
    int dims[NDIMS]    = { 0, 0 };
    int periods[NDIMS] = { 0, 0 };
    MPI_Dims_create(c->size, NDIMS, dims);
    MPI_Cart_create(MPI_COMM_WORLD, NDIMS, dims, periods, 0, &c->comm);
    MPI_Cart_shift(c->comm, IDIM, 1, &c->neighbours[LEFT], &c->neighbours[RIGHT]);
    MPI_Cart_shift(c->comm, JDIM, 1, &c->neighbours[BOTTOM], &c->neighbours[TOP]);
    MPI_Cart_get(c->comm, NDIMS, c->dims, periods, c->coords);

    c->imaxLocal = sizeOfRank(c->coords[IDIM], c->dims[IDIM], imax);
    c->jmaxLocal = sizeOfRank(c->coords[JDIM], c->dims[JDIM], jmax);

    // setup buffer types for communication
    setupCommunication(c, LEFT, BULK);
    setupCommunication(c, LEFT, HALO);
    setupCommunication(c, RIGHT, BULK);
    setupCommunication(c, RIGHT, HALO);
    setupCommunication(c, BOTTOM, BULK);
    setupCommunication(c, BOTTOM, HALO);
    setupCommunication(c, TOP, BULK);
    setupCommunication(c, TOP, HALO);
}
 | 
			
		||||
							
								
								
									
										44
									
								
								BasicSolver/2D-mpi/src/comm.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										44
									
								
								BasicSolver/2D-mpi/src/comm.h
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,44 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __COMM_H_
 | 
			
		||||
#define __COMM_H_
 | 
			
		||||
#include <mpi.h>
 | 
			
		||||
 | 
			
		||||
/* Edges of the local domain; also the index into the per-direction arrays
 * of Comm. NDIRS is the number of directions. */
enum direction {
    LEFT = 0,
    RIGHT,
    BOTTOM,
    TOP,
    NDIRS
};

/* Index of the j and i axis in coordinate and size arrays; NDIMS is the
 * number of axes. */
enum dimension {
    JDIM = 0,
    IDIM,
    NDIMS
};

/* Strip selector for the edge datatypes: outermost strip (HALO) or the
 * strip next to it on the inside (BULK). */
enum layer {
    HALO = 0,
    BULK
};

/* Reduction selector for commReduction(). */
enum op {
    MAX = 0,
    SUM
};
 | 
			
		||||
 | 
			
		||||
typedef struct {
 | 
			
		||||
    int rank;
 | 
			
		||||
    int size;
 | 
			
		||||
    MPI_Comm comm;
 | 
			
		||||
    MPI_Datatype sbufferTypes[NDIRS];
 | 
			
		||||
    MPI_Datatype rbufferTypes[NDIRS];
 | 
			
		||||
    int neighbours[NDIRS];
 | 
			
		||||
    int coords[NDIMS], dims[NDIMS];
 | 
			
		||||
    int imaxLocal, jmaxLocal;
 | 
			
		||||
} Comm;
 | 
			
		||||
 | 
			
		||||
/* Set up communicator, neighbours, local sizes and edge datatypes. */
extern void commInit(Comm* c, int jmax, int imax);

/* Print the communication setup of every rank to stdout. */
extern void commPrintConfig(Comm* c);

/* Exchange the edge strips of grid with the neighbouring processes. */
extern void commExchange(Comm* c, double* grid);

/* Shift f from left to right and g from bottom to top by one strip. */
extern void commShift(Comm* c, double* f, double* g);

/* In-place all-reduce of *v; op is MAX or SUM. */
extern void commReduction(double* v, int op);

/* Non-zero if this process is at the process-grid edge in direction. */
extern int commIsBoundary(Comm* c, int direction);

/* Assemble the distributed fields u, v, p into ug, vg, pg on rank 0. */
extern void commCollectResult(Comm* c,
    double* ug,
    double* vg,
    double* pg,
    double* u,
    double* v,
    double* p,
    int jmax,
    int imax);
 | 
			
		||||
 | 
			
		||||
/* Non-zero on the process whose rank is 0, zero on all others. */
static inline int commIsMaster(Comm* c)
{
    return c->rank == 0;
}
 | 
			
		||||
#endif // __COMM_H_
 | 
			
		||||
							
								
								
									
										54
									
								
								BasicSolver/2D-mpi/src/likwid-marker.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										54
									
								
								BasicSolver/2D-mpi/src/likwid-marker.h
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,54 @@
 | 
			
		||||
/*
 | 
			
		||||
 * =======================================================================================
 | 
			
		||||
 *
 | 
			
		||||
 *      Author:   Jan Eitzinger (je), jan.eitzinger@fau.de
 | 
			
		||||
 *      Copyright (c) 2020 RRZE, University Erlangen-Nuremberg
 | 
			
		||||
 *
 | 
			
		||||
 *      Permission is hereby granted, free of charge, to any person obtaining a copy
 | 
			
		||||
 *      of this software and associated documentation files (the "Software"), to deal
 | 
			
		||||
 *      in the Software without restriction, including without limitation the rights
 | 
			
		||||
 *      to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 | 
			
		||||
 *      copies of the Software, and to permit persons to whom the Software is
 | 
			
		||||
 *      furnished to do so, subject to the following conditions:
 | 
			
		||||
 *
 | 
			
		||||
 *      The above copyright notice and this permission notice shall be included in all
 | 
			
		||||
 *      copies or substantial portions of the Software.
 | 
			
		||||
 *
 | 
			
		||||
 *      THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 | 
			
		||||
 *      IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 | 
			
		||||
 *      FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 | 
			
		||||
 *      AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 | 
			
		||||
 *      LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 | 
			
		||||
 *      OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 | 
			
		||||
 *      SOFTWARE.
 | 
			
		||||
 *
 | 
			
		||||
 * =======================================================================================
 | 
			
		||||
 */
 | 
			
		||||
#ifndef LIKWID_MARKERS_H
 | 
			
		||||
#define LIKWID_MARKERS_H
 | 
			
		||||
 | 
			
		||||
/*
 * Marker API wrappers. With LIKWID_PERFMON defined each macro forwards to the
 * corresponding likwid_marker* call; otherwise every macro expands to nothing
 * so instrumented code builds without the LIKWID library.
 */
#ifdef LIKWID_PERFMON

#include <likwid.h>

#define LIKWID_MARKER_INIT                likwid_markerInit()
#define LIKWID_MARKER_THREADINIT          likwid_markerThreadInit()
#define LIKWID_MARKER_SWITCH              likwid_markerNextGroup()
#define LIKWID_MARKER_REGISTER(regionTag) likwid_markerRegisterRegion(regionTag)
#define LIKWID_MARKER_START(regionTag)    likwid_markerStartRegion(regionTag)
#define LIKWID_MARKER_STOP(regionTag)     likwid_markerStopRegion(regionTag)
#define LIKWID_MARKER_CLOSE               likwid_markerClose()
#define LIKWID_MARKER_RESET(regionTag)    likwid_markerResetRegion(regionTag)
#define LIKWID_MARKER_GET(regionTag, nevents, events, time, count)                       \
    likwid_markerGetRegion(regionTag, nevents, events, time, count)

#else /* LIKWID_PERFMON */

/* no-op variants */
#define LIKWID_MARKER_INIT
#define LIKWID_MARKER_THREADINIT
#define LIKWID_MARKER_SWITCH
#define LIKWID_MARKER_REGISTER(regionTag)
#define LIKWID_MARKER_START(regionTag)
#define LIKWID_MARKER_STOP(regionTag)
#define LIKWID_MARKER_CLOSE
#define LIKWID_MARKER_GET(regionTag, nevents, events, time, count)
#define LIKWID_MARKER_RESET(regionTag)

#endif /* LIKWID_PERFMON */
 | 
			
		||||
 | 
			
		||||
#endif /*LIKWID_MARKERS_H*/
 | 
			
		||||
							
								
								
									
										95
									
								
								BasicSolver/2D-mpi/src/main.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										95
									
								
								BasicSolver/2D-mpi/src/main.c
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,95 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <float.h>
 | 
			
		||||
#include <limits.h>
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
#include <unistd.h>
 | 
			
		||||
 | 
			
		||||
#include "allocate.h"
 | 
			
		||||
#include "parameter.h"
 | 
			
		||||
#include "progress.h"
 | 
			
		||||
#include "solver.h"
 | 
			
		||||
#include "timing.h"
 | 
			
		||||
#include <mpi.h>
 | 
			
		||||
 | 
			
		||||
int main(int argc, char** argv)
 | 
			
		||||
{
 | 
			
		||||
    int rank;
 | 
			
		||||
    double S, E;
 | 
			
		||||
    Parameter params;
 | 
			
		||||
    Solver solver;
 | 
			
		||||
 | 
			
		||||
    MPI_Init(&argc, &argv);
 | 
			
		||||
    MPI_Comm_rank(MPI_COMM_WORLD, &rank);
 | 
			
		||||
    initParameter(¶ms);
 | 
			
		||||
 | 
			
		||||
    if (argc != 2) {
 | 
			
		||||
        printf("Usage: %s <configFile>\n", argv[0]);
 | 
			
		||||
        exit(EXIT_SUCCESS);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    readParameter(¶ms, argv[1]);
 | 
			
		||||
    if (rank == 0) {
 | 
			
		||||
        printParameter(¶ms);
 | 
			
		||||
    }
 | 
			
		||||
    initSolver(&solver, ¶ms);
 | 
			
		||||
    /* debugExchange(&solver); */
 | 
			
		||||
    /* exit(EXIT_SUCCESS); */
 | 
			
		||||
    initProgress(solver.te);
 | 
			
		||||
 | 
			
		||||
    double tau = solver.tau;
 | 
			
		||||
    double te  = solver.te;
 | 
			
		||||
    double t   = 0.0;
 | 
			
		||||
 | 
			
		||||
    S = getTimeStamp();
 | 
			
		||||
    while (t <= te) {
 | 
			
		||||
        if (tau > 0.0) {
 | 
			
		||||
            computeTimestep(&solver);
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        setBoundaryConditions(&solver);
 | 
			
		||||
        setSpecialBoundaryCondition(&solver);
 | 
			
		||||
        computeFG(&solver);
 | 
			
		||||
        computeRHS(&solver);
 | 
			
		||||
        solve(&solver);
 | 
			
		||||
        adaptUV(&solver);
 | 
			
		||||
        t += solver.dt;
 | 
			
		||||
 | 
			
		||||
#ifdef VERBOSE
 | 
			
		||||
        if (rank == 0) {
 | 
			
		||||
            printf("TIME %f , TIMESTEP %f\n", t, solver.dt);
 | 
			
		||||
        }
 | 
			
		||||
#else
 | 
			
		||||
        printProgress(t);
 | 
			
		||||
#endif
 | 
			
		||||
    }
 | 
			
		||||
    E = getTimeStamp();
 | 
			
		||||
    stopProgress();
 | 
			
		||||
    if (rank == 0) {
 | 
			
		||||
        printf("Solution took %.2fs\n", E - S);
 | 
			
		||||
    }
 | 
			
		||||
    size_t bytesize = solver.imax * solver.jmax * sizeof(double);
 | 
			
		||||
 | 
			
		||||
    double* ug = allocate(64, bytesize);
 | 
			
		||||
    double* vg = allocate(64, bytesize);
 | 
			
		||||
    double* pg = allocate(64, bytesize);
 | 
			
		||||
 | 
			
		||||
    commCollectResult(&solver.comm,
 | 
			
		||||
        ug,
 | 
			
		||||
        vg,
 | 
			
		||||
        pg,
 | 
			
		||||
        solver.u,
 | 
			
		||||
        solver.v,
 | 
			
		||||
        solver.p,
 | 
			
		||||
        solver.jmax,
 | 
			
		||||
        solver.imax);
 | 
			
		||||
    writeResult(&solver, ug, vg, pg);
 | 
			
		||||
 | 
			
		||||
    MPI_Finalize();
 | 
			
		||||
    return EXIT_SUCCESS;
 | 
			
		||||
}
 | 
			
		||||
							
								
								
									
										108
									
								
								BasicSolver/2D-mpi/src/parameter.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										108
									
								
								BasicSolver/2D-mpi/src/parameter.c
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,108 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
#include <string.h>
 | 
			
		||||
 | 
			
		||||
#include "parameter.h"
 | 
			
		||||
#include "util.h"
 | 
			
		||||
#define MAXLINE 4096
 | 
			
		||||
 | 
			
		||||
/*
 * Put a Parameter record into a fully defined state before a parameter file
 * is read.
 *
 * Geometry and iterative-solver settings receive usable defaults. Every other
 * field is set to zero (name: NULL) so that a key missing from the parameter
 * file yields a defined value instead of indeterminate memory.
 *
 * param: record to initialise; must not be NULL.
 */
void initParameter(Parameter* param)
{
    /* defaults with a meaningful value */
    param->xlength = 1.0;
    param->ylength = 1.0;
    param->imax    = 100;
    param->jmax    = 100;
    param->itermax = 1000;
    param->eps     = 0.0001;
    param->omg     = 1.8;

    /* no sensible default: mark as "unset" with zero / NULL */
    param->re       = 0.0;
    param->tau      = 0.0;
    param->gamma    = 0.0;
    param->te       = 0.0;
    param->dt       = 0.0;
    param->gx       = 0.0;
    param->gy       = 0.0;
    param->name     = NULL;
    param->bcLeft   = 0;
    param->bcRight  = 0;
    param->bcBottom = 0;
    param->bcTop    = 0;
    param->u_init   = 0.0;
    param->v_init   = 0.0;
    param->p_init   = 0.0;
}
 | 
			
		||||
 | 
			
		||||
/*
 * Read "key value" pairs from a parameter file into param.
 *
 * Each line is processed independently: everything from the first '#' on is
 * ignored, the first whitespace-separated token is the key and the second one
 * the value. Lines with fewer than two tokens are skipped. A key is accepted
 * when it starts with the name of a Parameter field (prefix comparison, as in
 * the PARSE_PARAM macro below). Fields whose key does not occur keep the
 * value they had on entry.
 *
 * param:    record to update.
 * filename: path of the parameter file.
 *
 * Terminates the program with EXIT_FAILURE if the file cannot be opened.
 * A string value (name) is duplicated with strdup(); the copy is owned by
 * param.
 */
void readParameter(Parameter* param, const char* filename)
{
    /* Blank, tab, CR and LF all separate tokens, so a value at the end of a
     * line does not carry the line terminator along. */
    static const char* const delimiters = " \t\r\n";

    FILE* fp = fopen(filename, "r");
    char line[MAXLINE];

    if (!fp) {
        fprintf(stderr, "Could not open parameter file: %s\n", filename);
        exit(EXIT_FAILURE);
    }

#define PARSE_PARAM(p, f)                                                                \
    if (strncmp(tok, #p, sizeof(#p) / sizeof(#p[0]) - 1) == 0) {                         \
        param->p = f(val);                                                               \
    }
#define PARSE_STRING(p) PARSE_PARAM(p, strdup)
#define PARSE_INT(p)    PARSE_PARAM(p, atoi)
#define PARSE_REAL(p)   PARSE_PARAM(p, atof)

    /* Loop on the result of fgets(): this ends on end-of-file as well as on a
     * read error, whereas testing feof() alone never ends after an error. */
    while (fgets(line, MAXLINE, fp) != NULL) {
        /* strip a trailing comment */
        line[strcspn(line, "#")] = '\0';

        char* tok = strtok(line, delimiters);
        char* val = strtok(NULL, delimiters);

        if (tok == NULL || val == NULL) {
            continue;
        }

        PARSE_REAL(xlength);
        PARSE_REAL(ylength);
        PARSE_INT(imax);
        PARSE_INT(jmax);
        PARSE_INT(itermax);
        PARSE_REAL(eps);
        PARSE_REAL(omg);
        PARSE_REAL(re);
        PARSE_REAL(tau);
        PARSE_REAL(gamma);
        PARSE_REAL(dt);
        PARSE_REAL(te);
        PARSE_REAL(gx);
        PARSE_REAL(gy);
        PARSE_STRING(name);
        PARSE_INT(bcLeft);
        PARSE_INT(bcRight);
        PARSE_INT(bcBottom);
        PARSE_INT(bcTop);
        PARSE_REAL(u_init);
        PARSE_REAL(v_init);
        PARSE_REAL(p_init);
    }

    /* the helper macros are private to this function */
#undef PARSE_REAL
#undef PARSE_INT
#undef PARSE_STRING
#undef PARSE_PARAM

    fclose(fp);
}
 | 
			
		||||
 | 
			
		||||
/*
 * Write a human-readable summary of the parameter record to stdout:
 * problem name, boundary condition codes, Reynolds number, initial values,
 * geometry, time stepping and iterative-solver settings.
 */
void printParameter(Parameter* param)
{
    const Parameter* cfg = param;

    /* problem setup */
    printf("Parameters for %s\n", cfg->name);
    printf("Boundary conditions Left:%d Right:%d Bottom:%d Top:%d\n",
        cfg->bcLeft,
        cfg->bcRight,
        cfg->bcBottom,
        cfg->bcTop);
    printf("\tReynolds number: %.2f\n", cfg->re);
    printf("\tInit arrays: U:%.2f V:%.2f P:%.2f\n",
        cfg->u_init,
        cfg->v_init,
        cfg->p_init);

    /* geometry */
    printf("Geometry data:\n");
    printf("\tDomain box size (x, y): %.2f, %.2f\n", cfg->xlength, cfg->ylength);
    printf("\tCells (x, y): %d, %d\n", cfg->imax, cfg->jmax);

    /* time stepping */
    printf("Timestep parameters:\n");
    printf("\tDefault stepsize: %.2f, Final time %.2f\n", cfg->dt, cfg->te);
    printf("\tTau factor: %.2f\n", cfg->tau);

    /* iterative solver */
    printf("Iterative solver parameters:\n");
    printf("\tMax iterations: %d\n", cfg->itermax);
    printf("\tepsilon (stopping tolerance) : %f\n", cfg->eps);
    printf("\tgamma (stopping tolerance) : %f\n", cfg->gamma);
    printf("\tomega (SOR relaxation): %f\n", cfg->omg);
}
 | 
			
		||||
							
								
								
									
										26
									
								
								BasicSolver/2D-mpi/src/parameter.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										26
									
								
								BasicSolver/2D-mpi/src/parameter.h
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,26 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef PARAMETER_H_
#define PARAMETER_H_

/*
 * Run-time configuration of a simulation, filled by initParameter() and
 * readParameter(). Field descriptions follow the labels printed by
 * printParameter().
 */
typedef struct {
    double xlength, ylength; /* domain box size in x and y */
    int imax, jmax;          /* number of cells in x and y */
    int itermax;             /* maximum number of iterations of the iterative solver */
    double eps, omg;         /* stopping tolerance, SOR relaxation factor */
    double re, tau, gamma;   /* Reynolds number, tau factor, gamma factor */
    double te, dt;           /* final time, default step size */
    double gx, gy;           /* NOTE(review): presumably body-force components - confirm */
    char* name;              /* problem name; duplicated with strdup() when read */
    int bcLeft, bcRight, bcBottom, bcTop; /* boundary condition code per domain side */
    double u_init, v_init, p_init;        /* initial values of the U, V and P arrays */
} Parameter;

/* Set the default values of a parameter record. */
void initParameter(Parameter* param);
/* Overwrite fields of param with the key/value pairs found in filename. */
void readParameter(Parameter* param, const char* filename);
/* Print a summary of param to stdout. */
void printParameter(Parameter* param);
#endif
 | 
			
		||||
							
								
								
									
										60
									
								
								BasicSolver/2D-mpi/src/progress.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										60
									
								
								BasicSolver/2D-mpi/src/progress.c
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,60 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <math.h>
 | 
			
		||||
#include <mpi.h>
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
#include <string.h>
 | 
			
		||||
 | 
			
		||||
#include "progress.h"
 | 
			
		||||
 | 
			
		||||
/* State of the textual progress bar, shared by the functions in this file. */
static int _rank    = -1;  /* rank in MPI_COMM_WORLD; -1 until initProgress() sets it */
static int _current = 0;   /* number of bar segments currently drawn */
static double _end  = 0.0; /* progress value that corresponds to a full bar */
 | 
			
		||||
 | 
			
		||||
void initProgress(double end)
 | 
			
		||||
{
 | 
			
		||||
    MPI_Comm_rank(MPI_COMM_WORLD, &_rank);
 | 
			
		||||
    _end     = end;
 | 
			
		||||
    _current = 0;
 | 
			
		||||
 | 
			
		||||
    if (_rank == 0) {
 | 
			
		||||
        printf("[          ]");
 | 
			
		||||
        fflush(stdout);
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void printProgress(double current)
 | 
			
		||||
{
 | 
			
		||||
    if (_rank == 0) {
 | 
			
		||||
        int new = (int)rint((current / _end) * 10.0);
 | 
			
		||||
 | 
			
		||||
        if (new > _current) {
 | 
			
		||||
            char progress[11];
 | 
			
		||||
            _current    = new;
 | 
			
		||||
            progress[0] = 0;
 | 
			
		||||
 | 
			
		||||
            for (int i = 0; i < 10; i++) {
 | 
			
		||||
                if (i < _current) {
 | 
			
		||||
                    sprintf(progress + strlen(progress), "#");
 | 
			
		||||
                } else {
 | 
			
		||||
                    sprintf(progress + strlen(progress), " ");
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            printf("\r[%s]", progress);
 | 
			
		||||
        }
 | 
			
		||||
        fflush(stdout);
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void stopProgress()
 | 
			
		||||
{
 | 
			
		||||
    if (_rank == 0) {
 | 
			
		||||
        printf("\n");
 | 
			
		||||
        fflush(stdout);
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
							
								
								
									
										14
									
								
								BasicSolver/2D-mpi/src/progress.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										14
									
								
								BasicSolver/2D-mpi/src/progress.h
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,14 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef PROGRESS_H_
#define PROGRESS_H_

/* Reset the progress bar; end is the progress value of a full bar. */
extern void initProgress(double end);
/* Redraw the bar for the progress value current. */
extern void printProgress(double current);
/* Finish the progress bar line. */
extern void stopProgress(void);

#endif
 | 
			
		||||
							
								
								
									
										546
									
								
								BasicSolver/2D-mpi/src/solver.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										546
									
								
								BasicSolver/2D-mpi/src/solver.c
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,546 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <float.h>
 | 
			
		||||
#include <math.h>
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
#include <string.h>
 | 
			
		||||
 | 
			
		||||
#include "allocate.h"
 | 
			
		||||
#include "comm.h"
 | 
			
		||||
#include "parameter.h"
 | 
			
		||||
#include "solver.h"
 | 
			
		||||
#include "util.h"
 | 
			
		||||
 | 
			
		||||
/*
 * Accessors for the local field arrays. Cell (i, j) is stored row by row with
 * a row length of imaxLocal + 2. Each macro expects a variable imaxLocal and
 * a pointer with the lower-case name of the field (p, f, g, u, v, rhs) to be
 * in scope at the point of use.
 */
#define FIELD_INDEX(i, j) ((j) * (imaxLocal + 2) + (i))

#define P(i, j)   p[FIELD_INDEX(i, j)]
#define F(i, j)   f[FIELD_INDEX(i, j)]
#define G(i, j)   g[FIELD_INDEX(i, j)]
#define U(i, j)   u[FIELD_INDEX(i, j)]
#define V(i, j)   v[FIELD_INDEX(i, j)]
#define RHS(i, j) rhs[FIELD_INDEX(i, j)]
 | 
			
		||||
 | 
			
		||||
/*
 * Print the solver configuration to stdout on the master rank, then let the
 * communication layer print its own configuration via commPrintConfig(),
 * which is called on every rank.
 */
static void printConfig(Solver* s)
{
    if (commIsMaster(&s->comm)) {
        printf("Parameters for #%s#\n", s->problem);
        printf("BC Left:%d Right:%d Bottom:%d Top:%d\n",
            s->bcLeft,
            s->bcRight,
            s->bcBottom,
            s->bcTop);
        printf("\tReynolds number: %.2f\n", s->re);
        printf("\tGx Gy: %.2f %.2f\n", s->gx, s->gy);
        printf("Geometry data:\n");
        printf("\tDomain box size (x, y): %.2f, %.2f\n", s->xlength, s->ylength);
        printf("\tCells (x, y): %d, %d\n", s->imax, s->jmax);
        printf("\tCell size (dx, dy): %f, %f\n", s->dx, s->dy);
        printf("Timestep parameters:\n");
        printf("\tDefault stepsize: %.2f, Final time %.2f\n", s->dt, s->te);
        printf("\tdt bound: %.6f\n", s->dtBound);
        printf("\tTau factor: %.2f\n", s->tau);
        /* heading matches the one printed by printParameter() */
        printf("Iterative solver parameters:\n");
        printf("\tMax iterations: %d\n", s->itermax);
        printf("\tepsilon (stopping tolerance) : %f\n", s->eps);
        printf("\tgamma factor: %f\n", s->gamma);
        printf("\tomega (SOR relaxation): %f\n", s->omega);
    }
    commPrintConfig(&s->comm);
}
 | 
			
		||||
 | 
			
		||||
/*
 * Initialise a solver from a parameter record.
 *
 * Copies the configuration values, derives the cell sizes dx and dy, sets up
 * the communication layer with commInit(), allocates the six local field
 * arrays (u, v, p, rhs, f, g) with (imaxLocal + 2) * (jmaxLocal + 2) entries
 * each, fills them with their initial values and computes dtBound.
 *
 * s:      solver to initialise.
 * params: configuration; params->name is shared with s->problem, not copied.
 */
void initSolver(Solver* s, Parameter* params)
{
    s->problem  = params->name;
    s->bcLeft   = params->bcLeft;
    s->bcRight  = params->bcRight;
    s->bcBottom = params->bcBottom;
    s->bcTop    = params->bcTop;
    s->imax     = params->imax;
    s->jmax     = params->jmax;
    s->xlength  = params->xlength;
    s->ylength  = params->ylength;
    s->dx       = params->xlength / params->imax;
    s->dy       = params->ylength / params->jmax;
    s->eps      = params->eps;
    s->omega    = params->omg;
    s->itermax  = params->itermax;
    s->re       = params->re;
    s->gx       = params->gx;
    s->gy       = params->gy;
    s->dt       = params->dt;
    s->te       = params->te;
    s->tau      = params->tau;
    s->gamma    = params->gamma;

    commInit(&s->comm, s->jmax, s->imax);

    /* allocate arrays */
    int imaxLocal = s->comm.imaxLocal;
    int jmaxLocal = s->comm.jmaxLocal;
    /* widen before multiplying so the element count cannot overflow int */
    size_t size  = (size_t)(imaxLocal + 2) * (size_t)(jmaxLocal + 2);
    size_t bytes = size * sizeof(double);

    s->u   = allocate(64, bytes);
    s->v   = allocate(64, bytes);
    s->p   = allocate(64, bytes);
    s->rhs = allocate(64, bytes);
    s->f   = allocate(64, bytes);
    s->g   = allocate(64, bytes);

    for (size_t i = 0; i < size; i++) {
        s->u[i]   = params->u_init;
        s->v[i]   = params->v_init;
        s->p[i]   = params->p_init;
        s->rhs[i] = 0.0;
        s->f[i]   = 0.0;
        s->g[i]   = 0.0;
    }

    double dx = s->dx;
    double dy = s->dy;

    /* dtBound = Re / 2 * (1/dx^2 + 1/dy^2)^-1 */
    double invSqrSum = 1.0 / (dx * dx) + 1.0 / (dy * dy);
    s->dtBound       = 0.5 * s->re / invSqrSum;
#ifdef VERBOSE
    printConfig(s);
#endif
}
 | 
			
		||||
 | 
			
		||||
/*
 * Fill the right-hand side array for all local interior cells:
 *   rhs(i,j) = ((f(i,j) - f(i-1,j)) / dx + (g(i,j) - g(i,j-1)) / dy) / dt
 *
 * commShift() is called on f and g before the stencil is evaluated.
 */
void computeRHS(Solver* s)
{
    double* f   = s->f;
    double* g   = s->g;
    double* rhs = s->rhs;

    const int imaxLocal = s->comm.imaxLocal;
    const int jmaxLocal = s->comm.jmaxLocal;

    /* reciprocals, so the loop multiplies instead of divides */
    const double idx = 1.0 / s->dx;
    const double idy = 1.0 / s->dy;
    const double idt = 1.0 / s->dt;

    commShift(&s->comm, f, g);

    for (int j = 1; j <= jmaxLocal; j++) {
        for (int i = 1; i <= imaxLocal; i++) {
            RHS(i, j) = ((F(i, j) - F(i - 1, j)) * idx + (G(i, j) - G(i, j - 1)) * idy) *
                        idt;
        }
    }
}
 | 
			
		||||
 | 
			
		||||
/*
 * Iterate on the pressure array until the residual is small enough or the
 * iteration limit is reached.
 *
 * Each iteration sweeps over all local interior cells, updates P in place
 * with the relaxation factor omega, copies the adjacent interior values into
 * the ghost layer on physical boundaries, and reduces the sum of squared
 * residuals over all ranks. The reduced sum divided by imax * jmax is
 * compared against eps * eps.
 *
 * The ghost layers of p are exchanged before the first sweep and again after
 * every sweep, so each sweep (and the code running after solve()) sees the
 * current values of the neighbouring ranks.
 *
 * Returns 0 if the stopping criterion (residual < eps * eps) was met, 1 if the
 * loop ended because itermax was reached.
 */
int solve(Solver* s)
{
    int imax      = s->imax;
    int jmax      = s->jmax;
    int imaxLocal = s->comm.imaxLocal;
    int jmaxLocal = s->comm.jmaxLocal;
    double eps    = s->eps;
    int itermax   = s->itermax;
    double dx2    = s->dx * s->dx;
    double dy2    = s->dy * s->dy;
    double idx2   = 1.0 / dx2;
    double idy2   = 1.0 / dy2;
    double factor = s->omega * 0.5 * (dx2 * dy2) / (dx2 + dy2);
    double* p     = s->p;
    double* rhs   = s->rhs;
    double epssq  = eps * eps;
    /* convert before multiplying: imax * jmax may not fit into an int */
    double ncells = (double)imax * (double)jmax;
    int it        = 0;
    double res    = 1.0;

    commExchange(&s->comm, p);

    while ((res >= epssq) && (it < itermax)) {
        res = 0.0;

        for (int j = 1; j < jmaxLocal + 1; j++) {
            for (int i = 1; i < imaxLocal + 1; i++) {

                double r = RHS(i, j) -
                           ((P(i + 1, j) - 2.0 * P(i, j) + P(i - 1, j)) * idx2 +
                               (P(i, j + 1) - 2.0 * P(i, j) + P(i, j - 1)) * idy2);

                P(i, j) -= (factor * r);
                res += (r * r);
            }
        }

        if (commIsBoundary(&s->comm, BOTTOM)) { // set bottom bc
            for (int i = 1; i < imaxLocal + 1; i++) {
                P(i, 0) = P(i, 1);
            }
        }

        if (commIsBoundary(&s->comm, TOP)) { // set top bc
            for (int i = 1; i < imaxLocal + 1; i++) {
                P(i, jmaxLocal + 1) = P(i, jmaxLocal);
            }
        }

        if (commIsBoundary(&s->comm, LEFT)) { // set left bc
            for (int j = 1; j < jmaxLocal + 1; j++) {
                P(0, j) = P(1, j);
            }
        }

        if (commIsBoundary(&s->comm, RIGHT)) { // set right bc
            for (int j = 1; j < jmaxLocal + 1; j++) {
                P(imaxLocal + 1, j) = P(imaxLocal, j);
            }
        }

        commReduction(&res, SUM);
        res = res / ncells;
#ifdef DEBUG
        if (commIsMaster(&s->comm)) {
            printf("%d Residuum: %e\n", it, res);
        }
#endif
        /* The sweep changed P on every rank: refresh the ghost layers. The
         * loop condition depends only on the reduced residual, so all ranks
         * execute this call the same number of times. */
        commExchange(&s->comm, p);
        it++;
    }

#ifdef VERBOSE
    if (commIsMaster(&s->comm)) {
        printf("Solver took %d iterations to reach %f\n", it, sqrt(res));
    }
#endif
    /* same criterion as the loop condition */
    return (res < epssq) ? 0 : 1;
}
 | 
			
		||||
 | 
			
		||||
/*
 * Largest absolute value in a local field array, reduced over all ranks.
 *
 * s: solver; supplies the local extents and takes part in the reduction.
 * m: array with (imaxLocal + 2) * (jmaxLocal + 2) entries.
 *
 * Returns the result of the MAX reduction of the local maxima; 0.0 if every
 * entry on every rank is zero.
 */
static double maxElement(Solver* s, double* m)
{
    int imaxLocal = s->comm.imaxLocal;
    int jmaxLocal = s->comm.jmaxLocal;
    /* widen before multiplying so the element count cannot overflow int */
    size_t size = (size_t)(imaxLocal + 2) * (size_t)(jmaxLocal + 2);
    /* Absolute values are never negative, so 0 is the neutral start value.
     * DBL_MIN is the smallest positive normalized double, not the most
     * negative one, and would be reported as maximum of an all-zero array. */
    double maxval = 0.0;

    for (size_t i = 0; i < size; i++) {
        maxval = MAX(maxval, fabs(m[i]));
    }

    commReduction(&maxval, MAX);
    return maxval;
}
 | 
			
		||||
 | 
			
		||||
/*
 * Choose the next time step and store it in s->dt.
 *
 * The step starts at s->dtBound and is limited to dx / max|u| and
 * dy / max|v| whenever the respective maximum is positive; the result is
 * scaled by s->tau.
 */
void computeTimestep(Solver* s)
{
    const double umax = maxElement(s, s->u);
    const double vmax = maxElement(s, s->v);
    double step       = s->dtBound;

    if (umax > 0) {
        const double limitX = s->dx / umax;

        if (step > limitX) {
            step = limitX;
        }
    }

    if (vmax > 0) {
        const double limitY = s->dy / vmax;

        if (step > limitY) {
            step = limitY;
        }
    }

    s->dt = step * s->tau;
}
 | 
			
		||||
 | 
			
		||||
/*
 * Apply the configured boundary condition to u and v on every side of the
 * local domain for which commIsBoundary() reports a boundary.
 *
 * Per side the code in s->bcTop / bcBottom / bcRight / bcLeft selects:
 *   NOSLIP  - normal component set to zero, ghost value of the tangential
 *             component set to the negated adjacent interior value
 *   SLIP    - normal component set to zero, ghost value of the tangential
 *             component copied from the adjacent interior value
 *   OUTFLOW - both components copied from the adjacent interior values
 * PERIODIC and any other code leave the arrays untouched.
 */
void setBoundaryConditions(Solver* s)
{
    double* u           = s->u;
    double* v           = s->v;
    const int imaxLocal = s->comm.imaxLocal;
    const int jmaxLocal = s->comm.jmaxLocal;

    if (commIsBoundary(&s->comm, TOP)) {
        const int bc = s->bcTop;

        for (int i = 1; i <= imaxLocal; i++) {
            if (bc == NOSLIP) {
                V(i, jmaxLocal)     = 0.0;
                U(i, jmaxLocal + 1) = -U(i, jmaxLocal);
            } else if (bc == SLIP) {
                V(i, jmaxLocal)     = 0.0;
                U(i, jmaxLocal + 1) = U(i, jmaxLocal);
            } else if (bc == OUTFLOW) {
                U(i, jmaxLocal + 1) = U(i, jmaxLocal);
                V(i, jmaxLocal)     = V(i, jmaxLocal - 1);
            }
        }
    }

    if (commIsBoundary(&s->comm, BOTTOM)) {
        const int bc = s->bcBottom;

        for (int i = 1; i <= imaxLocal; i++) {
            if (bc == NOSLIP) {
                V(i, 0) = 0.0;
                U(i, 0) = -U(i, 1);
            } else if (bc == SLIP) {
                V(i, 0) = 0.0;
                U(i, 0) = U(i, 1);
            } else if (bc == OUTFLOW) {
                U(i, 0) = U(i, 1);
                V(i, 0) = V(i, 1);
            }
        }
    }

    if (commIsBoundary(&s->comm, RIGHT)) {
        const int bc = s->bcRight;

        for (int j = 1; j <= jmaxLocal; j++) {
            if (bc == NOSLIP) {
                U(imaxLocal, j)     = 0.0;
                V(imaxLocal + 1, j) = -V(imaxLocal, j);
            } else if (bc == SLIP) {
                U(imaxLocal, j)     = 0.0;
                V(imaxLocal + 1, j) = V(imaxLocal, j);
            } else if (bc == OUTFLOW) {
                U(imaxLocal, j)     = U(imaxLocal - 1, j);
                V(imaxLocal + 1, j) = V(imaxLocal, j);
            }
        }
    }

    if (commIsBoundary(&s->comm, LEFT)) {
        const int bc = s->bcLeft;

        for (int j = 1; j <= jmaxLocal; j++) {
            if (bc == NOSLIP) {
                U(0, j) = 0.0;
                V(0, j) = -V(1, j);
            } else if (bc == SLIP) {
                U(0, j) = 0.0;
                V(0, j) = V(1, j);
            } else if (bc == OUTFLOW) {
                U(0, j) = U(1, j);
                V(0, j) = V(1, j);
            }
        }
    }
}
 | 
			
		||||
 | 
			
		||||
/*
 * Apply the problem-specific boundary values selected by s->problem.
 *
 *   "dcavity": on the top boundary the ghost row of u is set to
 *              2.0 - u(i, jmaxLocal).
 *   "canal":   on the left boundary u(0, j) is set to a parabola in y,
 *              4 * y * (ylength - y) / ylength^2.
 *
 * Any other problem name leaves the arrays untouched.
 */
void setSpecialBoundaryCondition(Solver* s)
{
    double* u           = s->u;
    const int imaxLocal = s->comm.imaxLocal;
    const int jmaxLocal = s->comm.jmaxLocal;

    if (strcmp(s->problem, "dcavity") == 0) {
        if (!commIsBoundary(&s->comm, TOP)) {
            return;
        }

        for (int i = 1; i <= imaxLocal; i++) {
            U(i, jmaxLocal + 1) = 2.0 - U(i, jmaxLocal);
        }
        return;
    }

    if (strcmp(s->problem, "canal") != 0) {
        return;
    }

    if (!commIsBoundary(&s->comm, LEFT)) {
        return;
    }

    const double ylength = s->ylength;
    const double dy      = s->dy;

    /* Global row offset of this rank, computed from rank and size as for a
     * split of jmax rows over all ranks, the first `rest` ranks holding one
     * extra row.
     * NOTE(review): ys already contains half a cell and the loop adds
     * dy * (j - 0.5) on top - confirm the intended y coordinate. */
    const int rest  = s->jmax % s->comm.size;
    const int yc    = s->comm.rank * (s->jmax / s->comm.size) + MIN(rest, s->comm.rank);
    const double ys = dy * (yc + 0.5);

    for (int j = 1; j <= jmaxLocal; j++) {
        const double y = ys + dy * (j - 0.5);

        U(0, j) = y * (ylength - y) * 4.0 / (ylength * ylength);
    }
}
 | 
			
		||||
 | 
			
		||||
/*
 * Compute the arrays f and g from u and v for all local interior cells and
 * set their values on the physical boundaries.
 *
 * For every interior cell:
 *   f = u + dt * ((d2u/dx2 + d2u/dy2) / Re - d(u^2)/dx - d(uv)/dy + gx)
 *   g = v + dt * ((d2v/dx2 + d2v/dy2) / Re - d(uv)/dx - d(v^2)/dy + gy)
 * where the first derivatives of the products combine a central difference
 * with a term weighted by gamma that uses absolute values of the averaged
 * velocities.
 *
 * u and v are passed to commExchange() before the stencil is evaluated.
 */
void computeFG(Solver* s)
{
    const int imaxLocal = s->comm.imaxLocal;
    const int jmaxLocal = s->comm.jmaxLocal;

    double* u = s->u;
    double* v = s->v;
    double* f = s->f;
    double* g = s->g;

    const double gx        = s->gx;
    const double gy        = s->gy;
    const double gamma     = s->gamma;
    const double dt        = s->dt;
    const double inverseRe = 1.0 / s->re;
    const double inverseDx = 1.0 / s->dx;
    const double inverseDy = 1.0 / s->dy;

    commExchange(&s->comm, u);
    commExchange(&s->comm, v);

    for (int j = 1; j <= jmaxLocal; j++) {
        for (int i = 1; i <= imaxLocal; i++) {
            /* ---- terms entering F ---- */
            const double du2dx =
                inverseDx * 0.25 *
                    ((U(i, j) + U(i + 1, j)) * (U(i, j) + U(i + 1, j)) -
                        (U(i, j) + U(i - 1, j)) * (U(i, j) + U(i - 1, j))) +
                gamma * inverseDx * 0.25 *
                    (fabs(U(i, j) + U(i + 1, j)) * (U(i, j) - U(i + 1, j)) +
                        fabs(U(i, j) + U(i - 1, j)) * (U(i, j) - U(i - 1, j)));

            const double duvdy =
                inverseDy * 0.25 *
                    ((V(i, j) + V(i + 1, j)) * (U(i, j) + U(i, j + 1)) -
                        (V(i, j - 1) + V(i + 1, j - 1)) * (U(i, j) + U(i, j - 1))) +
                gamma * inverseDy * 0.25 *
                    (fabs(V(i, j) + V(i + 1, j)) * (U(i, j) - U(i, j + 1)) +
                        fabs(V(i, j - 1) + V(i + 1, j - 1)) *
                            (U(i, j) - U(i, j - 1)));

            const double du2dx2 =
                inverseDx * inverseDx * (U(i + 1, j) - 2.0 * U(i, j) + U(i - 1, j));
            const double du2dy2 =
                inverseDy * inverseDy * (U(i, j + 1) - 2.0 * U(i, j) + U(i, j - 1));

            F(i, j) = U(i, j) + dt * (inverseRe * (du2dx2 + du2dy2) - du2dx - duvdy + gx);

            /* ---- terms entering G ---- */
            const double duvdx =
                inverseDx * 0.25 *
                    ((U(i, j) + U(i, j + 1)) * (V(i, j) + V(i + 1, j)) -
                        (U(i - 1, j) + U(i - 1, j + 1)) * (V(i, j) + V(i - 1, j))) +
                gamma * inverseDx * 0.25 *
                    (fabs(U(i, j) + U(i, j + 1)) * (V(i, j) - V(i + 1, j)) +
                        fabs(U(i - 1, j) + U(i - 1, j + 1)) *
                            (V(i, j) - V(i - 1, j)));

            const double dv2dy =
                inverseDy * 0.25 *
                    ((V(i, j) + V(i, j + 1)) * (V(i, j) + V(i, j + 1)) -
                        (V(i, j) + V(i, j - 1)) * (V(i, j) + V(i, j - 1))) +
                gamma * inverseDy * 0.25 *
                    (fabs(V(i, j) + V(i, j + 1)) * (V(i, j) - V(i, j + 1)) +
                        fabs(V(i, j) + V(i, j - 1)) * (V(i, j) - V(i, j - 1)));

            const double dv2dx2 =
                inverseDx * inverseDx * (V(i + 1, j) - 2.0 * V(i, j) + V(i - 1, j));
            const double dv2dy2 =
                inverseDy * inverseDy * (V(i, j + 1) - 2.0 * V(i, j) + V(i, j - 1));

            G(i, j) = V(i, j) + dt * (inverseRe * (dv2dx2 + dv2dy2) - duvdx - dv2dy + gy);
        }
    }

    /* On physical boundaries F takes the value of U (left, right) ... */
    if (commIsBoundary(&s->comm, LEFT)) {
        for (int j = 1; j <= jmaxLocal; j++) {
            F(0, j) = U(0, j);
        }
    }

    if (commIsBoundary(&s->comm, RIGHT)) {
        for (int j = 1; j <= jmaxLocal; j++) {
            F(imaxLocal, j) = U(imaxLocal, j);
        }
    }

    /* ... and G the value of V (bottom, top). */
    if (commIsBoundary(&s->comm, BOTTOM)) {
        for (int i = 1; i <= imaxLocal; i++) {
            G(i, 0) = V(i, 0);
        }
    }

    if (commIsBoundary(&s->comm, TOP)) {
        for (int i = 1; i <= imaxLocal; i++) {
            G(i, jmaxLocal) = V(i, jmaxLocal);
        }
    }
}
 | 
			
		||||
 | 
			
		||||
/*
 * Velocity update: for every local interior cell (i in 1..imaxLocal,
 * j in 1..jmaxLocal) sets
 *   U = F - (P(i+1,j) - P(i,j)) * dt/dx
 *   V = G - (P(i,j+1) - P(i,j)) * dt/dy
 *
 * s: solver state; dt, dx, dy, the local extents in s->comm and the p, f, g
 *    arrays are read, the u and v arrays are written.
 */
void adaptUV(Solver* s)
{
    /* The P/U/V/F/G accessor macros are defined outside this function and
     * presumably expand in terms of these locals, so their names are fixed. */
    double* p = s->p;
    double* u = s->u;
    double* v = s->v;
    double* f = s->f;
    double* g = s->g;

    int imaxLocal = s->comm.imaxLocal;
    int jmaxLocal = s->comm.jmaxLocal;

    /* Loop-invariant scaling of the pressure differences. */
    const double dtOverDx = s->dt / s->dx;
    const double dtOverDy = s->dt / s->dy;

    for (int j = 1; j <= jmaxLocal; j++) {
        for (int i = 1; i <= imaxLocal; i++) {
            const double dpdx = P(i + 1, j) - P(i, j);
            U(i, j)           = F(i, j) - dpdx * dtOverDx;

            const double dpdy = P(i, j + 1) - P(i, j);
            V(i, j)           = G(i, j) - dpdy * dtOverDy;
        }
    }
}
 | 
			
		||||
 | 
			
		||||
/*
 * Writes the pressure and velocity fields as text files into the current
 * working directory.
 *
 *   pressure.dat: one "x y p" line per cell; each j-row is followed by an
 *                 empty line.
 *   velocity.dat: one "x y u v len" line per cell, where u is the mean of the
 *                 entries at i and i - 1, v is the mean of the entries at j and
 *                 j - 1, and len is the Euclidean norm of (u, v).
 *
 * s:       supplies the extents imax, jmax and the spacings dx, dy.
 * u, v, p: fields addressed as [j * imax + i]. Cells with i in [1, imax) and
 *          j in [1, jmax) are written; for the velocity averages the entries
 *          at i - 1 and j - 1 are read as well.
 *
 * If an output file cannot be opened, the reason is reported on stderr and the
 * program terminates with EXIT_FAILURE. A failure while closing (flushing) a
 * file is reported on stderr but does not terminate the program.
 */
void writeResult(Solver* s, double* u, double* v, double* p)
{
    static const char pressureFile[] = "pressure.dat";
    static const char velocityFile[] = "velocity.dat";

    const int imax  = s->imax;
    const int jmax  = s->jmax;
    const double dx = s->dx;
    const double dy = s->dy;

    /* ------------------------------ pressure ------------------------------ */
    FILE* fp = fopen(pressureFile, "w");

    if (fp == NULL) {
        /* perror names the file and appends the system error description */
        perror(pressureFile);
        exit(EXIT_FAILURE);
    }

    for (int j = 1; j < jmax; j++) {
        const double y = (j - 0.5) * dy;

        for (int i = 1; i < imax; i++) {
            const double x = (i - 0.5) * dx;
            fprintf(fp, "%.2f %.2f %f\n", x, y, p[j * imax + i]);
        }
        fprintf(fp, "\n");
    }

    /* fclose flushes buffered output; a failure here means data was lost */
    if (fclose(fp) != 0) {
        perror(pressureFile);
    }

    /* ------------------------------ velocity ------------------------------ */
    fp = fopen(velocityFile, "w");

    if (fp == NULL) {
        perror(velocityFile);
        exit(EXIT_FAILURE);
    }

    for (int j = 1; j < jmax; j++) {
        const double y = dy * (j - 0.5);

        for (int i = 1; i < imax; i++) {
            const double x     = dx * (i - 0.5);
            const double vel_u = (u[j * imax + i] + u[j * imax + (i - 1)]) / 2.0;
            const double vel_v = (v[j * imax + i] + v[(j - 1) * imax + i]) / 2.0;
            const double len   = sqrt((vel_u * vel_u) + (vel_v * vel_v));
            fprintf(fp, "%.2f %.2f %f %f %f\n", x, y, vel_u, vel_v, len);
        }
    }

    if (fclose(fp) != 0) {
        perror(velocityFile);
    }
}
 | 
			
		||||
							
								
								
									
										47
									
								
								BasicSolver/2D-mpi/src/solver.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										47
									
								
								BasicSolver/2D-mpi/src/solver.h
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,47 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __SOLVER_H_
 | 
			
		||||
#define __SOLVER_H_
 | 
			
		||||
#include "comm.h"
 | 
			
		||||
#include "parameter.h"
 | 
			
		||||
 | 
			
		||||
/* Boundary condition kinds; the numbering starts at 1. */
enum BC {
    NOSLIP   = 1,
    SLIP     = 2,
    OUTFLOW  = 3,
    PERIODIC = 4
};
 | 
			
		||||
 | 
			
		||||
typedef struct {
 | 
			
		||||
    /* geometry and grid information */
 | 
			
		||||
    double dx, dy;
 | 
			
		||||
    int imax, jmax;
 | 
			
		||||
    double xlength, ylength;
 | 
			
		||||
    /* arrays */
 | 
			
		||||
    double *p, *rhs;
 | 
			
		||||
    double *f, *g;
 | 
			
		||||
    double *u, *v;
 | 
			
		||||
    /* parameters */
 | 
			
		||||
    double eps, omega;
 | 
			
		||||
    double re, tau, gamma;
 | 
			
		||||
    double gx, gy;
 | 
			
		||||
    /* time stepping */
 | 
			
		||||
    int itermax;
 | 
			
		||||
    double dt, te;
 | 
			
		||||
    double dtBound;
 | 
			
		||||
    char* problem;
 | 
			
		||||
    int bcLeft, bcRight, bcBottom, bcTop;
 | 
			
		||||
    /* communication */
 | 
			
		||||
    Comm comm;
 | 
			
		||||
} Solver;
 | 
			
		||||
 | 
			
		||||
/* Set-up of the solver state from the run parameters. */
void initSolver(Solver* s, Parameter* params);

/* Steps operating on the solver state. */
void computeRHS(Solver* s);
int solve(Solver* s);
void normalizePressure(Solver* s);
void computeTimestep(Solver* s);
void setBoundaryConditions(Solver* s);
void setSpecialBoundaryCondition(Solver* s);
void computeFG(Solver* s);

/* Updates u and v from f, g and the pressure differences scaled by dt/dx, dt/dy. */
void adaptUV(Solver* s);

/* Writes the given fields to the text files pressure.dat and velocity.dat. */
void writeResult(Solver* s, double* u, double* v, double* p);
 | 
			
		||||
#endif
 | 
			
		||||
							
								
								
									
										24
									
								
								BasicSolver/2D-mpi/src/timing.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										24
									
								
								BasicSolver/2D-mpi/src/timing.c
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,24 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
#include <time.h>
 | 
			
		||||
 | 
			
		||||
double getTimeStamp()
 | 
			
		||||
{
 | 
			
		||||
    struct timespec ts;
 | 
			
		||||
    clock_gettime(CLOCK_MONOTONIC, &ts);
 | 
			
		||||
    return (double)ts.tv_sec + (double)ts.tv_nsec * 1.e-9;
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
double getTimeResolution()
 | 
			
		||||
{
 | 
			
		||||
    struct timespec ts;
 | 
			
		||||
    clock_getres(CLOCK_MONOTONIC, &ts);
 | 
			
		||||
    return (double)ts.tv_sec + (double)ts.tv_nsec * 1.e-9;
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
/*
 * Forwards to getTimeStamp() under a trailing-underscore symbol name
 * (presumably for callers that expect that spelling, e.g. Fortran --
 * TODO confirm).
 */
double getTimeStamp_()
{
    const double stamp = getTimeStamp();
    return stamp;
}
 | 
			
		||||
							
								
								
									
										14
									
								
								BasicSolver/2D-mpi/src/timing.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										14
									
								
								BasicSolver/2D-mpi/src/timing.h
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,14 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __TIMING_H_
 | 
			
		||||
#define __TIMING_H_
 | 
			
		||||
 | 
			
		||||
/*
 * Timing interface. The declarations are full prototypes, so a call that
 * passes arguments by mistake is rejected by the compiler.
 */

/* Current CLOCK_MONOTONIC reading in seconds. */
extern double getTimeStamp(void);

/* Resolution of CLOCK_MONOTONIC in seconds. */
extern double getTimeResolution(void);

/* Same value as getTimeStamp(), exported under a trailing-underscore name. */
extern double getTimeStamp_(void);
 | 
			
		||||
 | 
			
		||||
#endif // __TIMING_H_
 | 
			
		||||
							
								
								
									
										22
									
								
								BasicSolver/2D-mpi/src/util.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										22
									
								
								BasicSolver/2D-mpi/src/util.h
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,22 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __UTIL_H_
 | 
			
		||||
#define __UTIL_H_
 | 
			
		||||
/* Horizontal rule made of dashes and terminated by a newline, for text output. */
#define HLINE \
    "----------------------------------------------------------------------------\n"
 | 
			
		||||
 | 
			
		||||
/*
 * Smaller of two values; yields the second argument when they compare equal.
 * Each argument may be evaluated twice, so do not pass expressions with side
 * effects. Left untouched if MIN is already defined.
 */
#ifndef MIN
#define MIN(a, b) ((a) < (b) ? (a) : (b))
#endif
 | 
			
		||||
/*
 * Larger of two values; yields the second argument when they compare equal.
 * Each argument may be evaluated twice, so do not pass expressions with side
 * effects. Left untouched if MAX is already defined.
 */
#ifndef MAX
#define MAX(a, b) ((a) > (b) ? (a) : (b))
#endif
 | 
			
		||||
/*
 * Absolute value: the argument itself when it is >= 0, its negation otherwise.
 * The argument may be evaluated twice, so do not pass expressions with side
 * effects. Left untouched if ABS is already defined.
 */
#ifndef ABS
#define ABS(v) ((v) >= 0 ? (v) : -(v))
#endif
 | 
			
		||||
 | 
			
		||||
#endif // __UTIL_H_
 | 
			
		||||
		Reference in New Issue
	
	Block a user