forked from moebiusband/NuSiF-Solver
		
	Merge 3D mpi versions
This commit is contained in:
		@@ -1,71 +0,0 @@
 | 
			
		||||
#=======================================================================================
 | 
			
		||||
# Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
# All rights reserved.
 | 
			
		||||
# Use of this source code is governed by a MIT-style
 | 
			
		||||
# license that can be found in the LICENSE file.
 | 
			
		||||
#=======================================================================================
 | 
			
		||||
 | 
			
		||||
#CONFIGURE BUILD SYSTEM
 | 
			
		||||
TARGET	   = exe-$(TAG)
 | 
			
		||||
BUILD_DIR  = ./$(TAG)
 | 
			
		||||
SRC_DIR    = ./src
 | 
			
		||||
MAKE_DIR   = ./
 | 
			
		||||
Q         ?= @
 | 
			
		||||
 | 
			
		||||
#DO NOT EDIT BELOW
 | 
			
		||||
include $(MAKE_DIR)/config.mk
 | 
			
		||||
include $(MAKE_DIR)/include_$(TAG).mk
 | 
			
		||||
INCLUDES  += -I$(SRC_DIR) -I$(BUILD_DIR)
 | 
			
		||||
 | 
			
		||||
VPATH     = $(SRC_DIR)
 | 
			
		||||
SRC       = $(wildcard $(SRC_DIR)/*.c)
 | 
			
		||||
ASM       = $(patsubst $(SRC_DIR)/%.c, $(BUILD_DIR)/%.s, $(SRC))
 | 
			
		||||
OBJ       = $(patsubst $(SRC_DIR)/%.c, $(BUILD_DIR)/%.o, $(SRC))
 | 
			
		||||
SOURCES   = $(SRC) $(wildcard $(SRC_DIR)/*.h)
 | 
			
		||||
CPPFLAGS := $(CPPFLAGS) $(DEFINES) $(OPTIONS) $(INCLUDES)
 | 
			
		||||
 | 
			
		||||
${TARGET}: $(BUILD_DIR) $(OBJ)
 | 
			
		||||
	$(info ===>  LINKING  $(TARGET))
 | 
			
		||||
	$(Q)${LINKER} ${LFLAGS} -o $(TARGET) $(OBJ) $(LIBS)
 | 
			
		||||
 | 
			
		||||
$(BUILD_DIR)/%.o:  %.c $(MAKE_DIR)/include_$(TAG).mk $(MAKE_DIR)/config.mk
 | 
			
		||||
	$(info ===>  COMPILE  $@)
 | 
			
		||||
	$(CC) -c $(CPPFLAGS) $(CFLAGS) $< -o $@
 | 
			
		||||
	$(Q)$(GCC) $(CPPFLAGS) -MT $(@:.d=.o) -MM  $< > $(BUILD_DIR)/$*.d
 | 
			
		||||
 | 
			
		||||
$(BUILD_DIR)/%.s:  %.c
 | 
			
		||||
	$(info ===>  GENERATE ASM  $@)
 | 
			
		||||
	$(CC) -S $(CPPFLAGS) $(CFLAGS) $< -o $@
 | 
			
		||||
 | 
			
		||||
.PHONY: clean distclean tags info asm format
 | 
			
		||||
 | 
			
		||||
clean:
 | 
			
		||||
	$(info ===>  CLEAN)
 | 
			
		||||
	@rm -rf $(BUILD_DIR)
 | 
			
		||||
	@rm -f tags
 | 
			
		||||
 | 
			
		||||
distclean: clean
 | 
			
		||||
	$(info ===>  DIST CLEAN)
 | 
			
		||||
	@rm -f $(TARGET)
 | 
			
		||||
 | 
			
		||||
info:
 | 
			
		||||
	$(info $(CFLAGS))
 | 
			
		||||
	$(Q)$(CC) $(VERSION)
 | 
			
		||||
 | 
			
		||||
asm:  $(BUILD_DIR) $(ASM)
 | 
			
		||||
 | 
			
		||||
tags:
 | 
			
		||||
	$(info ===>  GENERATE TAGS)
 | 
			
		||||
	$(Q)ctags -R
 | 
			
		||||
 | 
			
		||||
format:
 | 
			
		||||
	@for src in $(SOURCES) ; do \
 | 
			
		||||
		echo "Formatting $$src" ; \
 | 
			
		||||
		clang-format -i $$src ; \
 | 
			
		||||
	done
 | 
			
		||||
	@echo "Done"
 | 
			
		||||
 | 
			
		||||
$(BUILD_DIR):
 | 
			
		||||
	@mkdir $(BUILD_DIR)
 | 
			
		||||
 | 
			
		||||
-include $(OBJ:.o=.d)
 | 
			
		||||
@@ -1,78 +0,0 @@
 | 
			
		||||
# C source skeleton
 | 
			
		||||
 | 
			
		||||
## Build
 | 
			
		||||
 | 
			
		||||
1. Configure the toolchain and additional options in `config.mk`:
 | 
			
		||||
```
 | 
			
		||||
# Supported: GCC, CLANG, ICC
 | 
			
		||||
TAG ?= GCC
 | 
			
		||||
ENABLE_OPENMP ?= false
 | 
			
		||||
 | 
			
		||||
OPTIONS +=  -DARRAY_ALIGNMENT=64
 | 
			
		||||
#OPTIONS +=  -DVERBOSE
 | 
			
		||||
#OPTIONS +=  -DVERBOSE_AFFINITY
 | 
			
		||||
#OPTIONS +=  -DVERBOSE_DATASIZE
 | 
			
		||||
#OPTIONS +=  -DVERBOSE_TIMER
 | 
			
		||||
```
 | 
			
		||||
 | 
			
		||||
The verbosity options enable detailed output about solver, affinity settings, allocation sizes and timer resolution.
 | 
			
		||||
For debugging you may want to set the VERBOSE option:
 | 
			
		||||
```
 | 
			
		||||
# Supported: GCC, CLANG, ICC
 | 
			
		||||
TAG ?= GCC
 | 
			
		||||
ENABLE_OPENMP ?= false
 | 
			
		||||
 | 
			
		||||
OPTIONS +=  -DARRAY_ALIGNMENT=64
 | 
			
		||||
OPTIONS +=  -DVERBOSE
 | 
			
		||||
#OPTIONS +=  -DVERBOSE_AFFINITY
 | 
			
		||||
#OPTIONS +=  -DVERBOSE_DATASIZE
 | 
			
		||||
#OPTIONS +=  -DVERBOSE_TIMER
 | 
			
		||||
`
 | 
			
		||||
 | 
			
		||||
2. Build with:
 | 
			
		||||
```
 | 
			
		||||
make
 | 
			
		||||
```
 | 
			
		||||
 | 
			
		||||
You can build multiple toolchains in the same directory, but notice that the Makefile is only acting on the one currently set.
 | 
			
		||||
Intermediate build results are located in the `<TOOLCHAIN>` directory.
 | 
			
		||||
 | 
			
		||||
To output the executed commands use:
 | 
			
		||||
```
 | 
			
		||||
make Q=
 | 
			
		||||
```
 | 
			
		||||
 | 
			
		||||
3. Clean up with:
 | 
			
		||||
```
 | 
			
		||||
make clean
 | 
			
		||||
```
 | 
			
		||||
to clean intermediate build results.
 | 
			
		||||
 | 
			
		||||
```
 | 
			
		||||
make distclean
 | 
			
		||||
```
 | 
			
		||||
to clean intermediate build results and binary.
 | 
			
		||||
 | 
			
		||||
4. (Optional) Generate assembler:
 | 
			
		||||
```
 | 
			
		||||
make asm
 | 
			
		||||
```
 | 
			
		||||
The assembler files will also be located in the `<TOOLCHAIN>` directory.
 | 
			
		||||
 | 
			
		||||
## Usage
 | 
			
		||||
 | 
			
		||||
You have to provide a parameter file describing the problem you want to solve:
 | 
			
		||||
```
 | 
			
		||||
./exe-CLANG  dcavity.par
 | 
			
		||||
```
 | 
			
		||||
 | 
			
		||||
Examples are given in in dcavity (a lid driven cavity test case) and canal (simulating a empty canal).
 | 
			
		||||
 | 
			
		||||
You can plot the resulting velocity and pressure fields using gnuplot:
 | 
			
		||||
```
 | 
			
		||||
gnuplot vector.plot
 | 
			
		||||
```
 | 
			
		||||
and for the pressure:
 | 
			
		||||
```
 | 
			
		||||
gnuplot surface.plot
 | 
			
		||||
```
 | 
			
		||||
@@ -1,52 +0,0 @@
 | 
			
		||||
#==============================================================================
 | 
			
		||||
#                            Laminar Canal Flow
 | 
			
		||||
#==============================================================================
 | 
			
		||||
 | 
			
		||||
# Problem specific Data:
 | 
			
		||||
# ---------------------
 | 
			
		||||
 | 
			
		||||
name canal             # name of flow setup
 | 
			
		||||
 | 
			
		||||
bcLeft    3			#  flags for boundary conditions
 | 
			
		||||
bcRight   3			#  1 = no-slip      3 = outflow
 | 
			
		||||
bcBottom  1			#  2 = free-slip    4 = periodic
 | 
			
		||||
bcTop     1			#
 | 
			
		||||
bcFront   1			#
 | 
			
		||||
bcBack    1			#
 | 
			
		||||
 | 
			
		||||
gx     0.0      # Body forces (e.g. gravity)
 | 
			
		||||
gy     0.0      #
 | 
			
		||||
gz     0.0      #
 | 
			
		||||
 | 
			
		||||
re            100.0	   # Reynolds number
 | 
			
		||||
 | 
			
		||||
u_init        1.0      # initial value for velocity in x-direction
 | 
			
		||||
v_init        0.0      # initial value for velocity in y-direction
 | 
			
		||||
w_init        0.0      # initial value for velocity in z-direction
 | 
			
		||||
p_init        0.0      # initial value for pressure
 | 
			
		||||
 | 
			
		||||
# Geometry Data:
 | 
			
		||||
# -------------
 | 
			
		||||
 | 
			
		||||
xlength       30.0     # domain size in x-direction
 | 
			
		||||
ylength       4.0	   # domain size in y-direction
 | 
			
		||||
zlength       4.0	   # domain size in z-direction
 | 
			
		||||
imax          200      # number of interior cells in x-direction
 | 
			
		||||
jmax          50	   # number of interior cells in y-direction
 | 
			
		||||
kmax          50	   # number of interior cells in z-direction
 | 
			
		||||
 | 
			
		||||
# Time Data:
 | 
			
		||||
# ---------
 | 
			
		||||
 | 
			
		||||
te       100.0   # final time
 | 
			
		||||
dt       0.02    # time stepsize
 | 
			
		||||
tau      0.5     # safety factor for time stepsize control (<0 constant delt)
 | 
			
		||||
 | 
			
		||||
# Pressure Iteration Data:
 | 
			
		||||
# -----------------------
 | 
			
		||||
 | 
			
		||||
itermax       500       # maximal number of pressure iteration in one time step
 | 
			
		||||
eps           0.0001   # stopping tolerance for pressure iteration
 | 
			
		||||
omg           1.3       # relaxation parameter for SOR iteration
 | 
			
		||||
gamma         0.9       # upwind differencing factor gamma
 | 
			
		||||
#===============================================================================
 | 
			
		||||
@@ -1,13 +0,0 @@
 | 
			
		||||
# Supported: GCC, CLANG, ICC
 | 
			
		||||
TAG ?= CLANG
 | 
			
		||||
ENABLE_MPI ?= true
 | 
			
		||||
ENABLE_OPENMP ?= false
 | 
			
		||||
 | 
			
		||||
#Feature options
 | 
			
		||||
OPTIONS +=  -DARRAY_ALIGNMENT=64
 | 
			
		||||
OPTIONS +=  -DVERBOSE
 | 
			
		||||
#OPTIONS +=  -DDEBUG
 | 
			
		||||
#OPTIONS +=  -DBOUNDCHECK
 | 
			
		||||
#OPTIONS +=  -DVERBOSE_AFFINITY
 | 
			
		||||
#OPTIONS +=  -DVERBOSE_DATASIZE
 | 
			
		||||
#OPTIONS +=  -DVERBOSE_TIMER
 | 
			
		||||
@@ -1,52 +0,0 @@
 | 
			
		||||
#==============================================================================
 | 
			
		||||
#                              Driven Cavity
 | 
			
		||||
#==============================================================================
 | 
			
		||||
 | 
			
		||||
# Problem specific Data:
 | 
			
		||||
# ---------------------
 | 
			
		||||
 | 
			
		||||
name dcavity        # name of flow setup
 | 
			
		||||
 | 
			
		||||
bcLeft    1			#  flags for boundary conditions
 | 
			
		||||
bcRight   1			#  1 = no-slip      3 = outflow
 | 
			
		||||
bcBottom  1			#  2 = free-slip    4 = periodic
 | 
			
		||||
bcTop     1			#
 | 
			
		||||
bcFront   1			#
 | 
			
		||||
bcBack    1			#
 | 
			
		||||
 | 
			
		||||
gx    0.0			# Body forces (e.g. gravity)
 | 
			
		||||
gy    0.0			#
 | 
			
		||||
gz    0.0			#
 | 
			
		||||
 | 
			
		||||
re    1000.0		    # Reynolds number
 | 
			
		||||
 | 
			
		||||
u_init    0.0		# initial value for velocity in x-direction
 | 
			
		||||
v_init    0.0		# initial value for velocity in y-direction
 | 
			
		||||
w_init    0.0		# initial value for velocity in z-direction
 | 
			
		||||
p_init    0.0		# initial value for pressure
 | 
			
		||||
 | 
			
		||||
# Geometry Data:
 | 
			
		||||
# -------------
 | 
			
		||||
 | 
			
		||||
xlength    1.0		# domain size in x-direction
 | 
			
		||||
ylength    1.0		# domain size in y-direction
 | 
			
		||||
zlength    1.0		# domain size in z-direction
 | 
			
		||||
imax       128		# number of interior cells in x-direction
 | 
			
		||||
jmax       128		# number of interior cells in y-direction
 | 
			
		||||
kmax       128		# number of interior cells in z-direction
 | 
			
		||||
 | 
			
		||||
# Time Data:
 | 
			
		||||
# ---------
 | 
			
		||||
 | 
			
		||||
te       10.0		# final time
 | 
			
		||||
dt       0.02	    # time stepsize
 | 
			
		||||
tau      0.5		# safety factor for time stepsize control (<0 constant delt)
 | 
			
		||||
 | 
			
		||||
# Pressure Iteration Data:
 | 
			
		||||
# -----------------------
 | 
			
		||||
 | 
			
		||||
itermax  1000		# maximal number of pressure iteration in one time step
 | 
			
		||||
eps      0.001		# stopping tolerance for pressure iteration
 | 
			
		||||
omg      1.8		# relaxation parameter for SOR iteration
 | 
			
		||||
gamma    0.9		# upwind differencing factor gamma
 | 
			
		||||
#===============================================================================
 | 
			
		||||
@@ -1,21 +0,0 @@
 | 
			
		||||
ifeq ($(ENABLE_MPI),true)
 | 
			
		||||
CC   = mpicc
 | 
			
		||||
DEFINES  = -D_MPI
 | 
			
		||||
else
 | 
			
		||||
CC   = cc
 | 
			
		||||
endif
 | 
			
		||||
 | 
			
		||||
GCC  = cc
 | 
			
		||||
LINKER = $(CC)
 | 
			
		||||
 | 
			
		||||
ifeq ($(ENABLE_OPENMP),true)
 | 
			
		||||
OPENMP   = -fopenmp
 | 
			
		||||
#OPENMP   = -Xpreprocessor -fopenmp #required on Macos with homebrew libomp
 | 
			
		||||
LIBS     = # -lomp
 | 
			
		||||
endif
 | 
			
		||||
 | 
			
		||||
VERSION  = --version
 | 
			
		||||
CFLAGS   = -Ofast -std=c17
 | 
			
		||||
LFLAGS   = $(OPENMP) -lm
 | 
			
		||||
DEFINES  += -D_GNU_SOURCE# -DDEBUG
 | 
			
		||||
INCLUDES =
 | 
			
		||||
@@ -1,14 +0,0 @@
 | 
			
		||||
CC   = gcc
 | 
			
		||||
GCC  = gcc
 | 
			
		||||
LINKER = $(CC)
 | 
			
		||||
 | 
			
		||||
ifeq ($(ENABLE_OPENMP),true)
 | 
			
		||||
OPENMP   = -fopenmp
 | 
			
		||||
endif
 | 
			
		||||
 | 
			
		||||
VERSION  = --version
 | 
			
		||||
CFLAGS   = -Ofast -ffreestanding -std=c99 $(OPENMP)
 | 
			
		||||
LFLAGS   = $(OPENMP)
 | 
			
		||||
DEFINES  = -D_GNU_SOURCE
 | 
			
		||||
INCLUDES =
 | 
			
		||||
LIBS     =
 | 
			
		||||
@@ -1,14 +0,0 @@
 | 
			
		||||
CC   = icc
 | 
			
		||||
GCC  = gcc
 | 
			
		||||
LINKER = $(CC)
 | 
			
		||||
 | 
			
		||||
ifeq ($(ENABLE_OPENMP),true)
 | 
			
		||||
OPENMP   = -qopenmp
 | 
			
		||||
endif
 | 
			
		||||
 | 
			
		||||
VERSION  = --version
 | 
			
		||||
CFLAGS   =  -O3 -xHost -qopt-zmm-usage=high -std=c99 $(OPENMP)
 | 
			
		||||
LFLAGS   = $(OPENMP)
 | 
			
		||||
DEFINES  = -D_GNU_SOURCE
 | 
			
		||||
INCLUDES =
 | 
			
		||||
LIBS     =
 | 
			
		||||
@@ -1,38 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <errno.h>
 | 
			
		||||
#include <stddef.h>
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
 | 
			
		||||
#include "allocate.h"
 | 
			
		||||
 | 
			
		||||
void* allocate(size_t alignment, size_t bytesize)
 | 
			
		||||
{
 | 
			
		||||
    int errorCode;
 | 
			
		||||
    void* ptr;
 | 
			
		||||
 | 
			
		||||
    errorCode = posix_memalign(&ptr, alignment, bytesize);
 | 
			
		||||
 | 
			
		||||
    if (errorCode) {
 | 
			
		||||
        if (errorCode == EINVAL) {
 | 
			
		||||
            fprintf(stderr, "Error: Alignment parameter is not a power of two\n");
 | 
			
		||||
            exit(EXIT_FAILURE);
 | 
			
		||||
        }
 | 
			
		||||
        if (errorCode == ENOMEM) {
 | 
			
		||||
            fprintf(stderr, "Error: Insufficient memory to fulfill the request\n");
 | 
			
		||||
            exit(EXIT_FAILURE);
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    if (ptr == NULL) {
 | 
			
		||||
        fprintf(stderr, "Error: posix_memalign failed!\n");
 | 
			
		||||
        exit(EXIT_FAILURE);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    return ptr;
 | 
			
		||||
}
 | 
			
		||||
@@ -1,13 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __ALLOCATE_H_
 | 
			
		||||
#define __ALLOCATE_H_
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
 | 
			
		||||
extern void* allocate(size_t alignment, size_t bytesize);
 | 
			
		||||
 | 
			
		||||
#endif
 | 
			
		||||
@@ -1,359 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#if defined(_MPI)
 | 
			
		||||
#include <mpi.h>
 | 
			
		||||
#endif
 | 
			
		||||
#include <stddef.h>
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
 | 
			
		||||
#include "allocate.h"
 | 
			
		||||
#include "comm.h"
 | 
			
		||||
 | 
			
		||||
#if defined(_MPI)
 | 
			
		||||
// subroutines local to this module
 | 
			
		||||
static int sizeOfRank(int rank, int size, int N)
 | 
			
		||||
{
 | 
			
		||||
    return N / size + ((N % size > rank) ? 1 : 0);
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
static void setupCommunication(Comm* c, Direction direction, int layer)
 | 
			
		||||
{
 | 
			
		||||
    int imaxLocal = c->imaxLocal;
 | 
			
		||||
    int jmaxLocal = c->jmaxLocal;
 | 
			
		||||
    int kmaxLocal = c->kmaxLocal;
 | 
			
		||||
 | 
			
		||||
    size_t dblsize = sizeof(double);
 | 
			
		||||
    int sizes[NDIMS];
 | 
			
		||||
    int subSizes[NDIMS];
 | 
			
		||||
    int starts[NDIMS];
 | 
			
		||||
    int offset = 0;
 | 
			
		||||
 | 
			
		||||
    sizes[IDIM] = imaxLocal + 2;
 | 
			
		||||
    sizes[JDIM] = jmaxLocal + 2;
 | 
			
		||||
    sizes[KDIM] = kmaxLocal + 2;
 | 
			
		||||
 | 
			
		||||
    if (layer == HALO) {
 | 
			
		||||
        offset = 1;
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    switch (direction) {
 | 
			
		||||
    case LEFT:
 | 
			
		||||
        subSizes[IDIM] = 1;
 | 
			
		||||
        subSizes[JDIM] = jmaxLocal;
 | 
			
		||||
        subSizes[KDIM] = kmaxLocal;
 | 
			
		||||
        starts[IDIM]   = 1 - offset;
 | 
			
		||||
        starts[JDIM]   = 1;
 | 
			
		||||
        starts[KDIM]   = 1;
 | 
			
		||||
        break;
 | 
			
		||||
    case RIGHT:
 | 
			
		||||
        subSizes[IDIM] = 1;
 | 
			
		||||
        subSizes[JDIM] = jmaxLocal;
 | 
			
		||||
        subSizes[KDIM] = kmaxLocal;
 | 
			
		||||
        starts[IDIM]   = imaxLocal + offset;
 | 
			
		||||
        starts[JDIM]   = 1;
 | 
			
		||||
        starts[KDIM]   = 1;
 | 
			
		||||
        break;
 | 
			
		||||
    case BOTTOM:
 | 
			
		||||
        subSizes[IDIM] = imaxLocal;
 | 
			
		||||
        subSizes[JDIM] = 1;
 | 
			
		||||
        subSizes[KDIM] = kmaxLocal;
 | 
			
		||||
        starts[IDIM]   = 1;
 | 
			
		||||
        starts[JDIM]   = 1 - offset;
 | 
			
		||||
        starts[KDIM]   = 1;
 | 
			
		||||
        break;
 | 
			
		||||
    case TOP:
 | 
			
		||||
        subSizes[IDIM] = imaxLocal;
 | 
			
		||||
        subSizes[JDIM] = 1;
 | 
			
		||||
        subSizes[KDIM] = kmaxLocal;
 | 
			
		||||
        starts[IDIM]   = 1;
 | 
			
		||||
        starts[JDIM]   = jmaxLocal + offset;
 | 
			
		||||
        starts[KDIM]   = 1;
 | 
			
		||||
        break;
 | 
			
		||||
    case FRONT:
 | 
			
		||||
        subSizes[IDIM] = imaxLocal;
 | 
			
		||||
        subSizes[JDIM] = jmaxLocal;
 | 
			
		||||
        subSizes[KDIM] = 1;
 | 
			
		||||
        starts[IDIM]   = 1;
 | 
			
		||||
        starts[JDIM]   = 1;
 | 
			
		||||
        starts[KDIM]   = 1 - offset;
 | 
			
		||||
        break;
 | 
			
		||||
    case BACK:
 | 
			
		||||
        subSizes[IDIM] = imaxLocal;
 | 
			
		||||
        subSizes[JDIM] = jmaxLocal;
 | 
			
		||||
        subSizes[KDIM] = 1;
 | 
			
		||||
        starts[IDIM]   = 1;
 | 
			
		||||
        starts[JDIM]   = 1;
 | 
			
		||||
        starts[KDIM]   = kmaxLocal + offset;
 | 
			
		||||
        break;
 | 
			
		||||
    case NDIRS:
 | 
			
		||||
        printf("ERROR!\n");
 | 
			
		||||
        break;
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    if (layer == HALO) {
 | 
			
		||||
        MPI_Type_create_subarray(NDIMS,
 | 
			
		||||
            sizes,
 | 
			
		||||
            subSizes,
 | 
			
		||||
            starts,
 | 
			
		||||
            MPI_ORDER_C,
 | 
			
		||||
            MPI_DOUBLE,
 | 
			
		||||
            &c->rbufferTypes[direction]);
 | 
			
		||||
        MPI_Type_commit(&c->rbufferTypes[direction]);
 | 
			
		||||
    } else if (layer == BULK) {
 | 
			
		||||
        MPI_Type_create_subarray(NDIMS,
 | 
			
		||||
            sizes,
 | 
			
		||||
            subSizes,
 | 
			
		||||
            starts,
 | 
			
		||||
            MPI_ORDER_C,
 | 
			
		||||
            MPI_DOUBLE,
 | 
			
		||||
            &c->sbufferTypes[direction]);
 | 
			
		||||
        MPI_Type_commit(&c->sbufferTypes[direction]);
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
static int sum(int* sizes, int position)
 | 
			
		||||
{
 | 
			
		||||
    int sum = 0;
 | 
			
		||||
 | 
			
		||||
    for (int i = 0; i < position; i++) {
 | 
			
		||||
        sum += sizes[i];
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    return sum;
 | 
			
		||||
}
 | 
			
		||||
#endif
 | 
			
		||||
 | 
			
		||||
// exported subroutines
 | 
			
		||||
void commReduction(double* v, int op)
 | 
			
		||||
{
 | 
			
		||||
#if defined(_MPI)
 | 
			
		||||
    if (op == MAX) {
 | 
			
		||||
        MPI_Allreduce(MPI_IN_PLACE, v, 1, MPI_DOUBLE, MPI_MAX, MPI_COMM_WORLD);
 | 
			
		||||
    } else if (op == SUM) {
 | 
			
		||||
        MPI_Allreduce(MPI_IN_PLACE, v, 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
 | 
			
		||||
    }
 | 
			
		||||
#endif
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
int commIsBoundary(Comm* c, Direction direction)
 | 
			
		||||
{
 | 
			
		||||
#if defined(_MPI)
 | 
			
		||||
    switch (direction) {
 | 
			
		||||
    case LEFT:
 | 
			
		||||
        return c->coords[ICORD] == 0;
 | 
			
		||||
        break;
 | 
			
		||||
    case RIGHT:
 | 
			
		||||
        return c->coords[ICORD] == (c->dims[ICORD] - 1);
 | 
			
		||||
        break;
 | 
			
		||||
    case BOTTOM:
 | 
			
		||||
        return c->coords[JCORD] == 0;
 | 
			
		||||
        break;
 | 
			
		||||
    case TOP:
 | 
			
		||||
        return c->coords[JCORD] == (c->dims[JCORD] - 1);
 | 
			
		||||
        break;
 | 
			
		||||
    case FRONT:
 | 
			
		||||
        return c->coords[KCORD] == 0;
 | 
			
		||||
        break;
 | 
			
		||||
    case BACK:
 | 
			
		||||
        return c->coords[KCORD] == (c->dims[KCORD] - 1);
 | 
			
		||||
        break;
 | 
			
		||||
    case NDIRS:
 | 
			
		||||
        printf("ERROR!\n");
 | 
			
		||||
        break;
 | 
			
		||||
    }
 | 
			
		||||
#endif
 | 
			
		||||
 | 
			
		||||
    return 1;
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void commExchange(Comm* c, double* grid)
 | 
			
		||||
{
 | 
			
		||||
#if defined(_MPI)
 | 
			
		||||
    int counts[6]      = { 1, 1, 1, 1, 1, 1 };
 | 
			
		||||
    MPI_Aint displs[6] = { 0, 0, 0, 0, 0, 0 };
 | 
			
		||||
 | 
			
		||||
    MPI_Neighbor_alltoallw(grid,
 | 
			
		||||
        counts,
 | 
			
		||||
        displs,
 | 
			
		||||
        c->sbufferTypes,
 | 
			
		||||
        grid,
 | 
			
		||||
        counts,
 | 
			
		||||
        displs,
 | 
			
		||||
        c->rbufferTypes,
 | 
			
		||||
        c->comm);
 | 
			
		||||
#endif
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void commShift(Comm* c, double* f, double* g, double* h)
 | 
			
		||||
{
 | 
			
		||||
#if defined(_MPI)
 | 
			
		||||
    MPI_Request requests[6] = { MPI_REQUEST_NULL,
 | 
			
		||||
        MPI_REQUEST_NULL,
 | 
			
		||||
        MPI_REQUEST_NULL,
 | 
			
		||||
        MPI_REQUEST_NULL,
 | 
			
		||||
        MPI_REQUEST_NULL,
 | 
			
		||||
        MPI_REQUEST_NULL };
 | 
			
		||||
 | 
			
		||||
    /* shift G */
 | 
			
		||||
    /* receive ghost cells from bottom neighbor */
 | 
			
		||||
    MPI_Irecv(g,
 | 
			
		||||
        1,
 | 
			
		||||
        c->rbufferTypes[BOTTOM],
 | 
			
		||||
        c->neighbours[BOTTOM],
 | 
			
		||||
        0,
 | 
			
		||||
        c->comm,
 | 
			
		||||
        &requests[0]);
 | 
			
		||||
 | 
			
		||||
    /* send ghost cells to top neighbor */
 | 
			
		||||
    MPI_Isend(g, 1, c->sbufferTypes[TOP], c->neighbours[TOP], 0, c->comm, &requests[1]);
 | 
			
		||||
 | 
			
		||||
    /* shift F */
 | 
			
		||||
    /* receive ghost cells from left neighbor */
 | 
			
		||||
    MPI_Irecv(f, 1, c->rbufferTypes[LEFT], c->neighbours[LEFT], 1, c->comm, &requests[2]);
 | 
			
		||||
 | 
			
		||||
    /* send ghost cells to right neighbor */
 | 
			
		||||
    MPI_Isend(f,
 | 
			
		||||
        1,
 | 
			
		||||
        c->sbufferTypes[RIGHT],
 | 
			
		||||
        c->neighbours[RIGHT],
 | 
			
		||||
        1,
 | 
			
		||||
        c->comm,
 | 
			
		||||
        &requests[3]);
 | 
			
		||||
 | 
			
		||||
    /* shift H */
 | 
			
		||||
    /* receive ghost cells from front neighbor */
 | 
			
		||||
    MPI_Irecv(h,
 | 
			
		||||
        1,
 | 
			
		||||
        c->rbufferTypes[FRONT],
 | 
			
		||||
        c->neighbours[FRONT],
 | 
			
		||||
        2,
 | 
			
		||||
        c->comm,
 | 
			
		||||
        &requests[4]);
 | 
			
		||||
 | 
			
		||||
    /* send ghost cells to back neighbor */
 | 
			
		||||
    MPI_Isend(h, 1, c->sbufferTypes[BACK], c->neighbours[BACK], 2, c->comm, &requests[5]);
 | 
			
		||||
 | 
			
		||||
    MPI_Waitall(6, requests, MPI_STATUSES_IGNORE);
 | 
			
		||||
#endif
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void commGetOffsets(Comm* c, int offsets[], int kmax, int jmax, int imax)
 | 
			
		||||
{
 | 
			
		||||
#if defined(_MPI)
 | 
			
		||||
    int sum = 0;
 | 
			
		||||
 | 
			
		||||
    for (int i = 0; i < c->coords[ICORD]; i++) {
 | 
			
		||||
        sum += sizeOfRank(i, c->dims[ICORD], imax);
 | 
			
		||||
    }
 | 
			
		||||
    offsets[IDIM] = sum;
 | 
			
		||||
    sum           = 0;
 | 
			
		||||
 | 
			
		||||
    for (int i = 0; i < c->coords[JCORD]; i++) {
 | 
			
		||||
        sum += sizeOfRank(i, c->dims[JCORD], jmax);
 | 
			
		||||
    }
 | 
			
		||||
    offsets[JDIM] = sum;
 | 
			
		||||
    sum           = 0;
 | 
			
		||||
 | 
			
		||||
    for (int i = 0; i < c->coords[KCORD]; i++) {
 | 
			
		||||
        sum += sizeOfRank(i, c->dims[KCORD], kmax);
 | 
			
		||||
    }
 | 
			
		||||
    offsets[KDIM] = sum;
 | 
			
		||||
#endif
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void commPrintConfig(Comm* c)
 | 
			
		||||
{
 | 
			
		||||
#if defined(_MPI)
 | 
			
		||||
    fflush(stdout);
 | 
			
		||||
    MPI_Barrier(MPI_COMM_WORLD);
 | 
			
		||||
    if (commIsMaster(c)) {
 | 
			
		||||
        printf("Communication setup:\n");
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    for (int i = 0; i < c->size; i++) {
 | 
			
		||||
        if (i == c->rank) {
 | 
			
		||||
            printf("\tRank %d of %d\n", c->rank, c->size);
 | 
			
		||||
            printf("\tNeighbours (front, back, bottom, top, left, right): %d, %d, %d, "
 | 
			
		||||
                   "%d, %d, %d\n",
 | 
			
		||||
                c->neighbours[FRONT],
 | 
			
		||||
                c->neighbours[BACK],
 | 
			
		||||
                c->neighbours[BOTTOM],
 | 
			
		||||
                c->neighbours[TOP],
 | 
			
		||||
                c->neighbours[LEFT],
 | 
			
		||||
                c->neighbours[RIGHT]);
 | 
			
		||||
            printf("\tCoordinates (k,j,i) %d %d %d\n",
 | 
			
		||||
                c->coords[KCORD],
 | 
			
		||||
                c->coords[JCORD],
 | 
			
		||||
                c->coords[ICORD]);
 | 
			
		||||
            printf("\tLocal domain size (k,j,i) %dx%dx%d\n",
 | 
			
		||||
                c->kmaxLocal,
 | 
			
		||||
                c->jmaxLocal,
 | 
			
		||||
                c->imaxLocal);
 | 
			
		||||
            fflush(stdout);
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
    MPI_Barrier(MPI_COMM_WORLD);
 | 
			
		||||
#endif
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void commInit(Comm* c, int argc, char** argv)
 | 
			
		||||
{
 | 
			
		||||
#if defined(_MPI)
 | 
			
		||||
    MPI_Init(&argc, &argv);
 | 
			
		||||
    MPI_Comm_rank(MPI_COMM_WORLD, &(c->rank));
 | 
			
		||||
    MPI_Comm_size(MPI_COMM_WORLD, &(c->size));
 | 
			
		||||
#endif
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void commPartition(Comm* c, int kmax, int jmax, int imax)
 | 
			
		||||
{
 | 
			
		||||
#if defined(_MPI)
 | 
			
		||||
    int dims[NDIMS]    = { 0, 0, 0 };
 | 
			
		||||
    int periods[NDIMS] = { 0, 0, 0 };
 | 
			
		||||
    MPI_Dims_create(c->size, NDIMS, dims);
 | 
			
		||||
    MPI_Cart_create(MPI_COMM_WORLD, NCORDS, dims, periods, 0, &c->comm);
 | 
			
		||||
    MPI_Cart_shift(c->comm, ICORD, 1, &c->neighbours[LEFT], &c->neighbours[RIGHT]);
 | 
			
		||||
    MPI_Cart_shift(c->comm, JCORD, 1, &c->neighbours[BOTTOM], &c->neighbours[TOP]);
 | 
			
		||||
    MPI_Cart_shift(c->comm, KCORD, 1, &c->neighbours[FRONT], &c->neighbours[BACK]);
 | 
			
		||||
    MPI_Cart_get(c->comm, NCORDS, c->dims, periods, c->coords);
 | 
			
		||||
 | 
			
		||||
    c->imaxLocal = sizeOfRank(c->rank, dims[ICORD], imax);
 | 
			
		||||
    c->jmaxLocal = sizeOfRank(c->rank, dims[JCORD], jmax);
 | 
			
		||||
    c->kmaxLocal = sizeOfRank(c->rank, dims[KCORD], kmax);
 | 
			
		||||
 | 
			
		||||
    // setup buffer types for communication
 | 
			
		||||
    setupCommunication(c, LEFT, BULK);
 | 
			
		||||
    setupCommunication(c, LEFT, HALO);
 | 
			
		||||
    setupCommunication(c, RIGHT, BULK);
 | 
			
		||||
    setupCommunication(c, RIGHT, HALO);
 | 
			
		||||
    setupCommunication(c, BOTTOM, BULK);
 | 
			
		||||
    setupCommunication(c, BOTTOM, HALO);
 | 
			
		||||
    setupCommunication(c, TOP, BULK);
 | 
			
		||||
    setupCommunication(c, TOP, HALO);
 | 
			
		||||
    setupCommunication(c, FRONT, BULK);
 | 
			
		||||
    setupCommunication(c, FRONT, HALO);
 | 
			
		||||
    setupCommunication(c, BACK, BULK);
 | 
			
		||||
    setupCommunication(c, BACK, HALO);
 | 
			
		||||
#else
 | 
			
		||||
    c->imaxLocal = imax;
 | 
			
		||||
    c->jmaxLocal = jmax;
 | 
			
		||||
    c->kmaxLocal = kmax;
 | 
			
		||||
#endif
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void commFinalize(Comm* c)
 | 
			
		||||
{
 | 
			
		||||
#if defined(_MPI)
 | 
			
		||||
    for (int i = 0; i < NDIRS; i++) {
 | 
			
		||||
        MPI_Type_free(&c->sbufferTypes[i]);
 | 
			
		||||
        MPI_Type_free(&c->rbufferTypes[i]);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    MPI_Finalize();
 | 
			
		||||
#endif
 | 
			
		||||
}
 | 
			
		||||
@@ -1,51 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2024 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __COMM_H_
 | 
			
		||||
#define __COMM_H_
 | 
			
		||||
#if defined(_MPI)
 | 
			
		||||
#include <mpi.h>
 | 
			
		||||
#endif
 | 
			
		||||
/*
 | 
			
		||||
 * Spatial directions:
 | 
			
		||||
 * ICORD (0) from 0 (LEFT) to imax (RIGHT)
 | 
			
		||||
 * JCORD (1) from 0 (BOTTOM) to jmax (TOP)
 | 
			
		||||
 * KCORD (2) from 0 (FRONT) to kmax (BACK)
 | 
			
		||||
 * All derived Subarray types are in C ordering
 | 
			
		||||
 * with indices KDIM (0), JDIM(1) and IDIM(2)
 | 
			
		||||
 * */
 | 
			
		||||
typedef enum direction { LEFT = 0, RIGHT, BOTTOM, TOP, FRONT, BACK, NDIRS } Direction;
 | 
			
		||||
typedef enum coordinates { ICORD = 0, JCORD, KCORD, NCORDS } Coordinates;
 | 
			
		||||
typedef enum dimension { KDIM = 0, JDIM, IDIM, NDIMS } Dimension;
 | 
			
		||||
enum layer { HALO = 0, BULK };
 | 
			
		||||
enum op { MAX = 0, SUM };
 | 
			
		||||
 | 
			
		||||
typedef struct {
 | 
			
		||||
    int rank;
 | 
			
		||||
    int size;
 | 
			
		||||
#if defined(_MPI)
 | 
			
		||||
    MPI_Comm comm;
 | 
			
		||||
    MPI_Datatype sbufferTypes[NDIRS];
 | 
			
		||||
    MPI_Datatype rbufferTypes[NDIRS];
 | 
			
		||||
#endif
 | 
			
		||||
    int neighbours[NDIRS];
 | 
			
		||||
    int coords[NDIMS], dims[NDIMS];
 | 
			
		||||
    int imaxLocal, jmaxLocal, kmaxLocal;
 | 
			
		||||
    MPI_File fh;
 | 
			
		||||
} Comm;
 | 
			
		||||
 | 
			
		||||
extern void commInit(Comm* c, int argc, char** argv);
 | 
			
		||||
extern void commPartition(Comm* c, int kmax, int jmax, int imax);
 | 
			
		||||
extern void commFinalize(Comm* comm);
 | 
			
		||||
extern void commPrintConfig(Comm*);
 | 
			
		||||
extern void commExchange(Comm*, double*);
 | 
			
		||||
extern void commShift(Comm* c, double* f, double* g, double* h);
 | 
			
		||||
extern void commReduction(double* v, int op);
 | 
			
		||||
extern int commIsBoundary(Comm* c, Direction direction);
 | 
			
		||||
extern void commGetOffsets(Comm* c, int offsets[], int kmax, int jmax, int imax);
 | 
			
		||||
 | 
			
		||||
static inline int commIsMaster(Comm* c) { return c->rank == 0; }
 | 
			
		||||
#endif // __COMM_H_
 | 
			
		||||
@@ -1,16 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __GRID_H_
 | 
			
		||||
#define __GRID_H_
 | 
			
		||||
 | 
			
		||||
typedef struct {
 | 
			
		||||
    double dx, dy, dz;
 | 
			
		||||
    int imax, jmax, kmax;
 | 
			
		||||
    double xlength, ylength, zlength;
 | 
			
		||||
} Grid;
 | 
			
		||||
 | 
			
		||||
#endif // __GRID_H_
 | 
			
		||||
@@ -1,54 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * =======================================================================================
 | 
			
		||||
 *
 | 
			
		||||
 *      Author:   Jan Eitzinger (je), jan.eitzinger@fau.de
 | 
			
		||||
 *      Copyright (c) 2020 RRZE, University Erlangen-Nuremberg
 | 
			
		||||
 *
 | 
			
		||||
 *      Permission is hereby granted, free of charge, to any person obtaining a copy
 | 
			
		||||
 *      of this software and associated documentation files (the "Software"), to deal
 | 
			
		||||
 *      in the Software without restriction, including without limitation the rights
 | 
			
		||||
 *      to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 | 
			
		||||
 *      copies of the Software, and to permit persons to whom the Software is
 | 
			
		||||
 *      furnished to do so, subject to the following conditions:
 | 
			
		||||
 *
 | 
			
		||||
 *      The above copyright notice and this permission notice shall be included in all
 | 
			
		||||
 *      copies or substantial portions of the Software.
 | 
			
		||||
 *
 | 
			
		||||
 *      THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 | 
			
		||||
 *      IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 | 
			
		||||
 *      FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 | 
			
		||||
 *      AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 | 
			
		||||
 *      LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 | 
			
		||||
 *      OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 | 
			
		||||
 *      SOFTWARE.
 | 
			
		||||
 *
 | 
			
		||||
 * =======================================================================================
 | 
			
		||||
 */
 | 
			
		||||
#ifndef LIKWID_MARKERS_H
 | 
			
		||||
#define LIKWID_MARKERS_H
 | 
			
		||||
 | 
			
		||||
#ifdef LIKWID_PERFMON
 | 
			
		||||
#include <likwid.h>
 | 
			
		||||
#define LIKWID_MARKER_INIT                likwid_markerInit()
 | 
			
		||||
#define LIKWID_MARKER_THREADINIT          likwid_markerThreadInit()
 | 
			
		||||
#define LIKWID_MARKER_SWITCH              likwid_markerNextGroup()
 | 
			
		||||
#define LIKWID_MARKER_REGISTER(regionTag) likwid_markerRegisterRegion(regionTag)
 | 
			
		||||
#define LIKWID_MARKER_START(regionTag)    likwid_markerStartRegion(regionTag)
 | 
			
		||||
#define LIKWID_MARKER_STOP(regionTag)     likwid_markerStopRegion(regionTag)
 | 
			
		||||
#define LIKWID_MARKER_CLOSE               likwid_markerClose()
 | 
			
		||||
#define LIKWID_MARKER_RESET(regionTag)    likwid_markerResetRegion(regionTag)
 | 
			
		||||
#define LIKWID_MARKER_GET(regionTag, nevents, events, time, count)                       \
 | 
			
		||||
    likwid_markerGetRegion(regionTag, nevents, events, time, count)
 | 
			
		||||
#else /* LIKWID_PERFMON */
 | 
			
		||||
#define LIKWID_MARKER_INIT
 | 
			
		||||
#define LIKWID_MARKER_THREADINIT
 | 
			
		||||
#define LIKWID_MARKER_SWITCH
 | 
			
		||||
#define LIKWID_MARKER_REGISTER(regionTag)
 | 
			
		||||
#define LIKWID_MARKER_START(regionTag)
 | 
			
		||||
#define LIKWID_MARKER_STOP(regionTag)
 | 
			
		||||
#define LIKWID_MARKER_CLOSE
 | 
			
		||||
#define LIKWID_MARKER_GET(regionTag, nevents, events, time, count)
 | 
			
		||||
#define LIKWID_MARKER_RESET(regionTag)
 | 
			
		||||
#endif /* LIKWID_PERFMON */
 | 
			
		||||
 | 
			
		||||
#endif /*LIKWID_MARKERS_H*/
 | 
			
		||||
@@ -1,84 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2024 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <float.h>
 | 
			
		||||
#include <limits.h>
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
#include <unistd.h>
 | 
			
		||||
 | 
			
		||||
#include "allocate.h"
 | 
			
		||||
#include "comm.h"
 | 
			
		||||
#include "parameter.h"
 | 
			
		||||
#include "progress.h"
 | 
			
		||||
#include "solver.h"
 | 
			
		||||
#include "timing.h"
 | 
			
		||||
#include "vtkWriter.h"
 | 
			
		||||
 | 
			
		||||
int main(int argc, char** argv)
 | 
			
		||||
{
 | 
			
		||||
    double timeStart, timeStop;
 | 
			
		||||
    Parameter p;
 | 
			
		||||
    Solver s;
 | 
			
		||||
 | 
			
		||||
    commInit(&s.comm, argc, argv);
 | 
			
		||||
    initParameter(&p);
 | 
			
		||||
 | 
			
		||||
    if (argc != 2) {
 | 
			
		||||
        printf("Usage: %s <configFile>\n", argv[0]);
 | 
			
		||||
        exit(EXIT_SUCCESS);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    readParameter(&p, argv[1]);
 | 
			
		||||
    commPartition(&s.comm, p.kmax, p.jmax, p.imax);
 | 
			
		||||
    if (commIsMaster(&s.comm)) {
 | 
			
		||||
        printParameter(&p);
 | 
			
		||||
    }
 | 
			
		||||
    initSolver(&s, &p);
 | 
			
		||||
#ifndef VERBOSE
 | 
			
		||||
    initProgress(s.te);
 | 
			
		||||
#endif
 | 
			
		||||
 | 
			
		||||
    double tau = s.tau;
 | 
			
		||||
    double te  = s.te;
 | 
			
		||||
    double t   = 0.0;
 | 
			
		||||
 | 
			
		||||
    timeStart = getTimeStamp();
 | 
			
		||||
    while (t <= te) {
 | 
			
		||||
        if (tau > 0.0) computeTimestep(&s);
 | 
			
		||||
        setBoundaryConditions(&s);
 | 
			
		||||
        setSpecialBoundaryCondition(&s);
 | 
			
		||||
        computeFG(&s);
 | 
			
		||||
        computeRHS(&s);
 | 
			
		||||
        solve(&s);
 | 
			
		||||
        adaptUV(&s);
 | 
			
		||||
        t += s.dt;
 | 
			
		||||
 | 
			
		||||
#ifdef VERBOSE
 | 
			
		||||
        if (commIsMaster(&s.comm)) {
 | 
			
		||||
            printf("TIME %f , TIMESTEP %f\n", t, s.dt);
 | 
			
		||||
        }
 | 
			
		||||
#else
 | 
			
		||||
        printProgress(t);
 | 
			
		||||
#endif
 | 
			
		||||
    }
 | 
			
		||||
    timeStop = getTimeStamp();
 | 
			
		||||
#ifndef VERBOSE
 | 
			
		||||
    stopProgress();
 | 
			
		||||
#endif
 | 
			
		||||
    if (commIsMaster(&s.comm)) {
 | 
			
		||||
        printf("Solution took %.2fs\n", timeStop - timeStart);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    VtkOptions opts = { .grid = s.grid, .comm = s.comm };
 | 
			
		||||
    vtkOpen(&opts, s.problem);
 | 
			
		||||
    vtkScalar(&opts, "pressure", s.p);
 | 
			
		||||
    vtkVector(&opts, "velocity", (VtkVector) { s.u, s.v, s.w });
 | 
			
		||||
    vtkClose(&opts);
 | 
			
		||||
 | 
			
		||||
    commFinalize(&s.comm);
 | 
			
		||||
    return EXIT_SUCCESS;
 | 
			
		||||
}
 | 
			
		||||
@@ -1,126 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
#include <string.h>
 | 
			
		||||
 | 
			
		||||
#include "parameter.h"
 | 
			
		||||
#include "util.h"
 | 
			
		||||
#define MAXLINE 4096
 | 
			
		||||
 | 
			
		||||
void initParameter(Parameter* param)
 | 
			
		||||
{
 | 
			
		||||
    param->xlength = 1.0;
 | 
			
		||||
    param->ylength = 1.0;
 | 
			
		||||
    param->zlength = 1.0;
 | 
			
		||||
    param->imax    = 100;
 | 
			
		||||
    param->jmax    = 100;
 | 
			
		||||
    param->kmax    = 100;
 | 
			
		||||
    param->itermax = 1000;
 | 
			
		||||
    param->eps     = 0.0001;
 | 
			
		||||
    param->omg     = 1.7;
 | 
			
		||||
    param->re      = 100.0;
 | 
			
		||||
    param->gamma   = 0.9;
 | 
			
		||||
    param->tau     = 0.5;
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void readParameter(Parameter* param, const char* filename)
 | 
			
		||||
{
 | 
			
		||||
    FILE* fp = fopen(filename, "r");
 | 
			
		||||
    char line[MAXLINE];
 | 
			
		||||
    int i;
 | 
			
		||||
 | 
			
		||||
    if (!fp) {
 | 
			
		||||
        fprintf(stderr, "Could not open parameter file: %s\n", filename);
 | 
			
		||||
        exit(EXIT_FAILURE);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    while (!feof(fp)) {
 | 
			
		||||
        line[0] = '\0';
 | 
			
		||||
        fgets(line, MAXLINE, fp);
 | 
			
		||||
        for (i = 0; line[i] != '\0' && line[i] != '#'; i++)
 | 
			
		||||
            ;
 | 
			
		||||
        line[i] = '\0';
 | 
			
		||||
 | 
			
		||||
        char* tok = strtok(line, " ");
 | 
			
		||||
        char* val = strtok(NULL, " ");
 | 
			
		||||
 | 
			
		||||
#define PARSE_PARAM(p, f)                                                                \
 | 
			
		||||
    if (strncmp(tok, #p, sizeof(#p) / sizeof(#p[0]) - 1) == 0) {                         \
 | 
			
		||||
        param->p = f(val);                                                               \
 | 
			
		||||
    }
 | 
			
		||||
#define PARSE_STRING(p) PARSE_PARAM(p, strdup)
 | 
			
		||||
#define PARSE_INT(p)    PARSE_PARAM(p, atoi)
 | 
			
		||||
#define PARSE_REAL(p)   PARSE_PARAM(p, atof)
 | 
			
		||||
 | 
			
		||||
        if (tok != NULL && val != NULL) {
 | 
			
		||||
            PARSE_REAL(xlength);
 | 
			
		||||
            PARSE_REAL(ylength);
 | 
			
		||||
            PARSE_REAL(zlength);
 | 
			
		||||
            PARSE_INT(imax);
 | 
			
		||||
            PARSE_INT(jmax);
 | 
			
		||||
            PARSE_INT(kmax);
 | 
			
		||||
            PARSE_INT(itermax);
 | 
			
		||||
            PARSE_REAL(eps);
 | 
			
		||||
            PARSE_REAL(omg);
 | 
			
		||||
            PARSE_REAL(re);
 | 
			
		||||
            PARSE_REAL(tau);
 | 
			
		||||
            PARSE_REAL(gamma);
 | 
			
		||||
            PARSE_REAL(dt);
 | 
			
		||||
            PARSE_REAL(te);
 | 
			
		||||
            PARSE_REAL(gx);
 | 
			
		||||
            PARSE_REAL(gy);
 | 
			
		||||
            PARSE_REAL(gz);
 | 
			
		||||
            PARSE_STRING(name);
 | 
			
		||||
            PARSE_INT(bcLeft);
 | 
			
		||||
            PARSE_INT(bcRight);
 | 
			
		||||
            PARSE_INT(bcBottom);
 | 
			
		||||
            PARSE_INT(bcTop);
 | 
			
		||||
            PARSE_INT(bcFront);
 | 
			
		||||
            PARSE_INT(bcBack);
 | 
			
		||||
            PARSE_REAL(u_init);
 | 
			
		||||
            PARSE_REAL(v_init);
 | 
			
		||||
            PARSE_REAL(w_init);
 | 
			
		||||
            PARSE_REAL(p_init);
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    fclose(fp);
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void printParameter(Parameter* param)
 | 
			
		||||
{
 | 
			
		||||
    printf("Parameters for %s\n", param->name);
 | 
			
		||||
    printf("Boundary conditions Left:%d Right:%d Bottom:%d Top:%d Front:%d "
 | 
			
		||||
           "Back:%d\n",
 | 
			
		||||
        param->bcLeft,
 | 
			
		||||
        param->bcRight,
 | 
			
		||||
        param->bcBottom,
 | 
			
		||||
        param->bcTop,
 | 
			
		||||
        param->bcFront,
 | 
			
		||||
        param->bcBack);
 | 
			
		||||
    printf("\tReynolds number: %.2f\n", param->re);
 | 
			
		||||
    printf("\tInit arrays: U:%.2f V:%.2f W:%.2f P:%.2f\n",
 | 
			
		||||
        param->u_init,
 | 
			
		||||
        param->v_init,
 | 
			
		||||
        param->w_init,
 | 
			
		||||
        param->p_init);
 | 
			
		||||
    printf("Geometry data:\n");
 | 
			
		||||
    printf("\tDomain box size (x, y, z): %.2f, %.2f, %.2f\n",
 | 
			
		||||
        param->xlength,
 | 
			
		||||
        param->ylength,
 | 
			
		||||
        param->zlength);
 | 
			
		||||
    printf("\tCells (x, y, z): %d, %d, %d\n", param->imax, param->jmax, param->kmax);
 | 
			
		||||
    printf("Timestep parameters:\n");
 | 
			
		||||
    printf("\tDefault stepsize: %.2f, Final time %.2f\n", param->dt, param->te);
 | 
			
		||||
    printf("\tTau factor: %.2f\n", param->tau);
 | 
			
		||||
    printf("Iterative solver parameters:\n");
 | 
			
		||||
    printf("\tMax iterations: %d\n", param->itermax);
 | 
			
		||||
    printf("\tepsilon (stopping tolerance) : %f\n", param->eps);
 | 
			
		||||
    printf("\tgamma (stopping tolerance) : %f\n", param->gamma);
 | 
			
		||||
    printf("\tomega (SOR relaxation): %f\n", param->omg);
 | 
			
		||||
}
 | 
			
		||||
@@ -1,26 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __PARAMETER_H_
 | 
			
		||||
#define __PARAMETER_H_
 | 
			
		||||
 | 
			
		||||
typedef struct {
 | 
			
		||||
    int imax, jmax, kmax;
 | 
			
		||||
    double xlength, ylength, zlength;
 | 
			
		||||
    int itermax;
 | 
			
		||||
    double eps, omg;
 | 
			
		||||
    double re, tau, gamma;
 | 
			
		||||
    double te, dt;
 | 
			
		||||
    double gx, gy, gz;
 | 
			
		||||
    char* name;
 | 
			
		||||
    int bcLeft, bcRight, bcBottom, bcTop, bcFront, bcBack;
 | 
			
		||||
    double u_init, v_init, w_init, p_init;
 | 
			
		||||
} Parameter;
 | 
			
		||||
 | 
			
		||||
void initParameter(Parameter*);
 | 
			
		||||
void readParameter(Parameter*, const char*);
 | 
			
		||||
void printParameter(Parameter*);
 | 
			
		||||
#endif
 | 
			
		||||
@@ -1,51 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <math.h>
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
#include <string.h>
 | 
			
		||||
 | 
			
		||||
#include "progress.h"
 | 
			
		||||
 | 
			
		||||
static double _end;
 | 
			
		||||
static int _current;
 | 
			
		||||
 | 
			
		||||
void initProgress(double end)
 | 
			
		||||
{
 | 
			
		||||
    _end     = end;
 | 
			
		||||
    _current = 0;
 | 
			
		||||
 | 
			
		||||
    printf("[          ]");
 | 
			
		||||
    fflush(stdout);
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void printProgress(double current)
 | 
			
		||||
{
 | 
			
		||||
    int new = (int)rint((current / _end) * 10.0);
 | 
			
		||||
 | 
			
		||||
    if (new > _current) {
 | 
			
		||||
        char progress[11];
 | 
			
		||||
        _current    = new;
 | 
			
		||||
        progress[0] = 0;
 | 
			
		||||
 | 
			
		||||
        for (int i = 0; i < 10; i++) {
 | 
			
		||||
            if (i < _current) {
 | 
			
		||||
                sprintf(progress + strlen(progress), "#");
 | 
			
		||||
            } else {
 | 
			
		||||
                sprintf(progress + strlen(progress), " ");
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
        printf("\r[%s]", progress);
 | 
			
		||||
    }
 | 
			
		||||
    fflush(stdout);
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void stopProgress()
 | 
			
		||||
{
 | 
			
		||||
    printf("\n");
 | 
			
		||||
    fflush(stdout);
 | 
			
		||||
}
 | 
			
		||||
@@ -1,14 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __PROGRESS_H_
 | 
			
		||||
#define __PROGRESS_H_
 | 
			
		||||
 | 
			
		||||
extern void initProgress(double);
 | 
			
		||||
extern void printProgress(double);
 | 
			
		||||
extern void stopProgress(void);
 | 
			
		||||
 | 
			
		||||
#endif
 | 
			
		||||
@@ -1,853 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <float.h>
 | 
			
		||||
#include <math.h>
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
#include <string.h>
 | 
			
		||||
 | 
			
		||||
#include "allocate.h"
 | 
			
		||||
#include "comm.h"
 | 
			
		||||
#include "parameter.h"
 | 
			
		||||
#include "solver.h"
 | 
			
		||||
#include "util.h"
 | 
			
		||||
 | 
			
		||||
#define P(i, j, k)                                                                       \
 | 
			
		||||
    p[(k) * (imaxLocal + 2) * (jmaxLocal + 2) + (j) * (imaxLocal + 2) + (i)]
 | 
			
		||||
#define F(i, j, k)                                                                       \
 | 
			
		||||
    f[(k) * (imaxLocal + 2) * (jmaxLocal + 2) + (j) * (imaxLocal + 2) + (i)]
 | 
			
		||||
#define G(i, j, k)                                                                       \
 | 
			
		||||
    g[(k) * (imaxLocal + 2) * (jmaxLocal + 2) + (j) * (imaxLocal + 2) + (i)]
 | 
			
		||||
#define H(i, j, k)                                                                       \
 | 
			
		||||
    h[(k) * (imaxLocal + 2) * (jmaxLocal + 2) + (j) * (imaxLocal + 2) + (i)]
 | 
			
		||||
#define U(i, j, k)                                                                       \
 | 
			
		||||
    u[(k) * (imaxLocal + 2) * (jmaxLocal + 2) + (j) * (imaxLocal + 2) + (i)]
 | 
			
		||||
#define V(i, j, k)                                                                       \
 | 
			
		||||
    v[(k) * (imaxLocal + 2) * (jmaxLocal + 2) + (j) * (imaxLocal + 2) + (i)]
 | 
			
		||||
#define W(i, j, k)                                                                       \
 | 
			
		||||
    w[(k) * (imaxLocal + 2) * (jmaxLocal + 2) + (j) * (imaxLocal + 2) + (i)]
 | 
			
		||||
#define RHS(i, j, k)                                                                     \
 | 
			
		||||
    rhs[(k) * (imaxLocal + 2) * (jmaxLocal + 2) + (j) * (imaxLocal + 2) + (i)]
 | 
			
		||||
 | 
			
		||||
static void printConfig(Solver* s)
 | 
			
		||||
{
 | 
			
		||||
    if (commIsMaster(&s->comm)) {
 | 
			
		||||
        printf("Parameters for #%s#\n", s->problem);
 | 
			
		||||
        printf("BC Left:%d Right:%d Bottom:%d Top:%d Front:%d Back:%d\n",
 | 
			
		||||
            s->bcLeft,
 | 
			
		||||
            s->bcRight,
 | 
			
		||||
            s->bcBottom,
 | 
			
		||||
            s->bcTop,
 | 
			
		||||
            s->bcFront,
 | 
			
		||||
            s->bcBack);
 | 
			
		||||
        printf("\tReynolds number: %.2f\n", s->re);
 | 
			
		||||
        printf("\tGx Gy: %.2f %.2f %.2f\n", s->gx, s->gy, s->gz);
 | 
			
		||||
        printf("Geometry data:\n");
 | 
			
		||||
        printf("\tDomain box size (x, y, z): %.2f, %.2f, %.2f\n",
 | 
			
		||||
            s->grid.xlength,
 | 
			
		||||
            s->grid.ylength,
 | 
			
		||||
            s->grid.zlength);
 | 
			
		||||
        printf("\tCells (x, y, z): %d, %d, %d\n",
 | 
			
		||||
            s->grid.imax,
 | 
			
		||||
            s->grid.jmax,
 | 
			
		||||
            s->grid.kmax);
 | 
			
		||||
        printf("\tCell size (dx, dy, dz): %f, %f, %f\n",
 | 
			
		||||
            s->grid.dx,
 | 
			
		||||
            s->grid.dy,
 | 
			
		||||
            s->grid.dz);
 | 
			
		||||
        printf("Timestep parameters:\n");
 | 
			
		||||
        printf("\tDefault stepsize: %.2f, Final time %.2f\n", s->dt, s->te);
 | 
			
		||||
        printf("\tdt bound: %.6f\n", s->dtBound);
 | 
			
		||||
        printf("\tTau factor: %.2f\n", s->tau);
 | 
			
		||||
        printf("Iterative parameters:\n");
 | 
			
		||||
        printf("\tMax iterations: %d\n", s->itermax);
 | 
			
		||||
        printf("\tepsilon (stopping tolerance) : %f\n", s->eps);
 | 
			
		||||
        printf("\tgamma factor: %f\n", s->gamma);
 | 
			
		||||
        printf("\tomega (SOR relaxation): %f\n", s->omega);
 | 
			
		||||
    }
 | 
			
		||||
    commPrintConfig(&s->comm);
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void initSolver(Solver* s, Parameter* params)
 | 
			
		||||
{
 | 
			
		||||
    s->problem  = params->name;
 | 
			
		||||
    s->bcLeft   = params->bcLeft;
 | 
			
		||||
    s->bcRight  = params->bcRight;
 | 
			
		||||
    s->bcBottom = params->bcBottom;
 | 
			
		||||
    s->bcTop    = params->bcTop;
 | 
			
		||||
    s->bcFront  = params->bcFront;
 | 
			
		||||
    s->bcBack   = params->bcBack;
 | 
			
		||||
 | 
			
		||||
    s->grid.imax    = params->imax;
 | 
			
		||||
    s->grid.jmax    = params->jmax;
 | 
			
		||||
    s->grid.kmax    = params->kmax;
 | 
			
		||||
    s->grid.xlength = params->xlength;
 | 
			
		||||
    s->grid.ylength = params->ylength;
 | 
			
		||||
    s->grid.zlength = params->zlength;
 | 
			
		||||
    s->grid.dx      = params->xlength / params->imax;
 | 
			
		||||
    s->grid.dy      = params->ylength / params->jmax;
 | 
			
		||||
    s->grid.dz      = params->zlength / params->kmax;
 | 
			
		||||
 | 
			
		||||
    s->eps     = params->eps;
 | 
			
		||||
    s->omega   = params->omg;
 | 
			
		||||
    s->itermax = params->itermax;
 | 
			
		||||
    s->re      = params->re;
 | 
			
		||||
    s->gx      = params->gx;
 | 
			
		||||
    s->gy      = params->gy;
 | 
			
		||||
    s->gz      = params->gz;
 | 
			
		||||
    s->dt      = params->dt;
 | 
			
		||||
    s->te      = params->te;
 | 
			
		||||
    s->tau     = params->tau;
 | 
			
		||||
    s->gamma   = params->gamma;
 | 
			
		||||
 | 
			
		||||
    /* allocate arrays */
 | 
			
		||||
    int imaxLocal = s->comm.imaxLocal;
 | 
			
		||||
    int jmaxLocal = s->comm.jmaxLocal;
 | 
			
		||||
    int kmaxLocal = s->comm.kmaxLocal;
 | 
			
		||||
    size_t size   = (imaxLocal + 2) * (jmaxLocal + 2) * (kmaxLocal + 2);
 | 
			
		||||
 | 
			
		||||
    s->u   = allocate(64, size * sizeof(double));
 | 
			
		||||
    s->v   = allocate(64, size * sizeof(double));
 | 
			
		||||
    s->w   = allocate(64, size * sizeof(double));
 | 
			
		||||
    s->p   = allocate(64, size * sizeof(double));
 | 
			
		||||
    s->rhs = allocate(64, size * sizeof(double));
 | 
			
		||||
    s->f   = allocate(64, size * sizeof(double));
 | 
			
		||||
    s->g   = allocate(64, size * sizeof(double));
 | 
			
		||||
    s->h   = allocate(64, size * sizeof(double));
 | 
			
		||||
 | 
			
		||||
    for (int i = 0; i < size; i++) {
 | 
			
		||||
        s->u[i]   = params->u_init;
 | 
			
		||||
        s->v[i]   = params->v_init;
 | 
			
		||||
        s->w[i]   = params->w_init;
 | 
			
		||||
        s->p[i]   = params->p_init;
 | 
			
		||||
        s->rhs[i] = 0.0;
 | 
			
		||||
        s->f[i]   = 0.0;
 | 
			
		||||
        s->g[i]   = 0.0;
 | 
			
		||||
        s->h[i]   = 0.0;
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    double dx = s->grid.dx;
 | 
			
		||||
    double dy = s->grid.dy;
 | 
			
		||||
    double dz = s->grid.dz;
 | 
			
		||||
 | 
			
		||||
    double invSqrSum = 1.0 / (dx * dx) + 1.0 / (dy * dy) + 1.0 / (dz * dz);
 | 
			
		||||
    s->dtBound       = 0.5 * s->re * 1.0 / invSqrSum;
 | 
			
		||||
 | 
			
		||||
#ifdef VERBOSE
 | 
			
		||||
    printConfig(s);
 | 
			
		||||
#endif /* VERBOSE */
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void computeRHS(Solver* s)
 | 
			
		||||
{
 | 
			
		||||
    int imaxLocal = s->comm.imaxLocal;
 | 
			
		||||
    int jmaxLocal = s->comm.jmaxLocal;
 | 
			
		||||
    int kmaxLocal = s->comm.kmaxLocal;
 | 
			
		||||
 | 
			
		||||
    double idx = 1.0 / s->grid.dx;
 | 
			
		||||
    double idy = 1.0 / s->grid.dy;
 | 
			
		||||
    double idz = 1.0 / s->grid.dz;
 | 
			
		||||
    double idt = 1.0 / s->dt;
 | 
			
		||||
 | 
			
		||||
    double* rhs = s->rhs;
 | 
			
		||||
    double* f   = s->f;
 | 
			
		||||
    double* g   = s->g;
 | 
			
		||||
    double* h   = s->h;
 | 
			
		||||
 | 
			
		||||
    commShift(&s->comm, f, g, h);
 | 
			
		||||
 | 
			
		||||
    for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
        for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                RHS(i, j, k) = ((F(i, j, k) - F(i - 1, j, k)) * idx +
 | 
			
		||||
                                   (G(i, j, k) - G(i, j - 1, k)) * idy +
 | 
			
		||||
                                   (H(i, j, k) - H(i, j, k - 1)) * idz) *
 | 
			
		||||
                               idt;
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void solve(Solver* s)
 | 
			
		||||
{
 | 
			
		||||
    int imaxLocal = s->comm.imaxLocal;
 | 
			
		||||
    int jmaxLocal = s->comm.jmaxLocal;
 | 
			
		||||
    int kmaxLocal = s->comm.kmaxLocal;
 | 
			
		||||
 | 
			
		||||
    int imax = s->grid.imax;
 | 
			
		||||
    int jmax = s->grid.jmax;
 | 
			
		||||
    int kmax = s->grid.kmax;
 | 
			
		||||
 | 
			
		||||
    double eps  = s->eps;
 | 
			
		||||
    int itermax = s->itermax;
 | 
			
		||||
    double dx2  = s->grid.dx * s->grid.dx;
 | 
			
		||||
    double dy2  = s->grid.dy * s->grid.dy;
 | 
			
		||||
    double dz2  = s->grid.dz * s->grid.dz;
 | 
			
		||||
    double idx2 = 1.0 / dx2;
 | 
			
		||||
    double idy2 = 1.0 / dy2;
 | 
			
		||||
    double idz2 = 1.0 / dz2;
 | 
			
		||||
 | 
			
		||||
    double factor = s->omega * 0.5 * (dx2 * dy2 * dz2) /
 | 
			
		||||
                    (dy2 * dz2 + dx2 * dz2 + dx2 * dy2);
 | 
			
		||||
    double* p    = s->p;
 | 
			
		||||
    double* rhs  = s->rhs;
 | 
			
		||||
    double epssq = eps * eps;
 | 
			
		||||
    int it       = 0;
 | 
			
		||||
    double res   = 1.0;
 | 
			
		||||
    int pass, ksw, jsw, isw;
 | 
			
		||||
 | 
			
		||||
    while ((res >= epssq) && (it < itermax)) {
 | 
			
		||||
        ksw = 1;
 | 
			
		||||
 | 
			
		||||
        for (pass = 0; pass < 2; pass++) {
 | 
			
		||||
            jsw = ksw;
 | 
			
		||||
            commExchange(&s->comm, p);
 | 
			
		||||
 | 
			
		||||
        for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                isw = jsw;
 | 
			
		||||
            for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                    for (int i = isw; i < imaxLocal + 1; i += 2) {
 | 
			
		||||
 | 
			
		||||
                        double r =
 | 
			
		||||
                            RHS(i, j, k) -
 | 
			
		||||
                            ((P(i + 1, j, k) - 2.0 * P(i, j, k) + P(i - 1, j, k)) * idx2 +
 | 
			
		||||
                                   (P(i, j + 1, k) - 2.0 * P(i, j, k) + P(i, j - 1, k)) *
 | 
			
		||||
                                       idy2 +
 | 
			
		||||
                                   (P(i, j, k + 1) - 2.0 * P(i, j, k) + P(i, j, k - 1)) *
 | 
			
		||||
                                       idz2);
 | 
			
		||||
 | 
			
		||||
                    P(i, j, k) -= (factor * r);
 | 
			
		||||
                    res += (r * r);
 | 
			
		||||
                }
 | 
			
		||||
                    isw = 3 - isw;
 | 
			
		||||
            }
 | 
			
		||||
                jsw = 3 - jsw;
 | 
			
		||||
            }
 | 
			
		||||
            ksw = 3 - ksw;
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        if (commIsBoundary(&s->comm, FRONT)) {
 | 
			
		||||
            for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    P(i, j, 0) = P(i, j, 1);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        if (commIsBoundary(&s->comm, BACK)) {
 | 
			
		||||
            for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    P(i, j, kmaxLocal + 1) = P(i, j, kmaxLocal);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        if (commIsBoundary(&s->comm, BOTTOM)) {
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    P(i, 0, k) = P(i, 1, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        if (commIsBoundary(&s->comm, TOP)) {
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    P(i, jmaxLocal + 1, k) = P(i, jmaxLocal, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        if (commIsBoundary(&s->comm, LEFT)) {
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                    P(0, j, k) = P(1, j, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        if (commIsBoundary(&s->comm, RIGHT)) {
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                    P(imaxLocal + 1, j, k) = P(imaxLocal, j, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        commReduction(&res, SUM);
 | 
			
		||||
        res = res / (double)(imax * jmax * kmax);
 | 
			
		||||
#ifdef DEBUG
 | 
			
		||||
        if (commIsMaster(&s->comm)) {
 | 
			
		||||
            printf("%d Residuum: %e\n", it, res);
 | 
			
		||||
        }
 | 
			
		||||
#endif
 | 
			
		||||
        commExchange(&s->comm, p);
 | 
			
		||||
        it++;
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
#ifdef VERBOSE
 | 
			
		||||
    if (commIsMaster(&s->comm)) {
 | 
			
		||||
        printf("Solver took %d iterations to reach %f\n", it, sqrt(res));
 | 
			
		||||
    }
 | 
			
		||||
#endif
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
static double maxElement(Solver* s, double* m)
 | 
			
		||||
{
 | 
			
		||||
    int size = (s->comm.imaxLocal + 2) * (s->comm.jmaxLocal + 2) *
 | 
			
		||||
               (s->comm.kmaxLocal + 2);
 | 
			
		||||
    double maxval = DBL_MIN;
 | 
			
		||||
 | 
			
		||||
    for (int i = 0; i < size; i++) {
 | 
			
		||||
        maxval = MAX(maxval, fabs(m[i]));
 | 
			
		||||
    }
 | 
			
		||||
    commReduction(&maxval, MAX);
 | 
			
		||||
    return maxval;
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void normalizePressure(Solver* s)
 | 
			
		||||
{
 | 
			
		||||
    int imaxLocal = s->comm.imaxLocal;
 | 
			
		||||
    int jmaxLocal = s->comm.jmaxLocal;
 | 
			
		||||
    int kmaxLocal = s->comm.kmaxLocal;
 | 
			
		||||
 | 
			
		||||
    double* p   = s->p;
 | 
			
		||||
    double avgP = 0.0;
 | 
			
		||||
 | 
			
		||||
    for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
        for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                avgP += P(i, j, k);
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
    commReduction(&avgP, SUM);
 | 
			
		||||
    avgP /= (s->grid.imax * s->grid.jmax * s->grid.kmax);
 | 
			
		||||
 | 
			
		||||
    for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
        for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                P(i, j, k) = P(i, j, k) - avgP;
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void computeTimestep(Solver* s)
 | 
			
		||||
{
 | 
			
		||||
    double dt = s->dtBound;
 | 
			
		||||
    double dx = s->grid.dx;
 | 
			
		||||
    double dy = s->grid.dy;
 | 
			
		||||
    double dz = s->grid.dz;
 | 
			
		||||
 | 
			
		||||
    double umax = maxElement(s, s->u);
 | 
			
		||||
    double vmax = maxElement(s, s->v);
 | 
			
		||||
    double wmax = maxElement(s, s->w);
 | 
			
		||||
 | 
			
		||||
    if (umax > 0) {
 | 
			
		||||
        dt = (dt > dx / umax) ? dx / umax : dt;
 | 
			
		||||
    }
 | 
			
		||||
    if (vmax > 0) {
 | 
			
		||||
        dt = (dt > dy / vmax) ? dy / vmax : dt;
 | 
			
		||||
    }
 | 
			
		||||
    if (wmax > 0) {
 | 
			
		||||
        dt = (dt > dz / wmax) ? dz / wmax : dt;
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    s->dt = dt * s->tau;
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void setBoundaryConditions(Solver* s)
 | 
			
		||||
{
 | 
			
		||||
    int imaxLocal = s->comm.imaxLocal;
 | 
			
		||||
    int jmaxLocal = s->comm.jmaxLocal;
 | 
			
		||||
    int kmaxLocal = s->comm.kmaxLocal;
 | 
			
		||||
 | 
			
		||||
    double* u = s->u;
 | 
			
		||||
    double* v = s->v;
 | 
			
		||||
    double* w = s->w;
 | 
			
		||||
 | 
			
		||||
    if (commIsBoundary(&s->comm, TOP)) {
 | 
			
		||||
        switch (s->bcTop) {
 | 
			
		||||
        case NOSLIP:
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    U(i, jmaxLocal + 1, k) = -U(i, jmaxLocal, k);
 | 
			
		||||
                    V(i, jmaxLocal, k)     = 0.0;
 | 
			
		||||
                    W(i, jmaxLocal + 1, k) = -W(i, jmaxLocal, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case SLIP:
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    U(i, jmaxLocal + 1, k) = U(i, jmaxLocal, k);
 | 
			
		||||
                    V(i, jmaxLocal, k)     = 0.0;
 | 
			
		||||
                    W(i, jmaxLocal + 1, k) = W(i, jmaxLocal, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case OUTFLOW:
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    U(i, jmaxLocal + 1, k) = U(i, jmaxLocal, k);
 | 
			
		||||
                    V(i, jmaxLocal, k)     = V(i, jmaxLocal - 1, k);
 | 
			
		||||
                    W(i, jmaxLocal + 1, k) = W(i, jmaxLocal, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case PERIODIC:
 | 
			
		||||
            break;
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    if (commIsBoundary(&s->comm, BOTTOM)) {
 | 
			
		||||
        switch (s->bcBottom) {
 | 
			
		||||
        case NOSLIP:
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    U(i, 0, k) = -U(i, 1, k);
 | 
			
		||||
                    V(i, 0, k) = 0.0;
 | 
			
		||||
                    W(i, 0, k) = -W(i, 1, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case SLIP:
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    U(i, 0, k) = U(i, 1, k);
 | 
			
		||||
                    V(i, 0, k) = 0.0;
 | 
			
		||||
                    W(i, 0, k) = W(i, 1, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case OUTFLOW:
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    U(i, 0, k) = U(i, 1, k);
 | 
			
		||||
                    V(i, 0, k) = V(i, 1, k);
 | 
			
		||||
                    W(i, 0, k) = W(i, 1, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case PERIODIC:
 | 
			
		||||
            break;
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    if (commIsBoundary(&s->comm, LEFT)) {
 | 
			
		||||
        switch (s->bcLeft) {
 | 
			
		||||
        case NOSLIP:
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                    U(0, j, k) = 0.0;
 | 
			
		||||
                    V(0, j, k) = -V(1, j, k);
 | 
			
		||||
                    W(0, j, k) = -W(1, j, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case SLIP:
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                    U(0, j, k) = 0.0;
 | 
			
		||||
                    V(0, j, k) = V(1, j, k);
 | 
			
		||||
                    W(0, j, k) = W(1, j, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case OUTFLOW:
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                    U(0, j, k) = U(1, j, k);
 | 
			
		||||
                    V(0, j, k) = V(1, j, k);
 | 
			
		||||
                    W(0, j, k) = W(1, j, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case PERIODIC:
 | 
			
		||||
            break;
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    if (commIsBoundary(&s->comm, RIGHT)) {
 | 
			
		||||
        switch (s->bcRight) {
 | 
			
		||||
        case NOSLIP:
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                    U(imaxLocal, j, k)     = 0.0;
 | 
			
		||||
                    V(imaxLocal + 1, j, k) = -V(imaxLocal, j, k);
 | 
			
		||||
                    W(imaxLocal + 1, j, k) = -W(imaxLocal, j, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case SLIP:
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                    U(imaxLocal, j, k)     = 0.0;
 | 
			
		||||
                    V(imaxLocal + 1, j, k) = V(imaxLocal, j, k);
 | 
			
		||||
                    W(imaxLocal + 1, j, k) = W(imaxLocal, j, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case OUTFLOW:
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                    U(imaxLocal, j, k)     = U(imaxLocal - 1, j, k);
 | 
			
		||||
                    V(imaxLocal + 1, j, k) = V(imaxLocal, j, k);
 | 
			
		||||
                    W(imaxLocal + 1, j, k) = W(imaxLocal, j, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case PERIODIC:
 | 
			
		||||
            break;
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    if (commIsBoundary(&s->comm, FRONT)) {
 | 
			
		||||
        switch (s->bcFront) {
 | 
			
		||||
        case NOSLIP:
 | 
			
		||||
            for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    U(i, j, 0) = -U(i, j, 1);
 | 
			
		||||
                    V(i, j, 0) = -V(i, j, 1);
 | 
			
		||||
                    W(i, j, 0) = 0.0;
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case SLIP:
 | 
			
		||||
            for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    U(i, j, 0) = U(i, j, 1);
 | 
			
		||||
                    V(i, j, 0) = V(i, j, 1);
 | 
			
		||||
                    W(i, j, 0) = 0.0;
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case OUTFLOW:
 | 
			
		||||
            for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    U(i, j, 0) = U(i, j, 1);
 | 
			
		||||
                    V(i, j, 0) = V(i, j, 1);
 | 
			
		||||
                    W(i, j, 0) = W(i, j, 1);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case PERIODIC:
 | 
			
		||||
            break;
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    if (commIsBoundary(&s->comm, BACK)) {
 | 
			
		||||
        switch (s->bcBack) {
 | 
			
		||||
        case NOSLIP:
 | 
			
		||||
            for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    U(i, j, kmaxLocal + 1) = -U(i, j, kmaxLocal);
 | 
			
		||||
                    V(i, j, kmaxLocal + 1) = -V(i, j, kmaxLocal);
 | 
			
		||||
                    W(i, j, kmaxLocal)     = 0.0;
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case SLIP:
 | 
			
		||||
            for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    U(i, j, kmaxLocal + 1) = U(i, j, kmaxLocal);
 | 
			
		||||
                    V(i, j, kmaxLocal + 1) = V(i, j, kmaxLocal);
 | 
			
		||||
                    W(i, j, kmaxLocal)     = 0.0;
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case OUTFLOW:
 | 
			
		||||
            for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                    U(i, j, kmaxLocal + 1) = U(i, j, kmaxLocal);
 | 
			
		||||
                    V(i, j, kmaxLocal + 1) = V(i, j, kmaxLocal);
 | 
			
		||||
                    W(i, j, kmaxLocal)     = W(i, j, kmaxLocal - 1);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
            break;
 | 
			
		||||
        case PERIODIC:
 | 
			
		||||
            break;
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void setSpecialBoundaryCondition(Solver* s)
 | 
			
		||||
{
 | 
			
		||||
    int imaxLocal = s->comm.imaxLocal;
 | 
			
		||||
    int jmaxLocal = s->comm.jmaxLocal;
 | 
			
		||||
    int kmaxLocal = s->comm.kmaxLocal;
 | 
			
		||||
 | 
			
		||||
    double* u = s->u;
 | 
			
		||||
 | 
			
		||||
    if (strcmp(s->problem, "dcavity") == 0) {
 | 
			
		||||
        if (commIsBoundary(&s->comm, TOP)) {
 | 
			
		||||
            for (int k = 1; k < kmaxLocal; k++) {
 | 
			
		||||
                for (int i = 1; i < imaxLocal; i++) {
 | 
			
		||||
                    U(i, jmaxLocal + 1, k) = 2.0 - U(i, jmaxLocal, k);
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    } else if (strcmp(s->problem, "canal") == 0) {
 | 
			
		||||
        if (commIsBoundary(&s->comm, LEFT)) {
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                    U(0, j, k) = 2.0;
 | 
			
		||||
                }
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void computeFG(Solver* s)
 | 
			
		||||
{
 | 
			
		||||
    int imaxLocal = s->comm.imaxLocal;
 | 
			
		||||
    int jmaxLocal = s->comm.jmaxLocal;
 | 
			
		||||
    int kmaxLocal = s->comm.kmaxLocal;
 | 
			
		||||
 | 
			
		||||
    double* u = s->u;
 | 
			
		||||
    double* v = s->v;
 | 
			
		||||
    double* w = s->w;
 | 
			
		||||
    double* f = s->f;
 | 
			
		||||
    double* g = s->g;
 | 
			
		||||
    double* h = s->h;
 | 
			
		||||
 | 
			
		||||
    double gx = s->gx;
 | 
			
		||||
    double gy = s->gy;
 | 
			
		||||
    double gz = s->gz;
 | 
			
		||||
    double dt = s->dt;
 | 
			
		||||
 | 
			
		||||
    double gamma     = s->gamma;
 | 
			
		||||
    double inverseRe = 1.0 / s->re;
 | 
			
		||||
    double inverseDx = 1.0 / s->grid.dx;
 | 
			
		||||
    double inverseDy = 1.0 / s->grid.dy;
 | 
			
		||||
    double inverseDz = 1.0 / s->grid.dz;
 | 
			
		||||
    double du2dx, dv2dy, dw2dz;
 | 
			
		||||
    double duvdx, duwdx, duvdy, dvwdy, duwdz, dvwdz;
 | 
			
		||||
    double du2dx2, du2dy2, du2dz2;
 | 
			
		||||
    double dv2dx2, dv2dy2, dv2dz2;
 | 
			
		||||
    double dw2dx2, dw2dy2, dw2dz2;
 | 
			
		||||
 | 
			
		||||
    commExchange(&s->comm, u);
 | 
			
		||||
    commExchange(&s->comm, v);
 | 
			
		||||
    commExchange(&s->comm, w);
 | 
			
		||||
 | 
			
		||||
    for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
        for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                du2dx = inverseDx * 0.25 *
 | 
			
		||||
                            ((U(i, j, k) + U(i + 1, j, k)) *
 | 
			
		||||
                                    (U(i, j, k) + U(i + 1, j, k)) -
 | 
			
		||||
                                (U(i, j, k) + U(i - 1, j, k)) *
 | 
			
		||||
                                    (U(i, j, k) + U(i - 1, j, k))) +
 | 
			
		||||
                        gamma * inverseDx * 0.25 *
 | 
			
		||||
                            (fabs(U(i, j, k) + U(i + 1, j, k)) *
 | 
			
		||||
                                    (U(i, j, k) - U(i + 1, j, k)) +
 | 
			
		||||
                                fabs(U(i, j, k) + U(i - 1, j, k)) *
 | 
			
		||||
                                    (U(i, j, k) - U(i - 1, j, k)));
 | 
			
		||||
 | 
			
		||||
                duvdy = inverseDy * 0.25 *
 | 
			
		||||
                            ((V(i, j, k) + V(i + 1, j, k)) *
 | 
			
		||||
                                    (U(i, j, k) + U(i, j + 1, k)) -
 | 
			
		||||
                                (V(i, j - 1, k) + V(i + 1, j - 1, k)) *
 | 
			
		||||
                                    (U(i, j, k) + U(i, j - 1, k))) +
 | 
			
		||||
                        gamma * inverseDy * 0.25 *
 | 
			
		||||
                            (fabs(V(i, j, k) + V(i + 1, j, k)) *
 | 
			
		||||
                                    (U(i, j, k) - U(i, j + 1, k)) +
 | 
			
		||||
                                fabs(V(i, j - 1, k) + V(i + 1, j - 1, k)) *
 | 
			
		||||
                                    (U(i, j, k) - U(i, j - 1, k)));
 | 
			
		||||
 | 
			
		||||
                duwdz = inverseDz * 0.25 *
 | 
			
		||||
                            ((W(i, j, k) + W(i + 1, j, k)) *
 | 
			
		||||
                                    (U(i, j, k) + U(i, j, k + 1)) -
 | 
			
		||||
                                (W(i, j, k - 1) + W(i + 1, j, k - 1)) *
 | 
			
		||||
                                    (U(i, j, k) + U(i, j, k - 1))) +
 | 
			
		||||
                        gamma * inverseDz * 0.25 *
 | 
			
		||||
                            (fabs(W(i, j, k) + W(i + 1, j, k)) *
 | 
			
		||||
                                    (U(i, j, k) - U(i, j, k + 1)) +
 | 
			
		||||
                                fabs(W(i, j, k - 1) + W(i + 1, j, k - 1)) *
 | 
			
		||||
                                    (U(i, j, k) - U(i, j, k - 1)));
 | 
			
		||||
 | 
			
		||||
                du2dx2 = inverseDx * inverseDx *
 | 
			
		||||
                         (U(i + 1, j, k) - 2.0 * U(i, j, k) + U(i - 1, j, k));
 | 
			
		||||
                du2dy2 = inverseDy * inverseDy *
 | 
			
		||||
                         (U(i, j + 1, k) - 2.0 * U(i, j, k) + U(i, j - 1, k));
 | 
			
		||||
                du2dz2 = inverseDz * inverseDz *
 | 
			
		||||
                         (U(i, j, k + 1) - 2.0 * U(i, j, k) + U(i, j, k - 1));
 | 
			
		||||
                F(i, j, k) = U(i, j, k) + dt * (inverseRe * (du2dx2 + du2dy2 + du2dz2) -
 | 
			
		||||
                                                   du2dx - duvdy - duwdz + gx);
 | 
			
		||||
 | 
			
		||||
                duvdx = inverseDx * 0.25 *
 | 
			
		||||
                            ((U(i, j, k) + U(i, j + 1, k)) *
 | 
			
		||||
                                    (V(i, j, k) + V(i + 1, j, k)) -
 | 
			
		||||
                                (U(i - 1, j, k) + U(i - 1, j + 1, k)) *
 | 
			
		||||
                                    (V(i, j, k) + V(i - 1, j, k))) +
 | 
			
		||||
                        gamma * inverseDx * 0.25 *
 | 
			
		||||
                            (fabs(U(i, j, k) + U(i, j + 1, k)) *
 | 
			
		||||
                                    (V(i, j, k) - V(i + 1, j, k)) +
 | 
			
		||||
                                fabs(U(i - 1, j, k) + U(i - 1, j + 1, k)) *
 | 
			
		||||
                                    (V(i, j, k) - V(i - 1, j, k)));
 | 
			
		||||
 | 
			
		||||
                dv2dy = inverseDy * 0.25 *
 | 
			
		||||
                            ((V(i, j, k) + V(i, j + 1, k)) *
 | 
			
		||||
                                    (V(i, j, k) + V(i, j + 1, k)) -
 | 
			
		||||
                                (V(i, j, k) + V(i, j - 1, k)) *
 | 
			
		||||
                                    (V(i, j, k) + V(i, j - 1, k))) +
 | 
			
		||||
                        gamma * inverseDy * 0.25 *
 | 
			
		||||
                            (fabs(V(i, j, k) + V(i, j + 1, k)) *
 | 
			
		||||
                                    (V(i, j, k) - V(i, j + 1, k)) +
 | 
			
		||||
                                fabs(V(i, j, k) + V(i, j - 1, k)) *
 | 
			
		||||
                                    (V(i, j, k) - V(i, j - 1, k)));
 | 
			
		||||
 | 
			
		||||
                dvwdz = inverseDz * 0.25 *
 | 
			
		||||
                            ((W(i, j, k) + W(i, j + 1, k)) *
 | 
			
		||||
                                    (V(i, j, k) + V(i, j, k + 1)) -
 | 
			
		||||
                                (W(i, j, k - 1) + W(i, j + 1, k - 1)) *
 | 
			
		||||
                                    (V(i, j, k) + V(i, j, k + 1))) +
 | 
			
		||||
                        gamma * inverseDz * 0.25 *
 | 
			
		||||
                            (fabs(W(i, j, k) + W(i, j + 1, k)) *
 | 
			
		||||
                                    (V(i, j, k) - V(i, j, k + 1)) +
 | 
			
		||||
                                fabs(W(i, j, k - 1) + W(i, j + 1, k - 1)) *
 | 
			
		||||
                                    (V(i, j, k) - V(i, j, k + 1)));
 | 
			
		||||
 | 
			
		||||
                dv2dx2 = inverseDx * inverseDx *
 | 
			
		||||
                         (V(i + 1, j, k) - 2.0 * V(i, j, k) + V(i - 1, j, k));
 | 
			
		||||
                dv2dy2 = inverseDy * inverseDy *
 | 
			
		||||
                         (V(i, j + 1, k) - 2.0 * V(i, j, k) + V(i, j - 1, k));
 | 
			
		||||
                dv2dz2 = inverseDz * inverseDz *
 | 
			
		||||
                         (V(i, j, k + 1) - 2.0 * V(i, j, k) + V(i, j, k - 1));
 | 
			
		||||
                G(i, j, k) = V(i, j, k) + dt * (inverseRe * (dv2dx2 + dv2dy2 + dv2dz2) -
 | 
			
		||||
                                                   duvdx - dv2dy - dvwdz + gy);
 | 
			
		||||
 | 
			
		||||
                duwdx = inverseDx * 0.25 *
 | 
			
		||||
                            ((U(i, j, k) + U(i, j, k + 1)) *
 | 
			
		||||
                                    (W(i, j, k) + W(i + 1, j, k)) -
 | 
			
		||||
                                (U(i - 1, j, k) + U(i - 1, j, k + 1)) *
 | 
			
		||||
                                    (W(i, j, k) + W(i - 1, j, k))) +
 | 
			
		||||
                        gamma * inverseDx * 0.25 *
 | 
			
		||||
                            (fabs(U(i, j, k) + U(i, j, k + 1)) *
 | 
			
		||||
                                    (W(i, j, k) - W(i + 1, j, k)) +
 | 
			
		||||
                                fabs(U(i - 1, j, k) + U(i - 1, j, k + 1)) *
 | 
			
		||||
                                    (W(i, j, k) - W(i - 1, j, k)));
 | 
			
		||||
 | 
			
		||||
                dvwdy = inverseDy * 0.25 *
 | 
			
		||||
                            ((V(i, j, k) + V(i, j, k + 1)) *
 | 
			
		||||
                                    (W(i, j, k) + W(i, j + 1, k)) -
 | 
			
		||||
                                (V(i, j - 1, k + 1) + V(i, j - 1, k)) *
 | 
			
		||||
                                    (W(i, j, k) + W(i, j - 1, k))) +
 | 
			
		||||
                        gamma * inverseDy * 0.25 *
 | 
			
		||||
                            (fabs(V(i, j, k) + V(i, j, k + 1)) *
 | 
			
		||||
                                    (W(i, j, k) - W(i, j + 1, k)) +
 | 
			
		||||
                                fabs(V(i, j - 1, k + 1) + V(i, j - 1, k)) *
 | 
			
		||||
                                    (W(i, j, k) - W(i, j - 1, k)));
 | 
			
		||||
 | 
			
		||||
                dw2dz = inverseDz * 0.25 *
 | 
			
		||||
                            ((W(i, j, k) + W(i, j, k + 1)) *
 | 
			
		||||
                                    (W(i, j, k) + W(i, j, k + 1)) -
 | 
			
		||||
                                (W(i, j, k) + W(i, j, k - 1)) *
 | 
			
		||||
                                    (W(i, j, k) + W(i, j, k - 1))) +
 | 
			
		||||
                        gamma * inverseDz * 0.25 *
 | 
			
		||||
                            (fabs(W(i, j, k) + W(i, j, k + 1)) *
 | 
			
		||||
                                    (W(i, j, k) - W(i, j, k + 1)) +
 | 
			
		||||
                                fabs(W(i, j, k) + W(i, j, k - 1)) *
 | 
			
		||||
                                    (W(i, j, k) - W(i, j, k - 1)));
 | 
			
		||||
 | 
			
		||||
                dw2dx2 = inverseDx * inverseDx *
 | 
			
		||||
                         (W(i + 1, j, k) - 2.0 * W(i, j, k) + W(i - 1, j, k));
 | 
			
		||||
                dw2dy2 = inverseDy * inverseDy *
 | 
			
		||||
                         (W(i, j + 1, k) - 2.0 * W(i, j, k) + W(i, j - 1, k));
 | 
			
		||||
                dw2dz2 = inverseDz * inverseDz *
 | 
			
		||||
                         (W(i, j, k + 1) - 2.0 * W(i, j, k) + W(i, j, k - 1));
 | 
			
		||||
                H(i, j, k) = W(i, j, k) + dt * (inverseRe * (dw2dx2 + dw2dy2 + dw2dz2) -
 | 
			
		||||
                                                   duwdx - dvwdy - dw2dz + gz);
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    /* ----------------------------- boundary of F ---------------------------
 | 
			
		||||
     */
 | 
			
		||||
    if (commIsBoundary(&s->comm, LEFT)) {
 | 
			
		||||
        for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
            for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                F(0, j, k) = U(0, j, k);
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    if (commIsBoundary(&s->comm, RIGHT)) {
 | 
			
		||||
        for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
            for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                F(imaxLocal, j, k) = U(imaxLocal, j, k);
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    /* ----------------------------- boundary of G ---------------------------
 | 
			
		||||
     */
 | 
			
		||||
    if (commIsBoundary(&s->comm, BOTTOM)) {
 | 
			
		||||
        for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                G(i, 0, k) = V(i, 0, k);
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    if (commIsBoundary(&s->comm, TOP)) {
 | 
			
		||||
        for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                G(i, jmaxLocal, k) = V(i, jmaxLocal, k);
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    /* ----------------------------- boundary of H ---------------------------
 | 
			
		||||
     */
 | 
			
		||||
    if (commIsBoundary(&s->comm, FRONT)) {
 | 
			
		||||
        for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                H(i, j, 0) = W(i, j, 0);
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    if (commIsBoundary(&s->comm, BACK)) {
 | 
			
		||||
        for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                H(i, j, kmaxLocal) = W(i, j, kmaxLocal);
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void adaptUV(Solver* s)
 | 
			
		||||
{
 | 
			
		||||
    int imaxLocal = s->comm.imaxLocal;
 | 
			
		||||
    int jmaxLocal = s->comm.jmaxLocal;
 | 
			
		||||
    int kmaxLocal = s->comm.kmaxLocal;
 | 
			
		||||
 | 
			
		||||
    double* p = s->p;
 | 
			
		||||
    double* u = s->u;
 | 
			
		||||
    double* v = s->v;
 | 
			
		||||
    double* w = s->w;
 | 
			
		||||
    double* f = s->f;
 | 
			
		||||
    double* g = s->g;
 | 
			
		||||
    double* h = s->h;
 | 
			
		||||
 | 
			
		||||
    double factorX = s->dt / s->grid.dx;
 | 
			
		||||
    double factorY = s->dt / s->grid.dy;
 | 
			
		||||
    double factorZ = s->dt / s->grid.dz;
 | 
			
		||||
 | 
			
		||||
    for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
        for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                U(i, j, k) = F(i, j, k) - (P(i + 1, j, k) - P(i, j, k)) * factorX;
 | 
			
		||||
                V(i, j, k) = G(i, j, k) - (P(i, j + 1, k) - P(i, j, k)) * factorY;
 | 
			
		||||
                W(i, j, k) = H(i, j, k) - (P(i, j, k + 1) - P(i, j, k)) * factorZ;
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
@@ -1,45 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __SOLVER_H_
 | 
			
		||||
#define __SOLVER_H_
 | 
			
		||||
#include "comm.h"
 | 
			
		||||
#include "grid.h"
 | 
			
		||||
#include "parameter.h"
 | 
			
		||||
 | 
			
		||||
enum BC { NOSLIP = 1, SLIP, OUTFLOW, PERIODIC };
 | 
			
		||||
 | 
			
		||||
typedef struct {
 | 
			
		||||
    /* geometry and grid information */
 | 
			
		||||
    Grid grid;
 | 
			
		||||
    /* arrays */
 | 
			
		||||
    double *p, *rhs;
 | 
			
		||||
    double *f, *g, *h;
 | 
			
		||||
    double *u, *v, *w;
 | 
			
		||||
    /* parameters */
 | 
			
		||||
    double eps, omega;
 | 
			
		||||
    double re, tau, gamma;
 | 
			
		||||
    double gx, gy, gz;
 | 
			
		||||
    /* time stepping */
 | 
			
		||||
    int itermax;
 | 
			
		||||
    double dt, te;
 | 
			
		||||
    double dtBound;
 | 
			
		||||
    char* problem;
 | 
			
		||||
    int bcLeft, bcRight, bcBottom, bcTop, bcFront, bcBack;
 | 
			
		||||
    /* communication */
 | 
			
		||||
    Comm comm;
 | 
			
		||||
} Solver;
 | 
			
		||||
 | 
			
		||||
extern void initSolver(Solver*, Parameter*);
 | 
			
		||||
extern void computeRHS(Solver*);
 | 
			
		||||
extern void solve(Solver*);
 | 
			
		||||
extern void normalizePressure(Solver*);
 | 
			
		||||
extern void computeTimestep(Solver*);
 | 
			
		||||
extern void setBoundaryConditions(Solver*);
 | 
			
		||||
extern void setSpecialBoundaryCondition(Solver*);
 | 
			
		||||
extern void computeFG(Solver*);
 | 
			
		||||
extern void adaptUV(Solver*);
 | 
			
		||||
#endif
 | 
			
		||||
@@ -1,129 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <string.h>
 | 
			
		||||
 | 
			
		||||
#include "test.h"
 | 
			
		||||
 | 
			
		||||
#define G(v, i, j, k)                                                                    \
 | 
			
		||||
    v[(k) * (imaxLocal + 2) * (jmaxLocal + 2) + (j) * (imaxLocal + 2) + (i)]
 | 
			
		||||
 | 
			
		||||
void testInit(Solver* s)
 | 
			
		||||
{
 | 
			
		||||
    int imaxLocal = s->comm.imaxLocal;
 | 
			
		||||
    int jmaxLocal = s->comm.jmaxLocal;
 | 
			
		||||
    int kmaxLocal = s->comm.kmaxLocal;
 | 
			
		||||
    int myrank    = s->comm.rank;
 | 
			
		||||
    double* p     = s->p;
 | 
			
		||||
    double* f     = s->f;
 | 
			
		||||
    double* g     = s->g;
 | 
			
		||||
    double* h     = s->h;
 | 
			
		||||
 | 
			
		||||
    for (int k = 0; k < kmaxLocal + 2; k++) {
 | 
			
		||||
        for (int j = 0; j < jmaxLocal + 2; j++) {
 | 
			
		||||
            for (int i = 0; i < imaxLocal + 2; i++) {
 | 
			
		||||
                G(p, i, j, k) = 10.0;
 | 
			
		||||
                G(f, i, j, k) = myrank + 1.0;
 | 
			
		||||
                G(g, i, j, k) = myrank + 1.0;
 | 
			
		||||
                G(h, i, j, k) = myrank + 1.0;
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
        for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                G(p, i, j, k) = myrank + 1.0;
 | 
			
		||||
                G(f, i, j, k) = myrank + 1.0;
 | 
			
		||||
                G(g, i, j, k) = myrank + 1.0;
 | 
			
		||||
                G(h, i, j, k) = myrank + 1.0;
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
static char* direction2String(Direction dir)
 | 
			
		||||
{
 | 
			
		||||
    switch (dir) {
 | 
			
		||||
    case LEFT:
 | 
			
		||||
        return "left";
 | 
			
		||||
        break;
 | 
			
		||||
    case RIGHT:
 | 
			
		||||
        return "right";
 | 
			
		||||
        break;
 | 
			
		||||
    case BOTTOM:
 | 
			
		||||
        return "bottom";
 | 
			
		||||
        break;
 | 
			
		||||
    case TOP:
 | 
			
		||||
        return "top";
 | 
			
		||||
        break;
 | 
			
		||||
    case FRONT:
 | 
			
		||||
        return "front";
 | 
			
		||||
        break;
 | 
			
		||||
    case BACK:
 | 
			
		||||
        return "back";
 | 
			
		||||
        break;
 | 
			
		||||
    case NDIRS:
 | 
			
		||||
        return "ERROR";
 | 
			
		||||
    default:
 | 
			
		||||
        return "ERROR";
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
static void printPlane(Solver* s, double* a, int ymax, int xmax, Direction dir)
 | 
			
		||||
{
 | 
			
		||||
    int imaxLocal = s->comm.imaxLocal;
 | 
			
		||||
    int jmaxLocal = s->comm.jmaxLocal;
 | 
			
		||||
    int kmaxLocal = s->comm.kmaxLocal;
 | 
			
		||||
    char filename[50];
 | 
			
		||||
    snprintf(filename, 50, "halo-%s-r%d.txt", direction2String(dir), s->comm.rank);
 | 
			
		||||
    FILE* fh = fopen(filename, "w");
 | 
			
		||||
 | 
			
		||||
    for (int y = 0; y < ymax; y++) {
 | 
			
		||||
        for (int x = 0; x < xmax; x++) {
 | 
			
		||||
            switch (dir) {
 | 
			
		||||
            case LEFT:
 | 
			
		||||
                fprintf(fh, "%12.8f ", G(a, 0, x, y));
 | 
			
		||||
                break;
 | 
			
		||||
            case RIGHT:
 | 
			
		||||
                fprintf(fh, "%12.8f ", G(a, imaxLocal + 1, x, y));
 | 
			
		||||
                break;
 | 
			
		||||
            case BOTTOM:
 | 
			
		||||
                fprintf(fh, "%12.8f ", G(a, x, 0, y));
 | 
			
		||||
                break;
 | 
			
		||||
            case TOP:
 | 
			
		||||
                fprintf(fh, "%12.8f ", G(a, x, jmaxLocal + 1, y));
 | 
			
		||||
                break;
 | 
			
		||||
            case FRONT:
 | 
			
		||||
                fprintf(fh, "%12.8f ", G(a, x, y, 0));
 | 
			
		||||
                break;
 | 
			
		||||
            case BACK:
 | 
			
		||||
                fprintf(fh, "%12.8f ", G(a, x, y, kmaxLocal + 1));
 | 
			
		||||
                break;
 | 
			
		||||
            case NDIRS:
 | 
			
		||||
                printf("ERROR\n");
 | 
			
		||||
                break;
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
        fprintf(fh, "\n");
 | 
			
		||||
    }
 | 
			
		||||
    fclose(fh);
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void testPrintHalo(Solver* s, double* a)
 | 
			
		||||
{
 | 
			
		||||
    int imaxLocal = s->comm.imaxLocal;
 | 
			
		||||
    int jmaxLocal = s->comm.jmaxLocal;
 | 
			
		||||
    int kmaxLocal = s->comm.kmaxLocal;
 | 
			
		||||
 | 
			
		||||
    printPlane(s, a, kmaxLocal + 2, imaxLocal + 2, BOTTOM);
 | 
			
		||||
    printPlane(s, a, kmaxLocal + 2, imaxLocal + 2, TOP);
 | 
			
		||||
    printPlane(s, a, kmaxLocal + 2, jmaxLocal + 2, LEFT);
 | 
			
		||||
    printPlane(s, a, kmaxLocal + 2, jmaxLocal + 2, RIGHT);
 | 
			
		||||
    printPlane(s, a, jmaxLocal + 2, imaxLocal + 2, FRONT);
 | 
			
		||||
    printPlane(s, a, jmaxLocal + 2, imaxLocal + 2, BACK);
 | 
			
		||||
}
 | 
			
		||||
@@ -1,13 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __TEST_H_
 | 
			
		||||
#define __TEST_H_
 | 
			
		||||
#include "solver.h"
 | 
			
		||||
 | 
			
		||||
extern void testInit(Solver* s);
 | 
			
		||||
extern void testPrintHalo(Solver* s, double* a);
 | 
			
		||||
#endif // __TEST_H_
 | 
			
		||||
@@ -1,22 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
#include <time.h>
 | 
			
		||||
 | 
			
		||||
double getTimeStamp(void)
 | 
			
		||||
{
 | 
			
		||||
    struct timespec ts;
 | 
			
		||||
    clock_gettime(CLOCK_MONOTONIC, &ts);
 | 
			
		||||
    return (double)ts.tv_sec + (double)ts.tv_nsec * 1.e-9;
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
double getTimeResolution(void)
 | 
			
		||||
{
 | 
			
		||||
    struct timespec ts;
 | 
			
		||||
    clock_getres(CLOCK_MONOTONIC, &ts);
 | 
			
		||||
    return (double)ts.tv_sec + (double)ts.tv_nsec * 1.e-9;
 | 
			
		||||
}
 | 
			
		||||
@@ -1,13 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __TIMING_H_
 | 
			
		||||
#define __TIMING_H_
 | 
			
		||||
 | 
			
		||||
extern double getTimeStamp(void);
 | 
			
		||||
extern double getTimeResolution(void);
 | 
			
		||||
 | 
			
		||||
#endif // __TIMING_H_
 | 
			
		||||
@@ -1,22 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __UTIL_H_
 | 
			
		||||
#define __UTIL_H_
 | 
			
		||||
#define HLINE                                                                            \
 | 
			
		||||
    "----------------------------------------------------------------------------\n"
 | 
			
		||||
 | 
			
		||||
#ifndef MIN
 | 
			
		||||
#define MIN(x, y) ((x) < (y) ? (x) : (y))
 | 
			
		||||
#endif
 | 
			
		||||
#ifndef MAX
 | 
			
		||||
#define MAX(x, y) ((x) > (y) ? (x) : (y))
 | 
			
		||||
#endif
 | 
			
		||||
#ifndef ABS
 | 
			
		||||
#define ABS(a) ((a) >= 0 ? (a) : -(a))
 | 
			
		||||
#endif
 | 
			
		||||
 | 
			
		||||
#endif // __UTIL_H_
 | 
			
		||||
@@ -1,29 +0,0 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#ifndef __VTKWRITER_H_
 | 
			
		||||
#define __VTKWRITER_H_
 | 
			
		||||
#include <mpi.h>
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
 | 
			
		||||
#include "comm.h"
 | 
			
		||||
#include "grid.h"
 | 
			
		||||
 | 
			
		||||
typedef struct VtkOptions {
 | 
			
		||||
    Grid grid;
 | 
			
		||||
    MPI_File fh;
 | 
			
		||||
    Comm comm;
 | 
			
		||||
} VtkOptions;
 | 
			
		||||
 | 
			
		||||
typedef struct VtkVector {
 | 
			
		||||
    double *u, *v, *w;
 | 
			
		||||
} VtkVector;
 | 
			
		||||
 | 
			
		||||
extern void vtkOpen(VtkOptions* opts, char* filename);
 | 
			
		||||
extern void vtkVector(VtkOptions* opts, char* name, VtkVector vec);
 | 
			
		||||
extern void vtkScalar(VtkOptions* opts, char* name, double* p);
 | 
			
		||||
extern void vtkClose(VtkOptions* opts);
 | 
			
		||||
#endif // __VTKWRITER_H_
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
#=======================================================================================
 | 
			
		||||
# Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
# Copyright (C) NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
# All rights reserved.
 | 
			
		||||
# Use of this source code is governed by a MIT-style
 | 
			
		||||
# license that can be found in the LICENSE file.
 | 
			
		||||
@@ -18,13 +18,18 @@ include $(MAKE_DIR)/include_$(TAG).mk
 | 
			
		||||
INCLUDES  += -I$(SRC_DIR) -I$(BUILD_DIR)
 | 
			
		||||
 | 
			
		||||
VPATH     = $(SRC_DIR)
 | 
			
		||||
SRC       = $(wildcard $(SRC_DIR)/*.c)
 | 
			
		||||
SRC       = $(filter-out $(wildcard $(SRC_DIR)/*-*.c),$(wildcard $(SRC_DIR)/*.c))
 | 
			
		||||
ASM       = $(patsubst $(SRC_DIR)/%.c, $(BUILD_DIR)/%.s, $(SRC))
 | 
			
		||||
OBJ       = $(patsubst $(SRC_DIR)/%.c, $(BUILD_DIR)/%.o, $(SRC))
 | 
			
		||||
OBJ      += $(BUILD_DIR)/vtkWriter-$(VTK_OUTPUT_FMT).o
 | 
			
		||||
SOURCES   = $(SRC) $(wildcard $(SRC_DIR)/*.h)
 | 
			
		||||
ifeq ($(VTK_OUTPUT_FMT),mpi)
 | 
			
		||||
DEFINES  += -D_VTK_WRITER_MPI
 | 
			
		||||
endif
 | 
			
		||||
 | 
			
		||||
CPPFLAGS := $(CPPFLAGS) $(DEFINES) $(OPTIONS) $(INCLUDES)
 | 
			
		||||
 | 
			
		||||
${TARGET}: $(BUILD_DIR) $(OBJ)
 | 
			
		||||
${TARGET}: sanity-checks $(BUILD_DIR) $(OBJ)
 | 
			
		||||
	$(info ===>  LINKING  $(TARGET))
 | 
			
		||||
	$(Q)${LINKER} ${LFLAGS} -o $(TARGET) $(OBJ) $(LIBS)
 | 
			
		||||
 | 
			
		||||
@@ -65,6 +70,14 @@ format:
 | 
			
		||||
	done
 | 
			
		||||
	@echo "Done"
 | 
			
		||||
 | 
			
		||||
sanity-checks:
 | 
			
		||||
ifeq ($(VTK_OUTPUT_FMT),mpi)
 | 
			
		||||
ifeq ($(ENABLE_MPI),false)
 | 
			
		||||
	$(error VTK_OUTPUT_FMT mpi only supported for ENABLE_MPI true!)
 | 
			
		||||
endif
 | 
			
		||||
endif
 | 
			
		||||
 | 
			
		||||
 | 
			
		||||
$(BUILD_DIR):
 | 
			
		||||
	@mkdir $(BUILD_DIR)
 | 
			
		||||
 | 
			
		||||
 
 | 
			
		||||
@@ -2,6 +2,8 @@
 | 
			
		||||
TAG ?= CLANG
 | 
			
		||||
ENABLE_MPI ?= true
 | 
			
		||||
ENABLE_OPENMP ?= false
 | 
			
		||||
# Supported: seq, mpi
 | 
			
		||||
VTK_OUTPUT_FMT ?= seq
 | 
			
		||||
 | 
			
		||||
#Feature options
 | 
			
		||||
OPTIONS +=  -DARRAY_ALIGNMENT=64
 | 
			
		||||
 
 | 
			
		||||
@@ -2,7 +2,7 @@ ifeq ($(ENABLE_MPI),true)
 | 
			
		||||
CC   = mpicc
 | 
			
		||||
DEFINES  = -D_MPI
 | 
			
		||||
else
 | 
			
		||||
CC = cc
 | 
			
		||||
CC   = cc
 | 
			
		||||
endif
 | 
			
		||||
 | 
			
		||||
GCC  = cc
 | 
			
		||||
@@ -18,4 +18,4 @@ VERSION  = --version
 | 
			
		||||
CFLAGS   = -Ofast -std=c17
 | 
			
		||||
LFLAGS   = $(OPENMP) -lm
 | 
			
		||||
DEFINES  += -D_GNU_SOURCE# -DDEBUG
 | 
			
		||||
INCLUDES =
 | 
			
		||||
INCLUDES = -I/opt/homebrew/include
 | 
			
		||||
 
 | 
			
		||||
@@ -1,4 +1,10 @@
 | 
			
		||||
ifeq ($(ENABLE_MPI),true)
 | 
			
		||||
CC   = mpicc
 | 
			
		||||
DEFINES  = -D_MPI
 | 
			
		||||
else
 | 
			
		||||
CC   = gcc
 | 
			
		||||
endif
 | 
			
		||||
 | 
			
		||||
GCC  = gcc
 | 
			
		||||
LINKER = $(CC)
 | 
			
		||||
 | 
			
		||||
@@ -9,6 +15,6 @@ endif
 | 
			
		||||
VERSION  = --version
 | 
			
		||||
CFLAGS   = -Ofast -ffreestanding -std=c99 $(OPENMP)
 | 
			
		||||
LFLAGS   = $(OPENMP)
 | 
			
		||||
DEFINES  = -D_GNU_SOURCE
 | 
			
		||||
DEFINES  += -D_GNU_SOURCE
 | 
			
		||||
INCLUDES =
 | 
			
		||||
LIBS     =
 | 
			
		||||
 
 | 
			
		||||
@@ -1,4 +1,10 @@
 | 
			
		||||
ifeq ($(ENABLE_MPI),true)
 | 
			
		||||
CC   = mpiicc
 | 
			
		||||
DEFINES  = -D_MPI
 | 
			
		||||
else
 | 
			
		||||
CC   = icc
 | 
			
		||||
endif
 | 
			
		||||
 | 
			
		||||
GCC  = gcc
 | 
			
		||||
LINKER = $(CC)
 | 
			
		||||
 | 
			
		||||
@@ -9,6 +15,6 @@ endif
 | 
			
		||||
VERSION  = --version
 | 
			
		||||
CFLAGS   =  -O3 -xHost -qopt-zmm-usage=high -std=c99 $(OPENMP)
 | 
			
		||||
LFLAGS   = $(OPENMP)
 | 
			
		||||
DEFINES  = -D_GNU_SOURCE
 | 
			
		||||
DEFINES  += -D_GNU_SOURCE
 | 
			
		||||
INCLUDES =
 | 
			
		||||
LIBS     =
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
@@ -296,6 +296,30 @@ void commShift(Comm* c, double* f, double* g, double* h)
 | 
			
		||||
#endif
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void commGetOffsets(Comm* c, int offsets[], int kmax, int jmax, int imax)
 | 
			
		||||
{
 | 
			
		||||
#if defined(_MPI)
 | 
			
		||||
    int sum = 0;
 | 
			
		||||
 | 
			
		||||
    for (int i = 0; i < c->coords[ICORD]; i++) {
 | 
			
		||||
        sum += sizeOfRank(i, c->dims[ICORD], imax);
 | 
			
		||||
    }
 | 
			
		||||
    offsets[IDIM] = sum;
 | 
			
		||||
    sum           = 0;
 | 
			
		||||
 | 
			
		||||
    for (int i = 0; i < c->coords[JCORD]; i++) {
 | 
			
		||||
        sum += sizeOfRank(i, c->dims[JCORD], jmax);
 | 
			
		||||
    }
 | 
			
		||||
    offsets[JDIM] = sum;
 | 
			
		||||
    sum           = 0;
 | 
			
		||||
 | 
			
		||||
    for (int i = 0; i < c->coords[KCORD]; i++) {
 | 
			
		||||
        sum += sizeOfRank(i, c->dims[KCORD], kmax);
 | 
			
		||||
    }
 | 
			
		||||
    offsets[KDIM] = sum;
 | 
			
		||||
#endif
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
#define G(v, i, j, k)                                                                    \
 | 
			
		||||
    v[(k) * (imaxLocal + 2) * (jmaxLocal + 2) + (j) * (imaxLocal + 2) + (i)]
 | 
			
		||||
 | 
			
		||||
@@ -445,7 +469,7 @@ void commCollectResult(Comm* c,
 | 
			
		||||
    for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
        for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                pg[idx++] = G(s->p, i, j, k);
 | 
			
		||||
                pg[idx++] = G(p, i, j, k);
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
@@ -455,7 +479,7 @@ void commCollectResult(Comm* c,
 | 
			
		||||
    for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
        for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                ug[idx++] = (G(s->u, i, j, k) + G(s->u, i - 1, j, k)) / 2.0;
 | 
			
		||||
                ug[idx++] = (G(u, i, j, k) + G(u, i - 1, j, k)) / 2.0;
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
@@ -465,7 +489,7 @@ void commCollectResult(Comm* c,
 | 
			
		||||
    for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
        for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                vg[idx++] = (G(s->v, i, j, k) + G(s->v, i, j - 1, k)) / 2.0;
 | 
			
		||||
                vg[idx++] = (G(v, i, j, k) + G(v, i, j - 1, k)) / 2.0;
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
@@ -475,7 +499,7 @@ void commCollectResult(Comm* c,
 | 
			
		||||
    for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
        for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                wg[idx++] = (G(s->w, i, j, k) + G(s->w, i, j, k - 1)) / 2.0;
 | 
			
		||||
                wg[idx++] = (G(w, i, j, k) + G(w, i, j, k - 1)) / 2.0;
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
@@ -524,8 +548,8 @@ void commInit(Comm* c, int argc, char** argv)
 | 
			
		||||
    MPI_Comm_rank(MPI_COMM_WORLD, &(c->rank));
 | 
			
		||||
    MPI_Comm_size(MPI_COMM_WORLD, &(c->size));
 | 
			
		||||
#else
 | 
			
		||||
    c->rank      = 0;
 | 
			
		||||
    c->size      = 1;
 | 
			
		||||
    c->rank = 0;
 | 
			
		||||
    c->size = 1;
 | 
			
		||||
#endif
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2024 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
@@ -44,6 +44,7 @@ extern void commExchange(Comm*, double*);
 | 
			
		||||
extern void commShift(Comm* c, double* f, double* g, double* h);
 | 
			
		||||
extern void commReduction(double* v, int op);
 | 
			
		||||
extern int commIsBoundary(Comm* c, Direction direction);
 | 
			
		||||
extern void commGetOffsets(Comm* c, int offsets[], int kmax, int jmax, int imax);
 | 
			
		||||
extern void commCollectResult(Comm* c,
 | 
			
		||||
    double* ug,
 | 
			
		||||
    double* vg,
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 
 | 
			
		||||
@@ -1,11 +1,9 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2024 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 */
 | 
			
		||||
#include <float.h>
 | 
			
		||||
#include <limits.h>
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
#include <stdlib.h>
 | 
			
		||||
#include <unistd.h>
 | 
			
		||||
@@ -73,6 +71,13 @@ int main(int argc, char** argv)
 | 
			
		||||
        printf("Solution took %.2fs\n", timeStop - timeStart);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
#ifdef _VTK_WRITER_MPI
 | 
			
		||||
    VtkOptions opts = { .grid = s.grid, .comm = s.comm };
 | 
			
		||||
    vtkOpen(&opts, s.problem);
 | 
			
		||||
    vtkScalar(&opts, "pressure", s.p);
 | 
			
		||||
    vtkVector(&opts, "velocity", (VtkVector) { s.u, s.v, s.w });
 | 
			
		||||
    vtkClose(&opts);
 | 
			
		||||
#else
 | 
			
		||||
    double *pg, *ug, *vg, *wg;
 | 
			
		||||
 | 
			
		||||
    if (commIsMaster(&s.comm)) {
 | 
			
		||||
@@ -104,6 +109,7 @@ int main(int argc, char** argv)
 | 
			
		||||
        vtkVector(&opts, "velocity", (VtkVector) { ug, vg, wg });
 | 
			
		||||
        vtkClose(&opts);
 | 
			
		||||
    }
 | 
			
		||||
#endif
 | 
			
		||||
 | 
			
		||||
    commFinalize(&s.comm);
 | 
			
		||||
    return EXIT_SUCCESS;
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
@@ -207,24 +207,24 @@ void solve(Solver* s)
 | 
			
		||||
            jsw = ksw;
 | 
			
		||||
            commExchange(&s->comm, p);
 | 
			
		||||
 | 
			
		||||
            for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
        for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
                isw = jsw;
 | 
			
		||||
                for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
            for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
                    for (int i = isw; i < imaxLocal + 1; i += 2) {
 | 
			
		||||
 | 
			
		||||
                        double r =
 | 
			
		||||
                            RHS(i, j, k) -
 | 
			
		||||
                            ((P(i + 1, j, k) - 2.0 * P(i, j, k) + P(i - 1, j, k)) * idx2 +
 | 
			
		||||
                                (P(i, j + 1, k) - 2.0 * P(i, j, k) + P(i, j - 1, k)) *
 | 
			
		||||
                                    idy2 +
 | 
			
		||||
                                (P(i, j, k + 1) - 2.0 * P(i, j, k) + P(i, j, k - 1)) *
 | 
			
		||||
                                    idz2);
 | 
			
		||||
                                   (P(i, j + 1, k) - 2.0 * P(i, j, k) + P(i, j - 1, k)) *
 | 
			
		||||
                                       idy2 +
 | 
			
		||||
                                   (P(i, j, k + 1) - 2.0 * P(i, j, k) + P(i, j, k - 1)) *
 | 
			
		||||
                                       idz2);
 | 
			
		||||
 | 
			
		||||
                        P(i, j, k) -= (factor * r);
 | 
			
		||||
                        res += (r * r);
 | 
			
		||||
                    }
 | 
			
		||||
                    isw = 3 - isw;
 | 
			
		||||
                    P(i, j, k) -= (factor * r);
 | 
			
		||||
                    res += (r * r);
 | 
			
		||||
                }
 | 
			
		||||
                    isw = 3 - isw;
 | 
			
		||||
            }
 | 
			
		||||
                jsw = 3 - jsw;
 | 
			
		||||
            }
 | 
			
		||||
            ksw = 3 - ksw;
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
@@ -26,10 +26,21 @@ void testInit(Solver* s)
 | 
			
		||||
    for (int k = 0; k < kmaxLocal + 2; k++) {
 | 
			
		||||
        for (int j = 0; j < jmaxLocal + 2; j++) {
 | 
			
		||||
            for (int i = 0; i < imaxLocal + 2; i++) {
 | 
			
		||||
                G(p, i, j, k) = myrank;
 | 
			
		||||
                G(f, i, j, k) = myrank;
 | 
			
		||||
                G(g, i, j, k) = myrank;
 | 
			
		||||
                G(h, i, j, k) = myrank;
 | 
			
		||||
                G(p, i, j, k) = 10.0;
 | 
			
		||||
                G(f, i, j, k) = myrank + 1.0;
 | 
			
		||||
                G(g, i, j, k) = myrank + 1.0;
 | 
			
		||||
                G(h, i, j, k) = myrank + 1.0;
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    for (int k = 1; k < kmaxLocal + 1; k++) {
 | 
			
		||||
        for (int j = 1; j < jmaxLocal + 1; j++) {
 | 
			
		||||
            for (int i = 1; i < imaxLocal + 1; i++) {
 | 
			
		||||
                G(p, i, j, k) = myrank + 1.0;
 | 
			
		||||
                G(f, i, j, k) = myrank + 1.0;
 | 
			
		||||
                G(g, i, j, k) = myrank + 1.0;
 | 
			
		||||
                G(h, i, j, k) = myrank + 1.0;
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved.
 | 
			
		||||
 * Use of this source code is governed by a MIT-style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
 
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C) NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
@@ -14,24 +14,32 @@
 | 
			
		||||
#include "comm.h"
 | 
			
		||||
#include "vtkWriter.h"
 | 
			
		||||
 | 
			
		||||
// reset fileview for output of string headers
 | 
			
		||||
static void resetFileview(VtkOptions* o)
 | 
			
		||||
{
 | 
			
		||||
    // reset fileview for output of string header
 | 
			
		||||
    MPI_Offset disp;
 | 
			
		||||
    MPI_File_sync(o->fh);
 | 
			
		||||
    MPI_Barrier(o->comm.comm);
 | 
			
		||||
    MPI_File_get_size(o->fh, &disp);
 | 
			
		||||
    MPI_File_set_view(o->fh, disp, MPI_CHAR, MPI_CHAR, "native", MPI_INFO_NULL);
 | 
			
		||||
    // printf("Rank %d disp %lld\n", o->comm.rank, disp);
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
static void writeVersion(VtkOptions* o)
 | 
			
		||||
{
 | 
			
		||||
    char header[50] = "# vtk DataFile Version 3.0\n";
 | 
			
		||||
    // always overwrite exiting files
 | 
			
		||||
    MPI_File_set_view(o->fh, 0, MPI_CHAR, MPI_CHAR, "native", MPI_INFO_NULL);
 | 
			
		||||
 | 
			
		||||
    if (commIsMaster(&o->comm)) {
 | 
			
		||||
        MPI_File_write(o->fh, header, (int)strlen(header), MPI_CHAR, MPI_STATUS_IGNORE);
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
static void writeHeader(VtkOptions* o)
 | 
			
		||||
{
 | 
			
		||||
    const size_t MAX_HEADER = 200;
 | 
			
		||||
 | 
			
		||||
    char* header = (char*)malloc(MAX_HEADER);
 | 
			
		||||
    char header[400];
 | 
			
		||||
    char* cursor = header;
 | 
			
		||||
 | 
			
		||||
    cursor += sprintf(cursor, "# vtk DataFile Version 3.0\n");
 | 
			
		||||
    cursor += sprintf(cursor, "PAMPI cfd solver output\n");
 | 
			
		||||
    cursor += sprintf(cursor, "BINARY\n");
 | 
			
		||||
 | 
			
		||||
@@ -52,13 +60,10 @@ static void writeHeader(VtkOptions* o)
 | 
			
		||||
        o->grid.imax * o->grid.jmax * o->grid.kmax);
 | 
			
		||||
 | 
			
		||||
    if (commIsMaster(&o->comm)) {
 | 
			
		||||
        MPI_File_write(o->fh, header, strlen(header), MPI_CHAR, MPI_STATUS_IGNORE);
 | 
			
		||||
        MPI_File_write(o->fh, header, (int)strlen(header), MPI_CHAR, MPI_STATUS_IGNORE);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    free(header);
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
// TODO Check inputs for length
 | 
			
		||||
void vtkOpen(VtkOptions* o, char* problem)
 | 
			
		||||
{
 | 
			
		||||
    char filename[50];
 | 
			
		||||
@@ -66,7 +71,7 @@ void vtkOpen(VtkOptions* o, char* problem)
 | 
			
		||||
    snprintf(filename, 50, "%s-p%d.vtk", problem, o->comm.size);
 | 
			
		||||
    MPI_File_open(o->comm.comm,
 | 
			
		||||
        filename,
 | 
			
		||||
        MPI_MODE_WRONLY | MPI_MODE_CREATE | MPI_MODE_EXCL,
 | 
			
		||||
        MPI_MODE_WRONLY | MPI_MODE_CREATE,
 | 
			
		||||
        MPI_INFO_NULL,
 | 
			
		||||
        &o->fh);
 | 
			
		||||
 | 
			
		||||
@@ -74,35 +79,32 @@ void vtkOpen(VtkOptions* o, char* problem)
 | 
			
		||||
        printf("Writing VTK output for %s\n", problem);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    resetFileview(o);
 | 
			
		||||
    writeVersion(o);
 | 
			
		||||
    writeHeader(o);
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
void vtkScalar(VtkOptions* o, char* name, double* s)
 | 
			
		||||
{
 | 
			
		||||
    resetFileview(o);
 | 
			
		||||
 | 
			
		||||
    if (commIsMaster(&o->comm)) printf("Register scalar %s\n", name);
 | 
			
		||||
    const size_t MAX_HEADER = 100;
 | 
			
		||||
 | 
			
		||||
    char* header = (char*)malloc(MAX_HEADER);
 | 
			
		||||
    char header[100];
 | 
			
		||||
    char* cursor = header;
 | 
			
		||||
 | 
			
		||||
    cursor += sprintf(cursor, "SCALARS %s double 1\n", name);
 | 
			
		||||
    cursor += sprintf(cursor, "LOOKUP_TABLE default\n");
 | 
			
		||||
 | 
			
		||||
    if (commIsMaster(&o->comm)) {
 | 
			
		||||
        MPI_File_write(o->fh, header, strlen(header), MPI_CHAR, MPI_STATUS_IGNORE);
 | 
			
		||||
        MPI_File_write(o->fh, header, (int)strlen(header), MPI_CHAR, MPI_STATUS_IGNORE);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    free(header);
 | 
			
		||||
 | 
			
		||||
    int offsets[NDIMS];
 | 
			
		||||
    commGetOffsets(&o->comm, offsets, o->grid.imax, o->grid.jmax, o->grid.kmax);
 | 
			
		||||
    commGetOffsets(&o->comm, offsets, o->grid.kmax, o->grid.jmax, o->grid.imax);
 | 
			
		||||
 | 
			
		||||
    // set global view in file
 | 
			
		||||
    MPI_Offset disp;
 | 
			
		||||
    MPI_Datatype fileViewType;
 | 
			
		||||
    MPI_File_sync(o->fh);
 | 
			
		||||
    MPI_Barrier(o->comm.comm);
 | 
			
		||||
    MPI_File_get_size(o->fh, &disp);
 | 
			
		||||
 | 
			
		||||
@@ -172,15 +174,16 @@ void vtkVector(VtkOptions* o, char* name, VtkVector vec)
 | 
			
		||||
 | 
			
		||||
    resetFileview(o);
 | 
			
		||||
    if (commIsMaster(&o->comm)) {
 | 
			
		||||
        MPI_File_write(o->fh, header, strlen(header), MPI_CHAR, MPI_STATUS_IGNORE);
 | 
			
		||||
        MPI_File_write(o->fh, header, (int)strlen(header), MPI_CHAR, MPI_STATUS_IGNORE);
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    int offsets[NDIMS];
 | 
			
		||||
    commGetOffsets(&o->comm, offsets, o->grid.imax, o->grid.jmax, o->grid.kmax);
 | 
			
		||||
    commGetOffsets(&o->comm, offsets, o->grid.kmax, o->grid.jmax, o->grid.imax);
 | 
			
		||||
 | 
			
		||||
    // set global view in file
 | 
			
		||||
    MPI_Offset disp;
 | 
			
		||||
    MPI_Datatype fileViewType, vectorType;
 | 
			
		||||
    MPI_File_sync(o->fh);
 | 
			
		||||
    MPI_Barrier(o->comm.comm);
 | 
			
		||||
    MPI_File_get_size(o->fh, &disp);
 | 
			
		||||
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C)  NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
@@ -1,5 +1,5 @@
 | 
			
		||||
/*
 | 
			
		||||
 * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * Copyright (C) NHR@FAU, University Erlangen-Nuremberg.
 | 
			
		||||
 * All rights reserved. This file is part of nusif-solver.
 | 
			
		||||
 * Use of this source code is governed by a MIT style
 | 
			
		||||
 * license that can be found in the LICENSE file.
 | 
			
		||||
@@ -8,14 +8,20 @@
 | 
			
		||||
#define __VTKWRITER_H_
 | 
			
		||||
#include <stdio.h>
 | 
			
		||||
 | 
			
		||||
#include "comm.h"
 | 
			
		||||
#include "grid.h"
 | 
			
		||||
 | 
			
		||||
typedef enum VtkFormat { ASCII = 0, BINARY } VtkFormat;
 | 
			
		||||
 | 
			
		||||
typedef struct VtkOptions {
 | 
			
		||||
    VtkFormat fmt;
 | 
			
		||||
    Grid grid;
 | 
			
		||||
#ifdef _VTK_WRITER_MPI
 | 
			
		||||
    MPI_File fh;
 | 
			
		||||
#else
 | 
			
		||||
    FILE* fh;
 | 
			
		||||
    VtkFormat fmt;
 | 
			
		||||
#endif // _VTK_WRITER_MPI
 | 
			
		||||
    Comm comm;
 | 
			
		||||
} VtkOptions;
 | 
			
		||||
 | 
			
		||||
typedef struct VtkVector {
 | 
			
		||||
 
 | 
			
		||||
		Reference in New Issue
	
	Block a user