/* ---------------------------------------------------------------------- LAMMPS - Large-scale Atomic/Molecular Massively Parallel Simulator https://www.lammps.org/, Sandia National Laboratories LAMMPS development team: developers@lammps.org Copyright (2003) Sandia Corporation. Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation, the U.S. Government retains certain rights in this software. This software is distributed under the GNU General Public License. See the README file in the top-level LAMMPS directory. ------------------------------------------------------------------------- */ /* ---------------------------------------------------------------------- Contributing author: Paul Coffman (IBM) ------------------------------------------------------------------------- */ #include "dump_atom_mpiio.h" #include "domain.h" #include "error.h" #include "memory.h" #include "update.h" #include #include #include "omp_compat.h" #if defined(_OPENMP) #include #endif using namespace LAMMPS_NS; #define MAX_TEXT_HEADER_SIZE 4096 #define DUMP_BUF_CHUNK_SIZE 16384 #define DUMP_BUF_INCREMENT_SIZE 4096 /* ---------------------------------------------------------------------- */ DumpAtomMPIIO::DumpAtomMPIIO(LAMMPS *lmp, int narg, char **arg) : DumpAtom(lmp, narg, arg) { if (me == 0) error->warning(FLERR, "MPI-IO output is unmaintained and unreliable. Use with caution."); } /* ---------------------------------------------------------------------- */ DumpAtomMPIIO::~DumpAtomMPIIO() { if (multifile == 0) MPI_File_close(&mpifh); } /* ---------------------------------------------------------------------- */ void DumpAtomMPIIO::openfile() { if (singlefile_opened) { // single file already opened, so just return after resetting filesize mpifo = currentFileSize; MPI_File_set_size(mpifh, mpifo + headerSize + sumFileSize); currentFileSize = mpifo + headerSize + sumFileSize; return; } if (multifile == 0) singlefile_opened = 1; // if one file per timestep, replace '*' with current timestep filecurrent = filename; if (multifile) { filecurrent = utils::strdup(utils::star_subst(filecurrent, update->ntimestep, padflag)); if (maxfiles > 0) { if (numfiles < maxfiles) { nameslist[numfiles] = utils::strdup(filecurrent); ++numfiles; } else { remove(nameslist[fileidx]); delete[] nameslist[fileidx]; nameslist[fileidx] = utils::strdup(filecurrent); fileidx = (fileidx + 1) % maxfiles; } } } if (append_flag) { // append open int err = MPI_File_open(world, filecurrent, MPI_MODE_CREATE | MPI_MODE_APPEND | MPI_MODE_WRONLY, MPI_INFO_NULL, &mpifh); if (err != MPI_SUCCESS) error->one(FLERR, "Cannot open dump file {}: {}", filecurrent, utils::getsyserror()); int myrank; MPI_Comm_rank(world, &myrank); if (myrank == 0) MPI_File_get_size(mpifh, &mpifo); MPI_Bcast(&mpifo, 1, MPI_LMP_BIGINT, 0, world); MPI_File_set_size(mpifh, mpifo + headerSize + sumFileSize); currentFileSize = mpifo + headerSize + sumFileSize; } else { // replace open int err = MPI_File_open(world, filecurrent, MPI_MODE_CREATE | MPI_MODE_WRONLY, MPI_INFO_NULL, &mpifh); if (err != MPI_SUCCESS) error->one(FLERR, "Cannot open dump file {}: {}", filecurrent, utils::getsyserror()); mpifo = 0; MPI_File_set_size(mpifh, (MPI_Offset) (headerSize + sumFileSize)); currentFileSize = (headerSize + sumFileSize); } } /* ---------------------------------------------------------------------- */ void DumpAtomMPIIO::write() { if (domain->triclinic == 0) { boxxlo = domain->boxlo[0]; boxxhi = domain->boxhi[0]; boxylo = domain->boxlo[1]; boxyhi = domain->boxhi[1]; boxzlo = domain->boxlo[2]; boxzhi = domain->boxhi[2]; } else { boxxlo = domain->boxlo_bound[0]; boxxhi = domain->boxhi_bound[0]; boxylo = domain->boxlo_bound[1]; boxyhi = domain->boxhi_bound[1]; boxzlo = domain->boxlo_bound[2]; boxzhi = domain->boxhi_bound[2]; boxxy = domain->xy; boxxz = domain->xz; boxyz = domain->yz; } // nme = # of dump lines this proc contributes to dump nme = count(); // ntotal = total # of dump lines in snapshot // nmax = max # of dump lines on any proc bigint bnme = nme; MPI_Allreduce(&bnme, &ntotal, 1, MPI_LMP_BIGINT, MPI_SUM, world); int nmax; MPI_Allreduce(&nme, &nmax, 1, MPI_INT, MPI_MAX, world); // write timestep header // for multiproc, // nheader = # of lines in this file via Allreduce on clustercomm bigint nheader = ntotal; // ensure filewriter proc can receive everyone's info // limit nmax*size_one to int since used as arg in MPI_Rsend() below // pack my data into buf // if sorting on IDs also request ID list from pack() // sort buf as needed if (nmax > maxbuf) { if ((bigint) nmax * size_one > MAXSMALLINT) error->all(FLERR, "Too much per-proc info for dump"); maxbuf = nmax; memory->destroy(buf); memory->create(buf, (maxbuf * size_one), "dump:buf"); } if (sort_flag && sortcol == 0 && nmax > maxids) { maxids = nmax; memory->destroy(ids); memory->create(ids, maxids, "dump:ids"); } if (sort_flag && sortcol == 0) pack(ids); else pack(nullptr); if (sort_flag) sort(); // determine how much data needs to be written for setting the file size and prepocess it prior to writing performEstimate = 1; write_header(nheader); write_data(nme, buf); MPI_Bcast(&sumFileSize, 1, MPI_LMP_BIGINT, (nprocs - 1), world); openfile(); performEstimate = 0; write_header(nheader); // mpifo now points to end of header info // now actually write the data performEstimate = 0; write_data(nme, buf); if (multifile) MPI_File_close(&mpifh); if (multifile) delete[] filecurrent; } /* ---------------------------------------------------------------------- */ void DumpAtomMPIIO::init_style() { if (image_flag == 0) size_one = 5; else size_one = 8; // format = copy of default or user-specified line format // default depends on image flags delete[] format; if (format_line_user) { format = utils::strdup(std::string(format_line_user) + "\n"); } else { if (image_flag == 0) format = utils::strdup(TAGINT_FORMAT " %d %g %g %g\n"); else format = utils::strdup(TAGINT_FORMAT " %d %g %g %g %d %d %d\n"); } // setup boundary string domain->boundary_string(boundstr); // setup column string std::string default_columns; if (scale_flag == 0 && image_flag == 0) default_columns = "id type x y z"; else if (scale_flag == 0 && image_flag == 1) default_columns = "id type x y z ix iy iz"; else if (scale_flag == 1 && image_flag == 0) default_columns = "id type xs ys zs"; else if (scale_flag == 1 && image_flag == 1) default_columns = "id type xs ys zs ix iy iz"; int icol = 0; columns.clear(); for (const auto &item : utils::split_words(default_columns)) { if (columns.size()) columns += " "; if (keyword_user[icol].size()) columns += keyword_user[icol]; else columns += item; ++icol; } // setup function ptrs if (binary && domain->triclinic == 0) header_choice = &DumpAtomMPIIO::header_binary; else if (binary && domain->triclinic == 1) header_choice = &DumpAtomMPIIO::header_binary_triclinic; else if (!binary && domain->triclinic == 0) header_choice = &DumpAtomMPIIO::header_item; else if (!binary && domain->triclinic == 1) header_choice = &DumpAtomMPIIO::header_item_triclinic; if (scale_flag == 1 && image_flag == 0 && domain->triclinic == 0) pack_choice = &DumpAtomMPIIO::pack_scale_noimage; else if (scale_flag == 1 && image_flag == 1 && domain->triclinic == 0) pack_choice = &DumpAtomMPIIO::pack_scale_image; else if (scale_flag == 1 && image_flag == 0 && domain->triclinic == 1) pack_choice = &DumpAtomMPIIO::pack_scale_noimage_triclinic; else if (scale_flag == 1 && image_flag == 1 && domain->triclinic == 1) pack_choice = &DumpAtomMPIIO::pack_scale_image_triclinic; else if (scale_flag == 0 && image_flag == 0) pack_choice = &DumpAtomMPIIO::pack_noscale_noimage; else if (scale_flag == 0 && image_flag == 1) pack_choice = &DumpAtomMPIIO::pack_noscale_image; if (binary) write_choice = &DumpAtomMPIIO::write_binary; else if (buffer_flag == 1) write_choice = &DumpAtomMPIIO::write_string; else if (image_flag == 0) write_choice = &DumpAtomMPIIO::write_lines_noimage; else if (image_flag == 1) write_choice = &DumpAtomMPIIO::write_lines_image; } /* ---------------------------------------------------------------------- */ void DumpAtomMPIIO::write_header(bigint ndump) { (this->*header_choice)(ndump); } /* ---------------------------------------------------------------------- */ void DumpAtomMPIIO::header_binary(bigint ndump) { if (performEstimate) { headerBuffer = (char *) malloc((2 * sizeof(bigint)) + (9 * sizeof(int)) + (6 * sizeof(double))); headerSize = 0; memcpy(headerBuffer + headerSize, &update->ntimestep, sizeof(bigint)); headerSize += sizeof(bigint); memcpy(headerBuffer + headerSize, &ndump, sizeof(bigint)); headerSize += sizeof(bigint); memcpy(headerBuffer + headerSize, &domain->triclinic, sizeof(int)); headerSize += sizeof(int); memcpy(headerBuffer + headerSize, &domain->boundary[0][0], 6 * sizeof(int)); headerSize += 6 * sizeof(int); memcpy(headerBuffer + headerSize, &boxxlo, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &boxxhi, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &boxylo, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &boxyhi, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &boxzlo, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &boxzhi, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &size_one, sizeof(int)); headerSize += sizeof(int); memcpy(headerBuffer + headerSize, &nprocs, sizeof(int)); headerSize += sizeof(int); } else { // write data if (me == 0) MPI_File_write_at(mpifh, mpifo, headerBuffer, headerSize, MPI_BYTE, MPI_STATUS_IGNORE); mpifo += headerSize; free(headerBuffer); } } /* ---------------------------------------------------------------------- */ void DumpAtomMPIIO::header_binary_triclinic(bigint ndump) { if (performEstimate) { headerBuffer = (char *) malloc((2 * sizeof(bigint)) + (9 * sizeof(int)) + (9 * sizeof(double))); headerSize = 0; memcpy(headerBuffer + headerSize, &update->ntimestep, sizeof(bigint)); headerSize += sizeof(bigint); memcpy(headerBuffer + headerSize, &ndump, sizeof(bigint)); headerSize += sizeof(bigint); memcpy(headerBuffer + headerSize, &domain->triclinic, sizeof(int)); headerSize += sizeof(int); memcpy(headerBuffer + headerSize, &domain->boundary[0][0], 6 * sizeof(int)); headerSize += 6 * sizeof(int); memcpy(headerBuffer + headerSize, &boxxlo, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &boxxhi, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &boxylo, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &boxyhi, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &boxzlo, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &boxzhi, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &boxxy, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &boxxz, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &boxyz, sizeof(double)); headerSize += sizeof(double); memcpy(headerBuffer + headerSize, &size_one, sizeof(int)); headerSize += sizeof(int); memcpy(headerBuffer + headerSize, &nprocs, sizeof(int)); headerSize += sizeof(int); } else { // write data if (me == 0) MPI_File_write_at(mpifh, mpifo, headerBuffer, headerSize, MPI_BYTE, MPI_STATUS_IGNORE); mpifo += headerSize; free(headerBuffer); } } /* ---------------------------------------------------------------------- */ void DumpAtomMPIIO::header_item(bigint ndump) { if (performEstimate) { auto itemtxt = fmt::format("ITEM: TIMESTEP\n{}\n", update->ntimestep); itemtxt += fmt::format("ITEM: NUMBER OF ATOMS\n{}\n", ndump); itemtxt += fmt::format("ITEM: BOX BOUNDS {}\n", boundstr); itemtxt += fmt::format("{} {}\n{} {}\n{} {}\n", boxxlo, boxxhi, boxylo, boxyhi, boxzlo, boxzhi); itemtxt += fmt::format("ITEM: ATOMS {}\n", columns); headerSize = itemtxt.size(); headerBuffer = utils::strdup(itemtxt); } else { // write data if (me == 0) MPI_File_write_at(mpifh, mpifo, headerBuffer, headerSize, MPI_CHAR, MPI_STATUS_IGNORE); mpifo += headerSize; delete[] headerBuffer; } } /* ---------------------------------------------------------------------- */ void DumpAtomMPIIO::header_item_triclinic(bigint ndump) { if (performEstimate) { auto itemtxt = fmt::format("ITEM: TIMESTEP\n{}\n", update->ntimestep); itemtxt += fmt::format("ITEM: NUMBER OF ATOMS\n{}\n", ndump); itemtxt += fmt::format("ITEM: BOX BOUNDS xy xz yz {}\n", boundstr); itemtxt += fmt::format("{} {} {}\n{} {} {}\n{} {} {}\n", boxxlo, boxxhi, boxxy, boxylo, boxyhi, boxxz, boxzlo, boxzhi, boxyz); itemtxt += fmt::format("ITEM: ATOMS {}\n", columns); headerSize = itemtxt.size(); headerBuffer = utils::strdup(itemtxt); } else { // write data if (me == 0) MPI_File_write_at(mpifh, mpifo, headerBuffer, headerSize, MPI_CHAR, MPI_STATUS_IGNORE); mpifo += headerSize; delete[] headerBuffer; } } /* ---------------------------------------------------------------------- */ void DumpAtomMPIIO::write_data(int n, double *mybuf) { (this->*write_choice)(n, mybuf); } /* ---------------------------------------------------------------------- */ void DumpAtomMPIIO::write_binary(int n, double *mybuf) { n *= size_one; if (performEstimate) { bigint incPrefix = 0; bigint bigintNme = (bigint) nme; MPI_Scan(&bigintNme, &incPrefix, 1, MPI_LMP_BIGINT, MPI_SUM, world); sumFileSize = (incPrefix * size_one * sizeof(double)) + (nprocs * sizeof(int)); offsetFromHeader = ((incPrefix - bigintNme) * size_one * sizeof(double)) + (me * sizeof(int)); } else { int byteBufSize = (n * sizeof(double)) + sizeof(int); char *bufWithSize; memory->create(bufWithSize, byteBufSize, "dump:bufWithSize"); memcpy(bufWithSize, (char *) (&n), sizeof(int)); memcpy(&((char *) bufWithSize)[sizeof(int)], mybuf, (n * sizeof(double))); MPI_File_write_at_all(mpifh, mpifo + offsetFromHeader, bufWithSize, byteBufSize, MPI_BYTE, MPI_STATUS_IGNORE); memory->destroy(bufWithSize); if (flush_flag) MPI_File_sync(mpifh); } } /* ---------------------------------------------------------------------- */ void DumpAtomMPIIO::write_string(int n, double *mybuf) { if (performEstimate) { #if defined(_OPENMP) int nthreads = omp_get_max_threads(); if (nthreads > 1) nsme = convert_string_omp(n, mybuf); else { nsme = convert_string(n, mybuf); } #else nsme = convert_string(n, mybuf); #endif bigint incPrefix = 0; bigint bigintNsme = (bigint) nsme; MPI_Scan(&bigintNsme, &incPrefix, 1, MPI_LMP_BIGINT, MPI_SUM, world); sumFileSize = (incPrefix * sizeof(char)); offsetFromHeader = ((incPrefix - bigintNsme) * sizeof(char)); } else { MPI_File_write_at_all(mpifh, mpifo + offsetFromHeader, sbuf, nsme, MPI_CHAR, MPI_STATUS_IGNORE); if (flush_flag) MPI_File_sync(mpifh); } } /* ---------------------------------------------------------------------- */ int DumpAtomMPIIO::convert_string(int n, double *mybuf) { if (image_flag == 0) return convert_noimage(n, mybuf); else return convert_image(n, mybuf); } /* ---------------------------------------------------------------------- */ #if defined(_OPENMP) int DumpAtomMPIIO::convert_string_omp(int n, double *mybuf) { if (image_flag == 0) return convert_noimage_omp(n, mybuf); else return convert_image_omp(n, mybuf); } /* ---------------------------------------------------------------------- multithreaded version - convert mybuf of doubles to one big formatted string in sbuf return -1 if strlen exceeds an int, since used as arg in MPI calls in Dump ------------------------------------------------------------------------- */ int DumpAtomMPIIO::convert_image_omp(int n, double *mybuf) { char **mpifh_buffer_line_per_thread; int mpifhStringCount; int *mpifhStringCountPerThread, *bufOffset, *bufRange, *bufLength; mpifhStringCount = 0; int nthreads = omp_get_max_threads(); if (nthreads > n) { // call serial version convert_string(n, mybuf); } else { memory->create(mpifhStringCountPerThread, nthreads, "dump:mpifhStringCountPerThread"); mpifh_buffer_line_per_thread = (char **) malloc(nthreads * sizeof(char *)); memory->create(bufOffset, nthreads, "dump:bufOffset"); memory->create(bufRange, nthreads, "dump:bufRange"); memory->create(bufLength, nthreads, "dump:bufLength"); int i = 0; for (i = 0; i < (nthreads - 1); i++) { mpifhStringCountPerThread[i] = 0; bufOffset[i] = (int) (i * (int) (floor((double) n / (double) nthreads)) * size_one); bufRange[i] = (int) (floor((double) n / (double) nthreads)); bufLength[i] = DUMP_BUF_CHUNK_SIZE; mpifh_buffer_line_per_thread[i] = (char *) malloc(DUMP_BUF_CHUNK_SIZE * sizeof(char)); mpifh_buffer_line_per_thread[i][0] = '\0'; } mpifhStringCountPerThread[i] = 0; bufOffset[i] = (int) (i * (int) (floor((double) n / (double) nthreads)) * size_one); bufRange[i] = n - (i * (int) (floor((double) n / (double) nthreads))); bufLength[i] = DUMP_BUF_CHUNK_SIZE; mpifh_buffer_line_per_thread[i] = (char *) malloc(DUMP_BUF_CHUNK_SIZE * sizeof(char)); mpifh_buffer_line_per_thread[i][0] = '\0'; #pragma omp parallel LMP_DEFAULT_NONE LMP_SHARED(bufOffset, bufRange, bufLength, \ mpifhStringCountPerThread, \ mpifh_buffer_line_per_thread, mybuf) { int tid = omp_get_thread_num(); int m = 0; for (int i = 0; i < bufRange[tid]; i++) { if ((bufLength[tid] - mpifhStringCountPerThread[tid]) < DUMP_BUF_INCREMENT_SIZE) { mpifh_buffer_line_per_thread[tid] = (char *) realloc( mpifh_buffer_line_per_thread[tid], (mpifhStringCountPerThread[tid] + DUMP_BUF_CHUNK_SIZE) * sizeof(char)); bufLength[tid] = (mpifhStringCountPerThread[tid] + DUMP_BUF_CHUNK_SIZE) * sizeof(char); } mpifhStringCountPerThread[tid] += sprintf(&(mpifh_buffer_line_per_thread[tid][mpifhStringCountPerThread[tid]]), format, static_cast(mybuf[bufOffset[tid] + m]), static_cast(mybuf[bufOffset[tid] + m + 1]), mybuf[bufOffset[tid] + m + 2], mybuf[bufOffset[tid] + m + 3], mybuf[bufOffset[tid] + m + 4], static_cast(mybuf[bufOffset[tid] + m + 5]), static_cast(mybuf[bufOffset[tid] + m + 6]), static_cast(mybuf[bufOffset[tid] + m + 7])); m += size_one; } } #pragma omp barrier mpifhStringCount = 0; for (i = 0; i < nthreads; i++) { mpifhStringCount += mpifhStringCountPerThread[i]; } memory->destroy(bufOffset); memory->destroy(bufRange); memory->destroy(bufLength); if (mpifhStringCount > 0) { if (mpifhStringCount > maxsbuf) { if (mpifhStringCount > MAXSMALLINT) return -1; maxsbuf = mpifhStringCount + 1; memory->grow(sbuf, maxsbuf, "dump:sbuf"); } sbuf[0] = '\0'; } for (int i = 0; i < nthreads; i++) { strcat(sbuf, mpifh_buffer_line_per_thread[i]); free(mpifh_buffer_line_per_thread[i]); } memory->destroy(mpifhStringCountPerThread); free(mpifh_buffer_line_per_thread); } return mpifhStringCount; } /* ---------------------------------------------------------------------- multithreaded version - convert mybuf of doubles to one big formatted string in sbuf return -1 if strlen exceeds an int, since used as arg in MPI calls in Dump ------------------------------------------------------------------------- */ int DumpAtomMPIIO::convert_noimage_omp(int n, double *mybuf) { char **mpifh_buffer_line_per_thread; int mpifhStringCount; int *mpifhStringCountPerThread, *bufOffset, *bufRange, *bufLength; mpifhStringCount = 0; int nthreads = omp_get_max_threads(); if (nthreads > n) { // call serial version convert_string(n, mybuf); } else { memory->create(mpifhStringCountPerThread, nthreads, "dump:mpifhStringCountPerThread"); mpifh_buffer_line_per_thread = (char **) malloc(nthreads * sizeof(char *)); memory->create(bufOffset, nthreads, "dump:bufOffset"); memory->create(bufRange, nthreads, "dump:bufRange"); memory->create(bufLength, nthreads, "dump:bufLength"); int i = 0; for (i = 0; i < (nthreads - 1); i++) { mpifhStringCountPerThread[i] = 0; bufOffset[i] = (int) (i * (int) (floor((double) n / (double) nthreads)) * size_one); bufRange[i] = (int) (floor((double) n / (double) nthreads)); bufLength[i] = DUMP_BUF_CHUNK_SIZE; mpifh_buffer_line_per_thread[i] = (char *) malloc(DUMP_BUF_CHUNK_SIZE * sizeof(char)); mpifh_buffer_line_per_thread[i][0] = '\0'; } mpifhStringCountPerThread[i] = 0; bufOffset[i] = (int) (i * (int) (floor((double) n / (double) nthreads)) * size_one); bufRange[i] = n - (i * (int) (floor((double) n / (double) nthreads))); bufLength[i] = DUMP_BUF_CHUNK_SIZE; mpifh_buffer_line_per_thread[i] = (char *) malloc(DUMP_BUF_CHUNK_SIZE * sizeof(char)); mpifh_buffer_line_per_thread[i][0] = '\0'; #pragma omp parallel LMP_DEFAULT_NONE LMP_SHARED(bufOffset, bufRange, bufLength, \ mpifhStringCountPerThread, \ mpifh_buffer_line_per_thread, mybuf) { int tid = omp_get_thread_num(); int m = 0; for (int i = 0; i < bufRange[tid]; i++) { if ((bufLength[tid] - mpifhStringCountPerThread[tid]) < DUMP_BUF_INCREMENT_SIZE) { mpifh_buffer_line_per_thread[tid] = (char *) realloc( mpifh_buffer_line_per_thread[tid], (mpifhStringCountPerThread[tid] + DUMP_BUF_CHUNK_SIZE) * sizeof(char)); bufLength[tid] = (mpifhStringCountPerThread[tid] + DUMP_BUF_CHUNK_SIZE) * sizeof(char); } mpifhStringCountPerThread[tid] += sprintf(&(mpifh_buffer_line_per_thread[tid][mpifhStringCountPerThread[tid]]), format, static_cast(mybuf[bufOffset[tid] + m]), static_cast(mybuf[bufOffset[tid] + m + 1]), mybuf[bufOffset[tid] + m + 2], mybuf[bufOffset[tid] + m + 3], mybuf[bufOffset[tid] + m + 4]); m += size_one; } } #pragma omp barrier mpifhStringCount = 0; for (i = 0; i < nthreads; i++) { mpifhStringCount += mpifhStringCountPerThread[i]; } memory->destroy(bufOffset); memory->destroy(bufRange); memory->destroy(bufLength); if (mpifhStringCount > 0) { if (mpifhStringCount > maxsbuf) { if (mpifhStringCount > MAXSMALLINT) return -1; maxsbuf = mpifhStringCount + 1; memory->grow(sbuf, maxsbuf, "dump:sbuf"); } sbuf[0] = '\0'; } for (int i = 0; i < nthreads; i++) { strcat(sbuf, mpifh_buffer_line_per_thread[i]); free(mpifh_buffer_line_per_thread[i]); } memory->destroy(mpifhStringCountPerThread); free(mpifh_buffer_line_per_thread); } return mpifhStringCount; } #endif