diff --git a/.github/workflows/ci-macos.yml b/.github/workflows/ci-macos.yml index 3e61e9bbe6c2..e63e3e2a52c2 100644 --- a/.github/workflows/ci-macos.yml +++ b/.github/workflows/ci-macos.yml @@ -28,10 +28,14 @@ jobs: cache-dependency-path: '**/requirements.txt' - run: pip install -r requirements.txt - - name: Install dependencies + - name: Install dependencies (Homebrew) run: | brew install openmpi hdf5-mpi adios2 || true + - name: Install OpenPMD + run: | + openPMD_USE_MPI=ON python3 -m pip install openpmd-api --no-binary openpmd-api + - name: Install parthenon_tools run: | pip install scripts/python/packages/parthenon_tools diff --git a/.github/workflows/ci-short.yml b/.github/workflows/ci-short.yml index 25cf1609d816..c711acf5c116 100644 --- a/.github/workflows/ci-short.yml +++ b/.github/workflows/ci-short.yml @@ -32,8 +32,9 @@ jobs: - name: cpplint run: python3 ./tst/style/cpplint.py --counting=detailed --recursive src example tst - name: copyright + # using variant mpi because openpmd lib is only installed with mpi support (no serial) run: | - cmake -DCMAKE_CXX_FLAGS=-Werror -Bbuild-copyright-check + cmake -DCMAKE_CXX_FLAGS=-Werror -Bbuild-copyright-check -DMACHINE_VARIANT=mpi cmake --build build-copyright-check -t check-copyright - uses: actions/upload-artifact@v4 with: @@ -104,6 +105,7 @@ jobs: # make sure parthenon tools is in our python path export PYTHONPATH="$PYTHONPATH:$(python -m site --user-site)" ctest -R regression_mpi_test:output_hdf5 + ctest -R regression_mpi_test:restart_opmd # Test example with swarms - name: particle-leapfrog run: | @@ -174,6 +176,7 @@ jobs: # make sure parthenon tools is in our python path export PYTHONPATH="$PYTHONPATH:$(python -m site --user-site)" ctest -R regression_mpi_test:output_hdf5 + ctest -R regression_mpi_test:restart_opmd # Test example with swarms - name: particle-leapfrog run: | diff --git a/.github/workflows/docs.yml b/.github/workflows/docs.yml index bc8ee82056ec..0eb78d3af7f1 100644 --- a/.github/workflows/docs.yml +++ b/.github/workflows/docs.yml @@ -36,6 +36,7 @@ jobs: mkdir -p build && cd build cmake -DPARTHENON_DISABLE_HDF5=ON \ -DPARTHENON_DISABLE_MPI=ON \ + -DPARTHENON_DISABLE_OPENPMD=ON \ -DREGRESSION_GOLD_STANDARD_SYNC=OFF \ -DBUILD_TESTING=OFF \ .. diff --git a/CMakeLists.txt b/CMakeLists.txt index 90722cca713d..ef7cfd4ff7a4 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -36,6 +36,8 @@ option(PARTHENON_DISABLE_MPI "MPI is enabled by default if found, set this to Tr option(PARTHENON_ENABLE_HOST_COMM_BUFFERS "CUDA/HIP Only: Allocate communication buffers on host (may be slower)" OFF) option(PARTHENON_DISABLE_HDF5 "HDF5 is enabled by default if found, set this to True to disable HDF5" OFF) option(PARTHENON_DISABLE_HDF5_COMPRESSION "HDF5 compression is enabled by default, set this to True to disable compression in HDF5 output/restart files" OFF) +option(PARTHENON_DISABLE_OPENPMD "OpenPMD is enabled by default if found, set this to ON to disable OpenPMD" OFF) +option(PARTHENON_USE_SYSTEM_OPENPMD "OpenPMD API is downloaded and installed automatically by default. Set this to ON to find and use a version installed on the system." 
OFF) option(PARTHENON_DISABLE_SPARSE "Sparse capability is enabled by default, set this to True to compile-time disable all sparse capability" OFF) option(PARTHENON_ENABLE_ASCENT "Enable Ascent for in situ visualization and analysis" OFF) option(PARTHENON_LINT_DEFAULT "Linting is turned off by default, use the \"lint\" target or set \ @@ -207,6 +209,51 @@ if (NOT PARTHENON_DISABLE_HDF5) install(TARGETS HDF5_C EXPORT parthenonTargets) endif() +set(PARTHENON_ENABLE_OPENPMD OFF) +if (NOT PARTHENON_DISABLE_OPENPMD) + if (PARTHENON_USE_SYSTEM_OPENPMD) + # we want to enforce the use of ADIOS2 with this backend + set(PARTHENON_OPENPMD_COMPONENTS "ADIOS2") + if (ENABLE_MPI) + list(APPEND PARTHENON_OPENPMD_COMPONENTS "MPI") + else() + list(APPEND PARTHENON_OPENPMD_COMPONENTS "NOMPI") + endif() + find_package(openPMD 0.16.1 CONFIG COMPONENTS ${PARTHENON_OPENPMD_COMPONENTS}) + if (NOT openPMD_FOUND) + message(FATAL_ERROR "OpenPMD API requested to be used from the environment but it was " + "not found. Either append the path to the installed OpenPMD lib via the " + "openPMD_DIR or CMAKE_PREFIX_PATH, or use the version shipped with Parthenon by keeping " + "PARTHENON_USE_SYSTEM_OPENPMD=OFF") + endif() + else() + include(FetchContent) + set(CMAKE_POLICY_DEFAULT_CMP0077 NEW) + set(openPMD_BUILD_CLI_TOOLS OFF) + set(openPMD_BUILD_EXAMPLES OFF) + set(openPMD_BUILD_TESTING OFF) + set(openPMD_BUILD_SHARED_LIBS OFF) + set(openPMD_INSTALL OFF) + set(openPMD_USE_ADIOS2 ON) # we definitely want ADIOS2 + if( NOT Python3_Interpreter_FOUND) + find_package(Python3 REQUIRED COMPONENTS Interpreter) + endif() + # Why not build the python interface for easier testing when Python is available + if(Python3_Interpreter_FOUND) + set(openPMD_USE_PYTHON ON) + else() + set(openPMD_USE_PYTHON OFF) + endif() + FetchContent_Declare(openPMD + GIT_REPOSITORY "https://github.com/openPMD/openPMD-api.git" + GIT_TAG "3a60e77") # Release 0.16.1 + FetchContent_MakeAvailable(openPMD) + install(TARGETS openPMD EXPORT parthenonTargets) + endif() + + set(PARTHENON_ENABLE_OPENPMD ON) +endif() + # Kokkos recommendatation resulting in not using default GNU extensions set(CMAKE_CXX_EXTENSIONS OFF) diff --git a/cmake/machinecfg/CI.cmake b/cmake/machinecfg/CI.cmake index d9b7bb6df013..16c0dc0c6cf0 100644 --- a/cmake/machinecfg/CI.cmake +++ b/cmake/machinecfg/CI.cmake @@ -1,6 +1,6 @@ #======================================================================================== # Parthenon performance portable AMR framework -# Copyright(C) 2020 The Parthenon collaboration +# Copyright(C) 2020-2025 The Parthenon collaboration # Licensed under the 3-clause BSD License, see LICENSE file for details #======================================================================================== # (C) (or copyright) 2020. Triad National Security, LLC. All rights reserved. 
@@ -38,3 +38,5 @@ else() set(HDF5_ROOT /usr/local/hdf5/serial CACHE STRING "HDF5 path") set(PARTHENON_DISABLE_MPI ON CACHE BOOL "Disable MPI") endif() + +set(PARTHENON_USE_SYSTEM_OPENPMD ON CACHE BOOL "Use API in container") diff --git a/cmake/machinecfg/GitHubActions.cmake b/cmake/machinecfg/GitHubActions.cmake index b524483d996c..ad5bb586c5f1 100644 --- a/cmake/machinecfg/GitHubActions.cmake +++ b/cmake/machinecfg/GitHubActions.cmake @@ -1,6 +1,6 @@ #======================================================================================== # Parthenon performance portable AMR framework -# Copyright(C) 2021 The Parthenon collaboration +# Copyright(C) 2021-2025 The Parthenon collaboration # Licensed under the 3-clause BSD License, see LICENSE file for details #======================================================================================== # (C) (or copyright) 2021. Triad National Security, LLC. All rights reserved. @@ -50,4 +50,6 @@ else() set(PARTHENON_DISABLE_MPI ON CACHE BOOL "Disable MPI") endif() +set(PARTHENON_USE_SYSTEM_OPENPMD ON CACHE BOOL "Use API in container") + set(CMAKE_CXX_FLAGS "${MACHINE_CXX_FLAGS}" CACHE STRING "Default flags for this config") diff --git a/src/CMakeLists.txt b/src/CMakeLists.txt index 306d0690104c..507151dd7265 100644 --- a/src/CMakeLists.txt +++ b/src/CMakeLists.txt @@ -1,4 +1,8 @@ #========================================================================================= +# Parthenon performance portable AMR framework +# Copyright(C) 2020-2025 The Parthenon collaboration +# Licensed under the 3-clause BSD License, see LICENSE file for detail +#========================================================================================= # (C) (or copyright) 2020-2024. Triad National Security, LLC. All rights reserved. # # This program was produced under U.S. 
Government contract 89233218CNA000001 for Los @@ -196,6 +200,7 @@ add_library(parthenon outputs/history.cpp outputs/io_wrapper.cpp outputs/io_wrapper.hpp + outputs/output_attr.hpp outputs/output_utils.cpp outputs/output_utils.hpp outputs/outputs.cpp @@ -358,6 +363,16 @@ if (ENABLE_HDF5) target_link_libraries(parthenon PUBLIC HDF5_C) endif() +if (PARTHENON_ENABLE_OPENPMD) + target_sources(parthenon PRIVATE + outputs/parthenon_opmd.cpp + outputs/parthenon_opmd.hpp + outputs/restart_opmd.cpp + outputs/restart_opmd.hpp + ) + target_link_libraries(parthenon PUBLIC openPMD::openPMD) +endif() + # For Cuda with NVCC (<11.2) and C++17 Kokkos currently does not work/compile with # relaxed-constexpr, see https://github.com/kokkos/kokkos/issues/3496 # However, Parthenon heavily relies on it and there is no harm in compiling Kokkos diff --git a/src/config.hpp.in b/src/config.hpp.in index 588aff2672e8..058e7b2146a3 100644 --- a/src/config.hpp.in +++ b/src/config.hpp.in @@ -45,6 +45,8 @@ // defne ENABLE_HDF5 or not at all #cmakedefine ENABLE_HDF5 +#cmakedefine PARTHENON_ENABLE_OPENPMD + // define PARTHENON_DISABLE_HDF5_COMPRESSION or not at all #cmakedefine PARTHENON_DISABLE_HDF5_COMPRESSION diff --git a/src/interface/params.hpp b/src/interface/params.hpp index 1a19de82e7bf..a8c7a55e2f8d 100644 --- a/src/interface/params.hpp +++ b/src/interface/params.hpp @@ -122,6 +122,12 @@ class Params { return myParams_.at(key)->type(); } + const Mutability &GetMutability(const std::string &key) const { + auto const it = myMutable_.find(key); + PARTHENON_REQUIRE_THROWS(it != myMutable_.end(), "Key " + key + " doesn't exist"); + return it->second; + } + std::vector GetKeys() const { std::vector keys; for (auto &x : myParams_) { @@ -130,7 +136,6 @@ class Params { return keys; } - auto GetMutability(const std::string &key) const { return myMutable_.at(key); } bool IsMutable(const std::string &key) const { return static_cast(myMutable_.at(key)); } diff --git a/src/outputs/output_attr.hpp b/src/outputs/output_attr.hpp new file mode 100644 index 000000000000..8607157e09a2 --- /dev/null +++ b/src/outputs/output_attr.hpp @@ -0,0 +1,47 @@ +//======================================================================================== +// Parthenon performance portable AMR framework +// Copyright(C) 2023-2024 The Parthenon collaboration +// Licensed under the 3-clause BSD License, see LICENSE file for details +//======================================================================================== +// (C) (or copyright) 2020-2024. Triad National Security, LLC. All rights reserved. +// +// This program was produced under U.S. Government contract 89233218CNA000001 for Los +// Alamos National Laboratory (LANL), which is operated by Triad National Security, LLC +// for the U.S. Department of Energy/National Nuclear Security Administration. All rights +// in the program are reserved by Triad National Security, LLC, and the U.S. Department +// of Energy/National Nuclear Security Administration. The Government is granted for +// itself and others acting on its behalf a nonexclusive, paid-up, irrevocable worldwide +// license in this material to reproduce, prepare derivative works, distribute copies to +// the public, perform publicly and display publicly, and to permit others to do so. 
+//======================================================================================== + +#ifndef OUTPUTS_OUTPUT_ATTR_HPP_ +#define OUTPUTS_OUTPUT_ATTR_HPP_ + +#include + +// JMM: This could probably be done with template magic but I think +// using a macro is honestly the simplest and cleanest solution here. +// Template solution would be to define a variadic class to contain the +// list of types and then a hierarchy of structs/functions to turn +// that into function calls. Preprocessor seems easier, given we're +// not manipulating this list in any way. +// The following types are the ones we allow to be stored as attributes in outputs +// (specifically within Params). +#define PARTHENON_ATTR_VALID_VEC_TYPES(T) \ + T, std::vector, ParArray1D, ParArray2D, ParArray3D, HostArray1D, \ + HostArray2D, HostArray3D, Kokkos::View, Kokkos::View, \ + ParArrayND, ParArrayHost +// JMM: This is the list of template specializations we +// "pre-instantiate". We only pre-instantiate device memory, not host +// memory. The reason is that when building with the Kokkos serial +// backend, DevMemSpace and HostMemSpace are the same and so this +// resolves to the same type in the macro, which causes problems. +#define PARTHENON_ATTR_FOREACH_VECTOR_TYPE(T) \ + PARTHENON_ATTR_APPLY(T); \ + PARTHENON_ATTR_APPLY(Kokkos::View); \ + PARTHENON_ATTR_APPLY(Kokkos::View); \ + PARTHENON_ATTR_APPLY(Kokkos::View); \ + PARTHENON_ATTR_APPLY(device_view_t) + +#endif // OUTPUTS_OUTPUT_ATTR_HPP_ diff --git a/src/outputs/output_utils.cpp b/src/outputs/output_utils.cpp index 5d6064ad35d4..c08d27238a99 100644 --- a/src/outputs/output_utils.cpp +++ b/src/outputs/output_utils.cpp @@ -18,6 +18,7 @@ #include #include #include +#include #include #include #include @@ -34,11 +35,15 @@ #include "mesh/meshblock.hpp" #include "outputs/output_utils.hpp" #include "parameter_input.hpp" +#include "utils/error_checking.hpp" +#include "utils/mpi_types.hpp" namespace parthenon { namespace OutputUtils { -Triple_t VarInfo::GetNumKJI(const IndexDomain domain) const { +// This function returns the max dimensions over all topological elements of the given +// variable, i.e., it returns nx1+1, nx2+1, nx3+1 for a face-centered variable. +Triple_t VarInfo::GetPaddedNumKJI(const IndexDomain domain) const { int nx3 = 1, nx2 = 1, nx1 = 1; // TODO(JMM): I know that this could be done by hand, but I'd rather // rely on the loop bounds machinery and this should be cheap.
@@ -92,13 +97,23 @@ int VarInfo::TensorSize() const { } } -int VarInfo::FillSize(const IndexDomain domain) const { +int VarInfo::FillSize(const IndexDomain domain, const bool is_padded) const { if (where == MetadataFlag({Metadata::None})) { return Size(); - } else { - auto [n3, n2, n1] = GetNumKJI(domain); + } + if (is_padded) { + auto [n3, n2, n1] = GetPaddedNumKJI(domain); return ntop_elems * TensorSize() * n3 * n2 * n1; } + // Use raw info from topological elements (including some safety checks) + auto ncells = cellbounds.GetTotal(domain, topological_elements.at(0)); + for (auto el_idx = 1; el_idx < ntop_elems; el_idx++) { + PARTHENON_REQUIRE_THROWS( + ncells == cellbounds.GetTotal(domain, topological_elements.at(el_idx)), + "All topological elements in a given output variable should have the same total " + "number of cells."); + } + return ntop_elems * TensorSize() * ncells; } // number of elements of data that describe variable shape @@ -112,7 +127,7 @@ int VarInfo::GetNDim() const { std::vector VarInfo::GetPaddedShape(IndexDomain domain) const { std::vector out = GetRawShape(); if (where != MetadataFlag({Metadata::None})) { - auto [nx3, nx2, nx1] = GetNumKJI(domain); + auto [nx3, nx2, nx1] = GetPaddedNumKJI(domain); out[0] = nx3; out[1] = nx2; out[2] = nx1; @@ -122,7 +137,7 @@ std::vector VarInfo::GetPaddedShape(IndexDomain domain) const { std::vector VarInfo::GetPaddedShapeReversed(IndexDomain domain) const { std::vector out(rnx_.begin(), rnx_.end()); if (where != MetadataFlag({Metadata::None})) { - auto [nx3, nx2, nx1] = GetNumKJI(domain); + auto [nx3, nx2, nx1] = GetPaddedNumKJI(domain); out[VNDIM - 3] = nx3; out[VNDIM - 2] = nx2; out[VNDIM - 1] = nx1; @@ -290,6 +305,49 @@ std::vector ComputeDerefinementCount(Mesh *pm) { }); } +template +std::vector FlattendedLocalToGlobal(Mesh *pm, const std::vector &data_local) { + const int n_blocks_global = pm->nbtotal; + const int n_blocks_local = static_cast(pm->block_list.size()); + + const int n_elem = data_local.size() / n_blocks_local; + PARTHENON_REQUIRE_THROWS(data_local.size() % n_blocks_local == 0, + "Results from flattened input vector does not evenly divide " + "into number of local blocks."); + std::vector data_global(n_elem * n_blocks_global); + + std::vector counts(Globals::nranks); + std::vector offsets(Globals::nranks); + + const auto &nblist = pm->GetNbList(); + counts[0] = n_elem * nblist[0]; + offsets[0] = 0; + for (int r = 1; r < Globals::nranks; r++) { + counts[r] = n_elem * nblist[r]; + offsets[r] = offsets[r - 1] + counts[r - 1]; + } + +#ifdef MPI_PARALLEL + PARTHENON_MPI_CHECK(MPI_Allgatherv(data_local.data(), counts[Globals::my_rank], + MPITypeMap::type(), data_global.data(), + counts.data(), offsets.data(), MPITypeMap::type(), + MPI_COMM_WORLD)); +#else + return data_local; +#endif + return data_global; +} + +// explicit template instantiation +template std::vector +FlattendedLocalToGlobal(Mesh *pm, const std::vector &data_local); +template std::vector +FlattendedLocalToGlobal(Mesh *pm, const std::vector &data_local); +template std::vector +FlattendedLocalToGlobal(Mesh *pm, const std::vector &data_local); +template std::vector FlattendedLocalToGlobal(Mesh *pm, + const std::vector &data_local); + // TODO(JMM): I could make this use the other loop // functionality/high-order functions. but it was more code than this // for, I think, little benefit. 
@@ -361,6 +419,35 @@ std::size_t MPISum(std::size_t val) { return val; } +VariableVector GetVarsToWrite(const std::shared_ptr pmb, + const bool restart, + const std::vector &variables) { + const auto &var_vec = pmb->meshblock_data.Get()->GetVariableVector(); + auto vars_to_write = GetAnyVariables(var_vec, variables); + if (restart) { + // get all vars with flag Independent OR restart + auto restart_vars = GetAnyVariables( + var_vec, {parthenon::Metadata::Independent, parthenon::Metadata::Restart}); + for (auto restart_var : restart_vars) { + vars_to_write.emplace_back(restart_var); + } + } + return vars_to_write; +} + +std::vector GetAllVarsInfo(const VariableVector &vars, + const IndexShape &cellbounds) { + std::vector all_vars_info; + for (auto &v : vars) { + all_vars_info.emplace_back(v, cellbounds); + } + + // sort alphabetically + std::sort(all_vars_info.begin(), all_vars_info.end(), + [](const VarInfo &a, const VarInfo &b) { return a.label < b.label; }); + return all_vars_info; +} + void CheckParameterInputConsistent(ParameterInput *pin) { #ifdef MPI_PARALLEL CheckMPISizeT(); diff --git a/src/outputs/output_utils.hpp b/src/outputs/output_utils.hpp index 73011c6cbdf9..b4371ddf2e8a 100644 --- a/src/outputs/output_utils.hpp +++ b/src/outputs/output_utils.hpp @@ -72,14 +72,16 @@ struct VarInfo { // whether or not topological element matters. bool element_matters; - Triple_t GetNumKJI(const IndexDomain domain) const; + Triple_t GetPaddedNumKJI(const IndexDomain domain) const; Triple_t GetPaddedBoundsKJI(const IndexDomain domain) const; int Size() const; // Includes topological element shape int TensorSize() const; - // Size of region that needs to be filled with 0s if not allocated - int FillSize(const IndexDomain domain) const; + // Size of region that needs to be filled with 0s if not allocated. + // is_padded is set to true by default as it's the assumption in the original (HDF5) + // output files. + int FillSize(const IndexDomain domain, const bool is_padded = true) const; // number of elements of data that describe variable shape int GetNDim() const; @@ -93,7 +95,7 @@ struct VarInfo { // For nx1,nx2,nx3 find max storage required in each direction // accross topological elements. Unused indices will be written but // empty. - auto [nx3, nx2, nx1] = GetNumKJI(domain); + auto [nx3, nx2, nx1] = GetPaddedNumKJI(domain); // fill topological element, if relevant if (element_matters) { data[0] = ntop_elems; @@ -188,6 +190,8 @@ struct VarInfo { private: // TODO(JMM): Probably nx_ and rnx_ both not necessary... but it was // easiest for me to reason about it this way. + // Note, nx_ is usually initialized to the view dimensions (i.e., padded for face and + // edge centered fields). std::array nx_; std::vector rnx_; }; @@ -219,8 +223,8 @@ struct SwarmInfo { std::size_t count_on_rank = 0; // per-meshblock std::size_t global_offset; // global std::size_t global_count; // global - std::vector counts; // per-meshblock - std::vector offsets; // global + std::vector counts; // on local meshblocks + std::vector offsets; // global offset for local meshblocks // std::vector> masks; // used for reading swarms without defrag std::vector max_indices; // JMM: If we defrag, unneeded? 
void AddOffsets(const SP_Swarm &swarm); // sets above metadata @@ -249,7 +253,7 @@ struct SwarmInfo { // Copies swarmvar to host in prep for output template std::vector FillHostBuffer(const std::string vname, - ParticleVariableVector &swmvarvec) { + const ParticleVariableVector &swmvarvec) const { const auto &vinfo = var_info.at(vname); std::vector host_data(count_on_rank * vinfo.nvar); std::size_t ivec = 0; @@ -258,6 +262,7 @@ for (int n4 = 0; n4 < vinfo.GetN(4); ++n4) { for (int n3 = 0; n3 < vinfo.GetN(3); ++n3) { for (int n2 = 0; n2 < vinfo.GetN(2); ++n2) { + // TODO(pgrete) understand what's going on with the blocks here... std::size_t block_idx = 0; for (auto &swmvar : swmvarvec) { // Copied extra times. JMM: If we defrag, unneeded? @@ -313,16 +318,19 @@ std::vector FlattenBlockInfo(Mesh *pm, int shape, Function_t f) { // mirror must be provided because copying done externally template -void PackOrUnpackVar(const VarInfo &info, bool do_ghosts, idx_t &idx, Function_t f) { +void PackOrUnpackVar(const VarInfo &info, bool do_ghosts, bool is_padded, idx_t &idx, + Function_t f) { const IndexDomain domain = (do_ghosts ? IndexDomain::entire : IndexDomain::interior); // shape as written to or read from. contains additional padding // in orthogonal directions. // e.g., Face1-centered var is shape (N1+1)x(N2+1)x(N3+1) // format is // topological_elems x tensor_elems x block_elems + // If variable is written without padding, we'll cut the indices below. const auto shape = info.GetPaddedShapeReversed(domain); // TODO(JMM): Should I hide this inside VarInfo? auto [kb, jb, ib] = info.GetPaddedBoundsKJI(domain); + // Adjust padded indices for variables not tied to the mesh if (info.where == MetadataFlag({Metadata::None})) { kb.s = 0; kb.e = std::max(0, shape[4] - 1); @@ -332,6 +340,12 @@ void PackOrUnpackVar(const VarInfo &info, bool do_ghosts, idx_t &idx, Function_t ib.e = std::max(0, shape[6] - 1); } for (int topo = 0; topo < shape[0]; ++topo) { + // Adjust padded indices for variables not written with padding + if (!is_padded) { + kb = info.cellbounds.GetBoundsK(domain, info.topological_elements.at(topo)); + jb = info.cellbounds.GetBoundsJ(domain, info.topological_elements.at(topo)); + ib = info.cellbounds.GetBoundsI(domain, info.topological_elements.at(topo)); + } for (int t = 0; t < shape[1]; ++t) { for (int u = 0; u < shape[2]; ++u) { for (int v = 0; v < shape[3]; ++v) { @@ -357,10 +371,26 @@ std::vector ComputeLocs(Mesh *pm); std::vector ComputeIDsAndFlags(Mesh *pm); std::vector ComputeDerefinementCount(Mesh *pm); +// Takes a vector containing flattened data of all rank local blocks and returns the +// flattened data over all blocks. +template +std::vector FlattendedLocalToGlobal(Mesh *pm, const std::vector &data_local); + // TODO(JMM): If we ever need non-int need to generalize std::size_t MPIPrefixSum(std::size_t local, std::size_t &tot_count); std::size_t MPISum(std::size_t local); +// Return all variables to write, i.e., for restarts all independent variables and ones +// with explicit Restart flag, but also variables explicitly defined to output in the +// input file.
+VariableVector GetVarsToWrite(const std::shared_ptr pmb, + const bool restart, + const std::vector &variables); + +// Returns a sorted vector of VarInfo associated with vars +std::vector GetAllVarsInfo(const VariableVector &vars, + const IndexShape &cellbounds); + void CheckParameterInputConsistent(ParameterInput *pin); } // namespace OutputUtils } // namespace parthenon diff --git a/src/outputs/outputs.cpp b/src/outputs/outputs.cpp index 0062cefc098d..3ca8c80b3696 100644 --- a/src/outputs/outputs.cpp +++ b/src/outputs/outputs.cpp @@ -234,28 +234,34 @@ Outputs::Outputs(Mesh *pm, ParameterInput *pin, SimTime *tm) { // read single precision output option const bool is_hdf5_output = (op.file_type == "rst") || (op.file_type == "hdf5") || (op.file_type == "corehdf5"); + const bool is_openpmd_output = (op.file_type == "openpmd"); - if (is_hdf5_output) { + if (is_hdf5_output || is_openpmd_output) { op.single_precision_output = pin->GetOrAddBoolean(op.block_name, "single_precision_output", false); - op.sparse_seed_nans = - pin->GetOrAddBoolean(op.block_name, "sparse_seed_nans", false, - "write non-allocated sparse data as NaN"); - op.meshdata_name = pin->GetOrAddString(op.block_name, "meshdata_name", "base", - "which meshdata object to write from"); } else { op.single_precision_output = false; - op.sparse_seed_nans = false; - if (pin->DoesParameterExist(op.block_name, "single_precision_output")) { std::stringstream warn; warn << "Output option single_precision_output only applies to " "HDF5 outputs or restarts. Ignoring it for output block '" << op.block_name << "'"; - PARTHENON_WARN(warn); + if (Globals::my_rank == 0) { + PARTHENON_WARN(warn); + } } } + if (is_hdf5_output) { + op.sparse_seed_nans = + pin->GetOrAddBoolean(op.block_name, "sparse_seed_nans", false, + "write non-allocated sparse data as NaN"); + op.meshdata_name = pin->GetOrAddString(op.block_name, "meshdata_name", "base", + "which meshdata object to write from"); + } else { + op.sparse_seed_nans = false; + } + if (is_hdf5_output) { int default_compression_level = 5; #ifdef PARTHENON_DISABLE_HDF5_COMPRESSION @@ -354,6 +360,25 @@ Outputs::Outputs(Mesh *pm, ParameterInput *pin, SimTime *tm) { pnew_type = std::make_shared(op); } else if (op.file_type == "ascent") { pnew_type = std::make_shared(op); + } else if (op.file_type == "openpmd") { +#ifdef PARTHENON_ENABLE_OPENPMD + const auto backend_config = + pin->GetOrAddString(op.block_name, "backend_config", "default"); + const auto coarsening_factor = + pin->GetOrAddInteger(op.block_name, "coarsening_factor", 1, + "Output data coarsened by given factor n. Every n^dim " + "data point is used, i.e., the data is not average. " + "Requires even number of cells in each block dimension."); + + pnew_type = std::make_shared(op, backend_config, coarsening_factor); +#else + msg << "### FATAL ERROR in Outputs constructor" << std::endl + << "Executable not configured for OpenPMD outputs, but OpenPMD file format " + << "is requested in output/restart block '" << op.block_name << "'. " + << "You can disable this block without deleting it by setting a dt < 0." 
+ << std::endl; + PARTHENON_FAIL(msg); +#endif // ifdef PARTHENON_ENABLE_OPENPMD } else if (op.file_type == "histogram") { #ifdef ENABLE_HDF5 pnew_type = std::make_shared(op, pin); diff --git a/src/outputs/outputs.hpp b/src/outputs/outputs.hpp index fe375c9ba93c..99572c182519 100644 --- a/src/outputs/outputs.hpp +++ b/src/outputs/outputs.hpp @@ -27,6 +27,7 @@ #include #include #include +#include #include #include "Kokkos_ScatterView.hpp" @@ -141,6 +142,28 @@ class AscentOutput : public OutputType { ParArray1D ghost_mask_; }; +//---------------------------------------------------------------------------------------- +//! \class OpenPMDOutput +// \brief derived OutputType class for OpenPMD based output + +class OpenPMDOutput : public OutputType { + public: + explicit OpenPMDOutput(const OutputParameters &oparams, std::string backend_config, + int coarsening_factor) + : OutputType(oparams), backend_config_(std::move(backend_config)), + coarsening_factor_(coarsening_factor) {} + void WriteOutputFile(Mesh *pm, ParameterInput *pin, SimTime *tm, + const SignalHandler::OutputSignal signal) override; + template + void WriteOutputFileImpl(Mesh *pm, ParameterInput *pin, SimTime *tm, + const SignalHandler::OutputSignal signal); + + private: + // path to file containing config passed to backend + std::string backend_config_; + int coarsening_factor_; +}; + #ifdef ENABLE_HDF5 //---------------------------------------------------------------------------------------- //! \class PHDF5Output diff --git a/src/outputs/parthenon_hdf5.cpp b/src/outputs/parthenon_hdf5.cpp index e3c272b597e0..6ae4c6832032 100644 --- a/src/outputs/parthenon_hdf5.cpp +++ b/src/outputs/parthenon_hdf5.cpp @@ -3,10 +3,6 @@ // Copyright(C) 2020-2025 The Parthenon collaboration // Licensed under the 3-clause BSD License, see LICENSE file for details //======================================================================================== -// Parthenon performance portable AMR framework -// Copyright(C) 2020-2025 The Parthenon collaboration -// Licensed under the 3-clause BSD License, see LICENSE file for details -//======================================================================================== // (C) (or copyright) 2020-2025. Triad National Security, LLC. All rights reserved. // // This program was produced under U.S. Government contract 89233218CNA000001 for Los @@ -321,7 +317,8 @@ void PHDF5Output::WriteOutputFileImpl(Mesh *pm, ParameterInput *pin, SimTime *tm // The dataset SparseInfo itself is a 2D array of bools. The first index is the // global block index and the second index is the sparse field (same order as the // SparseFields attribute). SparseInfo[b][v] is true if the sparse field with index - // v is allocated on the block with index b, otherwise the value is false + // v is allocated on the block with index b, otherwise the value is false. + // If the logic here is ever updated, ensure to update the OpenPMD logic, too. 
std::vector sparse_names; std::unordered_map sparse_field_idx; @@ -397,22 +394,21 @@ void PHDF5Output::WriteOutputFileImpl(Mesh *pm, ParameterInput *pin, SimTime *tm const auto &pmb = pm->block_list[b_idx]; bool is_allocated = false; int dealloc_count = 0; - // for each variable that this local meshblock actually has - const auto vars = get_vars(pmb); - for (auto &v : vars) { - // For reference, if we update the logic here, there's also - // a similar block in parthenon_manager.cpp - if (v->IsAllocated() && (var_name == v->label())) { - auto v_h = v->data.GetHostMirrorAndCopy(); - OutputUtils::PackOrUnpackVar( - vinfo, output_params.include_ghost_zones, index, - [&](auto index, int topo, int t, int u, int v, int k, int j, int i) { - tmpData[index] = static_cast(v_h(topo, t, u, v, k, j, i)); - }); - is_allocated = true; - dealloc_count = v->dealloc_count; - break; - } + // TODO(reviewers) Why was the loop originally there? Does the direct Get causes + // issue? + auto v = pmb->meshblock_data.Get()->GetVarPtr(var_name); + // For reference, if we update the logic here, there's also + // a similar block in parthenon_manager.cpp + if (v->IsAllocated() && (var_name == v->label())) { + auto v_h = v->data.GetHostMirrorAndCopy(); + OutputUtils::PackOrUnpackVar( + vinfo, output_params.include_ghost_zones, true, index, + [&](auto index, int topo, int t, int u, int v, int k, int j, int i) { + tmpData[index] = static_cast(v_h(topo, t, u, v, k, j, i)); + }); + + is_allocated = true; + dealloc_count = v->dealloc_count; } if (vinfo.is_sparse) { diff --git a/src/outputs/parthenon_hdf5.hpp b/src/outputs/parthenon_hdf5.hpp index 6dc3ffcb69c3..06a7d6b8fe09 100644 --- a/src/outputs/parthenon_hdf5.hpp +++ b/src/outputs/parthenon_hdf5.hpp @@ -21,29 +21,9 @@ #include "defs.hpp" #include "kokkos_abstraction.hpp" +#include "output_attr.hpp" #include "parthenon_arrays.hpp" -// JMM: This could probably be done with template magic but I think -// using a macro is honestly the simplest and cleanest solution here. -// Template solution would be to define a variatic class to conain the -// list of types and then a hierarchy of structs/functions to turn -// that into function calls. Preprocessor seems easier, given we're -// not manipulating this list in any way. -#define PARTHENON_ATTR_VALID_VEC_TYPES(T) \ - T, std::vector, ParArray1D, ParArray2D, ParArray3D, HostArray1D, \ - HostArray2D, HostArray3D, Kokkos::View, Kokkos::View, \ - ParArrayND, ParArrayHost -// JMM: This is the list of template specializations we -// "pre-instantiate" We only pre-instantiate device memory, not host -// memory. The reason is that when building with the Kokkos serial -// backend, DevMemSpace and HostMemSpace are the same and so this -// resolves to the same type in the macro, which causes problems. 
-#define PARTHENON_ATTR_FOREACH_VECTOR_TYPE(T) \ - PARTHENON_ATTR_APPLY(T); \ - PARTHENON_ATTR_APPLY(Kokkos::View); \ - PARTHENON_ATTR_APPLY(Kokkos::View); \ - PARTHENON_ATTR_APPLY(Kokkos::View); \ - PARTHENON_ATTR_APPLY(device_view_t) // Only proceed if HDF5 output enabled #ifdef ENABLE_HDF5 diff --git a/src/outputs/parthenon_opmd.cpp b/src/outputs/parthenon_opmd.cpp new file mode 100644 index 000000000000..c393c7025320 --- /dev/null +++ b/src/outputs/parthenon_opmd.cpp @@ -0,0 +1,888 @@ +//======================================================================================== +// Parthenon performance portable AMR framework +// Copyright(C) 2024-2025 The Parthenon collaboration +// Licensed under the 3-clause BSD License, see LICENSE file for details +//======================================================================================== +// (C) (or copyright) 2024. Triad National Security, LLC. All rights reserved. +// +// This program was produced under U.S. Government contract 89233218CNA000001 for Los +// Alamos National Laboratory (LANL), which is operated by Triad National Security, LLC +// for the U.S. Department of Energy/National Nuclear Security Administration. All rights +// in the program are reserved by Triad National Security, LLC, and the U.S. Department +// of Energy/National Nuclear Security Administration. The Government is granted for +// itself and others acting on its behalf a nonexclusive, paid-up, irrevocable worldwide +// license in this material to reproduce, prepare derivative works, distribute copies to +// the public, perform publicly and display publicly, and to permit others to do so. +//======================================================================================== +//! \file parthenon_opmd.cpp +// \brief Output for OpenPMD https://www.openpmd.org/ (supporting various backends) + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +// OpenPMD headers +#include + +// Parthenon headers +#include "basic_types.hpp" +#include "coordinates/coordinates.hpp" +#include "defs.hpp" +#include "driver/driver.hpp" +#include "globals.hpp" +#include "interface/state_descriptor.hpp" +#include "interface/variable_state.hpp" +#include "mesh/mesh.hpp" +#include "mesh/meshblock.hpp" +#include "outputs/output_attr.hpp" +#include "outputs/output_utils.hpp" +#include "outputs/outputs.hpp" +#include "outputs/parthenon_opmd.hpp" +#include "pack/swarm_default_names.hpp" +#include "parthenon_array_generic.hpp" +#include "utils/error_checking.hpp" +#include "utils/instrument.hpp" + +namespace parthenon { + +using namespace OutputUtils; + +namespace OpenPMDUtils { + +template +auto GetFlatHostVecFromView(T view) { + // Take a view and return a vector containing rank and dims and a flattened (1D) + // std::vector that can then easily be passed to OpenPMD. + // Note, this function is not + // optimal as multiple (unnecessary) copies may be done. PG didn't come up with a + // smarter way but thinks that it's not a performance issue as this is only called for + // outputs (thus not that often) and for mostly small amounts of data. With a C++20 span + // we could probably directly reuse the host mirror data pointer.
+ auto view_h = Kokkos::create_mirror_view_and_copy(HostMemSpace(), view); + + using base_t = typename std::remove_pointer::type; + auto host_vec = std::vector(view_h.size()); + for (auto i = 0; i < view_h.size(); i++) { + host_vec[i] = view_h.data()[i]; + } + // cpplint demands compile constants be all caps + constexpr auto RANK = static_cast(T::rank); + std::vector rank_and_dims(RANK + 1); + rank_and_dims[0] = RANK; + for (size_t d = 0; d < RANK; ++d) { + rank_and_dims[1 + d] = view.extent_int(d); + } + return std::make_tuple(rank_and_dims, host_vec); +} + +template +void WriteAllParamsOfType(const Params ¶ms, const std::string &prefix, + openPMD::Iteration *it) { + for (const auto &key : params.GetKeys()) { + const auto type = params.GetType(key); + if (type == std::type_index(typeid(T))) { + auto full_path = prefix + delim + key; + // The '/' is kind of a reserved character in the OpenPMD standard, which results + // in attribute keys with said character not being exposed. + // Thus we replace it. + std::replace(full_path.begin(), full_path.end(), '/', delim[0]); + + if constexpr (implements::value) { + const auto &view = params.Get(key); + auto [rank_and_dims, host_vec] = GetFlatHostVecFromView(view); + it->setAttribute(full_path + ".rankdims", rank_and_dims); + it->setAttribute(full_path, host_vec); + } else if constexpr (is_specialization_of::value) { + const auto &view = params.Get(key).KokkosView(); + auto [rank_and_dims, host_vec] = GetFlatHostVecFromView(view); + it->setAttribute(full_path + ".rankdims", rank_and_dims); + it->setAttribute(full_path, host_vec); + } else { + it->setAttribute(full_path, params.Get(key)); + } + } + } +} + +template +void WriteAllParamsOfMultipleTypes(const Params ¶ms, const std::string &prefix, + openPMD::Iteration *it) { + ([&] { WriteAllParamsOfType(params, prefix, it); }(), ...); +} + +template +void WriteAllParams(const Params ¶ms, const std::string &prefix, + openPMD::Iteration *it) { + WriteAllParamsOfMultipleTypes(params, prefix, it); +} + +void WriteAllParams(const Params ¶ms, const std::string &pkg_name, + openPMD::Iteration *it) { + using OpenPMDUtils::delim; + const std::string prefix = "Params" + delim + pkg_name; + // check why this (vector of bool) doesn't work + // WriteAllParams(params, prefix, it); + WriteAllParamsOfType(params, prefix, it); + WriteAllParams(params, prefix, it); + WriteAllParams(params, prefix, it); + WriteAllParams(params, prefix, it); + WriteAllParams(params, prefix, it); + WriteAllParams(params, prefix, it); + WriteAllParams(params, prefix, it); + + // strings (not supported in Kokkos Views) + WriteAllParamsOfType(params, prefix, it); + WriteAllParamsOfType>(params, prefix, it); +} + +template +void WriteSwarmVar(const SwarmInfo &swinfo, openPMD::ParticleSpecies swm, + openPMD::Iteration it) { + auto &vars_of_type_T = std::get>(swinfo.vars); + for (const auto &[vname, swmvarvec] : vars_of_type_T) { + const auto &vinfo = swinfo.var_info.at(vname); + auto host_data = swinfo.FillHostBuffer(vname, swmvarvec); + + auto const dataset = openPMD::Dataset(openPMD::determineDatatype(host_data.data()), + {swinfo.global_count}); + // TODO(pgrete) ask OpenPMD group if this is the right approach (flatten vector and + // tensors with flattended indices as string component names) or if our non-scalar + // particle variables should be a multi-D `dataset` (if possible) + for (auto n = 0; n < vinfo.nvar; n++) { + auto [particle_record, particle_record_component] = + OpenPMDUtils::GetParticleRecordAndComponentNames(vname, 
vinfo.tensor_rank, n); + + openPMD::RecordComponent rc = swm[particle_record][particle_record_component]; + rc.resetDataset(dataset); + // only write if there's sth to write (otherwise the host_data nullptr is caught) + if (swinfo.count_on_rank != 0) { + rc.storeChunkRaw(&host_data[n * swinfo.count_on_rank], {swinfo.global_offset}, + {swinfo.count_on_rank}); + } + + // if positional, add offsets + if (particle_record == "position") { + auto rc_offset = swm["positionOffset"][particle_record_component]; + rc_offset.resetDataset(dataset); + rc_offset.makeConstant(0.0); + } + } + // Flush because the host buffer is temporary + it.seriesFlush(); + } +} + +std::tuple +GetParticleRecordAndComponentNames(const std::string &vname, const int rank, + const int flat_comp_idx) { + std::string particle_record; + std::string particle_record_component; + + // special sauce to align "positions" with standard + if (vname == swarm_position::x::name()) { + particle_record = "position"; + particle_record_component = "x"; + } else if (vname == swarm_position::y::name()) { + particle_record = "position"; + particle_record_component = "y"; + } else if (vname == swarm_position::z::name()) { + particle_record = "position"; + particle_record_component = "z"; + } else if (vname == swarm_position::id::name()) { + particle_record = "id"; + particle_record_component = openPMD::MeshRecordComponent::SCALAR; + } else { + particle_record = vname; + particle_record_component = + rank == 0 ? openPMD::MeshRecordComponent::SCALAR : std::to_string(flat_comp_idx); + } + return {particle_record, particle_record_component}; +} + +std::tuple +GetMeshRecordAndComponentNames(const VarInfo &vinfo, const TopologicalElement te, + const int comp_idx, const int level) { + std::string comp_name; + if (vinfo.is_vector) { + if (comp_idx == 0) { + comp_name = "x"; + } else if (comp_idx == 1) { + comp_name = "y"; + } else if (comp_idx == 2) { + comp_name = "z"; + } else { + PARTHENON_THROW("Expected component index doesn't match vector expectation."); + } + // Currently unclear how to properly handle other vectors and tensors, so everything + // that's not a proper vector is a scalar for now. + } else { + comp_name = openPMD::MeshRecordComponent::SCALAR; + } + + // Default for cell centered fields is an empty string + // to maintain backwards compatibility with first iteration of + // OpenPMD outputs.
+ std::string te_str = ""; + if (te == TopologicalElement::F1) { + te_str = "F1_"; + } else if (te == TopologicalElement::F2) { + te_str = "F2_"; + } else if (te == TopologicalElement::F3) { + te_str = "F3_"; + } else if (te == TopologicalElement::E1) { + te_str = "E1_"; + } else if (te == TopologicalElement::E2) { + te_str = "E2_"; + } else if (te == TopologicalElement::E3) { + te_str = "E3_"; + } else if (te == TopologicalElement::NN) { + te_str = "NN_"; + } else { + PARTHENON_REQUIRE_THROWS(te == TopologicalElement::CC, + "Outputs for this type of TE not implemented.") + } + // TODO(pgrete) need to make sure that var names are allowed within standard + const std::string &mesh_record_name = vinfo.label + "_" + te_str + + vinfo.component_labels[comp_idx] + "_lvl" + + std::to_string(level); + return {mesh_record_name, comp_name}; +} + +std::tuple +GetChunkOffsetAndExtent(Mesh *pm, std::shared_ptr pmb, + const TopologicalElement te, const int coarsening_factor, + const SubOutputType output_type) { + openPMD::Offset chunk_offset; + openPMD::Extent chunk_extent; + const auto loc = pm->Forest().GetLegacyTreeLocation(pmb->loc); + uint64_t nx1_eff = pmb->block_size.nx(X1DIR) / coarsening_factor; + uint64_t nx2_eff = pmb->block_size.nx(X2DIR) / coarsening_factor; + uint64_t nx3_eff = pmb->block_size.nx(X3DIR) / coarsening_factor; + if (pm->ndim == 3) { + chunk_offset = {loc.lx3() * nx3_eff, loc.lx2() * nx2_eff, loc.lx1() * nx1_eff}; + chunk_extent = {nx3_eff + TopologicalOffsetK(te), nx2_eff + TopologicalOffsetJ(te), + nx1_eff + TopologicalOffsetI(te)}; + } else if (pm->ndim == 2) { + chunk_offset = {loc.lx2() * nx2_eff, loc.lx1() * nx1_eff}; + chunk_extent = {static_cast(nx2_eff + TopologicalOffsetJ(te)), + static_cast(nx1_eff + TopologicalOffsetI(te))}; + } else { + PARTHENON_THROW("1D output for openpmd not yet supported."); + } + int remove_comp = -1; + if (output_type == SubOutputType::X1Slice) { + remove_comp = 2; + } else if (output_type == SubOutputType::X2Slice) { + remove_comp = 1; + } else if (output_type == SubOutputType::X3Slice) { + remove_comp = 0; + } + if (remove_comp >= 0) { + chunk_extent.erase(chunk_extent.begin() + remove_comp); + chunk_offset.erase(chunk_offset.begin() + remove_comp); + } + return {chunk_offset, chunk_extent}; +} +} // namespace OpenPMDUtils + +//---------------------------------------------------------------------------------------- +//! \fn void OpenPMDOutput:::WriteOutputFile(Mesh *pm) +// \brief Write output in OpenPMD format +void OpenPMDOutput::WriteOutputFile(Mesh *pm, ParameterInput *pin, SimTime *tm, + const SignalHandler::OutputSignal signal) { + if (output_params.single_precision_output) { + this->template WriteOutputFileImpl(pm, pin, tm, signal); + } else { + this->template WriteOutputFileImpl(pm, pin, tm, signal); + } +} + +//---------------------------------------------------------------------------------------- +//! 
\fn void OpenPMDOutput::WriteOutputFile(Mesh *pm) +// \brief Write output in OpenPMD format +template +void OpenPMDOutput::WriteOutputFileImpl(Mesh *pm, ParameterInput *pin, SimTime *tm, + const SignalHandler::OutputSignal signal) { + if constexpr (WRITE_SINGLE_PRECISION) { + Kokkos::Profiling::pushRegion("OPMD::WriteOutputFileSinglePrec"); + } else { + Kokkos::Profiling::pushRegion("OPMD::WriteOutputFileRealPrec"); + } + // Check that the parameter input is safe to write (i.e., consistent across ranks) + OutputUtils::CheckParameterInputConsistent(pin); + + using openPMD::Access; + using openPMD::Series; + + // TODO(pgrete) .h5 for hdf5 and .bp for ADIOS2 or .json for JSON + // TODO(pgrete) check if CREATE is the correct pattern (for not overwriting the series + // but an iteration) This just describes the pattern of the filename. The correct file + // will be accessed through the iteration idx below. The file suffix maps to the chosen + // backend. + // TODO(pgrete) add final and now logic + // Prepending @ indicates that the config is a file to be read and parsed. + std::string backend_config = + backend_config_ == "default" ? "{}" : "@" + backend_config_; + + auto filename = output_params.file_basename + "." + output_params.file_id; + if (signal == SignalHandler::OutputSignal::now) { + filename.append(".now"); + } else if (signal == SignalHandler::OutputSignal::final && + output_params.file_label_final) { + filename.append(".final"); + } + filename.append(".%05T"); + + filename.append(".bp"); + Series series = Series(filename, Access::CREATE, +#ifdef MPI_PARALLEL + MPI_COMM_WORLD, +#endif + backend_config); + // TODO(pgrete) How to handle downstream info, e.g., on how/what defines a vector? + // TODO(pgrete) Should we update for restart or only set this once? Or make it per + // iteration? + // ... = pin->GetString(output_params.block_name, "actions_file"); + series.setAuthor("My Name file naming + auto it = series.iterations[output_params.file_number]; + it.open(); // explicit open() is important when run in parallel + + if (signal == SignalHandler::OutputSignal::none) { + // After file has been opened with the current number, already advance output + // parameters so that for restarts the file is not immediately overwritten again. + // Only applies to default time-based data dumps, so that writing "now" and "final" + // outputs does not change the desired output numbering. + UpdateNextOutput_(pm, tm); + } + + auto const &first_block = *(pm->block_list.front()); + + // TODO(?) in principle, we could abstract this to a more general WriteAttributes place + // and reuse for hdf5 and OpenPMD output with corresponding calls + // -------------------------------------------------------------------------------- // + // WRITING ATTRIBUTES // + // -------------------------------------------------------------------------------- // + + // Note that profiling is likely skewed as data is actually written to disk/flushed + // only later. + Kokkos::Profiling::pushRegion("write Attributes"); + // First the ones required by the OpenPMD standard + if (tm != nullptr) { + it.setTime(tm->time); + it.setDt(tm->dt); + it.setAttribute("NCycle", tm->ncycle); + } else { + it.setTime(-1.0); + it.setDt(-1.0); + } + + // TODO(reviewers): PG: I didn't want to pollute OutputParams with sth specific to this + // output type. It's not super nice to process `pin` info here but it did the job. Any + // suggestions?
+ + const auto output_type_str = pin->GetOrAddString( + output_params.block_name, "output_type", "restart", + std::vector{"restart", "x1slice", "x2slice", "x3slice"}, + "Type of output in the file."); + // C++20 please + // using enum OpenPMDUtils::SubOutputType; + using OpenPMDUtils::SubOutputType; + auto output_type = SubOutputType::Restart; + if (output_type_str == "x1slice") { + output_type = SubOutputType::X1Slice; + } else if (output_type_str == "x2slice") { + output_type = SubOutputType::X2Slice; + } else if (output_type_str == "x3slice") { + output_type = SubOutputType::X3Slice; + } + const auto is_slice = output_type == SubOutputType::X1Slice || + output_type == SubOutputType::X2Slice || + output_type == SubOutputType::X3Slice; + auto slice_loc = std::numeric_limits::signaling_NaN(); + if (is_slice) { + PARTHENON_REQUIRE_THROWS(pm->ndim == 3, "Slices are only implemented in 3D"); + slice_loc = pin->GetReal(output_params.block_name, "slice_loc"); + } + + if (!is_slice) { + PARTHENON_INSTRUMENT_REGION("Dump Params"); + + for (const auto &[pkg_name, pkg] : pm->packages.AllPackages()) { + const auto ¶ms = pkg->AllParams(); + OpenPMDUtils::WriteAllParams(params, pkg_name, &it); + } + } + // Then our own + if (!is_slice) { + PARTHENON_INSTRUMENT_REGION("write input"); + // write input key-value pairs + std::ostringstream oss; + pin->ParameterDump(oss); + it.setAttribute("InputFile", oss.str()); + } + + if (!is_slice) { + // It's not clear we need all these attributes, but they mirror what's done in the + // hdf5 output. + it.setAttribute("WallTime", Driver::elapsed_main()); + it.setAttribute("NumDims", pm->ndim); + it.setAttribute("NumMeshBlocks", pm->nbtotal); + it.setAttribute("MaxLevel", pm->GetCurrentLevel() - pm->GetRootLevel()); + // write whether we include ghost cells or not + it.setAttribute("IncludesGhost", output_params.include_ghost_zones ? 1 : 0); + // write number of ghost cells in simulation + it.setAttribute("NGhost", Globals::nghost); + it.setAttribute("Coordinates", std::string(first_block.coords.Name()).c_str()); + + // restart info, write always + it.setAttribute("NBNew", pm->nbnew); + it.setAttribute("NBDel", pm->nbdel); + it.setAttribute("RootLevel", pm->GetLegacyTreeRootLevel()); + it.setAttribute("Refine", pm->adaptive ? 1 : 0); + it.setAttribute("Multilevel", pm->multilevel ? 
1 : 0); + + it.setAttribute("BlocksPerPE", pm->GetNbList()); + // TODO(pgrete) Add safety check for supported coarsening factors + // probably already in or before ctor + it.setAttribute("CoarseningFactor", coarsening_factor_); + + // Mesh block size + // TODO(pgrete) Check if we potentially can modify this to restart from coarse outs + const auto base_block_size = pm->GetDefaultBlockSize(); + it.setAttribute("MeshBlockSize", + std::vector{base_block_size.nx(X1DIR), base_block_size.nx(X2DIR), + base_block_size.nx(X3DIR)}); + + // RootGridDomain - float[9] array with xyz mins, maxs, rats (dx(i)/dx(i-1)) + it.setAttribute( + "RootGridDomain", + std::vector{pm->mesh_size.xmin(X1DIR), pm->mesh_size.xmax(X1DIR), + pm->mesh_size.xrat(X1DIR), pm->mesh_size.xmin(X2DIR), + pm->mesh_size.xmax(X2DIR), pm->mesh_size.xrat(X2DIR), + pm->mesh_size.xmin(X3DIR), pm->mesh_size.xmax(X3DIR), + pm->mesh_size.xrat(X3DIR)}); + + // Root grid size (number of cells at root level) + it.setAttribute("RootGridSize", + std::vector{pm->mesh_size.nx(X1DIR), pm->mesh_size.nx(X2DIR), + pm->mesh_size.nx(X3DIR)}); + + // Boundary conditions + auto arr_to_vec = [](const auto &arr) { + std::vector vec(BOUNDARY_NFACES); + for (int i = 0; i < BOUNDARY_NFACES; i++) { + vec[i] = arr.at(i); + } + return vec; + }; + it.setAttribute("BoundaryConditions", arr_to_vec(pm->mesh_bc_names)); + it.setAttribute("SwarmBoundaryConditions", arr_to_vec(pm->mesh_swarm_bc_names)); + } // Info section + + Kokkos::Profiling::popRegion(); // write Attributes + + // Write block metadata + if (!is_slice) { + // Manually gather all block data first as it allows us to use the (simpler) + // Attribute interface rather than writing a distributed dataset -- especially as all + // data is being read on restart by every rank anyway. + std::vector loc_local = OutputUtils::ComputeLocs(pm); + auto loc_global = FlattendedLocalToGlobal(pm, loc_local); + it.setAttribute("loc.lx123", loc_global); + + std::vector id_local = OutputUtils::ComputeIDsAndFlags(pm); + auto id_global = FlattendedLocalToGlobal(pm, id_local); + it.setAttribute("loc.level-gid-lid-cnghost-gflag", id_global); + + // derefinement count + std::vector derefcnt_local = OutputUtils::ComputeDerefinementCount(pm); + auto derefcnt_global = FlattendedLocalToGlobal(pm, derefcnt_local); + it.setAttribute("derefinement_count", derefcnt_global); + } + + // TODO(pgrete) check var name standard compatibility + // e.g., description: names of records and their components are only allowed to contain + // the characters a-Z, the numbers 0-9 and the underscore _ + + const int num_blocks_local = static_cast(pm->block_list.size()); + + // -------------------------------------------------------------------------------- // + // WRITING VARIABLES DATA // + // -------------------------------------------------------------------------------- // + Kokkos::Profiling::pushRegion("write all variable data"); + + auto &bounds = pm->block_list.front()->cellbounds; + // get list of all vars, just use the first block since the list is the same for all + // blocks + // TODO(pgrete) add restart_ var to output + // TODO(pgrete) check if this needs to be updated/unified with get_var logic in hdf5 + auto all_vars_info = GetAllVarsInfo( + GetVarsToWrite(pm->block_list.front(), true, output_params.variables), bounds); + + // Mirroring the SparseInfo handling in HDF5 here. + // Could probably be made easier by just sequentially filling vectors, but better be safe + // than sorry.
+ // + // We need to add information about the sparse variables to the output file, namely: + // 1) Which variables are sparse + // 2) Is a sparse id of a particular sparse variable allocated on a given block + // + // This information is stored in the dataset called "SparseInfo". The data set + // contains an attribute "SparseFields" that is a vector of strings with the names + // of the sparse fields (field name with sparse id, i.e. "bar_28", "bar_7", "foo_1", + // "foo_145"). The field names are in alphabetical order, which is the same order + // they show up in all_unique_vars (because it's a sorted set). + // + // The dataset SparseInfo itself is a 2D array of bools. The first index is the + // global block index and the second index is the sparse field (same order as the + // SparseFields attribute). SparseInfo[b][v] is true if the sparse field with index + // v is allocated on the block with index b, otherwise the value is false. + // If the logic here is ever updated, ensure to update the HDF5 logic, too. + std::vector sparse_names; + std::unordered_map sparse_field_idx; + for (auto &vinfo : all_vars_info) { + if (vinfo.is_sparse) { + sparse_field_idx.insert({vinfo.label, sparse_names.size()}); + sparse_names.push_back(vinfo.label); + } + } + auto num_sparse = sparse_names.size(); + // Note, we're using int8_t here to circumvent the global reduction of a bool vector, + // which would require much more boilerplate. + std::vector sparse_allocated(num_blocks_local * num_sparse); + std::vector sparse_dealloc_count(num_blocks_local * num_sparse); + + // We're currently writing (flushing) one var at a time. This saves host memory but + // results in more, smaller writes. Might be updated in the future. + // Allocate space for largest size variable + // Could in principle be reduced for coarsened outputs, but better safe than + // sorry given the edge cases with non-cell-centered vars. + int var_size_max = 0; + for (auto &vinfo : all_vars_info) { + const auto var_size = vinfo.Size(); + var_size_max = std::max(var_size_max, var_size); + } + + using OutT = typename std::conditional::type; + std::vector tmp_data(var_size_max * num_blocks_local); + + // for each variable we write + for (auto &vinfo : all_vars_info) { + PARTHENON_INSTRUMENT_REGION("Write variable loop") + + // Reset host write buffer. Not really necessary, but doesn't hurt. + memset(tmp_data.data(), 0, tmp_data.size() * sizeof(OutT)); + uint64_t tmp_offset = 0; + + if (vinfo.is_vector) { + // sanity check + PARTHENON_REQUIRE_THROWS( + vinfo.GetDim(4) == pm->ndim && vinfo.GetDim(5) == 1 && vinfo.GetDim(6) == 1, + "A 'standard' vector is expected to only have components matching the " + "dimensionality of the simulation.") + } + + // for each local mesh block + for (size_t b_idx = 0; b_idx < num_blocks_local; ++b_idx) { + const auto &pmb = pm->block_list[b_idx]; + // TODO(pgrete) check if we should skip the suffix for level 0 + const auto level = pmb->loc.level() - pm->GetRootLevel(); + for (const auto &te : vinfo.topological_elements) { + for (int comp_idx = 0; comp_idx < vinfo.component_labels.size(); comp_idx++) { + const auto [record_name, comp_name] = + OpenPMDUtils::GetMeshRecordAndComponentNames(vinfo, te, comp_idx, level); + + // Create the mesh_record for this variable at the given level (if it doesn't + // exist yet) + if (!it.meshes.contains(record_name)) { + auto mesh_record = it.meshes[record_name]; + + // The following attributes are shared across all components of the record.
+ + PARTHENON_REQUIRE_THROWS( + typeid(Coordinates_t) == typeid(UniformCartesian), + "OpenPMD in Parthenon currently only supports Cartesian coordinates."); + mesh_record.setGeometry(openPMD::Mesh::Geometry::cartesian); + auto &coords = pmb->coords; + // For uniform Cartesian, all dxN are const across the block so we just pick + // the first index. + Real dx1 = coords.CellWidth(0, 0, 0) * coarsening_factor_; + Real dx2 = coords.CellWidth(0, 0, 0) * coarsening_factor_; + Real dx3 = coords.CellWidth(0, 0, 0) * coarsening_factor_; + + // TODO(pgrete) check if this should be tied to the MemoryLayout + mesh_record.setDataOrder(openPMD::Mesh::DataOrder::C); + + auto mesh_comp = mesh_record[comp_name]; + // TODO(pgrete) This feels wrong for deep hierachies... Check with OPMD people + auto effective_nx = static_cast(std::pow(2, level)); + openPMD::Extent global_extent; + if (pm->ndim == 3) { + auto grid_spacing = std::vector{dx3, dx2, dx1}; + auto axis_labels = std::vector{"z", "y", "x"}; + auto global_offset = std::vector{ + pm->mesh_size.xmin(X3DIR), + pm->mesh_size.xmin(X2DIR), + pm->mesh_size.xmin(X1DIR), + }; + auto position = std::vector{0.5 - 0.5 * TopologicalOffsetK(te), + 0.5 - 0.5 * TopologicalOffsetJ(te), + 0.5 - 0.5 * TopologicalOffsetI(te)}; + global_extent = { + static_cast(pm->mesh_size.nx(X3DIR) / + coarsening_factor_) * + effective_nx + + TopologicalOffsetK(te), + static_cast(pm->mesh_size.nx(X2DIR) / + coarsening_factor_) * + effective_nx + + TopologicalOffsetJ(te), + static_cast(pm->mesh_size.nx(X1DIR) / + coarsening_factor_) * + effective_nx + + TopologicalOffsetI(te), + }; + int remove_comp = -1; + if (output_type == SubOutputType::X1Slice) { + remove_comp = 2; + } else if (output_type == SubOutputType::X2Slice) { + remove_comp = 1; + } else if (output_type == SubOutputType::X3Slice) { + remove_comp = 0; + } + if (remove_comp >= 0) { + grid_spacing.erase(grid_spacing.begin() + remove_comp); + axis_labels.erase(axis_labels.begin() + remove_comp); + global_offset.erase(global_offset.begin() + remove_comp); + position.erase(position.begin() + remove_comp); + global_extent.erase(global_extent.begin() + remove_comp); + } + mesh_record.setGridSpacing(grid_spacing); + mesh_record.setAxisLabels(axis_labels); + mesh_record.setGridGlobalOffset(global_offset); + mesh_comp.setPosition(position); + } else if (pm->ndim == 2) { + mesh_record.setGridSpacing(std::vector{dx2, dx1}); + mesh_record.setAxisLabels({"y", "x"}); + mesh_record.setGridGlobalOffset({ + pm->mesh_size.xmin(X2DIR), + pm->mesh_size.xmin(X1DIR), + }); + + mesh_comp.setPosition( + std::vector{0.5 - 0.5 * TopologicalOffsetJ(te), + 0.5 - 0.5 * TopologicalOffsetI(te)}); + global_extent = { + static_cast(pm->mesh_size.nx(X2DIR) / + coarsening_factor_) * + effective_nx + + TopologicalOffsetJ(te), + static_cast(pm->mesh_size.nx(X1DIR) / + coarsening_factor_) * + effective_nx + + TopologicalOffsetI(te), + }; + + } else { + PARTHENON_THROW("1D output for openpmd not yet supported."); + } + // Handling this here to now re-reset dataset later when iterating through the + // blocks + auto const dataset = + openPMD::Dataset(openPMD::determineDatatype(), global_extent); + // TODO(pgrete) check whether this should/need to be a collective so that the + // mesh generation should be done across all ranks prior to writing data, + // rather than in-situ for the local blocks only + mesh_comp.resetDataset(dataset); + + // TODO(pgrete) need unitDimension and timeOffset for this record? 
+ } + } + } + + // Now that the mesh record exists, actually write the data + auto out_var = pmb->meshblock_data.Get()->GetVarPtr(vinfo.label); + + if (out_var->IsAllocated()) { + // TODO(pgrete) check if we can work with a direct copy from a subview to not + // duplicate the memory footprint here +#if 0 + // Pick a subview of the active cells of this component + auto const data = Kokkos::subview( + var->data, 0, 0, icomp, std::make_pair(kb.s, kb.e + 1), + std::make_pair(jb.s, jb.e + 1), std::make_pair(ib.s, ib.e + 1)); + + // Map a view onto a host allocation (so that we can call deep_copy) + auto component_buffer = buffer_list.emplace_back(ncells); + Kokkos::View> + component_buffer_view(component_buffer.data(), nk, nj, ni); + Kokkos::deep_copy(component_buffer_view, data); +#endif + auto &coords = pmb->coords; + auto out_var_h = out_var->data.GetHostMirrorAndCopy(); + for (const auto &te : vinfo.topological_elements) { + auto ib = bounds.GetBoundsI(IndexDomain::interior, te); + auto jb = bounds.GetBoundsJ(IndexDomain::interior, te); + auto kb = bounds.GetBoundsK(IndexDomain::interior, te); + int comp_idx = 0; + const auto &Nt = out_var->GetDim(6); + const auto &Nu = out_var->GetDim(5); + const auto &Nv = out_var->GetDim(4); + // loop over all components + for (int t = 0; t < Nt; ++t) { + for (int u = 0; u < Nu; ++u) { + for (int v = 0; v < Nv; ++v) { + const auto [record_name, comp_name] = + OpenPMDUtils::GetMeshRecordAndComponentNames(vinfo, te, comp_idx, + level); + auto mesh_comp = it.meshes[record_name][comp_name]; + + const auto comp_offset = tmp_offset; + for (int k = kb.s; k <= kb.e; ++k) { + for (int j = jb.s; j <= jb.e; ++j) { + for (int i = ib.s; i <= ib.e; ++i) { + // Skip cells for coarse grained outputs + if (((i - ib.s) % coarsening_factor_ != 0) || + ((j - jb.s) % coarsening_factor_ != 0) || + ((k - kb.s) % coarsening_factor_ != 0)) { + continue; + } + // Skip cells outside slices + if (is_slice) { + if (output_type == SubOutputType::X1Slice) { + if (slice_loc < coords.Xf(k, j, i)) continue; + if (slice_loc >= coords.Xf(k, j, i + coarsening_factor_)) + continue; + } else if (output_type == SubOutputType::X2Slice) { + if (slice_loc < coords.Xf(k, j, i)) continue; + if (slice_loc >= coords.Xf(k, j + coarsening_factor_, i)) + continue; + } else if (output_type == SubOutputType::X3Slice) { + if (slice_loc < coords.Xf(k, j, i)) continue; + if (slice_loc >= coords.Xf(k + coarsening_factor_, j, i)) + continue; + } else { + PARTHENON_FAIL("Unclear how I got here."); + } + } + tmp_data[tmp_offset] = static_cast( + out_var_h(static_cast(te) % 3, t, u, v, k, j, i)); + + tmp_offset++; + } + } + } + // if no data was being selected + if (comp_offset == tmp_offset) { + continue; + } + const auto [chunk_offset, chunk_extent] = + OpenPMDUtils::GetChunkOffsetAndExtent(pm, pmb, te, coarsening_factor_, + output_type); + + mesh_comp.storeChunkRaw(&tmp_data[comp_offset], chunk_offset, + chunk_extent); + comp_idx += 1; + } + } + } // loop over components + } // loop over topological elements + } // out_var->IsAllocated() + if (vinfo.is_sparse) { + auto sparse_idx = sparse_field_idx.at(vinfo.label); + sparse_allocated.at(b_idx * num_sparse + sparse_idx) = + static_cast(out_var->IsAllocated()); + sparse_dealloc_count.at(b_idx * num_sparse + sparse_idx) = out_var->dealloc_count; + } + } // loop over blocks + it.seriesFlush(); + } // loop over vars + Kokkos::Profiling::popRegion(); // write all variable data + + // -------------------------------------------------------------------------------- // 
+ // WRITING Sparse metadata // + // -------------------------------------------------------------------------------- // + if (!is_slice && num_sparse > 0) { + auto sparse_allocated_global = FlattendedLocalToGlobal(pm, sparse_allocated); + it.setAttribute("SparseInfo", sparse_allocated_global); + it.setAttribute("SparseFields", sparse_names); + auto sparse_dealloc_count_global = + FlattendedLocalToGlobal(pm, sparse_dealloc_count); + it.setAttribute("SparseDeallocCount", sparse_dealloc_count_global); + } + + // -------------------------------------------------------------------------------- // + // WRITING PARTICLE DATA // + // -------------------------------------------------------------------------------- // + if (!is_slice) { + Kokkos::Profiling::pushRegion("write particle data"); + // TODO(pgrete) as above, first wrt differentiating between restart_ (last arg) + AllSwarmInfo all_swarm_info(pm->block_list, output_params.swarms, + DumpOutputMode::RESTART); + for (auto &[swname, swinfo] : all_swarm_info.all_info) { + openPMD::ParticleSpecies swm = it.particles[swname]; + // These indicate particles/meshblock and location in global index + // space where each meshblock starts + auto counts_global = FlattendedLocalToGlobal(pm, swinfo.counts); + swm.setAttribute("counts", counts_global); + auto offsets_global = FlattendedLocalToGlobal(pm, swinfo.offsets); + swm.setAttribute("offsets", offsets_global); + + if (swinfo.global_count == 0) { + continue; + } + + OpenPMDUtils::WriteSwarmVar(swinfo, swm, it); + OpenPMDUtils::WriteSwarmVar(swinfo, swm, it); + OpenPMDUtils::WriteSwarmVar(swinfo, swm, it); + + // From the HDF5 output: + // If swarm does not contain an "id" object, generate a sequential + // one for vis. + // BUT PG: this may break things in unpredicable ways + // I'm in favor of enforcing a global id somehow. We shold discuss. + PARTHENON_REQUIRE_THROWS(swinfo.var_info.count(swarm_position::id::name()) != 0 || + swinfo.var_info.count("id") != 0, + "Particles should always carry a unique, persistent id!"); + } + Kokkos::Profiling::popRegion(); // write particle data + } + // The iteration can be closed in order to help free up resources. + // The iteration's content will be flushed automatically. + // An iteration once closed cannot (yet) be reopened. + it.close(); + series.close(); + Kokkos::Profiling::popRegion(); // WriteOutputFile???Prec +} +// explicit template instantiation +template void +OpenPMDOutput::WriteOutputFileImpl(Mesh *pm, ParameterInput *pin, SimTime *tm, + const SignalHandler::OutputSignal signal); +template void +OpenPMDOutput::WriteOutputFileImpl(Mesh *pm, ParameterInput *pin, SimTime *tm, + const SignalHandler::OutputSignal signal); + +} // namespace parthenon diff --git a/src/outputs/parthenon_opmd.hpp b/src/outputs/parthenon_opmd.hpp new file mode 100644 index 000000000000..e4c9e3b134a0 --- /dev/null +++ b/src/outputs/parthenon_opmd.hpp @@ -0,0 +1,70 @@ +//======================================================================================== +// Parthenon performance portable AMR framework +// Copyright(C) 2024-2025 The Parthenon collaboration +// Licensed under the 3-clause BSD License, see LICENSE file for details +//======================================================================================== +#ifndef OUTPUTS_PARTHENON_OPMD_HPP_ +#define OUTPUTS_PARTHENON_OPMD_HPP_ +//! 
\file parthenon_opmd.hpp +// \brief Provides common utilities for OpenPMD output and restarts + +// C++ stdlib +#include +#include +#include + +// OpenPMD headers +#include + +#include "basic_types.hpp" +#include "mesh/meshblock.hpp" +#include "outputs/output_utils.hpp" + +namespace parthenon { + +namespace OpenPMDUtils { + +enum class SubOutputType { Restart, X1Slice, X2Slice, X3Slice }; + +template +void RestoreViewAttribute(const std::string &full_path, T &view, openPMD::Iteration *it); + +void WriteAllParams(const Params &params, const std::string &prefix, + openPMD::Iteration *it); + +// Delimiter to separate packages and parameters in attributes. +// More or less a workaround as the OpenPMD API does not currently expose +// access to non-standard groups (such as "Params" versus the standard "meshes"). +inline static const std::string delim = "~"; + +// Construct OpenPMD Mesh "record" name and component identifier. +// - te is the TopologicalElement (which is used as part of the variable name record) +// - comp_idx is a flattened index over all components of the vectors and tensors, i.e., +// the typical v,u,t indices. +// - level is the current effective level of the Mesh record +std::tuple +GetMeshRecordAndComponentNames(const OutputUtils::VarInfo &vinfo, + const TopologicalElement te, const int comp_idx, + const int level); + +// Calculate logical location on effective mesh (i.e., a mesh with size that matches full +// coverage at given resolution on a particular level) +// TODO(pgrete) needs to be updated to properly work with Forests +std::tuple +GetChunkOffsetAndExtent(Mesh *pm, std::shared_ptr pmb, + const TopologicalElement te, const int coarsening_factor, + const SubOutputType output_type); + +// Construct OpenPMD Particle "record" name and component identifier. +// - vname is the variable name +// - rank is the variable rank (i.e., 0 is scalar etc) +// - comp_idx is a flattened index over all components of the vectors and tensors, i.e., +// the typical v,u,t indices. +std::tuple +GetParticleRecordAndComponentNames(const std::string &vname, const int rank, + const int flat_comp_idx); + +} // namespace OpenPMDUtils +} // namespace parthenon + +#endif // OUTPUTS_PARTHENON_OPMD_HPP_ diff --git a/src/outputs/restart.hpp b/src/outputs/restart.hpp index 022c4adf684d..e61cfe2dd6d4 100644 --- a/src/outputs/restart.hpp +++ b/src/outputs/restart.hpp @@ -106,7 +106,13 @@ class RestartReader { // fills internal data for given pointer virtual void ReadBlocks(const std::string &name, IndexRange range, const OutputUtils::VarInfo &info, std::vector &dataVec, - int file_output_format_version) const = 0; + Mesh *pmesh) const = 0; + + // The PackOrUnpack logic requires knowledge of how data is stored and being read into + // the buffer. For HDF5 data is padded if needed (i.e., a face centered field has dims + // nx#+1 in all dimensions) while for OpenPMD it's not (i.e., a face centered field has dims + // nx1+1, nx2, nx3 in case of the F1 field). + [[nodiscard]] virtual bool BlockdataIsPadded() const = 0; // Gets the data from a swarm var on current rank. Assumes all // blocks are contiguous.
Fills dataVec based on shape from swarmvar @@ -130,7 +136,10 @@ class RestartReader { virtual void ReadParams(const std::string &name, Params &p) = 0; - [[nodiscard]] virtual bool VariableExists(const std::string &name) const = 0; + enum class DataType { Field, Swarm, SwarmVar }; + [[nodiscard]] virtual bool + VariableExists(const std::string &name, const DataType data_type, + const std::string swarmvarname = "") const = 0; // closes out the restart file // perhaps belongs in a destructor? diff --git a/src/outputs/restart_hdf5.cpp b/src/outputs/restart_hdf5.cpp index 5e5066baf18b..67780f54fd75 100644 --- a/src/outputs/restart_hdf5.cpp +++ b/src/outputs/restart_hdf5.cpp @@ -57,6 +57,15 @@ RestartReaderHDF5::RestartReaderHDF5(const char *filename) : filename_(filename) params_group_ = H5G::FromHIDCheck(H5Oopen(fh_, "Params", H5P_DEFAULT)); has_ghost = GetAttr("Info", "IncludesGhost"); + + // Currently supports versions 3 and 4. + const auto file_output_format_ver = GetOutputFormatVersion(); + if (file_output_format_ver < HDF5::OUTPUT_VERSION_FORMAT - 1) { + std::stringstream msg; + msg << "File format version " << file_output_format_ver << " not supported. " + << "Current format is " << HDF5::OUTPUT_VERSION_FORMAT << std::endl; + PARTHENON_THROW(msg) + } #endif // ENABLE_HDF5 } @@ -208,8 +217,7 @@ void RestartReaderHDF5::ReadParams(const std::string &name, Params &p) { } void RestartReaderHDF5::ReadBlocks(const std::string &name, IndexRange range, const OutputUtils::VarInfo &info, - std::vector &dataVec, - int file_output_format_version) const { + std::vector &dataVec, Mesh * /*pmesh*/) const { #ifndef ENABLE_HDF5 PARTHENON_FAIL("Restart functionality is not available because HDF5 is disabled"); #else // HDF5 enabled @@ -227,15 +235,7 @@ void RestartReaderHDF5::ReadBlocks(const std::string &name, IndexRange range, count[0] = static_cast(range.e - range.s + 1); const IndexDomain domain = has_ghost != 0 ? IndexDomain::entire : IndexDomain::interior; - // Currently supports versions 3 and 4. - if (file_output_format_version >= HDF5::OUTPUT_VERSION_FORMAT - 1) { - total_dim = info.FillShape(domain, &(count[1])) + 1; - } else { - std::stringstream msg; - msg << "File format version " << file_output_format_version << " not supported. " - << "Current format is " << HDF5::OUTPUT_VERSION_FORMAT << std::endl; - PARTHENON_THROW(msg) - } + total_dim = info.FillShape(domain, &(count[1])) + 1; hsize_t total_count = 1; for (int i = 0; i < total_dim; ++i) { @@ -248,6 +248,7 @@ void RestartReaderHDF5::ReadBlocks(const std::string &name, IndexRange range, std::to_string(total_count) + ")"); const H5S memspace = H5S::FromHIDCheck(H5Screate_simple(total_dim, count, NULL)); + // TODO(reviewer) What's going on here? The follow line is identical to the one above. PARTHENON_HDF5_CHECK( H5Sselect_hyperslab(hdl.dataspace, H5S_SELECT_SET, offset, NULL, count, NULL)); diff --git a/src/outputs/restart_hdf5.hpp b/src/outputs/restart_hdf5.hpp index dd49562be38f..f73246b47370 100644 --- a/src/outputs/restart_hdf5.hpp +++ b/src/outputs/restart_hdf5.hpp @@ -116,7 +116,12 @@ class RestartReaderHDF5 : public RestartReader { // fills internal data for given pointer void ReadBlocks(const std::string &name, IndexRange range, const OutputUtils::VarInfo &info, std::vector &dataVec, - int file_output_format_version) const override; + Mesh *pmesh) const override; + + // The PackOrUnpack logic requires knowledge of how data is stored and being read into + // the buffer. 
For HDF5 data is padded if needed (i.e., a face centered field has tims + // nx#+1 in all dimensions). + [[nodiscard]] bool BlockdataIsPadded() const override { return true; }; // Gets the data from a swarm var on current rank. Assumes all // blocks are contiguous. Fills dataVec based on shape from swarmvar @@ -229,13 +234,23 @@ class RestartReaderHDF5 : public RestartReader { void ReadParams(const std::string &name, Params &p) override; - [[nodiscard]] bool VariableExists(const std::string &name) const override { + [[nodiscard]] bool VariableExists(const std::string &name, const DataType data_type, + const std::string swarmvarname = "" + + ) const override { #ifdef ENABLE_HDF5 - // make sure dataset exists - // disabling error handling/printing as we take care of it + // Make sure dataset exists. Our HDF5 output does not differentiate between + // fields and swarms, so we can ignore the data_type. Note, we may eventually + // want to fix this as swarms and fields with the same name may cause issues. + // disable error handling/printing while probing so missing datasets do not + // spam the log, then restore the aborting handler. + std::string full_name = name; + if (data_type == DataType::SwarmVar) { + full_name = name + "/SwarmVars/" + swarmvarname; + } H5Eset_auto(H5E_DEFAULT, NULL, NULL); - auto status = H5Oexists_by_name(fh_, name.c_str(), H5P_DEFAULT); - // reenable HDF5 error handling to throw an error + auto status = + PARTHENON_HDF5_CHECK(H5Oexists_by_name(fh_, full_name.c_str(), H5P_DEFAULT)); H5Eset_auto(H5E_DEFAULT, aborting_error_handler, NULL); return status > 0; #else diff --git a/src/outputs/restart_opmd.cpp b/src/outputs/restart_opmd.cpp new file mode 100644 index 000000000000..41cf9350c46e --- /dev/null +++ b/src/outputs/restart_opmd.cpp @@ -0,0 +1,262 @@ +//======================================================================================== +// Parthenon performance portable AMR framework +// Copyright(C) 2024-2025 The Parthenon collaboration +// Licensed under the 3-clause BSD License, see LICENSE file for details +//======================================================================================== +//! \file restart_opmd.cpp +// \brief Restarts a simulation from an OpenPMD output with ADIOS2 backend + +#include +#include +#include +#include +#include +#include +#include +#include + +// OpenPMD headers +#include + +#include "basic_types.hpp" +#include "interface/params.hpp" +#include "outputs/output_attr.hpp" +#include "outputs/parthenon_opmd.hpp" +#include "outputs/restart.hpp" +#include "outputs/restart_opmd.hpp" +#include "utils/error_checking.hpp" + +namespace parthenon { + +//---------------------------------------------------------------------------------------- +//! \fn void RestartReader::RestartReader(const std::string filename) +// \brief Opens the restart file and stores appropriate file handle in fh_ +RestartReaderOPMD::RestartReaderOPMD(const char *filename) : filename_(filename) { + // This silly logic is required as the unit tests may or may not define MPI_PARALLEL but + // are always run in serial. 
+#ifdef MPI_PARALLEL + int mpi_initialized; + PARTHENON_MPI_CHECK(MPI_Initialized(&mpi_initialized)); + if (mpi_initialized) { + series = openPMD::Series(filename, openPMD::Access::READ_ONLY, MPI_COMM_WORLD); + } else { + series = openPMD::Series(filename, openPMD::Access::READ_ONLY); + } +#else + series = openPMD::Series(filename, openPMD::Access::READ_ONLY); + +#endif + PARTHENON_REQUIRE_THROWS( + series.iterations.size() == 1, + "Parthenon restarts should only contain one iteration/timestep."); + std::uint64_t idx; + for (const auto &i : series.iterations) { + idx = i.first; + } + it = std::make_unique(series.iterations[idx]); + // Explicitly open (important for parallel execution) + it->open(); +} + +int RestartReaderOPMD::GetOutputFormatVersion() const { + // TODO(pgrete) move info to shared header and introduce constexpr var + if (it->containsAttribute("OutputFormatVersion")) { + return it->getAttribute("OutputFormatVersion").get(); + } else { + return -1; + } +} + +RestartReaderOPMD::SparseInfo RestartReaderOPMD::GetSparseInfo() const { + SparseInfo info; + // Only read if data exists. Otherwise return default constructed. + if (it->containsAttribute("SparseInfo")) { + auto sinfo_vec = it->getAttribute("SparseInfo").get>(); + info.labels = it->getAttribute("SparseFields").get>(); + info.num_sparse = static_cast(info.labels.size()); + info.num_blocks = sinfo_vec.size() / info.num_sparse; + info.dealloc_count = it->getAttribute("SparseDeallocCount").get>(); + + // copy "vector" data to bool pointer for compatiblity between output backends + info.allocated.reset(new bool[sinfo_vec.size()]); + for (int i = 0; i < sinfo_vec.size(); i++) { + info.allocated[i] = sinfo_vec.at(i); + } + } + + return info; +} + +RestartReaderOPMD::MeshInfo RestartReaderOPMD::GetMeshInfo() const { + RestartReaderOPMD::MeshInfo mesh_info; + mesh_info.nbnew = it->getAttribute("NBNew").get(); + mesh_info.nbdel = it->getAttribute("NBDel").get(); + mesh_info.nbtotal = it->getAttribute("NumMeshBlocks").get(); + mesh_info.root_level = it->getAttribute("RootLevel").get(); + + mesh_info.block_size = it->getAttribute("MeshBlockSize").get>(); + mesh_info.includes_ghost = it->getAttribute("IncludesGhost").get(); + mesh_info.n_ghost = it->getAttribute("NGhost").get(); + + mesh_info.grid_dim = it->getAttribute("RootGridDomain").get>(); + mesh_info.lx123 = it->getAttribute("loc.lx123").get>(); + mesh_info.level_gid_lid_cnghost_gflag = + it->getAttribute("loc.level-gid-lid-cnghost-gflag").get>(); + mesh_info.derefinement_count = + it->getAttribute("derefinement_count").get>(); + + return mesh_info; +} + +SimTime RestartReaderOPMD::GetTimeInfo() const { + SimTime time_info{}; + + time_info.time = it->time(); + time_info.dt = it->dt(); + time_info.ncycle = it->getAttribute("NCycle").get(); + + return time_info; +} +// Gets the counts and offsets for MPI ranks for the meshblocks set +// by the indexrange. Returns the total count on this rank. 
+std::size_t RestartReaderOPMD::GetSwarmCounts(const std::string &swarm, + const IndexRange &range, + std::vector &counts, + std::vector &offsets) { + // datasets + auto counts_dset = + it->particles[swarm].getAttribute("counts").get>(); + auto offsets_dset = + it->particles[swarm].getAttribute("offsets").get>(); + + // Read data for requested blocks in range + counts.resize(range.e - range.s + 1); + offsets.resize(range.e - range.s + 1); + + std::copy(counts_dset.begin() + range.s, counts_dset.begin() + range.e + 1, + counts.begin()); + std::copy(offsets_dset.begin() + range.s, offsets_dset.begin() + range.e + 1, + offsets.begin()); + + // Compute total count rank + std::size_t total_count_on_rank = std::accumulate(counts.begin(), counts.end(), 0); + return total_count_on_rank; +} + +template +void RestartReaderOPMD::ReadAllParamsOfType(const std::string &prefix, Params ¶ms) { + for (const auto &key : params.GetKeys()) { + using OpenPMDUtils::delim; + const auto type = params.GetType(key); + auto mutability = params.GetMutability(key); + if (type == std::type_index(typeid(T)) && mutability == Params::Mutability::Restart) { + auto full_path = prefix + delim + key; + // The '/' is kind of a reserved character in the OpenPMD standard, which results + // in attribute keys with said character not being exposed. + // Thus we replace it. + std::replace(full_path.begin(), full_path.end(), '/', delim[0]); + + try { + T val; + if constexpr (implements::value) { + val = params.Get(key); + RestoreViewAttribute(full_path, val); + } else if constexpr (is_specialization_of::value) { + val = params.Get(key); + auto &view = val.KokkosView(); + RestoreViewAttribute(full_path, view); + } else { + val = it->getAttribute(full_path).get(); + } + params.Update(key, val); + } catch (...) { + // TODO(JMM/PG) Add failed load list of "fail/needs fix" list + if (Globals::my_rank == 0) { + std::stringstream ss; + ss << "Failed to load parameter " << full_path + << " from the restart file! Using default value." << std::endl; + PARTHENON_WARN(ss); + } + } + } + } +} + +template +void RestartReaderOPMD::ReadAllParamsOfMultipleTypes(const std::string &prefix, + Params &p) { + ([&] { ReadAllParamsOfType(prefix, p); }(), ...); +} + +template +void RestartReaderOPMD::ReadAllParams(const std::string &pkg_name, Params &p) { + ReadAllParamsOfMultipleTypes(pkg_name, p); +} +void RestartReaderOPMD::ReadParams(const std::string &pkg_name, Params &p) { + using OpenPMDUtils::delim; + const auto prefix = "Params" + delim + pkg_name; + ReadAllParams(prefix, p); + ReadAllParams(prefix, p); + ReadAllParams(prefix, p); + ReadAllParams(prefix, p); + ReadAllParams(prefix, p); + ReadAllParams(prefix, p); + + // strings (not supported in Kokkos Views) + ReadAllParamsOfType(prefix, p); + ReadAllParamsOfType>(prefix, p); + // TODO(pgrete) same as for the writing. 
fix vec of bool + ReadAllParamsOfType(prefix, p); +} + +void RestartReaderOPMD::ReadBlocks(const std::string &var_name, IndexRange block_range, + const OutputUtils::VarInfo &vinfo, + std::vector &data_vec, Mesh *pm) const { + int64_t comp_offset = 0; // offset data_vector to store component data + for (auto &pmb : pm->block_list) { + // TODO(pgrete) check if we should skip the suffix for level 0 + const auto level = pmb->loc.level() - pm->GetRootLevel(); + + for (const auto &te : vinfo.topological_elements) { + int comp_idx = 0; // used in label for non-vector variables + const auto &Nt = vinfo.GetDim(6); + const auto &Nu = vinfo.GetDim(5); + const auto &Nv = vinfo.GetDim(4); + // loop over all components + for (int t = 0; t < Nt; ++t) { + for (int u = 0; u < Nu; ++u) { + for (int v = 0; v < Nv; ++v) { + // Get the correct record + const auto [record_name, comp_name] = + OpenPMDUtils::GetMeshRecordAndComponentNames(vinfo, te, comp_idx, level); + + PARTHENON_REQUIRE_THROWS(it->meshes.contains(record_name), + "Missing mesh record '" + record_name + + "' in restart file."); + auto mesh_record = it->meshes[record_name]; + PARTHENON_REQUIRE_THROWS(mesh_record.contains(comp_name), + "Missing component'" + comp_name + + "' in mesh record '" + record_name + + "' of restart file."); + auto mesh_comp = mesh_record[comp_name]; + + // Restarting from coarsened output not supported at the moment + const int coarsening_factor = 1; + const auto [chunk_offset, chunk_extent] = + OpenPMDUtils::GetChunkOffsetAndExtent( + pm, pmb, te, coarsening_factor, OpenPMDUtils::SubOutputType::Restart); + mesh_comp.loadChunkRaw(&data_vec[comp_offset], chunk_offset, chunk_extent); + comp_offset += std::accumulate(chunk_extent.cbegin(), chunk_extent.cend(), 1, + std::multiplies{}); + comp_idx += 1; + } + } + } // loop over components + } // loop over topological elements + } // loop over blocks + + // Now actually read the registered chunks form disk + it->seriesFlush(); +} + +} // namespace parthenon diff --git a/src/outputs/restart_opmd.hpp b/src/outputs/restart_opmd.hpp new file mode 100644 index 000000000000..6a503aa0cfe7 --- /dev/null +++ b/src/outputs/restart_opmd.hpp @@ -0,0 +1,187 @@ +//======================================================================================== +// Parthenon performance portable AMR framework +// Copyright(C) 2024-2025 The Parthenon collaboration +// Licensed under the 3-clause BSD License, see LICENSE file for details +//======================================================================================== +#ifndef OUTPUTS_RESTART_OPMD_HPP_ +#define OUTPUTS_RESTART_OPMD_HPP_ +//! \file restart_opmd.hpp +// \brief Provides support for restarting from OpenPMD output + +#include +#include +#include +#include + +// OpenPMD headers +#include + +#include "basic_types.hpp" +#include "outputs/parthenon_opmd.hpp" +#include "outputs/restart.hpp" +#include "pack/swarm_default_names.hpp" + +#include "mesh/domain.hpp" + +namespace parthenon { + +class Mesh; +class Param; + +class RestartReaderOPMD : public RestartReader { + public: + explicit RestartReaderOPMD(const char *filename); + + [[nodiscard]] SparseInfo GetSparseInfo() const override; + + [[nodiscard]] MeshInfo GetMeshInfo() const override; + + [[nodiscard]] SimTime GetTimeInfo() const override; + + [[nodiscard]] std::string GetInputString() const override { + return it->getAttribute("InputFile").get(); + }; + + // Return output format version number. Return -1 if not existent. 
+ [[nodiscard]] int GetOutputFormatVersion() const override; + + // Current not supported + [[nodiscard]] int HasGhost() const override { return 0; }; + + public: + // Gets data for all blocks on current rank. + // Assumes blocks are contiguous + // fills internal data for given pointer + void ReadBlocks(const std::string &name, IndexRange range, + const OutputUtils::VarInfo &info, std::vector &dataVec, + Mesh *pmesh) const override; + + // The PackOrUnpack logic requires knowledge of how data is stored and being read into + // the buffer. OpenPMD is dense (i.e., a face centered field has dims + // nx1+1, nx2, nx3 in case of the F1 field). + [[nodiscard]] bool BlockdataIsPadded() const override { return false; }; + + // Gets the data from a swarm var on current rank. Assumes all + // blocks are contiguous. Fills dataVec based on shape from swarmvar + // metadata. + template + void ReadSwarmVar(const std::string &swarmname, const std::string &varname, + const std::size_t count, const std::size_t offset, const Metadata &m, + std::vector &data_vec) { + openPMD::ParticleSpecies swm = it->particles[swarmname]; + + const auto &shape = m.Shape(); + const int rank = shape.size(); + std::size_t ncomp = 1; + for (int i = 0; i < rank; ++i) { + ncomp *= shape[rank - 1 - i]; + } + std::size_t total_count = ncomp * count; + if (data_vec.size() < total_count) { // greedy re-alloc + data_vec.resize(total_count); + } + + for (auto n = 0; n < ncomp; n++) { + auto [particle_record, particle_record_component] = + OpenPMDUtils::GetParticleRecordAndComponentNames(varname, rank, n); + openPMD::RecordComponent rc = swm[particle_record][particle_record_component]; + rc.loadChunkRaw(&data_vec[n * count], {offset}, {count}); + } + + // Now actually read the registered chunks form disk + it->seriesFlush(); + } + + void ReadSwarmVar(const std::string &swarmname, const std::string &varname, + const std::size_t count, const std::size_t offset, const Metadata &m, + std::vector &dataVec) override { + ReadSwarmVar<>(swarmname, varname, count, offset, m, dataVec); + }; + void ReadSwarmVar(const std::string &swarmname, const std::string &varname, + const std::size_t count, const std::size_t offset, const Metadata &m, + std::vector &dataVec) override { + ReadSwarmVar<>(swarmname, varname, count, offset, m, dataVec); + }; + void ReadSwarmVar(const std::string &swarmname, const std::string &varname, + const std::size_t count, const std::size_t offset, const Metadata &m, + std::vector &dataVec) override { + ReadSwarmVar<>(swarmname, varname, count, offset, m, dataVec); + }; + + // Gets the counts and offsets for MPI ranks for the meshblocks set + // by the indexrange. Returns the total count on this rank. + [[nodiscard]] std::size_t GetSwarmCounts(const std::string &swarm, + const IndexRange &range, + std::vector &counts, + std::vector &offsets) override; + + void ReadParams(const std::string &name, Params &p) override; + + template + void RestoreViewAttribute(const std::string &full_path, T &view) { + auto rank_and_dims = + it->getAttribute(full_path + ".rankdims").get>(); + // Resize view. + typename T::array_layout layout; + for (int d = 0; d < rank_and_dims[0]; ++d) { + layout.dimension[d] = rank_and_dims[1 + d]; + } + // Cannot use Kokkos::resize here as it's ambiguous at this point. + // Also, resize() interally also just create a new view. 
+ view = T(Kokkos::view_alloc(Kokkos::WithoutInitializing, view.label()), layout); + auto view_h = Kokkos::create_mirror_view(HostMemSpace(), view); + + using base_t = typename std::remove_pointer::type; + auto flat_data = it->getAttribute(full_path).get>(); + for (auto i = 0; i < view_h.size(); i++) { + view_h.data()[i] = flat_data[i]; + } + Kokkos::deep_copy(view, view_h); + } + [[nodiscard]] bool VariableExists(const std::string &name, const DataType data_type, + const std::string swarmvarname = "") const override { + if (data_type == DataType::Field) { + // Given that MeshRecord labels also carry information about the topological element + // and level, we just check for the prefix (this silently assumes that if one + // matching record is found, then the variable exists on all levels/for all + // components). Might cause issue for edge cases (and or variable combinations that + // contain the `_` separator), but this should not be an issue as the error message + // in the OpenPMD restart reader is clear (about the variable) when reading fails + // later. + for (auto [label, mesh] : it->meshes) { + if (label.compare(0, name.length() + 1, name + "_") == 0) { + return true; + } + } + } else if (data_type == DataType::Swarm) { + return it->particles.contains(name); + } else if (data_type == DataType::SwarmVar) { + // rank = 0, and component index = 0 because we just care about the record name + auto [particle_record, particle_record_component] = + OpenPMDUtils::GetParticleRecordAndComponentNames(swarmvarname, 0, 0); + return it->particles[name].contains(particle_record); + } + return false; + } + // closes out the restart file + // perhaps belongs in a destructor? + void Close(); + + private: + const std::string filename_; + + openPMD::Series series; + // Iteration is a pointer because it cannot be default constructed (it depends on the + // Series). 
+ std::unique_ptr it; + + template + void ReadAllParamsOfType(const std::string &prefix, Params ¶ms); + template + void ReadAllParamsOfMultipleTypes(const std::string &prefix, Params &p); + template + void ReadAllParams(const std::string &pkg_name, Params &p); +}; + +} // namespace parthenon +#endif // OUTPUTS_RESTART_OPMD_HPP_ diff --git a/src/parthenon_manager.cpp b/src/parthenon_manager.cpp index 74f4b67f1c0f..841e694fe197 100644 --- a/src/parthenon_manager.cpp +++ b/src/parthenon_manager.cpp @@ -28,8 +28,6 @@ #include #include -#include - #include "amr_criteria/amr_criteria.hpp" #include "amr_criteria/refinement_package.hpp" #include "config.hpp" @@ -41,6 +39,9 @@ #include "outputs/outputs_package.hpp" #include "outputs/restart.hpp" #include "outputs/restart_hdf5.hpp" +#ifdef PARTHENON_ENABLE_OPENPMD +#include "outputs/restart_opmd.hpp" +#endif #include "utils/error_checking.hpp" #include "utils/utils.hpp" @@ -102,7 +103,18 @@ ParthenonStatus ParthenonManager::ParthenonInitEnv(int argc, char *argv[]) { if (arg.is_restart) { // Read input from restart file if (fs::path(arg.restart_filename).extension() == ".rhdf") { +#ifdef ENABLE_HDF5 restartReader = std::make_unique(arg.restart_filename); +#else // HDF5 disabled + PARTHENON_FAIL("Restart functionality is not available because HDF5 is disabled"); +#endif + } else if (fs::path(arg.restart_filename).extension() == ".bp") { +#ifdef PARTHENON_ENABLE_OPENPMD + restartReader = std::make_unique(arg.restart_filename); +#else + PARTHENON_FAIL("Trying to restart from OpenPMD file but OpenPMD support was not " + "compiled into Parthenon."); +#endif // ifdef PARTHENON_ENABLE_OPENPMD } else { PARTHENON_FAIL("Unsupported restart file format."); } @@ -260,9 +272,6 @@ ParthenonManager::ProcessPackagesDefault(std::unique_ptr &pin) { } void ParthenonManager::RestartPackages(Mesh &rm, RestartReader &resfile) { -#ifndef ENABLE_HDF5 - PARTHENON_FAIL("Restart functionality is not available because HDF5 is disabled"); -#else // HDF5 enabled // Restart packages with information for blocks in ids from the restart file // Assumption: blocks are contiguous in restart file, may have to revisit this. const IndexDomain theDomain = @@ -274,19 +283,9 @@ void ParthenonManager::RestartPackages(Mesh &rm, RestartReader &resfile) { int nbe = nbs + nb - 1; IndexRange myBlocks{nbs, nbe}; - // TODO(cleanup) why is this code here and not contained in the restart reader? std::cout << "Blocks assigned to rank " << Globals::my_rank << ": " << nbs << ":" << nbe << std::endl; - // Currently supports versions 3 and 4. - const auto file_output_format_ver = resfile.GetOutputFormatVersion(); - if (file_output_format_ver < HDF5::OUTPUT_VERSION_FORMAT - 1) { - std::stringstream msg; - msg << "File format version " << file_output_format_ver << " not supported. 
" - << "Current format is " << HDF5::OUTPUT_VERSION_FORMAT << std::endl; - PARTHENON_THROW(msg) - } - // Get list of variables, they are the same for all blocks (since all blocks have the // same variable metadata) const auto indep_restart_vars = @@ -320,8 +319,8 @@ void ParthenonManager::RestartPackages(Mesh &rm, RestartReader &resfile) { " is marked as sparse in restart file"); } - max_fillsize = - std::max(max_fillsize, static_cast(v_info.FillSize(theDomain))); + max_fillsize = std::max(max_fillsize, static_cast(v_info.FillSize( + theDomain, resfile.BlockdataIsPadded()))); } // make sure we have all sparse variables that are in the restart file @@ -336,10 +335,11 @@ void ParthenonManager::RestartPackages(Mesh &rm, RestartReader &resfile) { std::vector tmp(static_cast(nb) * max_fillsize); for (const auto &v_info : all_vars_info) { const auto vlen = v_info.num_components * v_info.ntop_elems; - const auto fill_size = v_info.FillSize(theDomain); + const auto fill_size = v_info.FillSize(theDomain, resfile.BlockdataIsPadded()); const auto &label = v_info.label; - auto var_missing_on_disk = !resfile.VariableExists(label); + auto var_missing_on_disk = + !resfile.VariableExists(label, RestartReader::DataType::Field); if (Globals::my_rank == 0) { std::cout << "Var: " << label << ":" << vlen << (var_missing_on_disk ? " missing on disk\n" : "\n"); @@ -351,7 +351,7 @@ void ParthenonManager::RestartPackages(Mesh &rm, RestartReader &resfile) { // Read relevant data from the hdf file, this works for dense and sparse variables // because sparse variables are currently densely written for HDF5. try { - resfile.ReadBlocks(label, myBlocks, v_info, tmp, file_output_format_ver); + resfile.ReadBlocks(label, myBlocks, v_info, tmp, &rm); // Variable does exist but could not be read. So we definitely want to fail here. } catch (std::exception &ex) { std::stringstream msg; @@ -382,19 +382,12 @@ void ParthenonManager::RestartPackages(Mesh &rm, RestartReader &resfile) { auto v_h = v->data.GetHostMirror(); // Double note that this also needs to be update in case - // we update the HDF5 infrastructure! - if (file_output_format_ver >= HDF5::OUTPUT_VERSION_FORMAT - 1) { - OutputUtils::PackOrUnpackVar( - v_info, resfile.HasGhost() != 0, index, - [&](auto index, int topo, int t, int u, int v, int k, int j, int i) { - v_h(topo, t, u, v, k, j, i) = tmp[index]; - }); - } else { - std::stringstream msg; - msg << "File format version " << file_output_format_ver << " not supported. " - << "Current format is " << HDF5::OUTPUT_VERSION_FORMAT << std::endl; - PARTHENON_THROW(msg) - } + // we update the OpenPMD/HDF5 infrastructure! + OutputUtils::PackOrUnpackVar( + v_info, resfile.HasGhost() != 0, resfile.BlockdataIsPadded(), index, + [&](auto index, int topo, int t, int u, int v, int k, int j, int i) { + v_h(topo, t, u, v, k, j, i) = tmp[index]; + }); v->data.DeepCopy(v_h); } @@ -406,7 +399,8 @@ void ParthenonManager::RestartPackages(Mesh &rm, RestartReader &resfile) { auto swarms = (mb.meshblock_data.Get()->GetSwarmData())->GetSwarmsByFlag(flags); for (auto &swarm : swarms) { auto swarmname = swarm->label(); - auto var_missing_on_disk = !resfile.VariableExists(swarmname); + auto var_missing_on_disk = + !resfile.VariableExists(swarmname, RestartReader::DataType::Swarm); if (Globals::my_rank == 0) { std::cout << "Swarm: " << swarmname << (var_missing_on_disk ? 
" missing on disk\n" : "\n"); @@ -443,7 +437,6 @@ void ParthenonManager::RestartPackages(Mesh &rm, RestartReader &resfile) { auto ¶ms = pkg->AllParams(); resfile.ReadParams(name, params); } -#endif // ifdef ENABLE_HDF5 } } // namespace parthenon diff --git a/src/parthenon_manager.hpp b/src/parthenon_manager.hpp index 6c8e0d4f01d3..34fe5458e710 100644 --- a/src/parthenon_manager.hpp +++ b/src/parthenon_manager.hpp @@ -72,8 +72,8 @@ class ParthenonManager { const auto &m = var->metadata(); auto arrdims = m.GetArrayDims(pswarm->GetBlockPointer(), false); - auto var_missing_on_disk = - !restartReader->VariableExists(swarmname + "/SwarmVars/" + varname); + auto var_missing_on_disk = !restartReader->VariableExists( + swarmname, RestartReader::DataType::SwarmVar, varname); if (Globals::my_rank == 0) { std::cout << "SwarmVar: " << varname << (var_missing_on_disk ? " missing on disk\n" : "\n"); diff --git a/src/utils/mpi_types.hpp b/src/utils/mpi_types.hpp index 4685adef3158..f33961ef88d5 100644 --- a/src/utils/mpi_types.hpp +++ b/src/utils/mpi_types.hpp @@ -1,4 +1,8 @@ //======================================================================================== +// Parthenon performance portable AMR framework +// Copyright(C) 2021-2024 The Parthenon collaboration +// Licensed under the 3-clause BSD License, see LICENSE file for details +//======================================================================================== // (C) (or copyright) 2021. Triad National Security, LLC. All rights reserved. // // This program was produced under U.S. Government contract 89233218CNA000001 for Los @@ -34,6 +38,16 @@ inline MPI_Datatype MPITypeMap::type() { return MPI_PARTHENON_REAL; } +template <> +inline MPI_Datatype MPITypeMap::type() { + return MPI_INT64_T; +} + +template <> +inline MPI_Datatype MPITypeMap::type() { + return MPI_INT8_T; +} + template <> inline MPI_Datatype MPITypeMap::type() { return MPI_INT; @@ -44,6 +58,12 @@ inline MPI_Datatype MPITypeMap::type() { return MPI_CXX_BOOL; } +template <> +inline MPI_Datatype MPITypeMap::type() { + // TODO(pgrete) do we need special checks here wrt to conflicts on MacOS? + return MPI_UINT64_T; +} + } // namespace parthenon #endif diff --git a/tst/regression/CMakeLists.txt b/tst/regression/CMakeLists.txt index 89a83cc09703..f4cde1f4d20b 100644 --- a/tst/regression/CMakeLists.txt +++ b/tst/regression/CMakeLists.txt @@ -164,6 +164,21 @@ if (ENABLE_HDF5) endif() +if (PARTHENON_ENABLE_OPENPMD) + + # h5py is also needed for the current test + list(APPEND REQUIRED_PYTHON_MODULES openpmd_api h5py) + + # Restart + list(APPEND TEST_DIRS restart_opmd) + list(APPEND TEST_PROCS ${NUM_MPI_PROC_TESTING}) + list(APPEND TEST_ARGS "--driver ${PROJECT_BINARY_DIR}/example/advection/advection-example \ + --driver_input ${CMAKE_CURRENT_SOURCE_DIR}/test_suites/restart_opmd/parthinput.restart \ + --num_steps 3") + list(APPEND EXTRA_TEST_LABELS "") + + endif() + # Any external modules that are required by python can be added to REQUIRED_PYTHON_MODULES # list variable, before including TestSetup.cmake. 
list(APPEND REQUIRED_PYTHON_MODULES numpy) diff --git a/tst/regression/test_suites/restart_opmd/__init__.py b/tst/regression/test_suites/restart_opmd/__init__.py new file mode 100644 index 000000000000..e69de29bb2d1 diff --git a/tst/regression/test_suites/restart_opmd/parthinput.restart b/tst/regression/test_suites/restart_opmd/parthinput.restart new file mode 100644 index 000000000000..5ba796143d19 --- /dev/null +++ b/tst/regression/test_suites/restart_opmd/parthinput.restart @@ -0,0 +1,64 @@ +# ======================================================================================== +# Parthenon performance portable AMR framework +# Copyright(C) 2024-2025 The Parthenon collaboration +# Licensed under the 3-clause BSD License, see LICENSE file for details +# ======================================================================================== + + +problem_id = advection + + +refinement = adaptive +numlevel = 3 + +nx1 = 64 +x1min = -0.5 +x1max = 0.5 +ix1_bc = periodic +ox1_bc = periodic + +nx2 = 64 +x2min = -0.5 +x2max = 0.5 +ix2_bc = periodic +ox2_bc = periodic + +nx3 = 1 +x3min = -0.5 +x3max = 0.5 +ix3_bc = periodic +ox3_bc = periodic + + +nx1 = 16 +nx2 = 16 +nx3 = 1 + + +nlim = -1 +tlim = 0.2 +integrator = rk2 +ncycle_out_mesh = -10000 + + +cfl = 0.45 +vx = 1.0 +vy = 1.0 +vz = 1.0 +profile = hard_sphere + +refine_tol = 0.3 # control the package specific refinement tagging function +derefine_tol = 0.03 +compute_error = false +num_vars = 1 # number of variables +vec_size = 1 # size of each variable +fill_derived = false # whether to fill one-copy test vars + + +file_type = openpmd +dt = 0.050 +use_final_label = false + + +file_type = rst +dt = 0.050 diff --git a/tst/regression/test_suites/restart_opmd/parthinput_override.restart b/tst/regression/test_suites/restart_opmd/parthinput_override.restart new file mode 100644 index 000000000000..c5b368aebcbd --- /dev/null +++ b/tst/regression/test_suites/restart_opmd/parthinput_override.restart @@ -0,0 +1,9 @@ +# ======================================================================================== +# Parthenon performance portable AMR framework +# Copyright(C) 2024 The Parthenon collaboration +# Licensed under the 3-clause BSD License, see LICENSE file for details +# ======================================================================================== + +# Testing to override parameters in a restart file from an input file + +problem_id=silver diff --git a/tst/regression/test_suites/restart_opmd/restart_opmd.py b/tst/regression/test_suites/restart_opmd/restart_opmd.py new file mode 100644 index 000000000000..d91029e0f0e2 --- /dev/null +++ b/tst/regression/test_suites/restart_opmd/restart_opmd.py @@ -0,0 +1,173 @@ +# ======================================================================================== +# Parthenon performance portable AMR framework +# Copyright(C) 2024 The Parthenon collaboration +# Licensed under the 3-clause BSD License, see LICENSE file for details +# ======================================================================================== + +# Modules +import sys +import utils.test_case +import numpy as np + + +# To prevent littering up imported folders with .pyc files or __pycache_ folder +sys.dont_write_bytecode = True + + +# The test case uses an AMR simulation (with blocks being created and destroyed) as basline. +# The initial run will run to completion (writing hdf5 rst and opmd output with the same cadence). 
+# Then the simulation is restarted from the first, non-initial condition opmd output and again run to completion. +# Finally, the simulation is restarted again but using the hdf5 output generated from the previous restart. +# For testing, all resulting pmd snapshots are compared against each other at the same simulation time. +# If they agree, restarting from opmd works and also the info contained in the opmd restart matches +# the info in the hdf5 rst files (and vice versa). +class TestCase(utils.test_case.TestCaseAbs): + def Prepare(self, parameters, step): + # enable coverage testing on pass where restart + # files are both read and written + parameters.coverage_status = "both" + + # run baseline (to the very end) + if step == 1: + parameters.driver_cmd_line_args = ["parthenon/job/problem_id=gold"] + # restart from an early openpmd snapshot + elif step == 2: + parameters.driver_cmd_line_args = [ + "-r", + "gold.out1.00001.bp", + "-i", + f"{parameters.parthenon_path}/tst/regression/test_suites/restart_opmd/parthinput_override.restart", + ] + # restart from an hdf5 snapshot produced from the restarted opmd one + elif step == 3: + parameters.driver_cmd_line_args = [ + "-r", + "silver.out2.00002.rhdf", + "parthenon/job/problem_id=bronze", + ] + + return parameters + + def Analyse(self, parameters): + try: + import openpmd_api as opmd + except ModuleNotFoundError: + print("Couldn't find required openpmd_api module to compare test results.") + return False + success = True + + def compare_attributes(series_a, series_b): + skip_attributes = [ + "iterationFormat", # Stores the file name format. Expected to differ. + "WallTime", + "InputFile", # Is updated during runtime, e.g., start time and thus differs + ] + all_equal = True + for attr in series_a.attributes: + if series_b.contains_attribute(attr): + attr_a = series_a.get_attribute(attr) + attr_b = series_b.get_attribute(attr) + if attr not in skip_attributes and attr_a != attr_b: + print( + f"Mismatch in attribute '{attr}'. " + f"'{attr_a}' versus '{attr_b}'\n" + ) + all_equal = False + else: + print(f"Missing attribute '{attr}' in second file.") + all_equal = False + return all_equal + + # need series in order to flush + def compare_data(it_a, it_b, series_a, series_b): + all_equal = True + for mesh_name, mesh_a in it_a.meshes.items(): + if mesh_name not in it_b.meshes: + print(f"Missing mesh '{mesh_name}' in second file.") + all_equal = False + continue + mesh_b = it_b.meshes[mesh_name] + + for comp_name, comp_a in mesh_a.items(): + if comp_name not in mesh_b: + print( + f"Missing component '{comp_name}' in mesh '{mesh_name}' of second file." + ) + all_equal = False + continue + comp_b = mesh_b[comp_name] + + if comp_a.shape != comp_b.shape: + print( + f"Mismatch in mesh record component shapes of " + f"component '{comp_name}' in mesh '{mesh_name}': " + f"{comp_a.shape} versus {comp_b.shape}\n" + ) + all_equal = False + continue + + # Given that the shapes are guaranteed to match (following the check above) + # we can load chunks from both files. + # Note that we have to go over chunks as data might be sparse on disk so + # loading the entire record will contain garbage in sparse places.
+ data_a = np.empty(comp_a.shape) + data_a[:] = np.nan + data_b = np.copy(data_a) + for chunk in comp_a.available_chunks(): + # Following OpenPMD-viewer `chunk_to_slice` here + # https://github.com/openPMD/openPMD-viewer/blob/6eccb608893d2c9b8d158d950c3f0451898a80f6/openpmd_viewer/openpmd_timeseries/data_reader/io_reader/utilities.py#L14 + stops = [a + b for a, b in zip(chunk.offset, chunk.extent)] + indices_per_dim = zip(chunk.offset, stops) + sl = tuple( + map(lambda s: slice(s[0], s[1], None), indices_per_dim) + ) + + tmp = comp_a[sl] + series_a.flush() + data_a[sl] = tmp + + tmp = comp_b[sl] + series_b.flush() + data_b[sl] = tmp + + try: + np.testing.assert_array_max_ulp(data_a, data_b) + except AssertionError as err: + print( + f"Data of component '{comp_name}' in mesh '{mesh_name}' does not match:\n" + f"{err}\n" + ) + all_equal = False + continue + + return all_equal + + def compare_files(idx_it, name_a, name_b): + all_good = True + series_gold = opmd.Series(f"{name_a}.out1.%T.bp/", opmd.Access.read_only) + series_silver = opmd.Series(f"{name_b}.out1.%T.bp/", opmd.Access.read_only) + + # PG: yes, this is inefficient but keeps the logic simple + all_good &= compare_attributes(series_gold, series_silver) + all_good &= compare_attributes(series_silver, series_gold) + + it_gold = series_gold.iterations[idx_it] + it_silver = series_silver.iterations[idx_it] + all_good &= compare_attributes(it_gold, it_silver) + all_good &= compare_attributes(it_silver, it_gold) + + all_good &= compare_data(it_silver, it_gold, series_silver, series_gold) + all_good &= compare_data(it_gold, it_silver, series_gold, series_silver) + + return all_good + + # comapre a few files throughout the simulations + success &= compare_files(2, "gold", "silver") + # bronze outputs only exists from dump 3 on + success &= compare_files(3, "gold", "silver") + success &= compare_files(3, "silver", "bronze") + success &= compare_files(4, "gold", "silver") + success &= compare_files(4, "silver", "bronze") + # success &= compare_files("final") + + return success diff --git a/tst/unit/test_unit_params.cpp b/tst/unit/test_unit_params.cpp index fad51c069538..8a987a5e4763 100644 --- a/tst/unit/test_unit_params.cpp +++ b/tst/unit/test_unit_params.cpp @@ -1,6 +1,6 @@ //======================================================================================== -// Athena++ astrophysical MHD code -// Copyright(C) 2014 James M. Stone and other code contributors +// Parthenon performance portable AMR framework +// Copyright(C) 2020-2025 The Parthenon collaboration // Licensed under the 3-clause BSD License, see LICENSE file for details //======================================================================================== // (C) (or copyright) 2020-2025. Triad National Security, LLC. All rights reserved. 
@@ -16,6 +16,8 @@ //======================================================================================== #include +#include +#include #include #include @@ -24,8 +26,13 @@ #include "config.hpp" #include "interface/params.hpp" #include "kokkos_abstraction.hpp" +#include "openPMD/Series.hpp" #include "outputs/parthenon_hdf5.hpp" +#include "outputs/parthenon_opmd.hpp" +#include "outputs/restart_hdf5.hpp" +#include "outputs/restart_opmd.hpp" #include "parameter_input.hpp" +#include "parthenon_array_generic.hpp" using parthenon::Params; using parthenon::Real; @@ -137,9 +144,22 @@ TEST_CASE("when hasKey is called", "[hasKey]") { } } -#ifdef ENABLE_HDF5 - -TEST_CASE("A set of params can be dumped to file", "[params][output]") { +#if defined(ENABLE_HDF5) && defined(PARTHENON_ENABLE_OPENPMD) +using parthenon::RestartReaderHDF5; +using parthenon::RestartReaderOPMD; +using OutputTypes = std::tuple; +#elif defined(ENABLE_HDF5) +using parthenon::RestartReaderHDF5; +using OutputTypes = std::tuple; +#elif defined(PARTHENON_ENABLE_OPENPMD) +using parthenon::RestartReaderOPMD; +using OutputTypes = std::tuple; +#else +using OutputTypes = std::tuple<>; +#endif + +TEMPLATE_LIST_TEST_CASE("A set of params can be dumped to file", "[params][output]", + OutputTypes) { GIVEN("A params object with a few kinds of objects") { Params params; const auto restart = Params::Mutability::Restart; @@ -164,43 +184,97 @@ TEST_CASE("A set of params can be dumped to file", "[params][output]") { Kokkos::deep_copy(arr2d, arr2d_h); params.Add("arr2d", arr2d); - parthenon::HostArray2D hostarr("hostarr2d", 2, 3); + // "Vectors" of bools have some special sauce under the hood so let's try the logic + // with a plain view + Kokkos::View bool1d("boolview", 10); + auto bool1d_h = Kokkos::create_mirror_view(bool1d); + for (int i = 0; i < 10; ++i) { + bool1d_h(i) = i % 2; + } + Kokkos::deep_copy(bool1d, bool1d_h); + params.Add("bool1d", bool1d); + + parthenon::HostArray2D hostarr2d("hostarr2d", 2, 3); for (int i = 0; i < 2; ++i) { for (int j = 0; j < 3; ++j) { - hostarr(i, j) = 2 * i + j + 1; + hostarr2d(i, j) = 2 * i + j + 1; } } - params.Add("hostarr2d", hostarr, restart); + params.Add("hostarr2d", hostarr2d, restart); - THEN("We can output to hdf5") { - const std::string filename = "params_test.h5"; - const std::string groupname = "params"; + THEN("We can output") { + std::string filename; + const std::string groupname = "Params"; const std::string prefix = "test_pkg"; - using namespace parthenon::HDF5; - { + if constexpr (std::is_same_v) { + using namespace parthenon::HDF5; + filename = "params_test.h5"; + H5F file = H5F::FromHIDCheck( H5Fcreate(filename.c_str(), H5F_ACC_TRUNC, H5P_DEFAULT, H5P_DEFAULT)); auto group = MakeGroup(file, groupname); params.WriteAllToHDF5(prefix, group); + } else if constexpr (std::is_same_v) { + filename = ("params_test.%05T.bp"); + auto series = openPMD::Series(filename, openPMD::Access::CREATE); + series.setIterationEncoding(openPMD::IterationEncoding::fileBased); + auto it = series.iterations[0]; + parthenon::OpenPMDUtils::WriteAllParams(params, prefix, &it); + } else { + FAIL("This logic is flawed. 
I should not be here."); } - AND_THEN("We can directly read the relevant data from the hdf5 file") { - H5F file = - H5F::FromHIDCheck(H5Fopen(filename.c_str(), H5F_ACC_RDONLY, H5P_DEFAULT)); - const H5O obj = H5O::FromHIDCheck(H5Oopen(file, groupname.c_str(), H5P_DEFAULT)); - + AND_THEN("We can directly read the relevant data from the file") { Real in_scalar; - HDF5ReadAttribute(obj, prefix + "/scalar", in_scalar); - REQUIRE(std::abs(scalar - in_scalar) <= 1e-10); - std::vector in_vector; - HDF5ReadAttribute(obj, prefix + "/vector", in_vector); + // deliberately the wrong size + parthenon::ParArray2D in_arr2d("myarr", 1, 1); + parthenon::HostArray2D in_hostarr2d("hostarr2d", 2, 3); + Kokkos::View in_bool1d("in_bool1d", 5); + + if constexpr (std::is_same_v) { + H5F file = + H5F::FromHIDCheck(H5Fopen(filename.c_str(), H5F_ACC_RDONLY, H5P_DEFAULT)); + const H5O obj = + H5O::FromHIDCheck(H5Oopen(file, groupname.c_str(), H5P_DEFAULT)); + + HDF5ReadAttribute(obj, prefix + "/scalar", in_scalar); + HDF5ReadAttribute(obj, prefix + "/vector", in_vector); + HDF5ReadAttribute(obj, prefix + "/arr2d", in_arr2d); + HDF5ReadAttribute(obj, prefix + "/hostarr2d", in_hostarr2d); + HDF5ReadAttribute(obj, prefix + "/bool1d", in_bool1d); + } else if constexpr (std::is_same_v) { + auto series = openPMD::Series(filename, openPMD::Access::READ_ONLY); + auto it = series.iterations[0]; + // Note that we're explicitly using `delim` here which tests the character + // replacement of '/' in the WriteAllParams function. + using parthenon::OpenPMDUtils::delim; + + in_scalar = + it.getAttribute(groupname + delim + prefix + delim + "scalar").get(); + + in_vector = it.getAttribute(groupname + delim + prefix + delim + "vector") + .get>(); + + // Technically, we're not reading "directly" here but the restart reader ctor + // literally just opens the file. 
+ auto resfile = RestartReaderOPMD(filename.c_str()); + auto &in_arr2d_v = in_arr2d.KokkosView(); + resfile.RestoreViewAttribute(groupname + delim + prefix + delim + "arr2d", + in_arr2d_v); + + auto &in_hostarr2d_v = in_hostarr2d.KokkosView(); + resfile.RestoreViewAttribute(groupname + delim + prefix + delim + "hostarr2d", + in_hostarr2d_v); + // TODO(pgrete) make this work and also add checks for correctness below + // resfile.RestoreViewAttribute(groupname + delim + prefix + delim + "bool1d", + // in_bool1d); + } + REQUIRE(scalar == in_scalar); + for (int i = 0; i < vector.size(); ++i) { REQUIRE(in_vector[i] == vector[i]); } - // deliberately the wrong size - parthenon::ParArray2D in_arr2d("myarr", 1, 1); - HDF5ReadAttribute(obj, prefix + "/arr2d", in_arr2d); REQUIRE(in_arr2d.extent_int(0) == arr2d.extent_int(0)); REQUIRE(in_arr2d.extent_int(1) == arr2d.extent_int(1)); int nwrong = 1; @@ -212,9 +286,17 @@ TEST_CASE("A set of params can be dumped to file", "[params][output]") { }, nwrong); REQUIRE(nwrong == 0); + + REQUIRE(in_hostarr2d.extent_int(0) == hostarr2d.extent_int(0)); + REQUIRE(in_hostarr2d.extent_int(1) == hostarr2d.extent_int(1)); + for (int i = 0; i < 2; ++i) { + for (int j = 0; j < 3; ++j) { + REQUIRE(hostarr2d(i, j) == in_hostarr2d(i, j)); + } + } } - AND_THEN("We can restart a params object from the HDF5 file") { + AND_THEN("We can restart a params object from the file") { Params rparams; // init the params object to restart into @@ -233,24 +315,30 @@ TEST_CASE("A set of params can be dumped to file", "[params][output]") { parthenon::HostArray2D test_hostarr("hostarr2d", 1, 1); rparams.Add("hostarr2d", test_hostarr, restart); - H5F file = - H5F::FromHIDCheck(H5Fopen(filename.c_str(), H5F_ACC_RDONLY, H5P_DEFAULT)); - const H5G obj = H5G::FromHIDCheck(H5Oopen(file, groupname.c_str(), H5P_DEFAULT)); - rparams.ReadFromRestart(prefix, obj); + if constexpr (std::is_same_v) { + H5F file = + H5F::FromHIDCheck(H5Fopen(filename.c_str(), H5F_ACC_RDONLY, H5P_DEFAULT)); + const H5G obj = + H5G::FromHIDCheck(H5Oopen(file, groupname.c_str(), H5P_DEFAULT)); + rparams.ReadFromRestart(prefix, obj); + } else if constexpr (std::is_same_v) { + auto resfile = RestartReaderOPMD(filename.c_str()); + resfile.ReadParams(prefix, rparams); + } AND_THEN("The values for the restartable params are updated to match the file") { auto test_scalar = rparams.Get("scalar"); - REQUIRE(std::abs(test_scalar - scalar) <= 1e-10); + REQUIRE(test_scalar == scalar); auto test_bool = rparams.Get("boolscalar"); REQUIRE(test_bool == boolscalar); - auto test_hostarr = params.Get>("hostarr2d"); - REQUIRE(test_hostarr.extent_int(0) == hostarr.extent_int(0)); - REQUIRE(test_hostarr.extent_int(1) == hostarr.extent_int(1)); - for (int i = 0; i < hostarr.extent_int(0); ++i) { - for (int j = 0; j < hostarr.extent_int(1); ++j) { - REQUIRE(test_hostarr(i, j) == hostarr(i, j)); + auto test_hostarr = rparams.Get>("hostarr2d"); + REQUIRE(test_hostarr.extent_int(0) == hostarr2d.extent_int(0)); + REQUIRE(test_hostarr.extent_int(1) == hostarr2d.extent_int(1)); + for (int i = 0; i < hostarr2d.extent_int(0); ++i) { + for (int j = 0; j < hostarr2d.extent_int(1); ++j) { + REQUIRE(test_hostarr(i, j) == hostarr2d(i, j)); } } } @@ -265,5 +353,3 @@ TEST_CASE("A set of params can be dumped to file", "[params][output]") { } } } - -#endif // ENABLE_HDF5
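Note (not part of the patch): the Params attribute layout exercised by the templated unit test above can also be inspected from Python with the openpmd_api package. The snippet below is a minimal sketch under the assumption that a file written by that test is present (file pattern params_test.%05T.bp, prefix test_pkg); it only relies on the "Params" group name, the '~' delimiter, and the ".rankdims" convention introduced in this patch.

# Minimal sketch (not part of the patch): inspect Params attributes written via
# OpenPMDUtils::WriteAllParams, which stores them as iteration attributes using
# the '~' delimiter, e.g. "Params~test_pkg~scalar".
import openpmd_api as opmd

series = opmd.Series("params_test.%05T.bp", opmd.Access.read_only)
it = series.iterations[0]

scalar = it.get_attribute("Params~test_pkg~scalar")
vector = it.get_attribute("Params~test_pkg~vector")

# Views/ParArrays additionally carry their rank and shape in a ".rankdims"
# attribute next to the flattened data (see RestoreViewAttribute above).
rankdims = it.get_attribute("Params~test_pkg~arr2d.rankdims")
arr2d_flat = it.get_attribute("Params~test_pkg~arr2d")

print(scalar, vector, rankdims, len(arr2d_flat))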