diff --git a/.github/workflows/draft-pdf.yml b/.github/workflows/draft-pdf.yml
new file mode 100644
index 00000000..2cb66715
--- /dev/null
+++ b/.github/workflows/draft-pdf.yml
@@ -0,0 +1,27 @@
+name: Draft PDF
+on:
+  push:
+    paths:
+      - paper/**
+      - .github/workflows/draft-pdf.yml
+jobs:
+  paper:
+    runs-on: ubuntu-latest
+    name: Paper Draft
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v4
+      - name: Build draft PDF
+        uses: openjournals/openjournals-draft-action@master
+        with:
+          journal: joss
+          # This should be the path to the paper within your repo.
+          paper-path: paper/paper.md
+      - name: Upload
+        uses: actions/upload-artifact@v4
+        with:
+          name: paper
+          # This is the output path where Pandoc will write the compiled
+          # PDF. Note, this should be the same directory as the input
+          # paper.md
+          path: paper/paper.pdf
diff --git a/paper/paper.bib b/paper/paper.bib
new file mode 100644
index 00000000..4e4544a4
--- /dev/null
+++ b/paper/paper.bib
@@ -0,0 +1,59 @@
+@article{Pearson:2017,
+  author = {{Pearson}, S. and {Price-Whelan}, A.~M. and {Johnston}, K.~V.},
+  title = {{Gaps in Globular Cluster Streams: Pal 5 and the Galactic Bar}},
+  journal = {ArXiv e-prints},
+  archiveprefix = {arXiv},
+  eprint = {1703.04627},
+  keywords = {Astrophysics - Astrophysics of Galaxies},
+  year = 2017,
+  month = mar,
+  url = {http://adsabs.harvard.edu/abs/2017arXiv170304627P}
+}
+
+@book{Binney:2008,
+  author = {{Binney}, J. and {Tremaine}, S.},
+  title = {{Galactic Dynamics: Second Edition}},
+  publisher = {Princeton University Press},
+  year = 2008,
+  url = {http://adsabs.harvard.edu/abs/2008gady.book.....B}
+}
+
+@article{gaia,
+  author = {{Gaia Collaboration}},
+  title = "{The Gaia mission}",
+  journal = {Astronomy and Astrophysics},
+  archiveprefix = "arXiv",
+  eprint = {1609.04153},
+  primaryclass = "astro-ph.IM",
+  keywords = {space vehicles: instruments, Galaxy: structure, astrometry, parallaxes, proper motions, telescopes},
+  year = 2016,
+  month = nov,
+  volume = 595,
+  doi = {10.1051/0004-6361/201629272},
+  url = {http://adsabs.harvard.edu/abs/2016A%26A...595A...1G}
+}
+
+@article{astropy,
+  author = {{Astropy Collaboration}},
+  title = "{Astropy: A community Python package for astronomy}",
+  journal = {Astronomy and Astrophysics},
+  archiveprefix = "arXiv",
+  eprint = {1307.6212},
+  primaryclass = "astro-ph.IM",
+  keywords = {methods: data analysis, methods: miscellaneous, virtual observatory tools},
+  year = 2013,
+  month = oct,
+  volume = 558,
+  doi = {10.1051/0004-6361/201322068},
+  url = {http://adsabs.harvard.edu/abs/2013A%26A...558A..33A}
+}
+
+@misc{fidgit,
+  author = {A. M. Smith and K. Thaney and M. Hahnel},
+  title = {Fidgit: An ungodly union of GitHub and Figshare},
+  year = {2020},
+  publisher = {GitHub},
+  journal = {GitHub repository},
+  url = {https://github.com/arfon/fidgit}
+}
diff --git a/paper/paper.md b/paper/paper.md
new file mode 100644
index 00000000..d3bcfe79
--- /dev/null
+++ b/paper/paper.md
@@ -0,0 +1,327 @@
+---
+title: 'PyMOR: A Python package for sharable Earth System Model data'
+tags:
+  - Python
+  - Earth System Modelling
+  - Climatology
+  - Oceanography
+  - Atmospheric Science
+authors:
+  - name: Paul Gierz
+    orcid: 0000-0002-4512-087X
+    corresponding: true
+    equal-contrib: true
+    affiliation: 1
+  - name: Pavan Siligam
+    orcid: ????
+    equal-contrib: true
+    affiliation: 1
+  - name: Miguel Andres-Martinez
+    orcid: ????
+    equal-contrib: true
+    affiliation: 1
+affiliations:
+  - name: Alfred Wegener Institute, Helmholtz Centre for Polar and Marine Research, Bremerhaven, Germany
+    index: 1
+    ror: 032e6b942
+date: 9 July 2025
+bibliography: paper.bib
+---
+
+# Summary
+
+PyMOR is a toolbox for preparing Earth System Model (ESM) data for analysis and
+sharing with the community. PyMOR provides a simple command line interface and a
+clear, step-by-step way to manipulate NetCDF files: adding relevant metadata,
+transforming units, combining variables, regridding, transforming geometries,
+and more. It runs in parallel using Dask and SLURM, and is thus suitable for
+handling even large amounts of data. Written in Python, it allows users to
+quickly plug in custom functionality outside of the core standard library,
+ensuring that the toolbox can be extended to meet the exact needs of the user.
+
+# Statement of need
+
+Standardization of climate model outputs is crucial for preparing data for IPCC
+reports because it ensures that results from different modeling centers worldwide
+can be directly compared, combined, and analyzed in a consistent and transparent
+manner. The IPCC and associated projects like CMIP require model outputs to be
+formatted according to strict technical specifications: data must be provided
+in standardized NetCDF files, using common variable names, units, metadata
+conventions (such as the CF Metadata Conventions), and grid structures (e.g.,
+rectilinear grids for most fields, standard pressure or depth levels for
+vertical coordinates). This uniformity allows the Program for Climate Model
+Diagnosis and Intercomparison (PCMDI) to centrally archive and distribute model
+results, enabling hundreds of researchers to efficiently scrutinize, benchmark,
+and synthesize findings across models and scenarios. Without such
+standardization, the process of aggregating results for global assessments
+would be error-prone, time-consuming, and potentially unreliable, undermining
+the scientific basis for the IPCC's policy-relevant conclusions.
+
+While the benefit of standardization is clear, a considerable portion of
+the climate modelling community prepares output files with native names, and
+preparing data for comparison projects often requires post-processing after
+the numerical simulations have been performed, rather than implementing the
+proper naming conventions and metadata standards directly in the numerical
+codes. Certain requested variables may need to be extracted from multiple output
+files or computed from other variables, units may need to be converted, or
+numerical geometry may need to be considered. Additionally, newer simulations
+are producing considerably larger datasets than previous generations, which can
+make it challenging to manipulate the files to conform to the requisite metadata
+standards and best practices.
+
+We developed `pymor` to fill the need for a flexible, performant, extensible
+post-processing toolbox for Earth System Model data. Built on top of `xarray`
+and `dask`, `pymor` provides a community-driven library of common
+transformations, as well as a simple extension system. We were primarily
+motivated by the following goals:
+
+* Metadata, variable naming, and unit conversion to the standards developed by
+  the CMIP community should work "out-of-the-box".
+* First-class support for extending the library with custom user steps.
+* Easy integration with other Python software.
+* The ability to handle big data.
+* The ability to run in parallel.
+* Open-source, community-driven development.
+
+# Overview of functionality
+
+![The PyMOR processing workflow.\label{fig:workflow}](workflow.jpg)
+
+The functionality of `PyMOR` covers several key areas: accessing PCMDI standard
+name tables, metadata management, and data transformation. To drive these, the
+user creates a specification file in YAML format, which describes the desired
+output files as well as the processing steps to apply to the inputs.
+
+**PCMDI Standard Name Tables** are specified via the following entries in the
+user YAML:
+
+```yaml
+general:
+  cmor_version: "CMIP6"
+  mip: "CMIP"
+  CV_Dir: "..."
+  CMIP_Tables_Dir: "..."
+```
+
+Internally, `pymor` then extracts the metadata to attach to the simulation
+output files, such as standard and long variable names, units, institutional
+attributes, experiment metadata, and more.
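+
+As an illustration of what these tables contain: in the table layout published
+by the CMIP community, each table is a JSON file whose `variable_entry` section
+maps variable names to their metadata. The following is a minimal sketch of
+reading one such table directly; the path is hypothetical, and `pymor`'s
+internal handling may differ:
+
+```python
+import json
+
+# A sketch assuming the published CMIP6 table layout; the path below is
+# hypothetical and depends on where the tables are checked out.
+with open("Tables/CMIP6_Omon.json") as f:
+    table = json.load(f)
+
+# Each entry carries the standardized metadata that is attached to outputs.
+entry = table["variable_entry"]["tos"]
+print(entry["standard_name"])  # e.g. "sea_surface_temperature"
+print(entry["units"])          # e.g. "degC"
+```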
+
+**Flexible Mapping of Variables** allows the user to customize which variables
+in which NetCDF files correspond to which PCMDI standard names.
+As an example, we consider the variable `sst` (sea surface temperature), which
+in the example model output is natively named `tos` (temperature of ocean
+surface).
+
+The following mapping would be needed in the user YAML to map these variables
+to each other:
+
+```yaml
+rules:
+  - name: Conversion for SST
+    description: "Here is some text for humans. It isn't used anywhere."
+    inputs:
+      - path:
+        pattern:
+    cmor_variable: sst
+    model_variable: tos
+```
+
+**Data handling via the PyData ecosystem** allows the user to easily access the
+NetCDF files in a familiar format (`xarray`) to perform custom manipulations.
+Any processing step in a pipeline is expressed as a Python function with the
+following signature:
+
+```python
+import pymor
+from typing import Any
+
+def my_custom_step(data: Any, rule: pymor.core.rule.Rule) -> Any:
+    """
+    A custom pipeline step
+
+    Parameters
+    ----------
+    data : Any
+        While ``data`` is formally ``Any``, typically it will be either
+        an ``xarray.Dataset`` or an ``xarray.DataArray`` object.
+
+    rule : pymor.core.rule.Rule
+        Each step must also accept the parameter ``rule``, which contains the
+        user-specified description that applies to this data, such as the
+        variable's CMOR name, its native name, source identification,
+        model name, experiment, and so on.
+
+    Returns
+    -------
+    Any
+        The return value of this step is passed further down the pipeline.
+        Typically you want to pass back the (somehow transformed) ``data``.
+    """
+    ...  # do some manipulation with data
+    return data
+```
+
+**A robust standard library** of data transformations provides common and
+tested ways to manipulate data, including:
+
+* unit conversion
+* temporal averaging and resampling
+* regridding and spatial averaging
+* metadata attributes on both the file and variable level in output NetCDFs
+* variable renaming
+* axis, coordinate, and bounds renaming, sorting, and reordering
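+
+To give a flavour of what such a step looks like in practice, below is a
+minimal, self-contained sketch of a unit-conversion step written against the
+signature shown above. It uses plain `xarray` arithmetic; the actual
+`pymor.std_lib.convert_units` implementation may differ:
+
+```python
+import xarray as xr
+from pymor.core.rule import Rule
+
+def celsius_to_kelvin(data: xr.DataArray, rule: Rule) -> xr.DataArray:
+    """Hypothetical pipeline step converting degC to K."""
+    if data.attrs.get("units") != "degC":
+        return data  # nothing to do
+    out = data + 273.15
+    # xarray drops attributes on arithmetic by default, so restore them
+    out.attrs = dict(data.attrs)
+    out.attrs["units"] = "K"
+    return out
+```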
+
+**Specialized pipelines** for each conversion allow the user to specify exactly
+which manipulations should be applied to which files. In the `rules` section of
+the YAML file the user specifies which pipelines should be applied to the data
+loaded from the `inputs` section. Continuing the example from above:
+
+```yaml
+rules:
+  - name: Conversion for SST
+    description: "Here is some text for humans. It isn't used anywhere."
+    inputs:
+      - path:
+        pattern:
+    cmor_variable: sst
+    model_variable: tos
+    pipelines:
+      - my_named_pipeline
+      - another_pipeline
+```
+
+Data will thus pass first through `my_named_pipeline` and then through
+`another_pipeline`. Each of those needs to be defined as well, which is done in
+a separate section of the YAML file:
+
+```yaml
+pipelines:
+  - name: my_named_pipeline
+    steps:
+      - "pymor.core.gather_inputs.load_mfdataset"
+      - "pymor.std_lib.convert_units"
+      - "pymor.std_lib.time_average"
+      - "pymor.std_lib.set_global_attributes"
+  - name: another_pipeline
+    steps:
+      - "pymor.std_lib.trigger_compute"
+      - "pymor.std_lib.show_data"
+      - "pymor.std_lib.files.save_dataset"
+```
+
+For this example, we have just split the default pipeline into two adjoining
+parts. If a `rule` specification does not have any `pipelines` defined, the
+built-in `default` pipeline is used.
+
+**Inclusion of custom steps** allows users to easily include their own functions
+to further manipulate data. First, a suitable Python function should be written:
+
+```python
+import xarray as xr
+from pymor.core.rule import Rule
+
+# Note that type hints are encouraged (but not enforced) by PyMOR
+def add_pp_components(data: xr.Dataset, rule: Rule) -> xr.DataArray:
+    """Adds together Net Primary Production components"""
+    # In this example, we use two different input variables in the native
+    # model outputs with cryptic names to construct a well-known standard
+    # name for the Net Primary Production (NPP) variable.
+    data["pp"] = data["diags3d01"] + data["diags3d02"]
+    # This return is mandatory for the pipeline to usefully continue.
+    # We return our new variable to be further processed:
+    return data["pp"]  # Return type: DataArray
+```
+
+Then, the user adds the path to the file containing this function to their
+pipeline definition:
+
+```yaml
+pipelines:
+  - name: convert_with_pp
+    steps:
+      - "pymor.core.gather_inputs.load_mfdataset"
+      - "script://./intpp_recom.py:add_pp_components"
+      - "pymor.fesom_1p4.nodes_to_levels"
+      - "script://./intpp_recom.py:vertical_integration"
+      - "script://./intpp_recom.py:set_pp_units"
+      - "pymor.std_lib.convert_units"
+      - "pymor.std_lib.time_average"
+      - "pymor.std_lib.set_global_attributes"
+      - "pymor.std_lib.trigger_compute"
+      - "pymor.std_lib.show_data"
+      - "pymor.std_lib.files.save_dataset"
+```
+
+The special tag `script://`, followed by the path to a Python file and the
+function name separated by a colon, allows user-defined functionality to be
+referenced from any pipeline:
+
+```yaml
+pipelines:
+  - name: <pipeline_name>
+    steps:
+      - "script://<path/to/file.py>:<function_name>"
+```
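+
+Conceptually, the tag is just a pointer to a function inside a file. One
+plausible way to resolve such a reference (a sketch of the idea only, not
+necessarily `pymor`'s actual loader) is via `importlib`:
+
+```python
+import importlib.util
+
+def resolve_script_step(uri: str):
+    """Resolve a 'script://<path>:<function>' reference to a callable."""
+    path, func_name = uri.removeprefix("script://").rsplit(":", 1)
+    spec = importlib.util.spec_from_file_location("user_step", path)
+    module = importlib.util.module_from_spec(spec)
+    spec.loader.exec_module(module)
+    return getattr(module, func_name)
+
+# Hypothetical usage, matching the pipeline definition above:
+# step = resolve_script_step("script://./intpp_recom.py:add_pp_components")
+```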
+
+**Parallelization and scalability** are achieved by using
+[`dask`](https://dask.org/) and
+[`dask-jobqueue`](https://jobqueue.dask.org/en/latest/) to distribute the
+workload in a High Performance Computing (HPC) environment, typically so that
+users can run post-processing pipelines on the same machine on which they
+produced the simulations. Dask usage is enabled directly in the user
+configuration file:
+
+```yaml
+pymor:
+  parallel: True
+  dask_cluster: "slurm"
+  dask_cluster_scaling_mode: fixed
+  fixed_jobs: 12
+```
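+
+For readers familiar with the PyData stack, the configuration above corresponds
+roughly to the following `dask-jobqueue` setup. This is a hedged sketch using
+the public `dask_jobqueue` API; the resource arguments are placeholders, and
+`pymor` derives the actual values from its configuration:
+
+```python
+from dask.distributed import Client
+from dask_jobqueue import SLURMCluster
+
+# Placeholder resources; in practice these match the host HPC system.
+cluster = SLURMCluster(cores=8, memory="32GB", walltime="01:00:00")
+cluster.scale(jobs=12)  # "fixed" scaling mode with 12 SLURM jobs
+client = Client(cluster)  # pipelines are submitted through this client
+```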
+
+**Simple command line usage** enables launching all conversion functionality
+once the user has defined the configuration file:
+
+```bash
+$ pymor process
+```
+
+Once launched, simple monitoring is available for both the Dask processing and
+the progress of individual pipelines, which are optionally orchestrated via
+[`prefect`](https://prefect.io/). When using an orchestrator, the user can also
+cache intermediate results, so that only part of the conversion needs to be
+rerun if the process has to be restarted for whatever reason.
+
+# Acknowledgements
+
+We acknowledge valuable contributions from Christopher Danek and
+Christian Stepanek for early design testing, as well as the CMIP team for
+fruitful discussions and feedback.
+
+# References
+
+- - - - -
+
+Everything below this point is purely informational: writing guidelines for the
+co-authors.
+
+# Citations
+
+Citations to entries in paper.bib should be in
+[rMarkdown](http://rmarkdown.rstudio.com/authoring_bibliographies_and_citations.html)
+format.
+
+If you want to cite a software repository URL (e.g. something on GitHub without a preferred
+citation) then you can do it with the example BibTeX entry in paper.bib for @fidgit.
+
+For a quick reference, the following citation commands can be used:
+- `@author:2001` -> "Author et al. (2001)"
+- `[@author:2001]` -> "(Author et al., 2001)"
+- `[@author1:2001; @author2:2001]` -> "(Author1 et al., 2001; Author2 et al., 2001)"
+
+# Figures
+
+Figures can be included like this:
+![Caption for example figure.\label{fig:example}](figure.png)
+and referenced from text using \autoref{fig:example}.
+
+Figure sizes can be customized by adding an optional second parameter:
+![Caption for example figure.](figure.png){ width=20% }
diff --git a/paper/readme.md b/paper/readme.md
new file mode 100644
index 00000000..c25ee1b2
--- /dev/null
+++ b/paper/readme.md
@@ -0,0 +1,53 @@
+# The PyMOR Paper
+## README and Notes
+
+> [Dr. Paul Gierz](mailto:paul.gierz@awi.de)
+> | [GitHub](https://github.com/esm-tools/pymor)
+> | [PyPI](https://pypi.org/project/py-cmor/)
+
+It would be nice to submit a paper about PyMOR, for the sake of "completeness"
+if nothing else. Plus, it might help us secure additional development funding.
+
+I would like to target the [Journal of Open Source Software (JOSS)](https://joss.theoj.org/)
+for this paper; a lot of the ["culture" that they have about publishing software papers](https://joss.theoj.org/about)
+is very similar to my own thinking.
+
+Example paper in commit [9ef1fdd] taken from the [JOSS website's example](https://joss.readthedocs.io/en/latest/example_paper.html#example-paper).
+
+More hints about [citation syntax](https://pandoc.org/MANUAL.html#extension-citations).
+
+We can submit the preprint to [arXiv](https://arxiv.org/).
+
+How to [locally build and typeset the paper](https://joss.readthedocs.io/en/latest/paper.html#checking-that-your-paper-compiles).
+
+## [Submission Guidelines](https://joss.readthedocs.io/en/latest/submitting.html#submitting-a-paper-to-joss)
+
+### Submission requirements
+
+- [x] The software must be open source as per the [OSI definition](https://opensource.org/osd).
+- [x] The software must be hosted at a location where users can browse the source code files, open issues, and propose code changes without manual approval of (or payment for) accounts.
+- [ ] The software must have an **obvious** research application.
+> [@pgierz] Do we? I think so...
+- [x] You must be a major contributor to the software you are submitting, and have a GitHub account to participate in the review process.
+- [x] Your paper must not focus on new research results accomplished with the software.
+- [ ] Your paper (`paper.md` and BibTeX files, plus any figures) must be hosted in a Git-based repository together with your software.
+> [@pgierz] This is now in progress, see [PR #179](https://github.com/esm-tools/pymor/pull/179) for details.
+- [ ] ~~The paper may be in a short-lived branch which is never merged with the default, although if you do this, make sure this branch is _created_ from the default so that it also includes the source code of your submission.~~
+> [@pgierz] I think this is not necessary. The paper can live in the main repository along with everything else.
+
+In addition, the software associated with your submission must:
+
+- [x] Be stored in a repository that can be cloned without registration.
+- [x] Be stored in a repository where the software source files are browsable online without registration.
+- [x] Have an issue tracker that is readable without registration.
+- [x] Permit individuals to create issues/file tickets against your repository.
diff --git a/paper/workflow.jpg b/paper/workflow.jpg
new file mode 100644
index 00000000..e97b66a1
Binary files /dev/null and b/paper/workflow.jpg differ