From c5c7056da2af5e2f37bb653cb893178e70999d57 Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Fri, 12 Apr 2024 12:55:03 +0200
Subject: [PATCH 001/458] chore: add documentation files and more configuration
 changes

---
 .pre-commit-config.yaml |   4 +-
 CHANGELOG.md            |   1 -
 CODING_GUIDELINES.md    | 143 ++++++++++++++++++++++++++++++++++++++++
 CONTRIBUTING.md         |  57 ++++++++--------
 LICENSE_HEADER.txt      |   4 +-
 README.md               |  10 ++-
 docs/conf.py            |   5 +-
 noxfile.py              |  13 ++--
 pyproject.toml          |  90 ++++++++++++++++++-------
 requirements-dev.txt    |  12 ++--
 src/jace/__init__.py    |   3 +-
 tests/__init__.py       |   6 ++
 tests/test_package.py   |   2 +-
 13 files changed, 272 insertions(+), 78 deletions(-)
 create mode 100644 CODING_GUIDELINES.md
 create mode 100644 tests/__init__.py

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index dd663ff..e64f6f2 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -22,7 +22,7 @@ repos:
   hooks:
   - id: prettier
     types_or: [markdown, html, css, scss, javascript, json]
-    args: [--prose-wrap=always]
+    args: [--prose-wrap=preserve]
 
 - repo: https://github.com/Lucas-C/pre-commit-hooks
   rev: v1.1.9
@@ -30,7 +30,7 @@ repos:
   - id: insert-license
     exclude: ^\..*$
     types: [python]
-    args: [--comment-style, "|#|", --license-filepath, ./LICENSE_HEADER.txt, --fuzzy-match-generates-todo]
+    args: [--comment-style, "|#|", --license-filepath, ./LICENSE_HEADER.txt]
 
 - repo: https://github.com/pre-commit/pre-commit-hooks
   rev: "v4.6.0"
diff --git a/CHANGELOG.md b/CHANGELOG.md
index e7744aa..5967d06 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -22,4 +22,3 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 ### Removed
 
 - ...
-
diff --git a/CODING_GUIDELINES.md b/CODING_GUIDELINES.md
new file mode 100644
index 0000000..fafa314
--- /dev/null
+++ b/CODING_GUIDELINES.md
@@ -0,0 +1,143 @@
+# Coding Guidelines
+
+## Code Style
+
+We follow the [Google Python Style Guide][google-style-guide] with a few minor changes (mentioned below). Since the best way to remember something is to understand the reasons behind it, make sure you go through the style guide at least once, paying special attention to the discussions in the _Pros_, _Cons_, and _Decision_ subsections.
+
+We deviate from the [Google Python Style Guide][google-style-guide] only in the following points:
+
+- We use [`ruff-linter`][ruff-linter] instead of [`pylint`][pylint].
+- We use [`ruff-formatter`][ruff-formatter] for source code and imports formatting, which may work differently than indicated by the guidelines in section [_3. Python Style Rules_](https://google.github.io/styleguide/pyguide.html#3-python-style-rules). For example, maximum line length is set to 100 instead of 79 (although docstring lines should still be limited to 79).
+- According to subsection [_2.19 Power Features_](https://google.github.io/styleguide/pyguide.html#219-power-features), direct use of _power features_ (e.g. custom metaclasses, import hacks, reflection) should be avoided, but standard library classes that internally use these power features are accepted. Following the same spirit, we allow the use of power features in infrastructure code with similar functionality and scope as the Python standard library.
+- According to subsection [_3.19.12 Imports For Typing_](https://google.github.io/styleguide/pyguide.html#31912-imports-for-typing), symbols from `typing` and `collections.abc` modules used in type annotations _"can be imported directly to keep common annotations concise and match standard typing practices"_. Following the same spirit, we allow symbols to be imported directly from third-party or internal modules when they only contain a collection of frequently used typying definitions.
+
+### Common questions
+
+- `pass` vs `...` (`Ellipsis`)
+
+  `pass` is the _no-op_ statement in Python and `...` is a literal value (called _Ellipsis_) introduced for slicing collections of unknown number of dimensions. Although they are very different in nature, both of them are used in places where a statement is required purely for syntactic reasons, and there is not yet a clear standard practice in the community about when to use one or the other. We decided to align with the common pattern of using `...` in the body of empty function definitions working as placeholders for actual implementations defined somewhere else (e.g. type stubs, abstract methods and methods appearing in `Protocol` classes) and `pass` in any other place where its usage is mixed with actual statements.
+
+  ```python
+  # Correct use of `...` as the empty body of an abstract method
+  class AbstractFoo:
+     @abstractmethod
+     def bar(self) -> Bar:
+        ...
+
+  # Correct use of `pass` when mixed with other statements
+  try:
+     resource.load(id=42)
+  except ResourceException:
+     pass
+  ```
+
+### Error messages
+
+Error messages should be written as sentences, starting with a capital letter and ending with a period (avoid exclamation marks). Try to be informative without being verbose. Code objects such as 'ClassNames' and 'function_names' should be enclosed in single quotes, and so should string values used for message interpolation.
+
+Examples:
+
+```python
+raise ValueError(f"Invalid argument 'dimension': should be of type 'Dimension', got '{dimension.type}'.")
+```
+
+Interpolated integer values do not need double quotes, if they are indicating an amount. Example:
+
+```python
+raise ValueError(f"Invalid number of arguments: expected 3 arguments, got {len(args)}.")
+```
+
+The double quotes can also be dropped when presenting a sequence of values. In this case the message should be rephrased so the sequence is separated from the text by a colon ':'.
+
+```python
+raise ValueError(f"unexpected keyword arguments: {', '.join(set(kwarg_names) - set(expected_kwarg_names))}.")
+```
+
+The message should be kept to one sentence if reasonably possible. Ideally the sentence should be kept short and avoid unnecessary words. Examples:
+
+```python
+# too many sentences
+raise ValueError(f"Received an unexpected number of arguments. Should receive 5 arguments, but got {len(args)}. Please provide the correct number of arguments.")
+# better
+raise ValueError(f"Wrong number of arguments: expected 5, got {len(args)}.")
+
+# less extreme
+raise TypeError(f"Wrong argument type. Can only accept 'int's, got '{type(arg)}' instead.")
+# but can still be improved
+raise TypeError(f"Wrong argument type: 'int' expected, got '{type(arg)}'")
+```
+
+The terseness vs. helpfulness tradeoff should be more in favor of terseness for internal error messages and more in favor of helpfulness for `DSLError` and it's subclassses, where additional sentences are encouraged if they point out likely hidden sources of the problem or common fixes.
+
+### Docstrings
+
+TODO: update to autodoc2
+
+We generate the API documentation automatically from the docstrings using [Sphinx][sphinx] and some extensions such as [Sphinx-autodoc][sphinx-autodoc] and [Sphinx-napoleon][sphinx-napoleon]. These follow the Google Python Style Guide docstring conventions to automatically format the generated documentation. A complete overview can be found here: [Example Google Style Python Docstrings](https://sphinxcontrib-napoleon.readthedocs.io/en/latest/example_google.html#example-google).
+
+Sphinx supports the [reStructuredText][sphinx-rest] (reST) markup language for defining additional formatting options in the generated documentation, however section [_3.8 Comments and Docstrings_](https://google.github.io/styleguide/pyguide.html#38-comments-and-docstrings) of the Google Python Style Guide does not specify how to use markups in docstrings. As a result, we decided to forbid reST markup in docstrings, except for the following cases:
+
+- Cross-referencing other objects using Sphinx text roles for the [Python domain](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#the-python-domain) (as explained [here](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#python-roles)).
+- Very basic formatting markup to improve _readability_ of the generated documentation without obscuring the source docstring (e.g. ` ``literal`` ` strings, bulleted lists).
+
+We highly encourage the [doctest][doctest] format for code examples in docstrings. In fact, doctest runs code examples and makes sure they are in sync with the codebase.
+
+### Module structure
+
+In general, you should structure new Python modules in the following way:
+
+1. _shebang_ line: `#! /usr/bin/env python3` (only for **executable scripts**!).
+2. License header (see `LICENSE_HEADER.txt`).
+3. Module docstring.
+4. Imports, alphabetically ordered within each block (fixed automatically by `ruff-formatter`):
+   1. Block of imports from the standard library.
+   2. Block of imports from general third party libraries using standard shortcuts when customary (e.g. `numpy as np`).
+   3. Block of imports from specific modules of the project.
+5. Definition of exported symbols (optional, mainly for re-exporting symbols from other modules):
+
+```python
+__all__ = ["func_a", "CONST_B"]
+```
+
+6. Public constants and typing definitions.
+7. Module contents organized in a convenient way for understanding how the pieces of code fit together, usually defining functions before classes.
+
+Try to keep sections and items logically ordered, add section separator comments to make section boundaries explicit when needed. If there is not a single evident logical order, pick the order you consider best or use alphabetical order.
+
+Consider configuration files as another type of source code and apply the same criteria, using comments when possible for better readability.
+
+### Ignoring QA errors
+
+You may occasionally need to disable checks from _quality assurance_ (QA) tools (e.g. linters, type checkers, etc.) on specific lines as some tool might not be able to fully understand why a certain piece of code is needed. This is usually done with special comments, e.g. `# noqa: F401`, `# type: ignore`. However, you should **only** ignore QA errors when you fully understand their source and rewriting your code to pass QA checks would make it less readable. Additionally, you should add a short descriptive code if possible (check [ruff rules][ruff-rules] and [mypy error codes][mypy-error-codes] for reference):
+
+```python
+f = lambda: 'empty'  # noqa: E731 [lambda-assignment]
+```
+
+and, if needed, a brief comment for future reference:
+
+```python
+...
+return undeclared_symbol  # noqa: F821 [undefined-name] on purpose to trigger black-magic
+```
+
+## Testing
+
+Testing components is a critical part of a software development project. We follow standard practices in software development and write unit, integration, and regression tests. Note that even though [doctests][doctest] are great for documentation purposes, they lack many features and are difficult to debug. Hence, they should not be used as replacement for proper unit tests except in trivial cases.
+
+<!-- Reference links -->
+
+[doctest]: https://docs.python.org/3/library/doctest.html
+[google-style-guide]: https://google.github.io/styleguide/pyguide.html
+[mypy]: https://mypy.readthedocs.io/
+[mypy-error-codes]: https://mypy.readthedocs.io/en/stable/error_code_list.html
+[pre-commit]: https://pre-commit.com/
+[pylint]: https://pylint.pycqa.org/
+[ruff-formatter]: https://docs.astral.sh/ruff/formatter/
+[ruff-linter]: https://docs.astral.sh/ruff/linter/
+[ruff-rules]: https://docs.astral.sh/ruff/rules/
+[sphinx]: https://www.sphinx-doc.org
+[sphinx-autodoc]: https://www.sphinx-doc.org/en/master/usage/extensions/autodoc.html
+[sphinx-napoleon]: https://sphinxcontrib-napoleon.readthedocs.io/en/latest/index.html#
+[sphinx-rest]: https://www.sphinx-doc.org/en/master/usage/restructuredtext/basics.html
+[ci-docs]: docs/development/CI/infrastructure.md
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index 55e3f0a..8c6b57a 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -1,20 +1,12 @@
-See the [Scientific Python Developer Guide][spc-dev-intro] for a detailed
-description of best practices for developing scientific packages.
+# Contributing
 
-[spc-dev-intro]: https://learn.scientific-python.org/development/
+JaCe is an open-source project that accepts contributions from any individual or organization. Proper credit will be given to contributors by adding their names to the [AUTHORS.md](AUTHORS.md) file.
 
 # Quick development
 
-The fastest way to start with development is to use nox. If you don't have nox,
-you can use `pipx run nox` to run it without installing, or `pipx install nox`.
-If you don't have pipx (pip for applications), then you can install with
-`pip install pipx` (the only case were installing an application with regular
-pip is reasonable). If you use macOS, then pipx and nox are both in brew, use
-`brew install pipx nox`.
+The fastest way to start with development is to use nox. If you don't have nox, you can use `pipx run nox` to run it without installing, or `pipx install nox`. If you don't have pipx (pip for applications), then you can install with `pip install pipx` (the only case were installing an application with regular pip is reasonable). If you use macOS, then pipx and nox are both in brew, use `brew install pipx nox`.
 
-To use, run `nox`. This will lint and test using every installed version of
-Python on your system, skipping ones that are not installed. You can also run
-specific jobs:
+To use, run `nox`. This will lint and test using every installed version of Python on your system, skipping ones that are not installed. You can also run specific jobs:
 
 ```console
 $ nox -s lint  # Lint only
@@ -23,8 +15,7 @@ $ nox -s docs -- --serve  # Build and serve the docs
 $ nox -s build  # Make an SDist and wheel
 ```
 
-Nox handles everything for you, including setting up an temporary virtual
-environment for each run.
+Nox handles everything for you, including setting up an temporary virtual environment for each run.
 
 # Setting up a development environment manually
 
@@ -34,33 +25,29 @@ You can set up a development environment by running:
 python3 -m venv .venv
 source ./.venv/bin/activate
 pip install --upgrade pip setuptools wheel
-pip install -r requirements-dev.txt 
+pip install -r requirements-dev.txt
 pip install -v -e .
 ```
 
-If you have the
-[Python Launcher for Unix](https://github.com/brettcannon/python-launcher), you
-can instead do:
+If you have the [Python Launcher for Unix](https://github.com/brettcannon/python-launcher), you can instead do:
 
 ```bash
 py -m venv .venv
 py -m pip install --upgrade pip setuptools wheel
-py -m pip install -r requirements-dev.txt 
+py -m pip install -r requirements-dev.txt
 py -m pip install -v -e .
 ```
 
 # Post setup
 
-You should prepare pre-commit, which will help you by checking that commits pass
-required checks:
+You should prepare pre-commit, which will help you by checking that commits pass required checks:
 
 ```bash
 pip install pre-commit # or brew install pre-commit on macOS
 pre-commit install # Will install a pre-commit hook into the git repo
 ```
 
-You can also/alternatively run `pre-commit run` (changes only) or
-`pre-commit run --all-files` to check even without installing the hook.
+You can also/alternatively run `pre-commit run` (changes only) or `pre-commit run --all-files` to check even without installing the hook.
 
 # Testing
 
@@ -94,12 +81,30 @@ nox -s docs -- --serve
 
 # Pre-commit
 
-This project uses pre-commit for all style checking. While you can run it with
-nox, this is such an important tool that it deserves to be installed on its own.
-Install pre-commit and run:
+This project uses pre-commit for all style checking. While you can run it with nox, this is such an important tool that it deserves to be installed on its own. Install pre-commit and run:
 
 ```bash
 pre-commit run -a
 ```
 
 to check all files.
+
+# Pull requests (PRs) and merge guidelines
+
+Before submitting a pull request, check that it meets the following criteria:
+
+1. Pull request with code changes should always include tests.
+2. If the pull request adds functionality, it should be documented both in the code docstrings and in the official documentation.
+3. The pull request should have a proper description of its intent and the main changes in the code. In general this description should be used as commit message if the pull request is approved (check point **5.** below).
+4. If the pull request contains code authored by first-time contributors, they should add their names to the [AUTHORS.md](AUTHORS.md) file.
+5. Pick one reviewer and try to contact them directly to let them know about the pull request. If there is no feedback in 24h/48h try to contact them again or pick another reviewer.
+6. Once the pull request has been approved, it should be squash-merged as soon as possible with a meaningful description of the changes. We use the [Conventional Commits][https://www.conventionalcommits.org/en/v1.0.0/#summary] specification for writing informative and automation-friendly commit messages. The following _commit types_ are accepted:
+   - `chore`: changes that only modify development-related tools, the build system configuration or external dependencies
+   - `ci`: changes to our CI configuration files and scripts
+   - `docs`: documentation only changes
+   - `feat`: a new feature
+   - `fix`: a bug fix
+   - `perf`: a code change that improves performance
+   - `refactor`: a code change that neither fixes a bug nor adds a feature
+   - `style`: changes that do not affect the meaning of the code (white-space, formatting, missing semi-colons, etc)
+   - `test`: adding missing tests or correcting existing tests
diff --git a/LICENSE_HEADER.txt b/LICENSE_HEADER.txt
index 75c2b7f..39ef751 100644
--- a/LICENSE_HEADER.txt
+++ b/LICENSE_HEADER.txt
@@ -1,6 +1,6 @@
-JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 
 Copyright (c) 2024, ETH Zurich
 All rights reserved.
 
-SPDX-License-Identifier: BSD-3-Clause
\ No newline at end of file
+SPDX-License-Identifier: BSD-3-Clause
diff --git a/README.md b/README.md
index 3d20d77..f17b970 100644
--- a/README.md
+++ b/README.md
@@ -1,4 +1,12 @@
-# JaCe
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+
+### JAX: High-Performance Array Computing
+
+JAX is a Python library for accelerator-oriented array computation and program transformation, designed for high-performance numerical computing and large-scale machine learning.
+
+### DaCe: Data-Centric Parallel Programming
+
+The DaCe project aims to build new representations for programs and algorithms, in order to efficiently map them to the entire hardware architecture landscape (CPU, GPU, and FPGA) with high utilization. With data-centric parallel programming, we enable direct knowledge transfer of performance optimization, regardless of the scientific application or the target processor.
 
 [![Actions Status][actions-badge]][actions-link]
 [![Documentation Status][rtd-badge]][rtd-link]
diff --git a/docs/conf.py b/docs/conf.py
index 10df60e..cb0bb09 100644
--- a/docs/conf.py
+++ b/docs/conf.py
@@ -1,4 +1,4 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
@@ -9,8 +9,9 @@
 
 import importlib.metadata
 
+
 project = "JaCe"
-copyright = "2024, ETH Zurich"
+copyright = "2024, ETH Zurich"  # noqa: A001 [builtin-variable-shadowing]
 author = "ETH Zurich"
 version = release = importlib.metadata.version("jace")
 
diff --git a/noxfile.py b/noxfile.py
index c274c52..3772f2d 100644
--- a/noxfile.py
+++ b/noxfile.py
@@ -6,6 +6,7 @@
 
 import nox
 
+
 DIR = Path(__file__).parent.resolve()
 
 nox.needs_version = ">=2024.3.2"
@@ -19,9 +20,7 @@ def lint(session: nox.Session) -> None:
     Run the linter.
     """
     session.install("pre-commit")
-    session.run(
-        "pre-commit", "run", "--all-files", "--show-diff-on-failure", *session.posargs
-    )
+    session.run("pre-commit", "run", "--all-files", "--show-diff-on-failure", *session.posargs)
 
 
 @nox.session
@@ -41,9 +40,7 @@ def docs(session: nox.Session) -> None:
 
     parser = argparse.ArgumentParser()
     parser.add_argument("--serve", action="store_true", help="Serve after building")
-    parser.add_argument(
-        "-b", dest="builder", default="html", help="Build target (default: html)"
-    )
+    parser.add_argument("-b", dest="builder", default="html", help="Build target (default: html)")
     args, posargs = parser.parse_known_args(session.posargs)
 
     if args.builder != "html" and args.serve:
@@ -55,9 +52,7 @@ def docs(session: nox.Session) -> None:
     session.chdir("docs")
 
     if args.builder == "linkcheck":
-        session.run(
-            "sphinx-build", "-b", "linkcheck", ".", "_build/linkcheck", *posargs
-        )
+        session.run("sphinx-build", "-b", "linkcheck", ".", "_build/linkcheck", *posargs)
         return
 
     shared_args = (
diff --git a/pyproject.toml b/pyproject.toml
index 358ae00..7e1025c 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -42,20 +42,33 @@ report.exclude_also = [
 ]
 run.source = ["jace"]
 
+# -- mypy  --
 [tool.mypy]
-disallow_incomplete_defs = false
-disallow_untyped_defs = false
-enable_error_code = ["ignore-without-code", "redundant-expr", "truthy-bool"]
+disallow_incomplete_defs = true
+disallow_untyped_defs = true
 files = ["src", "tests"]
+ignore_missing_imports = false
+implicit_optional = false
+implicit_reexport = false
+# install_types = true
+namespace_packages = false
+# pretty = true
 python_version = "3.10"
-strict = true
+show_column_numbers = true
+show_error_codes = true
+warn_redundant_casts = true
 warn_unreachable = true
 warn_unused_configs = true
+warn_unused_ignores = true
 
 [[tool.mypy.overrides]]
-disallow_incomplete_defs = true
-disallow_untyped_defs = true
-module = "jace.*"
+disallow_incomplete_defs = false
+disallow_untyped_defs = false
+ignore_missing_imports = true
+module = "tests.*"
+
+# -- pytest  --
+[tool.pytest]
 
 [tool.pytest.ini_options]
 addopts = ["-ra", "--showlocals", "--strict-markers", "--strict-config"]
@@ -69,40 +82,67 @@ testpaths = [
 ]
 xfail_strict = true
 
+# -- ruff --
 [tool.ruff]
+line-length = 100
+respect-gitignore = true
+show-fixes = true
 src = ["src"]
 
+[tool.ruff.format]
+docstring-code-format = true
+
 [tool.ruff.lint]
 extend-select = [
+  "A",  # flake8-builtins
   "B",  # flake8-bugbear
   "I",  # isort
-  "ARG",  # flake8-unused-arguments
+  "G",  # flake8-logging-format
   "C4",  # flake8-comprehensions
-  "EM",  # flake8-errmsg
+  "PT",  # flake8-pytest-style
+  "UP",  # pyupgrade  # TODO: evaluate and remove if needed
+  "ARG",  # flake8-unused-arguments
+  "ERA",  # eradicate
   "ICN",  # flake8-import-conventions
-  "G",  # flake8-logging-format
   "PGH",  # pygrep-hooks
   "PIE",  # flake8-pie
-  "PL",  # pylint
-  "PT",  # flake8-pytest-style
   "PTH",  # flake8-use-pathlib
-  "RET",  # flake8-return
+  "RET",  # flake8-return  # TODO: evaluate and remove if needed
   "RUF",  # Ruff-specific
-  "SIM",  # flake8-simplify
-  "T20",  # flake8-print
-  "UP",  # pyupgrade
-  "YTT",  # flake8-2020
-  "EXE",  # flake8-executable
-  "NPY",  # NumPy specific rules
-  "PD"  # pandas-vet
+  "SIM",  # flake8-simplify  # TODO: evaluate and remove if needed
+  "T10",  # flake8-debugger
+  "T20",  # flake8-print  # TODO: evaluate and remove if needed
+  "NPY"  # NumPy specific rules
 ]
 ignore = [
-  "PLR09",  # Too many <...>
-  "PLR2004",  # Magic value used in comparison
-  "ISC001"  # Conflicts with formatter
+  'E501'  # [line-too-long]
+]
+ignore-init-module-imports = true
+unfixable = []
+
+[tool.ruff.lint.isort]
+combine-as-imports = true
+known-first-party = ['jace']
+known-third-party = [
+  'cupy',
+  'dace',
+  'jax',
+  'numpy',
+  'pytest',
+  'typing_extensions'
+]
+lines-after-imports = 2
+order-by-type = true
+required-imports = ["from __future__ import annotations"]
+section-order = [
+  'future',
+  'standard-library',
+  'third-party',
+  'first-party',
+  'tests',
+  'local-folder'
 ]
-isort.required-imports = ["from __future__ import annotations"]
 
 [tool.ruff.lint.per-file-ignores]
 "noxfile.py" = ["T20"]
-"tests/**" = ["T20"]
+"tests/**" = ["T10", "T20"]
diff --git a/requirements-dev.txt b/requirements-dev.txt
index f401505..a7a822e 100644
--- a/requirements-dev.txt
+++ b/requirements-dev.txt
@@ -1,15 +1,11 @@
-# dev
+furo>=2023.08.17
 mypy >= 1.9.0
+myst_parser>=0.13
 pytest >=6
 pytest-cov >=3
 ruff >= 0.3.5
-typing-extensions>=4.10.0
-types-all
-
-# docs
-furo>=2023.08.17
-myst_parser>=0.13
 sphinx>=7.0
 sphinx_autodoc_typehints
 sphinx_copybutton
-
+types-all
+typing-extensions>=4.10.0
diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 192fe9b..56f6505 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -1,4 +1,4 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
@@ -11,6 +11,7 @@
 
 from __future__ import annotations
 
+
 __version__ = "0.1.0"
 
 __all__ = ["__version__"]
diff --git a/tests/__init__.py b/tests/__init__.py
new file mode 100644
index 0000000..116302a
--- /dev/null
+++ b/tests/__init__.py
@@ -0,0 +1,6 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
diff --git a/tests/test_package.py b/tests/test_package.py
index 23f3e78..bf92c00 100644
--- a/tests/test_package.py
+++ b/tests/test_package.py
@@ -1,4 +1,4 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.

From c9c7b07008f9df35ff7c4615d7823420c1e633c7 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 07:20:13 +0200
Subject: [PATCH 002/458] Initial import of the current development state.

---
 src/jace/__about__.py                         |   23 +
 src/jace/__init__.py                          |   16 +-
 src/jace/py.typed                             |    0
 src/jace/translator/__init__.py               |   19 +
 .../jace_subtranslator_interface.py           |  250 ++++
 .../translator/jaxpr_translator_driver.py     | 1265 +++++++++++++++++
 .../translator/sub_translators/__init__.py    |    3 +
 .../sub_translators/alu_translator.py         |  363 +++++
 src/jace/translator/util/__init__.py          |   17 +
 .../util/jace_translation_memento.py          |   79 +
 src/jace/translator/util/revision_counter.py  |   55 +
 .../util/subtranslator_helper_order.py        |   79 +
 src/jace/translator/util/util.py              |   15 +
 src/jace/util/__init__.py                     |   22 +
 src/jace/util/dace.py                         |   13 +
 src/jace/util/jax.py                          |   43 +
 src/jace/util/traits.py                       |   66 +
 src/jace/util/util.py                         |   39 +
 tests/test_subtranslator_helper_order.py      |  130 ++
 19 files changed, 2491 insertions(+), 6 deletions(-)
 create mode 100644 src/jace/__about__.py
 delete mode 100644 src/jace/py.typed
 create mode 100644 src/jace/translator/__init__.py
 create mode 100644 src/jace/translator/jace_subtranslator_interface.py
 create mode 100644 src/jace/translator/jaxpr_translator_driver.py
 create mode 100644 src/jace/translator/sub_translators/__init__.py
 create mode 100644 src/jace/translator/sub_translators/alu_translator.py
 create mode 100644 src/jace/translator/util/__init__.py
 create mode 100644 src/jace/translator/util/jace_translation_memento.py
 create mode 100644 src/jace/translator/util/revision_counter.py
 create mode 100644 src/jace/translator/util/subtranslator_helper_order.py
 create mode 100644 src/jace/translator/util/util.py
 create mode 100644 src/jace/util/__init__.py
 create mode 100644 src/jace/util/dace.py
 create mode 100644 src/jace/util/jax.py
 create mode 100644 src/jace/util/traits.py
 create mode 100644 src/jace/util/util.py
 create mode 100644 tests/test_subtranslator_helper_order.py

diff --git a/src/jace/__about__.py b/src/jace/__about__.py
new file mode 100644
index 0000000..35acfe1
--- /dev/null
+++ b/src/jace/__about__.py
@@ -0,0 +1,23 @@
+# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Package metadata: version, authors, license and copyright."""
+
+from __future__ import annotations
+
+from typing import Final
+
+from packaging import version as pkg_version
+
+
+__all__ = ["__author__", "__copyright__", "__license__", "__version__", "__version_info__"]
+
+__author__: Final = "ETH Zurich and individual contributors"
+__copyright__: Final = "Copyright (c) 2024 ETH Zurich"
+__license__: Final = "BSD-3-Clause-License"
+__version__: Final = "0.0.1"
+__version_info__: Final = pkg_version.parse(__version__)
diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 56f6505..b4d71d1 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -1,17 +1,21 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""
-JaCe: JAX jit using DaCe (Data Centric Parallel Programming)
-"""
+"""Python library for translating Jax programs into SDFG."""
 
 from __future__ import annotations
 
+from .__about__ import __author__, __copyright__, __license__, __version__, __version_info__
 
-__version__ = "0.1.0"
 
-__all__ = ["__version__"]
+__all__ = [
+    "__author__",
+    "__copyright__",
+    "__license__",
+    "__version__",
+    "__version_info__",
+]
diff --git a/src/jace/py.typed b/src/jace/py.typed
deleted file mode 100644
index e69de29..0000000
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
new file mode 100644
index 0000000..65a4e3d
--- /dev/null
+++ b/src/jace/translator/__init__.py
@@ -0,0 +1,19 @@
+# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Subpackage containing all the code related to Jaxpr translation"""
+
+from __future__ import annotations
+
+from jace.translator.jace_subtranslator_interface import JaCeSubTranslatorInterface
+from jace.translator.jaxpr_translator_driver import JaxprTranslationDriver
+
+
+__all__ = [
+    "JaCeSubTranslatorInterface",
+    "JaxprTranslationDriver",
+]
diff --git a/src/jace/translator/jace_subtranslator_interface.py b/src/jace/translator/jace_subtranslator_interface.py
new file mode 100644
index 0000000..2eda73b
--- /dev/null
+++ b/src/jace/translator/jace_subtranslator_interface.py
@@ -0,0 +1,250 @@
+# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+from __future__ import annotations
+
+from collections.abc import Collection, Sequence
+from typing import TYPE_CHECKING, Any, Final, final
+
+import dace
+from jax import core as jcore
+
+
+if TYPE_CHECKING:
+    from .jaxpr_translator_driver import JaxprTranslationDriver
+
+
+class JaCeSubTranslatorInterface:
+    """Interface for all Jax primitive/intrinsic translators.
+
+    A translator for a primitive, sometimes also called intrinsic, translates a single equation of a Jaxpr into its SDFG equivalent.
+
+    A type that implements this interface must fulfil the following properties:
+    - It must be stateless.
+        It is still possible and explicitly allowed to have an immutable configuration state.
+    - All subclasses has to accept '**kwargs' arguments and must forward all unconsumed arguments to the base.
+        Thus the '__init__()' function of the base must be called.
+
+    Once a subtranslator is initialized the driver will call its 'get_handled_primitives()' function, which returns the names of all Jax primitives it would like to handle.
+    A subtranslator can register for as many primitive it wants.
+    At the same time more than one subtranslators can be registered for a single primitive.
+
+    To decide which subtranslator should be used for a single equation the driver will use their 'can_translate_jaxeqn()' function.
+    The first subtranslator that returns 'True' will then be used.
+    Note it is unspecific if the 'can_translate_jaxeqn()' of the remaining subtranslators is also called.
+
+    There are two ways how to influence the order in which they are processed.
+    The first and simple one is to implement 'get_priority()'.
+    The driver will order the subtranslators, in ascending order, according to their respective priority.
+    Thus the lower the priority the earlier the subtranslator is checked.
+    Subtranslators that returns 'JaCeSubTranslatorInterface.DEFAULT_PRIORITY' are handled specially and are _always_ put at the end of the list (in unspecific order).
+
+    The second possibility is to override the '__lt__()' and '__eq__()' functions.
+    While this allows more control it might be more difficult.
+    If a subtranslator does this, its 'get_priority()' function should return 'NotImplemented'.
+    """
+
+    __slots__ = ()
+
+    # Default value for the priority of primitive translators.
+    DEFAULT_PRIORITY: Final = int("1" * 64, base=2)
+
+    def __init__(
+        self,
+        *args,
+        **kwargs,
+    ):
+        """Initialize the interface.
+
+        It is required that subclasses calls this method during initialization.
+        """
+
+    def get_handled_primitives(self) -> Collection[str] | str:
+        """Returns the names of all Jax primitives that can be handled by this subtranslator.
+
+        The returned collection is used to narrow down which translator should be used to translate a given primitive.
+        It is possible that several translators can be registered for the same name.
+
+        See Also:
+            'self.can_translate_jaxeqn()' and 'self.get_priority()'.
+
+        Notes:
+            It is also possible to return a string instead of a collection with just one element.
+        """
+        raise NotImplementedError(
+            "Class '{type(self).__name__}' does not implement 'get_handled_primitives()'."
+        )
+
+    def can_translate_jaxeqn(
+        self,
+        driver: "JaxprTranslationDriver",
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jcore.JaxprEqn,
+    ) -> bool:
+        """Tests if 'self' is able to translate the Jax primitive passed as 'eqn'.
+
+        This function is used by the driver translator to determine which subtranslator
+        should be used to handle the 'jcore.JaxprEqn', i.e. primitive.
+        For a more detailed description of the arguments see 'self.translate_jaxeqn()' function.
+
+        Args:
+            driver:         The driver object of the translation.
+            in_var_names:   Names of the SDFG variables used as inputs for the primitive.
+            out_var_names:  Names of the SDFG variables used as outputs for the primitive.
+            eqn:            The 'jcore.JaxprEqn' instance that is currently being handled.
+
+        Notes:
+            This function has to consider 'self' and all of its arguments as constant.
+            In case there is only one subtranslator registered for a certain primitive,
+                it is unspecific if this function will be called before 'self.translate_jaxeqn()' is called.
+            This function will never be called for a primitive for which it has not registered itself.
+        """
+        raise NotImplementedError(
+            "Class '{type(self).__name__}' does not implement 'can_translate_jaxeqn()'."
+        )
+
+    def translate_jaxeqn(
+        self,
+        driver: "JaxprTranslationDriver",
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jcore.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> dace.SDFGState | None:
+        """Translates the Jax primitive into its SDFG equivalent.
+
+        Before the driver will call this function to translate the primitive into an SDFG it will perform the following preparatory tasks:
+        - It will allocate the SDFG variables that are used as outputs.
+            Their names will be passed through the 'out_var_names' argument, in the same order as 'eqn.outvars'.
+        - It will collect the names of the SDFG variables that are used as input and place them in 'in_var_names', in the same order as 'eqn.invars'.
+            If an input argument refers to a literal no SDFG variable is created for it and 'None' is passed to indicate this.
+        - The driver will create a new terminal state and pass it as 'eqn_state' argument.
+            This state is guaranteed to be empty and 'translator.getTerminalState() is eqn_state' holds.
+
+        If 'self' returns 'None' the driver assumes that the whole primitive was constructed inside 'eqn_state', and the terminal state will left unmodified.
+        However, in case 'self' explicitly returns a state, the driver will use it as new terminal state.
+
+        Args:
+            driver:         The driver object of the translation.
+            in_var_names:   List of the names of the arrays created inside the SDFG for the inpts or 'None' in case of a literal.
+            out_var_names:  List of the names of the arrays created inside the SDFG for the outputs.
+            eqn:            The Jax primitive that should be translated.
+            eqn_state:      State into which the primitive's SDFG representation should be constructed.
+
+        Notes:
+            A subtranslator is free to do anything to the passed 'eqn_state' with the exception of deleting it or modifying any of its _incoming_ interstateedges.
+            As a general rule, if the subtranslator has to create more states it should explicitly return the new terminal state.
+        """
+        raise NotImplementedError(
+            "Class '{type(self).__name__}' does not implement 'translate_jaxeqn()'."
+        )
+
+    def get_priority(self) -> int:
+        """Returns the priority of this translator.
+
+        In case many translators are registered for the same primitive, see 'self.get_handled_primitives()' they must be ordered.
+        The translators are ordered, and checked by the driver according to this value.
+        The _smaller_ the value the earlier it is checked.
+
+        See Also:
+            'self.can_translate_jaxeqn()' and 'self.get_handled_primitives()'.
+
+        Notes:
+            By default the function returns 'self.DEFAULT_PRIORITY', which is handled specially, i.e. it is put at the end.
+            If a subtranslator opts in to overwrite '__lt__()' instead the function should return 'NotImplemented'.
+                Such translators are biased towards lower priorities.
+        """
+        return self.DEFAULT_PRIORITY
+
+    def has_default_priority(self) -> bool:
+        """Checks if 'self' has default priority.
+
+        Notes:
+            It is allowed, but not advised to override this function.
+                However, it has to be consistent with 'self.get_priority()'.
+        """
+        try:
+            x = self.get_priority()
+        except NotImplementedError:
+            return False
+        if x is NotImplemented:
+            return False
+        return x is self.DEFAULT_PRIORITY or (x == self.DEFAULT_PRIORITY)
+
+    def __lt__(
+        self,
+        other: JaCeSubTranslatorInterface,
+    ) -> bool:
+        """Tests if 'self' should be checked before 'other' in the selection process.
+
+        As outlined in the class description there are two possibilities to influence the order in which subtranslators are checked.
+        The simpler one is simply to implement 'get_priority()'.
+        The second one, is to override the '__lt__()' function, which allows to inspect the other subtranslators.
+
+        Notes:
+            If you override this function it is advised that 'get_priority()' returns 'NotImplemented'.
+            This function is never called if either 'self' or 'other' have default priority.
+        """
+        return self.get_priority() < other.get_priority()
+
+    def __eq__(
+        self,
+        other: Any,
+    ) -> bool:
+        """Tests if two subtranslators are equal.
+
+        The default implementation checks if 'self' and 'other' have the same type.
+        However, it your subtranslator strongly depend on its configuration you should override this function.
+
+        Notes:
+            If you override this function you should also override 'self.__hash__()' to make the two consistent.
+        """
+        if not isinstance(other, JaCeSubTranslatorInterface):
+            return NotImplemented
+        return type(self) == type(other)
+
+    def __hash__(self) -> int:
+        """Computes the hash of the subtranslator.
+
+        The default implementation return a hash that is based on the class.
+        Thus all instances of a particular subtranslator will have the same hash value.
+
+        Notes:
+            If you override this function you should also override 'self.__eq__()' to make the two consistent.
+        """
+        return id(self.__class__)
+
+    @final
+    def __ne__(
+        self,
+        other: Any,
+    ) -> bool:
+        return NotImplemented
+
+    @final
+    def __le__(
+        self,
+        other: Any,
+    ) -> bool:
+        return NotImplemented
+
+    @final
+    def __ge__(
+        self,
+        other: Any,
+    ) -> bool:
+        return NotImplemented
+
+    @final
+    def __gt__(
+        self,
+        other: Any,
+    ) -> bool:
+        return NotImplemented
+
+
+# end class(JaCeSubTranslatorInterface):
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
new file mode 100644
index 0000000..fb6856f
--- /dev/null
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -0,0 +1,1265 @@
+# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+from __future__ import annotations
+
+import re
+from collections.abc import Collection, Iterable, Mapping, Sequence
+from typing import Any, Final, Union, cast, overload
+
+import dace
+import jax
+from dace import data as ddata, properties as dprop
+from jax import core as jcore
+
+from jace import translator
+from jace.translator import util as jtrutil
+from jace.util import jax as jutil
+
+
+class JaxprTranslationDriver:
+    """Internal driver class for creating an SDFG equivalent of a `Jaxpr` instance.
+
+    The idea of the transformation is quite simple.
+    Since Jaxpr is essentially a list consisting of more or less simple instructions, we will process them one after the other.
+    For simplicity we will put each equation in its own state, primitives that needs more states must be put into a nested SDFG.
+
+    This class builds an SDFG of a very particular form, which is not directly usable.
+    But it is used as the canonical form inside JaCe and characterized by:
+    - the SDFG is a list of states, each state corresponds to single Jax primitive,
+    - all variable names are derived from Jax names,
+    - there are no global variables inside the SDFG,
+    - there is no possibility to return something.
+
+    To support nested Jaxpr expressions the driver provides the possibility to clone/fork itself, see `self.fork()` for more.
+    Clones, i.e. the return values of `self.fork()`, also known as children or clone, have a unique identifier, called revision.
+    It is important that the revision is only unique within a family and during a translation process.
+    This identifier is used to generate unique variable names.
+    The clones form a tree that is rooted at the so called 'head translator', i.e. the driver that was explicitly created.
+
+    The actual translation of a Jaxpr equation is not handled by the driver instance directly.
+    Instead it is forwarded to a subtranslator instance, see `JaCeSubTranslatorInterface` for more.
+    These subtranslators are independent objects that are owned by the driver.
+    However, they are tightly coupled and thus a subtranslator is allowed to use the following private functions:
+    - `_add_array()` if the translator has to create new.
+    - `_create_jax_var_list()` for the bulk creation of Jax variables.
+    - `_add_reserved_names()` if a name should be blocked (only affects later equation.
+    - `_add_jax_name_mapping()` for creating new links between Jax variables and SDFG variables.
+    However, a subtranslator should only call them if it is neccessary.
+
+
+    If no translation is ongoing the only function that makes sense to call is `translate_jaxpr()` to start a translation.
+    Driver supplied to the subtranslators as arguments, such as in `translateEqn()` are allowed to call any public function of the driver.
+    In addition to them it is allowed to call:
+
+    Notes:
+        Equations that only have `_` as output variable are skipped.
+        It is not safe to deepcopy `self` during an active translation instead you should use `self.fork()`.
+        To ensure unique names also in the presence of nested SDFG every instance contains a revision index.
+
+    Todos:
+        Split the functions into several interfaces one, that is for the whole world to use, one for subtranlators and one for the implementation.
+    """
+
+    # Member variables that are private to an instance, i.e. they are not passed on to the children.
+    #  By definition all private variable belongs to the translation context but not all variable of the translation context are private.
+    #   NOTE: The context also includes some shared members, but they are handled a bit differently.
+    __private_slots__ = (
+        "_sdfg",
+        "_term_sdfg_state",
+        "_init_sdfg_state",
+        "_jax_name_map",
+        "_sdfg_in_names",
+        "_sdfg_out_names",
+        "_rev_idx",
+    )
+    # These are the member variables that are shared among the forks.
+    __shared_slots__ = (
+        "_reserved_names",  # Part of the context.
+        "_sub_translators",
+        "_rev_manager",  # This is the revision counter manager
+    )
+    __slot__ = __private_slots__ + __shared_slots__
+
+    def __init__(
+        self,
+        **kwargs: Any,
+    ) -> None:
+        """Creates the base translator.
+
+        This function will forward all arguments that does _not_ start with an underscore to the constructors of the subtranslators.
+        Furthermore, this function will allocate the shared members, but the private members are not allocated.
+
+        Args:
+            _no_shared_alloc (bool):     If set then all allocation will be avoided (internal)
+
+        Notes:
+            All arguments that does not start with an underscore are forwarded to the translators for the intrinsics.
+            By setting `_no_shared_alloc` to `True` the function will not allocate the shared part.
+                This flag is provided only for implementing `self.fork()` using it denotes an error and undefined behaviour.
+        """
+        allocate_shared_parts: bool = not kwargs.pop("_no_shared_alloc", False)
+
+        # Contains all the subtranslators that we need.
+        #  They are partitioned by the names of the primitive they have registered for.
+        #  Inside a partition they are ordered by priority, lowest first, more important.
+        #  This member is allocated by '_init_sub_translators()' and remains allocated during the lifetime of the object.
+        self._sub_translators: dict[str, list[translator.JaCeSubTranslatorInterface]] = None  # type: ignore[assignment]
+
+        # The SDFG object that we are currently constructing.
+        #  Only allocated during an ongoing translation.
+        self._sdfg: dace.SDFG = None
+
+        # This is the HEAD SDFG state, i.e. the last state in which we translated an equation.
+        #  Only allocated during an ongoing translation.
+        self._term_sdfg_state: dace.SDFGState = None
+
+        # This is the beginning of the SDFG, i.e. the original SDFG HEAD.
+        #  Only allocated during an ongoing translation.
+        self._init_sdfg_state: dace.SDFGState = None
+
+        # This is the mapping, that maps the Jax name to the name that is used inside the SDFG.
+        #  Only allocated during an ongoing translation.
+        self._jax_name_map: dict[str, str] = None  # type: ignore[assignment]
+
+        # These names can not be used for the automatic naming of Jax variables.
+        #  They differ from the forbidden names, that they denote valid SDFG names.
+        #  An example would be names of the function arguments.
+        #  Only allocated during an ongoing translation.
+        self._reserved_names: set[str] = None  # type: ignore[assignment]
+
+        # These are the names of the SDFG variables that serves as input and output.
+        #  They have the same order as in the Jaxpr.
+        #  Only allocated during an ongoing translation.
+        self._sdfg_in_names: Sequence[str] = None  # type: ignore[assignment]
+        self._sdfg_out_names: Sequence[str] = None  # type: ignore[assignment]
+
+        # This is the manager for the revision counter.
+        #  It is shared among all children.
+        #  Might be overwritten if we are in the context of 'fork()'.
+        self._rev_manager: jtrutil.RevisionCounterManager = jtrutil.RevisionCounterManager()
+
+        # This is the revision of self.
+        #  Unlike the manager it is not shared and private.
+        #  Might be overwritten in the context of a fork.
+        self._rev_idx: int = self._rev_manager.assign_revision()
+        assert self.is_head_translator()
+
+        # If requested we will now allocate some internal state
+        if allocate_shared_parts:
+            self._init_sub_translators(kwargs)
+
+    def translate_jaxpr(
+        self,
+        jaxpr: jcore.ClosedJaxpr,
+        *,
+        inp_scalar_as_array: bool = False,
+        name: str | None = None,
+        reserved_names: str | Collection[str] | None = None,
+        allow_empty_jaxpr: bool = False,
+        _clear_translation_ctx: bool = True,
+    ) -> jtrutil.JaCeTranslationMemento:
+        """Perform the translation of a Jaxpr description into a SDFG.
+
+        As described above the function will create the canonical form of Jaxpr based SDFGs.
+        Furthermore the function will return the SDFG encaplulated inside a `jace.translator.util.JaCeTranslationMemento` object.
+
+        Args:
+            inp_scalar_as_array:       Translate scalar _input_ arguments to arrays of length 1.
+            name:                   Use this name for the SDFG instead some generated one.
+            reserved_names:          Prevent the generation of such names, when translating Jax variable names into SDFG names.
+            allow_empty_jaxpr:        Allows empty Jaxpr.
+            _clear_translation_ctx:      Do not deallocate the inner state of `self`.
+
+        Notes:
+            By default the function will store its translation state inside the return value and deallocate the internal members.
+                However, by setting `_clear_translation_ctx` to `False` `self` is not deallocated.
+                This means that `self` and the returned memento share the same state.
+                To explicitly deallocate the translation context of `self`, which is required, use `self._clearTranslatorCtx()`.
+        """
+        if self.is_allocated():
+            raise RuntimeError(
+                "The translator driver is already allocated, you should resort to 'fork()'."
+            )
+        if (len(jaxpr.eqns) == 0) and (not allow_empty_jaxpr):
+            raise ValueError("Passed an empty Jaxpr, but did not allow for empty Jaxpr.")
+        if not isinstance(jaxpr, jcore.ClosedJaxpr):
+            raise TypeError(f"Expected a 'jax.core.ClosedJaxp' instance but got '{type(jaxpr)}'")
+        if len(jaxpr.effects) != 0:
+            raise NotImplementedError(
+                "Currently 'Jaxpr' instances with side effects are not supported."
+            )
+        if len(jaxpr.out_avals) == 0:
+            raise ValueError("Jaxpr has zero output variables.")
+        if not jax.config.read("jax_enable_x64"):
+            raise NotImplementedError(
+                "The translation only works if 'jax_enable_x64' is enabled. Do it manually or use 'self.transform()'!"
+            )
+
+        self._allocate_translation_ctx(
+            name=name,
+            reserved_names=reserved_names,
+        )
+        self._create_initial_input(
+            jaxpr=jaxpr,
+            inp_scalar_as_array=inp_scalar_as_array,
+        )
+        self._create_constants(
+            jaxpr=jaxpr,
+        )
+        memento: jtrutil.JaCeTranslationMemento = self._translate_jaxpr_internal(jaxpr)
+
+        if _clear_translation_ctx:
+            self._clear_translation_ctx()
+
+        return memento
+
+    def fork(self) -> JaxprTranslationDriver:
+        """Return a child of `self` ready for transformation.
+
+        The returned object, known as child, will always be of type `JaxprTranslationDriver`, and should be seen as a partial clone of `self`.
+        While the child shares some members with its parent, i.e. `self`, it has an unallocated translation context.
+        Essentially, this function returns an object that when its `translate_jaxpr()` function is called behaves the exact same way as
+        its parent behaved as it was called just with another `jaxpr` argument.
+
+        Notes:
+            A user has to ensure that the lifetime of a fork ends before the one of its direct parent.
+                In case of a head translator, the lifetime of its children have to end before the translation process finishes.
+        """
+        # Create a new (empty) driver instance; prevent allocation to make it cheep
+        dolly: JaxprTranslationDriver = JaxprTranslationDriver(_no_shared_alloc=True)
+
+        # Copy the shared members from parent to fork.
+        for slotName in self.__shared_slots__:
+            setattr(dolly, slot_name, getattr(self, slot_name))
+
+        # Handle the special members and initialize them.
+        dolly._rev_idx = dolly._rev_manager.assign_revision()
+        assert not dolly.is_head_translator()
+
+        return dolly
+
+    def append_new_state(
+        self,
+        label: str | None = None,
+        condition: dprop.CodeBlock | None = None,
+        assignments: Mapping[str, Any] | None = None,
+        *,
+        prev_state: dace.SDFGState | None = None,
+    ) -> dace.SDFGState:
+        """Creates a new SDFGState and appends it.
+
+        By default the new SDFGState is appended to the current terminal SDFGState.
+        However, if `prev_state` is given the new SDFGState will be appended to it instead.
+
+        Args:
+            label:          The name that should be used for the new SDFGState.
+            condition:      The condition of the state transitions used on the InterstateEdge.
+            assignments:    Symbol assignments that should be done during the transition.
+            prev_state:      Alternative SDFGState to which we should append the new SDFGState.
+
+        Notes:
+            In case no SDFGState exists yet, an initial SDFGState will be created first.
+            This function is similar to `SDFGState.add_state_after()` but differs in the fact that it does not perform reconnecting.
+                I.e. if the state to which we append already has downstream states they will not be reconnected to be after the newly created state.
+            This function will not update the head state of `self`.
+        """
+        assert self._sdfg is not None
+
+        # Test if we must create a start state.
+        if self._sdfg.start_block is None:
+            self._init_sdfg_state = self._sdfg.add_state(label="initial_state", is_start_block=True)
+            self._term_sdfg_state = self._init_sdfg_state
+        assert self._sdfg.start_block is self._init_sdfg_state
+
+        # Now create and append the new state
+        app_state: dace.SDFGState = self._term_sdfg_state if prev_state is None else prev_state
+        new_state = self._sdfg.add_state(label, is_start_block=False)
+        self._sdfg.add_edge(
+            app_state,
+            new_state,
+            dace.sdfg.InterstateEdge(condition=condition, assignments=assignments),
+        )
+
+        return new_state
+
+    def get_arrays(self) -> Mapping[str, ddata.Data]:
+        """Get the maps containing all known arrays inside the SDFG.
+
+        Essentially a shorthand and preferred way for `self.get_sdfg().arrays`.
+        """
+        assert self._sdfg is not None
+        return cast(Mapping[str, ddata.Data], self._sdfg.arrays)
+
+    def get_array(
+        self,
+        name: str | jcore.Atom,
+    ) -> ddata.Data:
+        """Returns the `dace.data.Data` object `name` referees to.
+
+        If `name` is a string, it is directly interpreted as the name of an SDFG variable.
+        In case it is a `jax.core.Atom` it is first translated.
+        """
+        assert self._sdfg is not None
+
+        if isinstance(name, str):
+            pass
+        elif isinstance(name, jcore.Atom):
+            name = self.map_jax_var_to_sdfg(name)
+        else:
+            raise TypeError(f"Does not know how to handle '{type(name).__name__}'.")
+        if name not in self._sdfg.arrays:
+            raise KeyError(f"Requested the SDFG array '{name}' but it is not known.")
+
+        return self._sdfg.arrays[name]
+
+    @overload
+    def map_jax_var_to_sdfg(
+        self,
+        jax_var: str | jcore.Atom,
+    ) -> str: ...
+
+    @overload
+    def map_jax_var_to_sdfg(
+        self,
+        jax_var: str | jcore.Atom,
+        allow_fail: bool,
+    ) -> Union[str, None]: ...
+
+    def map_jax_var_to_sdfg(
+        self,
+        jax_var: str | jcore.Atom,
+        allow_fail: bool = False,
+    ) -> Union[str, None]:
+        """Returns the name of the SDFG variable that the Jax variable `jax_var` is referring to.
+
+        Args:
+            jax_var:        The Jax variable to look up.
+            allow_fail:     If mapping is not known return `None` instead of raise `KeyError`.
+        """
+        assert self._jax_name_map is not None
+        assert isinstance(jax_var, (jcore.Atom, str))
+
+        jax_var = jutil.get_jax_var_name(jax_var)
+        if jax_var not in self._jax_name_map:
+            if allow_fail:
+                return None
+            KeyError(f"The Jax variable '{jax_var}' was never registered.")
+
+        return self._jax_name_map[jax_var]
+
+    def get_sdfg(self) -> dace.SDFG:
+        """Returns the tentative SDFG that is currently constructed.
+
+        If you want access to the arrays of the SDFG use `self.get_arrays()`/`self.get_array()`.
+        """
+        assert self._sdfg is not None
+        assert (self._init_sdfg_state is None) or (self._init_sdfg_state is self._sdfg.start_block)
+        return self._sdfg
+
+    def get_terminal_sdfg_state(self) -> dace.SDFGState:
+        """Returns the current tentative terminal state of the SDFG under construction.
+
+        Since the translator works by turning each Jax primitive into an SDFG state, the constructed SDFG is essentially a list of states.
+        This function returns the tentative final/terminal SDFGState of the SDFG.
+        States of new primitives will be appended to this one.
+
+        Notes:
+            It is an error to call this function outside the context of a subtranslator.
+                If you want access to the arrays of the SDFG use `self.get_arrays()`.
+        """
+        assert all(x is not None for x in (self._sdfg, self._term_sdfg_state))
+        return self._term_sdfg_state
+
+    def is_allocated(self) -> bool:
+        """Tests if `self` is allocated.
+
+        This function only checks if the translation context is allocated.
+        As a side effect a return value of `True` means that a translation process is ongoing.
+
+        Notes:
+            The state of the reserved name list is handled specially.
+                In case the function returns `True` it is guaranteed that it is allocated.
+                If `False` is returned it might or might not be allocated.
+        """
+        small_ctx: Sequence[Any] = [getattr(self, x)  for x in self.__shared_slots__ if x != "_reserved_names"]
+        if all((x is None) for x in small_ctx):
+            if self._reserved_names is None:
+                raise RuntimeError(
+                    "Invalid allocation state: All context variables except the reserved name list are allocated."
+                )
+            return True
+        elif all((x is not None) for x in small_ctx):
+            return False
+
+        raise RuntimeError("Invalid allocation state: Translation context is mixed allocated.")
+
+    def is_head_translator(self) -> bool:
+        """Tests if `self` is a head translator.
+
+        A head translator is a translator/driver that was created explicitly, i.e. not by `self.fork()`.
+        """
+        return self._rev_manager.is_root_revision(self._rev_idx)
+
+    def same_family(
+            self,
+            other: JaxprTranslationDriver,
+    ) -> bool:
+        """Test if `self` and `other` belongs to the same family of driver/translators.
+
+        They belong to the same family if they decend from the same head translator.
+        """
+        if not isinstance(other, JaxprTranslationDriver):
+            return NotImplemented
+        if(all(getattr(self, x) is getattr(self, x)  for x in self.__shared_slots__)):
+            #assert (self if (self._rev_idx < other._rev_idx) else other).is_allocated()
+            return True
+        assert not any(getattr(self, x) is getattr(self, x)  for x in self.__shared_slots__)
+
+        return False
+
+
+    @staticmethod
+    def translate_dtype(dtype: Any) -> dace.typeclass:
+        """Turns a Jax datatype into a DaCe datatype.
+
+        Todo:
+            Imporove.
+        """
+        nameof_dtype = str(dtype)
+
+        # Make some basic checks if the datatype is okay
+        if (not jax.config.read("jax_enable_x64")) and (nameof_dtype == "float64"):
+            raise ValueError("Found a 'float64' type but 'x64' support is disabled.")
+        if nameof_dtype.startswith("complex"):
+            raise NotImplementedError("Support for complecx computation is not implemented.")
+
+        # Now extract the datatype from dace, this is extremely ugly.
+        if not hasattr(dace.dtypes, nameof_dtype):
+            raise TypeError(
+                f"Could not find the type '{nameof_dtype}' ({type(dtype).__name__}) in 'dace.dtypes'."
+            )
+        dcd_type = getattr(dace.dtypes, nameof_dtype)
+
+        if not isinstance(dcd_type, dace.dtypes.typeclass):
+            raise TypeError(
+                f"Expected that '{nameof_dtype}' would map to a 'dace.typeclass' but it mapped to a '{type(dcd_type).__name__}'."
+            )
+
+        return dcd_type
+
+    def _add_jax_name_mapping(
+            self,
+            jax_var: str | jcore.Atom,
+            sdfg_name: str
+    ) -> JaxprTranslationDriver:
+        """Creates the mapping between `jax_var` to `sdfg_name`.
+
+        It is an error if there is already a mapping installed for `jax_var`.
+
+        Args:
+            jax_var:     The Jax variable that is used.
+            sdfg_name:   The name of the corresponding SDFG variable.
+
+        Notes:
+            While the function allows to create a mapping for Jax names that are in the set of avoided names,
+                it will refuse to create a mapping for a forbidden name.
+        """
+        assert self._jax_name_map is not None
+        assert isinstance(jax_var, (jcore.Atom, str))
+
+        jax_name = jutil.get_jax_var_name(jax_var)
+        if jax_name in self._jax_name_map:
+            if self._jax_name_map[jax_name] == sdfg_name:  # We consider this as no ops.
+                return self
+            raise ValueError(
+                f"Tried to create a mapping for Jax variable '{jax_name}' to '{sdfg_name}', but that mapping exists already and is pointing to '{self.map_jax_var_to_sdfg(jax_name)}'."
+            )
+        if sdfg_name not in self.get_arrays():
+            raise KeyError(
+                f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but '{sdfg_name}' is not a known SDFG variable."
+            )
+        elif sdfg_name in self._forbidden_names:
+            raise NameError(  # This is actually an internal error
+                f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but '{sdfg_name}' is forbidden."
+            )
+
+        self._jax_name_map[jax_name] = sdfg_name
+        return self
+
+    def _add_reserved_names(
+        self,
+        reserved_names: None | str | Collection[str],
+    ) -> JaxprTranslationDriver:
+        """Adds the names listed in `reserved_names` to the internal list."""
+        assert isinstance(self._reserved_names, set)
+
+        if reserved_names is None:
+            return self
+        elif isinstance(reserved_names, str):
+            reserved_names = [reserved_names]
+        elif isinstance(reserved_names, Collection):
+            pass
+        else:
+            raise TypeError(f"Does not know how to handle the type '{type(reserved_names).__name__}'.")
+        assert all(isinstance(x, str) for x in reserved_names)
+
+        self._reserved_names.update(reserved_names)
+        return self
+
+    def _add_array(
+        self,
+        arg: jcore.Atom,
+        *,
+        as_transient: bool = True,
+        alt_name: str | None = None,
+        name_prefix: str | None = None,
+        force_array: bool = False,
+        as_view: bool = False,
+        strides: Sequence[int | dace.symbol | str] | None = None,
+        symb_strides: bool | None = None,
+        find_new_name: bool | None = None,
+        allow_literals: bool = False,
+        force_jax_name: bool = False,
+        update_var_mapping: bool = False,
+    ) -> str:
+        """Creates an SDFG variable for the Jax variable `arg` and returns the SDFG name.
+
+        By default the function will create a transient, which can be changed by setting `as_transient` to `False`.
+        In case the Jax variable `arg` refers to a scalar, i.e. having an empty shape, the function will generate a SDFG scalar.
+        However, if `force_array` is set, then it will generate an array with shape `(1,)`.
+        For generating a `View` you must set `as_view` to `True`.
+
+        By specifying `alt_name` it is possible to force a certain name on a variable.
+        It is important that if `alt_name` is specified the function will either generate the variable or fail.
+        In case `alt_name` is not given, then the function will be derived one from `jutil.get_jax_var_name(arg)`.
+        The  driver distinguishes between two kinds of "bad (SDFG) variable names".
+        The first category are the forbidden names, which the function refuses to generate.
+        The second one are the reserved names, which were set at the beginning.
+        These names can be used if they are specified through `alt_name` but are not used in automatic naming.
+
+        If nothing is specified, the strides of the data are determined by DaCe, which is continuous C order.
+        There are two ways to change that.
+        The first way is to specify the `strides` argument, which are then forwarded to the underlying DaCe function.
+        The function will only check if enough values were provided, but no further check is performed.
+        The second one is to set `symb_strides` to `True` in which case the function will generate symbols and use them.
+        However, even if symbolic strides are activated, arrays with just one dimensions have always a non symbolic stride.
+        Furthermore, dimensions with shape 1 will always have stride 0.
+
+        By default this function does not update the internal variable map.
+        However, by setting `update_var_mapping` to `True` the function will update the mapping.
+
+        Args:
+            arg:                The Jax object for which a SDFG equivalent should be created.
+            as_transient:        If set, the SDFG variable is a transient, `True` by default.
+            alt_name:            Try to create the variable with this name; either succeed or fail.
+            name_prefix:         If given and in automatic naming mode, add this prefix to the name before anything else.
+            force_array:         Instead of a `dace.Scalar` object create a `dace.Array` object with one element.
+            as_view:             Creates a view instead of an array, if it is a scalar it is silently ignored.
+            strides:            Instead of the default strides use this value for the strides.
+            symb_strides:        Create symbols and use them for fully symbolic strides.
+            find_new_name:        The translator will try to find a new name if the designated is already occupied.
+                                    This does not work if the name was supplied by `alt_name`.
+            allow_literals:      If `True` then also allows JaxLiterals as `arg`.
+            force_jax_name:       If `True` then, the verbatim Jax name will be used.
+            update_var_mapping:   Update the internal variable mapping; by default `False`.
+
+        Notes:
+            If `find_new_name` is `None` the default the function will only look for a new name if there is a need for that.
+                If it is `True` the function will always look for a new name, even if the initial name was fine.
+                If it is `False` the function will never look for a new new, thus if the name is unavailable an error is generated.
+            Specifying `alt_name` implies `find_new_name=False`.
+            The effect of specifying `force_jax_name` is as passing `jutil.get_jax_var_name(arg)` as `alt_name`.
+        """
+        assert all(x is not None  for x in (self._sdfg, self._jax_name_map))
+        shape: Sequence[int] = arg.aval.shape  # Shape of the array
+        offset = None  # i.e. no offset
+        storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
+        is_scalar: bool = shape == ()
+        dtype = self.translate_dtype(arg.aval.dtype)
+
+        if (alt_name is not None) and (not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", alt_name)):
+            raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
+
+        if force_jax_name:
+            if alt_name is not None:
+                raise ValueError(
+                    f"Specified 'force_jax_name' but passed '{alt_name}' as 'alt_name'."
+                )
+            if name_prefix is not None:
+                raise ValueError(
+                    f"Specified 'force_jax_name' and set 'name_prefix' to '{name_prefix}'."
+                )
+            alt_name = jutil.get_jax_var_name(arg)
+        if name_prefix is not None:
+            assert isinstance(name_prefix, str) and (
+                len(name_prefix) > 0
+            ), f"Invalid 'name_prefix': '{name_prefix}'."
+            if alt_name is not None:
+                raise ValueError("Specified 'name_prefix' and 'alt_name' which is not possible.")
+
+        if (symb_strides is None) and (strides is None):
+            symb_strides = False if (len(shape) <= 1) else False
+        if as_view and (not as_transient):
+            raise ValueError("You tried to create a global view, which is not allowed.")
+
+        if isinstance(arg, jcore.Var):
+            prop_name = jutil.get_jax_var_name(
+                arg
+            )  # This is the name that is _suggested_ by the conversion.
+            if (alt_name is None) and prop_name.startswith("__"):
+                raise ValueError(
+                    f"You tried to create the variable '{prop_name}' which starts with two underscores, if you really want to do that use 'alt_name'."
+                )
+            if isinstance(name_prefix, str):
+                prop_name = name_prefix + prop_name
+        elif isinstance(arg, jcore.Literal):
+            if not allow_literals:
+                raise NotImplementedError("Jax Literals are not yet implemented.")
+            if alt_name is None:
+                raise ValueError(f"Passed literal '{arg}', but not specified a name to use.")
+        else:
+            raise TypeError(f"Does not know how to handle '{type(arg).__name__}'.")
+
+        if alt_name is None:
+            # If we are the root translator, then we will use `prop_name` directly;
+            #  if not we will append the revision of `self` to the name.
+            arg_name = prop_name + ("" if self.is_head_translator() else f"_rev_idx{self._rev_idx}")
+        else:
+            arg_name = str(alt_name)
+            find_new_name = False  # If a name was given, then use it no matter what.
+            if arg_name in self._forbidden_names:
+                raise ValueError(f"You used 'alt_name' to create the forbidden name '{alt_name}'.")
+            if arg_name in self._sdfg.arrays:
+                raise ValueError(
+                    f"Tried to create a variable with name '{arg_name}' explicitly, but it is already known."
+                )
+        if find_new_name is None:
+            find_new_name = (arg_name in self._forbidden_names) or (
+                arg_name in self._reserved_names
+            )
+
+        if find_new_name:
+            # We have to find a new name.
+            name_tmpl = "_jax_variable__" + arg_name + "__{}"
+            for iCounter in range(1000):
+                _arg_name = name_tmpl.format(iCounter)
+                if (
+                    (_arg_name in self._forbidden_names)
+                    or (_arg_name in self._reserved_names)
+                    or (_arg_name in self._sdfg.arrays)
+                ):
+                    continue  # The proposed variable is known, so try next value.
+                arg_name = _arg_name  # We found a name that we can use.
+                break
+            else:
+                raise ValueError(f"Failed to find a replacement name for '{arg_name}'")
+            del iCounter, _arg_name
+        elif arg_name in self._forbidden_names:
+            raise ValueError(f"Can not create variable '{arg_name}', name is forbidden.")
+        elif arg_name in self._sdfg.arrays:
+            raise ValueError(f"Can not create variable '{arg_name}', variable is already created.")
+        if not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", arg_name):
+            raise ValueError(f"The requested variable name '{arg_name}' is invalid.")
+
+        # Promotion of scalar to array.
+        if is_scalar and force_array:
+            shape = (1,)
+            symb_strides = False
+            strides = None
+            is_scalar = False
+
+        if strides is not None:
+            if symb_strides:
+                raise ValueError("Specified 'symb_strides' and 'stride at the same time.")
+            if len(strides) != len(shape):
+                raise ValueError(
+                    f"'strides' was '{strides}' it had length {len(strides)}, but the array has rank {len(shape)}."
+                )
+            strides = tuple(strides)
+
+        elif (symb_strides is True) and (not is_scalar):
+            strides = [
+                dace.symbol(f"{arg_name}_stride{dim}", dace.int64) if size >= 2 else 0
+                for dim, size in enumerate(shape)
+            ]
+
+        if is_scalar:
+            self._sdfg.add_scalar(
+                name=arg_name, storage=storage, dtype=dtype, transient=as_transient
+            )
+        elif as_view:
+            self._sdfg.add_view(
+                name=arg_name,
+                shape=shape,
+                strides=strides,
+                offset=offset,
+                storage=storage,
+                dtype=dtype,
+            )
+        else:
+            self._sdfg.add_array(
+                name=arg_name,
+                shape=shape,
+                strides=strides,
+                offset=offset,
+                storage=storage,
+                dtype=dtype,
+                transient=as_transient,
+            )
+
+        if update_var_mapping:
+            self._add_jax_name_mapping(jax_var=arg, sdfg_name=arg_name)
+
+        return arg_name
+
+    def _create_jax_var_list(
+        self,
+        jax_var_list: Sequence[jcore.Atom],
+        prevent_creation: bool = False,
+        only_creation: bool = False,
+        **kwargs: Any,
+    ) -> list[Union[None, str]]:
+        """Creates SDFG variables for the listed Jax variables and returns the SDFG names as a list.
+
+        Before the function will create a variable, by using `_add_array()` with `update_var_mapping=True`,
+        the function will check if the variable is known and no new variable is created.
+        Instead the name of the previously created variable is added to the return value.
+        In case the Jax Atom denotes a literal, no variable will be created, instead `None`
+        will be added to the output list.
+
+        Args:
+            jax_var_list:         The list of Jax variables that should be transformed to SDFG names.
+            prevent_creation:    Never create a variable, indicates that all variables must already exists.
+            only_creation:       Indicates that no variables exists yet and all must be created.
+            kwargs:             In case of variable creation will be forwarded to `self._add_array()` function.
+
+        Notes:
+            Expected input arguments are `jcore.JaxprEqn.invars` or `jcore.JaxprEqn.outvars`.
+            If `only_creation` is set, then literals will cause an error.
+            It is an error to pass the `update_var_mapping` argument.
+        """
+        assert self._jax_name_map is not None
+        if only_creation and prevent_creation:
+            raise ValueError("Specified both 'only_creation' and 'prevent_creation'.")
+
+        ret_list: list[Union[None, str]] = []
+        for jax_var in jax_var_list:
+            if isinstance(jax_var, jcore.Literal):
+                if only_creation:
+                    raise ValueError(f"Requested 'only_creation', but '{jax_var}' is a 'Literal'.")
+                ret_list.append(None)
+            elif isinstance(jax_var, jcore.jax_var):
+                mapped_sdfg_name: Union[str, None] = self.map_jax_var_to_sdfg(
+                    jax_var, allow_fail=True)
+                if mapped_sdfg_name is None:
+                    if prevent_creation:
+                        raise ValueError(
+                            f"Forbid the creation of jaxVariables, but need to create '{jax_var!s}'."
+                        )
+                    ret_list.append(
+                        self._add_array(arg=jax_var, update_var_mapping=True, **kwargs)
+                    )
+                else:
+                    if only_creation:
+                        raise ValueError(
+                            f"Requested 'only_creation', but '{jax_var}' already exists as '{mapped_sdfg_name}'."
+                        )
+                    ret_list.append(mapped_sdfg_name)
+            else:
+                raise ValueError(
+                    f"The translation process is not implemented for '{type(jax_var)}'"
+                )
+
+        return ret_list
+
+    def _create_initial_input(
+        self,
+        jaxpr: jcore.ClosedJaxpr,
+        inp_scalar_as_array: bool,
+    ) -> Sequence[str]:
+        """This function will create the internal input variables that are used for the SDFG.
+
+        Args:
+            jaxpr:              The Jaxpr that we want to translate.
+            inp_scalar_as_array:   Promote scalars to arrays of size one.
+
+        Returns:
+            The list of SDFG variables used as input arguments of `jaxpr` in the same order.
+
+        Notes:
+            This function will fill the internal list of inputs.
+        """
+        assert self.is_allocated()
+        assert len(jaxpr.jaxpr.invars)
+
+        if len(self._sdfg_in_names) != 0:
+            raise RuntimeError("Called '_create_initial_input()' twice?")
+        assert len(self._sdfg_out_names) == 0
+
+        # Handle the initial input arguments
+        sdfg: dace.SDFG = self._sdfg
+        init_in_var_names: Sequence[str] = self._create_jax_var_list(  # type: ignore[assignment]
+            jax_var_list=jaxpr.jaxpr.invars,
+            only_creation=True,
+            as_transient=True,  # Explicit transient; no error!
+            force_array=inp_scalar_as_array,
+            force_jax_name=self.is_head_translator(),  # Ensure head get the pure Jax name.
+        )
+        sdfg.arg_names.extend(init_in_var_names)
+
+        # Store the list of inputs in self; this is done to simplify exporting.
+        #  The output list is either generated by `self._translate_jaxpr_internal()` of `self._handle_null_jaxpr()`.
+        self._sdfg_in_names = tuple(init_in_var_names)
+
+        return init_in_var_names
+
+    def _create_constants(
+        self,
+        jaxpr: jcore.ClosedJaxpr,
+    ) -> Sequence[str]:
+        """Creates all constants requested by the `jaxpr`.
+
+        The function will create an SDFG variable and add them as constant to the SDFG.
+        The value they should have is deepcopied.
+
+        Returns:
+            Names of the SDFG variables created for the constants in the same order.
+        """
+        from copy import deepcopy
+
+        assert self.is_allocated()
+        if not len(jaxpr.consts):
+            return []
+
+        const_names: list[str] = []
+        for cJaxVar, cValue in zip(jaxpr.jaxpr.constvars, jaxpr.consts, strict=False):
+            c_sdfg_name = self._add_array(
+                arg=cJaxVar,
+                name_prefix="__const_",
+                as_transient=True,
+                symb_strides=False,
+                strides=None,
+                update_var_mapping=True,
+            )
+            # We have to pass the data descriptor to `add_constant()`, otherwise a new one would be created.
+            self._sdfg.add_constant(c_sdfg_name, deepcopy(cValue), self._sdfg.arrays[c_sdfg_name])
+            const_names.append(c_sdfg_name)
+        return const_names
+
+    def _allocate_translation_ctx(
+        self,
+        name: str | None = None,
+        reserved_names: str | Collection[str] | None = None,
+    ) -> JaxprTranslationDriver:
+        """This function allocates and initialize the members related to the translation context.
+
+        After this function is called, `self` is said to have an ongoing translation process.
+
+        Args:
+            name:               The name of the SDFG.
+            reserved_names:     Add these name to the set of resered names of `self`.
+
+        Notes:
+            It is not an error, if the reserved names are already allocated.
+                In that case the names passed by `reserved_names` are added to the list already preset.
+        """
+        if self.is_allocated():
+            raise RuntimeError("The translator is already allocated.")
+        if name and (not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", name)):
+            raise ValueError(f"The provided name '{name}' for the SDFG is invalid.")
+
+        self._sdfg = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
+        self._init_sdfg_state = self._sdfg.add_state(label="initial_state", is_start_block=True)
+        self._term_sdfg_state = self._init_sdfg_state
+        self._jax_name_map = {}
+        self._sdfg_in_names = ()
+        self._sdfg_out_names = ()
+
+        # Handle the `reserved_names` argument as described above.
+        #  This is essentially needed that children works properly.
+        if self._reserved_names is None:
+            self._reserved_names = set()
+        elif isinstance(self._reserved_names, set):
+            assert not self.is_head_translator()
+            assert all(isinstance(x, str) for x in self._reserved_names)
+        else:
+            raise RuntimeError("The reserved names are allocated incorrectly.")
+        self._add_reserved_names(reserved_names)
+
+        return self
+
+    def _init_sub_translators(
+        self,
+        kwargs: Mapping[str, Any],
+    ) -> JaxprTranslationDriver:
+        """This function initializes the subtranslator.
+
+        The function forwards `kwargs` to teh constructor of teh subtranslators.
+        However, it will remove all arguments starting with an underscore.
+        """
+        if(isinstance(self._sub_translators, dict)):
+            raise RuntimeError(f"Tried to allocate the internal subtranslators twice.")
+        assert self._sub_translators is None
+
+        # We might get arguments that starts with an underscore, which are not meant for the subtranslators.
+        kwargs = {k: v for k, v in kwargs.items() if not k.startswith("_")}
+
+        # Will contain all subtranslators we create.
+        subtranslators: dict[str, list[translator.JaCeSubTranslatorInterface]] = {}
+
+        # First we will create all subtranslators and partition them.
+        subtranslator_cls: type[translator.JaCeSubTranslatorInterface]
+        for subtranslator_cls in []:
+            subtranslator: translator.JaCeSubTranslatorInterface = subtranslator_cls(**kwargs)
+            handled_primitives: Iterable[str] = jutil.ensure_iterability(
+                subtranslator.getHandledPrimitives()
+            )
+
+            # Now add the subtranslator to the primitives it requests, we will sort them later into the correct order.
+            for handledPrimitive in handled_primitives:
+                subtranslators.setdefault(handledPrimitive, []).append(subtranslator)
+
+        # Now we order the subtranslators for the primitives.
+        self._sub_translators = {
+            prim_name: jtrutil.sort_subtranslators(primSubTranslators)
+            for prim_name, primSubTranslators in subtranslators.items()
+        }
+        return self
+
+    def _clear_translation_ctx(self) -> JaxprTranslationDriver:
+        """This function deallocate the translation context of `self`.
+
+        Notes:
+            While it is allowed for outside code to call this explicitly function, it is is most likely an error.
+            If this function is called on a head translator, then the revision state will be rested.
+                Thus a caller has to make sure that the lifetime of all children has ended.
+            If `self` is not allocated this function acts as a noops.
+            The reserved names are only deallocated if `self` is a head translator.
+        """
+        if not self.is_allocated():
+            return self
+        self._sdfg = None
+        self._init_sdfg_state = None
+        self._term_sdfg_state = None
+        self._jax_name_map = None  # type: ignore[assignment]
+        self._sdfg_in_names = None  # type: ignore[assignment]
+        self._sdfg_out_names = None  # type: ignore[assignment]
+
+        if self.is_head_translator():
+            # We are the head translator thus we reset the revision manager.
+            #  Since this function is only called at the very end, we know that the translation process as a whole has finished.
+            #  We reset the state that the numbers are small again when we start anew.
+            self._rev_manager._reset_state()
+
+            # Freeing the reserved names only for heads make it more safe in case a child translator is reused.
+            #  On the other hand reusing a child translator is discouraged, but not forbidden.
+            self._reserved_names = None  # type: ignore[assignment]
+        return self
+
+    def _find_sub_translator_for(
+        self,
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jcore.JaxprEqn,
+    ) -> translator.JaCeSubTranslatorInterface:
+        """Returns the subtranslator object to translate `eqn`.
+
+        The subtranslators are checked for applicability in the order of their priority.
+        The fist one that accepts the translation will be taken.
+
+        Notes:
+            The arguments are the same as for `JaCeSubTranslatorInterface.can_translate_jaxeqn()`.
+        """
+        assert self._sub_translators is not None
+
+        prim_name: str = eqn.primitive.name
+        if prim_name not in self._sub_translators:
+            raise NotImplementedError(f"No subtranslators known to hanble primitive '{prim_name}'.")
+        subtranslator_canidates = self._sub_translators[prim_name]
+        assert len(subtranslator_canidates) > 0
+
+        subtranslator: translator.JaCeSubTranslatorInterface = None  # type: ignore[assignment]
+        if len(subtranslator_canidates) == 1:
+            subtranslator = next(iter(subtranslator_canidates))
+            assert subtranslator.can_translate_jaxeqn(
+                driver=self, in_var_names=in_var_names,
+                out_var_names=out_var_names, eqn=eqn)
+        else:
+            for subtranslatorCanidate in subtranslator_canidates:
+                if subtranslatorCanidate.can_translate_jaxeqn(
+                    driver=self,
+                    in_var_names=in_var_names,
+                    out_var_names=out_var_names,
+                    eqn=eqn,
+                ):
+                    subtranslator = subtranslatorCanidate
+            else:
+                raise NotImplementedError(f"No subtranslator found for handling '{eqn}'.")
+        return subtranslator
+
+    def _translate_single_eqn(
+        self,
+        jaxpr: jcore.ClosedJaxpr,
+        eqn: jcore.JaxprEqn,
+    ) -> tuple[Sequence[Union[str, None]], Sequence[str]]:
+        """Translate `eqn` into its SDFG equivalent.
+
+        To do this the function will do the following steps:
+        - Assemble the in and output variables.
+        - Select which subtranslator to use.
+        - Create a new empty state, i.e. append to the tentative terminal state.
+        - Perform the actual translation.
+
+        Returns:
+            The SDFG names that where used as input and output are returned.
+            The inputs might contain `None` which indicates that the input was a Jax literal.
+            For more information see `JaCeSubTranslatorInterface.can_translate_jaxeqn()`.
+
+        Notes:
+            While `jaxpr` must be the closed version, `eqn` must come from the unclosed version.
+            The function will also perform some consistency checking.
+        """
+        assert isinstance(eqn, jcore.JaxprEqn) and isinstance(jaxpr, jcore.ClosedJaxpr)
+
+        if len(eqn.effects) != 0:
+            raise NotImplementedError(f"Equation '{eqn}' had side effects.")
+
+        # Input/Output variables
+        in_var_names: Sequence[Union[str, None]] = self._create_jax_var_list(
+            eqn.invars,
+            prevent_creation=True,  # Inputs must already exists.
+        )
+        out_var_names: Sequence[str] = self._create_jax_var_list(  # type: ignore[assignment]
+            eqn.outvars,
+            only_creation=True, # Output must not exist yet.
+        )
+
+        # Find the subtranslator 
+        subtranslator: translator.JaCeSubTranslatorInterface = self._find_sub_translator_for(
+            in_var_names=in_var_names,
+            out_var_names=out_var_names,
+            eqn=eqn,
+        )
+
+        # Create the state into which the equation is put
+        last_term_state: dace.SDFGState = self.get_terminal_sdfg_state()  # noqa: F841 # Will be used later
+        eqn_state = self.append_new_state(
+                label=f"{eqn.primitive.name}_{out_var_names[0]}",
+                prev_state=None,    # Force to append as terminal state.
+        )
+
+        # Now perform the actual translation of the equation.
+        new_sdfg_term_state = subtranslator.translate_jaxeqn(
+            driver=self,
+            in_var_names=in_var_names,
+            out_var_names=out_var_names,  # Might be modified by subtranslator!
+            eqn=eqn,
+            eqn_state=eqn_state,
+        )
+
+        # Determine the new (tentative) terminal state of the SDFG we are building.
+        if new_sdfg_term_state is None:
+            if eqn_state is self._term_sdfg_state:
+                raise RuntimeError("Inconsistent terminal state was detected.")
+            new_sdfg_term_state = eqn_state
+        elif isinstance(new_sdfg_term_state, dace.SDFGState):
+            # TODO(phimuell): use `last_term_state` to test if there is reachability to new end.
+            pass
+        else:
+            raise TypeError(f"Encountered illegal types '{type(new_sdfg_term_state)}'")
+
+        # In case a subtranslator decided to not use the variables we created for it, he is technically
+        #  allowed to create new ones, but he must update the `out_var_names` list.
+        #  We will now test if the mapping was updated correctly.
+        for expectedSDFGName, jax_var in zip(out_var_names, eqn.outvars, strict=False):
+            mapped_sdfg_name = self.map_jax_var_to_sdfg(jax_var)
+            jax_name = jutil.get_jax_var_name(jax_var)
+            if mapped_sdfg_name != expectedSDFGName:
+                raise ValueError(
+                    f"Mapping inconsistency detected, expected that Jax variable '{jax_name}' maps to '{expectedSDFGName}' but it actually maps to '{mapped_sdfg_name}'."
+                )
+
+        # Views can only be used if there is a direct connection, between source, view and destination (place of usage)
+        #  Because of the way how Jax works, it is impossible that an output variable is a View.
+        #  Thus we now make the check if this is the case.
+        for outVarName, jax_var in zip(out_var_names, eqn.outvars, strict=False):
+            sdfg_var = self.get_array(outVarName)
+            if isinstance(sdfg_var, (dace.data.Array, dace.data.Scalar)):
+                pass
+            elif isinstance(sdfg_var, dace.data.View):
+                raise TypeError(
+                    f"For the Jax variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}'), which is an output, you used a View, which is not possible."
+                    + " It must either be an array or a scalar."
+                )
+            else:
+                raise NotImplementedError(
+                    f"The output variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}') is of type '{type(sdfg_var).__name__}' which I does not know how to handle."
+                )
+
+        # Modify terminal head state of 'self'
+        self._term_sdfg_state = new_sdfg_term_state
+
+        return (in_var_names, out_var_names)
+
+    def _translate_jaxpr_internal(
+        self,
+        jaxpr: jcore.ClosedJaxpr,
+    ) -> jtrutil.JaCeTranslationMemento:
+        """Performs the actual translation of the Jaxpr into an SDFG.
+
+        The function assumes that the context is already allocated and the initial variables are already created.
+        The function will ignore, i.e. not translate, any state whose output variables name only consists of `_`.
+
+        The function will store the internal state of `self` into a memento and return it.
+        However, it will not deallocate the context of `self`, thus `self` and the memento share the same context in memory.
+
+        Args:
+            jaxpr:      The Jaxpr to translate.
+
+        Notes:
+            The function will unconditionally handle empty Jaxpr.
+            Jax uses a variable with name `_` to indicate that this value is never read.
+                It is included by some transformations such as `gard()`.
+        """
+        assert isinstance(jaxpr, jcore.ClosedJaxpr)
+        assert self.is_allocated()
+
+        nb_translated_eqn: int = 0
+        for eqn in jaxpr.jaxpr.eqns:  # Translate the equations one by one.
+            assert len(eqn.effects) == 0
+            if len(eqn.outvars) == 0:  # Do we need this special case.
+                continue  #  Looks more like internal Jax error.
+            if any(jutil.get_jax_var_name(outVar) == "_" for outVar in eqn.outvars):
+                assert (len(eqn.outvars) == 1) or all(
+                    jutil.get_jax_var_name(outVar) == "_" for outVar in eqn.outvars
+                )
+                continue
+            _, out_var_names = self._translate_single_eqn(jaxpr=jaxpr, eqn=eqn)
+            nb_translated_eqn += 1
+
+        if nb_translated_eqn != 0:
+            # Equations where translated so set the output variables.
+            self._sdfg_out_names = tuple(out_var_names)
+        else:
+            # No equations were translated, i.e. no equation at all or all outputs had name '_'
+            self._handle_null_jaxpr(jaxpr)
+
+        return self._export_memento()
+
+    def _export_memento(self) -> jtrutil.JaCeTranslationMemento:
+        """Encapsulate the translation context of `self` into a memento.
+
+        This function will not deallocate the internal context of `self`.
+        Thus the memento and `self` share the same context in memory.
+        """
+        assert self.is_allocated()
+        assert len(self._sdfg_in_names) > 0
+        assert all(isinstance(x, str) for x in self._sdfg_in_names)
+        assert len(self._sdfg_out_names) > 0
+        assert all(isinstance(x, str) for x in self._sdfg_out_names)
+
+        return jtrutil.JaCeTranslationMemento(
+            sdfg=self._sdfg,
+            start_state=self._init_sdfg_state,
+            terminal_state=self._term_sdfg_state,
+            jax_name_map=self._jax_name_map,
+            inp_names=self._sdfg_in_names,
+            out_names=self._sdfg_out_names,
+        )
+
+    def _handle_null_jaxpr(
+        self,
+        jaxpr: jcore.ClosedJaxpr,
+    ) -> JaxprTranslationDriver:
+        """This function is called in case a `Jaxpr` with zero equations is encountered.
+
+        Notes:
+            This function will fill the internal list of outputs.
+        """
+        if len(jaxpr.eqns) != 0:
+            raise NotImplementedError("'_handle_null_jaxpr()' was called for a non empty Jaxpr.")
+        if (
+            len(jaxpr.out_avals) == 0
+        ):  # There is not output so we do not have to copy anything around.
+            self._sdfg_out_names = ()
+            return self
+        if self.is_head_translator():
+            # In this case there is nothing to do, because input is already the output.
+            #  However, this is only possible if we are the head translator.
+            self._sdfg_out_names = tuple(
+                self.map_jax_var_to_sdfg(jax_out_var) for jax_out_var in jaxpr.jaxpr.outvars
+            )
+            raise NotImplementedError("Please test me.")
+            return self
+        #
+        assert self._term_sdfg_state is self._init_sdfg_state
+        assert len(self._sdfg_in_names) > 0
+        assert len(self._sdfg_out_names) == 0
+
+        # We will use this list to build the list of output names.
+        #  This is important for the exporter.
+        out_var_names: list[str] = []
+
+        # If we are here then we are dealing with a nested SDFG/Jaxpr.
+        #  Because an input also serves as output, the nested SDFG will have connector pairs
+        #  with the same name, one serving as input the other as output, with the same name.
+        #  This will make node validation fail.
+        #  Thus we have to introduce a some fake output name and explicitly copy the data around.
+        #  Once DaCe will inline the nested SDFG it will remove this intermediate copy.
+        for jax_out_var in jaxpr.jaxpr.outvars:
+            jax_inp_name = jutil.get_jax_var_name(
+                jax_out_var
+            )  # Since output == input their names must be the same.
+            assert self.map_jax_var_to_sdfg(jax_inp_name, allow_fail=True)
+
+            # This is the name we give to fictive Jax variable serving as output.
+            jax_out_name = f"_zero_equation_output_{self.map_jax_var_to_sdfg(jax_out_var)}"
+
+            # Now create the SDFG variable for it, give it a unique name.
+            sdfg_out_name = self._add_array(
+                jax_out_var,
+                as_transient=True,
+                name_prefix="_zero_equation_output_for_",
+                update_var_mapping=False,
+            )
+
+            # We now create a new mapping, we do this that we will later find the variable again.
+            self._add_jax_name_mapping(jax_var=jax_out_name, sdfg_name=sdfg_out_name)
+            out_var_names.append(jax_out_name)
+
+            # Now copy the input into the fake output variable.
+            inp_acc = self._init_sdfg_state.add_read(self.map_jax_var_to_sdfg(jax_inp_name))
+            out_acc = self._init_sdfg_state.add_write(self.map_jax_var_to_sdfg(jax_out_var))
+            self._sdfg_head.add_nedge(
+                src=inp_acc,
+                dst=out_acc,
+                data=dace.Memlet.from_array(
+                    jax_inp_name, self.get_array(self.map_jax_var_to_sdfg(jax_inp_name))
+                ),
+            )
+        # We also have to update the list of outputs.
+        #  This is needed for making the exporter aware of what we are doing.
+        self._sdfg_out_names = tuple(out_var_names)
+        return self
+
+    # fmt: off
+    _forbidden_names: Final[set[str]] = {
+        # These should be most of the C++ keywords, it is more important to have the short ones.
+        #  Taken from 'https://learn.microsoft.com/en-us/cpp/cpp/keywords-cpp?view=msvc-170'
+        'alignas', 'alignof', 'and', 'asm', 'auto', 'bitand', 'bitor', 'bool', 'break', 'case', 'catch',
+        'char', 'class', 'compl', 'concept', 'const', 'consteval', 'constexpr', 'constinit', 'continue',
+        'decltype', 'default', 'delete', 'directive', 'do', 'double', 'else', 'enum', 'explicit', 'export',
+        'extern', 'false', 'float', 'for', 'friend', 'goto', 'if', 'inline', 'int', 'long', 'mutable',
+        'namespace', 'new', 'noexcept', 'not', 'nullptr', 'operator', 'or', 'private', 'protected',
+        'public', 'register', 'requires', 'return', 'short', 'signed', 'sizeof', 'static', 'struct',
+        'switch', 'template', 'this', 'throw', 'true', 'try', 'typedef', 'typeid', 'typename', 'union',
+        'unsigned', 'using', 'virtual', 'void', 'volatile', 'while', 'xor', 'std',
+    }
+    # fmt: on
+
+
diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
new file mode 100644
index 0000000..4efefed
--- /dev/null
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -0,0 +1,3 @@
+"""This module contains all subtranslator implementations.
+"""
+
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
new file mode 100644
index 0000000..3ca33e3
--- /dev/null
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -0,0 +1,363 @@
+"""This module contains the `ALUTranslator` which translates all arithmetic and logic primitives.
+"""
+
+from typing import Union, Any, Final, TYPE_CHECKING, cast
+from typing_extensions import override
+
+
+import jace
+from jace import translator as jtranslator
+from jace.translator import util as jtutil
+
+
+import dace
+
+import jax
+from jax import core as jcore
+import numpy as np
+
+
+if TYPE_CHECKING:
+    from .jaxpr_translator_driver import JaxprTranslationDriver
+
+
+
+class ALUTranslator(jtranslator.JaCeSubTranslatorInterface):
+    """This translator handles all arithmetic and logical operations.
+
+    """
+    __slots__ = ("_unary_ops", "_binary_ops")
+
+    # Contains all translation templates for unarry operations.
+    self.m_unarryOps: Final[dict[str, str]] = {
+            "pos":          "__out0 = +(__in0)",
+            "neg":          "__out0 = -(__in0)",
+            "not":          "__out0 = not (__in0)",
+
+            "floor":        "__out0 = floor(__in0)",
+            "ceil":         "__out0 = ceil(__in0)",
+            "round":        "__out0 = round(__in0)",
+            "abs":          "__out0 = abs(__in0)",
+            "sign":         "__out0 = sign(__in0)",
+
+            "sqrt":         "__out0 = sqrt(__in0)",
+
+            "log":          "__out0 = log(__in0)",
+            "exp":          "__out0 = exp(__in0)",
+            "integer_pow":  "__out0 = (__in0)**({y})",  # 'y' is a parameter of the primitive
+
+            "sin":          "__out0 = sin(__in0)",
+            "asin":         "__out0 = asin(__in0)",
+            "cos":          "__out0 = cos(__in0)",
+            "acos":         "__out0 = acos(__in0)",
+            "tan":          "__out0 = tan(__in0)",
+            "atan":         "__out0 = atan(__in0)",
+            "tanh":         "__out0 = tanh(__in0)",
+    }
+    # Transformation for all binary operations
+    self._binarryOps: Final[dict[str, str]] = {
+            "add":          "__out0 = (__in0)+(__in1)",
+            "add_any":      "__out0 = (__in0)+(__in1)",     # No idea what makes `add_any` differ from `add`
+            "sub":          "__out0 = (__in0)-(__in1)",
+            "mul":          "__out0 = (__in0)*(__in1)",
+            "div":          "__out0 = (__in0)/(__in1)",
+            "rem":          "__out0 = (__in0)%(__in1)",
+
+            "and":          "__out0 = (__in0) and (__in1)",
+            "or":           "__out0 = (__in0) or  (__in1)",
+
+            "pow":          "__out0 = (__in0)**(__in1)",
+            "ipow":         "__out0 = (__in0)**(int(__in1))",
+
+            "min":          "__out0 = min(__in0, __in1)",
+            "max":          "__out0 = max(__in0, __in1)",
+
+            "eq":          "__out0 = __in0 == __in1",
+            "ne":          "__out0 = __in0 != __in1",
+            "ge":          "__out0 = __in0 >= __in1",
+            "gt":          "__out0 = __in0 > __in1",
+            "le":          "__out0 = __in0 <= __in1",
+            "lt":          "__out0 = __in0 < __in1",
+    }
+
+    def __init__(
+            self,
+            **kwargs: Any
+    ) -> None:
+        """Initialize the `ALUTranslator`.
+        """
+        super().__init__(**kwargs)
+    # end def: __init__
+
+
+    @override
+    def get_handled_primitives(self) -> Collection[str] | str:
+        """Returns the list of all known primitives.
+        """
+        return set(self._unary_ops.keys()).union(self._binary_ops.keys())
+
+
+    @override
+    def can_translate_jaxeqn(
+        self,
+        driver: "JaxprTranslationDriver",
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jcore.JaxprEqn,
+    ) -> bool:
+        """Tests if the translator can handle the primitive.
+
+        Notes:
+            A user can generally expect that this function returns `True`.
+        """
+        is_scalar: bool = (len(eqn.outvars[0].aval.shape) == 0)
+        prim_name: str = eqn.primitive.name
+        if(prim_name in self._unary_ops):
+            assert len(eqn.invars) == 1
+        elif(prim_name in self._binary_ops):
+            assert len(eqn.invars) == 2
+        elif(out_var_names[0] is None):
+            return False
+        if(all(x is None  for x in in_var_names)):
+            return False
+        if(len(eqn.effects) != 0):
+            return False
+        return True
+
+
+    @override
+    def translate_jaxeqn(
+        self,
+        driver: "JaxprTranslationDriver",
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jcore.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        """Perform the translation.
+
+        Deepening on the shapes of the input the function will either create a Tasklet or a mapped Tasklet.
+        The translator is able to handle broadcasting with NumPy rules.
+        The function will always perform the translation inside the provided state.
+
+        Args:
+            driver:         The driver object of the translation.
+            in_var_names:   List of the names of the arrays created inside the SDFG for the inpts or 'None' in case of a literal.
+            out_var_names:  List of the names of the arrays created inside the SDFG for the outputs.
+            eqn:            The Jax equation that is translated.
+            eqn_state:      State into which the primitive's SDFG representation is constructed.
+        """
+
+        # All this checks are done to capture corner cases that Jax might do but are not implemented.
+        #  If you find out that Jax will never create something, then remove it.
+        if(not all(invar.aval.shape == ()  for invar, x in zip(eqn.invars, in_var_names) if x is None)):
+            raise NotImplementedError(f"Can not handle Literals that are not scalars.")
+        if(in_var_names[0] is None):
+            raise NotImplementedError(f"Literal can only not be on the right hand side of the operation.")
+        if(not any(invar.aval.shape == eqn.outvars[0].aval.shape  for invar in eqn.invars)):
+            raise NotImplementedError(f"At least input must have the same shape as the output.")
+        if(len(eqn.outvars) != 1):
+            raise NotImplementedError(f"Can only handle one output (Eq: '{eqn}'.")
+
+        # Determine what kind of input we got and how we should proceed.
+        is_scalar = (len(eqn.outvars[0].aval.shape) == 0)
+        inp_scalars = [len(Inp.aval.shape) == 0  for i, Inp in enumerate(eqn.invars)]
+        has_scalars_as_inputs = any(inp_scalars)
+        only_scalars_as_inputs = all(inp_scalars)
+        has_some_literals = any([x is None  for x in in_var_names])
+        only_literals_as_inputs = all([x is None  for x in in_var_names])
+        inps_same_shape   = all([eqn.invars[0].aval.shape == eqn.invars[i].aval.shape  for i in range(1, len(eqn.invars))])
+
+        # We will now look which dimensions have to be broadcasted on which operator.
+        #  I.e. in the dimensions in the lists below there will be no map iteration index.
+        dims_to_bcastl: Sequence[int] = []
+        dims_to_bcastr: Sequence[int] = []
+
+        # Determine if and if yes how we have to broadcast.
+        if(is_scalar):
+            # The output is a scalar, in which case we must have only scalar input as well.
+            #  Furthermore, we can have the situation that only Literals are the input.
+            assert (not is_scalar) or only_scalars_as_inputs
+            assert (not is_scalar) or only_literals_as_inputs
+
+        elif(only_literals_as_inputs):
+            raise NotImplementedError(f"Only literals an input is only allowed for the scalar case.")
+
+        elif(inps_same_shape):
+            pass
+
+        elif(has_some_literals or has_scalars_as_inputs):
+            # This is essentially array plus scalar, but in two possibilities.
+            #  We either have a scalar variable or we have a scalar literal.
+            assert (not has_some_literals) or all(invar.aval.shape == eqn.outvars[0].aval.shape  for (invar, x) in zip(eqn.invars, in_var_names) if x is not None)
+            assert (not has_scalars_as_inputs) or all(invar.aval.shape in {eqn.outvars[0].aval.shape, ()}  for (invar, x) in zip(eqn.invars, in_var_names) if x is not None)
+
+        elif(len(in_var_names) != 2):
+            raise ValueError(f"Can only do broadcasting if there are two operands.")
+
+        else:
+            # This is the general broadcasting case
+            #  We assume that both inputs and the output have the same rank but different sizes in each dimension.
+            #  It seems that Jax ensures this.
+            #  We further assume that if the size in a dimension differs then one must have size 1.
+            #  This is the size we broadcast over, i.e. conceptually replicated.
+            out_shp  = tuple(eqn.outvars[0].aval.shape)  # Shape of the output.
+            inp_shpl = tuple(eqn.invars[0].aval.shape)   # Shape of the left/first input
+            inp_shpr = tuple(eqn.invars[1].aval.shape)   # Shape of the right/second input; this must be "expanded"
+
+            if(not ((len(inp_shpl) == len(inp_shpr)) and (len(out_shp) == len(inp_shpr)))):
+                raise NotImplementedError("Can not broadcast over different ranks.")
+
+            for dim in reversed(range(len(out_shp))):
+                shp_lft = inp_shpl[dim]
+                shp_rgt = inp_shpr[dim]
+
+                if(shp_lft == shp_rgt):
+                    assert out_shp[dim] == shp_lft
+                elif(shp_lft == 1):
+                    assert shp_rgt == out_shp[dim]
+                    dims_to_bcastl.append(dim)
+                elif(shp_rgt == 1):
+                    assert shp_lft == out_shp[dim]
+                    dims_to_bcastr.append(dim)
+                else:
+                    raise ValueError(f"Invalid shapes in dimension {dim} for broadcasting.")
+
+        # Now we create the Tasklet into which we solve the equation.
+        tskl_code: str = self._writeTaskletCode(in_var_names, eqn)
+        tskl_name: str = eqn.primitive.name
+        tskl_map_ranges: list[tuple[str, str]] = [
+                (f'__i{dim}', f'0:{N}')
+                for dim, N in enumerate(eqn.outvars[0].aval.shape)
+        ]
+        tskl_outputs: list[Union[tuple[str, dace.Memlet]], tuple[None, None]] = []
+        tskl_inputs: list[tuple[str, dace.Memlet]] = []
+
+        # Generate the Memlets for the input.
+        for i, dims_to_bcast in zip(range(len(eqn.invars)), [dims_to_bcastl, dims_to_bcastr]):
+            if(in_var_names[i] is None):
+                # Litteral: No input needed.
+                tskl_inputs.append((None, None))
+                continue
+            elif(inp_scalars[i]):
+                # We have a scalar argument.
+                i_memlet = dace.Memlet.from_array(in_var_names[i], translator.getSDFG().arrays[in_var_names[i]])
+            else:
+                # We have an array argument.
+                inputs_: list[str] = []
+                for dim, (map_var, _) in enumerate(tskl_map_ranges):
+                    if(dim in dims_to_bcast):
+                        inputs_.append('0')
+                    else:
+                        inputs_.append(str(map_var))
+                i_memlet: dace.Memlet = dace.Memlet.simple(in_var_names[i], ", ".join(tInputs_))
+                del inputs_
+            tskl_inputs.append( (f'__in{i}', i_memlet) )
+
+        # Now generate the Memlets for the outputs
+        if(is_scalar):
+            tskl_outputs.append( (f'__out{i}', dace.Memlet.from_array(out_var_names[0], translator.getSDFG().arrays[out_var_names[i]])) )
+        else:
+            tskl_outputs.append( (f'__out{i}', dace.Memlet.simple(out_var_names[0], ', '.join([X[0]  for X in tskl_map_ranges]))) )
+
+        if(is_scalar):
+            tskl_tasklet = eqn_state.add_tasklet(
+                    tskl_name,
+                    list_to_dict(tskl_inputs).keys(),
+                    list_to_dict(tskl_outputs).keys(),
+                    tskl_code,
+            )
+            for in_var, (in_connector, in_memlet)  in filter(lambda X: X[0] is not None, zip(in_var_names, tskl_inputs)):
+                eqn_state.add_edge(
+                        eqn_state.add_read(in_var),
+                        None,
+                        tskl_tasklet,
+                        in_connector,
+                        in_memlet,
+                )
+            for out_var, (out_connector, out_memlet) in zip(out_var_names, tskl_outputs):
+                out = eqn_state.add_write(oVar)
+                eqn_state.add_edge(
+                        tskl_tasklet,
+                        out_connector,
+                        eqn_state.add_write(oVar),
+                        None,
+                        out_memlet,
+                )
+        else:
+            eqn_state.add_mapped_tasklet(
+                name=tskl_name,
+                map_ranges=jtutil.list_to_dict(tskl_map_ranges),
+                inputs=jtutil.list_to_dict(tskl_inputs),
+                code=tskl_code,
+                outputs=jtutil.list_to_dict(tskl_outputs),
+                external_edges=True,
+            )
+
+        return eqn_state
+
+
+    def _writeTaskletCode(
+            self,
+            in_var_names: list[Union[str, None]],
+            eqn: JaxprEqn,
+    ):
+        """This function generates the Tasklet code based on a primitive.
+
+        The function will also perform literal substitution and parameter handling.
+
+        Args:
+            in_var_names:   The list of SDFG variables used as input.
+        """
+        t_name = eqn.primitive.name
+        if("integer_pow" == t_name):
+            # INTEGER POWER
+            exponent = int(eqn.params['y'])
+            if(exponent == 0):
+                t_code = f"__out0 = dace.{str(eqn.outvars[0].aval.dtype)}(1)"
+            elif(exponent == 1):
+                t_code = "__out0 = __in0"
+            elif(exponent == 2):
+                t_code = "__out0 = __in0 * __in0"
+            elif(exponent == 3):
+                t_code = "__out0 = (__in0 * __in0) * __in0"
+            elif(exponent == 4):
+                t_code = "__tmp0 = __in0 * __in0\n__out0 = __tmp0 * __tmp0"
+            elif(exponent == 5):
+                t_code = "__tmp0 = __in0 * __in0\n__tmp1 = __tmp0 * __tmp0\n__out0 = __tmp1 * __in0"
+            else:
+                t_code = self.m_unarryOps[t_name]
+
+        else:
+            # GENERAL CASE
+            if(t_name in self._unary_ops):
+                t_code = self._unary_ops[t_name]
+            elif(t_name in self._binary_ops):
+                t_code = self._binary_ops[t_name]
+
+        # Now we handle Literal substitution
+        for i, in_var_name in enumerate(in_var_names):
+            if(in_var_name is not None):
+                continue
+
+            jax_in_var: jcore.Literal = cast(jcore.Literal, eqn.invars[i])
+            if(jax_in_var.aval.shape == ()):
+                t_val = jax_in_var.val
+                if(isinstance(t_val, np.ndarray)):
+                    t_val = jax_in_var.val.max() # I do not know a better way in that case
+                t_code = t_code.replace(f"__in{i}", str(t_val))
+            else:
+                raise ValueError(f"Can not handle the literal case of shape: {jax_in_var.aval.shape}")
+
+        # Now replace the parameters
+        if(len(eqn.params) != 0):
+            t_code = t_code.format(**eqn.params)
+
+        return t_code
+
+
+
+
+
+
+
diff --git a/src/jace/translator/util/__init__.py b/src/jace/translator/util/__init__.py
new file mode 100644
index 0000000..fb3eee6
--- /dev/null
+++ b/src/jace/translator/util/__init__.py
@@ -0,0 +1,17 @@
+# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Subpackage containing all utilities related to the translators."""
+
+from __future__ import annotations
+
+from .jace_translation_memento import JaCeTranslationMemento
+from .revision_counter import RevisionCounterManager
+from .subtranslator_helper_order import sort_subtranslators
+from .util import list_to_dict
+
+
diff --git a/src/jace/translator/util/jace_translation_memento.py b/src/jace/translator/util/jace_translation_memento.py
new file mode 100644
index 0000000..62ad230
--- /dev/null
+++ b/src/jace/translator/util/jace_translation_memento.py
@@ -0,0 +1,79 @@
+# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+from __future__ import annotations
+
+from collections.abc import Mapping, Sequence
+from dataclasses import dataclass
+from typing import Any
+
+import dace
+
+
+@dataclass(init=True, repr=True, eq=False, frozen=True, kw_only=True, slots=True)
+class JaCeTranslationMemento:
+    """Encapsulates the result of a translation run of the 'JaxprTranslationDriver' object.
+
+    It defines the following members:
+    - 'sdfg' the SDFG object that was created.
+    - 'start_state' the first state in the SDFG state machine.
+    - 'terminal_state' the last state in the state machine.
+    - 'jax_name_map' a 'dict' that maps every Jax name to its corresponding SDFG variable name.
+    - 'inp_names' a 'list' of the SDFG variables that are used as input, in the same order as 'Jaxpr.invars'.
+    - 'out_names' a 'list' of the SDFG variables that are used as output, in the same order as 'Jaxpr.outvars'.
+    """
+
+    sdfg: dace.SDFG
+    start_state: dace.SDFGState
+    terminal_state: dace.SDFGState
+    jax_name_map: Mapping[str, str]
+    inp_names: Sequence[str]
+    out_names: Sequence[str]
+
+    def validate(self) -> bool:
+        """Validate the underlying SDFG."""
+
+        # To prevent the 'non initialized' data warnings we have to temporary promote the input arguments as global.
+        org_trans_state: dict[str, bool] = {}
+        for var in self.inp_names:
+            org_trans_state[var] = self.sdfg.arrays[var].transient
+            self.sdfg.arrays[var].transient = False
+        try:
+            self.sdfg.validate()
+        finally:
+            for var, orgValue in org_trans_state.items():
+                self.sdfg.arrays[var].transient = orgValue
+        return True
+
+    def __getitem__(self, idx: str) -> Any:
+        """Allows member access using brackets."""
+        if not isinstance(idx, str):
+            raise TypeError(f"Expected 'idx' as 'str' but got '{type(str)}'")
+        if not hasattr(self, idx):
+            raise KeyError(f"The key '{idx}' is not known.")
+        return getattr(self, idx)
+
+    def __hash__(self) -> int:
+        """Computes the hash of the underlying SDFG object."""
+        return hash(self.sdfg)
+
+    def __eq__(self, other: Any) -> bool:
+        """Compares the underlying SDFG object with 'rhs'."""
+        if isinstance(other, JaCeTranslationMemento):
+            return bool(self.sdfg == other.sdfg)
+        elif hasattr(other, "__sdfg__"):
+            other = other.__sdfg__()
+        elif isinstance(other, dace.SDFG):
+            pass
+        else:
+            return NotImplemented
+        #
+
+        x: bool = self.sdfg.__eq__(other)
+        return x
+
+
+# end class(JaCeTranslationMemento):
diff --git a/src/jace/translator/util/revision_counter.py b/src/jace/translator/util/revision_counter.py
new file mode 100644
index 0000000..7f19a76
--- /dev/null
+++ b/src/jace/translator/util/revision_counter.py
@@ -0,0 +1,55 @@
+# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+from __future__ import annotations
+
+from typing import Final
+
+
+class RevisionCounterManager:
+    """This class acts as a manager for revision counters.
+
+    It is intended as a shared object and each new object that needs a revision,
+    simply calls 'assign_revision()' to get the new one.
+    """
+
+    __slots__ = ("_next_revision",)
+
+    """The revision value of the very first call to 'assign_revision()'.
+    This revision is only assigned once."""
+    ROOT_REVISION: Final[int] = 0
+
+    def __init__(self) -> None:
+        """Creates a revision counter manager."""
+        self._next_revision = self.ROOT_REVISION
+
+    def assign_revision(self) -> int:
+        """Returns a revision number and advance self."""
+        ret = self._next_revision
+        self._next_revision += 1
+        return ret
+
+    def _reset_state(self) -> RevisionCounterManager:
+        """This function sets the revision counter back.
+
+        Notes:
+            Calling this function is almost always an error.
+            This function does not restore the state right after initialization, but one call after 'assign_revision()'.
+                This is done to ensure that there is one single initial revision.
+        """
+        self._next_revision = self.ROOT_REVISION
+        _ = self.assign_revision()  # Ensure that we throw away the root
+        return self
+
+    def is_root_revision(
+        self,
+        rev: int,
+    ) -> bool:
+        """This function checks if 'rev' revers to the (absolute) unique revision of the root."""
+        return rev == self.ROOT_REVISION
+
+
+# end class(RevisionCounterManager):
diff --git a/src/jace/translator/util/subtranslator_helper_order.py b/src/jace/translator/util/subtranslator_helper_order.py
new file mode 100644
index 0000000..1b52d81
--- /dev/null
+++ b/src/jace/translator/util/subtranslator_helper_order.py
@@ -0,0 +1,79 @@
+# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+from __future__ import annotations
+
+from collections.abc import Sequence
+
+from jace import translator
+
+
+def sort_subtranslators(
+    subtranslators: Sequence[translator.JaCeSubTranslatorInterface],
+) -> Sequence[translator.JaCeSubTranslatorInterface]:
+    """Orders the subtranslators according to their priorities.
+
+    The function ensures the following:
+    - All subtranslators that have default priority are at the end.
+    - All subtranslators whose 'get_priority()' returns 'NotImplemented' are at the begin of the list.
+        These subtranslators are ordered according to their '__lt__()' function.
+    - All subtranslators whose 'get_priority()' function returns an integer are in the middle,
+        ordered according to this value.
+    """
+    if len(subtranslators) <= 1:
+        return subtranslators
+    subtranslators = [
+        subtranslator.get()
+        for subtranslator in sorted(map(_SubtranslatorOrderingHelper, subtranslators))
+    ]
+    assert (len(subtranslators) <= 1) or all(
+        subtranslators[i - 1].has_default_priority() <= subtranslators[i].has_default_priority()
+        for i in range(1, len(subtranslators))
+    )
+    return subtranslators
+
+
+class _SubtranslatorOrderingHelper:
+    """This is a helper class that is used by 'JaxprTranslationDriver' to bring the subtranslators in the correct order.
+
+    Essentially it is a wrapper around a subtranslator that handles the different ordering correct.
+    """
+
+    def __init__(self, subtranslator: translator.JaCeSubTranslatorInterface):
+        assert isinstance(subtranslator, translator.JaCeSubTranslatorInterface)
+        self._sub = subtranslator
+
+    def get(self) -> translator.JaCeSubTranslatorInterface:
+        return self._sub
+
+    def __lt__(
+        self,
+        other: _SubtranslatorOrderingHelper,
+    ) -> bool:
+        # Default priority means that it will always go to the end.
+        if self._sub.has_default_priority():
+            return False  # 'self' has default priority, so it must go to the end.
+        elif other._sub.has_default_priority():
+            return True  # 'self' does not have default prio, thus it _must_ go before 'other'.
+        # Get the priorities of the subtranslators.
+        prio_self = self._sub.get_priority()
+        prio_other = other._sub.get_priority()
+        if all(prio is NotImplemented for prio in (prio_self, prio_other)):
+            # Both does not have an explicit priority, thus 'self' should decide if it should go first.
+            x = self._sub.__lt__(other._sub)
+            assert isinstance(x, bool)
+            return x
+        # In case only one has a priority, we change the order such that the one that implements a custom '__lt__()' goes first.
+        #  This is consistent with the description of the interface telling that such translators are biased towards lower priorities.
+        if prio_self is NotImplemented:
+            assert isinstance(prio_other, int)
+            return True
+        elif prio_other is NotImplemented:
+            assert isinstance(prio_self, int)
+            return False
+        # Both have a priority
+        assert all(isinstance(prio, int) for prio in (prio_other, prio_self))
+        return prio_self < prio_other
diff --git a/src/jace/translator/util/util.py b/src/jace/translator/util/util.py
new file mode 100644
index 0000000..574efad
--- /dev/null
+++ b/src/jace/translator/util/util.py
@@ -0,0 +1,15 @@
+"""Contains all general helper functions needed inside the translator.
+"""
+
+from typing import Union, Any
+
+def list_to_dict(
+        inp: list[Union[tuple[None, Any], tuple[Any, Any]]]
+) -> dict[Any, Any]:
+    """This method turns a `list` of pairs into a `dict` and applies a `None` filter.
+
+    The function will only include pairs whose key, i.e. first element is not `None`.
+    """
+    return {k:v  for k, v in inp if k is not None}
+# end def: ListToDict
+
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
new file mode 100644
index 0000000..703ad85
--- /dev/null
+++ b/src/jace/util/__init__.py
@@ -0,0 +1,22 @@
+# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Global utility package for the jax to dace translator."""
+
+from __future__ import annotations
+
+from .jax import get_jax_var_name
+from .traits import is_iterable, is_str
+from .util import ensure_iterability
+
+
+__all__ = [
+    "get_jax_var_name",
+    "is_str",
+    "is_iterable",
+    "ensure_iterability",
+]
diff --git a/src/jace/util/dace.py b/src/jace/util/dace.py
new file mode 100644
index 0000000..1e9b874
--- /dev/null
+++ b/src/jace/util/dace.py
@@ -0,0 +1,13 @@
+# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements all utility functions that are related to DaCe.
+
+Most of the functions defined here allow an unified access to DaCe's internals in a consistent and centralized way.
+"""
+
+from __future__ import annotations
diff --git a/src/jace/util/jax.py b/src/jace/util/jax.py
new file mode 100644
index 0000000..6e0c1a5
--- /dev/null
+++ b/src/jace/util/jax.py
@@ -0,0 +1,43 @@
+# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements all utility functions that are related to Jax.
+
+Most of the functions defined here allow an unified access to Jax' internals in a consistent and centralized way.
+"""
+
+from __future__ import annotations
+
+import jax.core as jcore
+
+
+def get_jax_var_name(jax_var: jcore.Atom | str) -> str:
+    """Returns the name of the Jax variable as a string.
+
+    Args:
+        jax_var:     The variable to stringify.
+
+    Todos:
+        Implement a regex check for the name.
+    """
+    if isinstance(jax_var, jcore.DropVar):
+        return "_"
+    if isinstance(jax_var, jcore.Atom):
+        jax_name = str(jax_var)  # This only works up to some version
+    elif isinstance(jax_var, str):
+        jax_name = jax_var
+    else:
+        raise TypeError(
+            f"Does not know how to transform '{jax_var}' (type: '{type(jax_var).__name__}') into a string."
+        )
+    # TODO(phimuell): Add regex to ensure that the name is legit.
+    assert isinstance(jax_name, str)
+    if len(jax_name) == 0:
+        raise ValueError(
+            f"Failed to translate the Jax variable '{jax_var}' into a name, the result was empty."
+        )
+    return jax_var
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
new file mode 100644
index 0000000..b791cb8
--- /dev/null
+++ b/src/jace/util/traits.py
@@ -0,0 +1,66 @@
+# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Common functionality to identify types of objects."""
+
+from __future__ import annotations
+
+from typing import Any, Sequence
+
+
+def is_str(
+    *args: Sequence[Any],
+    allow_empty: bool = True,
+) -> bool:
+    """Tests if its arguments are strings.
+
+    By default empty strings are also considered as strings.
+    However, by setting 'allow_empty' to 'False' the function will consider them not as string.
+    In case no arguments were passed to the function 'False' will be returned.
+    """
+    if len(args) == 0:
+        return False
+
+    elif allow_empty:
+        for x in args:
+            if not isinstance(x, str):
+                return False  # Not a string
+        # end for(x):
+    else:
+        for x in args:
+            if not isinstance(x, str):
+                return False  # Not a string
+            if len(x) == 0:
+                return False  # A string but empty; and check enabled
+        # end for(x):
+    # end if:
+
+    return True
+
+
+def is_iterable(
+    x: Any,
+    ign_str: bool = True,
+) -> bool:
+    """Test if 'x' is iterable, with an exception for strings.
+
+    By default this function considers strings as not iterable.
+    The idea is that a string is in most cases not a collection of individual characters, but should be seen as a whole.
+    However, by setting 'ign_str' to 'False' a string is also considered as an iterable.
+
+    Args:
+        x:          The object to check.
+        ign_str:     Ignore strings, defaults to 'True'.
+    """
+    from collections.abc import Iterable
+
+    # We do not consider strings as iterable.
+    if ign_str and is_str(x):
+        return False
+
+    # Based on: https://stackoverflow.com/questions/1952464/in-python-how-do-i-determine-if-an-object-is-iterable/61139278
+    return isinstance(x, Iterable)
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
new file mode 100644
index 0000000..2c1af01
--- /dev/null
+++ b/src/jace/util/util.py
@@ -0,0 +1,39 @@
+# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+from __future__ import annotations
+
+from collections.abc import Iterable
+from typing import Any
+
+
+def ensure_iterability(
+    x: Any,
+    dcyp: bool = False,
+    scyp: bool = False,
+    ign_str: bool = True,
+) -> Iterable[Any]:
+    """Ensures that 'x' is iterable.
+
+    By default a string is _not_ considered as a sequence of chars but as one object.
+
+    Args:
+        x:          To test.
+        dcyp:       Perform a deep copy on the reurned object, takes precedence.
+        scyp:       Perform a shallow copy on the returned object.
+        ign_str:    Ignore that a string is iterabile.
+    """
+    import copy
+
+    if ign_str and isinstance(x, str):
+        x = [x]  # Turn a string into an interable
+    elif isinstance(x, Iterable):
+        pass  # Already an iterable
+    if dcyp:
+        x = copy.deepcopy(x)
+    elif scyp:
+        x = copy.copy(x)
+    return x
diff --git a/tests/test_subtranslator_helper_order.py b/tests/test_subtranslator_helper_order.py
new file mode 100644
index 0000000..a0965b6
--- /dev/null
+++ b/tests/test_subtranslator_helper_order.py
@@ -0,0 +1,130 @@
+"""Implements tests to check if the sorting algorithm is correct.
+"""
+
+from typing                     import Collection, Sequence, Union
+
+import jace
+from jace   import translator as jtrans
+
+
+def test_subtranslatior_order_simple():
+    """This test is to ensure that `sortSubtranslators()` works correctly.
+    """
+    from jace.translator.util.subtranslator_helper_order import  sort_subtranslators
+
+    class SimpleSubTrans1(jtrans.JaCeSubTranslatorInterface):
+        _EXP_ORDER = 0
+        def __init__(self, *args, **kwargs):
+            super().__init__(*args, **kwargs)
+        def getPriority(self):
+            return 1
+    # end class(SimpleSubTrans1):
+
+    class SimpleSubTrans2(jtrans.JaCeSubTranslatorInterface):
+        _EXP_ORDER = 1  # Not last because, default prio is always last.
+        def __init__(self, *args, **kwargs):
+            super().__init__(*args, **kwargs)
+        def getPriority(self):
+            return jtrans.JaCeSubTranslatorInterface.DEFAULT_PRIORITY + 1
+    # end class(SimpleSubTrans2):
+
+    class SimpleSubTrans3(jtrans.JaCeSubTranslatorInterface):
+        _EXP_ORDER = 2
+        def __init__(self, *args, **kwargs):
+            super().__init__(*args, **kwargs)
+    # end class(SimpleSubTrans3):
+
+    initialOrder = [
+            SimpleSubTrans3(),
+            SimpleSubTrans2(),
+            SimpleSubTrans1(),
+    ]
+
+    # Now call the function.
+    sortedTranslators = sortSubtranslators(initialOrder)
+
+    # Now we bring the list in expected order.
+    expectedOrder = sorted(initialOrder, key=lambda st: st._EXP_ORDER)
+
+    assert all(ist is soll  for ist, soll in zip(sortedTranslators, expectedOrder)), \
+            f"Expected order was `{[type(x).__name__  for x in expectedOrder]}`, but got `{[type(x).__name__  for x in sortedTranslators]}`."
+    return True
+# end def: test_subtranslatior_order_simple
+
+
+def test_subtranslatior_order_custom1():
+    from Jax2DaCe.translator.util._subtranslator_helper_order       import sortSubtranslators
+
+    class SimpleSubTrans1(jtrans.JaCeSubTranslatorInterface):
+        _EXP_ORDER = 0
+        def __init__(self, *args, **kwargs):
+            super().__init__(*args, **kwargs)
+        def getPriority(self):
+            return NotImplemented
+        def __lt__(self, other):
+            return isinstance(other, SimpleSubTrans2)
+    # end class(SimpleSubTrans1):
+
+    class SimpleSubTrans2(jtrans.JaCeSubTranslatorInterface):
+        _EXP_ORDER = 1
+        def __init__(self, *args, **kwargs):
+            super().__init__(*args, **kwargs)
+        def getPriority(self):
+            return NotImplemented
+        def __lt__(self, other):
+            return True
+    # end class(SimpleSubTrans2):
+
+    class SimpleSubTrans3(jtrans.JaCeSubTranslatorInterface):
+        _EXP_ORDER = 2
+        def __init__(self, *args, **kwargs):
+            super().__init__(*args, **kwargs)
+        def getPriority(self):
+            return NotImplemented
+        def __lt__(self, other):
+            return False
+    # end class(SimpleSubTrans3):
+
+    class SimpleSubTrans4(jtrans.JaCeSubTranslatorInterface):
+        _EXP_ORDER = 3
+        def __init__(self, *args, **kwargs):
+            super().__init__(*args, **kwargs)
+        def getPriority(self):
+            return jtrans.JaCeSubTranslatorInterface.DEFAULT_PRIORITY + 1
+    # end class(SimpleSubTrans4):
+
+    class SimpleSubTrans5(jtrans.JaCeSubTranslatorInterface):
+        _EXP_ORDER = 4
+        def __init__(self, *args, **kwargs):
+            super().__init__(*args, **kwargs)
+    # end class(SimpleSubTrans5):
+
+    assert SimpleSubTrans2() < SimpleSubTrans1()
+
+    initialOrder = [
+            SimpleSubTrans5(),
+            SimpleSubTrans4(),
+            SimpleSubTrans3(),
+            SimpleSubTrans2(),
+            SimpleSubTrans1(),
+    ]
+
+    # Now call the function.
+    sortedTranslators = sortSubtranslators(initialOrder)
+
+    # Now we bring the list in expected order.
+    expectedOrder = sorted(initialOrder, key=lambda st: st._EXP_ORDER)
+
+    assert all(ist is soll  for ist, soll in zip(sortedTranslators, expectedOrder)), \
+            f"Expected order was `{[type(x).__name__  for x in expectedOrder]}`, but got `{[type(x).__name__  for x in sortedTranslators]}`."
+    return True
+# end def: test_subtranslatior_order_custom1
+
+
+if "__main__" == __name__:
+    test_subtranslatior_order_simple()
+    test_subtranslatior_order_custom1()
+# end(main):
+
+
+

From f7f9fcfd02f2e0cdddab7f5ae762bbbcef5eb6b2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 07:22:21 +0200
Subject: [PATCH 003/458] Also added a test.

---
 tests/test_subtranslator_helper_order.py | 34 ++++++++++++------------
 1 file changed, 17 insertions(+), 17 deletions(-)

diff --git a/tests/test_subtranslator_helper_order.py b/tests/test_subtranslator_helper_order.py
index a0965b6..ed35cc6 100644
--- a/tests/test_subtranslator_helper_order.py
+++ b/tests/test_subtranslator_helper_order.py
@@ -16,7 +16,7 @@ class SimpleSubTrans1(jtrans.JaCeSubTranslatorInterface):
         _EXP_ORDER = 0
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
-        def getPriority(self):
+        def get_priority(self):
             return 1
     # end class(SimpleSubTrans1):
 
@@ -24,7 +24,7 @@ class SimpleSubTrans2(jtrans.JaCeSubTranslatorInterface):
         _EXP_ORDER = 1  # Not last because, default prio is always last.
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
-        def getPriority(self):
+        def get_priority(self):
             return jtrans.JaCeSubTranslatorInterface.DEFAULT_PRIORITY + 1
     # end class(SimpleSubTrans2):
 
@@ -34,32 +34,32 @@ def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
     # end class(SimpleSubTrans3):
 
-    initialOrder = [
+    initial_order = [
             SimpleSubTrans3(),
             SimpleSubTrans2(),
             SimpleSubTrans1(),
     ]
 
     # Now call the function.
-    sortedTranslators = sortSubtranslators(initialOrder)
+    sorted_translators = sort_subtranslators(initial_order)
 
     # Now we bring the list in expected order.
-    expectedOrder = sorted(initialOrder, key=lambda st: st._EXP_ORDER)
+    expected_order = sorted(initial_order, key=lambda st: st._EXP_ORDER)
 
-    assert all(ist is soll  for ist, soll in zip(sortedTranslators, expectedOrder)), \
-            f"Expected order was `{[type(x).__name__  for x in expectedOrder]}`, but got `{[type(x).__name__  for x in sortedTranslators]}`."
+    assert all(ist is soll  for ist, soll in zip(sorted_translators, expected_order)), \
+            f"Expected order was `{[type(x).__name__  for x in expected_order]}`, but got `{[type(x).__name__  for x in sorted_translators]}`."
     return True
 # end def: test_subtranslatior_order_simple
 
 
 def test_subtranslatior_order_custom1():
-    from Jax2DaCe.translator.util._subtranslator_helper_order       import sortSubtranslators
+    from jace.translator.util.subtranslator_helper_order import  sort_subtranslators
 
     class SimpleSubTrans1(jtrans.JaCeSubTranslatorInterface):
         _EXP_ORDER = 0
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
-        def getPriority(self):
+        def get_priority(self):
             return NotImplemented
         def __lt__(self, other):
             return isinstance(other, SimpleSubTrans2)
@@ -69,7 +69,7 @@ class SimpleSubTrans2(jtrans.JaCeSubTranslatorInterface):
         _EXP_ORDER = 1
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
-        def getPriority(self):
+        def get_priority(self):
             return NotImplemented
         def __lt__(self, other):
             return True
@@ -79,7 +79,7 @@ class SimpleSubTrans3(jtrans.JaCeSubTranslatorInterface):
         _EXP_ORDER = 2
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
-        def getPriority(self):
+        def get_priority(self):
             return NotImplemented
         def __lt__(self, other):
             return False
@@ -89,7 +89,7 @@ class SimpleSubTrans4(jtrans.JaCeSubTranslatorInterface):
         _EXP_ORDER = 3
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
-        def getPriority(self):
+        def get_priority(self):
             return jtrans.JaCeSubTranslatorInterface.DEFAULT_PRIORITY + 1
     # end class(SimpleSubTrans4):
 
@@ -101,7 +101,7 @@ def __init__(self, *args, **kwargs):
 
     assert SimpleSubTrans2() < SimpleSubTrans1()
 
-    initialOrder = [
+    initial_order = [
             SimpleSubTrans5(),
             SimpleSubTrans4(),
             SimpleSubTrans3(),
@@ -110,13 +110,13 @@ def __init__(self, *args, **kwargs):
     ]
 
     # Now call the function.
-    sortedTranslators = sortSubtranslators(initialOrder)
+    sorted_translators = sort_subtranslators(initial_order)
 
     # Now we bring the list in expected order.
-    expectedOrder = sorted(initialOrder, key=lambda st: st._EXP_ORDER)
+    expected_order = sorted(initial_order, key=lambda st: st._EXP_ORDER)
 
-    assert all(ist is soll  for ist, soll in zip(sortedTranslators, expectedOrder)), \
-            f"Expected order was `{[type(x).__name__  for x in expectedOrder]}`, but got `{[type(x).__name__  for x in sortedTranslators]}`."
+    assert all(ist is soll  for ist, soll in zip(sorted_translators, expected_order)), \
+            f"Expected order was `{[type(x).__name__  for x in expected_order]}`, but got `{[type(x).__name__  for x in sorted_translators]}`."
     return True
 # end def: test_subtranslatior_order_custom1
 

From 4e24c0e3dc07d71572d2e2134b7a6ba88fa7d2d0 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 07:56:24 +0200
Subject: [PATCH 004/458] Added the current code state.

---
 src/jace/__about__.py                         |   2 +-
 src/jace/__init__.py                          |   2 +-
 src/jace/translator/__init__.py               |   2 +-
 .../jace_subtranslator_interface.py           |  10 +-
 .../translator/jaxpr_translator_driver.py     |  80 ++--
 .../translator/sub_translators/__init__.py    |   9 +-
 .../sub_translators/alu_translator.py         | 372 +++++++++---------
 src/jace/translator/util/__init__.py          |  12 +-
 .../util/jace_translation_memento.py          |   6 +-
 src/jace/translator/util/revision_counter.py  |   6 +-
 .../util/subtranslator_helper_order.py        |   3 +-
 src/jace/translator/util/util.py              |  24 +-
 src/jace/util/__init__.py                     |   2 +-
 src/jace/util/dace.py                         |   2 +-
 src/jace/util/jax.py                          |   5 +-
 src/jace/util/traits.py                       |   5 +-
 src/jace/util/util.py                         |   3 +-
 17 files changed, 284 insertions(+), 261 deletions(-)

diff --git a/src/jace/__about__.py b/src/jace/__about__.py
index 35acfe1..437e86b 100644
--- a/src/jace/__about__.py
+++ b/src/jace/__about__.py
@@ -1,4 +1,4 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index b4d71d1..5e0595b 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -1,4 +1,4 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 65a4e3d..899d973 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -1,4 +1,4 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
diff --git a/src/jace/translator/jace_subtranslator_interface.py b/src/jace/translator/jace_subtranslator_interface.py
index 2eda73b..3d6f53b 100644
--- a/src/jace/translator/jace_subtranslator_interface.py
+++ b/src/jace/translator/jace_subtranslator_interface.py
@@ -1,9 +1,10 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
+
 from __future__ import annotations
 
 from collections.abc import Collection, Sequence
@@ -80,7 +81,7 @@ def get_handled_primitives(self) -> Collection[str] | str:
 
     def can_translate_jaxeqn(
         self,
-        driver: "JaxprTranslationDriver",
+        driver: JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
         out_var_names: Sequence[str],
         eqn: jcore.JaxprEqn,
@@ -109,7 +110,7 @@ def can_translate_jaxeqn(
 
     def translate_jaxeqn(
         self,
-        driver: "JaxprTranslationDriver",
+        driver: JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
         out_var_names: Sequence[str],
         eqn: jcore.JaxprEqn,
@@ -245,6 +246,3 @@ def __gt__(
         other: Any,
     ) -> bool:
         return NotImplemented
-
-
-# end class(JaCeSubTranslatorInterface):
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index fb6856f..0f9c5ab 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -1,4 +1,4 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
@@ -9,7 +9,7 @@
 
 import re
 from collections.abc import Collection, Iterable, Mapping, Sequence
-from typing import Any, Final, Union, cast, overload
+from typing import Any, Final, cast, overload
 
 import dace
 import jax
@@ -49,7 +49,7 @@ class JaxprTranslationDriver:
     - `_create_jax_var_list()` for the bulk creation of Jax variables.
     - `_add_reserved_names()` if a name should be blocked (only affects later equation.
     - `_add_jax_name_mapping()` for creating new links between Jax variables and SDFG variables.
-    However, a subtranslator should only call them if it is neccessary.
+    However, a subtranslator should only call them if it is necessary.
 
 
     If no translation is ongoing the only function that makes sense to call is `translate_jaxpr()` to start a translation.
@@ -234,7 +234,7 @@ def fork(self) -> JaxprTranslationDriver:
         dolly: JaxprTranslationDriver = JaxprTranslationDriver(_no_shared_alloc=True)
 
         # Copy the shared members from parent to fork.
-        for slotName in self.__shared_slots__:
+        for slot_name in self.__shared_slots__:
             setattr(dolly, slot_name, getattr(self, slot_name))
 
         # Handle the special members and initialize them.
@@ -328,13 +328,13 @@ def map_jax_var_to_sdfg(
         self,
         jax_var: str | jcore.Atom,
         allow_fail: bool,
-    ) -> Union[str, None]: ...
+    ) -> str | None: ...
 
     def map_jax_var_to_sdfg(
         self,
         jax_var: str | jcore.Atom,
         allow_fail: bool = False,
-    ) -> Union[str, None]:
+    ) -> str | None:
         """Returns the name of the SDFG variable that the Jax variable `jax_var` is referring to.
 
         Args:
@@ -386,7 +386,9 @@ def is_allocated(self) -> bool:
                 In case the function returns `True` it is guaranteed that it is allocated.
                 If `False` is returned it might or might not be allocated.
         """
-        small_ctx: Sequence[Any] = [getattr(self, x)  for x in self.__shared_slots__ if x != "_reserved_names"]
+        small_ctx: Sequence[Any] = [
+            getattr(self, x) for x in self.__shared_slots__ if x != "_reserved_names"
+        ]
         if all((x is None) for x in small_ctx):
             if self._reserved_names is None:
                 raise RuntimeError(
@@ -406,29 +408,28 @@ def is_head_translator(self) -> bool:
         return self._rev_manager.is_root_revision(self._rev_idx)
 
     def same_family(
-            self,
-            other: JaxprTranslationDriver,
+        self,
+        other: JaxprTranslationDriver,
     ) -> bool:
         """Test if `self` and `other` belongs to the same family of driver/translators.
 
-        They belong to the same family if they decend from the same head translator.
+        They belong to the same family if they descend from the same head translator.
         """
         if not isinstance(other, JaxprTranslationDriver):
             return NotImplemented
-        if(all(getattr(self, x) is getattr(self, x)  for x in self.__shared_slots__)):
-            #assert (self if (self._rev_idx < other._rev_idx) else other).is_allocated()
+        if all(getattr(self, x) is getattr(self, x) for x in self.__shared_slots__):
+            assert (self if (self._rev_idx < other._rev_idx) else other).is_allocated()
             return True
-        assert not any(getattr(self, x) is getattr(self, x)  for x in self.__shared_slots__)
+        assert not any(getattr(self, x) is getattr(self, x) for x in self.__shared_slots__)
 
         return False
 
-
     @staticmethod
     def translate_dtype(dtype: Any) -> dace.typeclass:
         """Turns a Jax datatype into a DaCe datatype.
 
         Todo:
-            Imporove.
+            Improve.
         """
         nameof_dtype = str(dtype)
 
@@ -453,9 +454,7 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
         return dcd_type
 
     def _add_jax_name_mapping(
-            self,
-            jax_var: str | jcore.Atom,
-            sdfg_name: str
+        self, jax_var: str | jcore.Atom, sdfg_name: str
     ) -> JaxprTranslationDriver:
         """Creates the mapping between `jax_var` to `sdfg_name`.
 
@@ -505,7 +504,9 @@ def _add_reserved_names(
         elif isinstance(reserved_names, Collection):
             pass
         else:
-            raise TypeError(f"Does not know how to handle the type '{type(reserved_names).__name__}'.")
+            raise TypeError(
+                f"Does not know how to handle the type '{type(reserved_names).__name__}'."
+            )
         assert all(isinstance(x, str) for x in reserved_names)
 
         self._reserved_names.update(reserved_names)
@@ -575,7 +576,7 @@ def _add_array(
             Specifying `alt_name` implies `find_new_name=False`.
             The effect of specifying `force_jax_name` is as passing `jutil.get_jax_var_name(arg)` as `alt_name`.
         """
-        assert all(x is not None  for x in (self._sdfg, self._jax_name_map))
+        assert all(x is not None for x in (self._sdfg, self._jax_name_map))
         shape: Sequence[int] = arg.aval.shape  # Shape of the array
         offset = None  # i.e. no offset
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
@@ -723,7 +724,7 @@ def _create_jax_var_list(
         prevent_creation: bool = False,
         only_creation: bool = False,
         **kwargs: Any,
-    ) -> list[Union[None, str]]:
+    ) -> list[None | str]:
         """Creates SDFG variables for the listed Jax variables and returns the SDFG names as a list.
 
         Before the function will create a variable, by using `_add_array()` with `update_var_mapping=True`,
@@ -747,23 +748,20 @@ def _create_jax_var_list(
         if only_creation and prevent_creation:
             raise ValueError("Specified both 'only_creation' and 'prevent_creation'.")
 
-        ret_list: list[Union[None, str]] = []
+        ret_list: list[None | str] = []
         for jax_var in jax_var_list:
             if isinstance(jax_var, jcore.Literal):
                 if only_creation:
                     raise ValueError(f"Requested 'only_creation', but '{jax_var}' is a 'Literal'.")
                 ret_list.append(None)
             elif isinstance(jax_var, jcore.jax_var):
-                mapped_sdfg_name: Union[str, None] = self.map_jax_var_to_sdfg(
-                    jax_var, allow_fail=True)
+                mapped_sdfg_name: str | None = self.map_jax_var_to_sdfg(jax_var, allow_fail=True)
                 if mapped_sdfg_name is None:
                     if prevent_creation:
                         raise ValueError(
                             f"Forbid the creation of jaxVariables, but need to create '{jax_var!s}'."
                         )
-                    ret_list.append(
-                        self._add_array(arg=jax_var, update_var_mapping=True, **kwargs)
-                    )
+                    ret_list.append(self._add_array(arg=jax_var, update_var_mapping=True, **kwargs))
                 else:
                     if only_creation:
                         raise ValueError(
@@ -899,11 +897,11 @@ def _init_sub_translators(
     ) -> JaxprTranslationDriver:
         """This function initializes the subtranslator.
 
-        The function forwards `kwargs` to teh constructor of teh subtranslators.
+        The function forwards `kwargs` to the constructor of the subtranslators.
         However, it will remove all arguments starting with an underscore.
         """
-        if(isinstance(self._sub_translators, dict)):
-            raise RuntimeError(f"Tried to allocate the internal subtranslators twice.")
+        if isinstance(self._sub_translators, dict):
+            raise RuntimeError("Tried to allocate the internal subtranslators twice.")
         assert self._sub_translators is None
 
         # We might get arguments that starts with an underscore, which are not meant for the subtranslators.
@@ -987,8 +985,8 @@ def _find_sub_translator_for(
         if len(subtranslator_canidates) == 1:
             subtranslator = next(iter(subtranslator_canidates))
             assert subtranslator.can_translate_jaxeqn(
-                driver=self, in_var_names=in_var_names,
-                out_var_names=out_var_names, eqn=eqn)
+                driver=self, in_var_names=in_var_names, out_var_names=out_var_names, eqn=eqn
+            )
         else:
             for subtranslatorCanidate in subtranslator_canidates:
                 if subtranslatorCanidate.can_translate_jaxeqn(
@@ -1006,7 +1004,7 @@ def _translate_single_eqn(
         self,
         jaxpr: jcore.ClosedJaxpr,
         eqn: jcore.JaxprEqn,
-    ) -> tuple[Sequence[Union[str, None]], Sequence[str]]:
+    ) -> tuple[Sequence[str | None], Sequence[str]]:
         """Translate `eqn` into its SDFG equivalent.
 
         To do this the function will do the following steps:
@@ -1030,16 +1028,16 @@ def _translate_single_eqn(
             raise NotImplementedError(f"Equation '{eqn}' had side effects.")
 
         # Input/Output variables
-        in_var_names: Sequence[Union[str, None]] = self._create_jax_var_list(
+        in_var_names: Sequence[str | None] = self._create_jax_var_list(
             eqn.invars,
             prevent_creation=True,  # Inputs must already exists.
         )
         out_var_names: Sequence[str] = self._create_jax_var_list(  # type: ignore[assignment]
             eqn.outvars,
-            only_creation=True, # Output must not exist yet.
+            only_creation=True,  # Output must not exist yet.
         )
 
-        # Find the subtranslator 
+        # Find the subtranslator
         subtranslator: translator.JaCeSubTranslatorInterface = self._find_sub_translator_for(
             in_var_names=in_var_names,
             out_var_names=out_var_names,
@@ -1049,8 +1047,8 @@ def _translate_single_eqn(
         # Create the state into which the equation is put
         last_term_state: dace.SDFGState = self.get_terminal_sdfg_state()  # noqa: F841 # Will be used later
         eqn_state = self.append_new_state(
-                label=f"{eqn.primitive.name}_{out_var_names[0]}",
-                prev_state=None,    # Force to append as terminal state.
+            label=f"{eqn.primitive.name}_{out_var_names[0]}",
+            prev_state=None,  # Force to append as terminal state.
         )
 
         # Now perform the actual translation of the equation.
@@ -1124,7 +1122,7 @@ def _translate_jaxpr_internal(
         Notes:
             The function will unconditionally handle empty Jaxpr.
             Jax uses a variable with name `_` to indicate that this value is never read.
-                It is included by some transformations such as `gard()`.
+                It is included by some transformations such as `grad()`.
         """
         assert isinstance(jaxpr, jcore.ClosedJaxpr)
         assert self.is_allocated()
@@ -1235,7 +1233,7 @@ def _handle_null_jaxpr(
             # Now copy the input into the fake output variable.
             inp_acc = self._init_sdfg_state.add_read(self.map_jax_var_to_sdfg(jax_inp_name))
             out_acc = self._init_sdfg_state.add_write(self.map_jax_var_to_sdfg(jax_out_var))
-            self._sdfg_head.add_nedge(
+            self._init_sdfg_state.add_nedge(
                 src=inp_acc,
                 dst=out_acc,
                 data=dace.Memlet.from_array(
@@ -1261,5 +1259,3 @@ def _handle_null_jaxpr(
         'unsigned', 'using', 'virtual', 'void', 'volatile', 'while', 'xor', 'std',
     }
     # fmt: on
-
-
diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
index 4efefed..3878727 100644
--- a/src/jace/translator/sub_translators/__init__.py
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -1,3 +1,8 @@
-"""This module contains all subtranslator implementations.
-"""
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
 
+"""This module contains all subtranslator implementations."""
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index 3ca33e3..3b62d43 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -1,106 +1,90 @@
-"""This module contains the `ALUTranslator` which translates all arithmetic and logic primitives.
-"""
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
 
-from typing import Union, Any, Final, TYPE_CHECKING, cast
-from typing_extensions import override
+"""This module contains the `ALUTranslator` which translates all arithmetic and logic primitives."""
 
+from __future__ import annotations
 
-import jace
-from jace import translator as jtranslator
-from jace.translator import util as jtutil
-
+from collections.abc import Collection, Sequence
+from typing import Any, Final, cast
 
 import dace
-
-import jax
-from jax import core as jcore
 import numpy as np
+from jax import core as jcore
+from typing_extensions import override
 
-
-if TYPE_CHECKING:
-    from .jaxpr_translator_driver import JaxprTranslationDriver
-
+from jace import translator as jtranslator
+from jace.translator import util as jtutil
 
 
 class ALUTranslator(jtranslator.JaCeSubTranslatorInterface):
-    """This translator handles all arithmetic and logical operations.
+    """This translator handles all arithmetic and logical operations."""
 
-    """
     __slots__ = ("_unary_ops", "_binary_ops")
 
     # Contains all translation templates for unarry operations.
-    self.m_unarryOps: Final[dict[str, str]] = {
-            "pos":          "__out0 = +(__in0)",
-            "neg":          "__out0 = -(__in0)",
-            "not":          "__out0 = not (__in0)",
-
-            "floor":        "__out0 = floor(__in0)",
-            "ceil":         "__out0 = ceil(__in0)",
-            "round":        "__out0 = round(__in0)",
-            "abs":          "__out0 = abs(__in0)",
-            "sign":         "__out0 = sign(__in0)",
-
-            "sqrt":         "__out0 = sqrt(__in0)",
-
-            "log":          "__out0 = log(__in0)",
-            "exp":          "__out0 = exp(__in0)",
-            "integer_pow":  "__out0 = (__in0)**({y})",  # 'y' is a parameter of the primitive
-
-            "sin":          "__out0 = sin(__in0)",
-            "asin":         "__out0 = asin(__in0)",
-            "cos":          "__out0 = cos(__in0)",
-            "acos":         "__out0 = acos(__in0)",
-            "tan":          "__out0 = tan(__in0)",
-            "atan":         "__out0 = atan(__in0)",
-            "tanh":         "__out0 = tanh(__in0)",
+    _unary_ops: Final[dict[str, str]] = {
+        "pos": "__out0 = +(__in0)",
+        "neg": "__out0 = -(__in0)",
+        "not": "__out0 = not (__in0)",
+        "floor": "__out0 = floor(__in0)",
+        "ceil": "__out0 = ceil(__in0)",
+        "round": "__out0 = round(__in0)",
+        "abs": "__out0 = abs(__in0)",
+        "sign": "__out0 = sign(__in0)",
+        "sqrt": "__out0 = sqrt(__in0)",
+        "log": "__out0 = log(__in0)",
+        "exp": "__out0 = exp(__in0)",
+        "integer_pow": "__out0 = (__in0)**({y})",  # 'y' is a parameter of the primitive
+        "sin": "__out0 = sin(__in0)",
+        "asin": "__out0 = asin(__in0)",
+        "cos": "__out0 = cos(__in0)",
+        "acos": "__out0 = acos(__in0)",
+        "tan": "__out0 = tan(__in0)",
+        "atan": "__out0 = atan(__in0)",
+        "tanh": "__out0 = tanh(__in0)",
     }
     # Transformation for all binary operations
-    self._binarryOps: Final[dict[str, str]] = {
-            "add":          "__out0 = (__in0)+(__in1)",
-            "add_any":      "__out0 = (__in0)+(__in1)",     # No idea what makes `add_any` differ from `add`
-            "sub":          "__out0 = (__in0)-(__in1)",
-            "mul":          "__out0 = (__in0)*(__in1)",
-            "div":          "__out0 = (__in0)/(__in1)",
-            "rem":          "__out0 = (__in0)%(__in1)",
-
-            "and":          "__out0 = (__in0) and (__in1)",
-            "or":           "__out0 = (__in0) or  (__in1)",
-
-            "pow":          "__out0 = (__in0)**(__in1)",
-            "ipow":         "__out0 = (__in0)**(int(__in1))",
-
-            "min":          "__out0 = min(__in0, __in1)",
-            "max":          "__out0 = max(__in0, __in1)",
-
-            "eq":          "__out0 = __in0 == __in1",
-            "ne":          "__out0 = __in0 != __in1",
-            "ge":          "__out0 = __in0 >= __in1",
-            "gt":          "__out0 = __in0 > __in1",
-            "le":          "__out0 = __in0 <= __in1",
-            "lt":          "__out0 = __in0 < __in1",
+    _binary_ops: Final[dict[str, str]] = {
+        "add": "__out0 = (__in0)+(__in1)",
+        "add_any": "__out0 = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
+        "sub": "__out0 = (__in0)-(__in1)",
+        "mul": "__out0 = (__in0)*(__in1)",
+        "div": "__out0 = (__in0)/(__in1)",
+        "rem": "__out0 = (__in0)%(__in1)",
+        "and": "__out0 = (__in0) and (__in1)",
+        "or": "__out0 = (__in0) or  (__in1)",
+        "pow": "__out0 = (__in0)**(__in1)",
+        "ipow": "__out0 = (__in0)**(int(__in1))",
+        "min": "__out0 = min(__in0, __in1)",
+        "max": "__out0 = max(__in0, __in1)",
+        "eq": "__out0 = __in0 == __in1",
+        "ne": "__out0 = __in0 != __in1",
+        "ge": "__out0 = __in0 >= __in1",
+        "gt": "__out0 = __in0 > __in1",
+        "le": "__out0 = __in0 <= __in1",
+        "lt": "__out0 = __in0 < __in1",
     }
 
-    def __init__(
-            self,
-            **kwargs: Any
-    ) -> None:
-        """Initialize the `ALUTranslator`.
-        """
+    def __init__(self, **kwargs: Any) -> None:
+        """Initialize the `ALUTranslator`."""
         super().__init__(**kwargs)
-    # end def: __init__
 
+    # end def: __init__
 
     @override
     def get_handled_primitives(self) -> Collection[str] | str:
-        """Returns the list of all known primitives.
-        """
+        """Returns the list of all known primitives."""
         return set(self._unary_ops.keys()).union(self._binary_ops.keys())
 
-
     @override
     def can_translate_jaxeqn(
         self,
-        driver: "JaxprTranslationDriver",
+        driver: jtranslator.JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
         out_var_names: Sequence[str],
         eqn: jcore.JaxprEqn,
@@ -110,25 +94,24 @@ def can_translate_jaxeqn(
         Notes:
             A user can generally expect that this function returns `True`.
         """
-        is_scalar: bool = (len(eqn.outvars[0].aval.shape) == 0)
+        is_scalar: bool = len(eqn.outvars[0].aval.shape) == 0
         prim_name: str = eqn.primitive.name
-        if(prim_name in self._unary_ops):
+        if prim_name in self._unary_ops:
             assert len(eqn.invars) == 1
-        elif(prim_name in self._binary_ops):
+        elif prim_name in self._binary_ops:
             assert len(eqn.invars) == 2
-        elif(out_var_names[0] is None):
+        elif out_var_names[0] is None or (not is_scalar) and all(x is None for x in in_var_names):
             return False
-        if(all(x is None  for x in in_var_names)):
+        if all(x is None for x in in_var_names):
             return False
-        if(len(eqn.effects) != 0):
+        if len(eqn.effects) != 0:
             return False
         return True
 
-
     @override
     def translate_jaxeqn(
         self,
-        driver: "JaxprTranslationDriver",
+        driver: jtranslator.JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
         out_var_names: Sequence[str],
         eqn: jcore.JaxprEqn,
@@ -150,50 +133,69 @@ def translate_jaxeqn(
 
         # All this checks are done to capture corner cases that Jax might do but are not implemented.
         #  If you find out that Jax will never create something, then remove it.
-        if(not all(invar.aval.shape == ()  for invar, x in zip(eqn.invars, in_var_names) if x is None)):
-            raise NotImplementedError(f"Can not handle Literals that are not scalars.")
-        if(in_var_names[0] is None):
-            raise NotImplementedError(f"Literal can only not be on the right hand side of the operation.")
-        if(not any(invar.aval.shape == eqn.outvars[0].aval.shape  for invar in eqn.invars)):
-            raise NotImplementedError(f"At least input must have the same shape as the output.")
-        if(len(eqn.outvars) != 1):
+        if not all(
+            invar.aval.shape == ()
+            for invar, x in zip(eqn.invars, in_var_names, strict=False)
+            if x is None
+        ):
+            raise NotImplementedError("Can not handle Literals that are not scalars.")
+        if in_var_names[0] is None:
+            raise NotImplementedError(
+                "Literal can only not be on the right hand side of the operation."
+            )
+        if not any(invar.aval.shape == eqn.outvars[0].aval.shape for invar in eqn.invars):
+            raise NotImplementedError("At least input must have the same shape as the output.")
+        if len(eqn.outvars) != 1:
             raise NotImplementedError(f"Can only handle one output (Eq: '{eqn}'.")
 
         # Determine what kind of input we got and how we should proceed.
-        is_scalar = (len(eqn.outvars[0].aval.shape) == 0)
-        inp_scalars = [len(Inp.aval.shape) == 0  for i, Inp in enumerate(eqn.invars)]
+        is_scalar = len(eqn.outvars[0].aval.shape) == 0
+        inp_scalars = [len(Inp.aval.shape) == 0 for i, Inp in enumerate(eqn.invars)]
         has_scalars_as_inputs = any(inp_scalars)
         only_scalars_as_inputs = all(inp_scalars)
-        has_some_literals = any([x is None  for x in in_var_names])
-        only_literals_as_inputs = all([x is None  for x in in_var_names])
-        inps_same_shape   = all([eqn.invars[0].aval.shape == eqn.invars[i].aval.shape  for i in range(1, len(eqn.invars))])
+        has_some_literals = any([x is None for x in in_var_names])
+        only_literals_as_inputs = all([x is None for x in in_var_names])
+        inps_same_shape = all(
+            [
+                eqn.invars[0].aval.shape == eqn.invars[i].aval.shape
+                for i in range(1, len(eqn.invars))
+            ]
+        )
 
         # We will now look which dimensions have to be broadcasted on which operator.
         #  I.e. in the dimensions in the lists below there will be no map iteration index.
-        dims_to_bcastl: Sequence[int] = []
-        dims_to_bcastr: Sequence[int] = []
+        dims_to_bcastl: list[int] = []
+        dims_to_bcastr: list[int] = []
 
         # Determine if and if yes how we have to broadcast.
-        if(is_scalar):
+        if is_scalar:
             # The output is a scalar, in which case we must have only scalar input as well.
             #  Furthermore, we can have the situation that only Literals are the input.
             assert (not is_scalar) or only_scalars_as_inputs
             assert (not is_scalar) or only_literals_as_inputs
 
-        elif(only_literals_as_inputs):
-            raise NotImplementedError(f"Only literals an input is only allowed for the scalar case.")
+        elif only_literals_as_inputs:
+            raise NotImplementedError("Only literals an input is only allowed for the scalar case.")
 
-        elif(inps_same_shape):
+        elif inps_same_shape:
             pass
 
-        elif(has_some_literals or has_scalars_as_inputs):
+        elif has_some_literals or has_scalars_as_inputs:
             # This is essentially array plus scalar, but in two possibilities.
             #  We either have a scalar variable or we have a scalar literal.
-            assert (not has_some_literals) or all(invar.aval.shape == eqn.outvars[0].aval.shape  for (invar, x) in zip(eqn.invars, in_var_names) if x is not None)
-            assert (not has_scalars_as_inputs) or all(invar.aval.shape in {eqn.outvars[0].aval.shape, ()}  for (invar, x) in zip(eqn.invars, in_var_names) if x is not None)
+            assert (not has_some_literals) or all(
+                invar.aval.shape == eqn.outvars[0].aval.shape
+                for (invar, x) in zip(eqn.invars, in_var_names, strict=False)
+                if x is not None
+            )
+            assert (not has_scalars_as_inputs) or all(
+                invar.aval.shape in {eqn.outvars[0].aval.shape, ()}
+                for (invar, x) in zip(eqn.invars, in_var_names, strict=False)
+                if x is not None
+            )
 
-        elif(len(in_var_names) != 2):
-            raise ValueError(f"Can only do broadcasting if there are two operands.")
+        elif len(in_var_names) != 2:
+            raise ValueError("Can only do broadcasting if there are two operands.")
 
         else:
             # This is the general broadcasting case
@@ -201,23 +203,25 @@ def translate_jaxeqn(
             #  It seems that Jax ensures this.
             #  We further assume that if the size in a dimension differs then one must have size 1.
             #  This is the size we broadcast over, i.e. conceptually replicated.
-            out_shp  = tuple(eqn.outvars[0].aval.shape)  # Shape of the output.
-            inp_shpl = tuple(eqn.invars[0].aval.shape)   # Shape of the left/first input
-            inp_shpr = tuple(eqn.invars[1].aval.shape)   # Shape of the right/second input; this must be "expanded"
+            out_shp = tuple(eqn.outvars[0].aval.shape)  # Shape of the output.
+            inp_shpl = tuple(eqn.invars[0].aval.shape)  # Shape of the left/first input
+            inp_shpr = tuple(
+                eqn.invars[1].aval.shape
+            )  # Shape of the right/second input; this must be "expanded"
 
-            if(not ((len(inp_shpl) == len(inp_shpr)) and (len(out_shp) == len(inp_shpr)))):
+            if not ((len(inp_shpl) == len(inp_shpr)) and (len(out_shp) == len(inp_shpr))):
                 raise NotImplementedError("Can not broadcast over different ranks.")
 
             for dim in reversed(range(len(out_shp))):
                 shp_lft = inp_shpl[dim]
                 shp_rgt = inp_shpr[dim]
 
-                if(shp_lft == shp_rgt):
+                if shp_lft == shp_rgt:
                     assert out_shp[dim] == shp_lft
-                elif(shp_lft == 1):
+                elif shp_lft == 1:
                     assert shp_rgt == out_shp[dim]
                     dims_to_bcastl.append(dim)
-                elif(shp_rgt == 1):
+                elif shp_rgt == 1:
                     assert shp_lft == out_shp[dim]
                     dims_to_bcastr.append(dim)
                 else:
@@ -227,62 +231,82 @@ def translate_jaxeqn(
         tskl_code: str = self._writeTaskletCode(in_var_names, eqn)
         tskl_name: str = eqn.primitive.name
         tskl_map_ranges: list[tuple[str, str]] = [
-                (f'__i{dim}', f'0:{N}')
-                for dim, N in enumerate(eqn.outvars[0].aval.shape)
+            (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
         ]
-        tskl_outputs: list[Union[tuple[str, dace.Memlet]], tuple[None, None]] = []
-        tskl_inputs: list[tuple[str, dace.Memlet]] = []
+        tskl_outputs: list[tuple[str, dace.Memlet]] = []
+        tskl_inputs: list[tuple[str, dace.Memlet] | tuple[None, None]] = []
 
         # Generate the Memlets for the input.
-        for i, dims_to_bcast in zip(range(len(eqn.invars)), [dims_to_bcastl, dims_to_bcastr]):
-            if(in_var_names[i] is None):
-                # Litteral: No input needed.
+        for i, dims_to_bcast in zip(
+            range(len(eqn.invars)), [dims_to_bcastl, dims_to_bcastr], strict=False
+        ):
+            if in_var_names[i] is None:
+                # Literal: No input needed.
                 tskl_inputs.append((None, None))
                 continue
-            elif(inp_scalars[i]):
+            elif inp_scalars[i]:
                 # We have a scalar argument.
-                i_memlet = dace.Memlet.from_array(in_var_names[i], translator.getSDFG().arrays[in_var_names[i]])
+                i_memlet: dace.Memlet = dace.Memlet.from_array(
+                    in_var_names[i], driver.get_sdfg().arrays[in_var_names[i]]
+                )
             else:
                 # We have an array argument.
                 inputs_: list[str] = []
                 for dim, (map_var, _) in enumerate(tskl_map_ranges):
-                    if(dim in dims_to_bcast):
-                        inputs_.append('0')
+                    if dim in dims_to_bcast:
+                        inputs_.append("0")
                     else:
                         inputs_.append(str(map_var))
-                i_memlet: dace.Memlet = dace.Memlet.simple(in_var_names[i], ", ".join(tInputs_))
+                i_memlet = dace.Memlet.simple(in_var_names[i], ", ".join(inputs_))
                 del inputs_
-            tskl_inputs.append( (f'__in{i}', i_memlet) )
+            tskl_inputs.append((f"__in{i}", i_memlet))
 
         # Now generate the Memlets for the outputs
-        if(is_scalar):
-            tskl_outputs.append( (f'__out{i}', dace.Memlet.from_array(out_var_names[0], translator.getSDFG().arrays[out_var_names[i]])) )
+        if is_scalar:
+            tskl_outputs.append(
+                (
+                    f"__out{i}",
+                    dace.Memlet.from_array(
+                        out_var_names[0], driver.get_sdfg().arrays[out_var_names[i]]
+                    ),
+                )
+            )
         else:
-            tskl_outputs.append( (f'__out{i}', dace.Memlet.simple(out_var_names[0], ', '.join([X[0]  for X in tskl_map_ranges]))) )
+            tskl_outputs.append(
+                (
+                    f"__out{i}",
+                    dace.Memlet.simple(
+                        out_var_names[0], ", ".join([X[0] for X in tskl_map_ranges])
+                    ),
+                )
+            )
 
-        if(is_scalar):
+        if is_scalar:
             tskl_tasklet = eqn_state.add_tasklet(
-                    tskl_name,
-                    list_to_dict(tskl_inputs).keys(),
-                    list_to_dict(tskl_outputs).keys(),
-                    tskl_code,
+                tskl_name,
+                jtutil.list_to_dict(tskl_inputs).keys(),
+                jtutil.list_to_dict(tskl_outputs).keys(),
+                tskl_code,
             )
-            for in_var, (in_connector, in_memlet)  in filter(lambda X: X[0] is not None, zip(in_var_names, tskl_inputs)):
+            for in_var, (in_connector, in_memlet) in filter(
+                lambda X: X[0] is not None, zip(in_var_names, tskl_inputs, strict=False)
+            ):
                 eqn_state.add_edge(
-                        eqn_state.add_read(in_var),
-                        None,
-                        tskl_tasklet,
-                        in_connector,
-                        in_memlet,
+                    eqn_state.add_read(in_var),
+                    None,
+                    tskl_tasklet,
+                    in_connector,
+                    in_memlet,
                 )
-            for out_var, (out_connector, out_memlet) in zip(out_var_names, tskl_outputs):
-                out = eqn_state.add_write(oVar)
+            for out_var, (out_connector, out_memlet) in zip(
+                out_var_names, tskl_outputs, strict=False
+            ):
                 eqn_state.add_edge(
-                        tskl_tasklet,
-                        out_connector,
-                        eqn_state.add_write(oVar),
-                        None,
-                        out_memlet,
+                    tskl_tasklet,
+                    out_connector,
+                    eqn_state.add_write(out_var),
+                    None,
+                    out_memlet,
                 )
         else:
             eqn_state.add_mapped_tasklet(
@@ -296,12 +320,11 @@ def translate_jaxeqn(
 
         return eqn_state
 
-
     def _writeTaskletCode(
-            self,
-            in_var_names: list[Union[str, None]],
-            eqn: JaxprEqn,
-    ):
+        self,
+        in_var_names: Sequence[str | None],
+        eqn: jcore.JaxprEqn,
+    ) -> str:
         """This function generates the Tasklet code based on a primitive.
 
         The function will also perform literal substitution and parameter handling.
@@ -310,54 +333,49 @@ def _writeTaskletCode(
             in_var_names:   The list of SDFG variables used as input.
         """
         t_name = eqn.primitive.name
-        if("integer_pow" == t_name):
+        if t_name == "integer_pow":
             # INTEGER POWER
-            exponent = int(eqn.params['y'])
-            if(exponent == 0):
-                t_code = f"__out0 = dace.{str(eqn.outvars[0].aval.dtype)}(1)"
-            elif(exponent == 1):
+            exponent = int(eqn.params["y"])
+            if exponent == 0:
+                t_code = f"__out0 = dace.{eqn.outvars[0].aval.dtype!s}(1)"
+            elif exponent == 1:
                 t_code = "__out0 = __in0"
-            elif(exponent == 2):
+            elif exponent == 2:
                 t_code = "__out0 = __in0 * __in0"
-            elif(exponent == 3):
+            elif exponent == 3:
                 t_code = "__out0 = (__in0 * __in0) * __in0"
-            elif(exponent == 4):
+            elif exponent == 4:
                 t_code = "__tmp0 = __in0 * __in0\n__out0 = __tmp0 * __tmp0"
-            elif(exponent == 5):
+            elif exponent == 5:
                 t_code = "__tmp0 = __in0 * __in0\n__tmp1 = __tmp0 * __tmp0\n__out0 = __tmp1 * __in0"
             else:
-                t_code = self.m_unarryOps[t_name]
+                t_code = self._unary_ops[t_name]
 
         else:
             # GENERAL CASE
-            if(t_name in self._unary_ops):
+            if t_name in self._unary_ops:
                 t_code = self._unary_ops[t_name]
-            elif(t_name in self._binary_ops):
+            elif t_name in self._binary_ops:
                 t_code = self._binary_ops[t_name]
 
         # Now we handle Literal substitution
         for i, in_var_name in enumerate(in_var_names):
-            if(in_var_name is not None):
+            if in_var_name is not None:
                 continue
 
             jax_in_var: jcore.Literal = cast(jcore.Literal, eqn.invars[i])
-            if(jax_in_var.aval.shape == ()):
+            if jax_in_var.aval.shape == ():
                 t_val = jax_in_var.val
-                if(isinstance(t_val, np.ndarray)):
-                    t_val = jax_in_var.val.max() # I do not know a better way in that case
+                if isinstance(t_val, np.ndarray):
+                    t_val = jax_in_var.val.max()  # I do not know a better way in that case
                 t_code = t_code.replace(f"__in{i}", str(t_val))
             else:
-                raise ValueError(f"Can not handle the literal case of shape: {jax_in_var.aval.shape}")
+                raise ValueError(
+                    f"Can not handle the literal case of shape: {jax_in_var.aval.shape}"
+                )
 
         # Now replace the parameters
-        if(len(eqn.params) != 0):
+        if len(eqn.params) != 0:
             t_code = t_code.format(**eqn.params)
 
         return t_code
-
-
-
-
-
-
-
diff --git a/src/jace/translator/util/__init__.py b/src/jace/translator/util/__init__.py
index fb3eee6..7410138 100644
--- a/src/jace/translator/util/__init__.py
+++ b/src/jace/translator/util/__init__.py
@@ -1,4 +1,4 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
@@ -9,9 +9,7 @@
 
 from __future__ import annotations
 
-from .jace_translation_memento import JaCeTranslationMemento
-from .revision_counter import RevisionCounterManager
-from .subtranslator_helper_order import sort_subtranslators
-from .util import list_to_dict
-
-
+from .jace_translation_memento import JaCeTranslationMemento  # noqa: F401 # Unused import
+from .revision_counter import RevisionCounterManager  # noqa: F401 # Unused import
+from .subtranslator_helper_order import sort_subtranslators  # noqa: F401 # Unused import
+from .util import list_to_dict  # noqa: F401 # Unused import
diff --git a/src/jace/translator/util/jace_translation_memento.py b/src/jace/translator/util/jace_translation_memento.py
index 62ad230..1f267e7 100644
--- a/src/jace/translator/util/jace_translation_memento.py
+++ b/src/jace/translator/util/jace_translation_memento.py
@@ -1,9 +1,10 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
+
 from __future__ import annotations
 
 from collections.abc import Mapping, Sequence
@@ -74,6 +75,3 @@ def __eq__(self, other: Any) -> bool:
 
         x: bool = self.sdfg.__eq__(other)
         return x
-
-
-# end class(JaCeTranslationMemento):
diff --git a/src/jace/translator/util/revision_counter.py b/src/jace/translator/util/revision_counter.py
index 7f19a76..e6531bc 100644
--- a/src/jace/translator/util/revision_counter.py
+++ b/src/jace/translator/util/revision_counter.py
@@ -1,9 +1,10 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
+
 from __future__ import annotations
 
 from typing import Final
@@ -50,6 +51,3 @@ def is_root_revision(
     ) -> bool:
         """This function checks if 'rev' revers to the (absolute) unique revision of the root."""
         return rev == self.ROOT_REVISION
-
-
-# end class(RevisionCounterManager):
diff --git a/src/jace/translator/util/subtranslator_helper_order.py b/src/jace/translator/util/subtranslator_helper_order.py
index 1b52d81..4be8604 100644
--- a/src/jace/translator/util/subtranslator_helper_order.py
+++ b/src/jace/translator/util/subtranslator_helper_order.py
@@ -1,9 +1,10 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
+
 from __future__ import annotations
 
 from collections.abc import Sequence
diff --git a/src/jace/translator/util/util.py b/src/jace/translator/util/util.py
index 574efad..484b4ef 100644
--- a/src/jace/translator/util/util.py
+++ b/src/jace/translator/util/util.py
@@ -1,15 +1,21 @@
-"""Contains all general helper functions needed inside the translator.
-"""
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
 
-from typing import Union, Any
+"""Contains all general helper functions needed inside the translator."""
 
-def list_to_dict(
-        inp: list[Union[tuple[None, Any], tuple[Any, Any]]]
-) -> dict[Any, Any]:
+from __future__ import annotations
+
+from collections.abc import Sequence
+from typing import Any
+
+
+def list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
     """This method turns a `list` of pairs into a `dict` and applies a `None` filter.
 
     The function will only include pairs whose key, i.e. first element is not `None`.
     """
-    return {k:v  for k, v in inp if k is not None}
-# end def: ListToDict
-
+    return {k: v for k, v in inp if k is not None}
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 703ad85..fcd0380 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -1,4 +1,4 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
diff --git a/src/jace/util/dace.py b/src/jace/util/dace.py
index 1e9b874..90300d7 100644
--- a/src/jace/util/dace.py
+++ b/src/jace/util/dace.py
@@ -1,4 +1,4 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
diff --git a/src/jace/util/jax.py b/src/jace/util/jax.py
index 6e0c1a5..bc80b2c 100644
--- a/src/jace/util/jax.py
+++ b/src/jace/util/jax.py
@@ -1,4 +1,4 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
@@ -41,3 +41,6 @@ def get_jax_var_name(jax_var: jcore.Atom | str) -> str:
             f"Failed to translate the Jax variable '{jax_var}' into a name, the result was empty."
         )
     return jax_var
+
+
+# NEW LINE
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index b791cb8..ccdf19a 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -1,4 +1,4 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
@@ -9,7 +9,8 @@
 
 from __future__ import annotations
 
-from typing import Any, Sequence
+from collections.abc import Sequence
+from typing import Any
 
 
 def is_str(
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index 2c1af01..e1ae14a 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -1,9 +1,10 @@
-# JaCe - JAX jit using DaCe (Data Centric Parallel Programming)
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
 #
 # Copyright (c) 2024, ETH Zurich
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
+
 from __future__ import annotations
 
 from collections.abc import Iterable

From e702e6fec9914131395239fe01067d28cfb54cd7 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 08:59:45 +0200
Subject: [PATCH 005/458] Implemented a possibibility to manage translators.

The infrastructure also allows to add new translator for exterally defined primitives.
---
 .../translator/sub_translators/__init__.py    | 80 ++++++++++++++++++-
 1 file changed, 79 insertions(+), 1 deletion(-)

diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
index 3878727..aea1151 100644
--- a/src/jace/translator/sub_translators/__init__.py
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -5,4 +5,82 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""This module contains all subtranslator implementations."""
+"""Module collecting all built-in subtranslators.
+
+"""
+
+from typing import Final, Type, Sequence
+
+import jace
+from jace import translator as jtrans
+
+from .alu_translator import ALUTranslator
+
+# List of all subtranslators that ships with JaCe.
+_BUILTIN_SUBTRANSLATORS: Final[list[Type[jtrans.JaCeSubTranslatorInterface]]] = [
+        ALUTranslator,
+]
+
+# List of the externally supplied subtranslator implementation.
+#  It is a `dict` to do fast access and remember the order, value is always `None`.
+#  The list is manipulated through `{add,rm}_subtranslator()`.
+_EXTERNAL_SUBTRANSLATORS: dict[Type[jtrans.JaCeSubTranslatorInterface], None] = {}
+
+
+def add_subtranslator(
+        subtrans: Type[jtrans.JaCeSubTranslatorInterface],
+) -> bool:
+    """Add `subtrans` to the internal list of externally supplied subtranslators.
+
+    The function returns `True` if it was added and `False` is not.
+    """
+    from inspect import isclass
+    if(subtrans in _EXTERNAL_SUBTRANSLATORS):
+        return False
+    if(not isclass(subtrans)):
+        return False
+    if(not issubclass(subtrans, jtrans.JaCeSubTranslatorInterface)):
+        return False
+    _EXTERNAL_SUBTRANSLATORS[subtrans] = None
+    return True
+
+
+def rm_subtranslator(
+        subtrans: Type[jtrans.JaCeSubTranslatorInterface],
+        strict: bool = False,
+) -> bool:
+    """Removes subtranslator `subtrans` from the list of known subtranslators.
+
+    If `subtrans` is not known no error is generated unless `strict` is set to `True`.
+    """
+    if(subtrans not in _EXTERNAL_SUBTRANSLATORS):
+        if(strict):
+            raise KeyError(f"Subtranslator '{type(subtrans)}' is not known.")
+        return False
+    del _EXTERNAL_SUBTRANSLATORS[subtrans]
+    return True
+
+
+def _get_subtranslators_cls(
+        with_external: bool = True,
+        builtins: bool = True,
+) -> Sequence[Type[jtrans.JaCeSubTranslatorInterface]]:
+    """Returns a list of all subtranslator classes in JaCe.
+
+    Args:
+        with_external:  Include the translators that were externally supplied.
+        builtins:       Include the build in translators.
+    """
+    ret: list[Type[jtrans.JaCeSubTranslatorInterface]] = []
+    if(builtins):
+        ret.extend(_BUILTIN_SUBTRANSLATORS)
+    if(with_external):
+        ret.extend(_EXTERNAL_SUBTRANSLATORS.keys())
+    return ret
+
+
+__all__ = [
+        "add_subtranslator",
+        "rm_subtranslator",
+]
+

From 6ccd9f65c4aa8f6e209db6cfbc7450d0a81e69e2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 09:02:02 +0200
Subject: [PATCH 006/458] Made some renaming.

---
 .../translator/jaxpr_translator_driver.py     | 22 ++++++++++---------
 1 file changed, 12 insertions(+), 10 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 0f9c5ab..5a73d39 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -9,16 +9,18 @@
 
 import re
 from collections.abc import Collection, Iterable, Mapping, Sequence
-from typing import Any, Final, cast, overload
+from typing import Any, Final, cast, overload, Type
 
 import dace
 import jax
 from dace import data as ddata, properties as dprop
 from jax import core as jcore
 
-from jace import translator
-from jace.translator import util as jtrutil
+import jace
+from jace import translator as trans
 from jace.util import jax as jutil
+from jace.translator import util as jtrutil
+from jace.translator import sub_translators as jtsubt
 
 
 class JaxprTranslationDriver:
@@ -108,7 +110,7 @@ def __init__(
         #  They are partitioned by the names of the primitive they have registered for.
         #  Inside a partition they are ordered by priority, lowest first, more important.
         #  This member is allocated by '_init_sub_translators()' and remains allocated during the lifetime of the object.
-        self._sub_translators: dict[str, list[translator.JaCeSubTranslatorInterface]] = None  # type: ignore[assignment]
+        self._sub_translators: dict[str, list[trans.JaCeSubTranslatorInterface]] = None  # type: ignore[assignment]
 
         # The SDFG object that we are currently constructing.
         #  Only allocated during an ongoing translation.
@@ -908,12 +910,12 @@ def _init_sub_translators(
         kwargs = {k: v for k, v in kwargs.items() if not k.startswith("_")}
 
         # Will contain all subtranslators we create.
-        subtranslators: dict[str, list[translator.JaCeSubTranslatorInterface]] = {}
+        subtranslators: dict[str, list[trans.JaCeSubTranslatorInterface]] = {}
 
         # First we will create all subtranslators and partition them.
-        subtranslator_cls: type[translator.JaCeSubTranslatorInterface]
+        subtranslator_cls: Type[trans.JaCeSubTranslatorInterface]
         for subtranslator_cls in []:
-            subtranslator: translator.JaCeSubTranslatorInterface = subtranslator_cls(**kwargs)
+            subtranslator: trans.JaCeSubTranslatorInterface = subtranslator_cls(**kwargs)
             handled_primitives: Iterable[str] = jutil.ensure_iterability(
                 subtranslator.getHandledPrimitives()
             )
@@ -964,7 +966,7 @@ def _find_sub_translator_for(
         in_var_names: Sequence[str | None],
         out_var_names: Sequence[str],
         eqn: jcore.JaxprEqn,
-    ) -> translator.JaCeSubTranslatorInterface:
+    ) -> trans.JaCeSubTranslatorInterface:
         """Returns the subtranslator object to translate `eqn`.
 
         The subtranslators are checked for applicability in the order of their priority.
@@ -981,7 +983,7 @@ def _find_sub_translator_for(
         subtranslator_canidates = self._sub_translators[prim_name]
         assert len(subtranslator_canidates) > 0
 
-        subtranslator: translator.JaCeSubTranslatorInterface = None  # type: ignore[assignment]
+        subtranslator: trans.JaCeSubTranslatorInterface = None  # type: ignore[assignment]
         if len(subtranslator_canidates) == 1:
             subtranslator = next(iter(subtranslator_canidates))
             assert subtranslator.can_translate_jaxeqn(
@@ -1038,7 +1040,7 @@ def _translate_single_eqn(
         )
 
         # Find the subtranslator
-        subtranslator: translator.JaCeSubTranslatorInterface = self._find_sub_translator_for(
+        subtranslator: trans.JaCeSubTranslatorInterface = self._find_sub_translator_for(
             in_var_names=in_var_names,
             out_var_names=out_var_names,
             eqn=eqn,

From c684ceb2ba2ce86aa49da3ab4c8fbb0d6ad7c786 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 09:02:31 +0200
Subject: [PATCH 007/458] The driver now loads the subtrabnslator and actually
 initiaslizes them.

At least the arethmetic translator now works.
---
 src/jace/translator/jaxpr_translator_driver.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 5a73d39..c1f9e04 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -914,7 +914,7 @@ def _init_sub_translators(
 
         # First we will create all subtranslators and partition them.
         subtranslator_cls: Type[trans.JaCeSubTranslatorInterface]
-        for subtranslator_cls in []:
+        for subtranslator_cls in jtsubt._get_subtranslators_cls():
             subtranslator: trans.JaCeSubTranslatorInterface = subtranslator_cls(**kwargs)
             handled_primitives: Iterable[str] = jutil.ensure_iterability(
                 subtranslator.getHandledPrimitives()

From 935908f472f3e46a24531afa60c889534b079899 Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Fri, 19 Apr 2024 09:34:35 +0200
Subject: [PATCH 008/458] chore: fine tune linting settings

---
 pyproject.toml | 16 +++++++++-------
 1 file changed, 9 insertions(+), 7 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index 7e1025c..78b41c1 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -100,22 +100,23 @@ extend-select = [
   "G",  # flake8-logging-format
   "C4",  # flake8-comprehensions
   "PT",  # flake8-pytest-style
-  "UP",  # pyupgrade  # TODO: evaluate and remove if needed
+  "UP",  # pyupgrade       # TODO: in evaluation
   "ARG",  # flake8-unused-arguments
   "ERA",  # eradicate
   "ICN",  # flake8-import-conventions
   "PGH",  # pygrep-hooks
   "PIE",  # flake8-pie
   "PTH",  # flake8-use-pathlib
-  "RET",  # flake8-return  # TODO: evaluate and remove if needed
+  "RET",  # flake8-return   # TODO: in evaluation
   "RUF",  # Ruff-specific
-  "SIM",  # flake8-simplify  # TODO: evaluate and remove if needed
+  "SIM",  # flake8-simplify # TODO: in evaluation
   "T10",  # flake8-debugger
-  "T20",  # flake8-print  # TODO: evaluate and remove if needed
+  "T20",  # flake8-print    # TODO: in evaluation
   "NPY"  # NumPy specific rules
 ]
 ignore = [
-  'E501'  # [line-too-long]
+  'E501',  # [line-too-long]
+  'UP038'  # [non-pep604-isinstance]
 ]
 ignore-init-module-imports = true
 unfixable = []
@@ -144,5 +145,6 @@ section-order = [
 ]
 
 [tool.ruff.lint.per-file-ignores]
-"noxfile.py" = ["T20"]
-"tests/**" = ["T10", "T20"]
+"!tests/**.py" = ["PT"]  # Ignore `flake8-pytest-style` everywhere except in `tests/`
+"noxfile.py" = ["T20"]  # Ignore `flake8-print`
+"tests/**" = ["T10", "T20"]  # Ignore `flake8-debugger` and `flake8-print`

From 741a209954ee933220bb6b396349d6a03902d511 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 09:40:48 +0200
Subject: [PATCH 009/458] WIP: Added more tests.

---
 ..._order.py => test_subtranslator_helper.py} | 96 ++++++++++++++++++-
 1 file changed, 94 insertions(+), 2 deletions(-)
 rename tests/{test_subtranslator_helper_order.py => test_subtranslator_helper.py} (64%)

diff --git a/tests/test_subtranslator_helper_order.py b/tests/test_subtranslator_helper.py
similarity index 64%
rename from tests/test_subtranslator_helper_order.py
rename to tests/test_subtranslator_helper.py
index ed35cc6..b6250d9 100644
--- a/tests/test_subtranslator_helper_order.py
+++ b/tests/test_subtranslator_helper.py
@@ -1,14 +1,16 @@
 """Implements tests to check if the sorting algorithm is correct.
 """
 
-from typing                     import Collection, Sequence, Union
+from typing                     import Collection, Sequence, Union, Type
 
 import jace
 from jace   import translator as jtrans
 
 
 def test_subtranslatior_order_simple():
-    """This test is to ensure that `sortSubtranslators()` works correctly.
+    """Tests if the ordering of subtranslators works correctly.
+
+    Simple version that only uses priorities.
     """
     from jace.translator.util.subtranslator_helper_order import  sort_subtranslators
 
@@ -53,6 +55,10 @@ def __init__(self, *args, **kwargs):
 
 
 def test_subtranslatior_order_custom1():
+    """Tests if the ordering of subtranslators works correctly.
+
+    Interaction of priorities and custom `__lt__()`.
+    """
     from jace.translator.util.subtranslator_helper_order import  sort_subtranslators
 
     class SimpleSubTrans1(jtrans.JaCeSubTranslatorInterface):
@@ -121,6 +127,92 @@ def __init__(self, *args, **kwargs):
 # end def: test_subtranslatior_order_custom1
 
 
+
+def test_subtranslatior_managing():
+    """Esnsures the functionality of the subtranslator managing.
+    """
+    from jace.translator.sub_translators import  _get_subtranslators_cls, add_subtranslator, rm_subtranslator
+
+    class ValidSubTrans(jtrans.JaCeSubTranslatorInterface):
+        def __init__(self, *args, **kwargs):
+            super().__init__(*args, **kwargs)
+    #
+
+    class InvalidSubTrans(object):
+        def __init__(self):
+            ...
+        def get_handled_primitives(self) -> Collection[str] | str:
+            return "add"
+        def can_translate_jaxeqn(self, *args: Any, **kwargs: Any):
+            return False
+        def translate_jaxeqn(self, *args: Any, **kwargs: Any):
+            raise NotImplementedError()
+        def get_priority(self) -> int:
+            return 0
+        def has_default_priority(self) -> bool:
+            return False
+        def __lt__(self, other: Any) -> bool:
+            return NotImplemented
+        def __eq__(self, other: Any) -> bool:
+            return id(self) == id(other)
+        def __hash__(self) -> int:
+            return id(self)
+        def __ne__(self, other: Any) -> bool:
+            return NotImplemented
+        def __le__(self, other: Any) -> bool:
+            return NotImplemented
+        def __ge__(self, other: Any) -> bool:
+            return NotImplemented
+        def __gt__(self, other: Any) -> bool:
+            return NotImplemented
+    #
+
+    # Thest the initial conditions
+    init_sub_trans_list = _get_subtranslators_cls(builtins=False)
+    init_built_in = _get_subtranslators_cls(with_external=False)
+    assert len(init_sub_trans_list) == 0, f"Expected no external subtranslators but found: {init_sub_trans_list}"
+
+    # Now we add the valid subtranslator interface
+    assert add_subtranslator(ValidSubTrans), f"Failed to add the `ValidSubTrans`"
+    first_sub_trans = _get_subtranslators_cls(builtins=False)
+
+
+
+
+
+    # Should not include the 
+    subTrans = _get_subtranslators_cls(with_external=False)
+
+
+
+
+
+
+    assert not add_subtranslator(ValidSubTrans), f"Could add `ValidSubTrans` twice"
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+# end def: test_subtranslatior_order_simple
+
+
+
+
+
+
 if "__main__" == __name__:
     test_subtranslatior_order_simple()
     test_subtranslatior_order_custom1()

From 16f9adf7670c8152e498ac163e58144419de75e6 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 09:51:49 +0200
Subject: [PATCH 010/458] Some changes.

---
 src/jace/translator/jaxpr_translator_driver.py        | 4 +---
 src/jace/translator/sub_translators/alu_translator.py | 6 ++----
 2 files changed, 3 insertions(+), 7 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 0f9c5ab..d7e9cdd 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -597,9 +597,7 @@ def _add_array(
                 )
             alt_name = jutil.get_jax_var_name(arg)
         if name_prefix is not None:
-            assert isinstance(name_prefix, str) and (
-                len(name_prefix) > 0
-            ), f"Invalid 'name_prefix': '{name_prefix}'."
+            assert isinstance(name_prefix, str) and (len(name_prefix) > 0)
             if alt_name is not None:
                 raise ValueError("Specified 'name_prefix' and 'alt_name' which is not possible.")
 
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index 3b62d43..5594497 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -153,13 +153,11 @@ def translate_jaxeqn(
         inp_scalars = [len(Inp.aval.shape) == 0 for i, Inp in enumerate(eqn.invars)]
         has_scalars_as_inputs = any(inp_scalars)
         only_scalars_as_inputs = all(inp_scalars)
-        has_some_literals = any([x is None for x in in_var_names])
-        only_literals_as_inputs = all([x is None for x in in_var_names])
+        has_some_literals = any(x is None for x in in_var_names)
+        only_literals_as_inputs = all(x is None for x in in_var_names)
         inps_same_shape = all(
-            [
                 eqn.invars[0].aval.shape == eqn.invars[i].aval.shape
                 for i in range(1, len(eqn.invars))
-            ]
         )
 
         # We will now look which dimensions have to be broadcasted on which operator.

From d2bb87bc690a5f02e2e8038c57315c3bca29f1ee Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 09:59:04 +0200
Subject: [PATCH 011/458] Fixed an issue.

---
 .../jace_subtranslator_interface.py           |  2 +-
 .../translator/jaxpr_translator_driver.py     | 23 +++++++++----------
 .../sub_translators/alu_translator.py         |  3 +--
 src/jace/util/traits.py                       |  9 ++------
 4 files changed, 15 insertions(+), 22 deletions(-)

diff --git a/src/jace/translator/jace_subtranslator_interface.py b/src/jace/translator/jace_subtranslator_interface.py
index 3d6f53b..cf9420c 100644
--- a/src/jace/translator/jace_subtranslator_interface.py
+++ b/src/jace/translator/jace_subtranslator_interface.py
@@ -57,7 +57,7 @@ def __init__(
         self,
         *args,
         **kwargs,
-    ):
+    ) -> None:
         """Initialize the interface.
 
         It is required that subclasses calls this method during initialization.
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index d7e9cdd..c3c266f 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -389,15 +389,14 @@ def is_allocated(self) -> bool:
         small_ctx: Sequence[Any] = [
             getattr(self, x) for x in self.__shared_slots__ if x != "_reserved_names"
         ]
-        if all((x is None) for x in small_ctx):
+        if all((x is not None) for x in small_ctx):
             if self._reserved_names is None:
                 raise RuntimeError(
                     "Invalid allocation state: All context variables except the reserved name list are allocated."
                 )
             return True
-        elif all((x is not None) for x in small_ctx):
+        elif all((x is None) for x in small_ctx):
             return False
-
         raise RuntimeError("Invalid allocation state: Translation context is mixed allocated.")
 
     def is_head_translator(self) -> bool:
@@ -416,7 +415,7 @@ def same_family(
         They belong to the same family if they descend from the same head translator.
         """
         if not isinstance(other, JaxprTranslationDriver):
-            return NotImplemented
+            return NotImplemented  # type: ignore[unreachable]
         if all(getattr(self, x) is getattr(self, x) for x in self.__shared_slots__):
             assert (self if (self._rev_idx < other._rev_idx) else other).is_allocated()
             return True
@@ -597,7 +596,8 @@ def _add_array(
                 )
             alt_name = jutil.get_jax_var_name(arg)
         if name_prefix is not None:
-            assert isinstance(name_prefix, str) and (len(name_prefix) > 0)
+            assert isinstance(name_prefix, str)
+            assert len(name_prefix) > 0
             if alt_name is not None:
                 raise ValueError("Specified 'name_prefix' and 'alt_name' which is not possible.")
 
@@ -879,12 +879,10 @@ def _allocate_translation_ctx(
         # Handle the `reserved_names` argument as described above.
         #  This is essentially needed that children works properly.
         if self._reserved_names is None:
-            self._reserved_names = set()
-        elif isinstance(self._reserved_names, set):
-            assert not self.is_head_translator()
-            assert all(isinstance(x, str) for x in self._reserved_names)
+            self._reserved_names = set()  # type: ignore[unreachable]
         else:
             raise RuntimeError("The reserved names are allocated incorrectly.")
+        assert all(isinstance(x, str) for x in self._reserved_names)  # type: ignore[unreachable]
         self._add_reserved_names(reserved_names)
 
         return self
@@ -900,7 +898,7 @@ def _init_sub_translators(
         """
         if isinstance(self._sub_translators, dict):
             raise RuntimeError("Tried to allocate the internal subtranslators twice.")
-        assert self._sub_translators is None
+        assert self._sub_translators is None  # type: ignore[unreachable]
 
         # We might get arguments that starts with an underscore, which are not meant for the subtranslators.
         kwargs = {k: v for k, v in kwargs.items() if not k.startswith("_")}
@@ -1020,7 +1018,8 @@ def _translate_single_eqn(
             While `jaxpr` must be the closed version, `eqn` must come from the unclosed version.
             The function will also perform some consistency checking.
         """
-        assert isinstance(eqn, jcore.JaxprEqn) and isinstance(jaxpr, jcore.ClosedJaxpr)
+        assert isinstance(eqn, jcore.JaxprEqn)
+        assert isinstance(jaxpr, jcore.ClosedJaxpr)
 
         if len(eqn.effects) != 0:
             raise NotImplementedError(f"Equation '{eqn}' had side effects.")
@@ -1191,7 +1190,7 @@ def _handle_null_jaxpr(
                 self.map_jax_var_to_sdfg(jax_out_var) for jax_out_var in jaxpr.jaxpr.outvars
             )
             raise NotImplementedError("Please test me.")
-            return self
+            return self  # type: ignore[unreachable] # reminder
         #
         assert self._term_sdfg_state is self._init_sdfg_state
         assert len(self._sdfg_in_names) > 0
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index 5594497..c088fa9 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -156,8 +156,7 @@ def translate_jaxeqn(
         has_some_literals = any(x is None for x in in_var_names)
         only_literals_as_inputs = all(x is None for x in in_var_names)
         inps_same_shape = all(
-                eqn.invars[0].aval.shape == eqn.invars[i].aval.shape
-                for i in range(1, len(eqn.invars))
+            eqn.invars[0].aval.shape == eqn.invars[i].aval.shape for i in range(1, len(eqn.invars))
         )
 
         # We will now look which dimensions have to be broadcasted on which operator.
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index ccdf19a..9d87803 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -25,21 +25,16 @@ def is_str(
     """
     if len(args) == 0:
         return False
-
     elif allow_empty:
         for x in args:
             if not isinstance(x, str):
                 return False  # Not a string
-        # end for(x):
     else:
         for x in args:
             if not isinstance(x, str):
-                return False  # Not a string
+                return False
             if len(x) == 0:
-                return False  # A string but empty; and check enabled
-        # end for(x):
-    # end if:
-
+                return False
     return True
 
 
From 5cf76fa51519d3588c70a5eed5fcfcbeda18bbb3 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 11:26:24 +0200
Subject: [PATCH 012/458] Fixed some stuff.

---
 src/jace/py.typed                              |  0
 src/jace/translator/__init__.py                |  4 ++--
 src/jace/translator/jaxpr_translator_driver.py |  6 +++---
 src/jace/translator/util/__init__.py           | 15 +++++++++++----
 4 files changed, 16 insertions(+), 9 deletions(-)
 create mode 100644 src/jace/py.typed

diff --git a/src/jace/py.typed b/src/jace/py.typed
new file mode 100644
index 0000000..e69de29
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 899d973..71b567b 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -9,8 +9,8 @@
 
 from __future__ import annotations
 
-from jace.translator.jace_subtranslator_interface import JaCeSubTranslatorInterface
-from jace.translator.jaxpr_translator_driver import JaxprTranslationDriver
+from .jace_subtranslator_interface import JaCeSubTranslatorInterface
+from .jaxpr_translator_driver import JaxprTranslationDriver
 
 
 __all__ = [
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index c3c266f..95fbe49 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -395,7 +395,7 @@ def is_allocated(self) -> bool:
                     "Invalid allocation state: All context variables except the reserved name list are allocated."
                 )
             return True
-        elif all((x is None) for x in small_ctx):
+        if all((x is None) for x in small_ctx):
             return False
         raise RuntimeError("Invalid allocation state: Translation context is mixed allocated.")
 
@@ -481,7 +481,7 @@ def _add_jax_name_mapping(
             raise KeyError(
                 f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but '{sdfg_name}' is not a known SDFG variable."
             )
-        elif sdfg_name in self._forbidden_names:
+        if sdfg_name in self._forbidden_names:
             raise NameError(  # This is actually an internal error
                 f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but '{sdfg_name}' is forbidden."
             )
@@ -498,7 +498,7 @@ def _add_reserved_names(
 
         if reserved_names is None:
             return self
-        elif isinstance(reserved_names, str):
+        if isinstance(reserved_names, str):
             reserved_names = [reserved_names]
         elif isinstance(reserved_names, Collection):
             pass
diff --git a/src/jace/translator/util/__init__.py b/src/jace/translator/util/__init__.py
index 7410138..910589e 100644
--- a/src/jace/translator/util/__init__.py
+++ b/src/jace/translator/util/__init__.py
@@ -9,7 +9,14 @@
 
 from __future__ import annotations
 
-from .jace_translation_memento import JaCeTranslationMemento  # noqa: F401 # Unused import
-from .revision_counter import RevisionCounterManager  # noqa: F401 # Unused import
-from .subtranslator_helper_order import sort_subtranslators  # noqa: F401 # Unused import
-from .util import list_to_dict  # noqa: F401 # Unused import
+from .jace_translation_memento import JaCeTranslationMemento
+from .revision_counter import RevisionCounterManager
+from .util import list_to_dict
+
+
+# Q: Is there a way to import everything from `.util` and put it into `__all__` without writing it manually?
+__all__ = [
+    "JaCeTranslationMemento",
+    "RevisionCounterManager",
+    "list_to_dict",
+]

From d80be3b404bc4b9856468595dbadf2878fdbdea1 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 11:33:39 +0200
Subject: [PATCH 013/458] Made some modification.

---
 .../translator/sub_translators/alu_translator.py   |  4 ++--
 .../translator/util/jace_translation_memento.py    |  8 ++------
 .../translator/util/subtranslator_helper_order.py  | 14 ++++++--------
 src/jace/util/traits.py                            |  2 +-
 4 files changed, 11 insertions(+), 17 deletions(-)

diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index c088fa9..c8997a8 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -241,9 +241,9 @@ def translate_jaxeqn(
                 # Literal: No input needed.
                 tskl_inputs.append((None, None))
                 continue
-            elif inp_scalars[i]:
+            if inp_scalars[i]:
                 # We have a scalar argument.
-                i_memlet: dace.Memlet = dace.Memlet.from_array(
+                i_memlet = dace.Memlet.from_array(
                     in_var_names[i], driver.get_sdfg().arrays[in_var_names[i]]
                 )
             else:
diff --git a/src/jace/translator/util/jace_translation_memento.py b/src/jace/translator/util/jace_translation_memento.py
index 1f267e7..93d11af 100644
--- a/src/jace/translator/util/jace_translation_memento.py
+++ b/src/jace/translator/util/jace_translation_memento.py
@@ -65,13 +65,9 @@ def __eq__(self, other: Any) -> bool:
         """Compares the underlying SDFG object with 'rhs'."""
         if isinstance(other, JaCeTranslationMemento):
             return bool(self.sdfg == other.sdfg)
-        elif hasattr(other, "__sdfg__"):
+        if hasattr(other, "__sdfg__"):
             other = other.__sdfg__()
-        elif isinstance(other, dace.SDFG):
-            pass
-        else:
+        elif not isinstance(other, dace.SDFG):
             return NotImplemented
-        #
-
         x: bool = self.sdfg.__eq__(other)
         return x
diff --git a/src/jace/translator/util/subtranslator_helper_order.py b/src/jace/translator/util/subtranslator_helper_order.py
index 4be8604..e90697b 100644
--- a/src/jace/translator/util/subtranslator_helper_order.py
+++ b/src/jace/translator/util/subtranslator_helper_order.py
@@ -57,24 +57,22 @@ def __lt__(
         # Default priority means that it will always go to the end.
         if self._sub.has_default_priority():
             return False  # 'self' has default priority, so it must go to the end.
-        elif other._sub.has_default_priority():
+        if other._sub.has_default_priority():
             return True  # 'self' does not have default prio, thus it _must_ go before 'other'.
-        # Get the priorities of the subtranslators.
-        prio_self = self._sub.get_priority()
+        prio_self = self._sub.get_priority()  # Get the priorities of the subtranslators.
         prio_other = other._sub.get_priority()
         if all(prio is NotImplemented for prio in (prio_self, prio_other)):
-            # Both does not have an explicit priority, thus 'self' should decide if it should go first.
+            # None has a prio, 'self' should decide if it should go first.
             x = self._sub.__lt__(other._sub)
             assert isinstance(x, bool)
             return x
-        # In case only one has a priority, we change the order such that the one that implements a custom '__lt__()' goes first.
-        #  This is consistent with the description of the interface telling that such translators are biased towards lower priorities.
+        # In case only one has a priority, we change the order such that the one that implements
+        #  a '__lt__()' goes first.
         if prio_self is NotImplemented:
             assert isinstance(prio_other, int)
             return True
-        elif prio_other is NotImplemented:
+        if prio_other is NotImplemented:
             assert isinstance(prio_self, int)
             return False
-        # Both have a priority
         assert all(isinstance(prio, int) for prio in (prio_other, prio_self))
         return prio_self < prio_other
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 9d87803..822861c 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -25,7 +25,7 @@ def is_str(
     """
     if len(args) == 0:
         return False
-    elif allow_empty:
+    if allow_empty:
         for x in args:
             if not isinstance(x, str):
                 return False  # Not a string

From c8be5da03f64e49092345e183e81353f2380466d Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Fri, 19 Apr 2024 09:34:35 +0200
Subject: [PATCH 014/458] chore: fine tune linting settings

---
 pyproject.toml | 17 ++++++++++-------
 1 file changed, 10 insertions(+), 7 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index 7e1025c..4d551f1 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -100,22 +100,24 @@ extend-select = [
   "G",  # flake8-logging-format
   "C4",  # flake8-comprehensions
   "PT",  # flake8-pytest-style
-  "UP",  # pyupgrade  # TODO: evaluate and remove if needed
+  "UP",  # pyupgrade       # TODO: in evaluation
   "ARG",  # flake8-unused-arguments
   "ERA",  # eradicate
   "ICN",  # flake8-import-conventions
   "PGH",  # pygrep-hooks
   "PIE",  # flake8-pie
   "PTH",  # flake8-use-pathlib
-  "RET",  # flake8-return  # TODO: evaluate and remove if needed
+  "RET",  # flake8-return   # TODO: in evaluation
   "RUF",  # Ruff-specific
-  "SIM",  # flake8-simplify  # TODO: evaluate and remove if needed
+  "SIM",  # flake8-simplify # TODO: in evaluation
   "T10",  # flake8-debugger
-  "T20",  # flake8-print  # TODO: evaluate and remove if needed
+  "T20",  # flake8-print    # TODO: in evaluation
   "NPY"  # NumPy specific rules
 ]
 ignore = [
-  'E501'  # [line-too-long]
+  'B905',  # [zip-without-explicit-strict]
+  'E501',  # [line-too-long]
+  'UP038'  # [non-pep604-isinstance]
 ]
 ignore-init-module-imports = true
 unfixable = []
@@ -144,5 +146,6 @@ section-order = [
 ]
 
 [tool.ruff.lint.per-file-ignores]
-"noxfile.py" = ["T20"]
-"tests/**" = ["T10", "T20"]
+"!tests/**.py" = ["PT"]  # Ignore `flake8-pytest-style` everywhere except in `tests/`
+"noxfile.py" = ["T20"]  # Ignore `flake8-print`
+"tests/**" = ["T10", "T20"]  # Ignore `flake8-debugger` and `flake8-print`

From 10b3e6c6debf46a459b4258c9a4491b356edefdd Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Fri, 19 Apr 2024 10:04:41 +0200
Subject: [PATCH 015/458] docs: update coding guidelines

---
 CODING_GUIDELINES.md | 18 ++++++++++++++++--
 1 file changed, 16 insertions(+), 2 deletions(-)

diff --git a/CODING_GUIDELINES.md b/CODING_GUIDELINES.md
index fafa314..c7c5d3c 100644
--- a/CODING_GUIDELINES.md
+++ b/CODING_GUIDELINES.md
@@ -9,6 +9,21 @@ We deviate from the [Google Python Style Guide][google-style-guide] only in the
 - We use [`ruff-linter`][ruff-linter] instead of [`pylint`][pylint].
 - We use [`ruff-formatter`][ruff-formatter] for source code and imports formatting, which may work differently than indicated by the guidelines in section [_3. Python Style Rules_](https://google.github.io/styleguide/pyguide.html#3-python-style-rules). For example, maximum line length is set to 100 instead of 79 (although docstring lines should still be limited to 79).
 - According to subsection [_2.19 Power Features_](https://google.github.io/styleguide/pyguide.html#219-power-features), direct use of _power features_ (e.g. custom metaclasses, import hacks, reflection) should be avoided, but standard library classes that internally use these power features are accepted. Following the same spirit, we allow the use of power features in infrastructure code with similar functionality and scope as the Python standard library.
+- For readability purposes, when a docstring contains more than the required summary line, we prefer indenting the first line at the same cursor position as the first opening quote, although this is not explicitly considered in the doctring conventions described in subsection [_3.8.1 Docstrings_](https://google.github.io/styleguide/pyguide.html#381-docstrings). Example:
+
+  ```python
+  # single line docstring
+  """A one-line summary of the module or program, terminated by a period."""
+
+  # multi-line docstring
+  """
+  A one-line summary of the module or program, terminated by a period.
+
+  Leave one blank line. The rest of this docstring should contain an
+  overall description of the module or program.
+  """
+  ```
+
 - According to subsection [_3.19.12 Imports For Typing_](https://google.github.io/styleguide/pyguide.html#31912-imports-for-typing), symbols from `typing` and `collections.abc` modules used in type annotations _"can be imported directly to keep common annotations concise and match standard typing practices"_. Following the same spirit, we allow symbols to be imported directly from third-party or internal modules when they only contain a collection of frequently used typying definitions.
 
 ### Common questions
@@ -71,7 +86,7 @@ The terseness vs. helpfulness tradeoff should be more in favor of terseness for
 
 ### Docstrings
 
-TODO: update to autodoc2
+TODO: update to `autodoc2`
 
 We generate the API documentation automatically from the docstrings using [Sphinx][sphinx] and some extensions such as [Sphinx-autodoc][sphinx-autodoc] and [Sphinx-napoleon][sphinx-napoleon]. These follow the Google Python Style Guide docstring conventions to automatically format the generated documentation. A complete overview can be found here: [Example Google Style Python Docstrings](https://sphinxcontrib-napoleon.readthedocs.io/en/latest/example_google.html#example-google).
 
@@ -140,4 +155,3 @@ Testing components is a critical part of a software development project. We foll
 [sphinx-autodoc]: https://www.sphinx-doc.org/en/master/usage/extensions/autodoc.html
 [sphinx-napoleon]: https://sphinxcontrib-napoleon.readthedocs.io/en/latest/index.html#
 [sphinx-rest]: https://www.sphinx-doc.org/en/master/usage/restructuredtext/basics.html
-[ci-docs]: docs/development/CI/infrastructure.md

From 94dd0e4f28eb42ca4699cc1b3d9832c6cada5810 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 11:37:42 +0200
Subject: [PATCH 016/458] Made some more changes.

---
 ..._order.py => test_subtranslator_helper.py} | 83 +++++++++++--------
 1 file changed, 47 insertions(+), 36 deletions(-)
 rename tests/{test_subtranslator_helper_order.py => test_subtranslator_helper.py} (70%)

diff --git a/tests/test_subtranslator_helper_order.py b/tests/test_subtranslator_helper.py
similarity index 70%
rename from tests/test_subtranslator_helper_order.py
rename to tests/test_subtranslator_helper.py
index ed35cc6..4da5d8f 100644
--- a/tests/test_subtranslator_helper_order.py
+++ b/tests/test_subtranslator_helper.py
@@ -1,43 +1,49 @@
-"""Implements tests to check if the sorting algorithm is correct.
-"""
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
 
-from typing                     import Collection, Sequence, Union
+"""Implements tests to check if the sorting algorithm is correct."""
 
-import jace
-from jace   import translator as jtrans
+from __future__ import annotations
+
+from jace import translator as jtrans
 
 
 def test_subtranslatior_order_simple():
-    """This test is to ensure that `sortSubtranslators()` works correctly.
-    """
-    from jace.translator.util.subtranslator_helper_order import  sort_subtranslators
+    """This test is to ensure that `sortSubtranslators()` works correctly."""
+    from jace.translator.util.subtranslator_helper_order import sort_subtranslators
 
     class SimpleSubTrans1(jtrans.JaCeSubTranslatorInterface):
         _EXP_ORDER = 0
+
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
+
         def get_priority(self):
             return 1
-    # end class(SimpleSubTrans1):
 
     class SimpleSubTrans2(jtrans.JaCeSubTranslatorInterface):
         _EXP_ORDER = 1  # Not last because, default prio is always last.
+
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
+
         def get_priority(self):
             return jtrans.JaCeSubTranslatorInterface.DEFAULT_PRIORITY + 1
-    # end class(SimpleSubTrans2):
 
     class SimpleSubTrans3(jtrans.JaCeSubTranslatorInterface):
         _EXP_ORDER = 2
+
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
-    # end class(SimpleSubTrans3):
 
     initial_order = [
-            SimpleSubTrans3(),
-            SimpleSubTrans2(),
-            SimpleSubTrans1(),
+        SimpleSubTrans3(),
+        SimpleSubTrans2(),
+        SimpleSubTrans1(),
     ]
 
     # Now call the function.
@@ -46,67 +52,75 @@ def __init__(self, *args, **kwargs):
     # Now we bring the list in expected order.
     expected_order = sorted(initial_order, key=lambda st: st._EXP_ORDER)
 
-    assert all(ist is soll  for ist, soll in zip(sorted_translators, expected_order)), \
-            f"Expected order was `{[type(x).__name__  for x in expected_order]}`, but got `{[type(x).__name__  for x in sorted_translators]}`."
+    assert all(
+        got_ord is exp_ord
+        for got_ord, exp_ord in zip(sorted_translators, expected_order, strict=False)
+    ), f"Expected order was `{[type(x).__name__  for x in expected_order]}`, but got `{[type(x).__name__  for x in sorted_translators]}`."
     return True
-# end def: test_subtranslatior_order_simple
 
 
 def test_subtranslatior_order_custom1():
-    from jace.translator.util.subtranslator_helper_order import  sort_subtranslators
+    from jace.translator.util.subtranslator_helper_order import sort_subtranslators
 
     class SimpleSubTrans1(jtrans.JaCeSubTranslatorInterface):
         _EXP_ORDER = 0
+
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
+
         def get_priority(self):
             return NotImplemented
+
         def __lt__(self, other):
             return isinstance(other, SimpleSubTrans2)
-    # end class(SimpleSubTrans1):
 
     class SimpleSubTrans2(jtrans.JaCeSubTranslatorInterface):
         _EXP_ORDER = 1
+
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
+
         def get_priority(self):
             return NotImplemented
+
         def __lt__(self, other):
             return True
-    # end class(SimpleSubTrans2):
 
     class SimpleSubTrans3(jtrans.JaCeSubTranslatorInterface):
         _EXP_ORDER = 2
+
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
+
         def get_priority(self):
             return NotImplemented
+
         def __lt__(self, other):
             return False
-    # end class(SimpleSubTrans3):
 
     class SimpleSubTrans4(jtrans.JaCeSubTranslatorInterface):
         _EXP_ORDER = 3
+
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
+
         def get_priority(self):
             return jtrans.JaCeSubTranslatorInterface.DEFAULT_PRIORITY + 1
-    # end class(SimpleSubTrans4):
 
     class SimpleSubTrans5(jtrans.JaCeSubTranslatorInterface):
         _EXP_ORDER = 4
+
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
-    # end class(SimpleSubTrans5):
 
     assert SimpleSubTrans2() < SimpleSubTrans1()
 
     initial_order = [
-            SimpleSubTrans5(),
-            SimpleSubTrans4(),
-            SimpleSubTrans3(),
-            SimpleSubTrans2(),
-            SimpleSubTrans1(),
+        SimpleSubTrans5(),
+        SimpleSubTrans4(),
+        SimpleSubTrans3(),
+        SimpleSubTrans2(),
+        SimpleSubTrans1(),
     ]
 
     # Now call the function.
@@ -115,16 +129,13 @@ def __init__(self, *args, **kwargs):
     # Now we bring the list in expected order.
     expected_order = sorted(initial_order, key=lambda st: st._EXP_ORDER)
 
-    assert all(ist is soll  for ist, soll in zip(sorted_translators, expected_order)), \
-            f"Expected order was `{[type(x).__name__  for x in expected_order]}`, but got `{[type(x).__name__  for x in sorted_translators]}`."
+    assert all(
+        got_ord is exp_ord
+        for got_ord, exp_ord in zip(sorted_translators, expected_order, strict=False)
+    ), f"Expected order was `{[type(x).__name__  for x in expected_order]}`, but got `{[type(x).__name__  for x in sorted_translators]}`."
     return True
-# end def: test_subtranslatior_order_custom1
 
 
-if "__main__" == __name__:
+if __name__ == "__main__":
     test_subtranslatior_order_simple()
     test_subtranslatior_order_custom1()
-# end(main):
-
-
-

From c03737397547a2f4d68666fc2f1b17df2c11915e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 12:38:01 +0200
Subject: [PATCH 017/458] Removed an old file.

---
 src/jace/util/jax.py | 3 ---
 1 file changed, 3 deletions(-)

diff --git a/src/jace/util/jax.py b/src/jace/util/jax.py
index bc80b2c..4379a8a 100644
--- a/src/jace/util/jax.py
+++ b/src/jace/util/jax.py
@@ -41,6 +41,3 @@ def get_jax_var_name(jax_var: jcore.Atom | str) -> str:
             f"Failed to translate the Jax variable '{jax_var}' into a name, the result was empty."
         )
     return jax_var
-
-
-# NEW LINE

From 081bb15113853bba388b2d6d43cd611c1f04d09a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 12:59:15 +0200
Subject: [PATCH 018/458] Removed some functionality that is no longer used.

---
 src/jace/util/__init__.py |  3 --
 src/jace/util/traits.py   | 62 ---------------------------------------
 src/jace/util/util.py     | 16 ++--------
 3 files changed, 3 insertions(+), 78 deletions(-)
 delete mode 100644 src/jace/util/traits.py

diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index fcd0380..80de0e3 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -10,13 +10,10 @@
 from __future__ import annotations
 
 from .jax import get_jax_var_name
-from .traits import is_iterable, is_str
 from .util import ensure_iterability
 
 
 __all__ = [
     "get_jax_var_name",
-    "is_str",
-    "is_iterable",
     "ensure_iterability",
 ]
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
deleted file mode 100644
index 822861c..0000000
--- a/src/jace/util/traits.py
+++ /dev/null
@@ -1,62 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Common functionality to identify types of objects."""
-
-from __future__ import annotations
-
-from collections.abc import Sequence
-from typing import Any
-
-
-def is_str(
-    *args: Sequence[Any],
-    allow_empty: bool = True,
-) -> bool:
-    """Tests if its arguments are strings.
-
-    By default empty strings are also considered as strings.
-    However, by setting 'allow_empty' to 'False' the function will consider them not as string.
-    In case no arguments were passed to the function 'False' will be returned.
-    """
-    if len(args) == 0:
-        return False
-    if allow_empty:
-        for x in args:
-            if not isinstance(x, str):
-                return False  # Not a string
-    else:
-        for x in args:
-            if not isinstance(x, str):
-                return False
-            if len(x) == 0:
-                return False
-    return True
-
-
-def is_iterable(
-    x: Any,
-    ign_str: bool = True,
-) -> bool:
-    """Test if 'x' is iterable, with an exception for strings.
-
-    By default this function considers strings as not iterable.
-    The idea is that a string is in most cases not a collection of individual characters, but should be seen as a whole.
-    However, by setting 'ign_str' to 'False' a string is also considered as an iterable.
-
-    Args:
-        x:          The object to check.
-        ign_str:     Ignore strings, defaults to 'True'.
-    """
-    from collections.abc import Iterable
-
-    # We do not consider strings as iterable.
-    if ign_str and is_str(x):
-        return False
-
-    # Based on: https://stackoverflow.com/questions/1952464/in-python-how-do-i-determine-if-an-object-is-iterable/61139278
-    return isinstance(x, Iterable)
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index e1ae14a..407a153 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -13,28 +13,18 @@
 
 def ensure_iterability(
     x: Any,
-    dcyp: bool = False,
-    scyp: bool = False,
     ign_str: bool = True,
 ) -> Iterable[Any]:
     """Ensures that 'x' is iterable.
 
-    By default a string is _not_ considered as a sequence of chars but as one object.
+    By default strings are _not_ considered iterable.
 
     Args:
         x:          To test.
-        dcyp:       Perform a deep copy on the reurned object, takes precedence.
-        scyp:       Perform a shallow copy on the returned object.
         ign_str:    Ignore that a string is iterabile.
     """
-    import copy
-
     if ign_str and isinstance(x, str):
-        x = [x]  # Turn a string into an interable
+        x = [x]
     elif isinstance(x, Iterable):
-        pass  # Already an iterable
-    if dcyp:
-        x = copy.deepcopy(x)
-    elif scyp:
-        x = copy.copy(x)
+        pass
     return x

From 7fbe79ac98ce455e4e075be47bb2e8ea2bd182ea Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 19 Apr 2024 16:29:11 +0200
Subject: [PATCH 019/458] Continued to make a test.

---
 .../jace_subtranslator_interface.py           | 130 ++---
 .../translator/jaxpr_translator_driver.py     | 478 +++++++++---------
 .../translator/sub_translators/__init__.py    |   3 +-
 tests/test_subtranslator_helper.py            |   8 +-
 4 files changed, 299 insertions(+), 320 deletions(-)

diff --git a/src/jace/translator/jace_subtranslator_interface.py b/src/jace/translator/jace_subtranslator_interface.py
index cf9420c..9d7d992 100644
--- a/src/jace/translator/jace_subtranslator_interface.py
+++ b/src/jace/translator/jace_subtranslator_interface.py
@@ -19,33 +19,39 @@
 
 
 class JaCeSubTranslatorInterface:
-    """Interface for all Jax primitive/intrinsic translators.
+    """Interface for all Jax primitive/intrinsic subtranslators.
 
     A translator for a primitive, sometimes also called intrinsic, translates a single equation of a Jaxpr into its SDFG equivalent.
-
     A type that implements this interface must fulfil the following properties:
     - It must be stateless.
         It is still possible and explicitly allowed to have an immutable configuration state.
-    - All subclasses has to accept '**kwargs' arguments and must forward all unconsumed arguments to the base.
-        Thus the '__init__()' function of the base must be called.
+    - All subclasses has to accept `**kwargs` arguments and must forward all unconsumed arguments to the base.
 
-    Once a subtranslator is initialized the driver will call its 'get_handled_primitives()' function, which returns the names of all Jax primitives it would like to handle.
-    A subtranslator can register for as many primitive it wants.
-    At the same time more than one subtranslators can be registered for a single primitive.
+    Subtranslators are rather simple objects that only have to perform the translation.
+    The translation process itself is managed by a driver object, which owns and manage the subtranslators.
+    In the end this implements the delegation pattern.
 
-    To decide which subtranslator should be used for a single equation the driver will use their 'can_translate_jaxeqn()' function.
-    The first subtranslator that returns 'True' will then be used.
-    Note it is unspecific if the 'can_translate_jaxeqn()' of the remaining subtranslators is also called.
+    A subtranslator uses its `get_handled_primitives()` function to indicate for which Jax primitives it want to register.
+    It is important that a subtranslator can register for as many primitive it wants.
+    At the same time, it is possible that multiple subtranslators have registered for a single primitive.
 
-    There are two ways how to influence the order in which they are processed.
-    The first and simple one is to implement 'get_priority()'.
-    The driver will order the subtranslators, in ascending order, according to their respective priority.
-    Thus the lower the priority the earlier the subtranslator is checked.
-    Subtranslators that returns 'JaCeSubTranslatorInterface.DEFAULT_PRIORITY' are handled specially and are _always_ put at the end of the list (in unspecific order).
+    If multiple subtranslator have registered for the same primitive they will be ordered by driver.
+    There are two ways how a subtranslator can influence this order.
+    The first one is by implementing `get_priority()`, the driver will then put them in ascending order.
+    I.e. the lower its priority the earlier a subtranslator is checked.
+    Subtranslators that returns the special value `JaCeSubTranslatorInterface.DEFAULT_PRIORITY` are handled specially.
+    Such subtranslators are _always_ put at the end of the list (in unspecific order).
 
     The second possibility is to override the '__lt__()' and '__eq__()' functions.
     While this allows more control it might be more difficult.
-    If a subtranslator does this, its 'get_priority()' function should return 'NotImplemented'.
+    If a subtranslator overrides this functions then it should also override `get_priority()` to return `NotImplemented`.
+
+    To decide which subtranslator should be used for a single equation the driver will use their 'can_translate_jaxeqn()' function.
+    The first subtranslator that returns 'True' will then be used.
+
+    Todo:
+        Come up with a better way of ordering; maybe introduce fixed priority level.
+            And then allows to sort them according to `__lt__()` within the level.
     """
 
     __slots__ = ()
@@ -55,8 +61,8 @@ class JaCeSubTranslatorInterface:
 
     def __init__(
         self,
-        *args,
-        **kwargs,
+        *args: Any,
+        **kwargs: Any,
     ) -> None:
         """Initialize the interface.
 
@@ -64,13 +70,13 @@ def __init__(
         """
 
     def get_handled_primitives(self) -> Collection[str] | str:
-        """Returns the names of all Jax primitives that can be handled by this subtranslator.
+        """Returns the names of all Jax primitives that this subtranslator can handle.
 
-        The returned collection is used to narrow down which translator should be used to translate a given primitive.
+        There is no limit on the number of primitives for which a subtranslator can register.
         It is possible that several translators can be registered for the same name.
 
         See Also:
-            'self.can_translate_jaxeqn()' and 'self.get_priority()'.
+            `self.can_translate_jaxeqn()` and `self.get_priority()`.
 
         Notes:
             It is also possible to return a string instead of a collection with just one element.
@@ -86,22 +92,21 @@ def can_translate_jaxeqn(
         out_var_names: Sequence[str],
         eqn: jcore.JaxprEqn,
     ) -> bool:
-        """Tests if 'self' is able to translate the Jax primitive passed as 'eqn'.
+        """Tests if `self` is able to translate the Jax primitive passed as `eqn`.
 
-        This function is used by the driver translator to determine which subtranslator
-        should be used to handle the 'jcore.JaxprEqn', i.e. primitive.
-        For a more detailed description of the arguments see 'self.translate_jaxeqn()' function.
+        This function is used by the driver to determine which of the subtranslators,
+        that have registered for a certain type of primitive, should be used.
+        For a more detailed description of the arguments see `self.translate_jaxeqn()` function.
 
         Args:
             driver:         The driver object of the translation.
             in_var_names:   Names of the SDFG variables used as inputs for the primitive.
             out_var_names:  Names of the SDFG variables used as outputs for the primitive.
-            eqn:            The 'jcore.JaxprEqn' instance that is currently being handled.
+            eqn:            The `jcore.JaxprEqn` instance that is currently being handled.
 
         Notes:
-            This function has to consider 'self' and all of its arguments as constant.
             In case there is only one subtranslator registered for a certain primitive,
-                it is unspecific if this function will be called before 'self.translate_jaxeqn()' is called.
+                it is unspecific if this function will be called at all `self.translate_jaxeqn()`.
             This function will never be called for a primitive for which it has not registered itself.
         """
         raise NotImplementedError(
@@ -118,27 +123,31 @@ def translate_jaxeqn(
     ) -> dace.SDFGState | None:
         """Translates the Jax primitive into its SDFG equivalent.
 
-        Before the driver will call this function to translate the primitive into an SDFG it will perform the following preparatory tasks:
+        Before the driver calls this function it will perform the following preparatory tasks:
         - It will allocate the SDFG variables that are used as outputs.
-            Their names will be passed through the 'out_var_names' argument, in the same order as 'eqn.outvars'.
-        - It will collect the names of the SDFG variables that are used as input and place them in 'in_var_names', in the same order as 'eqn.invars'.
-            If an input argument refers to a literal no SDFG variable is created for it and 'None' is passed to indicate this.
-        - The driver will create a new terminal state and pass it as 'eqn_state' argument.
-            This state is guaranteed to be empty and 'translator.getTerminalState() is eqn_state' holds.
-
-        If 'self' returns 'None' the driver assumes that the whole primitive was constructed inside 'eqn_state', and the terminal state will left unmodified.
-        However, in case 'self' explicitly returns a state, the driver will use it as new terminal state.
+            Their names will be passed through the `out_var_names` argument, in the same order as `eqn.outvars`.
+        - It will collect the names of the SDFG variables that are used as input and place them in `in_var_names`, in the same order as `eqn.invars`.
+            If an input argument refers to a literal no SDFG variable is created for it and `None` is passed to indicate this.
+            It is not allowed to modify the data descriptors these variables refers to in any way, including replacing them.
+        - The driver will create a new terminal state and pass it as `eqn_state` argument.
+            This state is guaranteed to be empty and `translator.getTerminalState() is eqn_state` holds.
+            A subtranslator should construct the data flow graph inside it.
+
+        It is allowed that the subtranslators creates more states if needed, but this state machine has to have a single terminal state.
+        However, state have to be reachable from the passed `eqn_state`.
+        In this case the function must return this state explicitly.
+        If the function returns `None` the driver will assume that subtranslator was able to fully construct the dataflow graph within `eqn_state`.
+
+        While a subtranslator is forbidden from meddling with the input variables, it is allowed to modify the output variables.
+        For example he could create a new SDFG variable, with different strides.
+        But if the SDFG variable has a different name the subtranslator has to update the name mapping of the driver, and write this change into `out_var_names`.
 
         Args:
             driver:         The driver object of the translation.
-            in_var_names:   List of the names of the arrays created inside the SDFG for the inpts or 'None' in case of a literal.
+            in_var_names:   List of the names of the arrays created inside the SDFG for the inpts or `None` in case of a literal.
             out_var_names:  List of the names of the arrays created inside the SDFG for the outputs.
             eqn:            The Jax primitive that should be translated.
-            eqn_state:      State into which the primitive's SDFG representation should be constructed.
-
-        Notes:
-            A subtranslator is free to do anything to the passed 'eqn_state' with the exception of deleting it or modifying any of its _incoming_ interstateedges.
-            As a general rule, if the subtranslator has to create more states it should explicitly return the new terminal state.
+            eqn_state:      State into which the primitive`s SDFG representation should be constructed.
         """
         raise NotImplementedError(
             "Class '{type(self).__name__}' does not implement 'translate_jaxeqn()'."
@@ -147,26 +156,24 @@ def translate_jaxeqn(
     def get_priority(self) -> int:
         """Returns the priority of this translator.
 
-        In case many translators are registered for the same primitive, see 'self.get_handled_primitives()' they must be ordered.
-        The translators are ordered, and checked by the driver according to this value.
+        The value returned by this function is used by the driver to order the subtranslators that have registered for the same primitive.
         The _smaller_ the value the earlier it is checked.
 
         See Also:
-            'self.can_translate_jaxeqn()' and 'self.get_handled_primitives()'.
+            `self.can_translate_jaxeqn()` and `self.get_handled_primitives()`.
 
         Notes:
-            By default the function returns 'self.DEFAULT_PRIORITY', which is handled specially, i.e. it is put at the end.
-            If a subtranslator opts in to overwrite '__lt__()' instead the function should return 'NotImplemented'.
-                Such translators are biased towards lower priorities.
+            By default the function returns `self.DEFAULT_PRIORITY`, which is handled specially, i.e. it is put at the end.
+            If a subtranslator instead overrides `__lt__()` this function should return `NotImplemented`.
         """
         return self.DEFAULT_PRIORITY
 
     def has_default_priority(self) -> bool:
-        """Checks if 'self' has default priority.
+        """Checks if `self` has default priority.
 
         Notes:
             It is allowed, but not advised to override this function.
-                However, it has to be consistent with 'self.get_priority()'.
+                However, it has to be consistent with `self.get_priority()`.
         """
         try:
             x = self.get_priority()
@@ -174,21 +181,20 @@ def has_default_priority(self) -> bool:
             return False
         if x is NotImplemented:
             return False
-        return x is self.DEFAULT_PRIORITY or (x == self.DEFAULT_PRIORITY)
+        return x == self.DEFAULT_PRIORITY
 
     def __lt__(
         self,
         other: JaCeSubTranslatorInterface,
     ) -> bool:
-        """Tests if 'self' should be checked before 'other' in the selection process.
+        """Tests if `self` should be checked before `other` in the selection process.
 
-        As outlined in the class description there are two possibilities to influence the order in which subtranslators are checked.
-        The simpler one is simply to implement 'get_priority()'.
-        The second one, is to override the '__lt__()' function, which allows to inspect the other subtranslators.
+        As outlined in the class description this is the second possibility to influence the order of the subtranslator.
+        This function should return `True` if `self` should be checked for applicability _before_ `other`.
 
         Notes:
-            If you override this function it is advised that 'get_priority()' returns 'NotImplemented'.
-            This function is never called if either 'self' or 'other' have default priority.
+            If this function is overridden `get_priority()` should return `NotImplemented`.
+            This function is never called if either `self` or `other` have default priority.
         """
         return self.get_priority() < other.get_priority()
 
@@ -198,11 +204,11 @@ def __eq__(
     ) -> bool:
         """Tests if two subtranslators are equal.
 
-        The default implementation checks if 'self' and 'other' have the same type.
-        However, it your subtranslator strongly depend on its configuration you should override this function.
+        The default implementation checks if `self` and `other` have the same type.
+        However, if the behaviour of a subtranslator strongly depend on its configuration this function should be overridden.
 
         Notes:
-            If you override this function you should also override 'self.__hash__()' to make the two consistent.
+            If you override this function you should also override `self.__hash__()` to make the two consistent.
         """
         if not isinstance(other, JaCeSubTranslatorInterface):
             return NotImplemented
@@ -215,7 +221,7 @@ def __hash__(self) -> int:
         Thus all instances of a particular subtranslator will have the same hash value.
 
         Notes:
-            If you override this function you should also override 'self.__eq__()' to make the two consistent.
+            If you override this function you should also override `self.__eq__()` to make the two consistent.
         """
         return id(self.__class__)
 
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 001c5ad..97d0b26 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -16,7 +16,7 @@
 from dace import data as ddata, properties as dprop
 from jax import core as jcore
 
-from jace import translator as trans
+from jace import translator as jtrans
 from jace.translator import sub_translators as jtsubt, util as jtrutil
 from jace.util import jax as jutil
 
@@ -24,45 +24,41 @@
 class JaxprTranslationDriver:
     """Internal driver class for creating an SDFG equivalent of a `Jaxpr` instance.
 
-    The idea of the transformation is quite simple.
-    Since Jaxpr is essentially a list consisting of more or less simple instructions, we will process them one after the other.
-    For simplicity we will put each equation in its own state, primitives that needs more states must be put into a nested SDFG.
-
-    This class builds an SDFG of a very particular form, which is not directly usable.
-    But it is used as the canonical form inside JaCe and characterized by:
-    - the SDFG is a list of states, each state corresponds to single Jax primitive,
+    This class builds an SDFG of a very particular form, which for us is canonical, which is not
+    directly usable. Thus this class should not be directly used, instead a user should use TBA.
+    The canonical form is characterized by the following:
+    - the SDFG is a list of states, ideally each state corresponds to single Jax primitive,
     - all variable names are derived from Jax names,
     - there are no global variables inside the SDFG,
     - there is no possibility to return something.
 
-    To support nested Jaxpr expressions the driver provides the possibility to clone/fork itself, see `self.fork()` for more.
-    Clones, i.e. the return values of `self.fork()`, also known as children or clone, have a unique identifier, called revision.
-    It is important that the revision is only unique within a family and during a translation process.
-    This identifier is used to generate unique variable names.
-    The clones form a tree that is rooted at the so called 'head translator', i.e. the driver that was explicitly created.
+    The idea of the translator is extremely simple.
+    Since Jaxpr is a list consisting of more or less simple instructions/equations, they get processed one after the other.
+    Each equation is translated into its own state that is appended to the SDFG, thus the SDFG is a long list of states.
+    In certain cases it might be that an equation needs more states, but this is an exception.
+
+    The actual translation is not handled by the driver instead a so called subtranslator object is used.
+    This subtranslator, is specialized for one type of primitive.
+    For more information on the subtranslators see the documentation of `JaCeSubTranslatorInterface`.
 
-    The actual translation of a Jaxpr equation is not handled by the driver instance directly.
-    Instead it is forwarded to a subtranslator instance, see `JaCeSubTranslatorInterface` for more.
     These subtranslators are independent objects that are owned by the driver.
-    However, they are tightly coupled and thus a subtranslator is allowed to use the following private functions:
+    However, due to their tight coupling they are allowed to use the following private functions:
     - `_add_array()` if the translator has to create new.
     - `_create_jax_var_list()` for the bulk creation of Jax variables.
     - `_add_reserved_names()` if a name should be blocked (only affects later equation.
     - `_add_jax_name_mapping()` for creating new links between Jax variables and SDFG variables.
     However, a subtranslator should only call them if it is necessary.
 
+    To support nested Jaxpr expressions the driver provides the possibility to clone/fork itself, see `self.fork()` for more.
+    Every clone, i.e. return value of `self.fork()`, of a driver, which is also known as child, has a unique identifier.
+    This identifier is used for example to generate unique SDFG variable names during a translation process.
+    The original driver, the one that was explicitly created, is also known as head translator, see `is_head_translator()`.
+    It is important that the revision is only unique within a family and during a translation process.
 
-    If no translation is ongoing the only function that makes sense to call is `translate_jaxpr()` to start a translation.
-    Driver supplied to the subtranslators as arguments, such as in `translateEqn()` are allowed to call any public function of the driver.
-    In addition to them it is allowed to call:
-
-    Notes:
-        Equations that only have `_` as output variable are skipped.
-        It is not safe to deepcopy `self` during an active translation instead you should use `self.fork()`.
-        To ensure unique names also in the presence of nested SDFG every instance contains a revision index.
+    If no translation is ongoing the only function that makes sense to call is `translate_jaxpr()` which starts a translation.
 
     Todos:
-        Split the functions into several interfaces one, that is for the whole world to use, one for subtranlators and one for the implementation.
+        Find a better way than to allow giving access to protected functions.
     """
 
     # Member variables that are private to an instance, i.e. they are not passed on to the children.
@@ -91,16 +87,15 @@ def __init__(
     ) -> None:
         """Creates the base translator.
 
-        This function will forward all arguments that does _not_ start with an underscore to the constructors of the subtranslators.
-        Furthermore, this function will allocate the shared members, but the private members are not allocated.
+        All arguments that does not start with an underscore are used as arguments to construct the subtranslators.
 
         Args:
             _no_shared_alloc (bool):     If set then all allocation will be avoided (internal)
 
         Notes:
-            All arguments that does not start with an underscore are forwarded to the translators for the intrinsics.
+            This function will not allocate the translation context of `self` but will only allocate the shared members.
             By setting `_no_shared_alloc` to `True` the function will not allocate the shared part.
-                This flag is provided only for implementing `self.fork()` using it denotes an error and undefined behaviour.
+                This flag is provided only for implementing `self.fork()` using it is an error and undefined behaviour.
         """
         allocate_shared_parts: bool = not kwargs.pop("_no_shared_alloc", False)
 
@@ -108,7 +103,7 @@ def __init__(
         #  They are partitioned by the names of the primitive they have registered for.
         #  Inside a partition they are ordered by priority, lowest first, more important.
         #  This member is allocated by '_init_sub_translators()' and remains allocated during the lifetime of the object.
-        self._sub_translators: dict[str, list[trans.JaCeSubTranslatorInterface]] = None  # type: ignore[assignment]
+        self._sub_translators: dict[str, list[jtrans.JaCeSubTranslatorInterface]] = None  # type: ignore[assignment]
 
         # The SDFG object that we are currently constructing.
         #  Only allocated during an ongoing translation.
@@ -161,25 +156,24 @@ def translate_jaxpr(
         name: str | None = None,
         reserved_names: str | Collection[str] | None = None,
         allow_empty_jaxpr: bool = False,
-        _clear_translation_ctx: bool = True,
+        **kwargs: Any,
     ) -> jtrutil.JaCeTranslationMemento:
         """Perform the translation of a Jaxpr description into a SDFG.
 
-        As described above the function will create the canonical form of Jaxpr based SDFGs.
-        Furthermore the function will return the SDFG encaplulated inside a `jace.translator.util.JaCeTranslationMemento` object.
+        While this function is running `self` has an ongoing translation.
+        As explained above the translation will not result in a "good" SDFG but needs further preprocessing.
+        However, it is the internal format that the translation toolchain expects.
 
         Args:
-            inp_scalar_as_array:       Translate scalar _input_ arguments to arrays of length 1.
+            inp_scalar_as_array:    Translate scalar _input_ arguments to arrays of length 1.
             name:                   Use this name for the SDFG instead some generated one.
-            reserved_names:          Prevent the generation of such names, when translating Jax variable names into SDFG names.
-            allow_empty_jaxpr:        Allows empty Jaxpr.
-            _clear_translation_ctx:      Do not deallocate the inner state of `self`.
+            reserved_names:         Prevent the generation of variables with these names, see `self._add_array()` for more.
+            allow_empty_jaxpr:      Allows empty Jaxpr.
 
-        Notes:
-            By default the function will store its translation state inside the return value and deallocate the internal members.
-                However, by setting `_clear_translation_ctx` to `False` `self` is not deallocated.
-                This means that `self` and the returned memento share the same state.
-                To explicitly deallocate the translation context of `self`, which is required, use `self._clearTranslatorCtx()`.
+        Returns:
+            The function will not return the SDFG directly.
+            Instead it will be wrapped inside a `JaCeTranslationMemento` instance.
+            That contains the SDFG and some meta data needed for further processing.
         """
         if self.is_allocated():
             raise RuntimeError(
@@ -200,6 +194,9 @@ def translate_jaxpr(
                 "The translation only works if 'jax_enable_x64' is enabled. Do it manually or use 'self.transform()'!"
             )
 
+        # Consume the hidden flags
+        _clear_translation_ctx: bool = kwargs.pop("_clear_translation_ctx", True)
+
         self._allocate_translation_ctx(
             name=name,
             reserved_names=reserved_names,
@@ -213,6 +210,8 @@ def translate_jaxpr(
         )
         memento: jtrutil.JaCeTranslationMemento = self._translate_jaxpr_internal(jaxpr)
 
+        # If the translation context is not cleared `self` and `memento` will share the same data.
+        #  There is some legitimate use for that.
         if _clear_translation_ctx:
             self._clear_translation_ctx()
 
@@ -223,12 +222,13 @@ def fork(self) -> JaxprTranslationDriver:
 
         The returned object, known as child, will always be of type `JaxprTranslationDriver`, and should be seen as a partial clone of `self`.
         While the child shares some members with its parent, i.e. `self`, it has an unallocated translation context.
-        Essentially, this function returns an object that when its `translate_jaxpr()` function is called behaves the exact same way as
+        If `translate_jaxpr(jaxpr)` is called on the returned object function will behave the exact same way as
         its parent behaved as it was called just with another `jaxpr` argument.
 
         Notes:
-            A user has to ensure that the lifetime of a fork ends before the one of its direct parent.
+            A user has to ensure that the lifetime of a child ends before the lifetime of its direct parent.
                 In case of a head translator, the lifetime of its children have to end before the translation process finishes.
+            It is important that a clone instance should not be reused, instead you should fork it again, even from the clone.
         """
         # Create a new (empty) driver instance; prevent allocation to make it cheep
         dolly: JaxprTranslationDriver = JaxprTranslationDriver(_no_shared_alloc=True)
@@ -251,33 +251,41 @@ def append_new_state(
         *,
         prev_state: dace.SDFGState | None = None,
     ) -> dace.SDFGState:
-        """Creates a new SDFGState and appends it.
+        """Creates a new `SDFGState` and adds it to the SDFG.
+
+        By default the new state is appended to the current terminal state.
+        This will also update the terminal SDFG state of `self`.
 
-        By default the new SDFGState is appended to the current terminal SDFGState.
-        However, if `prev_state` is given the new SDFGState will be appended to it instead.
+        However, if `prev_state` is specified the state new state will be appended to `prev_state` instead.
+        This will not modify the terminal state unless `prev_state` is the current terminal state.
 
         Args:
-            label:          The name that should be used for the new SDFGState.
-            condition:      The condition of the state transitions used on the InterstateEdge.
+            label:          The name that should be given to the new `SDFGState`.
+            condition:      The condition of the state transitions used on the `InterstateEdge`.
             assignments:    Symbol assignments that should be done during the transition.
-            prev_state:      Alternative SDFGState to which we should append the new SDFGState.
+            prev_state:     Alternative `SDFGState` at which we should append the new state.
 
         Notes:
-            In case no SDFGState exists yet, an initial SDFGState will be created first.
+            In case no `SDFGState` exists yet, an initial SDFGState will be created first.
             This function is similar to `SDFGState.add_state_after()` but differs in the fact that it does not perform reconnecting.
                 I.e. if the state to which we append already has downstream states they will not be reconnected to be after the newly created state.
-            This function will not update the head state of `self`.
         """
         assert self._sdfg is not None
 
         # Test if we must create a start state.
         if self._sdfg.start_block is None:
+            assert all(
+                x is None for x in (self._init_sub_translators, self._term_sdfg_state, prev_state)
+            )
             self._init_sdfg_state = self._sdfg.add_state(label="initial_state", is_start_block=True)
             self._term_sdfg_state = self._init_sdfg_state
-        assert self._sdfg.start_block is self._init_sdfg_state
 
-        # Now create and append the new state
-        app_state: dace.SDFGState = self._term_sdfg_state if prev_state is None else prev_state
+        # Decide if appending to that state will modify the terminal state.
+        modify_term_state: bool = False
+        if (prev_state is self._term_sdfg_state) or (prev_state is None):
+            modify_term_state = True
+            app_state = prev_state
+
         new_state = self._sdfg.add_state(label, is_start_block=False)
         self._sdfg.add_edge(
             app_state,
@@ -285,12 +293,16 @@ def append_new_state(
             dace.sdfg.InterstateEdge(condition=condition, assignments=assignments),
         )
 
+        if modify_term_state:
+            self._term_sdfg_state = new_state
         return new_state
 
     def get_arrays(self) -> Mapping[str, ddata.Data]:
-        """Get the maps containing all known arrays inside the SDFG.
+        """Get all `Data` descriptors that are currently known to the SDFG.
 
-        Essentially a shorthand and preferred way for `self.get_sdfg().arrays`.
+        Notes:
+            Essentially a shorthand and preferred way for `self.get_sdfg().arrays`.
+            For getting a specific data descriptor use `self.get_array()`.
         """
         assert self._sdfg is not None
         return cast(Mapping[str, ddata.Data], self._sdfg.arrays)
@@ -299,10 +311,10 @@ def get_array(
         self,
         name: str | jcore.Atom,
     ) -> ddata.Data:
-        """Returns the `dace.data.Data` object `name` referees to.
+        """Returns the SDFG `Data` object `name` referees to.
 
-        If `name` is a string, it is directly interpreted as the name of an SDFG variable.
-        In case it is a `jax.core.Atom` it is first translated.
+        If `name` is a string it is directly interpreted as the name of an SDFG variable.
+        In case it is a `jax.core.Atom` it is first translated, see `self.map_jax_var_to_sdfg()`.
         """
         assert self._sdfg is not None
 
@@ -353,7 +365,7 @@ def map_jax_var_to_sdfg(
         return self._jax_name_map[jax_var]
 
     def get_sdfg(self) -> dace.SDFG:
-        """Returns the tentative SDFG that is currently constructed.
+        """Returns the SDFG that is currently constructed.
 
         If you want access to the arrays of the SDFG use `self.get_arrays()`/`self.get_array()`.
         """
@@ -362,32 +374,27 @@ def get_sdfg(self) -> dace.SDFG:
         return self._sdfg
 
     def get_terminal_sdfg_state(self) -> dace.SDFGState:
-        """Returns the current tentative terminal state of the SDFG under construction.
+        """Returns the current terminal state of the SDFG under construction.
 
-        Since the translator works by turning each Jax primitive into an SDFG state, the constructed SDFG is essentially a list of states.
-        This function returns the tentative final/terminal SDFGState of the SDFG.
-        States of new primitives will be appended to this one.
-
-        Notes:
-            It is an error to call this function outside the context of a subtranslator.
-                If you want access to the arrays of the SDFG use `self.get_arrays()`.
+        The SDFGs that are constructed by the driver are essentially a list of states.
+        New states are appended at the current terminal/end state and becoming the new terminal state.
+        This function returns the current terminal state.
         """
         assert all(x is not None for x in (self._sdfg, self._term_sdfg_state))
         return self._term_sdfg_state
 
     def is_allocated(self) -> bool:
-        """Tests if `self` is allocated.
-
-        This function only checks if the translation context is allocated.
-        As a side effect a return value of `True` means that a translation process is ongoing.
+        """Tests if the translation context of `self` is allocated.
 
         Notes:
-            The state of the reserved name list is handled specially.
-                In case the function returns `True` it is guaranteed that it is allocated.
-                If `False` is returned it might or might not be allocated.
+            It is safe to call this function any time.
+            If this function returns `True` it means that an allocation is ongoing.
         """
         small_ctx: Sequence[Any] = [
-            getattr(self, x) for x in self.__shared_slots__ if x != "_reserved_names"
+            # for the proper implementation of forking the reserved names are handled special.
+            getattr(self, x)
+            for x in self.__shared_slots__
+            if x != "_reserved_names"
         ]
         if all((x is not None) for x in small_ctx):
             if self._reserved_names is None:
@@ -412,7 +419,7 @@ def same_family(
     ) -> bool:
         """Test if `self` and `other` belongs to the same family of driver/translators.
 
-        They belong to the same family if they descend from the same head translator.
+        The family of a translator is given by the set of all driver that descend from the same head translator.
         """
         if not isinstance(other, JaxprTranslationDriver):
             return NotImplemented  # type: ignore[unreachable]
@@ -455,35 +462,33 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
     def _add_jax_name_mapping(
         self, jax_var: str | jcore.Atom, sdfg_name: str
     ) -> JaxprTranslationDriver:
-        """Creates the mapping between `jax_var` to `sdfg_name`.
+        """Creates a mapping between `jax_var` to `sdfg_name`.
 
         It is an error if there is already a mapping installed for `jax_var`.
 
         Args:
-            jax_var:     The Jax variable that is used.
+            jax_var:     The Jax variable.
             sdfg_name:   The name of the corresponding SDFG variable.
-
-        Notes:
-            While the function allows to create a mapping for Jax names that are in the set of avoided names,
-                it will refuse to create a mapping for a forbidden name.
         """
         assert self._jax_name_map is not None
         assert isinstance(jax_var, (jcore.Atom, str))
+        assert isinstance(sdfg_name, str)
 
         jax_name = jutil.get_jax_var_name(jax_var)
         if jax_name in self._jax_name_map:
             if self._jax_name_map[jax_name] == sdfg_name:  # We consider this as no ops.
                 return self
             raise ValueError(
-                f"Tried to create a mapping for Jax variable '{jax_name}' to '{sdfg_name}', but that mapping exists already and is pointing to '{self.map_jax_var_to_sdfg(jax_name)}'."
+                f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but '{jax_name}'"
+                + f" already points to '{self.map_jax_var_to_sdfg(jax_name)}'."
             )
         if sdfg_name not in self.get_arrays():
             raise KeyError(
-                f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but '{sdfg_name}' is not a known SDFG variable."
+                f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but SDFG target unknown."
             )
         if sdfg_name in self._forbidden_names:
-            raise NameError(  # This is actually an internal error
-                f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but '{sdfg_name}' is forbidden."
+            raise NameError(
+                f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but forbidden name."
             )
 
         self._jax_name_map[jax_name] = sdfg_name
@@ -503,11 +508,9 @@ def _add_reserved_names(
         elif isinstance(reserved_names, Collection):
             pass
         else:
-            raise TypeError(
-                f"Does not know how to handle the type '{type(reserved_names).__name__}'."
-            )
-        assert all(isinstance(x, str) for x in reserved_names)
-
+            raise TypeError(f"Does not know how to handle the type '{type(reserved_names)}'.")
+        if not all(isinstance(x, str) and (len(x) != 0) for x in reserved_names):
+            raise TypeError("Reserved names must all be non empty strings.")
         self._reserved_names.update(reserved_names)
         return self
 
@@ -527,27 +530,27 @@ def _add_array(
         force_jax_name: bool = False,
         update_var_mapping: bool = False,
     ) -> str:
-        """Creates an SDFG variable for the Jax variable `arg` and returns the SDFG name.
+        """Creates an SDFG variable for the Jax variable `arg` and returns its SDFG name.
 
-        By default the function will create a transient, which can be changed by setting `as_transient` to `False`.
-        In case the Jax variable `arg` refers to a scalar, i.e. having an empty shape, the function will generate a SDFG scalar.
-        However, if `force_array` is set, then it will generate an array with shape `(1,)`.
-        For generating a `View` you must set `as_view` to `True`.
+        By default the function will create a transient, use `as_transient` to change that.
+        By default the function will honor if the Jax variable is a scalar or an array.
+        However, by setting `force_array` the function will always generate an array.
 
+        By default the name for the SDFG variable is derived from the Jax variable.
+        It is guaranteed that this name is unique in the SDFG, even in the presence of nested SDFGs.
         By specifying `alt_name` it is possible to force a certain name on a variable.
         It is important that if `alt_name` is specified the function will either generate the variable or fail.
-        In case `alt_name` is not given, then the function will be derived one from `jutil.get_jax_var_name(arg)`.
+
         The  driver distinguishes between two kinds of "bad (SDFG) variable names".
         The first category are the forbidden names, which the function refuses to generate.
-        The second one are the reserved names, which were set at the beginning.
+        The second type are the so called reserved names, which were set at the beginning.
         These names can be used if they are specified through `alt_name` but are not used in automatic naming.
 
         If nothing is specified, the strides of the data are determined by DaCe, which is continuous C order.
         There are two ways to change that.
         The first way is to specify the `strides` argument, which are then forwarded to the underlying DaCe function.
-        The function will only check if enough values were provided, but no further check is performed.
-        The second one is to set `symb_strides` to `True` in which case the function will generate symbols and use them.
-        However, even if symbolic strides are activated, arrays with just one dimensions have always a non symbolic stride.
+        The second way is to set `symb_strides` to `True` in which case the function will generate symbols and use them.
+        However, even if symbolic strides are activated, arrays with just one dimensions have always a non symbolic stride of 1.
         Furthermore, dimensions with shape 1 will always have stride 0.
 
         By default this function does not update the internal variable map.
@@ -555,21 +558,22 @@ def _add_array(
 
         Args:
             arg:                The Jax object for which a SDFG equivalent should be created.
-            as_transient:        If set, the SDFG variable is a transient, `True` by default.
-            alt_name:            Try to create the variable with this name; either succeed or fail.
-            name_prefix:         If given and in automatic naming mode, add this prefix to the name before anything else.
-            force_array:         Instead of a `dace.Scalar` object create a `dace.Array` object with one element.
-            as_view:             Creates a view instead of an array, if it is a scalar it is silently ignored.
-            strides:            Instead of the default strides use this value for the strides.
-            symb_strides:        Create symbols and use them for fully symbolic strides.
-            find_new_name:        The translator will try to find a new name if the designated is already occupied.
+            as_transient:       If set, the SDFG variable is a transient, `True` by default.
+            alt_name:           Try to create the variable with this name; either succeed or fail.
+            name_prefix:        If given and in automatic naming mode, add this prefix to the name.
+            force_array:        Instead of a `dace.Scalar` object create a `dace.Array` with one element.
+            as_view:            Creates a view instead of an array, if it is a scalar it is silently ignored.
+            strides:            Instead of the default strides use these values.
+            symb_strides:       Create symbols and use them for fully symbolic strides.
+            find_new_name:      The translator will try to find a new name if the designated is already occupied.
                                     This does not work if the name was supplied by `alt_name`.
-            allow_literals:      If `True` then also allows JaxLiterals as `arg`.
-            force_jax_name:       If `True` then, the verbatim Jax name will be used.
-            update_var_mapping:   Update the internal variable mapping; by default `False`.
+            allow_literals:     If `True` then also allows JaxLiterals as `arg`.
+            force_jax_name:     If `True` then, the verbatim Jax name will be used.
+            update_var_mapping: Update the internal variable mapping; by default `False`.
 
         Notes:
-            If `find_new_name` is `None` the default the function will only look for a new name if there is a need for that.
+            If this function is used directly a user is advised to always set `update_var_mapping` to `True`.
+            If `find_new_name` is `None` the default, the function will only look for a new name if there is a need for it.
                 If it is `True` the function will always look for a new name, even if the initial name was fine.
                 If it is `False` the function will never look for a new new, thus if the name is unavailable an error is generated.
             Specifying `alt_name` implies `find_new_name=False`.
@@ -584,41 +588,34 @@ def _add_array(
 
         if (alt_name is not None) and (not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", alt_name)):
             raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
-
         if force_jax_name:
             if alt_name is not None:
-                raise ValueError(
-                    f"Specified 'force_jax_name' but passed '{alt_name}' as 'alt_name'."
-                )
-            if name_prefix is not None:
-                raise ValueError(
-                    f"Specified 'force_jax_name' and set 'name_prefix' to '{name_prefix}'."
-                )
+                raise ValueError("Specified 'force_jax_name' but passed  'alt_name'.")
             alt_name = jutil.get_jax_var_name(arg)
+            if name_prefix is not None:
+                assert isinstance(name_prefix, str)
+                alt_name = name_prefix + alt_name
         if name_prefix is not None:
             assert isinstance(name_prefix, str)
-            assert len(name_prefix) > 0
             if alt_name is not None:
                 raise ValueError("Specified 'name_prefix' and 'alt_name' which is not possible.")
-
         if (symb_strides is None) and (strides is None):
             symb_strides = False if (len(shape) <= 1) else False
         if as_view and (not as_transient):
             raise ValueError("You tried to create a global view, which is not allowed.")
 
         if isinstance(arg, jcore.Var):
-            prop_name = jutil.get_jax_var_name(
-                arg
-            )  # This is the name that is _suggested_ by the conversion.
+            prop_name = jutil.get_jax_var_name(arg)
             if (alt_name is None) and prop_name.startswith("__"):
                 raise ValueError(
-                    f"You tried to create the variable '{prop_name}' which starts with two underscores, if you really want to do that use 'alt_name'."
+                    f"You tried to create the variable '{prop_name}' which"
+                    "starts with two underscores, use 'alt_name' for that."
                 )
             if isinstance(name_prefix, str):
                 prop_name = name_prefix + prop_name
         elif isinstance(arg, jcore.Literal):
             if not allow_literals:
-                raise NotImplementedError("Jax Literals are not yet implemented.")
+                raise NotImplementedError("Jax Literals are not supported.")
             if alt_name is None:
                 raise ValueError(f"Passed literal '{arg}', but not specified a name to use.")
         else:
@@ -635,7 +632,8 @@ def _add_array(
                 raise ValueError(f"You used 'alt_name' to create the forbidden name '{alt_name}'.")
             if arg_name in self._sdfg.arrays:
                 raise ValueError(
-                    f"Tried to create a variable with name '{arg_name}' explicitly, but it is already known."
+                    f"Tried to create a variable with name '{arg_name}'"
+                    " explicitly, but it is already known."
                 )
         if find_new_name is None:
             find_new_name = (arg_name in self._forbidden_names) or (
@@ -658,9 +656,9 @@ def _add_array(
             else:
                 raise ValueError(f"Failed to find a replacement name for '{arg_name}'")
             del iCounter, _arg_name
-        elif arg_name in self._forbidden_names:
+        if arg_name in self._forbidden_names:
             raise ValueError(f"Can not create variable '{arg_name}', name is forbidden.")
-        elif arg_name in self._sdfg.arrays:
+        if arg_name in self._sdfg.arrays:
             raise ValueError(f"Can not create variable '{arg_name}', variable is already created.")
         if not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", arg_name):
             raise ValueError(f"The requested variable name '{arg_name}' is invalid.")
@@ -677,7 +675,8 @@ def _add_array(
                 raise ValueError("Specified 'symb_strides' and 'stride at the same time.")
             if len(strides) != len(shape):
                 raise ValueError(
-                    f"'strides' was '{strides}' it had length {len(strides)}, but the array has rank {len(shape)}."
+                    f"'strides' was '{strides}' it had length {len(strides)},"
+                    f" but the array has rank {len(shape)}."
                 )
             strides = tuple(strides)
 
@@ -726,19 +725,18 @@ def _create_jax_var_list(
         """Creates SDFG variables for the listed Jax variables and returns the SDFG names as a list.
 
         Before the function will create a variable, by using `_add_array()` with `update_var_mapping=True`,
-        the function will check if the variable is known and no new variable is created.
-        Instead the name of the previously created variable is added to the return value.
-        In case the Jax Atom denotes a literal, no variable will be created, instead `None`
-        will be added to the output list.
+        it will check if the variable is known and if so no new variable is created.
+        Instead the name of the previously created variable is added to the list.
+        In case the Jax Atom denotes a Jax Literal, no variable will be created,
+        instead `None` will be added to the list.
 
         Args:
-            jax_var_list:         The list of Jax variables that should be transformed to SDFG names.
-            prevent_creation:    Never create a variable, indicates that all variables must already exists.
-            only_creation:       Indicates that no variables exists yet and all must be created.
-            kwargs:             In case of variable creation will be forwarded to `self._add_array()` function.
+            jax_var_list:       The list of Jax variables that should be transformed to SDFG names.
+            prevent_creation:   Never create a variable, indicates that all variables must already exists.
+            only_creation:      If a variable already exists, generate an error instead of using it.
+            kwargs:             Will be forwarded to `self._add_array()` if a variable will be created.
 
         Notes:
-            Expected input arguments are `jcore.JaxprEqn.invars` or `jcore.JaxprEqn.outvars`.
             If `only_creation` is set, then literals will cause an error.
             It is an error to pass the `update_var_mapping` argument.
         """
@@ -754,23 +752,16 @@ def _create_jax_var_list(
                 ret_list.append(None)
             elif isinstance(jax_var, jcore.jax_var):
                 mapped_sdfg_name: str | None = self.map_jax_var_to_sdfg(jax_var, allow_fail=True)
+                if (mapped_sdfg_name is None) and prevent_creation:
+                    raise ValueError(f"prevent_creation' given but have to create '{jax_var}'.")
                 if mapped_sdfg_name is None:
-                    if prevent_creation:
-                        raise ValueError(
-                            f"Forbid the creation of jaxVariables, but need to create '{jax_var!s}'."
-                        )
                     ret_list.append(self._add_array(arg=jax_var, update_var_mapping=True, **kwargs))
+                elif only_creation:
+                    raise ValueError(f"'only_creation' given '{jax_var}' already exists.")
                 else:
-                    if only_creation:
-                        raise ValueError(
-                            f"Requested 'only_creation', but '{jax_var}' already exists as '{mapped_sdfg_name}'."
-                        )
                     ret_list.append(mapped_sdfg_name)
             else:
-                raise ValueError(
-                    f"The translation process is not implemented for '{type(jax_var)}'"
-                )
-
+                raise TypeError(f"Does not know how to handle '{type(jax_var).__name__}'")
         return ret_list
 
     def _create_initial_input(
@@ -781,8 +772,8 @@ def _create_initial_input(
         """This function will create the internal input variables that are used for the SDFG.
 
         Args:
-            jaxpr:              The Jaxpr that we want to translate.
-            inp_scalar_as_array:   Promote scalars to arrays of size one.
+            jaxpr:                  The Jaxpr that we want to translate.
+            inp_scalar_as_array:    Promote scalars to arrays of size one.
 
         Returns:
             The list of SDFG variables used as input arguments of `jaxpr` in the same order.
@@ -804,12 +795,12 @@ def _create_initial_input(
             only_creation=True,
             as_transient=True,  # Explicit transient; no error!
             force_array=inp_scalar_as_array,
-            force_jax_name=self.is_head_translator(),  # Ensure head get the pure Jax name.
+            force_jax_name=self.is_head_translator(),  # Ensure head get pure Jax names.
         )
         sdfg.arg_names.extend(init_in_var_names)
 
         # Store the list of inputs in self; this is done to simplify exporting.
-        #  The output list is either generated by `self._translate_jaxpr_internal()` of `self._handle_null_jaxpr()`.
+        #  The output list is populated by `self._translate_jaxpr_internal()`
         self._sdfg_in_names = tuple(init_in_var_names)
 
         return init_in_var_names
@@ -852,17 +843,13 @@ def _allocate_translation_ctx(
         name: str | None = None,
         reserved_names: str | Collection[str] | None = None,
     ) -> JaxprTranslationDriver:
-        """This function allocates and initialize the members related to the translation context.
+        """This function allocates and initialize the members of the translation context of `self`.
 
         After this function is called, `self` is said to have an ongoing translation process.
 
         Args:
             name:               The name of the SDFG.
             reserved_names:     Add these name to the set of resered names of `self`.
-
-        Notes:
-            It is not an error, if the reserved names are already allocated.
-                In that case the names passed by `reserved_names` are added to the list already preset.
         """
         if self.is_allocated():
             raise RuntimeError("The translator is already allocated.")
@@ -876,16 +863,13 @@ def _allocate_translation_ctx(
         self._sdfg_in_names = ()
         self._sdfg_out_names = ()
 
-        # Handle the `reserved_names` argument as described above.
-        #  This is essentially needed that children works properly.
+        # If the reserved names are already allocated then keep them.
+        #  This is needed to preserve them among forks.
         if self._reserved_names is None:
             self._reserved_names = set()  # type: ignore[unreachable]
-        else:
+        elif not isinstance(self._reserved_names, set):
             raise RuntimeError("The reserved names are allocated incorrectly.")
-        assert all(isinstance(x, str) for x in self._reserved_names)  # type: ignore[unreachable]
-        self._add_reserved_names(reserved_names)
-
-        return self
+        return self._add_reserved_names(reserved_names)
 
     def _init_sub_translators(
         self,
@@ -900,23 +884,19 @@ def _init_sub_translators(
             raise RuntimeError("Tried to allocate the internal subtranslators twice.")
         assert self._sub_translators is None  # type: ignore[unreachable]
 
-        # We might get arguments that starts with an underscore, which are not meant for the subtranslators.
         kwargs = {k: v for k, v in kwargs.items() if not k.startswith("_")}
 
-        # Will contain all subtranslators we create.
-        subtranslators: dict[str, list[trans.JaCeSubTranslatorInterface]] = {}
-
         # First we will create all subtranslators and partition them.
-        subtranslator_cls: type[trans.JaCeSubTranslatorInterface]
+        subtranslators: dict[str, list[jtrans.JaCeSubTranslatorInterface]] = {}
         for subtranslator_cls in jtsubt._get_subtranslators_cls():
-            subtranslator: trans.JaCeSubTranslatorInterface = subtranslator_cls(**kwargs)
+            subtranslator: jtrans.JaCeSubTranslatorInterface = subtranslator_cls(**kwargs)
             handled_primitives: Iterable[str] = jutil.ensure_iterability(
-                subtranslator.getHandledPrimitives()
+                subtranslator.get_handled_primitives()
             )
 
             # Now add the subtranslator to the primitives it requests, we will sort them later into the correct order.
-            for handledPrimitive in handled_primitives:
-                subtranslators.setdefault(handledPrimitive, []).append(subtranslator)
+            for handled_primitive in handled_primitives:
+                subtranslators.setdefault(handled_primitive, []).append(subtranslator)
 
         # Now we order the subtranslators for the primitives.
         self._sub_translators = {
@@ -930,8 +910,9 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
 
         Notes:
             While it is allowed for outside code to call this explicitly function, it is is most likely an error.
-            If this function is called on a head translator, then the revision state will be rested.
-                Thus a caller has to make sure that the lifetime of all children has ended.
+            If this function is called on a head translator, then the translation process ends.
+                This implies that all direct and indirect children, i.e. output of `self.fork()` must already be deallocated.
+                A further side effect is that now revision indexes will be reused.
             If `self` is not allocated this function acts as a noops.
             The reserved names are only deallocated if `self` is a head translator.
         """
@@ -960,8 +941,8 @@ def _find_sub_translator_for(
         in_var_names: Sequence[str | None],
         out_var_names: Sequence[str],
         eqn: jcore.JaxprEqn,
-    ) -> trans.JaCeSubTranslatorInterface:
-        """Returns the subtranslator object to translate `eqn`.
+    ) -> jtrans.JaCeSubTranslatorInterface:
+        """Returns the appropriate subtranslator for equation `eqn`.
 
         The subtranslators are checked for applicability in the order of their priority.
         The fist one that accepts the translation will be taken.
@@ -973,23 +954,20 @@ def _find_sub_translator_for(
 
         prim_name: str = eqn.primitive.name
         if prim_name not in self._sub_translators:
-            raise NotImplementedError(f"No subtranslators known to hanble primitive '{prim_name}'.")
+            raise NotImplementedError(f"No subtranslators known to handle '{prim_name}'.")
         subtranslator_canidates = self._sub_translators[prim_name]
         assert len(subtranslator_canidates) > 0
 
-        subtranslator: trans.JaCeSubTranslatorInterface = None  # type: ignore[assignment]
+        subtranslator: jtrans.JaCeSubTranslatorInterface = None  # type: ignore[assignment]
         if len(subtranslator_canidates) == 1:
             subtranslator = next(iter(subtranslator_canidates))
             assert subtranslator.can_translate_jaxeqn(
-                driver=self, in_var_names=in_var_names, out_var_names=out_var_names, eqn=eqn
+                in_var_names=in_var_names, out_var_names=out_var_names, driver=self, eqn=eqn
             )
         else:
             for subtranslatorCanidate in subtranslator_canidates:
                 if subtranslatorCanidate.can_translate_jaxeqn(
-                    driver=self,
-                    in_var_names=in_var_names,
-                    out_var_names=out_var_names,
-                    eqn=eqn,
+                    driver=self, in_var_names=in_var_names, out_var_names=out_var_names, eqn=eqn
                 ):
                     subtranslator = subtranslatorCanidate
             else:
@@ -1005,29 +983,32 @@ def _translate_single_eqn(
 
         To do this the function will do the following steps:
         - Assemble the in and output variables.
-        - Select which subtranslator to use.
-        - Create a new empty state, i.e. append to the tentative terminal state.
-        - Perform the actual translation.
+        - Select the appropriate subtranslator to use.
+        - Create a new empty state terminal state.
+        - Call the subtranslator to perform the translation inside the new state.
 
         Returns:
-            The SDFG names that where used as input and output are returned.
-            The inputs might contain `None` which indicates that the input was a Jax literal.
+            The SDFG names that were used as input and output are returned.
+            The inputs might contain `None` which indicates that that input was a Jax Literal.
             For more information see `JaCeSubTranslatorInterface.can_translate_jaxeqn()`.
 
         Notes:
-            While `jaxpr` must be the closed version, `eqn` must come from the unclosed version.
-            The function will also perform some consistency checking.
+            While `jaxpr` must be a `ClosedJaxpr`, `eqn` must come from the unclosed instance.
+            The function will perform some consistency checking after the subtranslator was called.
         """
         assert isinstance(eqn, jcore.JaxprEqn)
         assert isinstance(jaxpr, jcore.ClosedJaxpr)
 
         if len(eqn.effects) != 0:
-            raise NotImplementedError(f"Equation '{eqn}' had side effects.")
+            raise NotImplementedError(f"Equation '{eqn}' has side effects.")
 
         # Input/Output variables
-        in_var_names: Sequence[str | None] = self._create_jax_var_list(
-            eqn.invars,
-            prevent_creation=True,  # Inputs must already exists.
+        #  Using a tuple for the input ensures that it is not modified.
+        in_var_names: Sequence[str | None] = tuple(
+            self._create_jax_var_list(
+                eqn.invars,
+                prevent_creation=True,  # Inputs must already exists.
+            )
         )
         out_var_names: Sequence[str] = self._create_jax_var_list(  # type: ignore[assignment]
             eqn.outvars,
@@ -1035,17 +1016,17 @@ def _translate_single_eqn(
         )
 
         # Find the subtranslator
-        subtranslator: trans.JaCeSubTranslatorInterface = self._find_sub_translator_for(
+        subtranslator: jtrans.JaCeSubTranslatorInterface = self._find_sub_translator_for(
             in_var_names=in_var_names,
             out_var_names=out_var_names,
             eqn=eqn,
         )
 
-        # Create the state into which the equation is put
+        # Create the state into which the equation should be translated
         last_term_state: dace.SDFGState = self.get_terminal_sdfg_state()  # noqa: F841 # Will be used later
         eqn_state = self.append_new_state(
             label=f"{eqn.primitive.name}_{out_var_names[0]}",
-            prev_state=None,  # Force to append as terminal state.
+            prev_state=None,
         )
 
         # Now perform the actual translation of the equation.
@@ -1059,41 +1040,48 @@ def _translate_single_eqn(
 
         # Determine the new (tentative) terminal state of the SDFG we are building.
         if new_sdfg_term_state is None:
-            if eqn_state is self._term_sdfg_state:
+            if eqn_state is not self._term_sdfg_state:
                 raise RuntimeError("Inconsistent terminal state was detected.")
             new_sdfg_term_state = eqn_state
         elif isinstance(new_sdfg_term_state, dace.SDFGState):
-            # TODO(phimuell): use `last_term_state` to test if there is reachability to new end.
+            # TODO(phimuell): use `last_term_state` to test if `new_sdfg_term_state` is reachable.
             pass
         else:
             raise TypeError(f"Encountered illegal types '{type(new_sdfg_term_state)}'")
 
-        # In case a subtranslator decided to not use the variables we created for it, he is technically
-        #  allowed to create new ones, but he must update the `out_var_names` list.
-        #  We will now test if the mapping was updated correctly.
-        for expectedSDFGName, jax_var in zip(out_var_names, eqn.outvars, strict=False):
+        # In case a subtranslator decided to not use the variables we created for it, which is allowed
+        #  but he must update the `out_var_names` list correctly, we will now verify this.
+        if len(out_var_names) != len(eqn.outvars):
+            raise RuntimeError(
+                f"Modified 'out_var_names'! Expected {len(eqn.outvars)} variables."
+                f" but found {len(out_var_names)}"
+            )
+        for expectedSDFGName, jax_var in zip(out_var_names, eqn.outvars, strict=True):
             mapped_sdfg_name = self.map_jax_var_to_sdfg(jax_var)
             jax_name = jutil.get_jax_var_name(jax_var)
             if mapped_sdfg_name != expectedSDFGName:
                 raise ValueError(
-                    f"Mapping inconsistency detected, expected that Jax variable '{jax_name}' maps to '{expectedSDFGName}' but it actually maps to '{mapped_sdfg_name}'."
+                    f"Mapping inconsistency detected, expected that Jax variable"
+                    f" '{jax_name}' maps to '{expectedSDFGName}' but it actually"
+                    f" maps to '{mapped_sdfg_name}'."
                 )
 
         # Views can only be used if there is a direct connection, between source, view and destination (place of usage)
         #  Because of the way how Jax works, it is impossible that an output variable is a View.
-        #  Thus we now make the check if this is the case.
-        for outVarName, jax_var in zip(out_var_names, eqn.outvars, strict=False):
+        for outVarName, jax_var in zip(out_var_names, eqn.outvars, strict=True):
             sdfg_var = self.get_array(outVarName)
             if isinstance(sdfg_var, (dace.data.Array, dace.data.Scalar)):
                 pass
             elif isinstance(sdfg_var, dace.data.View):
                 raise TypeError(
-                    f"For the Jax variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}'), which is an output, you used a View, which is not possible."
-                    + " It must either be an array or a scalar."
+                    f"For the Jax variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}'),"
+                    f" which is an output, you used a View, which is not possible."
+                    " It must either be an array or a scalar."
                 )
             else:
                 raise NotImplementedError(
-                    f"The output variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}') is of type '{type(sdfg_var).__name__}' which I does not know how to handle."
+                    f"The output variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}')"
+                    f" is of type '{type(sdfg_var).__name__}' which I does not know how to handle."
                 )
 
         # Modify terminal head state of 'self'
@@ -1108,8 +1096,6 @@ def _translate_jaxpr_internal(
         """Performs the actual translation of the Jaxpr into an SDFG.
 
         The function assumes that the context is already allocated and the initial variables are already created.
-        The function will ignore, i.e. not translate, any state whose output variables name only consists of `_`.
-
         The function will store the internal state of `self` into a memento and return it.
         However, it will not deallocate the context of `self`, thus `self` and the memento share the same context in memory.
 
@@ -1118,13 +1104,15 @@ def _translate_jaxpr_internal(
 
         Notes:
             The function will unconditionally handle empty Jaxpr.
-            Jax uses a variable with name `_` to indicate that this value is never read.
-                It is included by some transformations such as `grad()`.
+            Jax uses a variable with name `_` to indicate that this value is never read,
+                this is used by Jax to indicate that they are never read.
+                Such variables are included by some transformations such as `grad()`.
         """
         assert isinstance(jaxpr, jcore.ClosedJaxpr)
         assert self.is_allocated()
 
         nb_translated_eqn: int = 0
+        out_var_names: Sequence[str] = []
         for eqn in jaxpr.jaxpr.eqns:  # Translate the equations one by one.
             assert len(eqn.effects) == 0
             if len(eqn.outvars) == 0:  # Do we need this special case.
@@ -1137,12 +1125,10 @@ def _translate_jaxpr_internal(
             _, out_var_names = self._translate_single_eqn(jaxpr=jaxpr, eqn=eqn)
             nb_translated_eqn += 1
 
-        if nb_translated_eqn != 0:
-            # Equations where translated so set the output variables.
-            self._sdfg_out_names = tuple(out_var_names)
-        else:
-            # No equations were translated, i.e. no equation at all or all outputs had name '_'
-            self._handle_null_jaxpr(jaxpr)
+        if nb_translated_eqn == 0:
+            # There were no equation, so handle the copying of input to output.
+            out_var_names = self._handle_null_jaxpr(jaxpr)
+        self._sdfg_out_names = tuple(out_var_names)
 
         return self._export_memento()
 
@@ -1153,10 +1139,8 @@ def _export_memento(self) -> jtrutil.JaCeTranslationMemento:
         Thus the memento and `self` share the same context in memory.
         """
         assert self.is_allocated()
-        assert len(self._sdfg_in_names) > 0
-        assert all(isinstance(x, str) for x in self._sdfg_in_names)
-        assert len(self._sdfg_out_names) > 0
-        assert all(isinstance(x, str) for x in self._sdfg_out_names)
+        assert all((isinstance(x, str) and (len(x) > 0)) for x in self._sdfg_in_names)
+        assert all((isinstance(x, str) and (len(x) > 0)) for x in self._sdfg_out_names)
 
         return jtrutil.JaCeTranslationMemento(
             sdfg=self._sdfg,
@@ -1170,28 +1154,21 @@ def _export_memento(self) -> jtrutil.JaCeTranslationMemento:
     def _handle_null_jaxpr(
         self,
         jaxpr: jcore.ClosedJaxpr,
-    ) -> JaxprTranslationDriver:
+    ) -> Sequence[str]:
         """This function is called in case a `Jaxpr` with zero equations is encountered.
 
-        Notes:
-            This function will fill the internal list of outputs.
+        A function with zero equation might still have output, in which case an input is copied to an output.
+        This function will handle the copying from the input into the corresponding output variable.
+
+        Returns:
+            The function returns a list denoting the SDFG variables that refers to the output.
+            The order of the list is the same as in `jaxpr.jaxpr.outvars`.
         """
         if len(jaxpr.eqns) != 0:
             raise NotImplementedError("'_handle_null_jaxpr()' was called for a non empty Jaxpr.")
-        if (
-            len(jaxpr.out_avals) == 0
-        ):  # There is not output so we do not have to copy anything around.
-            self._sdfg_out_names = ()
-            return self
-        if self.is_head_translator():
-            # In this case there is nothing to do, because input is already the output.
-            #  However, this is only possible if we are the head translator.
-            self._sdfg_out_names = tuple(
-                self.map_jax_var_to_sdfg(jax_out_var) for jax_out_var in jaxpr.jaxpr.outvars
-            )
-            raise NotImplementedError("Please test me.")
-            return self  # type: ignore[unreachable] # reminder
-        #
+        if len(jaxpr.out_avals) == 0:
+            # There is not output so we do not have to copy anything around.
+            return ()
         assert self._term_sdfg_state is self._init_sdfg_state
         assert len(self._sdfg_in_names) > 0
         assert len(self._sdfg_out_names) == 0
@@ -1237,10 +1214,7 @@ def _handle_null_jaxpr(
                     jax_inp_name, self.get_array(self.map_jax_var_to_sdfg(jax_inp_name))
                 ),
             )
-        # We also have to update the list of outputs.
-        #  This is needed for making the exporter aware of what we are doing.
-        self._sdfg_out_names = tuple(out_var_names)
-        return self
+        return tuple(out_var_names)
 
     # fmt: off
     _forbidden_names: Final[set[str]] = {
diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
index 0155ba0..8acfffc 100644
--- a/src/jace/translator/sub_translators/__init__.py
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -10,9 +10,8 @@
 from __future__ import annotations
 
 from collections.abc import Sequence
-from typing import Final, Type
+from typing import Final
 
-import jace
 from jace import translator as jtrans
 
 from .alu_translator import ALUTranslator
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 7d4c55b..a7fa78e 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -199,19 +199,19 @@ def __gt__(self, other: Any) -> bool:
 
     #
 
-    # Thest the initial conditions
+    # Test the initial conditions
     init_sub_trans_list = _get_subtranslators_cls(builtins=False)
-    init_built_in = _get_subtranslators_cls(with_external=False)
+    init_built_in = _get_subtranslators_cls(with_external=False)  # noqa: F841  # Not finished
     assert (
         len(init_sub_trans_list) == 0
     ), f"Expected no external subtranslators but found: {init_sub_trans_list}"
 
     # Now we add the valid subtranslator interface
     assert add_subtranslator(ValidSubTrans), "Failed to add the `ValidSubTrans`"
-    first_sub_trans = _get_subtranslators_cls(builtins=False)
+    first_sub_trans = _get_subtranslators_cls(builtins=False)  # noqa: F841  # Not finished
 
     # Should not include the
-    subTrans = _get_subtranslators_cls(with_external=False)
+    subTrans = _get_subtranslators_cls(with_external=False)  # noqa: F841  # Not finished
 
     assert not add_subtranslator(ValidSubTrans), "Could add `ValidSubTrans` twice"
     raise AssertionError("NOT FINISHED YET")

From dc8b7cf55ed931d04d0769b9d2006a5220cf0903 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 21 Apr 2024 12:48:04 +0200
Subject: [PATCH 020/458] Made some formating changes.

---
 .../jace_subtranslator_interface.py           | 149 +++++---
 .../translator/jaxpr_translator_driver.py     | 335 ++++++++++--------
 .../util/jace_translation_memento.py          |  19 +-
 src/jace/translator/util/revision_counter.py  |  13 +-
 .../util/subtranslator_helper_order.py        |  30 +-
 src/jace/util/dace.py                         |   3 +-
 src/jace/util/jax.py                          |   3 +-
 src/jace/util/util.py                         |   2 +-
 8 files changed, 321 insertions(+), 233 deletions(-)

diff --git a/src/jace/translator/jace_subtranslator_interface.py b/src/jace/translator/jace_subtranslator_interface.py
index 9d7d992..73b49f7 100644
--- a/src/jace/translator/jace_subtranslator_interface.py
+++ b/src/jace/translator/jace_subtranslator_interface.py
@@ -21,35 +21,46 @@
 class JaCeSubTranslatorInterface:
     """Interface for all Jax primitive/intrinsic subtranslators.
 
-    A translator for a primitive, sometimes also called intrinsic, translates a single equation of a Jaxpr into its SDFG equivalent.
-    A type that implements this interface must fulfil the following properties:
+    A translator for a primitive, sometimes also called intrinsic, translates
+    a single equation of a Jaxpr into its SDFG equivalent. A type that
+    implements this interface must fulfil the following properties:
     - It must be stateless.
-        It is still possible and explicitly allowed to have an immutable configuration state.
-    - All subclasses has to accept `**kwargs` arguments and must forward all unconsumed arguments to the base.
-
-    Subtranslators are rather simple objects that only have to perform the translation.
-    The translation process itself is managed by a driver object, which owns and manage the subtranslators.
+        It is still possible and explicitly allowed to have an
+        immutable configuration state.
+    - All subclasses has to accept `**kwargs` arguments and must
+        forward all unconsumed arguments to the base.
+
+    Subtranslators are rather simple objects that only have to perform
+    the translation. The translation process itself is managed by a driver
+    object, which owns and manage the subtranslators.   
     In the end this implements the delegation pattern.
 
-    A subtranslator uses its `get_handled_primitives()` function to indicate for which Jax primitives it want to register.
-    It is important that a subtranslator can register for as many primitive it wants.
-    At the same time, it is possible that multiple subtranslators have registered for a single primitive.
+    A subtranslator uses its `get_handled_primitives()` function to indicate
+    for which Jax primitives it want to register. It is important that a
+    subtranslator can register for as many primitive it wants. At the same
+    time, it is possible that multiple subtranslators have registered for a
+    single primitive.
 
-    If multiple subtranslator have registered for the same primitive they will be ordered by driver.
-    There are two ways how a subtranslator can influence this order.
-    The first one is by implementing `get_priority()`, the driver will then put them in ascending order.
+    If multiple subtranslator have registered for the same primitive they
+    will be ordered by driver. There are two ways how a subtranslator can
+    influence this order. The first one is by implementing `get_priority()`,
+    the driver will then put them in ascending order.
     I.e. the lower its priority the earlier a subtranslator is checked.
-    Subtranslators that returns the special value `JaCeSubTranslatorInterface.DEFAULT_PRIORITY` are handled specially.
-    Such subtranslators are _always_ put at the end of the list (in unspecific order).
+    However, if a subtranslator returns the special value
+    `JaCeSubTranslatorInterface.DEFAULT_PRIORITY` it will be always put at the
+    end, in unspecific order if multiple translator are involved.
 
-    The second possibility is to override the '__lt__()' and '__eq__()' functions.
-    While this allows more control it might be more difficult.
-    If a subtranslator overrides this functions then it should also override `get_priority()` to return `NotImplemented`.
+    The second possibility is to override the '__lt__()' function,
+    and establish a strict weak order. If a subtranslator overrides this
+    function it should also override `get_priority()` to return `NotImplemented`.
 
-    To decide which subtranslator should be used for a single equation the driver will use their 'can_translate_jaxeqn()' function.
+    To decide which subtranslator should be used for a specific equation
+    the driver will use their 'can_translate_jaxeqn()' function.
     The first subtranslator that returns 'True' will then be used.
 
     Todo:
+        Also come up with a way how to avoid that instances are allowed to access
+            some private members of the driver; Possibly by composition.
         Come up with a better way of ordering; maybe introduce fixed priority level.
             And then allows to sort them according to `__lt__()` within the level.
     """
@@ -70,16 +81,17 @@ def __init__(
         """
 
     def get_handled_primitives(self) -> Collection[str] | str:
-        """Returns the names of all Jax primitives that this subtranslator can handle.
+        """Returns the names of all Jax primitives that `self` is able to handle.
 
-        There is no limit on the number of primitives for which a subtranslator can register.
-        It is possible that several translators can be registered for the same name.
+        There is no limit on the number of primitives for which a subtranslator
+        can register. It is possible that several translators can be registered
+        for the same name.
 
         See Also:
             `self.can_translate_jaxeqn()` and `self.get_priority()`.
 
         Notes:
-            It is also possible to return a string instead of a collection with just one element.
+            In case a string is returned it is interpreted as 1 element collection.
         """
         raise NotImplementedError(
             "Class '{type(self).__name__}' does not implement 'get_handled_primitives()'."
@@ -96,7 +108,8 @@ def can_translate_jaxeqn(
 
         This function is used by the driver to determine which of the subtranslators,
         that have registered for a certain type of primitive, should be used.
-        For a more detailed description of the arguments see `self.translate_jaxeqn()` function.
+        For a more detailed description of the arguments see
+        `self.translate_jaxeqn()` function.
 
         Args:
             driver:         The driver object of the translation.
@@ -123,31 +136,51 @@ def translate_jaxeqn(
     ) -> dace.SDFGState | None:
         """Translates the Jax primitive into its SDFG equivalent.
 
-        Before the driver calls this function it will perform the following preparatory tasks:
+        Before the driver calls this function it will perform the following
+        preparatory tasks:
         - It will allocate the SDFG variables that are used as outputs.
-            Their names will be passed through the `out_var_names` argument, in the same order as `eqn.outvars`.
-        - It will collect the names of the SDFG variables that are used as input and place them in `in_var_names`, in the same order as `eqn.invars`.
-            If an input argument refers to a literal no SDFG variable is created for it and `None` is passed to indicate this.
-            It is not allowed to modify the data descriptors these variables refers to in any way, including replacing them.
-        - The driver will create a new terminal state and pass it as `eqn_state` argument.
-            This state is guaranteed to be empty and `translator.getTerminalState() is eqn_state` holds.
-            A subtranslator should construct the data flow graph inside it.
-
-        It is allowed that the subtranslators creates more states if needed, but this state machine has to have a single terminal state.
-        However, state have to be reachable from the passed `eqn_state`.
-        In this case the function must return this state explicitly.
-        If the function returns `None` the driver will assume that subtranslator was able to fully construct the dataflow graph within `eqn_state`.
-
-        While a subtranslator is forbidden from meddling with the input variables, it is allowed to modify the output variables.
-        For example he could create a new SDFG variable, with different strides.
-        But if the SDFG variable has a different name the subtranslator has to update the name mapping of the driver, and write this change into `out_var_names`.
+            Their names will be passed through the `out_var_names` argument,
+            in the same order as `eqn.outvars`.
+        - It will collect the names of the SDFG variables that are used as input
+            and place them in `in_var_names`, in the same order as `eqn.invars`.
+            If an input argument refers to a literal no SDFG variable is created
+            for it and `None` is passed to indicate this.
+        - The subtranslator will create variables that are used as output.
+            They are passed as `out_var_names`, same order as in the equation.
+        - The driver will create a new terminal state and pass it as
+            `eqn_state` argument. This state is guaranteed to be empty and
+            `translator.get_terminal_sdfg_state() is eqn_state` holds.
+        
+        Then the subtranslator is called. Usually a subtranslator should
+        construct the dataflow graph inside it. It is allowed that the
+        subtranslators creates more states if needed, but this state machine
+        has to have a single terminal state, which must be returned
+        and reachable from `eqn_state`.
+        If the function returns `None` the driver will assume that
+        subtranslator was able to fully construct the dataflow graph
+        within `eqn_state`.
+
+
+        While a subtranslator is forbidden from meddling with the input
+        variables mentioned in `in_var_names` in any way, it is allowed to
+        modify the output variables. For example he could create a new
+        SDFG variable, with different strides. But in that case the
+        subtranslator must update the internal mapping of the driver TBA HOW,
+        and modify the mapping in `out_var_names`.
+        However, the subtranslator is allowed to create internal temporary
+        variables. It just have to ensure that no name collision will occur,
+        a way to do this is to use a passed variable name as prefix.
+
 
         Args:
             driver:         The driver object of the translation.
-            in_var_names:   List of the names of the arrays created inside the SDFG for the inpts or `None` in case of a literal.
-            out_var_names:  List of the names of the arrays created inside the SDFG for the outputs.
+            in_var_names:   List of the names of the arrays created inside the
+                                SDFG for the inpts or `None` in case of a literal.
+            out_var_names:  List of the names of the arrays created inside the
+                                SDFG for the outputs.
             eqn:            The Jax primitive that should be translated.
-            eqn_state:      State into which the primitive`s SDFG representation should be constructed.
+            eqn_state:      State into which the primitive`s SDFG representation
+                                should be constructed.
         """
         raise NotImplementedError(
             "Class '{type(self).__name__}' does not implement 'translate_jaxeqn()'."
@@ -156,15 +189,18 @@ def translate_jaxeqn(
     def get_priority(self) -> int:
         """Returns the priority of this translator.
 
-        The value returned by this function is used by the driver to order the subtranslators that have registered for the same primitive.
+        The value returned by this function is used by the driver to order the
+        subtranslators that have registered for the same primitive.
         The _smaller_ the value the earlier it is checked.
 
         See Also:
             `self.can_translate_jaxeqn()` and `self.get_handled_primitives()`.
 
         Notes:
-            By default the function returns `self.DEFAULT_PRIORITY`, which is handled specially, i.e. it is put at the end.
-            If a subtranslator instead overrides `__lt__()` this function should return `NotImplemented`.
+            By default the function returns `self.DEFAULT_PRIORITY`, which is
+                handled specially, i.e. it is put at the end.
+            If a subtranslator instead overrides `__lt__()` this function
+                should return `NotImplemented`.
         """
         return self.DEFAULT_PRIORITY
 
@@ -189,8 +225,9 @@ def __lt__(
     ) -> bool:
         """Tests if `self` should be checked before `other` in the selection process.
 
-        As outlined in the class description this is the second possibility to influence the order of the subtranslator.
-        This function should return `True` if `self` should be checked for applicability _before_ `other`.
+        As outlined in the class description this is the second possibility to
+        influence the order of the subtranslator. This function should return
+        `True` if `self` should be checked for applicability _before_ `other`.
 
         Notes:
             If this function is overridden `get_priority()` should return `NotImplemented`.
@@ -204,11 +241,13 @@ def __eq__(
     ) -> bool:
         """Tests if two subtranslators are equal.
 
-        The default implementation checks if `self` and `other` have the same type.
-        However, if the behaviour of a subtranslator strongly depend on its configuration this function should be overridden.
+        The default implementation checks if `self` and `other` have the same
+        type. However, if the behaviour of a subtranslator strongly depend on
+        its configuration this function should be overridden.
 
         Notes:
-            If you override this function you should also override `self.__hash__()` to make the two consistent.
+            If you override this function you should also override
+                `self.__hash__()` to make the two consistent.
         """
         if not isinstance(other, JaCeSubTranslatorInterface):
             return NotImplemented
@@ -218,10 +257,12 @@ def __hash__(self) -> int:
         """Computes the hash of the subtranslator.
 
         The default implementation return a hash that is based on the class.
-        Thus all instances of a particular subtranslator will have the same hash value.
+        Thus all instances of a particular subtranslator will have the same
+        hash value.
 
         Notes:
-            If you override this function you should also override `self.__eq__()` to make the two consistent.
+            If you override this function you should also override
+                `self.__eq__()` to make the two consistent.
         """
         return id(self.__class__)
 
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 97d0b26..6ef5086 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -24,46 +24,45 @@
 class JaxprTranslationDriver:
     """Internal driver class for creating an SDFG equivalent of a `Jaxpr` instance.
 
-    This class builds an SDFG of a very particular form, which for us is canonical, which is not
-    directly usable. Thus this class should not be directly used, instead a user should use TBA.
+    This class builds an SDFG of a very particular form, which for us is
+    canonical, which is not directly usable. Thus this class should not be
+    directly used, instead a user should use TBA.
     The canonical form is characterized by the following:
     - the SDFG is a list of states, ideally each state corresponds to single Jax primitive,
     - all variable names are derived from Jax names,
     - there are no global variables inside the SDFG,
-    - there is no possibility to return something.
-
-    The idea of the translator is extremely simple.
-    Since Jaxpr is a list consisting of more or less simple instructions/equations, they get processed one after the other.
-    Each equation is translated into its own state that is appended to the SDFG, thus the SDFG is a long list of states.
-    In certain cases it might be that an equation needs more states, but this is an exception.
-
-    The actual translation is not handled by the driver instead a so called subtranslator object is used.
-    This subtranslator, is specialized for one type of primitive.
-    For more information on the subtranslators see the documentation of `JaCeSubTranslatorInterface`.
-
-    These subtranslators are independent objects that are owned by the driver.
-    However, due to their tight coupling they are allowed to use the following private functions:
-    - `_add_array()` if the translator has to create new.
-    - `_create_jax_var_list()` for the bulk creation of Jax variables.
-    - `_add_reserved_names()` if a name should be blocked (only affects later equation.
-    - `_add_jax_name_mapping()` for creating new links between Jax variables and SDFG variables.
-    However, a subtranslator should only call them if it is necessary.
-
-    To support nested Jaxpr expressions the driver provides the possibility to clone/fork itself, see `self.fork()` for more.
-    Every clone, i.e. return value of `self.fork()`, of a driver, which is also known as child, has a unique identifier.
-    This identifier is used for example to generate unique SDFG variable names during a translation process.
-    The original driver, the one that was explicitly created, is also known as head translator, see `is_head_translator()`.
-    It is important that the revision is only unique within a family and during a translation process.
-
-    If no translation is ongoing the only function that makes sense to call is `translate_jaxpr()` which starts a translation.
+    - It lacks the special `__return` variable.
+    - The argument names are not set.
+
+    The idea of the translator is extremely simple. Since Jaxpr is a list
+    consisting of more or less simple instructions/equations, they get processed
+    one after the other. Each equation is translated into its own state that
+    is appended to the SDFG, thus the SDFG is a long list of states. In certain
+    cases it might be that an equation needs more states, but this is an exception.
+
+    The actual translation is not handled by the driver instead a so called
+    subtranslator object is used. A subtranslator is specialized to translate
+    one type of primitive. For more information on the subtranslators see the
+    documentation of `JaCeSubTranslatorInterface`.
+
+    To support nested Jaxpr expressions the driver provides the possibility to
+    clone/fork itself, see `self.fork()` for more. Every clone, i.e. return
+    value of `self.fork()`, of a driver, which is also known as child, has
+    a unique identifier. This identifier is used for example to generate
+    unique SDFG variable names during a translation process,
+    see `self.same_family() for more.
+
+    If no translation is ongoing the only function that makes sense to call
+    is `translate_jaxpr()` which starts a translation.
 
     Todos:
         Find a better way than to allow giving access to protected functions.
+            Probably using composition with the higher level instance.
     """
 
-    # Member variables that are private to an instance, i.e. they are not passed on to the children.
-    #  By definition all private variable belongs to the translation context but not all variable of the translation context are private.
-    #   NOTE: The context also includes some shared members, but they are handled a bit differently.
+    # Member variables private to an instance, i.e. they are not passed on to the children.
+    #  By definition all of them belongs to the translation context but not all variable of
+    #  the translation context are private, some are actually shared.
     __private_slots__ = (
         "_sdfg",
         "_term_sdfg_state",
@@ -73,7 +72,7 @@ class JaxprTranslationDriver:
         "_sdfg_out_names",
         "_rev_idx",
     )
-    # These are the member variables that are shared among the forks.
+    # Variables that are shared among the instances of a family.
     __shared_slots__ = (
         "_reserved_names",  # Part of the context.
         "_sub_translators",
@@ -87,22 +86,26 @@ def __init__(
     ) -> None:
         """Creates the base translator.
 
-        All arguments that does not start with an underscore are used as arguments to construct the subtranslators.
+        All arguments that does not start with an underscore are used as
+        arguments to construct the subtranslators.
 
         Args:
             _no_shared_alloc (bool):     If set then all allocation will be avoided (internal)
 
         Notes:
-            This function will not allocate the translation context of `self` but will only allocate the shared members.
-            By setting `_no_shared_alloc` to `True` the function will not allocate the shared part.
-                This flag is provided only for implementing `self.fork()` using it is an error and undefined behaviour.
+            This function will not allocate the translation context of `self`
+                but will only allocate the shared members.
+            By setting `_no_shared_alloc` to `True` the function will not allocate
+                the shared part. This flag is provided only for implementing
+                `self.fork()` using it is an error and undefined behaviour.
         """
         allocate_shared_parts: bool = not kwargs.pop("_no_shared_alloc", False)
 
         # Contains all the subtranslators that we need.
         #  They are partitioned by the names of the primitive they have registered for.
         #  Inside a partition they are ordered by priority, lowest first, more important.
-        #  This member is allocated by '_init_sub_translators()' and remains allocated during the lifetime of the object.
+        #  This member is allocated by '_init_sub_translators()' and remains allocated
+        #  during the lifetime of the object.
         self._sub_translators: dict[str, list[jtrans.JaCeSubTranslatorInterface]] = None  # type: ignore[assignment]
 
         # The SDFG object that we are currently constructing.
@@ -160,14 +163,17 @@ def translate_jaxpr(
     ) -> jtrutil.JaCeTranslationMemento:
         """Perform the translation of a Jaxpr description into a SDFG.
 
-        While this function is running `self` has an ongoing translation.
-        As explained above the translation will not result in a "good" SDFG but needs further preprocessing.
-        However, it is the internal format that the translation toolchain expects.
+        Returns:
+            The function will translate the passed Jaxpr object into an SDFG.
+            However, the SDFG will be in canonical form and needs further
+            processing. The SDFG is encapsulated inside a `JaCeTranslationMemento`,
+            that contains additional metadata for further manipulation.
 
         Args:
             inp_scalar_as_array:    Translate scalar _input_ arguments to arrays of length 1.
             name:                   Use this name for the SDFG instead some generated one.
-            reserved_names:         Prevent the generation of variables with these names, see `self._add_array()` for more.
+            reserved_names:         Prevent the generation of variables with these names,
+                                        see `self.add_array()` for more.
             allow_empty_jaxpr:      Allows empty Jaxpr.
 
         Returns:
@@ -184,15 +190,11 @@ def translate_jaxpr(
         if not isinstance(jaxpr, jcore.ClosedJaxpr):
             raise TypeError(f"Expected a 'jax.core.ClosedJaxp' instance but got '{type(jaxpr)}'")
         if len(jaxpr.effects) != 0:
-            raise NotImplementedError(
-                "Currently 'Jaxpr' instances with side effects are not supported."
-            )
+            raise NotImplementedError("'Jaxpr' with side effects are not supported.")
         if len(jaxpr.out_avals) == 0:
             raise ValueError("Jaxpr has zero output variables.")
         if not jax.config.read("jax_enable_x64"):
-            raise NotImplementedError(
-                "The translation only works if 'jax_enable_x64' is enabled. Do it manually or use 'self.transform()'!"
-            )
+            raise NotImplementedError("The translation only works if 'jax_enable_x64' is enabled.")
 
         # Consume the hidden flags
         _clear_translation_ctx: bool = kwargs.pop("_clear_translation_ctx", True)
@@ -220,15 +222,21 @@ def translate_jaxpr(
     def fork(self) -> JaxprTranslationDriver:
         """Return a child of `self` ready for transformation.
 
-        The returned object, known as child, will always be of type `JaxprTranslationDriver`, and should be seen as a partial clone of `self`.
-        While the child shares some members with its parent, i.e. `self`, it has an unallocated translation context.
-        If `translate_jaxpr(jaxpr)` is called on the returned object function will behave the exact same way as
-        its parent behaved as it was called just with another `jaxpr` argument.
+        The returned object should be seen as a partial clone if `self`. It will
+        have an unallocated translation context, but all other variables are schared.
+        To distinguish children all have a unique identifier, see `self.same_family()`.
+
+        The main reason for its function is to implement nested Jaxpr. If
+        `self.translate_jaxpr()` is called on the returned object it will behave
+        the exact same way as its parent would, with a different Jaxpr argument.
 
         Notes:
-            A user has to ensure that the lifetime of a child ends before the lifetime of its direct parent.
-                In case of a head translator, the lifetime of its children have to end before the translation process finishes.
-            It is important that a clone instance should not be reused, instead you should fork it again, even from the clone.
+            A user has to ensure that the lifetime of a child ends before the
+                lifetime of its direct parent. In case of a head translator,
+                the lifetime of its children have to end before the translation
+                process finishes.
+            It is important that a clone instance should not be reused,
+                instead you should fork it again.
         """
         # Create a new (empty) driver instance; prevent allocation to make it cheep
         dolly: JaxprTranslationDriver = JaxprTranslationDriver(_no_shared_alloc=True)
@@ -256,8 +264,9 @@ def append_new_state(
         By default the new state is appended to the current terminal state.
         This will also update the terminal SDFG state of `self`.
 
-        However, if `prev_state` is specified the state new state will be appended to `prev_state` instead.
-        This will not modify the terminal state unless `prev_state` is the current terminal state.
+        However, if `prev_state` is specified the state new state will be
+        appended to `prev_state` instead. This will not modify the terminal
+        state unless `prev_state` is the current terminal state.
 
         Args:
             label:          The name that should be given to the new `SDFGState`.
@@ -267,8 +276,6 @@ def append_new_state(
 
         Notes:
             In case no `SDFGState` exists yet, an initial SDFGState will be created first.
-            This function is similar to `SDFGState.add_state_after()` but differs in the fact that it does not perform reconnecting.
-                I.e. if the state to which we append already has downstream states they will not be reconnected to be after the newly created state.
         """
         assert self._sdfg is not None
 
@@ -398,18 +405,17 @@ def is_allocated(self) -> bool:
         ]
         if all((x is not None) for x in small_ctx):
             if self._reserved_names is None:
-                raise RuntimeError(
-                    "Invalid allocation state: All context variables except the reserved name list are allocated."
-                )
+                raise RuntimeError("Invalid allocation state: Reserved names not allocated.")
             return True
         if all((x is None) for x in small_ctx):
             return False
-        raise RuntimeError("Invalid allocation state: Translation context is mixed allocated.")
+        raise RuntimeError("Invalid allocation state: Translation context partially allocated.")
 
     def is_head_translator(self) -> bool:
         """Tests if `self` is a head translator.
 
-        A head translator is a translator/driver that was created explicitly, i.e. not by `self.fork()`.
+        A head translator is a translator/driver that was created explicitly,
+        i.e. not by `self.fork()`.
         """
         return self._rev_manager.is_root_revision(self._rev_idx)
 
@@ -419,7 +425,10 @@ def same_family(
     ) -> bool:
         """Test if `self` and `other` belongs to the same family of driver/translators.
 
-        The family of a translator is given by the set of all driver that descend from the same head translator.
+        A driver is either explicitly created, i.e. head translator, or created
+        by a call to `fork()`. All drivers that descend from the same head translator
+        from a family.
+
         """
         if not isinstance(other, JaxprTranslationDriver):
             return NotImplemented  # type: ignore[unreachable]
@@ -430,6 +439,15 @@ def same_family(
 
         return False
 
+    def get_rev_idx(self) -> int:
+        """Returns the revision index of `self`.
+
+        To distinguish members of same family every diver has a unique identifier,
+        known as revision. However, the revision is only unique within a single
+        family and during an ongoing translation.
+        """
+        return self._rev_idx
+
     @staticmethod
     def translate_dtype(dtype: Any) -> dace.typeclass:
         """Turns a Jax datatype into a DaCe datatype.
@@ -448,23 +466,28 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
         # Now extract the datatype from dace, this is extremely ugly.
         if not hasattr(dace.dtypes, nameof_dtype):
             raise TypeError(
-                f"Could not find the type '{nameof_dtype}' ({type(dtype).__name__}) in 'dace.dtypes'."
+                f"Could not find the type '{nameof_dtype}' ({type(dtype).__name__}) in 'dace'."
             )
         dcd_type = getattr(dace.dtypes, nameof_dtype)
 
         if not isinstance(dcd_type, dace.dtypes.typeclass):
             raise TypeError(
-                f"Expected that '{nameof_dtype}' would map to a 'dace.typeclass' but it mapped to a '{type(dcd_type).__name__}'."
-            )
+                f"Expected that '{nameof_dtype}' would map to a 'dace.typeclass'"
+                f"but it mapped to a '{type(dcd_type).__name__}'.")
 
         return dcd_type
 
-    def _add_jax_name_mapping(
-        self, jax_var: str | jcore.Atom, sdfg_name: str
+    def add_jax_name_mapping(
+        self,
+        jax_var: str | jcore.Atom,
+        sdfg_name: str,
     ) -> JaxprTranslationDriver:
         """Creates a mapping between `jax_var` to `sdfg_name`.
 
-        It is an error if there is already a mapping installed for `jax_var`.
+        This function updates the internal map of `self` and after the call
+        `self.map_jax_var_to_sdfg()` will identify `jax_var` with `sdfg_name`.
+        This function is not able to delete a variable mapping that was
+        established before, for this use TBA.
 
         Args:
             jax_var:     The Jax variable.
@@ -480,21 +503,16 @@ def _add_jax_name_mapping(
                 return self
             raise ValueError(
                 f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but '{jax_name}'"
-                + f" already points to '{self.map_jax_var_to_sdfg(jax_name)}'."
-            )
+                f" already points to '{self.map_jax_var_to_sdfg(jax_name)}'.")
         if sdfg_name not in self.get_arrays():
-            raise KeyError(
-                f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but SDFG target unknown."
-            )
+            raise KeyError(f"Mapping '{jax_name} -> {sdfg_name}': SDFG target unknown.")
         if sdfg_name in self._forbidden_names:
-            raise NameError(
-                f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but forbidden name."
-            )
+            raise NameError(f"Mapping '{jax_name} -> {sdfg_name}': Forbidden name.")
 
         self._jax_name_map[jax_name] = sdfg_name
         return self
 
-    def _add_reserved_names(
+    def add_reserved_names(
         self,
         reserved_names: None | str | Collection[str],
     ) -> JaxprTranslationDriver:
@@ -514,7 +532,7 @@ def _add_reserved_names(
         self._reserved_names.update(reserved_names)
         return self
 
-    def _add_array(
+    def add_array(
         self,
         arg: jcore.Atom,
         *,
@@ -532,52 +550,64 @@ def _add_array(
     ) -> str:
         """Creates an SDFG variable for the Jax variable `arg` and returns its SDFG name.
 
-        By default the function will create a transient, use `as_transient` to change that.
-        By default the function will honor if the Jax variable is a scalar or an array.
-        However, by setting `force_array` the function will always generate an array.
+        By default the function will create a transient, use `as_transient` to
+        change that. By default the function will honor if the Jax variable is
+        a scalar or an array. However, by setting `force_array` the function
+        will always generate an array.
 
         By default the name for the SDFG variable is derived from the Jax variable.
-        It is guaranteed that this name is unique in the SDFG, even in the presence of nested SDFGs.
-        By specifying `alt_name` it is possible to force a certain name on a variable.
-        It is important that if `alt_name` is specified the function will either generate the variable or fail.
+        It is guaranteed that this name is unique in the SDFG, even in the presence
+        of nested SDFGs. By specifying `alt_name` it is possible to force a certain
+        name on a variable. It is important that if `alt_name` is specified the function
+        will either generate the variable or fail.
 
         The  driver distinguishes between two kinds of "bad (SDFG) variable names".
         The first category are the forbidden names, which the function refuses to generate.
         The second type are the so called reserved names, which were set at the beginning.
-        These names can be used if they are specified through `alt_name` but are not used in automatic naming.
-
-        If nothing is specified, the strides of the data are determined by DaCe, which is continuous C order.
-        There are two ways to change that.
-        The first way is to specify the `strides` argument, which are then forwarded to the underlying DaCe function.
-        The second way is to set `symb_strides` to `True` in which case the function will generate symbols and use them.
-        However, even if symbolic strides are activated, arrays with just one dimensions have always a non symbolic stride of 1.
-        Furthermore, dimensions with shape 1 will always have stride 0.
+        These names can be used if they are specified through `alt_name` but are not used
+        in automatic naming.
+
+        If nothing is specified, the strides of the data are determined by DaCe, which is
+        continuous C order. There are two ways to change that.
+        The first way is to specify the `strides` argument, which are then forwarded
+        to the underlying DaCe function. The second way is to set `symb_strides`
+        to `True` in which case the function will generate symbols and use them.
+        However, even if symbolic strides are activated, arrays with just one
+        dimensions have always a non symbolic stride of 1. Furthermore, dimensions
+        with shape 1 will always have stride 0.
 
         By default this function does not update the internal variable map.
-        However, by setting `update_var_mapping` to `True` the function will update the mapping.
+        However, by setting `update_var_mapping` to `True` the function will
+        update the mapping.
 
         Args:
             arg:                The Jax object for which a SDFG equivalent should be created.
             as_transient:       If set, the SDFG variable is a transient, `True` by default.
             alt_name:           Try to create the variable with this name; either succeed or fail.
             name_prefix:        If given and in automatic naming mode, add this prefix to the name.
-            force_array:        Instead of a `dace.Scalar` object create a `dace.Array` with one element.
-            as_view:            Creates a view instead of an array, if it is a scalar it is silently ignored.
+            force_array:        Instead of a `dace.Scalar` create a `dace.Array` with one element.
+            as_view:            Creates a view instead of an array, if it is a scalar
+                                    it is silently ignored.
             strides:            Instead of the default strides use these values.
             symb_strides:       Create symbols and use them for fully symbolic strides.
-            find_new_name:      The translator will try to find a new name if the designated is already occupied.
-                                    This does not work if the name was supplied by `alt_name`.
+            find_new_name:      The translator will try to find a new name if the designated
+                                    is already occupied. This does not work if the name
+                                    was supplied by `alt_name`.
             allow_literals:     If `True` then also allows JaxLiterals as `arg`.
             force_jax_name:     If `True` then, the verbatim Jax name will be used.
             update_var_mapping: Update the internal variable mapping; by default `False`.
 
         Notes:
-            If this function is used directly a user is advised to always set `update_var_mapping` to `True`.
-            If `find_new_name` is `None` the default, the function will only look for a new name if there is a need for it.
-                If it is `True` the function will always look for a new name, even if the initial name was fine.
-                If it is `False` the function will never look for a new new, thus if the name is unavailable an error is generated.
+            If this function is used directly a user is advised to always set
+                `update_var_mapping` to `True`.
+            If `find_new_name` is `None` the default, the function will only
+                look for a new name if there is a need for it. If it is `True`
+                the function will always look for a new name, even if the initial
+                name was fine. If it is `False` the function will never look for
+                a new new, thus if the name is unavailable an error is generated.
             Specifying `alt_name` implies `find_new_name=False`.
-            The effect of specifying `force_jax_name` is as passing `jutil.get_jax_var_name(arg)` as `alt_name`.
+            The effect of specifying `force_jax_name` is as passing
+                `jutil.get_jax_var_name(arg)` as `alt_name`.
         """
         assert all(x is not None for x in (self._sdfg, self._jax_name_map))
         shape: Sequence[int] = arg.aval.shape  # Shape of the array
@@ -711,30 +741,30 @@ def _add_array(
             )
 
         if update_var_mapping:
-            self._add_jax_name_mapping(jax_var=arg, sdfg_name=arg_name)
+            self.add_jax_name_mapping(jax_var=arg, sdfg_name=arg_name)
 
         return arg_name
 
-    def _create_jax_var_list(
+    def create_jax_var_list(
         self,
         jax_var_list: Sequence[jcore.Atom],
         prevent_creation: bool = False,
         only_creation: bool = False,
         **kwargs: Any,
     ) -> list[None | str]:
-        """Creates SDFG variables for the listed Jax variables and returns the SDFG names as a list.
+        """Creates SDFG variables for the listed Jax variables and returns their SDFG names.
 
-        Before the function will create a variable, by using `_add_array()` with `update_var_mapping=True`,
-        it will check if the variable is known and if so no new variable is created.
-        Instead the name of the previously created variable is added to the list.
-        In case the Jax Atom denotes a Jax Literal, no variable will be created,
-        instead `None` will be added to the list.
+        Before the function will create a variable, by using `add_array()` with
+        `update_var_mapping=True`, it will check if the variable is known and if
+        so no new variable is created. Instead the name of the previously created
+        variable is added to the list. In case the Jax Atom denotes a Jax Literal,
+        no variable will be created, instead `None` will be added to the list.
 
         Args:
             jax_var_list:       The list of Jax variables that should be transformed to SDFG names.
-            prevent_creation:   Never create a variable, indicates that all variables must already exists.
-            only_creation:      If a variable already exists, generate an error instead of using it.
-            kwargs:             Will be forwarded to `self._add_array()` if a variable will be created.
+            prevent_creation:   Never create a variable, indicates that all variables must exists.
+            only_creation:      Variables must be generated, generate an error instead of using it.
+            kwargs:             Will be forwarded to `self.add_array()` if a variable as to be created.
 
         Notes:
             If `only_creation` is set, then literals will cause an error.
@@ -755,7 +785,7 @@ def _create_jax_var_list(
                 if (mapped_sdfg_name is None) and prevent_creation:
                     raise ValueError(f"prevent_creation' given but have to create '{jax_var}'.")
                 if mapped_sdfg_name is None:
-                    ret_list.append(self._add_array(arg=jax_var, update_var_mapping=True, **kwargs))
+                    ret_list.append(self.add_array(arg=jax_var, update_var_mapping=True, **kwargs))
                 elif only_creation:
                     raise ValueError(f"'only_creation' given '{jax_var}' already exists.")
                 else:
@@ -790,7 +820,7 @@ def _create_initial_input(
 
         # Handle the initial input arguments
         sdfg: dace.SDFG = self._sdfg
-        init_in_var_names: Sequence[str] = self._create_jax_var_list(  # type: ignore[assignment]
+        init_in_var_names: Sequence[str] = self.create_jax_var_list(  # type: ignore[assignment]
             jax_var_list=jaxpr.jaxpr.invars,
             only_creation=True,
             as_transient=True,  # Explicit transient; no error!
@@ -825,7 +855,7 @@ def _create_constants(
 
         const_names: list[str] = []
         for cJaxVar, cValue in zip(jaxpr.jaxpr.constvars, jaxpr.consts, strict=False):
-            c_sdfg_name = self._add_array(
+            c_sdfg_name = self.add_array(
                 arg=cJaxVar,
                 name_prefix="__const_",
                 as_transient=True,
@@ -869,7 +899,7 @@ def _allocate_translation_ctx(
             self._reserved_names = set()  # type: ignore[unreachable]
         elif not isinstance(self._reserved_names, set):
             raise RuntimeError("The reserved names are allocated incorrectly.")
-        return self._add_reserved_names(reserved_names)
+        return self.add_reserved_names(reserved_names)
 
     def _init_sub_translators(
         self,
@@ -909,10 +939,12 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
         """This function deallocate the translation context of `self`.
 
         Notes:
-            While it is allowed for outside code to call this explicitly function, it is is most likely an error.
-            If this function is called on a head translator, then the translation process ends.
-                This implies that all direct and indirect children, i.e. output of `self.fork()` must already be deallocated.
-                A further side effect is that now revision indexes will be reused.
+            While it is allowed for outside code to call this explicitly function,
+                it is is most likely an error.
+            If this function is called on a head translator, then the translation
+                process ends. This implies that all direct and indirect children,
+                i.e. output of `self.fork()` must already be deallocated. A further
+                side effect is that now revision indexes might be reused.
             If `self` is not allocated this function acts as a noops.
             The reserved names are only deallocated if `self` is a head translator.
         """
@@ -927,12 +959,14 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
 
         if self.is_head_translator():
             # We are the head translator thus we reset the revision manager.
-            #  Since this function is only called at the very end, we know that the translation process as a whole has finished.
-            #  We reset the state that the numbers are small again when we start anew.
+            #  Since this function is only called at the very end, we know that the translation
+            #  process as a whole has finished. We reset the state that the numbers are small
+            #  again when we start anew.
             self._rev_manager._reset_state()
 
-            # Freeing the reserved names only for heads make it more safe in case a child translator is reused.
-            #  On the other hand reusing a child translator is discouraged, but not forbidden.
+            # Freeing the reserved names only for heads make it more safe in case a child
+            #  translator is reused.c On the other hand reusing a child translator is
+            #  discouraged, but not forbidden.
             self._reserved_names = None  # type: ignore[assignment]
         return self
 
@@ -1005,12 +1039,12 @@ def _translate_single_eqn(
         # Input/Output variables
         #  Using a tuple for the input ensures that it is not modified.
         in_var_names: Sequence[str | None] = tuple(
-            self._create_jax_var_list(
+            self.create_jax_var_list(
                 eqn.invars,
                 prevent_creation=True,  # Inputs must already exists.
             )
         )
-        out_var_names: Sequence[str] = self._create_jax_var_list(  # type: ignore[assignment]
+        out_var_names: Sequence[str] = self.create_jax_var_list(  # type: ignore[assignment]
             eqn.outvars,
             only_creation=True,  # Output must not exist yet.
         )
@@ -1066,21 +1100,22 @@ def _translate_single_eqn(
                     f" maps to '{mapped_sdfg_name}'."
                 )
 
-        # Views can only be used if there is a direct connection, between source, view and destination (place of usage)
-        #  Because of the way how Jax works, it is impossible that an output variable is a View.
+        # Views can only be used if there is a direct connection, between source,
+        #  view and destination (place of usage). Because of the way how Jax works,
+        #  it is impossible that an output variable is a View.
         for outVarName, jax_var in zip(out_var_names, eqn.outvars, strict=True):
             sdfg_var = self.get_array(outVarName)
             if isinstance(sdfg_var, (dace.data.Array, dace.data.Scalar)):
                 pass
             elif isinstance(sdfg_var, dace.data.View):
                 raise TypeError(
-                    f"For the Jax variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}'),"
+                    f"For Jax variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}'),"
                     f" which is an output, you used a View, which is not possible."
                     " It must either be an array or a scalar."
                 )
             else:
                 raise NotImplementedError(
-                    f"The output variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}')"
+                    f"Output variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}')"
                     f" is of type '{type(sdfg_var).__name__}' which I does not know how to handle."
                 )
 
@@ -1095,9 +1130,11 @@ def _translate_jaxpr_internal(
     ) -> jtrutil.JaCeTranslationMemento:
         """Performs the actual translation of the Jaxpr into an SDFG.
 
-        The function assumes that the context is already allocated and the initial variables are already created.
-        The function will store the internal state of `self` into a memento and return it.
-        However, it will not deallocate the context of `self`, thus `self` and the memento share the same context in memory.
+        The function assumes that the context is already allocated and the initial
+        input variables were already created. The function will store the internal
+        state of `self` into a memento and return it.
+        However, it will not deallocate the translation context, thus `self`
+        and the memento share the same context in memory.
 
         Args:
             jaxpr:      The Jaxpr to translate.
@@ -1157,8 +1194,9 @@ def _handle_null_jaxpr(
     ) -> Sequence[str]:
         """This function is called in case a `Jaxpr` with zero equations is encountered.
 
-        A function with zero equation might still have output, in which case an input is copied to an output.
-        This function will handle the copying from the input into the corresponding output variable.
+        A function with zero equation might still have output, in which case an
+        input is copied to an output. This function will handle the copying from
+        the input into the corresponding output variable.
 
         Returns:
             The function returns a list denoting the SDFG variables that refers to the output.
@@ -1193,7 +1231,7 @@ def _handle_null_jaxpr(
             jax_out_name = f"_zero_equation_output_{self.map_jax_var_to_sdfg(jax_out_var)}"
 
             # Now create the SDFG variable for it, give it a unique name.
-            sdfg_out_name = self._add_array(
+            sdfg_out_name = self.add_array(
                 jax_out_var,
                 as_transient=True,
                 name_prefix="_zero_equation_output_for_",
@@ -1201,7 +1239,7 @@ def _handle_null_jaxpr(
             )
 
             # We now create a new mapping, we do this that we will later find the variable again.
-            self._add_jax_name_mapping(jax_var=jax_out_name, sdfg_name=sdfg_out_name)
+            self.add_jax_name_mapping(jax_var=jax_out_name, sdfg_name=sdfg_out_name)
             out_var_names.append(jax_out_name)
 
             # Now copy the input into the fake output variable.
@@ -1220,13 +1258,14 @@ def _handle_null_jaxpr(
     _forbidden_names: Final[set[str]] = {
         # These should be most of the C++ keywords, it is more important to have the short ones.
         #  Taken from 'https://learn.microsoft.com/en-us/cpp/cpp/keywords-cpp?view=msvc-170'
-        'alignas', 'alignof', 'and', 'asm', 'auto', 'bitand', 'bitor', 'bool', 'break', 'case', 'catch',
-        'char', 'class', 'compl', 'concept', 'const', 'consteval', 'constexpr', 'constinit', 'continue',
-        'decltype', 'default', 'delete', 'directive', 'do', 'double', 'else', 'enum', 'explicit', 'export',
-        'extern', 'false', 'float', 'for', 'friend', 'goto', 'if', 'inline', 'int', 'long', 'mutable',
-        'namespace', 'new', 'noexcept', 'not', 'nullptr', 'operator', 'or', 'private', 'protected',
-        'public', 'register', 'requires', 'return', 'short', 'signed', 'sizeof', 'static', 'struct',
-        'switch', 'template', 'this', 'throw', 'true', 'try', 'typedef', 'typeid', 'typename', 'union',
-        'unsigned', 'using', 'virtual', 'void', 'volatile', 'while', 'xor', 'std',
+        'alignas', 'alignof', 'and', 'asm', 'auto', 'bitand', 'bitor', 'bool', 'break', 'case',
+        'catch', 'char', 'class', 'compl', 'concept', 'const', 'consteval', 'constexpr',
+        'constinit', 'continue', 'decltype', 'default', 'delete', 'directive', 'do', 'double',
+        'else', 'enum', 'explicit', 'export', 'extern', 'false', 'float', 'for', 'friend',
+        'goto', 'if', 'inline', 'int', 'long', 'mutable', 'namespace', 'new', 'noexcept', 'not',
+        'nullptr', 'operator', 'or', 'private', 'protected', 'public', 'register', 'requires',
+        'return', 'short', 'signed', 'sizeof', 'static', 'struct', 'switch', 'template', 'this',
+        'throw', 'true', 'try', 'typedef', 'typeid', 'typename', 'union', 'unsigned', 'using',
+        'virtual', 'void', 'volatile', 'while', 'xor', 'std',
     }
     # fmt: on
diff --git a/src/jace/translator/util/jace_translation_memento.py b/src/jace/translator/util/jace_translation_memento.py
index 93d11af..d551082 100644
--- a/src/jace/translator/util/jace_translation_memento.py
+++ b/src/jace/translator/util/jace_translation_memento.py
@@ -16,15 +16,17 @@
 
 @dataclass(init=True, repr=True, eq=False, frozen=True, kw_only=True, slots=True)
 class JaCeTranslationMemento:
-    """Encapsulates the result of a translation run of the 'JaxprTranslationDriver' object.
+    """Encapsulates the result of a translation run of the `JaxprTranslationDriver` object.
 
     It defines the following members:
-    - 'sdfg' the SDFG object that was created.
-    - 'start_state' the first state in the SDFG state machine.
-    - 'terminal_state' the last state in the state machine.
-    - 'jax_name_map' a 'dict' that maps every Jax name to its corresponding SDFG variable name.
-    - 'inp_names' a 'list' of the SDFG variables that are used as input, in the same order as 'Jaxpr.invars'.
-    - 'out_names' a 'list' of the SDFG variables that are used as output, in the same order as 'Jaxpr.outvars'.
+    - `sdfg` the SDFG object that was created.
+    - `start_state` the first state in the SDFG state machine.
+    - `terminal_state` the last state in the state machine.
+    - `jax_name_map` a `dict` that maps every Jax name to its corresponding SDFG variable name.
+    - `inp_names` a `list` of the SDFG variables that are used as input,
+            in the same order as `Jaxpr.invars`.
+    - `out_names` a `list` of the SDFG variables that are used as output,
+            in the same order as `Jaxpr.outvars`.
     """
 
     sdfg: dace.SDFG
@@ -37,7 +39,8 @@ class JaCeTranslationMemento:
     def validate(self) -> bool:
         """Validate the underlying SDFG."""
 
-        # To prevent the 'non initialized' data warnings we have to temporary promote the input arguments as global.
+        # To prevent the 'non initialized' data warnings we have to temporary promote the
+        #  input arguments as global.
         org_trans_state: dict[str, bool] = {}
         for var in self.inp_names:
             org_trans_state[var] = self.sdfg.arrays[var].transient
diff --git a/src/jace/translator/util/revision_counter.py b/src/jace/translator/util/revision_counter.py
index e6531bc..661ab22 100644
--- a/src/jace/translator/util/revision_counter.py
+++ b/src/jace/translator/util/revision_counter.py
@@ -14,13 +14,13 @@ class RevisionCounterManager:
     """This class acts as a manager for revision counters.
 
     It is intended as a shared object and each new object that needs a revision,
-    simply calls 'assign_revision()' to get the new one.
+    simply calls `assign_revision()` to get the new one.
     """
 
     __slots__ = ("_next_revision",)
 
-    """The revision value of the very first call to 'assign_revision()'.
-    This revision is only assigned once."""
+    # The revision value of the very first call to `assign_revision()`.
+    #  This revision is only assigned once.
     ROOT_REVISION: Final[int] = 0
 
     def __init__(self) -> None:
@@ -38,8 +38,9 @@ def _reset_state(self) -> RevisionCounterManager:
 
         Notes:
             Calling this function is almost always an error.
-            This function does not restore the state right after initialization, but one call after 'assign_revision()'.
-                This is done to ensure that there is one single initial revision.
+            This function does not restore the state right after initialization,
+                but one call after `assign_revision()`. This is done to ensure
+                that there is one single root revision index.
         """
         self._next_revision = self.ROOT_REVISION
         _ = self.assign_revision()  # Ensure that we throw away the root
@@ -49,5 +50,5 @@ def is_root_revision(
         self,
         rev: int,
     ) -> bool:
-        """This function checks if 'rev' revers to the (absolute) unique revision of the root."""
+        """This function checks if `rev` revers to the (absolute) unique revision of the root."""
         return rev == self.ROOT_REVISION
diff --git a/src/jace/translator/util/subtranslator_helper_order.py b/src/jace/translator/util/subtranslator_helper_order.py
index e90697b..4543613 100644
--- a/src/jace/translator/util/subtranslator_helper_order.py
+++ b/src/jace/translator/util/subtranslator_helper_order.py
@@ -19,17 +19,15 @@ def sort_subtranslators(
 
     The function ensures the following:
     - All subtranslators that have default priority are at the end.
-    - All subtranslators whose 'get_priority()' returns 'NotImplemented' are at the begin of the list.
-        These subtranslators are ordered according to their '__lt__()' function.
-    - All subtranslators whose 'get_priority()' function returns an integer are in the middle,
-        ordered according to this value.
+    - All subtranslators whose `get_priority()` returns `NotImplemented`
+        are at the begin of the list. These subtranslators are ordered according
+        to their `__lt__()` function.
+    - All subtranslators whose `get_priority()` function returns an integer are
+        in the middle, ordered according to this value.
     """
     if len(subtranslators) <= 1:
         return subtranslators
-    subtranslators = [
-        subtranslator.get()
-        for subtranslator in sorted(map(_SubtranslatorOrderingHelper, subtranslators))
-    ]
+    subtranslators = sorted(subtranslators, key=_SubtranslatorOrderingHelper)
     assert (len(subtranslators) <= 1) or all(
         subtranslators[i - 1].has_default_priority() <= subtranslators[i].has_default_priority()
         for i in range(1, len(subtranslators))
@@ -38,9 +36,13 @@ def sort_subtranslators(
 
 
 class _SubtranslatorOrderingHelper:
-    """This is a helper class that is used by 'JaxprTranslationDriver' to bring the subtranslators in the correct order.
+    """Helper class used by `JaxprTranslationDriver` to bring the subtranslators in the correct order.
 
-    Essentially it is a wrapper around a subtranslator that handles the different ordering correct.
+    Essentially it is a wrapper that contains the additional logic that is needed for sorting.
+    This way subclasses does not need to implement it themselves.
+
+    Notes:
+        This class does not implement the other comparison function as requested by PEP8.
     """
 
     def __init__(self, subtranslator: translator.JaCeSubTranslatorInterface):
@@ -56,18 +58,18 @@ def __lt__(
     ) -> bool:
         # Default priority means that it will always go to the end.
         if self._sub.has_default_priority():
-            return False  # 'self' has default priority, so it must go to the end.
+            return False  # `self` has default priority, so it must go to the end.
         if other._sub.has_default_priority():
-            return True  # 'self' does not have default prio, thus it _must_ go before 'other'.
+            return True  # `self` does not have default prio, thus it _must_ go before `other`.
         prio_self = self._sub.get_priority()  # Get the priorities of the subtranslators.
         prio_other = other._sub.get_priority()
         if all(prio is NotImplemented for prio in (prio_self, prio_other)):
-            # None has a prio, 'self' should decide if it should go first.
+            # None has a prio, `self` should decide if it should go first.
             x = self._sub.__lt__(other._sub)
             assert isinstance(x, bool)
             return x
         # In case only one has a priority, we change the order such that the one that implements
-        #  a '__lt__()' goes first.
+        #  a `__lt__()` goes first.
         if prio_self is NotImplemented:
             assert isinstance(prio_other, int)
             return True
diff --git a/src/jace/util/dace.py b/src/jace/util/dace.py
index 90300d7..1c75a55 100644
--- a/src/jace/util/dace.py
+++ b/src/jace/util/dace.py
@@ -7,7 +7,8 @@
 
 """Implements all utility functions that are related to DaCe.
 
-Most of the functions defined here allow an unified access to DaCe's internals in a consistent and centralized way.
+Most of the functions defined here allow an unified access to DaCe's internals
+in a consistent and stable way.
 """
 
 from __future__ import annotations
diff --git a/src/jace/util/jax.py b/src/jace/util/jax.py
index 4379a8a..3a7ed06 100644
--- a/src/jace/util/jax.py
+++ b/src/jace/util/jax.py
@@ -7,7 +7,8 @@
 
 """Implements all utility functions that are related to Jax.
 
-Most of the functions defined here allow an unified access to Jax' internals in a consistent and centralized way.
+Most of the functions defined here allow an unified access to Jax' internals
+in a consistent and stable way.
 """
 
 from __future__ import annotations
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index 407a153..d728be5 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -15,7 +15,7 @@ def ensure_iterability(
     x: Any,
     ign_str: bool = True,
 ) -> Iterable[Any]:
-    """Ensures that 'x' is iterable.
+    """Ensures that `x` is iterable.
 
     By default strings are _not_ considered iterable.
 

From 18e1f0d6e5e96bebca4c1016f499f8061c310b7d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 21 Apr 2024 12:59:27 +0200
Subject: [PATCH 021/458] Made some more updates.

---
 .../jace_subtranslator_interface.py           |  3 +--
 .../translator/sub_translators/__init__.py    | 21 +++++++++++++------
 .../util/subtranslator_helper_order.py        |  4 ++--
 3 files changed, 18 insertions(+), 10 deletions(-)

diff --git a/src/jace/translator/jace_subtranslator_interface.py b/src/jace/translator/jace_subtranslator_interface.py
index 73b49f7..3c1dbb7 100644
--- a/src/jace/translator/jace_subtranslator_interface.py
+++ b/src/jace/translator/jace_subtranslator_interface.py
@@ -150,7 +150,7 @@ def translate_jaxeqn(
         - The driver will create a new terminal state and pass it as
             `eqn_state` argument. This state is guaranteed to be empty and
             `translator.get_terminal_sdfg_state() is eqn_state` holds.
-        
+
         Then the subtranslator is called. Usually a subtranslator should
         construct the dataflow graph inside it. It is allowed that the
         subtranslators creates more states if needed, but this state machine
@@ -160,7 +160,6 @@ def translate_jaxeqn(
         subtranslator was able to fully construct the dataflow graph
         within `eqn_state`.
 
-
         While a subtranslator is forbidden from meddling with the input
         variables mentioned in `in_var_names` in any way, it is allowed to
         modify the output variables. For example he could create a new
diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
index 8acfffc..f03144e 100644
--- a/src/jace/translator/sub_translators/__init__.py
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -22,7 +22,7 @@
     ALUTranslator,
 ]
 
-# List of the externally supplied subtranslator implementation.
+# All externally supplied subtranslator implementation.
 #  It is a `dict` to do fast access and remember the order, value is always `None`.
 #  The list is manipulated through `{add,rm}_subtranslator()`.
 _EXTERNAL_SUBTRANSLATORS: dict[type[jtrans.JaCeSubTranslatorInterface], None] = {}
@@ -31,7 +31,7 @@
 def add_subtranslator(
     subtrans: type[jtrans.JaCeSubTranslatorInterface],
 ) -> bool:
-    """Add `subtrans` to the internal list of externally supplied subtranslators.
+    """Add `subtrans` to the externally defined subtranslators.
 
     The function returns `True` if it was added and `False` is not.
     """
@@ -51,7 +51,7 @@ def rm_subtranslator(
     subtrans: type[jtrans.JaCeSubTranslatorInterface],
     strict: bool = False,
 ) -> bool:
-    """Removes subtranslator `subtrans` from the list of known subtranslators.
+    """Remove `subtrans` as externally defined subtranslators.
 
     If `subtrans` is not known no error is generated unless `strict` is set to `True`.
     """
@@ -67,17 +67,26 @@ def _get_subtranslators_cls(
     with_external: bool = True,
     builtins: bool = True,
 ) -> Sequence[type[jtrans.JaCeSubTranslatorInterface]]:
-    """Returns a list of all subtranslator classes in JaCe.
+    """Returns the list of all subtranslator known to JaCe.
 
     Args:
         with_external:  Include the translators that were externally supplied.
         builtins:       Include the build in translators.
+
+    Notes:
+        If the externally defined subtranslators are requested they will be
+            first and ordered as FILO order.
     """
+    # It is important that the externally defined are ordered before the builtins
+    #  and are ordered in FILO order, especuially if multiple subtranslator per
+    #  primitive are registered. Because this way they are inserted first
+    #  into the internal list of the driver, and furthermore since `sorted()`
+    #  is stable they will tend to end up more to the front.
     ret: list[type[jtrans.JaCeSubTranslatorInterface]] = []
+    if with_external:
+        ret.extend(reversed(_EXTERNAL_SUBTRANSLATORS.keys()))
     if builtins:
         ret.extend(_BUILTIN_SUBTRANSLATORS)
-    if with_external:
-        ret.extend(_EXTERNAL_SUBTRANSLATORS.keys())
     return ret
 
 
diff --git a/src/jace/translator/util/subtranslator_helper_order.py b/src/jace/translator/util/subtranslator_helper_order.py
index 4543613..767521a 100644
--- a/src/jace/translator/util/subtranslator_helper_order.py
+++ b/src/jace/translator/util/subtranslator_helper_order.py
@@ -38,8 +38,8 @@ def sort_subtranslators(
 class _SubtranslatorOrderingHelper:
     """Helper class used by `JaxprTranslationDriver` to bring the subtranslators in the correct order.
 
-    Essentially it is a wrapper that contains the additional logic that is needed for sorting.
-    This way subclasses does not need to implement it themselves.
+    Essentially it is a wrapper that contains the additional logic that is
+    needed for sorting. This way subclasses does not need to implement it themselves.
 
     Notes:
         This class does not implement the other comparison function as requested by PEP8.

From cc7f5f749cdbdf7ec600c6d16c5d97a3d79cb5e2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 21 Apr 2024 13:02:36 +0200
Subject: [PATCH 022/458] Forgot to rerun the formater.

---
 src/jace/translator/jace_subtranslator_interface.py | 2 +-
 src/jace/translator/jaxpr_translator_driver.py      | 6 ++++--
 2 files changed, 5 insertions(+), 3 deletions(-)

diff --git a/src/jace/translator/jace_subtranslator_interface.py b/src/jace/translator/jace_subtranslator_interface.py
index 3c1dbb7..0178755 100644
--- a/src/jace/translator/jace_subtranslator_interface.py
+++ b/src/jace/translator/jace_subtranslator_interface.py
@@ -32,7 +32,7 @@ class JaCeSubTranslatorInterface:
 
     Subtranslators are rather simple objects that only have to perform
     the translation. The translation process itself is managed by a driver
-    object, which owns and manage the subtranslators.   
+    object, which owns and manage the subtranslators.
     In the end this implements the delegation pattern.
 
     A subtranslator uses its `get_handled_primitives()` function to indicate
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 6ef5086..b1a4eba 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -473,7 +473,8 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
         if not isinstance(dcd_type, dace.dtypes.typeclass):
             raise TypeError(
                 f"Expected that '{nameof_dtype}' would map to a 'dace.typeclass'"
-                f"but it mapped to a '{type(dcd_type).__name__}'.")
+                f"but it mapped to a '{type(dcd_type).__name__}'."
+            )
 
         return dcd_type
 
@@ -503,7 +504,8 @@ def add_jax_name_mapping(
                 return self
             raise ValueError(
                 f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but '{jax_name}'"
-                f" already points to '{self.map_jax_var_to_sdfg(jax_name)}'.")
+                f" already points to '{self.map_jax_var_to_sdfg(jax_name)}'."
+            )
         if sdfg_name not in self.get_arrays():
             raise KeyError(f"Mapping '{jax_name} -> {sdfg_name}': SDFG target unknown.")
         if sdfg_name in self._forbidden_names:

From 771beb171481a39863e47f3084c1223e323e7e6d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 21 Apr 2024 13:07:19 +0200
Subject: [PATCH 023/458] First part of the initial infrastructure.

---
 src/jace/__about__.py                         |  23 ++
 src/jace/__init__.py                          |  10 +-
 src/jace/translator/__init__.py               |  19 ++
 .../jace_subtranslator_interface.py           | 294 ++++++++++++++++++
 .../translator/sub_translators/__init__.py    |  93 ++++++
 src/jace/translator/util/__init__.py          |  22 ++
 .../util/jace_translation_memento.py          |  76 +++++
 src/jace/translator/util/revision_counter.py  |  54 ++++
 .../util/subtranslator_helper_order.py        |  80 +++++
 src/jace/translator/util/util.py              |  21 ++
 src/jace/util/__init__.py                     |  19 ++
 src/jace/util/dace.py                         |  14 +
 src/jace/util/jax.py                          |  44 +++
 src/jace/util/util.py                         |  30 ++
 14 files changed, 797 insertions(+), 2 deletions(-)
 create mode 100644 src/jace/__about__.py
 create mode 100644 src/jace/translator/__init__.py
 create mode 100644 src/jace/translator/jace_subtranslator_interface.py
 create mode 100644 src/jace/translator/sub_translators/__init__.py
 create mode 100644 src/jace/translator/util/__init__.py
 create mode 100644 src/jace/translator/util/jace_translation_memento.py
 create mode 100644 src/jace/translator/util/revision_counter.py
 create mode 100644 src/jace/translator/util/subtranslator_helper_order.py
 create mode 100644 src/jace/translator/util/util.py
 create mode 100644 src/jace/util/__init__.py
 create mode 100644 src/jace/util/dace.py
 create mode 100644 src/jace/util/jax.py
 create mode 100644 src/jace/util/util.py

diff --git a/src/jace/__about__.py b/src/jace/__about__.py
new file mode 100644
index 0000000..437e86b
--- /dev/null
+++ b/src/jace/__about__.py
@@ -0,0 +1,23 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Package metadata: version, authors, license and copyright."""
+
+from __future__ import annotations
+
+from typing import Final
+
+from packaging import version as pkg_version
+
+
+__all__ = ["__author__", "__copyright__", "__license__", "__version__", "__version_info__"]
+
+__author__: Final = "ETH Zurich and individual contributors"
+__copyright__: Final = "Copyright (c) 2024 ETH Zurich"
+__license__: Final = "BSD-3-Clause-License"
+__version__: Final = "0.0.1"
+__version_info__: Final = pkg_version.parse(__version__)
diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 56f6505..cf7b6ae 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -11,7 +11,13 @@
 
 from __future__ import annotations
 
+from .__about__ import __author__, __copyright__, __license__, __version__, __version_info__
 
-__version__ = "0.1.0"
 
-__all__ = ["__version__"]
+__all__ = [
+    "__author__",
+    "__copyright__",
+    "__license__",
+    "__version__",
+    "__version_info__",
+]
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
new file mode 100644
index 0000000..71b567b
--- /dev/null
+++ b/src/jace/translator/__init__.py
@@ -0,0 +1,19 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Subpackage containing all the code related to Jaxpr translation"""
+
+from __future__ import annotations
+
+from .jace_subtranslator_interface import JaCeSubTranslatorInterface
+from .jaxpr_translator_driver import JaxprTranslationDriver
+
+
+__all__ = [
+    "JaCeSubTranslatorInterface",
+    "JaxprTranslationDriver",
+]
diff --git a/src/jace/translator/jace_subtranslator_interface.py b/src/jace/translator/jace_subtranslator_interface.py
new file mode 100644
index 0000000..0178755
--- /dev/null
+++ b/src/jace/translator/jace_subtranslator_interface.py
@@ -0,0 +1,294 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+from __future__ import annotations
+
+from collections.abc import Collection, Sequence
+from typing import TYPE_CHECKING, Any, Final, final
+
+import dace
+from jax import core as jcore
+
+
+if TYPE_CHECKING:
+    from .jaxpr_translator_driver import JaxprTranslationDriver
+
+
+class JaCeSubTranslatorInterface:
+    """Interface for all Jax primitive/intrinsic subtranslators.
+
+    A translator for a primitive, sometimes also called intrinsic, translates
+    a single equation of a Jaxpr into its SDFG equivalent. A type that
+    implements this interface must fulfil the following properties:
+    - It must be stateless.
+        It is still possible and explicitly allowed to have an
+        immutable configuration state.
+    - All subclasses has to accept `**kwargs` arguments and must
+        forward all unconsumed arguments to the base.
+
+    Subtranslators are rather simple objects that only have to perform
+    the translation. The translation process itself is managed by a driver
+    object, which owns and manage the subtranslators.
+    In the end this implements the delegation pattern.
+
+    A subtranslator uses its `get_handled_primitives()` function to indicate
+    for which Jax primitives it want to register. It is important that a
+    subtranslator can register for as many primitive it wants. At the same
+    time, it is possible that multiple subtranslators have registered for a
+    single primitive.
+
+    If multiple subtranslator have registered for the same primitive they
+    will be ordered by driver. There are two ways how a subtranslator can
+    influence this order. The first one is by implementing `get_priority()`,
+    the driver will then put them in ascending order.
+    I.e. the lower its priority the earlier a subtranslator is checked.
+    However, if a subtranslator returns the special value
+    `JaCeSubTranslatorInterface.DEFAULT_PRIORITY` it will be always put at the
+    end, in unspecific order if multiple translator are involved.
+
+    The second possibility is to override the '__lt__()' function,
+    and establish a strict weak order. If a subtranslator overrides this
+    function it should also override `get_priority()` to return `NotImplemented`.
+
+    To decide which subtranslator should be used for a specific equation
+    the driver will use their 'can_translate_jaxeqn()' function.
+    The first subtranslator that returns 'True' will then be used.
+
+    Todo:
+        Also come up with a way how to avoid that instances are allowed to access
+            some private members of the driver; Possibly by composition.
+        Come up with a better way of ordering; maybe introduce fixed priority level.
+            And then allows to sort them according to `__lt__()` within the level.
+    """
+
+    __slots__ = ()
+
+    # Default value for the priority of primitive translators.
+    DEFAULT_PRIORITY: Final = int("1" * 64, base=2)
+
+    def __init__(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> None:
+        """Initialize the interface.
+
+        It is required that subclasses calls this method during initialization.
+        """
+
+    def get_handled_primitives(self) -> Collection[str] | str:
+        """Returns the names of all Jax primitives that `self` is able to handle.
+
+        There is no limit on the number of primitives for which a subtranslator
+        can register. It is possible that several translators can be registered
+        for the same name.
+
+        See Also:
+            `self.can_translate_jaxeqn()` and `self.get_priority()`.
+
+        Notes:
+            In case a string is returned it is interpreted as 1 element collection.
+        """
+        raise NotImplementedError(
+            "Class '{type(self).__name__}' does not implement 'get_handled_primitives()'."
+        )
+
+    def can_translate_jaxeqn(
+        self,
+        driver: JaxprTranslationDriver,
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jcore.JaxprEqn,
+    ) -> bool:
+        """Tests if `self` is able to translate the Jax primitive passed as `eqn`.
+
+        This function is used by the driver to determine which of the subtranslators,
+        that have registered for a certain type of primitive, should be used.
+        For a more detailed description of the arguments see
+        `self.translate_jaxeqn()` function.
+
+        Args:
+            driver:         The driver object of the translation.
+            in_var_names:   Names of the SDFG variables used as inputs for the primitive.
+            out_var_names:  Names of the SDFG variables used as outputs for the primitive.
+            eqn:            The `jcore.JaxprEqn` instance that is currently being handled.
+
+        Notes:
+            In case there is only one subtranslator registered for a certain primitive,
+                it is unspecific if this function will be called at all `self.translate_jaxeqn()`.
+            This function will never be called for a primitive for which it has not registered itself.
+        """
+        raise NotImplementedError(
+            "Class '{type(self).__name__}' does not implement 'can_translate_jaxeqn()'."
+        )
+
+    def translate_jaxeqn(
+        self,
+        driver: JaxprTranslationDriver,
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jcore.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> dace.SDFGState | None:
+        """Translates the Jax primitive into its SDFG equivalent.
+
+        Before the driver calls this function it will perform the following
+        preparatory tasks:
+        - It will allocate the SDFG variables that are used as outputs.
+            Their names will be passed through the `out_var_names` argument,
+            in the same order as `eqn.outvars`.
+        - It will collect the names of the SDFG variables that are used as input
+            and place them in `in_var_names`, in the same order as `eqn.invars`.
+            If an input argument refers to a literal no SDFG variable is created
+            for it and `None` is passed to indicate this.
+        - The subtranslator will create variables that are used as output.
+            They are passed as `out_var_names`, same order as in the equation.
+        - The driver will create a new terminal state and pass it as
+            `eqn_state` argument. This state is guaranteed to be empty and
+            `translator.get_terminal_sdfg_state() is eqn_state` holds.
+
+        Then the subtranslator is called. Usually a subtranslator should
+        construct the dataflow graph inside it. It is allowed that the
+        subtranslators creates more states if needed, but this state machine
+        has to have a single terminal state, which must be returned
+        and reachable from `eqn_state`.
+        If the function returns `None` the driver will assume that
+        subtranslator was able to fully construct the dataflow graph
+        within `eqn_state`.
+
+        While a subtranslator is forbidden from meddling with the input
+        variables mentioned in `in_var_names` in any way, it is allowed to
+        modify the output variables. For example he could create a new
+        SDFG variable, with different strides. But in that case the
+        subtranslator must update the internal mapping of the driver TBA HOW,
+        and modify the mapping in `out_var_names`.
+        However, the subtranslator is allowed to create internal temporary
+        variables. It just have to ensure that no name collision will occur,
+        a way to do this is to use a passed variable name as prefix.
+
+
+        Args:
+            driver:         The driver object of the translation.
+            in_var_names:   List of the names of the arrays created inside the
+                                SDFG for the inpts or `None` in case of a literal.
+            out_var_names:  List of the names of the arrays created inside the
+                                SDFG for the outputs.
+            eqn:            The Jax primitive that should be translated.
+            eqn_state:      State into which the primitive`s SDFG representation
+                                should be constructed.
+        """
+        raise NotImplementedError(
+            "Class '{type(self).__name__}' does not implement 'translate_jaxeqn()'."
+        )
+
+    def get_priority(self) -> int:
+        """Returns the priority of this translator.
+
+        The value returned by this function is used by the driver to order the
+        subtranslators that have registered for the same primitive.
+        The _smaller_ the value the earlier it is checked.
+
+        See Also:
+            `self.can_translate_jaxeqn()` and `self.get_handled_primitives()`.
+
+        Notes:
+            By default the function returns `self.DEFAULT_PRIORITY`, which is
+                handled specially, i.e. it is put at the end.
+            If a subtranslator instead overrides `__lt__()` this function
+                should return `NotImplemented`.
+        """
+        return self.DEFAULT_PRIORITY
+
+    def has_default_priority(self) -> bool:
+        """Checks if `self` has default priority.
+
+        Notes:
+            It is allowed, but not advised to override this function.
+                However, it has to be consistent with `self.get_priority()`.
+        """
+        try:
+            x = self.get_priority()
+        except NotImplementedError:
+            return False
+        if x is NotImplemented:
+            return False
+        return x == self.DEFAULT_PRIORITY
+
+    def __lt__(
+        self,
+        other: JaCeSubTranslatorInterface,
+    ) -> bool:
+        """Tests if `self` should be checked before `other` in the selection process.
+
+        As outlined in the class description this is the second possibility to
+        influence the order of the subtranslator. This function should return
+        `True` if `self` should be checked for applicability _before_ `other`.
+
+        Notes:
+            If this function is overridden `get_priority()` should return `NotImplemented`.
+            This function is never called if either `self` or `other` have default priority.
+        """
+        return self.get_priority() < other.get_priority()
+
+    def __eq__(
+        self,
+        other: Any,
+    ) -> bool:
+        """Tests if two subtranslators are equal.
+
+        The default implementation checks if `self` and `other` have the same
+        type. However, if the behaviour of a subtranslator strongly depend on
+        its configuration this function should be overridden.
+
+        Notes:
+            If you override this function you should also override
+                `self.__hash__()` to make the two consistent.
+        """
+        if not isinstance(other, JaCeSubTranslatorInterface):
+            return NotImplemented
+        return type(self) == type(other)
+
+    def __hash__(self) -> int:
+        """Computes the hash of the subtranslator.
+
+        The default implementation return a hash that is based on the class.
+        Thus all instances of a particular subtranslator will have the same
+        hash value.
+
+        Notes:
+            If you override this function you should also override
+                `self.__eq__()` to make the two consistent.
+        """
+        return id(self.__class__)
+
+    @final
+    def __ne__(
+        self,
+        other: Any,
+    ) -> bool:
+        return NotImplemented
+
+    @final
+    def __le__(
+        self,
+        other: Any,
+    ) -> bool:
+        return NotImplemented
+
+    @final
+    def __ge__(
+        self,
+        other: Any,
+    ) -> bool:
+        return NotImplemented
+
+    @final
+    def __gt__(
+        self,
+        other: Any,
+    ) -> bool:
+        return NotImplemented
diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
new file mode 100644
index 0000000..a226de1
--- /dev/null
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -0,0 +1,93 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Module collecting all built-in subtranslators."""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+from typing import Final
+
+from jace import translator as jtrans
+
+
+# List of all subtranslators that ships with JaCe.
+_BUILTIN_SUBTRANSLATORS: Final[list[type[jtrans.JaCeSubTranslatorInterface]]] = [
+]
+
+# All externally supplied subtranslator implementation.
+#  It is a `dict` to do fast access and remember the order, value is always `None`.
+#  The list is manipulated through `{add,rm}_subtranslator()`.
+_EXTERNAL_SUBTRANSLATORS: dict[type[jtrans.JaCeSubTranslatorInterface], None] = {}
+
+
+def add_subtranslator(
+    subtrans: type[jtrans.JaCeSubTranslatorInterface],
+) -> bool:
+    """Add `subtrans` to the externally defined subtranslators.
+
+    The function returns `True` if it was added and `False` is not.
+    """
+    from inspect import isclass
+
+    if subtrans in _EXTERNAL_SUBTRANSLATORS:
+        return False
+    if not isclass(subtrans):
+        return False
+    if not issubclass(subtrans, jtrans.JaCeSubTranslatorInterface):
+        return False
+    _EXTERNAL_SUBTRANSLATORS[subtrans] = None
+    return True
+
+
+def rm_subtranslator(
+    subtrans: type[jtrans.JaCeSubTranslatorInterface],
+    strict: bool = False,
+) -> bool:
+    """Remove `subtrans` as externally defined subtranslators.
+
+    If `subtrans` is not known no error is generated unless `strict` is set to `True`.
+    """
+    if subtrans not in _EXTERNAL_SUBTRANSLATORS:
+        if strict:
+            raise KeyError(f"Subtranslator '{type(subtrans)}' is not known.")
+        return False
+    del _EXTERNAL_SUBTRANSLATORS[subtrans]
+    return True
+
+
+def _get_subtranslators_cls(
+    with_external: bool = True,
+    builtins: bool = True,
+) -> Sequence[type[jtrans.JaCeSubTranslatorInterface]]:
+    """Returns the list of all subtranslator known to JaCe.
+
+    Args:
+        with_external:  Include the translators that were externally supplied.
+        builtins:       Include the build in translators.
+
+    Notes:
+        If the externally defined subtranslators are requested they will be
+            first and ordered as FILO order.
+    """
+    # It is important that the externally defined are ordered before the builtins
+    #  and are ordered in FILO order, especuially if multiple subtranslator per
+    #  primitive are registered. Because this way they are inserted first
+    #  into the internal list of the driver, and furthermore since `sorted()`
+    #  is stable they will tend to end up more to the front.
+    ret: list[type[jtrans.JaCeSubTranslatorInterface]] = []
+    if with_external:
+        ret.extend(reversed(_EXTERNAL_SUBTRANSLATORS.keys()))
+    if builtins:
+        ret.extend(_BUILTIN_SUBTRANSLATORS)
+    return ret
+
+
+__all__ = [
+    "add_subtranslator",
+    "rm_subtranslator",
+]
diff --git a/src/jace/translator/util/__init__.py b/src/jace/translator/util/__init__.py
new file mode 100644
index 0000000..910589e
--- /dev/null
+++ b/src/jace/translator/util/__init__.py
@@ -0,0 +1,22 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Subpackage containing all utilities related to the translators."""
+
+from __future__ import annotations
+
+from .jace_translation_memento import JaCeTranslationMemento
+from .revision_counter import RevisionCounterManager
+from .util import list_to_dict
+
+
+# Q: Is there a way to import everything from `.util` and put it into `__all__` without writing it manually?
+__all__ = [
+    "JaCeTranslationMemento",
+    "RevisionCounterManager",
+    "list_to_dict",
+]
diff --git a/src/jace/translator/util/jace_translation_memento.py b/src/jace/translator/util/jace_translation_memento.py
new file mode 100644
index 0000000..d551082
--- /dev/null
+++ b/src/jace/translator/util/jace_translation_memento.py
@@ -0,0 +1,76 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+from __future__ import annotations
+
+from collections.abc import Mapping, Sequence
+from dataclasses import dataclass
+from typing import Any
+
+import dace
+
+
+@dataclass(init=True, repr=True, eq=False, frozen=True, kw_only=True, slots=True)
+class JaCeTranslationMemento:
+    """Encapsulates the result of a translation run of the `JaxprTranslationDriver` object.
+
+    It defines the following members:
+    - `sdfg` the SDFG object that was created.
+    - `start_state` the first state in the SDFG state machine.
+    - `terminal_state` the last state in the state machine.
+    - `jax_name_map` a `dict` that maps every Jax name to its corresponding SDFG variable name.
+    - `inp_names` a `list` of the SDFG variables that are used as input,
+            in the same order as `Jaxpr.invars`.
+    - `out_names` a `list` of the SDFG variables that are used as output,
+            in the same order as `Jaxpr.outvars`.
+    """
+
+    sdfg: dace.SDFG
+    start_state: dace.SDFGState
+    terminal_state: dace.SDFGState
+    jax_name_map: Mapping[str, str]
+    inp_names: Sequence[str]
+    out_names: Sequence[str]
+
+    def validate(self) -> bool:
+        """Validate the underlying SDFG."""
+
+        # To prevent the 'non initialized' data warnings we have to temporary promote the
+        #  input arguments as global.
+        org_trans_state: dict[str, bool] = {}
+        for var in self.inp_names:
+            org_trans_state[var] = self.sdfg.arrays[var].transient
+            self.sdfg.arrays[var].transient = False
+        try:
+            self.sdfg.validate()
+        finally:
+            for var, orgValue in org_trans_state.items():
+                self.sdfg.arrays[var].transient = orgValue
+        return True
+
+    def __getitem__(self, idx: str) -> Any:
+        """Allows member access using brackets."""
+        if not isinstance(idx, str):
+            raise TypeError(f"Expected 'idx' as 'str' but got '{type(str)}'")
+        if not hasattr(self, idx):
+            raise KeyError(f"The key '{idx}' is not known.")
+        return getattr(self, idx)
+
+    def __hash__(self) -> int:
+        """Computes the hash of the underlying SDFG object."""
+        return hash(self.sdfg)
+
+    def __eq__(self, other: Any) -> bool:
+        """Compares the underlying SDFG object with 'rhs'."""
+        if isinstance(other, JaCeTranslationMemento):
+            return bool(self.sdfg == other.sdfg)
+        if hasattr(other, "__sdfg__"):
+            other = other.__sdfg__()
+        elif not isinstance(other, dace.SDFG):
+            return NotImplemented
+        x: bool = self.sdfg.__eq__(other)
+        return x
diff --git a/src/jace/translator/util/revision_counter.py b/src/jace/translator/util/revision_counter.py
new file mode 100644
index 0000000..661ab22
--- /dev/null
+++ b/src/jace/translator/util/revision_counter.py
@@ -0,0 +1,54 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+from __future__ import annotations
+
+from typing import Final
+
+
+class RevisionCounterManager:
+    """This class acts as a manager for revision counters.
+
+    It is intended as a shared object and each new object that needs a revision,
+    simply calls `assign_revision()` to get the new one.
+    """
+
+    __slots__ = ("_next_revision",)
+
+    # The revision value of the very first call to `assign_revision()`.
+    #  This revision is only assigned once.
+    ROOT_REVISION: Final[int] = 0
+
+    def __init__(self) -> None:
+        """Creates a revision counter manager."""
+        self._next_revision = self.ROOT_REVISION
+
+    def assign_revision(self) -> int:
+        """Returns a revision number and advance self."""
+        ret = self._next_revision
+        self._next_revision += 1
+        return ret
+
+    def _reset_state(self) -> RevisionCounterManager:
+        """This function sets the revision counter back.
+
+        Notes:
+            Calling this function is almost always an error.
+            This function does not restore the state right after initialization,
+                but one call after `assign_revision()`. This is done to ensure
+                that there is one single root revision index.
+        """
+        self._next_revision = self.ROOT_REVISION
+        _ = self.assign_revision()  # Ensure that we throw away the root
+        return self
+
+    def is_root_revision(
+        self,
+        rev: int,
+    ) -> bool:
+        """This function checks if `rev` revers to the (absolute) unique revision of the root."""
+        return rev == self.ROOT_REVISION
diff --git a/src/jace/translator/util/subtranslator_helper_order.py b/src/jace/translator/util/subtranslator_helper_order.py
new file mode 100644
index 0000000..767521a
--- /dev/null
+++ b/src/jace/translator/util/subtranslator_helper_order.py
@@ -0,0 +1,80 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+
+from jace import translator
+
+
+def sort_subtranslators(
+    subtranslators: Sequence[translator.JaCeSubTranslatorInterface],
+) -> Sequence[translator.JaCeSubTranslatorInterface]:
+    """Orders the subtranslators according to their priorities.
+
+    The function ensures the following:
+    - All subtranslators that have default priority are at the end.
+    - All subtranslators whose `get_priority()` returns `NotImplemented`
+        are at the begin of the list. These subtranslators are ordered according
+        to their `__lt__()` function.
+    - All subtranslators whose `get_priority()` function returns an integer are
+        in the middle, ordered according to this value.
+    """
+    if len(subtranslators) <= 1:
+        return subtranslators
+    subtranslators = sorted(subtranslators, key=_SubtranslatorOrderingHelper)
+    assert (len(subtranslators) <= 1) or all(
+        subtranslators[i - 1].has_default_priority() <= subtranslators[i].has_default_priority()
+        for i in range(1, len(subtranslators))
+    )
+    return subtranslators
+
+
+class _SubtranslatorOrderingHelper:
+    """Helper class used by `JaxprTranslationDriver` to bring the subtranslators in the correct order.
+
+    Essentially it is a wrapper that contains the additional logic that is
+    needed for sorting. This way subclasses does not need to implement it themselves.
+
+    Notes:
+        This class does not implement the other comparison function as requested by PEP8.
+    """
+
+    def __init__(self, subtranslator: translator.JaCeSubTranslatorInterface):
+        assert isinstance(subtranslator, translator.JaCeSubTranslatorInterface)
+        self._sub = subtranslator
+
+    def get(self) -> translator.JaCeSubTranslatorInterface:
+        return self._sub
+
+    def __lt__(
+        self,
+        other: _SubtranslatorOrderingHelper,
+    ) -> bool:
+        # Default priority means that it will always go to the end.
+        if self._sub.has_default_priority():
+            return False  # `self` has default priority, so it must go to the end.
+        if other._sub.has_default_priority():
+            return True  # `self` does not have default prio, thus it _must_ go before `other`.
+        prio_self = self._sub.get_priority()  # Get the priorities of the subtranslators.
+        prio_other = other._sub.get_priority()
+        if all(prio is NotImplemented for prio in (prio_self, prio_other)):
+            # None has a prio, `self` should decide if it should go first.
+            x = self._sub.__lt__(other._sub)
+            assert isinstance(x, bool)
+            return x
+        # In case only one has a priority, we change the order such that the one that implements
+        #  a `__lt__()` goes first.
+        if prio_self is NotImplemented:
+            assert isinstance(prio_other, int)
+            return True
+        if prio_other is NotImplemented:
+            assert isinstance(prio_self, int)
+            return False
+        assert all(isinstance(prio, int) for prio in (prio_other, prio_self))
+        return prio_self < prio_other
diff --git a/src/jace/translator/util/util.py b/src/jace/translator/util/util.py
new file mode 100644
index 0000000..484b4ef
--- /dev/null
+++ b/src/jace/translator/util/util.py
@@ -0,0 +1,21 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Contains all general helper functions needed inside the translator."""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+from typing import Any
+
+
+def list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
+    """This method turns a `list` of pairs into a `dict` and applies a `None` filter.
+
+    The function will only include pairs whose key, i.e. first element is not `None`.
+    """
+    return {k: v for k, v in inp if k is not None}
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
new file mode 100644
index 0000000..80de0e3
--- /dev/null
+++ b/src/jace/util/__init__.py
@@ -0,0 +1,19 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Global utility package for the jax to dace translator."""
+
+from __future__ import annotations
+
+from .jax import get_jax_var_name
+from .util import ensure_iterability
+
+
+__all__ = [
+    "get_jax_var_name",
+    "ensure_iterability",
+]
diff --git a/src/jace/util/dace.py b/src/jace/util/dace.py
new file mode 100644
index 0000000..1c75a55
--- /dev/null
+++ b/src/jace/util/dace.py
@@ -0,0 +1,14 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements all utility functions that are related to DaCe.
+
+Most of the functions defined here allow an unified access to DaCe's internals
+in a consistent and stable way.
+"""
+
+from __future__ import annotations
diff --git a/src/jace/util/jax.py b/src/jace/util/jax.py
new file mode 100644
index 0000000..3a7ed06
--- /dev/null
+++ b/src/jace/util/jax.py
@@ -0,0 +1,44 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements all utility functions that are related to Jax.
+
+Most of the functions defined here allow an unified access to Jax' internals
+in a consistent and stable way.
+"""
+
+from __future__ import annotations
+
+import jax.core as jcore
+
+
+def get_jax_var_name(jax_var: jcore.Atom | str) -> str:
+    """Returns the name of the Jax variable as a string.
+
+    Args:
+        jax_var:     The variable to stringify.
+
+    Todos:
+        Implement a regex check for the name.
+    """
+    if isinstance(jax_var, jcore.DropVar):
+        return "_"
+    if isinstance(jax_var, jcore.Atom):
+        jax_name = str(jax_var)  # This only works up to some version
+    elif isinstance(jax_var, str):
+        jax_name = jax_var
+    else:
+        raise TypeError(
+            f"Does not know how to transform '{jax_var}' (type: '{type(jax_var).__name__}') into a string."
+        )
+    # TODO(phimuell): Add regex to ensure that the name is legit.
+    assert isinstance(jax_name, str)
+    if len(jax_name) == 0:
+        raise ValueError(
+            f"Failed to translate the Jax variable '{jax_var}' into a name, the result was empty."
+        )
+    return jax_var
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
new file mode 100644
index 0000000..d728be5
--- /dev/null
+++ b/src/jace/util/util.py
@@ -0,0 +1,30 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+from __future__ import annotations
+
+from collections.abc import Iterable
+from typing import Any
+
+
+def ensure_iterability(
+    x: Any,
+    ign_str: bool = True,
+) -> Iterable[Any]:
+    """Ensures that `x` is iterable.
+
+    By default strings are _not_ considered iterable.
+
+    Args:
+        x:          To test.
+        ign_str:    Ignore that a string is iterabile.
+    """
+    if ign_str and isinstance(x, str):
+        x = [x]
+    elif isinstance(x, Iterable):
+        pass
+    return x

From b4c313e67a5b650008a612630efc0d0dd3cd1203 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 21 Apr 2024 13:13:02 +0200
Subject: [PATCH 024/458] First reviewable commit of translator.

---
 .../translator/jaxpr_translator_driver.py     | 48 +++++++++++++++++++
 .../translator/sub_translators/__init__.py    |  3 +-
 2 files changed, 49 insertions(+), 2 deletions(-)
 create mode 100644 src/jace/translator/jaxpr_translator_driver.py

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
new file mode 100644
index 0000000..267c72b
--- /dev/null
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -0,0 +1,48 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+from __future__ import annotations
+
+
+class JaxprTranslationDriver:
+    """Internal driver class for creating an SDFG equivalent of a `Jaxpr` instance.
+
+    This class builds an SDFG of a very particular form, which for us is
+    canonical, which is not directly usable. Thus this class should not be
+    directly used, instead a user should use TBA.
+    The canonical form is characterized by the following:
+    - the SDFG is a list of states, ideally each state corresponds to single Jax primitive,
+    - all variable names are derived from Jax names,
+    - there are no global variables inside the SDFG,
+    - It lacks the special `__return` variable.
+    - The argument names are not set.
+
+    The idea of the translator is extremely simple. Since Jaxpr is a list
+    consisting of more or less simple instructions/equations, they get processed
+    one after the other. Each equation is translated into its own state that
+    is appended to the SDFG, thus the SDFG is a long list of states. In certain
+    cases it might be that an equation needs more states, but this is an exception.
+
+    The actual translation is not handled by the driver instead a so called
+    subtranslator object is used. A subtranslator is specialized to translate
+    one type of primitive. For more information on the subtranslators see the
+    documentation of `JaCeSubTranslatorInterface`.
+
+    To support nested Jaxpr expressions the driver provides the possibility to
+    clone/fork itself, see `self.fork()` for more. Every clone, i.e. return
+    value of `self.fork()`, of a driver, which is also known as child, has
+    a unique identifier. This identifier is used for example to generate
+    unique SDFG variable names during a translation process,
+    see `self.same_family() for more.
+
+    If no translation is ongoing the only function that makes sense to call
+    is `translate_jaxpr()` which starts a translation.
+
+    Todos:
+        Find a better way than to allow giving access to protected functions.
+            Probably using composition with the higher level instance.
+    """
diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
index a226de1..c9e1557 100644
--- a/src/jace/translator/sub_translators/__init__.py
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -16,8 +16,7 @@
 
 
 # List of all subtranslators that ships with JaCe.
-_BUILTIN_SUBTRANSLATORS: Final[list[type[jtrans.JaCeSubTranslatorInterface]]] = [
-]
+_BUILTIN_SUBTRANSLATORS: Final[list[type[jtrans.JaCeSubTranslatorInterface]]] = []
 
 # All externally supplied subtranslator implementation.
 #  It is a `dict` to do fast access and remember the order, value is always `None`.

From 0ffff9870eb2361166c0452959be21ff71da1302 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 22 Apr 2024 08:21:06 +0200
Subject: [PATCH 025/458] Updated the ALU translator.

However, I am still not happy with it.
---
 .../sub_translators/alu_translator.py         | 154 ++++++------------
 1 file changed, 54 insertions(+), 100 deletions(-)

diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index c8997a8..ae5829c 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -96,16 +96,30 @@ def can_translate_jaxeqn(
         """
         is_scalar: bool = len(eqn.outvars[0].aval.shape) == 0
         prim_name: str = eqn.primitive.name
-        if prim_name in self._unary_ops:
-            assert len(eqn.invars) == 1
-        elif prim_name in self._binary_ops:
-            assert len(eqn.invars) == 2
-        elif out_var_names[0] is None or (not is_scalar) and all(x is None for x in in_var_names):
+        if len(eqn.invars) == 1:
+            if prim_name not in self._unary_ops:
+                return False
+        elif len(eqn.invars) == 2:
+            if prim_name not in self._binary_ops:
+                return False
+        else:
+            return False
+        if out_var_names[0] is None:
+            raise RuntimeError(f"Encountered a litteral output '{eqn}'.")
+        if len(eqn.outvars) != 1:
             return False
-        if all(x is None for x in in_var_names):
+        if (not is_scalar) and all(x is None for x in in_var_names):
+            # Only literals as input are only allowed if we are scalar.
             return False
         if len(eqn.effects) != 0:
             return False
+        if not all(
+            invar.aval.shape == ()
+            for invar, inname in zip(eqn.invars, in_var_names)
+            if inname is None
+        ):
+            # All literals must be scalars
+            return False
         return True
 
     @override
@@ -131,30 +145,11 @@ def translate_jaxeqn(
             eqn_state:      State into which the primitive's SDFG representation is constructed.
         """
 
-        # All this checks are done to capture corner cases that Jax might do but are not implemented.
-        #  If you find out that Jax will never create something, then remove it.
-        if not all(
-            invar.aval.shape == ()
-            for invar, x in zip(eqn.invars, in_var_names, strict=False)
-            if x is None
-        ):
-            raise NotImplementedError("Can not handle Literals that are not scalars.")
-        if in_var_names[0] is None:
-            raise NotImplementedError(
-                "Literal can only not be on the right hand side of the operation."
-            )
-        if not any(invar.aval.shape == eqn.outvars[0].aval.shape for invar in eqn.invars):
-            raise NotImplementedError("At least input must have the same shape as the output.")
-        if len(eqn.outvars) != 1:
-            raise NotImplementedError(f"Can only handle one output (Eq: '{eqn}'.")
-
         # Determine what kind of input we got and how we should proceed.
         is_scalar = len(eqn.outvars[0].aval.shape) == 0
         inp_scalars = [len(Inp.aval.shape) == 0 for i, Inp in enumerate(eqn.invars)]
         has_scalars_as_inputs = any(inp_scalars)
-        only_scalars_as_inputs = all(inp_scalars)
         has_some_literals = any(x is None for x in in_var_names)
-        only_literals_as_inputs = all(x is None for x in in_var_names)
         inps_same_shape = all(
             eqn.invars[0].aval.shape == eqn.invars[i].aval.shape for i in range(1, len(eqn.invars))
         )
@@ -164,22 +159,12 @@ def translate_jaxeqn(
         dims_to_bcastl: list[int] = []
         dims_to_bcastr: list[int] = []
 
-        # Determine if and if yes how we have to broadcast.
-        if is_scalar:
-            # The output is a scalar, in which case we must have only scalar input as well.
-            #  Furthermore, we can have the situation that only Literals are the input.
-            assert (not is_scalar) or only_scalars_as_inputs
-            assert (not is_scalar) or only_literals_as_inputs
-
-        elif only_literals_as_inputs:
-            raise NotImplementedError("Only literals an input is only allowed for the scalar case.")
-
-        elif inps_same_shape:
+        # Determine if and how we have to broadcast.
+        if inps_same_shape or is_scalar:
             pass
 
         elif has_some_literals or has_scalars_as_inputs:
-            # This is essentially array plus scalar, but in two possibilities.
-            #  We either have a scalar variable or we have a scalar literal.
+            # This is essentially an array plus a scalar, that is eitehr a literal or a variable.
             assert (not has_some_literals) or all(
                 invar.aval.shape == eqn.outvars[0].aval.shape
                 for (invar, x) in zip(eqn.invars, in_var_names, strict=False)
@@ -191,92 +176,64 @@ def translate_jaxeqn(
                 if x is not None
             )
 
-        elif len(in_var_names) != 2:
-            raise ValueError("Can only do broadcasting if there are two operands.")
-
         else:
             # This is the general broadcasting case
             #  We assume that both inputs and the output have the same rank but different sizes in each dimension.
             #  It seems that Jax ensures this.
             #  We further assume that if the size in a dimension differs then one must have size 1.
             #  This is the size we broadcast over, i.e. conceptually replicated.
-            out_shp = tuple(eqn.outvars[0].aval.shape)  # Shape of the output.
+            out_shps = tuple(eqn.outvars[0].aval.shape)  # Shape of the output
             inp_shpl = tuple(eqn.invars[0].aval.shape)  # Shape of the left/first input
-            inp_shpr = tuple(
-                eqn.invars[1].aval.shape
-            )  # Shape of the right/second input; this must be "expanded"
+            inp_shpr = tuple(eqn.invars[1].aval.shape)  # Shape of the right/second input
 
-            if not ((len(inp_shpl) == len(inp_shpr)) and (len(out_shp) == len(inp_shpr))):
+            if not ((len(inp_shpl) == len(inp_shpr)) and (len(out_shps) == len(inp_shpr))):
                 raise NotImplementedError("Can not broadcast over different ranks.")
 
-            for dim in reversed(range(len(out_shp))):
-                shp_lft = inp_shpl[dim]
-                shp_rgt = inp_shpr[dim]
-
+            for dim, (shp_lft, shp_rgt, out_shp) in enumerate(zip(inp_shpl, inp_shpr, out_shps)):
                 if shp_lft == shp_rgt:
-                    assert out_shp[dim] == shp_lft
+                    assert out_shp == shp_lft
                 elif shp_lft == 1:
-                    assert shp_rgt == out_shp[dim]
+                    assert shp_rgt == out_shp
                     dims_to_bcastl.append(dim)
                 elif shp_rgt == 1:
-                    assert shp_lft == out_shp[dim]
+                    assert shp_lft == out_shp
                     dims_to_bcastr.append(dim)
                 else:
                     raise ValueError(f"Invalid shapes in dimension {dim} for broadcasting.")
 
-        # Now we create the Tasklet into which we solve the equation.
+        # Now we create the Tasklet in which the calculation is performed.
         tskl_code: str = self._writeTaskletCode(in_var_names, eqn)
         tskl_name: str = eqn.primitive.name
         tskl_map_ranges: list[tuple[str, str]] = [
             (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
         ]
-        tskl_outputs: list[tuple[str, dace.Memlet]] = []
+        tskl_outputs: tuple[str, dace.Memlet] = None
         tskl_inputs: list[tuple[str, dace.Memlet] | tuple[None, None]] = []
 
         # Generate the Memlets for the input.
-        for i, dims_to_bcast in zip(
-            range(len(eqn.invars)), [dims_to_bcastl, dims_to_bcastr], strict=False
-        ):
-            if in_var_names[i] is None:
-                # Literal: No input needed.
+        for i, dims_to_bcast in enumerate([dims_to_bcastl, dims_to_bcastr]):
+            if in_var_names[i] is None:  # Literal: No input needed.
                 tskl_inputs.append((None, None))
                 continue
-            if inp_scalars[i]:
-                # We have a scalar argument.
-                i_memlet = dace.Memlet.from_array(
-                    in_var_names[i], driver.get_sdfg().arrays[in_var_names[i]]
-                )
-            else:
-                # We have an array argument.
+            if inp_scalars[i]:  # Scalar
+                assert len(dims_to_bcast) == 0
+                i_memlet = dace.Memlet.simple(in_var_names[i], "0")
+            else:  # Array: We may have to broadcast
                 inputs_: list[str] = []
                 for dim, (map_var, _) in enumerate(tskl_map_ranges):
                     if dim in dims_to_bcast:
                         inputs_.append("0")
                     else:
-                        inputs_.append(str(map_var))
+                        inputs_.append(map_var)
                 i_memlet = dace.Memlet.simple(in_var_names[i], ", ".join(inputs_))
                 del inputs_
             tskl_inputs.append((f"__in{i}", i_memlet))
 
-        # Now generate the Memlets for the outputs
-        if is_scalar:
-            tskl_outputs.append(
-                (
-                    f"__out{i}",
-                    dace.Memlet.from_array(
-                        out_var_names[0], driver.get_sdfg().arrays[out_var_names[i]]
-                    ),
-                )
-            )
-        else:
-            tskl_outputs.append(
-                (
-                    f"__out{i}",
-                    dace.Memlet.simple(
-                        out_var_names[0], ", ".join([X[0] for X in tskl_map_ranges])
-                    ),
-                )
-            )
+        # Now generate the Memlets for the output
+        tskl_output = (
+            "__out0",
+            dace.Memlet.simple(out_var_names[0], ", ".join([X[0] for X in tskl_map_ranges])),
+        )
 
         if is_scalar:
             tskl_tasklet = eqn_state.add_tasklet(
@@ -285,9 +242,9 @@ def translate_jaxeqn(
                 jtutil.list_to_dict(tskl_outputs).keys(),
                 tskl_code,
             )
-            for in_var, (in_connector, in_memlet) in filter(
-                lambda X: X[0] is not None, zip(in_var_names, tskl_inputs, strict=False)
-            ):
+            for in_var, (in_connector, in_memlet) in zip(in_var_names, tskl_inputs, strict=False):
+                if in_var is None:  # So access node for literal
+                    continue
                 eqn_state.add_edge(
                     eqn_state.add_read(in_var),
                     None,
@@ -295,16 +252,13 @@ def translate_jaxeqn(
                     in_connector,
                     in_memlet,
                 )
-            for out_var, (out_connector, out_memlet) in zip(
-                out_var_names, tskl_outputs, strict=False
-            ):
-                eqn_state.add_edge(
-                    tskl_tasklet,
-                    out_connector,
-                    eqn_state.add_write(out_var),
-                    None,
-                    out_memlet,
-                )
+            eqn_state.add_edge(
+                tskl_tasklet,
+                tskl_output[0],
+                eqn_state.add_write(out_var_names[0]),
+                None,
+                tskl_output[1],
+            )
         else:
             eqn_state.add_mapped_tasklet(
                 name=tskl_name,

From 4e97c6d7a202475285e086e580d67b5b9c531565 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 22 Apr 2024 09:43:39 +0200
Subject: [PATCH 026/458] Fixed a bad merge.

---
 CODING_GUIDELINES.md | 18 ++++++++++++++++--
 CONTRIBUTING.md      |  3 ++-
 pyproject.toml       | 17 ++++++++++-------
 3 files changed, 28 insertions(+), 10 deletions(-)

diff --git a/CODING_GUIDELINES.md b/CODING_GUIDELINES.md
index fafa314..c7c5d3c 100644
--- a/CODING_GUIDELINES.md
+++ b/CODING_GUIDELINES.md
@@ -9,6 +9,21 @@ We deviate from the [Google Python Style Guide][google-style-guide] only in the
 - We use [`ruff-linter`][ruff-linter] instead of [`pylint`][pylint].
 - We use [`ruff-formatter`][ruff-formatter] for source code and imports formatting, which may work differently than indicated by the guidelines in section [_3. Python Style Rules_](https://google.github.io/styleguide/pyguide.html#3-python-style-rules). For example, maximum line length is set to 100 instead of 79 (although docstring lines should still be limited to 79).
 - According to subsection [_2.19 Power Features_](https://google.github.io/styleguide/pyguide.html#219-power-features), direct use of _power features_ (e.g. custom metaclasses, import hacks, reflection) should be avoided, but standard library classes that internally use these power features are accepted. Following the same spirit, we allow the use of power features in infrastructure code with similar functionality and scope as the Python standard library.
+- For readability purposes, when a docstring contains more than the required summary line, we prefer indenting the first line at the same cursor position as the first opening quote, although this is not explicitly considered in the doctring conventions described in subsection [_3.8.1 Docstrings_](https://google.github.io/styleguide/pyguide.html#381-docstrings). Example:
+
+  ```python
+  # single line docstring
+  """A one-line summary of the module or program, terminated by a period."""
+
+  # multi-line docstring
+  """
+  A one-line summary of the module or program, terminated by a period.
+
+  Leave one blank line. The rest of this docstring should contain an
+  overall description of the module or program.
+  """
+  ```
+
 - According to subsection [_3.19.12 Imports For Typing_](https://google.github.io/styleguide/pyguide.html#31912-imports-for-typing), symbols from `typing` and `collections.abc` modules used in type annotations _"can be imported directly to keep common annotations concise and match standard typing practices"_. Following the same spirit, we allow symbols to be imported directly from third-party or internal modules when they only contain a collection of frequently used typying definitions.
 
 ### Common questions
@@ -71,7 +86,7 @@ The terseness vs. helpfulness tradeoff should be more in favor of terseness for
 
 ### Docstrings
 
-TODO: update to autodoc2
+TODO: update to `autodoc2`
 
 We generate the API documentation automatically from the docstrings using [Sphinx][sphinx] and some extensions such as [Sphinx-autodoc][sphinx-autodoc] and [Sphinx-napoleon][sphinx-napoleon]. These follow the Google Python Style Guide docstring conventions to automatically format the generated documentation. A complete overview can be found here: [Example Google Style Python Docstrings](https://sphinxcontrib-napoleon.readthedocs.io/en/latest/example_google.html#example-google).
 
@@ -140,4 +155,3 @@ Testing components is a critical part of a software development project. We foll
 [sphinx-autodoc]: https://www.sphinx-doc.org/en/master/usage/extensions/autodoc.html
 [sphinx-napoleon]: https://sphinxcontrib-napoleon.readthedocs.io/en/latest/index.html#
 [sphinx-rest]: https://www.sphinx-doc.org/en/master/usage/restructuredtext/basics.html
-[ci-docs]: docs/development/CI/infrastructure.md
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index 8c6b57a..e3dc26e 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -99,7 +99,8 @@ Before submitting a pull request, check that it meets the following criteria:
 4. If the pull request contains code authored by first-time contributors, they should add their names to the [AUTHORS.md](AUTHORS.md) file.
 5. Pick one reviewer and try to contact them directly to let them know about the pull request. If there is no feedback in 24h/48h try to contact them again or pick another reviewer.
 6. Once the pull request has been approved, it should be squash-merged as soon as possible with a meaningful description of the changes. We use the [Conventional Commits][https://www.conventionalcommits.org/en/v1.0.0/#summary] specification for writing informative and automation-friendly commit messages. The following _commit types_ are accepted:
-   - `chore`: changes that only modify development-related tools, the build system configuration or external dependencies
+   - `build`: changes that affect the build system or external dependencies
+   - `chore`: changes related to the development tools or process
    - `ci`: changes to our CI configuration files and scripts
    - `docs`: documentation only changes
    - `feat`: a new feature
diff --git a/pyproject.toml b/pyproject.toml
index 7e1025c..4d551f1 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -100,22 +100,24 @@ extend-select = [
   "G",  # flake8-logging-format
   "C4",  # flake8-comprehensions
   "PT",  # flake8-pytest-style
-  "UP",  # pyupgrade  # TODO: evaluate and remove if needed
+  "UP",  # pyupgrade       # TODO: in evaluation
   "ARG",  # flake8-unused-arguments
   "ERA",  # eradicate
   "ICN",  # flake8-import-conventions
   "PGH",  # pygrep-hooks
   "PIE",  # flake8-pie
   "PTH",  # flake8-use-pathlib
-  "RET",  # flake8-return  # TODO: evaluate and remove if needed
+  "RET",  # flake8-return   # TODO: in evaluation
   "RUF",  # Ruff-specific
-  "SIM",  # flake8-simplify  # TODO: evaluate and remove if needed
+  "SIM",  # flake8-simplify # TODO: in evaluation
   "T10",  # flake8-debugger
-  "T20",  # flake8-print  # TODO: evaluate and remove if needed
+  "T20",  # flake8-print    # TODO: in evaluation
   "NPY"  # NumPy specific rules
 ]
 ignore = [
-  'E501'  # [line-too-long]
+  'B905',  # [zip-without-explicit-strict]
+  'E501',  # [line-too-long]
+  'UP038'  # [non-pep604-isinstance]
 ]
 ignore-init-module-imports = true
 unfixable = []
@@ -144,5 +146,6 @@ section-order = [
 ]
 
 [tool.ruff.lint.per-file-ignores]
-"noxfile.py" = ["T20"]
-"tests/**" = ["T10", "T20"]
+"!tests/**.py" = ["PT"]  # Ignore `flake8-pytest-style` everywhere except in `tests/`
+"noxfile.py" = ["T20"]  # Ignore `flake8-print`
+"tests/**" = ["T10", "T20"]  # Ignore `flake8-debugger` and `flake8-print`

From 24726c7e90ce3d0acb45c711a70f515737d2f4a8 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 22 Apr 2024 13:04:37 +0200
Subject: [PATCH 027/458] Made some small modifications.

---
 .../translator/jaxpr_translator_driver.py     | 25 ++++++++++++++-----
 .../sub_translators/alu_translator.py         |  6 ++---
 src/jace/translator/util/__init__.py          |  2 ++
 3 files changed, 24 insertions(+), 9 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 4aec98b..09e61db 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -16,9 +16,9 @@
 from dace import data as ddata, properties as dprop
 from jax import core as jcore
 
-from jace import translator as jtrans
+from jace import translator as jtrans, util as jutil
 from jace.translator import sub_translators as jtsubt, util as jtrutil
-from jace.util import jax as jutil
+
 
 class JaxprTranslationDriver:
     """Internal driver class for creating an SDFG equivalent of a `Jaxpr` instance.
@@ -73,7 +73,7 @@ class JaxprTranslationDriver:
     )
     # Variables that are shared among the instances of a family.
     __shared_slots__ = (
-        "_reserved_names",  # Part of the context.
+        "_reserved_names",  # Part of the context, but is copied.
         "_sub_translators",
         "_rev_manager",  # This is the revision counter manager
     )
@@ -237,6 +237,11 @@ def fork(self) -> JaxprTranslationDriver:
             It is important that a clone instance should not be reused,
                 instead you should fork it again.
         """
+        from copy import copy as scpy
+
+        if not self.is_allocated():
+            raise RuntimeError("Only allocated driver can fork.")
+
         # Create a new (empty) driver instance; prevent allocation to make it cheep
         dolly: JaxprTranslationDriver = JaxprTranslationDriver(_no_shared_alloc=True)
 
@@ -248,6 +253,11 @@ def fork(self) -> JaxprTranslationDriver:
         dolly._rev_idx = dolly._rev_manager.assign_revision()
         assert not dolly.is_head_translator()
 
+        # We will now copy the reserved name list
+        #  Although they are shared, only their content is shared.
+        #  This prevents a feedback from the child to the parent.
+        dolly._reserved_names = scpy(self._reserved_names)
+
         return dolly
 
     def append_new_state(
@@ -290,6 +300,8 @@ def append_new_state(
         modify_term_state: bool = False
         if (prev_state is self._term_sdfg_state) or (prev_state is None):
             modify_term_state = True
+            app_state = self._term_sdfg_state
+        else:
             app_state = prev_state
 
         new_state = self._sdfg.add_state(label, is_start_block=False)
@@ -399,9 +411,11 @@ def is_allocated(self) -> bool:
         small_ctx: Sequence[Any] = [
             # for the proper implementation of forking the reserved names are handled special.
             getattr(self, x)
-            for x in self.__shared_slots__
-            if x != "_reserved_names"
+            for x in self.__private_slots__
+            if x != "_rev_idx"
         ]
+        assert isinstance(self._rev_idx, int)
+        assert isinstance(self._sub_translators, dict)
         if all((x is not None) for x in small_ctx):
             if self._reserved_names is None:
                 raise RuntimeError("Invalid allocation state: Reserved names not allocated.")
@@ -432,7 +446,6 @@ def same_family(
         if not isinstance(other, JaxprTranslationDriver):
             return NotImplemented  # type: ignore[unreachable]
         if all(getattr(self, x) is getattr(self, x) for x in self.__shared_slots__):
-            assert (self if (self._rev_idx < other._rev_idx) else other).is_allocated()
             return True
         assert not any(getattr(self, x) is getattr(self, x) for x in self.__shared_slots__)
 
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index ae5829c..b90bf79 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -24,7 +24,7 @@
 class ALUTranslator(jtranslator.JaCeSubTranslatorInterface):
     """This translator handles all arithmetic and logical operations."""
 
-    __slots__ = ("_unary_ops", "_binary_ops")
+    __slots__ = ()
 
     # Contains all translation templates for unarry operations.
     _unary_ops: Final[dict[str, str]] = {
@@ -239,7 +239,7 @@ def translate_jaxeqn(
             tskl_tasklet = eqn_state.add_tasklet(
                 tskl_name,
                 jtutil.list_to_dict(tskl_inputs).keys(),
-                jtutil.list_to_dict(tskl_outputs).keys(),
+                jtutil.list_to_dict([tskl_outputs]).keys(),
                 tskl_code,
             )
             for in_var, (in_connector, in_memlet) in zip(in_var_names, tskl_inputs, strict=False):
@@ -265,7 +265,7 @@ def translate_jaxeqn(
                 map_ranges=jtutil.list_to_dict(tskl_map_ranges),
                 inputs=jtutil.list_to_dict(tskl_inputs),
                 code=tskl_code,
-                outputs=jtutil.list_to_dict(tskl_outputs),
+                outputs=jtutil.list_to_dict([tskl_outputs]),
                 external_edges=True,
             )
 
diff --git a/src/jace/translator/util/__init__.py b/src/jace/translator/util/__init__.py
index 910589e..38ce344 100644
--- a/src/jace/translator/util/__init__.py
+++ b/src/jace/translator/util/__init__.py
@@ -11,6 +11,7 @@
 
 from .jace_translation_memento import JaCeTranslationMemento
 from .revision_counter import RevisionCounterManager
+from .subtranslator_helper_order import sort_subtranslators
 from .util import list_to_dict
 
 
@@ -19,4 +20,5 @@
     "JaCeTranslationMemento",
     "RevisionCounterManager",
     "list_to_dict",
+    "sort_subtranslators",
 ]

From 3ebbc3639ce80e97c02a61ceb5faad3aa6b923c6 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 22 Apr 2024 13:37:31 +0200
Subject: [PATCH 028/458] Updated the tests for the subtranslator helper.

---
 tests/test_subtranslator_helper.py | 77 +++++++++++++++++++++++-------
 1 file changed, 61 insertions(+), 16 deletions(-)

diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index a7fa78e..386786a 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -12,6 +12,8 @@
 from collections.abc import Collection
 from typing import Any
 
+import pytest
+
 from jace import translator as jtrans
 
 
@@ -147,17 +149,20 @@ def __init__(self, *args, **kwargs):
 
 
 def test_subtranslatior_managing():
-    """Esnsures the functionality of the subtranslator managing."""
+    """Ensures the functionality of the subtranslator managing."""
     from jace.translator.sub_translators import (
         _get_subtranslators_cls,
         add_subtranslator,
+        rm_subtranslator,
     )
 
     class ValidSubTrans(jtrans.JaCeSubTranslatorInterface):
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
 
-    #
+    class ValidSubTrans2(jtrans.JaCeSubTranslatorInterface):
+        def __init__(self, *args, **kwargs):
+            super().__init__(*args, **kwargs)
 
     class InvalidSubTrans:
         def __init__(self): ...
@@ -200,23 +205,63 @@ def __gt__(self, other: Any) -> bool:
     #
 
     # Test the initial conditions
-    init_sub_trans_list = _get_subtranslators_cls(builtins=False)
-    init_built_in = _get_subtranslators_cls(with_external=False)  # noqa: F841  # Not finished
+    builtin_subtrans = _get_subtranslators_cls(with_external=False)
+    curr_external_subtrans = _get_subtranslators_cls(builtins=False)
+    exp_curr_external_subtrans = []
     assert (
-        len(init_sub_trans_list) == 0
-    ), f"Expected no external subtranslators but found: {init_sub_trans_list}"
-
-    # Now we add the valid subtranslator interface
-    assert add_subtranslator(ValidSubTrans), "Failed to add the `ValidSubTrans`"
-    first_sub_trans = _get_subtranslators_cls(builtins=False)  # noqa: F841  # Not finished
-
-    # Should not include the
-    subTrans = _get_subtranslators_cls(with_external=False)  # noqa: F841  # Not finished
-
-    assert not add_subtranslator(ValidSubTrans), "Could add `ValidSubTrans` twice"
-    raise AssertionError("NOT FINISHED YET")
+        curr_external_subtrans == exp_curr_external_subtrans
+    ), f"Expected no external subtranslators but found: {builtin_subtrans}"
+    assert (
+        len(builtin_subtrans) != 0
+    ), "Expected to have some builtin subtranslator, but there were none."
+    assert builtin_subtrans is not _get_subtranslators_cls()  # Ensures no sharing
+
+    # Add a subtranslator to the internal list
+    assert add_subtranslator(ValidSubTrans), "Failed to add 'ValidSubTrans'"
+    exp_curr_external_subtrans = [ValidSubTrans]
+    curr_external_subtrans = _get_subtranslators_cls(builtins=False)
+    assert (
+        curr_external_subtrans == exp_curr_external_subtrans
+    ), f"Wrong subtranslator order, expected '{exp_curr_external_subtrans}' got '{curr_external_subtrans}'."
+    assert builtin_subtrans == _get_subtranslators_cls(with_external=False)
+    assert _get_subtranslators_cls() == exp_curr_external_subtrans + builtin_subtrans
+
+    # Add a second translator
+    assert add_subtranslator(ValidSubTrans2), "Failed to add 'ValidSubTrans2'"
+    exp_curr_external_subtrans = [ValidSubTrans2, ValidSubTrans]  # FILO order
+    curr_external_subtrans = _get_subtranslators_cls(builtins=False)
+    assert (
+        exp_curr_external_subtrans == curr_external_subtrans
+    ), f"Wrong subtranslator order, expected '{exp_curr_external_subtrans}' got '{curr_external_subtrans}'."
+    assert exp_curr_external_subtrans + builtin_subtrans == _get_subtranslators_cls()
+
+    # Now we try to add some translators that will be rejected.
+    assert not add_subtranslator(ValidSubTrans)  # Already known
+    assert not add_subtranslator(ValidSubTrans2)  # Already known
+    assert not add_subtranslator(ValidSubTrans())  # Is an instance
+    assert not add_subtranslator(InvalidSubTrans)  # Not implementing interface
+    assert exp_curr_external_subtrans + builtin_subtrans == _get_subtranslators_cls()
+
+    # Now we remove a translator from the list.
+    assert rm_subtranslator(ValidSubTrans), "Failed to remove 'ValidSubTrans'"
+    exp_curr_external_subtrans = [ValidSubTrans2]
+    curr_external_subtrans = _get_subtranslators_cls(builtins=False)
+    assert (
+        curr_external_subtrans == exp_curr_external_subtrans
+    ), f"Wrong subtranslator order, expected '{exp_curr_external_subtrans}' got '{curr_external_subtrans}'."
+    assert builtin_subtrans == _get_subtranslators_cls(with_external=False)
+    assert _get_subtranslators_cls() == exp_curr_external_subtrans + builtin_subtrans
+
+    # Now try to remove it again.
+    assert not rm_subtranslator(ValidSubTrans), "Was allowed to remove 'ValidSubTrans' again!"
+    with pytest.raises(
+        expected_exception=KeyError, match=f"Subtranslator '{type(ValidSubTrans)}' is not known."
+    ):
+        rm_subtranslator(ValidSubTrans, strict=True)
+    #
 
 
 if __name__ == "__main__":
     test_subtranslatior_order_simple()
     test_subtranslatior_order_custom1()
+    test_subtranslatior_managing()

From a19d825abeaa306e3382d9335ee66fa2f7bd9c81 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 22 Apr 2024 13:39:52 +0200
Subject: [PATCH 029/458] Updated tests for the driver.

---
 tests/test_jaxpr_translator_driver.py | 144 ++++++++++++++++++++++++++
 1 file changed, 144 insertions(+)
 create mode 100644 tests/test_jaxpr_translator_driver.py

diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
new file mode 100644
index 0000000..2becc04
--- /dev/null
+++ b/tests/test_jaxpr_translator_driver.py
@@ -0,0 +1,144 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements some tests of the subtranslator driver."""
+
+from __future__ import annotations
+
+import dace
+import pytest
+
+from jace import translator as jtrans
+
+
+@pytest.fixture(scope="module")
+def alloc_driver():
+    """Returns an allocated driver instance."""
+    name = "fixture_driver"
+    driver = jtrans.JaxprTranslationDriver()
+    driver._allocate_translation_ctx(name=name)
+    return driver
+
+
+def test_driver_alloc():
+    """Tests the state right after allocation."""
+    driver = jtrans.JaxprTranslationDriver()
+    assert not driver.is_allocated(), "Driver was created allocated."
+
+    # The reserved names will be tested in `test_driver_fork()`.
+    sdfg_name = "qwertzuiopasdfghjkl"
+    driver._allocate_translation_ctx(name=sdfg_name)
+
+    sdfg: dace.SDFG = driver.get_sdfg()
+
+    assert driver.get_sdfg().name == sdfg_name
+    assert sdfg.number_of_nodes() == 1
+    assert sdfg.number_of_edges() == 0
+    assert sdfg.start_block is driver._init_sdfg_state
+    assert driver.get_terminal_sdfg_state() is driver._init_sdfg_state
+
+
+def test_driver_fork():
+    """Tests the fork ability of the driver."""
+
+    # This is the parent driver.
+    driver = jtrans.JaxprTranslationDriver()
+    assert not driver.is_allocated(), "Driver should not be allocated."
+
+    with pytest.raises(expected_exception=RuntimeError, match="Only allocated driver can fork."):
+        _ = driver.fork()
+    #
+
+    # We allocate the driver directly, because we need to set some internals.
+    #  This is also the reason why we do not use the fixture.
+    org_res_names = {"a", "b"}
+    driver._allocate_translation_ctx("driver", reserved_names=org_res_names)
+    assert driver.is_allocated()
+    assert driver._reserved_names == org_res_names
+
+    # Now we allocate a child
+    dolly = driver.fork()
+    dolly_rev = dolly.get_rev_idx()
+    assert not dolly.is_allocated()
+    assert not dolly.is_head_translator()
+    assert driver.is_head_translator()
+    assert dolly.same_family(driver)
+    assert driver.same_family(dolly)
+    assert driver._sub_translators is dolly._sub_translators
+    assert driver._rev_manager is dolly._rev_manager
+    assert dolly._reserved_names == driver._reserved_names
+    assert dolly._reserved_names is not driver._reserved_names
+
+    # Test if allocation of fork works properly
+    dolly_only_res_names = ["c"]  # reserved names that are only known to dolly
+    dolly_full_res_names = org_res_names.union(dolly_only_res_names)
+    dolly._allocate_translation_ctx("dolly", reserved_names=dolly_only_res_names)
+
+    assert dolly.is_allocated()
+    assert dolly._reserved_names == dolly_full_res_names
+    assert driver._reserved_names == org_res_names
+
+    # Now we deallocate dolly
+    dolly._clear_translation_ctx()
+    assert not dolly.is_allocated()
+    assert dolly._reserved_names is not None
+    assert dolly._reserved_names == dolly_full_res_names
+
+    # Now we test if the revision index is again increased properly.
+    dolly2 = driver.fork()
+    assert dolly_rev < dolly2.get_rev_idx()
+    assert dolly2.same_family(dolly)
+    assert dolly2.same_family(driver)
+
+    # Deallocate the driver
+    driver._clear_translation_ctx()
+    assert not driver.is_allocated()
+    assert driver.is_head_translator()
+    assert driver._reserved_names is None
+    assert driver._rev_manager._next_revision == dolly_rev
+
+
+def test_driver_append_state(alloc_driver):
+    """Tests the functionality of appending states."""
+    sdfg: dace.SDFG = alloc_driver.get_sdfg()
+
+    terminal_state_1: dace.SDFGState = alloc_driver.append_new_state("terminal_state_1")
+    assert sdfg.number_of_nodes() == 2
+    assert sdfg.number_of_edges() == 1
+    assert terminal_state_1 is alloc_driver.get_terminal_sdfg_state()
+    assert alloc_driver.get_terminal_sdfg_state() is alloc_driver._term_sdfg_state
+    assert alloc_driver._init_sdfg_state is sdfg.start_block
+    assert alloc_driver._init_sdfg_state is not terminal_state_1
+    assert next(iter(sdfg.edges())).src is sdfg.start_block
+    assert next(iter(sdfg.edges())).dst is terminal_state_1
+
+    # Specifying an explicit append state that is the terminal should also update the terminal state of the driver.
+    terminal_state_2: dace.SDFGState = alloc_driver.append_new_state(
+        "terminal_state_2", prev_state=terminal_state_1
+    )
+    assert sdfg.number_of_nodes() == 3
+    assert sdfg.number_of_edges() == 2
+    assert terminal_state_2 is alloc_driver.get_terminal_sdfg_state()
+    assert sdfg.out_degree(terminal_state_1) == 1
+    assert sdfg.out_degree(terminal_state_2) == 0
+    assert sdfg.in_degree(terminal_state_2) == 1
+    assert next(iter(sdfg.in_edges(terminal_state_2))).src is terminal_state_1
+
+    # Specifying a previous node that is not the terminal state should not do anything.
+    non_terminal_state: dace.SDFGState = alloc_driver.append_new_state(
+        "non_terminal_state", prev_state=terminal_state_1
+    )
+    assert alloc_driver.get_terminal_sdfg_state() is not non_terminal_state
+    assert sdfg.in_degree(non_terminal_state) == 1
+    assert sdfg.out_degree(non_terminal_state) == 0
+    assert next(iter(sdfg.in_edges(non_terminal_state))).src is terminal_state_1
+
+
+if __name__ == "__main__":
+    test_driver_alloc()
+    test_driver_fork()
+    test_driver_append_state(alloc_driver())

From 38eb33cb16ec8a82b8f75bc4a0995d31fff44cbf Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 22 Apr 2024 14:16:10 +0200
Subject: [PATCH 030/458] refactored the `add_array()` function.

---
 .../translator/jaxpr_translator_driver.py     | 92 +++++++++++--------
 1 file changed, 55 insertions(+), 37 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 09e61db..9de0229 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -630,60 +630,83 @@ def add_array(
         is_scalar: bool = shape == ()
         dtype = self.translate_dtype(arg.aval.dtype)
 
-        if (alt_name is not None) and (not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", alt_name)):
-            raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
-        if force_jax_name:
-            if alt_name is not None:
-                raise ValueError("Specified 'force_jax_name' but passed  'alt_name'.")
-            alt_name = jutil.get_jax_var_name(arg)
+        if alt_name is not None:
+            assert isinstance(alt_name, str)
+            find_new_name = False  # If a name was given, then use it no matter what.
+            if len(alt_name) == 0:
+                raise ValueError("Passed an empty 'alt_name'.")
+            if alt_name in self._forbidden_names:
+                raise ValueError("'alt_name' is a forbidden name.")
+            if not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", alt_name):
+                raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
+            if force_jax_name:
+                raise ValueError("Specified 'force_jax_name' but passed 'alt_name'.")
             if name_prefix is not None:
-                assert isinstance(name_prefix, str)
-                alt_name = name_prefix + alt_name
+                raise ValueError(
+                    f"Specified 'name_prefix' ('{name_prefix}') but passed '{alt_name}' as 'alt_name'."
+                )
+            if alt_name in self._sdfg.arrays:
+                raise ValueError(f"Variable '{alt_name}' already exists.")
         if name_prefix is not None:
             assert isinstance(name_prefix, str)
-            if alt_name is not None:
-                raise ValueError("Specified 'name_prefix' and 'alt_name' which is not possible.")
-        if (symb_strides is None) and (strides is None):
-            symb_strides = False if (len(shape) <= 1) else False
+            if len(name_prefix) == 0:
+                raise ValueError("Specified an empty 'name_prefix'.")
         if as_view and (not as_transient):
             raise ValueError("You tried to create a global view, which is not allowed.")
 
-        if isinstance(arg, jcore.Var):
+        if (symb_strides is None) and (strides is None):
+            def_symb_stride = False  # default value for symbolic strides
+            symb_strides = False if (len(shape) <= 1) else def_symb_stride  # Keep for the future
+        elif (symb_strides is not None) and (strides is not None):
+            raise ValueError("Specified 'symb_strides' and 'stride at the same time.")
+        elif strides is not None:
+            if len(strides) != len(shape):
+                raise ValueError(
+                    f"'strides' has length {len(strides)}, but array rank is {len(shape)}."
+                )
+        else:
+            assert isinstance(symb_strides, bool)
+
+        # SDFG variable name
+        if force_jax_name:
+            alt_name = jutil.get_jax_var_name(arg)
+            if name_prefix is not None:
+                alt_name = name_prefix + alt_name
+
+        elif alt_name is not None:
+            prop_name = alt_name  # Just for completion: will be ignored later
+
+        elif isinstance(arg, jcore.Var):
             prop_name = jutil.get_jax_var_name(arg)
-            if (alt_name is None) and prop_name.startswith("__"):
+            if prop_name.startswith("__"):
                 raise ValueError(
                     f"You tried to create the variable '{prop_name}' which"
                     "starts with two underscores, use 'alt_name' for that."
                 )
-            if isinstance(name_prefix, str):
+            if name_prefix is not None:
                 prop_name = name_prefix + prop_name
+
         elif isinstance(arg, jcore.Literal):
             if not allow_literals:
                 raise NotImplementedError("Jax Literals are not supported.")
             if alt_name is None:
                 raise ValueError(f"Passed literal '{arg}', but not specified a name to use.")
+
         else:
             raise TypeError(f"Does not know how to handle '{type(arg).__name__}'.")
 
         if alt_name is None:
             # If we are the root translator, then we will use `prop_name` directly;
-            #  if not we will append the revision of `self` to the name.
+            #  otherwise we will append the revision of `self` to the name.
             arg_name = prop_name + ("" if self.is_head_translator() else f"_rev_idx{self._rev_idx}")
         else:
             arg_name = str(alt_name)
-            find_new_name = False  # If a name was given, then use it no matter what.
-            if arg_name in self._forbidden_names:
-                raise ValueError(f"You used 'alt_name' to create the forbidden name '{alt_name}'.")
-            if arg_name in self._sdfg.arrays:
-                raise ValueError(
-                    f"Tried to create a variable with name '{arg_name}'"
-                    " explicitly, but it is already known."
-                )
+
         if find_new_name is None:
+            # Determine if we should look for a new name or not, if nothing was specified
             find_new_name = (arg_name in self._forbidden_names) or (
                 arg_name in self._reserved_names
             )
-
         if find_new_name:
             # We have to find a new name.
             name_tmpl = "_jax_variable__" + arg_name + "__{}"
@@ -700,11 +723,11 @@ def add_array(
             else:
                 raise ValueError(f"Failed to find a replacement name for '{arg_name}'")
             del iCounter, _arg_name
-        if arg_name in self._forbidden_names:
-            raise ValueError(f"Can not create variable '{arg_name}', name is forbidden.")
-        if arg_name in self._sdfg.arrays:
-            raise ValueError(f"Can not create variable '{arg_name}', variable is already created.")
-        if not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", arg_name):
+        elif arg_name in self._forbidden_names:
+            raise ValueError(f"Can't create variable '{arg_name}', name is forbidden.")
+        elif arg_name in self._sdfg.arrays:
+            raise ValueError(f"Can't create variable '{arg_name}', variable is already created.")
+        elif not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", arg_name):
             raise ValueError(f"The requested variable name '{arg_name}' is invalid.")
 
         # Promotion of scalar to array.
@@ -714,15 +737,10 @@ def add_array(
             strides = None
             is_scalar = False
 
+        # Set the stride if we have to change.
         if strides is not None:
-            if symb_strides:
-                raise ValueError("Specified 'symb_strides' and 'stride at the same time.")
-            if len(strides) != len(shape):
-                raise ValueError(
-                    f"'strides' was '{strides}' it had length {len(strides)},"
-                    f" but the array has rank {len(shape)}."
-                )
             strides = tuple(strides)
+            assert len(strides) == len(shape)
 
         elif (symb_strides is True) and (not is_scalar):
             strides = [

From cd026f067c167002c1bca4082ef38b376ead1e64 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 22 Apr 2024 14:17:13 +0200
Subject: [PATCH 031/458] Fixed a typo.

---
 src/jace/translator/sub_translators/alu_translator.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index b90bf79..78ef172 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -105,7 +105,7 @@ def can_translate_jaxeqn(
         else:
             return False
         if out_var_names[0] is None:
-            raise RuntimeError(f"Encountered a litteral output '{eqn}'.")
+            raise RuntimeError(f"Encountered a literal output '{eqn}'.")
         if len(eqn.outvars) != 1:
             return False
         if (not is_scalar) and all(x is None for x in in_var_names):

From 6738941c0687b9924b198fced833688a0dd2e56e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 22 Apr 2024 14:52:39 +0200
Subject: [PATCH 032/458] It is now also possible to specify the variable shape
 and data type from extern, without the need of having a Jax variable.

---
 .../translator/jaxpr_translator_driver.py     | 25 +++++++++++++++++--
 1 file changed, 23 insertions(+), 2 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 9de0229..a1afc7a 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -556,6 +556,8 @@ def add_array(
         force_array: bool = False,
         as_view: bool = False,
         strides: Sequence[int | dace.symbol | str] | None = None,
+        shape: Sequence[int | dace.symbol | str] | None = None,
+        dtype: dace.typeclass | None = None,
         symb_strides: bool | None = None,
         find_new_name: bool | None = None,
         allow_literals: bool = False,
@@ -603,6 +605,8 @@ def add_array(
             as_view:            Creates a view instead of an array, if it is a scalar
                                     it is silently ignored.
             strides:            Instead of the default strides use these values.
+            shape:              Use this shape; only in conjunction with `dtype`, `alt_name` and `arg is None`.
+            dtype:              Use this dtype; only in conjunction with `shape`, `alt_name` and `arg is None`.
             symb_strides:       Create symbols and use them for fully symbolic strides.
             find_new_name:      The translator will try to find a new name if the designated
                                     is already occupied. This does not work if the name
@@ -624,11 +628,28 @@ def add_array(
                 `jutil.get_jax_var_name(arg)` as `alt_name`.
         """
         assert all(x is not None for x in (self._sdfg, self._jax_name_map))
-        shape: Sequence[int] = arg.aval.shape  # Shape of the array
+
+        if arg is None:
+            if not isinstance(dtype, dace.typeclass):
+                raise ValueError(
+                    f"'arg' was 'None' but 'dtype' was not a type, instead '{type(dtype).__name__}'."
+                )
+            if not isinstance(shape, Sequence):
+                raise ValueError(f"'arg' was 'None' but 'shape' was invalid, got '{shape}'.")
+            if not all(isinstance(x, (int | dace.symbol | str)) for x in shape):
+                raise ValueError(f"'arg' was 'None' but 'shape' was invalid, got '{shape}'.")
+            if alt_name is None:
+                raise ValueError("'arg' was 'None' but 'alt_name' was not specified.")
+        else:
+            if shape is not None:
+                raise ValueError(f"Specified 'arg', but also passed a shape: '{shape}'")
+            if dtype is not None:
+                raise ValueError(f"Specified 'arg', but also passed a dtype: '{dtype}'")
+            shape: Sequence[int] = arg.aval.shape  # Shape of the array
+            dtype = self.translate_dtype(arg.aval.dtype)
         offset = None  # i.e. no offset
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
         is_scalar: bool = shape == ()
-        dtype = self.translate_dtype(arg.aval.dtype)
 
         if alt_name is not None:
             assert isinstance(alt_name, str)

From 9d9678a86805cbf160ae8b0add658f08a4fea857 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 22 Apr 2024 15:00:33 +0200
Subject: [PATCH 033/458] Refactored a bit more.

---
 .../translator/jaxpr_translator_driver.py     | 32 +------------------
 src/jace/util/__init__.py                     |  3 +-
 src/jace/util/jax.py                          | 32 +++++++++++++++++++
 3 files changed, 35 insertions(+), 32 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index a1afc7a..25e8cec 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -460,36 +460,6 @@ def get_rev_idx(self) -> int:
         """
         return self._rev_idx
 
-    @staticmethod
-    def translate_dtype(dtype: Any) -> dace.typeclass:
-        """Turns a Jax datatype into a DaCe datatype.
-
-        Todo:
-            Improve.
-        """
-        nameof_dtype = str(dtype)
-
-        # Make some basic checks if the datatype is okay
-        if (not jax.config.read("jax_enable_x64")) and (nameof_dtype == "float64"):
-            raise ValueError("Found a 'float64' type but 'x64' support is disabled.")
-        if nameof_dtype.startswith("complex"):
-            raise NotImplementedError("Support for complecx computation is not implemented.")
-
-        # Now extract the datatype from dace, this is extremely ugly.
-        if not hasattr(dace.dtypes, nameof_dtype):
-            raise TypeError(
-                f"Could not find the type '{nameof_dtype}' ({type(dtype).__name__}) in 'dace'."
-            )
-        dcd_type = getattr(dace.dtypes, nameof_dtype)
-
-        if not isinstance(dcd_type, dace.dtypes.typeclass):
-            raise TypeError(
-                f"Expected that '{nameof_dtype}' would map to a 'dace.typeclass'"
-                f"but it mapped to a '{type(dcd_type).__name__}'."
-            )
-
-        return dcd_type
-
     def add_jax_name_mapping(
         self,
         jax_var: str | jcore.Atom,
@@ -646,7 +616,7 @@ def add_array(
             if dtype is not None:
                 raise ValueError(f"Specified 'arg', but also passed a dtype: '{dtype}'")
             shape: Sequence[int] = arg.aval.shape  # Shape of the array
-            dtype = self.translate_dtype(arg.aval.dtype)
+            dtype = jutil.translate_dtype(arg.aval.dtype)
         offset = None  # i.e. no offset
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
         is_scalar: bool = shape == ()
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 80de0e3..8831446 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -9,11 +9,12 @@
 
 from __future__ import annotations
 
-from .jax import get_jax_var_name
+from .jax import get_jax_var_name, translate_dtype
 from .util import ensure_iterability
 
 
 __all__ = [
     "get_jax_var_name",
     "ensure_iterability",
+    "translate_dtype",
 ]
diff --git a/src/jace/util/jax.py b/src/jace/util/jax.py
index 3a7ed06..22f49f4 100644
--- a/src/jace/util/jax.py
+++ b/src/jace/util/jax.py
@@ -13,8 +13,12 @@
 
 from __future__ import annotations
 
+import jax
 import jax.core as jcore
 
+import dace
+
+
 
 def get_jax_var_name(jax_var: jcore.Atom | str) -> str:
     """Returns the name of the Jax variable as a string.
@@ -42,3 +46,31 @@ def get_jax_var_name(jax_var: jcore.Atom | str) -> str:
             f"Failed to translate the Jax variable '{jax_var}' into a name, the result was empty."
         )
     return jax_var
+
+
+def translate_dtype(dtype: Any) -> dace.typeclass:
+    """Turns a Jax datatype into a DaCe datatype.
+    """
+
+    if(isinstance(dtype, dace.typeclass)):
+        return dtype
+
+    # Make some basic checks if the datatype is okay
+    name_of_dtype = str(dtype)
+    if (not jax.config.read("jax_enable_x64")) and (name_of_dtype == "float64"):
+        raise ValueError("Found a 'float64' type but 'x64' support is disabled.")
+    if name_of_dtype.startswith("complex"):
+        raise NotImplementedError("Support for complecx computation is not implemented yet.")
+
+    # Now extract the datatype from dace, this is extremely ugly.
+    if not hasattr(dace.dtypes, name_of_dtype):
+        raise TypeError(f"Could not find '{name_of_dtype}' ({type(dtype).__name__}) in 'dace'.")
+    dcd_type = getattr(dace.dtypes, name_of_dtype)
+
+    if not isinstance(dcd_type, dace.dtypes.typeclass):
+        raise TypeError(
+            f"'{name_of_dtype}' does not map to a 'dace.typeclass' but to a '{type(dcd_type).__name__}'."
+        )
+    return dcd_type
+
+

From 6779ac8c2a44881556d45803e58ad197a0f4a9c7 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 22 Apr 2024 16:12:30 +0200
Subject: [PATCH 034/458] Implemented a mechanism to generate Jax variables
 without having variables.

This is basically a simple substitute class that can be used instead of a full jax variable.
It is mostly usefull for creating arrays during testing.
However, it should also be used to cretae variables for which we do not have anything.

This essentially replaces the flags that allowed to explicitly specify shape and dtype in the `add_array()` function.
---
 .../translator/jaxpr_translator_driver.py     | 54 ++++++------------
 src/jace/util/__init__.py                     |  5 +-
 src/jace/util/jax.py                          | 55 ++++++++++++++++---
 3 files changed, 70 insertions(+), 44 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 25e8cec..821b454 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -327,7 +327,7 @@ def get_arrays(self) -> Mapping[str, ddata.Data]:
 
     def get_array(
         self,
-        name: str | jcore.Atom,
+        name: str | jcore.Atom | jutil.JaCeVar,
     ) -> ddata.Data:
         """Returns the SDFG `Data` object `name` referees to.
 
@@ -338,7 +338,7 @@ def get_array(
 
         if isinstance(name, str):
             pass
-        elif isinstance(name, jcore.Atom):
+        elif isinstance(name, (jcore.Atom, jutil.JaCeVar)):
             name = self.map_jax_var_to_sdfg(name)
         else:
             raise TypeError(f"Does not know how to handle '{type(name).__name__}'.")
@@ -350,19 +350,19 @@ def get_array(
     @overload
     def map_jax_var_to_sdfg(
         self,
-        jax_var: str | jcore.Atom,
+        jax_var: str | jcore.Atom | jutil.JaCeVar,
     ) -> str: ...
 
     @overload
     def map_jax_var_to_sdfg(
         self,
-        jax_var: str | jcore.Atom,
+        jax_var: str | jcore.Atom | jutil.JaCeVar,
         allow_fail: bool,
     ) -> str | None: ...
 
     def map_jax_var_to_sdfg(
         self,
-        jax_var: str | jcore.Atom,
+        jax_var: str | jcore.Atom | jutil.JaCeVar,
         allow_fail: bool = False,
     ) -> str | None:
         """Returns the name of the SDFG variable that the Jax variable `jax_var` is referring to.
@@ -372,7 +372,7 @@ def map_jax_var_to_sdfg(
             allow_fail:     If mapping is not known return `None` instead of raise `KeyError`.
         """
         assert self._jax_name_map is not None
-        assert isinstance(jax_var, (jcore.Atom, str))
+        assert isinstance(jax_var, (jcore.Atom, str, jutil.JaCeVar))
 
         jax_var = jutil.get_jax_var_name(jax_var)
         if jax_var not in self._jax_name_map:
@@ -462,7 +462,7 @@ def get_rev_idx(self) -> int:
 
     def add_jax_name_mapping(
         self,
-        jax_var: str | jcore.Atom,
+        jax_var: str | jcore.Atom | jutil.JaCeVar,
         sdfg_name: str,
     ) -> JaxprTranslationDriver:
         """Creates a mapping between `jax_var` to `sdfg_name`.
@@ -477,7 +477,7 @@ def add_jax_name_mapping(
             sdfg_name:   The name of the corresponding SDFG variable.
         """
         assert self._jax_name_map is not None
-        assert isinstance(jax_var, (jcore.Atom, str))
+        assert isinstance(jax_var, (jcore.Atom, str, jutil.JaCeVar))
         assert isinstance(sdfg_name, str)
 
         jax_name = jutil.get_jax_var_name(jax_var)
@@ -518,7 +518,7 @@ def add_reserved_names(
 
     def add_array(
         self,
-        arg: jcore.Atom,
+        arg: jcore.Atom | jutil.JaCeVar,
         *,
         as_transient: bool = True,
         alt_name: str | None = None,
@@ -526,8 +526,6 @@ def add_array(
         force_array: bool = False,
         as_view: bool = False,
         strides: Sequence[int | dace.symbol | str] | None = None,
-        shape: Sequence[int | dace.symbol | str] | None = None,
-        dtype: dace.typeclass | None = None,
         symb_strides: bool | None = None,
         find_new_name: bool | None = None,
         allow_literals: bool = False,
@@ -575,8 +573,6 @@ def add_array(
             as_view:            Creates a view instead of an array, if it is a scalar
                                     it is silently ignored.
             strides:            Instead of the default strides use these values.
-            shape:              Use this shape; only in conjunction with `dtype`, `alt_name` and `arg is None`.
-            dtype:              Use this dtype; only in conjunction with `shape`, `alt_name` and `arg is None`.
             symb_strides:       Create symbols and use them for fully symbolic strides.
             find_new_name:      The translator will try to find a new name if the designated
                                     is already occupied. This does not work if the name
@@ -596,27 +592,13 @@ def add_array(
             Specifying `alt_name` implies `find_new_name=False`.
             The effect of specifying `force_jax_name` is as passing
                 `jutil.get_jax_var_name(arg)` as `alt_name`.
+            If you need to create a special array, you can use `jace.util.JaCeVar`
+                to create a pseudo Jax variable.
         """
-        assert all(x is not None for x in (self._sdfg, self._jax_name_map))
+        assert self.is_allocated()
 
-        if arg is None:
-            if not isinstance(dtype, dace.typeclass):
-                raise ValueError(
-                    f"'arg' was 'None' but 'dtype' was not a type, instead '{type(dtype).__name__}'."
-                )
-            if not isinstance(shape, Sequence):
-                raise ValueError(f"'arg' was 'None' but 'shape' was invalid, got '{shape}'.")
-            if not all(isinstance(x, (int | dace.symbol | str)) for x in shape):
-                raise ValueError(f"'arg' was 'None' but 'shape' was invalid, got '{shape}'.")
-            if alt_name is None:
-                raise ValueError("'arg' was 'None' but 'alt_name' was not specified.")
-        else:
-            if shape is not None:
-                raise ValueError(f"Specified 'arg', but also passed a shape: '{shape}'")
-            if dtype is not None:
-                raise ValueError(f"Specified 'arg', but also passed a dtype: '{dtype}'")
-            shape: Sequence[int] = arg.aval.shape  # Shape of the array
-            dtype = jutil.translate_dtype(arg.aval.dtype)
+        shape: Sequence[int] = jutil.get_jax_var_shape(arg)
+        dtype = jutil.get_jax_var_dtype(arg)
         offset = None  # i.e. no offset
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
         is_scalar: bool = shape == ()
@@ -667,7 +649,7 @@ def add_array(
         elif alt_name is not None:
             prop_name = alt_name  # Just for completion: will be ignored later
 
-        elif isinstance(arg, jcore.Var):
+        elif isinstance(arg, (jcore.Var, jutil.JaCeVar)):
             prop_name = jutil.get_jax_var_name(arg)
             if prop_name.startswith("__"):
                 raise ValueError(
@@ -677,7 +659,7 @@ def add_array(
             if name_prefix is not None:
                 prop_name = name_prefix + prop_name
 
-        elif isinstance(arg, jcore.Literal):
+        elif isinstance(arg, jcore.Literal):  # type: ignore[unreachable]
             if not allow_literals:
                 raise NotImplementedError("Jax Literals are not supported.")
             if alt_name is None:
@@ -770,7 +752,7 @@ def add_array(
 
     def create_jax_var_list(
         self,
-        jax_var_list: Sequence[jcore.Atom],
+        jax_var_list: Sequence[jcore.Atom | jutil.JaCeVar],
         prevent_creation: bool = False,
         only_creation: bool = False,
         **kwargs: Any,
@@ -803,7 +785,7 @@ def create_jax_var_list(
                 if only_creation:
                     raise ValueError(f"Requested 'only_creation', but '{jax_var}' is a 'Literal'.")
                 ret_list.append(None)
-            elif isinstance(jax_var, jcore.jax_var):
+            elif isinstance(jax_var, (jcore.Var, jutil.JaCeVar)):
                 mapped_sdfg_name: str | None = self.map_jax_var_to_sdfg(jax_var, allow_fail=True)
                 if (mapped_sdfg_name is None) and prevent_creation:
                     raise ValueError(f"prevent_creation' given but have to create '{jax_var}'.")
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 8831446..0bd9a15 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -9,12 +9,15 @@
 
 from __future__ import annotations
 
-from .jax import get_jax_var_name, translate_dtype
+from .jax import JaCeVar, get_jax_var_dtype, get_jax_var_name, get_jax_var_shape, translate_dtype
 from .util import ensure_iterability
 
 
 __all__ = [
     "get_jax_var_name",
+    "get_jax_var_shape",
+    "get_jax_var_dtype",
     "ensure_iterability",
     "translate_dtype",
+    "JaCeVar",
 ]
diff --git a/src/jace/util/jax.py b/src/jace/util/jax.py
index 22f49f4..3d8d0f7 100644
--- a/src/jace/util/jax.py
+++ b/src/jace/util/jax.py
@@ -13,14 +13,33 @@
 
 from __future__ import annotations
 
+from dataclasses import dataclass
+from typing import Any
+
+import dace
 import jax
 import jax.core as jcore
 
-import dace
 
+@dataclass(init=True, repr=True, eq=True, frozen=True, slots=True)
+class JaCeVar:
+    """Substitute class for Jax' `Var` instance.
+
+    This class is similar to a `jax.core.Var` class, but much simpler.
+    It is only a container for a name, shape and a datatype.
+    All extractor functions `get_jax_var{name, shape, dtype}()` will accept it,
+    as well as multiple functions of the driver.
+
+    Notes:
+        Main intention is to test functionality.
+    """
+
+    name: str
+    shape: tuple[int | dace.symbol | str]
+    dtype: dace.typeclass
 
 
-def get_jax_var_name(jax_var: jcore.Atom | str) -> str:
+def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
     """Returns the name of the Jax variable as a string.
 
     Args:
@@ -31,6 +50,8 @@ def get_jax_var_name(jax_var: jcore.Atom | str) -> str:
     """
     if isinstance(jax_var, jcore.DropVar):
         return "_"
+    if isinstance(jax_var, JaCeVar):
+        return jax_var.name
     if isinstance(jax_var, jcore.Atom):
         jax_name = str(jax_var)  # This only works up to some version
     elif isinstance(jax_var, str):
@@ -48,11 +69,33 @@ def get_jax_var_name(jax_var: jcore.Atom | str) -> str:
     return jax_var
 
 
-def translate_dtype(dtype: Any) -> dace.typeclass:
-    """Turns a Jax datatype into a DaCe datatype.
+def get_jax_var_shape(jax_var: jcore.Atom) -> tuple[int, ...]:
+    """Returns the shape of a Jax variable.
+
+    Args:
+        jax_var:     The variable to process
     """
+    if isinstance(jax_var, jcore.Atom):
+        return jax_var.aval.shape
+    if isinstance(jax_var, JaCeVar):
+        assert isinstance(jax_var.shape, tuple)
+        return jax_var.shape
+    raise TypeError(f"'get_jax_var_shape()` is not implemented for '{type(jax_var)}'.")
+
+
+def get_jax_var_dtype(jax_var: jcore.Atom) -> dace.typeclass:
+    """Returns the DaCe equivalent of `jax_var`s datatype."""
+    if isinstance(jax_var, jcore.Atom):
+        return translate_dtype(jax_var.aval.dtype)
+    if isinstance(jax_var, JaCeVar):
+        return translate_dtype(jax_var.dtype)
+    raise TypeError(f"'get_jax_var_dtype()` is not implemented for '{type(jax_var)}'.")
+
 
-    if(isinstance(dtype, dace.typeclass)):
+def translate_dtype(dtype: Any) -> dace.typeclass:
+    """Turns a Jax datatype into a DaCe datatype."""
+
+    if isinstance(dtype, dace.typeclass):
         return dtype
 
     # Make some basic checks if the datatype is okay
@@ -72,5 +115,3 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
             f"'{name_of_dtype}' does not map to a 'dace.typeclass' but to a '{type(dcd_type).__name__}'."
         )
     return dcd_type
-
-

From 9f9fc2ca0dcb7db0c36a17b36faa6e8e2187bb80 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 23 Apr 2024 09:10:13 +0200
Subject: [PATCH 035/458] More refactoring.

---
 .../translator/jaxpr_translator_driver.py     | 51 ++++++++++++-------
 src/jace/util/jax.py                          |  2 +-
 2 files changed, 34 insertions(+), 19 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 821b454..2c2c807 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -589,6 +589,7 @@ def add_array(
                 the function will always look for a new name, even if the initial
                 name was fine. If it is `False` the function will never look for
                 a new new, thus if the name is unavailable an error is generated.
+                However, this excluds variable names that are known.
             Specifying `alt_name` implies `find_new_name=False`.
             The effect of specifying `force_jax_name` is as passing
                 `jutil.get_jax_var_name(arg)` as `alt_name`.
@@ -603,6 +604,23 @@ def add_array(
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
         is_scalar: bool = shape == ()
 
+        if (alt_name is None) and (self.map_jax_var_to_sdfg(arg, allow_fail=True) is not None):
+            # Maybe the test could be more robust, but it will check if we try to create
+            #  a variable for a second time. It is, however, okay to use one as template,
+            #  if another name is specified from the beginning.
+            raise ValueError(
+                f"Tried to create variable '{arg}' again, without specifying an alternative name.."
+            )
+        if force_jax_name:
+            if alt_name is not None:
+                raise ValueError(
+                    f"Specified 'force_jax_name', but passed '{alt_name}' as 'alt_name'."
+                )
+            if name_prefix is not None:
+                raise ValueError(
+                    f"Specified 'force_jax_name', but passed '{name_prefix}' as 'name_prefix'."
+                )
+            alt_name = jutil.get_jax_var_name(arg)
         if alt_name is not None:
             assert isinstance(alt_name, str)
             find_new_name = False  # If a name was given, then use it no matter what.
@@ -627,6 +645,7 @@ def add_array(
         if as_view and (not as_transient):
             raise ValueError("You tried to create a global view, which is not allowed.")
 
+        # Checking the strides.
         if (symb_strides is None) and (strides is None):
             def_symb_stride = False  # default value for symbolic strides
             symb_strides = False if (len(shape) <= 1) else def_symb_stride  # Keep for the future
@@ -640,15 +659,10 @@ def add_array(
         else:
             assert isinstance(symb_strides, bool)
 
-        # SDFG variable name
-        if force_jax_name:
-            alt_name = jutil.get_jax_var_name(arg)
-            if name_prefix is not None:
-                alt_name = name_prefix + alt_name
-
-        elif alt_name is not None:
+        # Now we determine the proposed name of the variable.
+        #  Depending on the situation, we will further manipulate it.
+        if alt_name is not None:
             prop_name = alt_name  # Just for completion: will be ignored later
-
         elif isinstance(arg, (jcore.Var, jutil.JaCeVar)):
             prop_name = jutil.get_jax_var_name(arg)
             if prop_name.startswith("__"):
@@ -658,16 +672,13 @@ def add_array(
                 )
             if name_prefix is not None:
                 prop_name = name_prefix + prop_name
-
         elif isinstance(arg, jcore.Literal):  # type: ignore[unreachable]
             if not allow_literals:
                 raise NotImplementedError("Jax Literals are not supported.")
             if alt_name is None:
                 raise ValueError(f"Passed literal '{arg}', but not specified a name to use.")
-
         else:
             raise TypeError(f"Does not know how to handle '{type(arg).__name__}'.")
-
         if alt_name is None:
             # If we are the root translator, then we will use `prop_name` directly;
             #  otherwise we will append the revision of `self` to the name.
@@ -675,11 +686,13 @@ def add_array(
         else:
             arg_name = str(alt_name)
 
+        # Determine if we should look for a new name or not, if nothing was specified
         if find_new_name is None:
-            # Determine if we should look for a new name or not, if nothing was specified
-            find_new_name = (arg_name in self._forbidden_names) or (
-                arg_name in self._reserved_names
-            )
+            if arg_name in self._reserved_names:
+                find_new_name = True
+            if arg_name in self._forbidden_names:
+                find_new_name = True
+
         if find_new_name:
             # We have to find a new name.
             name_tmpl = "_jax_variable__" + arg_name + "__{}"
@@ -696,11 +709,13 @@ def add_array(
             else:
                 raise ValueError(f"Failed to find a replacement name for '{arg_name}'")
             del iCounter, _arg_name
-        elif arg_name in self._forbidden_names:
+
+        # Final name check
+        if arg_name in self._forbidden_names:
             raise ValueError(f"Can't create variable '{arg_name}', name is forbidden.")
-        elif arg_name in self._sdfg.arrays:
+        if arg_name in self._sdfg.arrays:
             raise ValueError(f"Can't create variable '{arg_name}', variable is already created.")
-        elif not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", arg_name):
+        if not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", arg_name):
             raise ValueError(f"The requested variable name '{arg_name}' is invalid.")
 
         # Promotion of scalar to array.
diff --git a/src/jace/util/jax.py b/src/jace/util/jax.py
index 3d8d0f7..755e6a3 100644
--- a/src/jace/util/jax.py
+++ b/src/jace/util/jax.py
@@ -35,7 +35,7 @@ class JaCeVar:
     """
 
     name: str
-    shape: tuple[int | dace.symbol | str]
+    shape: tuple[int | dace.symbol | str, ...] | int | dace.symbol | str | tuple[()]
     dtype: dace.typeclass
 
 
From 9a32f5d9bbc92f4941ddfb2e8f0159f94227ead7 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 23 Apr 2024 09:32:24 +0200
Subject: [PATCH 036/458] Updated the test for the driver.

---
 tests/test_jaxpr_translator_driver.py | 167 ++++++++++++++++++++++++--
 1 file changed, 160 insertions(+), 7 deletions(-)

diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 2becc04..ad70e05 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -24,7 +24,7 @@ def alloc_driver():
     return driver
 
 
-def test_driver_alloc():
+def test_driver_alloc() -> None:
     """Tests the state right after allocation."""
     driver = jtrans.JaxprTranslationDriver()
     assert not driver.is_allocated(), "Driver was created allocated."
@@ -42,7 +42,7 @@ def test_driver_alloc():
     assert driver.get_terminal_sdfg_state() is driver._init_sdfg_state
 
 
-def test_driver_fork():
+def test_driver_fork() -> None:
     """Tests the fork ability of the driver."""
 
     # This is the parent driver.
@@ -74,11 +74,20 @@ def test_driver_fork():
     assert dolly._reserved_names is not driver._reserved_names
 
     # Test if allocation of fork works properly
-    dolly_only_res_names = ["c"]  # reserved names that are only known to dolly
+    dolly_only_res_names = ["c"]  # reserved names that are only known to dolly; Added latter
     dolly_full_res_names = org_res_names.union(dolly_only_res_names)
-    dolly._allocate_translation_ctx("dolly", reserved_names=dolly_only_res_names)
+    dolly._allocate_translation_ctx(
+        "dolly",
+    )
 
     assert dolly.is_allocated()
+    assert dolly._reserved_names == org_res_names
+    assert driver._reserved_names == org_res_names
+
+    # Now adding reserved names to dolly after construction.
+    dolly.add_reserved_names(None)
+    assert dolly._reserved_names == org_res_names
+    dolly.add_reserved_names(dolly_only_res_names)
     assert dolly._reserved_names == dolly_full_res_names
     assert driver._reserved_names == org_res_names
 
@@ -98,11 +107,11 @@ def test_driver_fork():
     driver._clear_translation_ctx()
     assert not driver.is_allocated()
     assert driver.is_head_translator()
-    assert driver._reserved_names is None
     assert driver._rev_manager._next_revision == dolly_rev
+    assert driver._reserved_names is None
 
 
-def test_driver_append_state(alloc_driver):
+def test_driver_append_state(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
     """Tests the functionality of appending states."""
     sdfg: dace.SDFG = alloc_driver.get_sdfg()
 
@@ -138,7 +147,151 @@ def test_driver_append_state(alloc_driver):
     assert next(iter(sdfg.in_edges(non_terminal_state))).src is terminal_state_1
 
 
+def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
+    """This function tests the array creation routines.
+
+    However, it does so without using Jax variables.
+    """
+    from dace.data import Array, Data, Scalar
+
+    from jace.util import JaCeVar
+
+    # Since we do not have Jax variables, we are using JaCe substitute for it.
+
+    # Creating a scalar.
+    scal1_j = JaCeVar("scal1", (), dace.float64)
+    scal1_: str = alloc_driver.add_array(
+        arg=scal1_j,
+        update_var_mapping=True,
+    )
+    scal1: Data = alloc_driver.get_array(scal1_)
+    assert scal1 is alloc_driver.get_array(scal1_j)
+    assert scal1_ == alloc_driver.map_jax_var_to_sdfg(scal1_j)
+    assert isinstance(scal1, Scalar)
+    assert scal1_ == scal1_j.name
+    assert scal1.dtype == scal1_j.dtype
+
+    # Create a scalar and force it as an array
+    scal2_j = JaCeVar("scal2", (), dace.int64)
+    scal2_: str = alloc_driver.add_array(
+        arg=scal2_j,
+        force_array=True,
+    )
+    scal2: Data = alloc_driver.get_array(scal2_)
+    assert isinstance(scal2, Array)
+    assert scal2_ == scal2_j.name
+    assert scal2.shape == (1,)
+    assert scal2.strides == (1,)
+    assert scal2.dtype == scal2_j.dtype
+
+    # Create a scalar force it as an array and use symbolic strides.
+    scal3_j = JaCeVar("scal3", (), dace.int64)
+    scal3_: str = alloc_driver.add_array(
+        arg=scal3_j,
+        force_array=True,
+        symb_strides=True,  # Will have no effect.
+    )
+    scal3: Data = alloc_driver.get_array(scal3_)
+    assert isinstance(scal2, Array)
+    assert scal3_ == scal3_j.name
+    assert scal3.shape == (1,)
+    assert scal3.strides == (1,)
+    assert scal3.dtype == scal3_j.dtype
+
+    # Using a special name for the variable
+    scal4_j = scal3_j
+    scal4_n = "scal4_special_name"
+    scal4_: str = alloc_driver.add_array(
+        arg=scal4_j,
+        alt_name=scal4_n,
+        update_var_mapping=True,
+    )
+    assert scal4_ == scal4_n
+    assert scal4_ == alloc_driver.map_jax_var_to_sdfg(scal4_j)
+
+    # Test the prefix functionality
+    scal5_j = JaCeVar("scal5", (), dace.float64)
+    scal5_p = "my_prefix"
+    scal5_: str = alloc_driver.add_array(
+        arg=scal5_j,
+        name_prefix=scal5_p,
+    )
+    assert scal5_.startswith(scal5_p)
+    assert scal5_j.name in scal5_
+
+    # Allocating an array
+    arr1_j = JaCeVar("arr1", (5, 3), dace.float32)
+    arr1_: str = alloc_driver.add_array(
+        arg=arr1_j,
+    )
+    arr1: Data = alloc_driver.get_array(arr1_)
+    assert isinstance(arr1, Array)
+    assert arr1_ == arr1_j.name
+    assert arr1.shape == arr1_j.shape
+    assert arr1.strides == (3, 1)
+    assert arr1.dtype == arr1_j.dtype
+
+    # Create a variable that has a name that is already known.
+    arr2_j = JaCeVar(arr1_, (10,), dace.float64)
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=f"Can't create variable '{arr2_j.name}', variable is already created.",
+    ):
+        arr2_: str = alloc_driver.add_array(arg=arr2_j)
+    with pytest.raises(expected_exception=ValueError, match=f"Variable '{arr1_}' already exists."):
+        # `alt_name` will not work because variable still exists.
+        arr2_ = alloc_driver.add_array(arg=arr2_j, alt_name=arr2_j.name)
+    # However, specifying `find_new_name` will solve this issue
+    #  NOTE: Doing this is not a good idea.
+    arr2_ = alloc_driver.add_array(
+        arg=arr2_j,
+        find_new_name=True,
+    )
+    assert arr2_.startswith("_jax_variable__" + arr2_j.name)
+
+    # Create a variable that has a custom stride
+    arr3_j = JaCeVar("arr3", (5, 1, 3), dace.float64)
+    arr3_st = (5, 3, 2)
+    arr3_: str = alloc_driver.add_array(
+        arg=arr3_j,
+        strides=arr3_st,
+    )
+    arr3: Data = alloc_driver.get_array(arr3_)
+    assert isinstance(arr3, Array)
+    assert arr3.shape == arr3_j.shape
+    assert arr3.strides == arr3_st
+
+    # Test if specifying `symb_strides` and a stride at the same time is an error.
+    arr4_j = JaCeVar("arr4", arr3_j.shape, dace.uintp)
+    arr4_st = arr3_st
+    with pytest.raises(
+        expected_exception=ValueError,
+        match="Specified 'symb_strides' and 'stride at the same time.",
+    ):
+        arr4_: str = alloc_driver.add_array(
+            arg=arr4_j,
+            symb_strides=True,
+            strides=arr4_st,
+        )
+
+    # Test if specifying the symbolic stride alone works.
+    #  Because a shape is `1` there should be no symbolic for it.
+    arr4_ = alloc_driver.add_array(
+        arg=arr4_j,
+        symb_strides=True,
+    )
+    arr4: Data = alloc_driver.get_array(arr4_)
+    assert isinstance(arr4, Array)
+    assert arr4.shape == arr4_j.shape
+
+    for shp, stri in zip(arr4.shape, arr4.strides):
+        if shp == 1:
+            assert isinstance(stri, int)
+            assert stri == 0, f"Expected a stride of 0, but got '{stri}'."
+        else:
+            assert isinstance(stri, (str, dace.symbol))
+
+
 if __name__ == "__main__":
     test_driver_alloc()
     test_driver_fork()
-    test_driver_append_state(alloc_driver())

From e3090c9632a872f02c5287385d3ffb9ae4dd1385 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 23 Apr 2024 10:35:59 +0200
Subject: [PATCH 037/458] Added the implementation of teh Jaxpr translator,
 known as driver.

---
 .../translator/jaxpr_translator_driver.py     | 1243 +++++++++++++++++
 1 file changed, 1243 insertions(+)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 267c72b..2c2c807 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -7,6 +7,18 @@
 
 from __future__ import annotations
 
+import re
+from collections.abc import Collection, Iterable, Mapping, Sequence
+from typing import Any, Final, cast, overload
+
+import dace
+import jax
+from dace import data as ddata, properties as dprop
+from jax import core as jcore
+
+from jace import translator as jtrans, util as jutil
+from jace.translator import sub_translators as jtsubt, util as jtrutil
+
 
 class JaxprTranslationDriver:
     """Internal driver class for creating an SDFG equivalent of a `Jaxpr` instance.
@@ -46,3 +58,1234 @@ class JaxprTranslationDriver:
         Find a better way than to allow giving access to protected functions.
             Probably using composition with the higher level instance.
     """
+
+    # Member variables private to an instance, i.e. they are not passed on to the children.
+    #  By definition all of them belongs to the translation context but not all variable of
+    #  the translation context are private, some are actually shared.
+    __private_slots__ = (
+        "_sdfg",
+        "_term_sdfg_state",
+        "_init_sdfg_state",
+        "_jax_name_map",
+        "_sdfg_in_names",
+        "_sdfg_out_names",
+        "_rev_idx",
+    )
+    # Variables that are shared among the instances of a family.
+    __shared_slots__ = (
+        "_reserved_names",  # Part of the context, but is copied.
+        "_sub_translators",
+        "_rev_manager",  # This is the revision counter manager
+    )
+    __slot__ = __private_slots__ + __shared_slots__
+
+    def __init__(
+        self,
+        **kwargs: Any,
+    ) -> None:
+        """Creates the base translator.
+
+        All arguments that does not start with an underscore are used as
+        arguments to construct the subtranslators.
+
+        Args:
+            _no_shared_alloc (bool):     If set then all allocation will be avoided (internal)
+
+        Notes:
+            This function will not allocate the translation context of `self`
+                but will only allocate the shared members.
+            By setting `_no_shared_alloc` to `True` the function will not allocate
+                the shared part. This flag is provided only for implementing
+                `self.fork()` using it is an error and undefined behaviour.
+        """
+        allocate_shared_parts: bool = not kwargs.pop("_no_shared_alloc", False)
+
+        # Contains all the subtranslators that we need.
+        #  They are partitioned by the names of the primitive they have registered for.
+        #  Inside a partition they are ordered by priority, lowest first, more important.
+        #  This member is allocated by '_init_sub_translators()' and remains allocated
+        #  during the lifetime of the object.
+        self._sub_translators: dict[str, list[jtrans.JaCeSubTranslatorInterface]] = None  # type: ignore[assignment]
+
+        # The SDFG object that we are currently constructing.
+        #  Only allocated during an ongoing translation.
+        self._sdfg: dace.SDFG = None
+
+        # This is the HEAD SDFG state, i.e. the last state in which we translated an equation.
+        #  Only allocated during an ongoing translation.
+        self._term_sdfg_state: dace.SDFGState = None
+
+        # This is the beginning of the SDFG, i.e. the original SDFG HEAD.
+        #  Only allocated during an ongoing translation.
+        self._init_sdfg_state: dace.SDFGState = None
+
+        # This is the mapping, that maps the Jax name to the name that is used inside the SDFG.
+        #  Only allocated during an ongoing translation.
+        self._jax_name_map: dict[str, str] = None  # type: ignore[assignment]
+
+        # These names can not be used for the automatic naming of Jax variables.
+        #  They differ from the forbidden names, that they denote valid SDFG names.
+        #  An example would be names of the function arguments.
+        #  Only allocated during an ongoing translation.
+        self._reserved_names: set[str] = None  # type: ignore[assignment]
+
+        # These are the names of the SDFG variables that serves as input and output.
+        #  They have the same order as in the Jaxpr.
+        #  Only allocated during an ongoing translation.
+        self._sdfg_in_names: Sequence[str] = None  # type: ignore[assignment]
+        self._sdfg_out_names: Sequence[str] = None  # type: ignore[assignment]
+
+        # This is the manager for the revision counter.
+        #  It is shared among all children.
+        #  Might be overwritten if we are in the context of 'fork()'.
+        self._rev_manager: jtrutil.RevisionCounterManager = jtrutil.RevisionCounterManager()
+
+        # This is the revision of self.
+        #  Unlike the manager it is not shared and private.
+        #  Might be overwritten in the context of a fork.
+        self._rev_idx: int = self._rev_manager.assign_revision()
+        assert self.is_head_translator()
+
+        # If requested we will now allocate some internal state
+        if allocate_shared_parts:
+            self._init_sub_translators(kwargs)
+
+    def translate_jaxpr(
+        self,
+        jaxpr: jcore.ClosedJaxpr,
+        *,
+        inp_scalar_as_array: bool = False,
+        name: str | None = None,
+        reserved_names: str | Collection[str] | None = None,
+        allow_empty_jaxpr: bool = False,
+        **kwargs: Any,
+    ) -> jtrutil.JaCeTranslationMemento:
+        """Perform the translation of a Jaxpr description into a SDFG.
+
+        Returns:
+            The function will translate the passed Jaxpr object into an SDFG.
+            However, the SDFG will be in canonical form and needs further
+            processing. The SDFG is encapsulated inside a `JaCeTranslationMemento`,
+            that contains additional metadata for further manipulation.
+
+        Args:
+            inp_scalar_as_array:    Translate scalar _input_ arguments to arrays of length 1.
+            name:                   Use this name for the SDFG instead some generated one.
+            reserved_names:         Prevent the generation of variables with these names,
+                                        see `self.add_array()` for more.
+            allow_empty_jaxpr:      Allows empty Jaxpr.
+
+        Returns:
+            The function will not return the SDFG directly.
+            Instead it will be wrapped inside a `JaCeTranslationMemento` instance.
+            That contains the SDFG and some meta data needed for further processing.
+        """
+        if self.is_allocated():
+            raise RuntimeError(
+                "The translator driver is already allocated, you should resort to 'fork()'."
+            )
+        if (len(jaxpr.eqns) == 0) and (not allow_empty_jaxpr):
+            raise ValueError("Passed an empty Jaxpr, but did not allow for empty Jaxpr.")
+        if not isinstance(jaxpr, jcore.ClosedJaxpr):
+            raise TypeError(f"Expected a 'jax.core.ClosedJaxp' instance but got '{type(jaxpr)}'")
+        if len(jaxpr.effects) != 0:
+            raise NotImplementedError("'Jaxpr' with side effects are not supported.")
+        if len(jaxpr.out_avals) == 0:
+            raise ValueError("Jaxpr has zero output variables.")
+        if not jax.config.read("jax_enable_x64"):
+            raise NotImplementedError("The translation only works if 'jax_enable_x64' is enabled.")
+
+        # Consume the hidden flags
+        _clear_translation_ctx: bool = kwargs.pop("_clear_translation_ctx", True)
+
+        self._allocate_translation_ctx(
+            name=name,
+            reserved_names=reserved_names,
+        )
+        self._create_initial_input(
+            jaxpr=jaxpr,
+            inp_scalar_as_array=inp_scalar_as_array,
+        )
+        self._create_constants(
+            jaxpr=jaxpr,
+        )
+        memento: jtrutil.JaCeTranslationMemento = self._translate_jaxpr_internal(jaxpr)
+
+        # If the translation context is not cleared `self` and `memento` will share the same data.
+        #  There is some legitimate use for that.
+        if _clear_translation_ctx:
+            self._clear_translation_ctx()
+
+        return memento
+
+    def fork(self) -> JaxprTranslationDriver:
+        """Return a child of `self` ready for transformation.
+
+        The returned object should be seen as a partial clone if `self`. It will
+        have an unallocated translation context, but all other variables are schared.
+        To distinguish children all have a unique identifier, see `self.same_family()`.
+
+        The main reason for its function is to implement nested Jaxpr. If
+        `self.translate_jaxpr()` is called on the returned object it will behave
+        the exact same way as its parent would, with a different Jaxpr argument.
+
+        Notes:
+            A user has to ensure that the lifetime of a child ends before the
+                lifetime of its direct parent. In case of a head translator,
+                the lifetime of its children have to end before the translation
+                process finishes.
+            It is important that a clone instance should not be reused,
+                instead you should fork it again.
+        """
+        from copy import copy as scpy
+
+        if not self.is_allocated():
+            raise RuntimeError("Only allocated driver can fork.")
+
+        # Create a new (empty) driver instance; prevent allocation to make it cheep
+        dolly: JaxprTranslationDriver = JaxprTranslationDriver(_no_shared_alloc=True)
+
+        # Copy the shared members from parent to fork.
+        for slot_name in self.__shared_slots__:
+            setattr(dolly, slot_name, getattr(self, slot_name))
+
+        # Handle the special members and initialize them.
+        dolly._rev_idx = dolly._rev_manager.assign_revision()
+        assert not dolly.is_head_translator()
+
+        # We will now copy the reserved name list
+        #  Although they are shared, only their content is shared.
+        #  This prevents a feedback from the child to the parent.
+        dolly._reserved_names = scpy(self._reserved_names)
+
+        return dolly
+
+    def append_new_state(
+        self,
+        label: str | None = None,
+        condition: dprop.CodeBlock | None = None,
+        assignments: Mapping[str, Any] | None = None,
+        *,
+        prev_state: dace.SDFGState | None = None,
+    ) -> dace.SDFGState:
+        """Creates a new `SDFGState` and adds it to the SDFG.
+
+        By default the new state is appended to the current terminal state.
+        This will also update the terminal SDFG state of `self`.
+
+        However, if `prev_state` is specified the state new state will be
+        appended to `prev_state` instead. This will not modify the terminal
+        state unless `prev_state` is the current terminal state.
+
+        Args:
+            label:          The name that should be given to the new `SDFGState`.
+            condition:      The condition of the state transitions used on the `InterstateEdge`.
+            assignments:    Symbol assignments that should be done during the transition.
+            prev_state:     Alternative `SDFGState` at which we should append the new state.
+
+        Notes:
+            In case no `SDFGState` exists yet, an initial SDFGState will be created first.
+        """
+        assert self._sdfg is not None
+
+        # Test if we must create a start state.
+        if self._sdfg.start_block is None:
+            assert all(
+                x is None for x in (self._init_sub_translators, self._term_sdfg_state, prev_state)
+            )
+            self._init_sdfg_state = self._sdfg.add_state(label="initial_state", is_start_block=True)
+            self._term_sdfg_state = self._init_sdfg_state
+
+        # Decide if appending to that state will modify the terminal state.
+        modify_term_state: bool = False
+        if (prev_state is self._term_sdfg_state) or (prev_state is None):
+            modify_term_state = True
+            app_state = self._term_sdfg_state
+        else:
+            app_state = prev_state
+
+        new_state = self._sdfg.add_state(label, is_start_block=False)
+        self._sdfg.add_edge(
+            app_state,
+            new_state,
+            dace.sdfg.InterstateEdge(condition=condition, assignments=assignments),
+        )
+
+        if modify_term_state:
+            self._term_sdfg_state = new_state
+        return new_state
+
+    def get_arrays(self) -> Mapping[str, ddata.Data]:
+        """Get all `Data` descriptors that are currently known to the SDFG.
+
+        Notes:
+            Essentially a shorthand and preferred way for `self.get_sdfg().arrays`.
+            For getting a specific data descriptor use `self.get_array()`.
+        """
+        assert self._sdfg is not None
+        return cast(Mapping[str, ddata.Data], self._sdfg.arrays)
+
+    def get_array(
+        self,
+        name: str | jcore.Atom | jutil.JaCeVar,
+    ) -> ddata.Data:
+        """Returns the SDFG `Data` object `name` referees to.
+
+        If `name` is a string it is directly interpreted as the name of an SDFG variable.
+        In case it is a `jax.core.Atom` it is first translated, see `self.map_jax_var_to_sdfg()`.
+        """
+        assert self._sdfg is not None
+
+        if isinstance(name, str):
+            pass
+        elif isinstance(name, (jcore.Atom, jutil.JaCeVar)):
+            name = self.map_jax_var_to_sdfg(name)
+        else:
+            raise TypeError(f"Does not know how to handle '{type(name).__name__}'.")
+        if name not in self._sdfg.arrays:
+            raise KeyError(f"Requested the SDFG array '{name}' but it is not known.")
+
+        return self._sdfg.arrays[name]
+
+    @overload
+    def map_jax_var_to_sdfg(
+        self,
+        jax_var: str | jcore.Atom | jutil.JaCeVar,
+    ) -> str: ...
+
+    @overload
+    def map_jax_var_to_sdfg(
+        self,
+        jax_var: str | jcore.Atom | jutil.JaCeVar,
+        allow_fail: bool,
+    ) -> str | None: ...
+
+    def map_jax_var_to_sdfg(
+        self,
+        jax_var: str | jcore.Atom | jutil.JaCeVar,
+        allow_fail: bool = False,
+    ) -> str | None:
+        """Returns the name of the SDFG variable that the Jax variable `jax_var` is referring to.
+
+        Args:
+            jax_var:        The Jax variable to look up.
+            allow_fail:     If mapping is not known return `None` instead of raise `KeyError`.
+        """
+        assert self._jax_name_map is not None
+        assert isinstance(jax_var, (jcore.Atom, str, jutil.JaCeVar))
+
+        jax_var = jutil.get_jax_var_name(jax_var)
+        if jax_var not in self._jax_name_map:
+            if allow_fail:
+                return None
+            KeyError(f"The Jax variable '{jax_var}' was never registered.")
+
+        return self._jax_name_map[jax_var]
+
+    def get_sdfg(self) -> dace.SDFG:
+        """Returns the SDFG that is currently constructed.
+
+        If you want access to the arrays of the SDFG use `self.get_arrays()`/`self.get_array()`.
+        """
+        assert self._sdfg is not None
+        assert (self._init_sdfg_state is None) or (self._init_sdfg_state is self._sdfg.start_block)
+        return self._sdfg
+
+    def get_terminal_sdfg_state(self) -> dace.SDFGState:
+        """Returns the current terminal state of the SDFG under construction.
+
+        The SDFGs that are constructed by the driver are essentially a list of states.
+        New states are appended at the current terminal/end state and becoming the new terminal state.
+        This function returns the current terminal state.
+        """
+        assert all(x is not None for x in (self._sdfg, self._term_sdfg_state))
+        return self._term_sdfg_state
+
+    def is_allocated(self) -> bool:
+        """Tests if the translation context of `self` is allocated.
+
+        Notes:
+            It is safe to call this function any time.
+            If this function returns `True` it means that an allocation is ongoing.
+        """
+        small_ctx: Sequence[Any] = [
+            # for the proper implementation of forking the reserved names are handled special.
+            getattr(self, x)
+            for x in self.__private_slots__
+            if x != "_rev_idx"
+        ]
+        assert isinstance(self._rev_idx, int)
+        assert isinstance(self._sub_translators, dict)
+        if all((x is not None) for x in small_ctx):
+            if self._reserved_names is None:
+                raise RuntimeError("Invalid allocation state: Reserved names not allocated.")
+            return True
+        if all((x is None) for x in small_ctx):
+            return False
+        raise RuntimeError("Invalid allocation state: Translation context partially allocated.")
+
+    def is_head_translator(self) -> bool:
+        """Tests if `self` is a head translator.
+
+        A head translator is a translator/driver that was created explicitly,
+        i.e. not by `self.fork()`.
+        """
+        return self._rev_manager.is_root_revision(self._rev_idx)
+
+    def same_family(
+        self,
+        other: JaxprTranslationDriver,
+    ) -> bool:
+        """Test if `self` and `other` belongs to the same family of driver/translators.
+
+        A driver is either explicitly created, i.e. head translator, or created
+        by a call to `fork()`. All drivers that descend from the same head translator
+        from a family.
+
+        """
+        if not isinstance(other, JaxprTranslationDriver):
+            return NotImplemented  # type: ignore[unreachable]
+        if all(getattr(self, x) is getattr(self, x) for x in self.__shared_slots__):
+            return True
+        assert not any(getattr(self, x) is getattr(self, x) for x in self.__shared_slots__)
+
+        return False
+
+    def get_rev_idx(self) -> int:
+        """Returns the revision index of `self`.
+
+        To distinguish members of same family every diver has a unique identifier,
+        known as revision. However, the revision is only unique within a single
+        family and during an ongoing translation.
+        """
+        return self._rev_idx
+
+    def add_jax_name_mapping(
+        self,
+        jax_var: str | jcore.Atom | jutil.JaCeVar,
+        sdfg_name: str,
+    ) -> JaxprTranslationDriver:
+        """Creates a mapping between `jax_var` to `sdfg_name`.
+
+        This function updates the internal map of `self` and after the call
+        `self.map_jax_var_to_sdfg()` will identify `jax_var` with `sdfg_name`.
+        This function is not able to delete a variable mapping that was
+        established before, for this use TBA.
+
+        Args:
+            jax_var:     The Jax variable.
+            sdfg_name:   The name of the corresponding SDFG variable.
+        """
+        assert self._jax_name_map is not None
+        assert isinstance(jax_var, (jcore.Atom, str, jutil.JaCeVar))
+        assert isinstance(sdfg_name, str)
+
+        jax_name = jutil.get_jax_var_name(jax_var)
+        if jax_name in self._jax_name_map:
+            if self._jax_name_map[jax_name] == sdfg_name:  # We consider this as no ops.
+                return self
+            raise ValueError(
+                f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but '{jax_name}'"
+                f" already points to '{self.map_jax_var_to_sdfg(jax_name)}'."
+            )
+        if sdfg_name not in self.get_arrays():
+            raise KeyError(f"Mapping '{jax_name} -> {sdfg_name}': SDFG target unknown.")
+        if sdfg_name in self._forbidden_names:
+            raise NameError(f"Mapping '{jax_name} -> {sdfg_name}': Forbidden name.")
+
+        self._jax_name_map[jax_name] = sdfg_name
+        return self
+
+    def add_reserved_names(
+        self,
+        reserved_names: None | str | Collection[str],
+    ) -> JaxprTranslationDriver:
+        """Adds the names listed in `reserved_names` to the internal list."""
+        assert isinstance(self._reserved_names, set)
+
+        if reserved_names is None:
+            return self
+        if isinstance(reserved_names, str):
+            reserved_names = [reserved_names]
+        elif isinstance(reserved_names, Collection):
+            pass
+        else:
+            raise TypeError(f"Does not know how to handle the type '{type(reserved_names)}'.")
+        if not all(isinstance(x, str) and (len(x) != 0) for x in reserved_names):
+            raise TypeError("Reserved names must all be non empty strings.")
+        self._reserved_names.update(reserved_names)
+        return self
+
+    def add_array(
+        self,
+        arg: jcore.Atom | jutil.JaCeVar,
+        *,
+        as_transient: bool = True,
+        alt_name: str | None = None,
+        name_prefix: str | None = None,
+        force_array: bool = False,
+        as_view: bool = False,
+        strides: Sequence[int | dace.symbol | str] | None = None,
+        symb_strides: bool | None = None,
+        find_new_name: bool | None = None,
+        allow_literals: bool = False,
+        force_jax_name: bool = False,
+        update_var_mapping: bool = False,
+    ) -> str:
+        """Creates an SDFG variable for the Jax variable `arg` and returns its SDFG name.
+
+        By default the function will create a transient, use `as_transient` to
+        change that. By default the function will honor if the Jax variable is
+        a scalar or an array. However, by setting `force_array` the function
+        will always generate an array.
+
+        By default the name for the SDFG variable is derived from the Jax variable.
+        It is guaranteed that this name is unique in the SDFG, even in the presence
+        of nested SDFGs. By specifying `alt_name` it is possible to force a certain
+        name on a variable. It is important that if `alt_name` is specified the function
+        will either generate the variable or fail.
+
+        The  driver distinguishes between two kinds of "bad (SDFG) variable names".
+        The first category are the forbidden names, which the function refuses to generate.
+        The second type are the so called reserved names, which were set at the beginning.
+        These names can be used if they are specified through `alt_name` but are not used
+        in automatic naming.
+
+        If nothing is specified, the strides of the data are determined by DaCe, which is
+        continuous C order. There are two ways to change that.
+        The first way is to specify the `strides` argument, which are then forwarded
+        to the underlying DaCe function. The second way is to set `symb_strides`
+        to `True` in which case the function will generate symbols and use them.
+        However, even if symbolic strides are activated, arrays with just one
+        dimensions have always a non symbolic stride of 1. Furthermore, dimensions
+        with shape 1 will always have stride 0.
+
+        By default this function does not update the internal variable map.
+        However, by setting `update_var_mapping` to `True` the function will
+        update the mapping.
+
+        Args:
+            arg:                The Jax object for which a SDFG equivalent should be created.
+            as_transient:       If set, the SDFG variable is a transient, `True` by default.
+            alt_name:           Try to create the variable with this name; either succeed or fail.
+            name_prefix:        If given and in automatic naming mode, add this prefix to the name.
+            force_array:        Instead of a `dace.Scalar` create a `dace.Array` with one element.
+            as_view:            Creates a view instead of an array, if it is a scalar
+                                    it is silently ignored.
+            strides:            Instead of the default strides use these values.
+            symb_strides:       Create symbols and use them for fully symbolic strides.
+            find_new_name:      The translator will try to find a new name if the designated
+                                    is already occupied. This does not work if the name
+                                    was supplied by `alt_name`.
+            allow_literals:     If `True` then also allows JaxLiterals as `arg`.
+            force_jax_name:     If `True` then, the verbatim Jax name will be used.
+            update_var_mapping: Update the internal variable mapping; by default `False`.
+
+        Notes:
+            If this function is used directly a user is advised to always set
+                `update_var_mapping` to `True`.
+            If `find_new_name` is `None` the default, the function will only
+                look for a new name if there is a need for it. If it is `True`
+                the function will always look for a new name, even if the initial
+                name was fine. If it is `False` the function will never look for
+                a new new, thus if the name is unavailable an error is generated.
+                However, this excluds variable names that are known.
+            Specifying `alt_name` implies `find_new_name=False`.
+            The effect of specifying `force_jax_name` is as passing
+                `jutil.get_jax_var_name(arg)` as `alt_name`.
+            If you need to create a special array, you can use `jace.util.JaCeVar`
+                to create a pseudo Jax variable.
+        """
+        assert self.is_allocated()
+
+        shape: Sequence[int] = jutil.get_jax_var_shape(arg)
+        dtype = jutil.get_jax_var_dtype(arg)
+        offset = None  # i.e. no offset
+        storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
+        is_scalar: bool = shape == ()
+
+        if (alt_name is None) and (self.map_jax_var_to_sdfg(arg, allow_fail=True) is not None):
+            # Maybe the test could be more robust, but it will check if we try to create
+            #  a variable for a second time. It is, however, okay to use one as template,
+            #  if another name is specified from the beginning.
+            raise ValueError(
+                f"Tried to create variable '{arg}' again, without specifying an alternative name.."
+            )
+        if force_jax_name:
+            if alt_name is not None:
+                raise ValueError(
+                    f"Specified 'force_jax_name', but passed '{alt_name}' as 'alt_name'."
+                )
+            if name_prefix is not None:
+                raise ValueError(
+                    f"Specified 'force_jax_name', but passed '{name_prefix}' as 'name_prefix'."
+                )
+            alt_name = jutil.get_jax_var_name(arg)
+        if alt_name is not None:
+            assert isinstance(alt_name, str)
+            find_new_name = False  # If a name was given, then use it no matter what.
+            if len(alt_name) == 0:
+                raise ValueError("Passed an empty 'alt_name'.")
+            if alt_name in self._forbidden_names:
+                raise ValueError("'alt_name' is a forbidden name.")
+            if not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", alt_name):
+                raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
+            if force_jax_name:
+                raise ValueError("Specified 'force_jax_name' but passed 'alt_name'.")
+            if name_prefix is not None:
+                raise ValueError(
+                    f"Specified 'name_prefix' ('{name_prefix}') but passed '{alt_name}' as 'alt_name'."
+                )
+            if alt_name in self._sdfg.arrays:
+                raise ValueError(f"Variable '{alt_name}' already exists.")
+        if name_prefix is not None:
+            assert isinstance(name_prefix, str)
+            if len(name_prefix) == 0:
+                raise ValueError("Specified an empty 'name_prefix'.")
+        if as_view and (not as_transient):
+            raise ValueError("You tried to create a global view, which is not allowed.")
+
+        # Checking the strides.
+        if (symb_strides is None) and (strides is None):
+            def_symb_stride = False  # default value for symbolic strides
+            symb_strides = False if (len(shape) <= 1) else def_symb_stride  # Keep for the future
+        elif (symb_strides is not None) and (strides is not None):
+            raise ValueError("Specified 'symb_strides' and 'stride at the same time.")
+        elif strides is not None:
+            if len(strides) != len(shape):
+                raise ValueError(
+                    f"'strides' has length {len(strides)}, but array rank is {len(shape)}."
+                )
+        else:
+            assert isinstance(symb_strides, bool)
+
+        # Now we determine the proposed name of the variable.
+        #  Depending on the situation, we will further manipulate it.
+        if alt_name is not None:
+            prop_name = alt_name  # Just for completion: will be ignored later
+        elif isinstance(arg, (jcore.Var, jutil.JaCeVar)):
+            prop_name = jutil.get_jax_var_name(arg)
+            if prop_name.startswith("__"):
+                raise ValueError(
+                    f"You tried to create the variable '{prop_name}' which"
+                    "starts with two underscores, use 'alt_name' for that."
+                )
+            if name_prefix is not None:
+                prop_name = name_prefix + prop_name
+        elif isinstance(arg, jcore.Literal):  # type: ignore[unreachable]
+            if not allow_literals:
+                raise NotImplementedError("Jax Literals are not supported.")
+            if alt_name is None:
+                raise ValueError(f"Passed literal '{arg}', but not specified a name to use.")
+        else:
+            raise TypeError(f"Does not know how to handle '{type(arg).__name__}'.")
+        if alt_name is None:
+            # If we are the root translator, then we will use `prop_name` directly;
+            #  otherwise we will append the revision of `self` to the name.
+            arg_name = prop_name + ("" if self.is_head_translator() else f"_rev_idx{self._rev_idx}")
+        else:
+            arg_name = str(alt_name)
+
+        # Determine if we should look for a new name or not, if nothing was specified
+        if find_new_name is None:
+            if arg_name in self._reserved_names:
+                find_new_name = True
+            if arg_name in self._forbidden_names:
+                find_new_name = True
+
+        if find_new_name:
+            # We have to find a new name.
+            name_tmpl = "_jax_variable__" + arg_name + "__{}"
+            for iCounter in range(1000):
+                _arg_name = name_tmpl.format(iCounter)
+                if (
+                    (_arg_name in self._forbidden_names)
+                    or (_arg_name in self._reserved_names)
+                    or (_arg_name in self._sdfg.arrays)
+                ):
+                    continue  # The proposed variable is known, so try next value.
+                arg_name = _arg_name  # We found a name that we can use.
+                break
+            else:
+                raise ValueError(f"Failed to find a replacement name for '{arg_name}'")
+            del iCounter, _arg_name
+
+        # Final name check
+        if arg_name in self._forbidden_names:
+            raise ValueError(f"Can't create variable '{arg_name}', name is forbidden.")
+        if arg_name in self._sdfg.arrays:
+            raise ValueError(f"Can't create variable '{arg_name}', variable is already created.")
+        if not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", arg_name):
+            raise ValueError(f"The requested variable name '{arg_name}' is invalid.")
+
+        # Promotion of scalar to array.
+        if is_scalar and force_array:
+            shape = (1,)
+            symb_strides = False
+            strides = None
+            is_scalar = False
+
+        # Set the stride if we have to change.
+        if strides is not None:
+            strides = tuple(strides)
+            assert len(strides) == len(shape)
+
+        elif (symb_strides is True) and (not is_scalar):
+            strides = [
+                dace.symbol(f"{arg_name}_stride{dim}", dace.int64) if size >= 2 else 0
+                for dim, size in enumerate(shape)
+            ]
+
+        if is_scalar:
+            self._sdfg.add_scalar(
+                name=arg_name, storage=storage, dtype=dtype, transient=as_transient
+            )
+        elif as_view:
+            self._sdfg.add_view(
+                name=arg_name,
+                shape=shape,
+                strides=strides,
+                offset=offset,
+                storage=storage,
+                dtype=dtype,
+            )
+        else:
+            self._sdfg.add_array(
+                name=arg_name,
+                shape=shape,
+                strides=strides,
+                offset=offset,
+                storage=storage,
+                dtype=dtype,
+                transient=as_transient,
+            )
+
+        if update_var_mapping:
+            self.add_jax_name_mapping(jax_var=arg, sdfg_name=arg_name)
+
+        return arg_name
+
+    def create_jax_var_list(
+        self,
+        jax_var_list: Sequence[jcore.Atom | jutil.JaCeVar],
+        prevent_creation: bool = False,
+        only_creation: bool = False,
+        **kwargs: Any,
+    ) -> list[None | str]:
+        """Creates SDFG variables for the listed Jax variables and returns their SDFG names.
+
+        Before the function will create a variable, by using `add_array()` with
+        `update_var_mapping=True`, it will check if the variable is known and if
+        so no new variable is created. Instead the name of the previously created
+        variable is added to the list. In case the Jax Atom denotes a Jax Literal,
+        no variable will be created, instead `None` will be added to the list.
+
+        Args:
+            jax_var_list:       The list of Jax variables that should be transformed to SDFG names.
+            prevent_creation:   Never create a variable, indicates that all variables must exists.
+            only_creation:      Variables must be generated, generate an error instead of using it.
+            kwargs:             Will be forwarded to `self.add_array()` if a variable as to be created.
+
+        Notes:
+            If `only_creation` is set, then literals will cause an error.
+            It is an error to pass the `update_var_mapping` argument.
+        """
+        assert self._jax_name_map is not None
+        if only_creation and prevent_creation:
+            raise ValueError("Specified both 'only_creation' and 'prevent_creation'.")
+
+        ret_list: list[None | str] = []
+        for jax_var in jax_var_list:
+            if isinstance(jax_var, jcore.Literal):
+                if only_creation:
+                    raise ValueError(f"Requested 'only_creation', but '{jax_var}' is a 'Literal'.")
+                ret_list.append(None)
+            elif isinstance(jax_var, (jcore.Var, jutil.JaCeVar)):
+                mapped_sdfg_name: str | None = self.map_jax_var_to_sdfg(jax_var, allow_fail=True)
+                if (mapped_sdfg_name is None) and prevent_creation:
+                    raise ValueError(f"prevent_creation' given but have to create '{jax_var}'.")
+                if mapped_sdfg_name is None:
+                    ret_list.append(self.add_array(arg=jax_var, update_var_mapping=True, **kwargs))
+                elif only_creation:
+                    raise ValueError(f"'only_creation' given '{jax_var}' already exists.")
+                else:
+                    ret_list.append(mapped_sdfg_name)
+            else:
+                raise TypeError(f"Does not know how to handle '{type(jax_var).__name__}'")
+        return ret_list
+
+    def _create_initial_input(
+        self,
+        jaxpr: jcore.ClosedJaxpr,
+        inp_scalar_as_array: bool,
+    ) -> Sequence[str]:
+        """This function will create the internal input variables that are used for the SDFG.
+
+        Args:
+            jaxpr:                  The Jaxpr that we want to translate.
+            inp_scalar_as_array:    Promote scalars to arrays of size one.
+
+        Returns:
+            The list of SDFG variables used as input arguments of `jaxpr` in the same order.
+
+        Notes:
+            This function will fill the internal list of inputs.
+        """
+        assert self.is_allocated()
+        assert len(jaxpr.jaxpr.invars)
+
+        if len(self._sdfg_in_names) != 0:
+            raise RuntimeError("Called '_create_initial_input()' twice?")
+        assert len(self._sdfg_out_names) == 0
+
+        # Handle the initial input arguments
+        sdfg: dace.SDFG = self._sdfg
+        init_in_var_names: Sequence[str] = self.create_jax_var_list(  # type: ignore[assignment]
+            jax_var_list=jaxpr.jaxpr.invars,
+            only_creation=True,
+            as_transient=True,  # Explicit transient; no error!
+            force_array=inp_scalar_as_array,
+            force_jax_name=self.is_head_translator(),  # Ensure head get pure Jax names.
+        )
+        sdfg.arg_names.extend(init_in_var_names)
+
+        # Store the list of inputs in self; this is done to simplify exporting.
+        #  The output list is populated by `self._translate_jaxpr_internal()`
+        self._sdfg_in_names = tuple(init_in_var_names)
+
+        return init_in_var_names
+
+    def _create_constants(
+        self,
+        jaxpr: jcore.ClosedJaxpr,
+    ) -> Sequence[str]:
+        """Creates all constants requested by the `jaxpr`.
+
+        The function will create an SDFG variable and add them as constant to the SDFG.
+        The value they should have is deepcopied.
+
+        Returns:
+            Names of the SDFG variables created for the constants in the same order.
+        """
+        from copy import deepcopy
+
+        assert self.is_allocated()
+        if not len(jaxpr.consts):
+            return []
+
+        const_names: list[str] = []
+        for cJaxVar, cValue in zip(jaxpr.jaxpr.constvars, jaxpr.consts, strict=False):
+            c_sdfg_name = self.add_array(
+                arg=cJaxVar,
+                name_prefix="__const_",
+                as_transient=True,
+                symb_strides=False,
+                strides=None,
+                update_var_mapping=True,
+            )
+            # We have to pass the data descriptor to `add_constant()`, otherwise a new one would be created.
+            self._sdfg.add_constant(c_sdfg_name, deepcopy(cValue), self._sdfg.arrays[c_sdfg_name])
+            const_names.append(c_sdfg_name)
+        return const_names
+
+    def _allocate_translation_ctx(
+        self,
+        name: str | None = None,
+        reserved_names: str | Collection[str] | None = None,
+    ) -> JaxprTranslationDriver:
+        """This function allocates and initialize the members of the translation context of `self`.
+
+        After this function is called, `self` is said to have an ongoing translation process.
+
+        Args:
+            name:               The name of the SDFG.
+            reserved_names:     Add these name to the set of resered names of `self`.
+        """
+        if self.is_allocated():
+            raise RuntimeError("The translator is already allocated.")
+        if name and (not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", name)):
+            raise ValueError(f"The provided name '{name}' for the SDFG is invalid.")
+
+        self._sdfg = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
+        self._init_sdfg_state = self._sdfg.add_state(label="initial_state", is_start_block=True)
+        self._term_sdfg_state = self._init_sdfg_state
+        self._jax_name_map = {}
+        self._sdfg_in_names = ()
+        self._sdfg_out_names = ()
+
+        # If the reserved names are already allocated then keep them.
+        #  This is needed to preserve them among forks.
+        if self._reserved_names is None:
+            self._reserved_names = set()  # type: ignore[unreachable]
+        elif not isinstance(self._reserved_names, set):
+            raise RuntimeError("The reserved names are allocated incorrectly.")
+        return self.add_reserved_names(reserved_names)
+
+    def _init_sub_translators(
+        self,
+        kwargs: Mapping[str, Any],
+    ) -> JaxprTranslationDriver:
+        """This function initializes the subtranslator.
+
+        The function forwards `kwargs` to the constructor of the subtranslators.
+        However, it will remove all arguments starting with an underscore.
+        """
+        if isinstance(self._sub_translators, dict):
+            raise RuntimeError("Tried to allocate the internal subtranslators twice.")
+        assert self._sub_translators is None  # type: ignore[unreachable]
+
+        kwargs = {k: v for k, v in kwargs.items() if not k.startswith("_")}
+
+        # First we will create all subtranslators and partition them.
+        subtranslators: dict[str, list[jtrans.JaCeSubTranslatorInterface]] = {}
+        for subtranslator_cls in jtsubt._get_subtranslators_cls():
+            subtranslator: jtrans.JaCeSubTranslatorInterface = subtranslator_cls(**kwargs)
+            handled_primitives: Iterable[str] = jutil.ensure_iterability(
+                subtranslator.get_handled_primitives()
+            )
+
+            # Now add the subtranslator to the primitives it requests, we will sort them later into the correct order.
+            for handled_primitive in handled_primitives:
+                subtranslators.setdefault(handled_primitive, []).append(subtranslator)
+
+        # Now we order the subtranslators for the primitives.
+        self._sub_translators = {
+            prim_name: jtrutil.sort_subtranslators(primSubTranslators)
+            for prim_name, primSubTranslators in subtranslators.items()
+        }
+        return self
+
+    def _clear_translation_ctx(self) -> JaxprTranslationDriver:
+        """This function deallocate the translation context of `self`.
+
+        Notes:
+            While it is allowed for outside code to call this explicitly function,
+                it is is most likely an error.
+            If this function is called on a head translator, then the translation
+                process ends. This implies that all direct and indirect children,
+                i.e. output of `self.fork()` must already be deallocated. A further
+                side effect is that now revision indexes might be reused.
+            If `self` is not allocated this function acts as a noops.
+            The reserved names are only deallocated if `self` is a head translator.
+        """
+        if not self.is_allocated():
+            return self
+        self._sdfg = None
+        self._init_sdfg_state = None
+        self._term_sdfg_state = None
+        self._jax_name_map = None  # type: ignore[assignment]
+        self._sdfg_in_names = None  # type: ignore[assignment]
+        self._sdfg_out_names = None  # type: ignore[assignment]
+
+        if self.is_head_translator():
+            # We are the head translator thus we reset the revision manager.
+            #  Since this function is only called at the very end, we know that the translation
+            #  process as a whole has finished. We reset the state that the numbers are small
+            #  again when we start anew.
+            self._rev_manager._reset_state()
+
+            # Freeing the reserved names only for heads make it more safe in case a child
+            #  translator is reused.c On the other hand reusing a child translator is
+            #  discouraged, but not forbidden.
+            self._reserved_names = None  # type: ignore[assignment]
+        return self
+
+    def _find_sub_translator_for(
+        self,
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jcore.JaxprEqn,
+    ) -> jtrans.JaCeSubTranslatorInterface:
+        """Returns the appropriate subtranslator for equation `eqn`.
+
+        The subtranslators are checked for applicability in the order of their priority.
+        The fist one that accepts the translation will be taken.
+
+        Notes:
+            The arguments are the same as for `JaCeSubTranslatorInterface.can_translate_jaxeqn()`.
+        """
+        assert self._sub_translators is not None
+
+        prim_name: str = eqn.primitive.name
+        if prim_name not in self._sub_translators:
+            raise NotImplementedError(f"No subtranslators known to handle '{prim_name}'.")
+        subtranslator_canidates = self._sub_translators[prim_name]
+        assert len(subtranslator_canidates) > 0
+
+        subtranslator: jtrans.JaCeSubTranslatorInterface = None  # type: ignore[assignment]
+        if len(subtranslator_canidates) == 1:
+            subtranslator = next(iter(subtranslator_canidates))
+            assert subtranslator.can_translate_jaxeqn(
+                in_var_names=in_var_names, out_var_names=out_var_names, driver=self, eqn=eqn
+            )
+        else:
+            for subtranslatorCanidate in subtranslator_canidates:
+                if subtranslatorCanidate.can_translate_jaxeqn(
+                    driver=self, in_var_names=in_var_names, out_var_names=out_var_names, eqn=eqn
+                ):
+                    subtranslator = subtranslatorCanidate
+            else:
+                raise NotImplementedError(f"No subtranslator found for handling '{eqn}'.")
+        return subtranslator
+
+    def _translate_single_eqn(
+        self,
+        jaxpr: jcore.ClosedJaxpr,
+        eqn: jcore.JaxprEqn,
+    ) -> tuple[Sequence[str | None], Sequence[str]]:
+        """Translate `eqn` into its SDFG equivalent.
+
+        To do this the function will do the following steps:
+        - Assemble the in and output variables.
+        - Select the appropriate subtranslator to use.
+        - Create a new empty state terminal state.
+        - Call the subtranslator to perform the translation inside the new state.
+
+        Returns:
+            The SDFG names that were used as input and output are returned.
+            The inputs might contain `None` which indicates that that input was a Jax Literal.
+            For more information see `JaCeSubTranslatorInterface.can_translate_jaxeqn()`.
+
+        Notes:
+            While `jaxpr` must be a `ClosedJaxpr`, `eqn` must come from the unclosed instance.
+            The function will perform some consistency checking after the subtranslator was called.
+        """
+        assert isinstance(eqn, jcore.JaxprEqn)
+        assert isinstance(jaxpr, jcore.ClosedJaxpr)
+
+        if len(eqn.effects) != 0:
+            raise NotImplementedError(f"Equation '{eqn}' has side effects.")
+
+        # Input/Output variables
+        #  Using a tuple for the input ensures that it is not modified.
+        in_var_names: Sequence[str | None] = tuple(
+            self.create_jax_var_list(
+                eqn.invars,
+                prevent_creation=True,  # Inputs must already exists.
+            )
+        )
+        out_var_names: Sequence[str] = self.create_jax_var_list(  # type: ignore[assignment]
+            eqn.outvars,
+            only_creation=True,  # Output must not exist yet.
+        )
+
+        # Find the subtranslator
+        subtranslator: jtrans.JaCeSubTranslatorInterface = self._find_sub_translator_for(
+            in_var_names=in_var_names,
+            out_var_names=out_var_names,
+            eqn=eqn,
+        )
+
+        # Create the state into which the equation should be translated
+        last_term_state: dace.SDFGState = self.get_terminal_sdfg_state()  # noqa: F841 # Will be used later
+        eqn_state = self.append_new_state(
+            label=f"{eqn.primitive.name}_{out_var_names[0]}",
+            prev_state=None,
+        )
+
+        # Now perform the actual translation of the equation.
+        new_sdfg_term_state = subtranslator.translate_jaxeqn(
+            driver=self,
+            in_var_names=in_var_names,
+            out_var_names=out_var_names,  # Might be modified by subtranslator!
+            eqn=eqn,
+            eqn_state=eqn_state,
+        )
+
+        # Determine the new (tentative) terminal state of the SDFG we are building.
+        if new_sdfg_term_state is None:
+            if eqn_state is not self._term_sdfg_state:
+                raise RuntimeError("Inconsistent terminal state was detected.")
+            new_sdfg_term_state = eqn_state
+        elif isinstance(new_sdfg_term_state, dace.SDFGState):
+            # TODO(phimuell): use `last_term_state` to test if `new_sdfg_term_state` is reachable.
+            pass
+        else:
+            raise TypeError(f"Encountered illegal types '{type(new_sdfg_term_state)}'")
+
+        # In case a subtranslator decided to not use the variables we created for it, which is allowed
+        #  but he must update the `out_var_names` list correctly, we will now verify this.
+        if len(out_var_names) != len(eqn.outvars):
+            raise RuntimeError(
+                f"Modified 'out_var_names'! Expected {len(eqn.outvars)} variables."
+                f" but found {len(out_var_names)}"
+            )
+        for expectedSDFGName, jax_var in zip(out_var_names, eqn.outvars, strict=True):
+            mapped_sdfg_name = self.map_jax_var_to_sdfg(jax_var)
+            jax_name = jutil.get_jax_var_name(jax_var)
+            if mapped_sdfg_name != expectedSDFGName:
+                raise ValueError(
+                    f"Mapping inconsistency detected, expected that Jax variable"
+                    f" '{jax_name}' maps to '{expectedSDFGName}' but it actually"
+                    f" maps to '{mapped_sdfg_name}'."
+                )
+
+        # Views can only be used if there is a direct connection, between source,
+        #  view and destination (place of usage). Because of the way how Jax works,
+        #  it is impossible that an output variable is a View.
+        for outVarName, jax_var in zip(out_var_names, eqn.outvars, strict=True):
+            sdfg_var = self.get_array(outVarName)
+            if isinstance(sdfg_var, (dace.data.Array, dace.data.Scalar)):
+                pass
+            elif isinstance(sdfg_var, dace.data.View):
+                raise TypeError(
+                    f"For Jax variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}'),"
+                    f" which is an output, you used a View, which is not possible."
+                    " It must either be an array or a scalar."
+                )
+            else:
+                raise NotImplementedError(
+                    f"Output variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}')"
+                    f" is of type '{type(sdfg_var).__name__}' which I does not know how to handle."
+                )
+
+        # Modify terminal head state of 'self'
+        self._term_sdfg_state = new_sdfg_term_state
+
+        return (in_var_names, out_var_names)
+
+    def _translate_jaxpr_internal(
+        self,
+        jaxpr: jcore.ClosedJaxpr,
+    ) -> jtrutil.JaCeTranslationMemento:
+        """Performs the actual translation of the Jaxpr into an SDFG.
+
+        The function assumes that the context is already allocated and the initial
+        input variables were already created. The function will store the internal
+        state of `self` into a memento and return it.
+        However, it will not deallocate the translation context, thus `self`
+        and the memento share the same context in memory.
+
+        Args:
+            jaxpr:      The Jaxpr to translate.
+
+        Notes:
+            The function will unconditionally handle empty Jaxpr.
+            Jax uses a variable with name `_` to indicate that this value is never read,
+                this is used by Jax to indicate that they are never read.
+                Such variables are included by some transformations such as `grad()`.
+        """
+        assert isinstance(jaxpr, jcore.ClosedJaxpr)
+        assert self.is_allocated()
+
+        nb_translated_eqn: int = 0
+        out_var_names: Sequence[str] = []
+        for eqn in jaxpr.jaxpr.eqns:  # Translate the equations one by one.
+            assert len(eqn.effects) == 0
+            if len(eqn.outvars) == 0:  # Do we need this special case.
+                continue  #  Looks more like internal Jax error.
+            if any(jutil.get_jax_var_name(outVar) == "_" for outVar in eqn.outvars):
+                assert (len(eqn.outvars) == 1) or all(
+                    jutil.get_jax_var_name(outVar) == "_" for outVar in eqn.outvars
+                )
+                continue
+            _, out_var_names = self._translate_single_eqn(jaxpr=jaxpr, eqn=eqn)
+            nb_translated_eqn += 1
+
+        if nb_translated_eqn == 0:
+            # There were no equation, so handle the copying of input to output.
+            out_var_names = self._handle_null_jaxpr(jaxpr)
+        self._sdfg_out_names = tuple(out_var_names)
+
+        return self._export_memento()
+
+    def _export_memento(self) -> jtrutil.JaCeTranslationMemento:
+        """Encapsulate the translation context of `self` into a memento.
+
+        This function will not deallocate the internal context of `self`.
+        Thus the memento and `self` share the same context in memory.
+        """
+        assert self.is_allocated()
+        assert all((isinstance(x, str) and (len(x) > 0)) for x in self._sdfg_in_names)
+        assert all((isinstance(x, str) and (len(x) > 0)) for x in self._sdfg_out_names)
+
+        return jtrutil.JaCeTranslationMemento(
+            sdfg=self._sdfg,
+            start_state=self._init_sdfg_state,
+            terminal_state=self._term_sdfg_state,
+            jax_name_map=self._jax_name_map,
+            inp_names=self._sdfg_in_names,
+            out_names=self._sdfg_out_names,
+        )
+
+    def _handle_null_jaxpr(
+        self,
+        jaxpr: jcore.ClosedJaxpr,
+    ) -> Sequence[str]:
+        """This function is called in case a `Jaxpr` with zero equations is encountered.
+
+        A function with zero equation might still have output, in which case an
+        input is copied to an output. This function will handle the copying from
+        the input into the corresponding output variable.
+
+        Returns:
+            The function returns a list denoting the SDFG variables that refers to the output.
+            The order of the list is the same as in `jaxpr.jaxpr.outvars`.
+        """
+        if len(jaxpr.eqns) != 0:
+            raise NotImplementedError("'_handle_null_jaxpr()' was called for a non empty Jaxpr.")
+        if len(jaxpr.out_avals) == 0:
+            # There is not output so we do not have to copy anything around.
+            return ()
+        assert self._term_sdfg_state is self._init_sdfg_state
+        assert len(self._sdfg_in_names) > 0
+        assert len(self._sdfg_out_names) == 0
+
+        # We will use this list to build the list of output names.
+        #  This is important for the exporter.
+        out_var_names: list[str] = []
+
+        # If we are here then we are dealing with a nested SDFG/Jaxpr.
+        #  Because an input also serves as output, the nested SDFG will have connector pairs
+        #  with the same name, one serving as input the other as output, with the same name.
+        #  This will make node validation fail.
+        #  Thus we have to introduce a some fake output name and explicitly copy the data around.
+        #  Once DaCe will inline the nested SDFG it will remove this intermediate copy.
+        for jax_out_var in jaxpr.jaxpr.outvars:
+            jax_inp_name = jutil.get_jax_var_name(
+                jax_out_var
+            )  # Since output == input their names must be the same.
+            assert self.map_jax_var_to_sdfg(jax_inp_name, allow_fail=True)
+
+            # This is the name we give to fictive Jax variable serving as output.
+            jax_out_name = f"_zero_equation_output_{self.map_jax_var_to_sdfg(jax_out_var)}"
+
+            # Now create the SDFG variable for it, give it a unique name.
+            sdfg_out_name = self.add_array(
+                jax_out_var,
+                as_transient=True,
+                name_prefix="_zero_equation_output_for_",
+                update_var_mapping=False,
+            )
+
+            # We now create a new mapping, we do this that we will later find the variable again.
+            self.add_jax_name_mapping(jax_var=jax_out_name, sdfg_name=sdfg_out_name)
+            out_var_names.append(jax_out_name)
+
+            # Now copy the input into the fake output variable.
+            inp_acc = self._init_sdfg_state.add_read(self.map_jax_var_to_sdfg(jax_inp_name))
+            out_acc = self._init_sdfg_state.add_write(self.map_jax_var_to_sdfg(jax_out_var))
+            self._init_sdfg_state.add_nedge(
+                src=inp_acc,
+                dst=out_acc,
+                data=dace.Memlet.from_array(
+                    jax_inp_name, self.get_array(self.map_jax_var_to_sdfg(jax_inp_name))
+                ),
+            )
+        return tuple(out_var_names)
+
+    # fmt: off
+    _forbidden_names: Final[set[str]] = {
+        # These should be most of the C++ keywords, it is more important to have the short ones.
+        #  Taken from 'https://learn.microsoft.com/en-us/cpp/cpp/keywords-cpp?view=msvc-170'
+        'alignas', 'alignof', 'and', 'asm', 'auto', 'bitand', 'bitor', 'bool', 'break', 'case',
+        'catch', 'char', 'class', 'compl', 'concept', 'const', 'consteval', 'constexpr',
+        'constinit', 'continue', 'decltype', 'default', 'delete', 'directive', 'do', 'double',
+        'else', 'enum', 'explicit', 'export', 'extern', 'false', 'float', 'for', 'friend',
+        'goto', 'if', 'inline', 'int', 'long', 'mutable', 'namespace', 'new', 'noexcept', 'not',
+        'nullptr', 'operator', 'or', 'private', 'protected', 'public', 'register', 'requires',
+        'return', 'short', 'signed', 'sizeof', 'static', 'struct', 'switch', 'template', 'this',
+        'throw', 'true', 'try', 'typedef', 'typeid', 'typename', 'union', 'unsigned', 'using',
+        'virtual', 'void', 'volatile', 'while', 'xor', 'std',
+    }
+    # fmt: on

From 522a239614ba30b157566649751fc0371298a93e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 23 Apr 2024 11:06:46 +0200
Subject: [PATCH 038/458] Removed the possibility to register multiple
 translator for teh same primitive.

---
 .../jace_subtranslator_interface.py           | 160 +-----------------
 .../translator/jaxpr_translator_driver.py     |  74 ++------
 .../translator/sub_translators/__init__.py    |   6 +-
 src/jace/translator/util/__init__.py          |   2 -
 .../util/subtranslator_helper_order.py        |  80 ---------
 tests/test_subtranslator_helper.py            | 133 ---------------
 6 files changed, 26 insertions(+), 429 deletions(-)
 delete mode 100644 src/jace/translator/util/subtranslator_helper_order.py

diff --git a/src/jace/translator/jace_subtranslator_interface.py b/src/jace/translator/jace_subtranslator_interface.py
index 0178755..5f58375 100644
--- a/src/jace/translator/jace_subtranslator_interface.py
+++ b/src/jace/translator/jace_subtranslator_interface.py
@@ -8,7 +8,7 @@
 from __future__ import annotations
 
 from collections.abc import Collection, Sequence
-from typing import TYPE_CHECKING, Any, Final, final
+from typing import TYPE_CHECKING, Any
 
 import dace
 from jax import core as jcore
@@ -36,40 +36,13 @@ class JaCeSubTranslatorInterface:
     In the end this implements the delegation pattern.
 
     A subtranslator uses its `get_handled_primitives()` function to indicate
-    for which Jax primitives it want to register. It is important that a
-    subtranslator can register for as many primitive it wants. At the same
-    time, it is possible that multiple subtranslators have registered for a
-    single primitive.
-
-    If multiple subtranslator have registered for the same primitive they
-    will be ordered by driver. There are two ways how a subtranslator can
-    influence this order. The first one is by implementing `get_priority()`,
-    the driver will then put them in ascending order.
-    I.e. the lower its priority the earlier a subtranslator is checked.
-    However, if a subtranslator returns the special value
-    `JaCeSubTranslatorInterface.DEFAULT_PRIORITY` it will be always put at the
-    end, in unspecific order if multiple translator are involved.
-
-    The second possibility is to override the '__lt__()' function,
-    and establish a strict weak order. If a subtranslator overrides this
-    function it should also override `get_priority()` to return `NotImplemented`.
-
-    To decide which subtranslator should be used for a specific equation
-    the driver will use their 'can_translate_jaxeqn()' function.
-    The first subtranslator that returns 'True' will then be used.
-
-    Todo:
-        Also come up with a way how to avoid that instances are allowed to access
-            some private members of the driver; Possibly by composition.
-        Come up with a better way of ordering; maybe introduce fixed priority level.
-            And then allows to sort them according to `__lt__()` within the level.
+    for which Jax primitives it want to register. It is important that there
+    is no limits on the number of primitives a subtranslator can register itself.
+    However, only one subtranslator can be registered for a primitive.
     """
 
     __slots__ = ()
 
-    # Default value for the priority of primitive translators.
-    DEFAULT_PRIORITY: Final = int("1" * 64, base=2)
-
     def __init__(
         self,
         *args: Any,
@@ -84,11 +57,7 @@ def get_handled_primitives(self) -> Collection[str] | str:
         """Returns the names of all Jax primitives that `self` is able to handle.
 
         There is no limit on the number of primitives for which a subtranslator
-        can register. It is possible that several translators can be registered
-        for the same name.
-
-        See Also:
-            `self.can_translate_jaxeqn()` and `self.get_priority()`.
+        can register.
 
         Notes:
             In case a string is returned it is interpreted as 1 element collection.
@@ -97,35 +66,6 @@ def get_handled_primitives(self) -> Collection[str] | str:
             "Class '{type(self).__name__}' does not implement 'get_handled_primitives()'."
         )
 
-    def can_translate_jaxeqn(
-        self,
-        driver: JaxprTranslationDriver,
-        in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
-        eqn: jcore.JaxprEqn,
-    ) -> bool:
-        """Tests if `self` is able to translate the Jax primitive passed as `eqn`.
-
-        This function is used by the driver to determine which of the subtranslators,
-        that have registered for a certain type of primitive, should be used.
-        For a more detailed description of the arguments see
-        `self.translate_jaxeqn()` function.
-
-        Args:
-            driver:         The driver object of the translation.
-            in_var_names:   Names of the SDFG variables used as inputs for the primitive.
-            out_var_names:  Names of the SDFG variables used as outputs for the primitive.
-            eqn:            The `jcore.JaxprEqn` instance that is currently being handled.
-
-        Notes:
-            In case there is only one subtranslator registered for a certain primitive,
-                it is unspecific if this function will be called at all `self.translate_jaxeqn()`.
-            This function will never be called for a primitive for which it has not registered itself.
-        """
-        raise NotImplementedError(
-            "Class '{type(self).__name__}' does not implement 'can_translate_jaxeqn()'."
-        )
-
     def translate_jaxeqn(
         self,
         driver: JaxprTranslationDriver,
@@ -152,7 +92,7 @@ def translate_jaxeqn(
             `translator.get_terminal_sdfg_state() is eqn_state` holds.
 
         Then the subtranslator is called. Usually a subtranslator should
-        construct the dataflow graph inside it. It is allowed that the
+        construct the dataflow graph inside `eqn_state`. It is allowed that the
         subtranslators creates more states if needed, but this state machine
         has to have a single terminal state, which must be returned
         and reachable from `eqn_state`.
@@ -185,55 +125,6 @@ def translate_jaxeqn(
             "Class '{type(self).__name__}' does not implement 'translate_jaxeqn()'."
         )
 
-    def get_priority(self) -> int:
-        """Returns the priority of this translator.
-
-        The value returned by this function is used by the driver to order the
-        subtranslators that have registered for the same primitive.
-        The _smaller_ the value the earlier it is checked.
-
-        See Also:
-            `self.can_translate_jaxeqn()` and `self.get_handled_primitives()`.
-
-        Notes:
-            By default the function returns `self.DEFAULT_PRIORITY`, which is
-                handled specially, i.e. it is put at the end.
-            If a subtranslator instead overrides `__lt__()` this function
-                should return `NotImplemented`.
-        """
-        return self.DEFAULT_PRIORITY
-
-    def has_default_priority(self) -> bool:
-        """Checks if `self` has default priority.
-
-        Notes:
-            It is allowed, but not advised to override this function.
-                However, it has to be consistent with `self.get_priority()`.
-        """
-        try:
-            x = self.get_priority()
-        except NotImplementedError:
-            return False
-        if x is NotImplemented:
-            return False
-        return x == self.DEFAULT_PRIORITY
-
-    def __lt__(
-        self,
-        other: JaCeSubTranslatorInterface,
-    ) -> bool:
-        """Tests if `self` should be checked before `other` in the selection process.
-
-        As outlined in the class description this is the second possibility to
-        influence the order of the subtranslator. This function should return
-        `True` if `self` should be checked for applicability _before_ `other`.
-
-        Notes:
-            If this function is overridden `get_priority()` should return `NotImplemented`.
-            This function is never called if either `self` or `other` have default priority.
-        """
-        return self.get_priority() < other.get_priority()
-
     def __eq__(
         self,
         other: Any,
@@ -241,12 +132,7 @@ def __eq__(
         """Tests if two subtranslators are equal.
 
         The default implementation checks if `self` and `other` have the same
-        type. However, if the behaviour of a subtranslator strongly depend on
-        its configuration this function should be overridden.
-
-        Notes:
-            If you override this function you should also override
-                `self.__hash__()` to make the two consistent.
+        type.
         """
         if not isinstance(other, JaCeSubTranslatorInterface):
             return NotImplemented
@@ -258,37 +144,5 @@ def __hash__(self) -> int:
         The default implementation return a hash that is based on the class.
         Thus all instances of a particular subtranslator will have the same
         hash value.
-
-        Notes:
-            If you override this function you should also override
-                `self.__eq__()` to make the two consistent.
         """
         return id(self.__class__)
-
-    @final
-    def __ne__(
-        self,
-        other: Any,
-    ) -> bool:
-        return NotImplemented
-
-    @final
-    def __le__(
-        self,
-        other: Any,
-    ) -> bool:
-        return NotImplemented
-
-    @final
-    def __ge__(
-        self,
-        other: Any,
-    ) -> bool:
-        return NotImplemented
-
-    @final
-    def __gt__(
-        self,
-        other: Any,
-    ) -> bool:
-        return NotImplemented
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 2c2c807..7be5636 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -102,10 +102,9 @@ def __init__(
 
         # Contains all the subtranslators that we need.
         #  They are partitioned by the names of the primitive they have registered for.
-        #  Inside a partition they are ordered by priority, lowest first, more important.
         #  This member is allocated by '_init_sub_translators()' and remains allocated
         #  during the lifetime of the object.
-        self._sub_translators: dict[str, list[jtrans.JaCeSubTranslatorInterface]] = None  # type: ignore[assignment]
+        self._sub_translators: dict[str, jtrans.JaCeSubTranslatorInterface] = None  # type: ignore[assignment]
 
         # The SDFG object that we are currently constructing.
         #  Only allocated during an ongoing translation.
@@ -923,36 +922,29 @@ def _allocate_translation_ctx(
 
     def _init_sub_translators(
         self,
-        kwargs: Mapping[str, Any],
+        subtrans_args: Mapping[str, Any],
     ) -> JaxprTranslationDriver:
         """This function initializes the subtranslator.
 
         The function forwards `kwargs` to the constructor of the subtranslators.
         However, it will remove all arguments starting with an underscore.
         """
-        if isinstance(self._sub_translators, dict):
-            raise RuntimeError("Tried to allocate the internal subtranslators twice.")
-        assert self._sub_translators is None  # type: ignore[unreachable]
+        assert self._sub_translators is None
 
-        kwargs = {k: v for k, v in kwargs.items() if not k.startswith("_")}
+        subtrans_args = {k: v for k, v in subtrans_args.items() if not k.startswith("_")}  # type: ignore[unreachable]
 
-        # First we will create all subtranslators and partition them.
-        subtranslators: dict[str, list[jtrans.JaCeSubTranslatorInterface]] = {}
-        for subtranslator_cls in jtsubt._get_subtranslators_cls():
-            subtranslator: jtrans.JaCeSubTranslatorInterface = subtranslator_cls(**kwargs)
+        sub_translators: dict[str, jtrans.JaCeSubTranslatorInterface] = {}
+        for sub_translator_cls in jtsubt._get_subtranslators_cls():
+            sub_translator: jtrans.JaCeSubTranslatorInterface = sub_translator_cls(**subtrans_args)
             handled_primitives: Iterable[str] = jutil.ensure_iterability(
-                subtranslator.get_handled_primitives()
+                sub_translator.get_handled_primitives()
             )
-
-            # Now add the subtranslator to the primitives it requests, we will sort them later into the correct order.
             for handled_primitive in handled_primitives:
-                subtranslators.setdefault(handled_primitive, []).append(subtranslator)
+                if handled_primitive in sub_translators:
+                    raise RuntimeError(f"Multiple sub_translators for '{handled_primitive}' found.")
+                sub_translators[handled_primitive] = sub_translator
+        self._sub_translators = sub_translators
 
-        # Now we order the subtranslators for the primitives.
-        self._sub_translators = {
-            prim_name: jtrutil.sort_subtranslators(primSubTranslators)
-            for prim_name, primSubTranslators in subtranslators.items()
-        }
         return self
 
     def _clear_translation_ctx(self) -> JaxprTranslationDriver:
@@ -992,41 +984,16 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
 
     def _find_sub_translator_for(
         self,
-        in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
         eqn: jcore.JaxprEqn,
     ) -> jtrans.JaCeSubTranslatorInterface:
-        """Returns the appropriate subtranslator for equation `eqn`.
-
-        The subtranslators are checked for applicability in the order of their priority.
-        The fist one that accepts the translation will be taken.
-
-        Notes:
-            The arguments are the same as for `JaCeSubTranslatorInterface.can_translate_jaxeqn()`.
-        """
+        """Returns the appropriate subtranslator for equation `eqn`."""
         assert self._sub_translators is not None
 
         prim_name: str = eqn.primitive.name
         if prim_name not in self._sub_translators:
             raise NotImplementedError(f"No subtranslators known to handle '{prim_name}'.")
-        subtranslator_canidates = self._sub_translators[prim_name]
-        assert len(subtranslator_canidates) > 0
-
-        subtranslator: jtrans.JaCeSubTranslatorInterface = None  # type: ignore[assignment]
-        if len(subtranslator_canidates) == 1:
-            subtranslator = next(iter(subtranslator_canidates))
-            assert subtranslator.can_translate_jaxeqn(
-                in_var_names=in_var_names, out_var_names=out_var_names, driver=self, eqn=eqn
-            )
-        else:
-            for subtranslatorCanidate in subtranslator_canidates:
-                if subtranslatorCanidate.can_translate_jaxeqn(
-                    driver=self, in_var_names=in_var_names, out_var_names=out_var_names, eqn=eqn
-                ):
-                    subtranslator = subtranslatorCanidate
-            else:
-                raise NotImplementedError(f"No subtranslator found for handling '{eqn}'.")
-        return subtranslator
+
+        return self._sub_translators[prim_name]
 
     def _translate_single_eqn(
         self,
@@ -1044,7 +1011,6 @@ def _translate_single_eqn(
         Returns:
             The SDFG names that were used as input and output are returned.
             The inputs might contain `None` which indicates that that input was a Jax Literal.
-            For more information see `JaCeSubTranslatorInterface.can_translate_jaxeqn()`.
 
         Notes:
             While `jaxpr` must be a `ClosedJaxpr`, `eqn` must come from the unclosed instance.
@@ -1070,24 +1036,20 @@ def _translate_single_eqn(
         )
 
         # Find the subtranslator
-        subtranslator: jtrans.JaCeSubTranslatorInterface = self._find_sub_translator_for(
-            in_var_names=in_var_names,
-            out_var_names=out_var_names,
-            eqn=eqn,
-        )
+        subtranslator: jtrans.JaCeSubTranslatorInterface = self._find_sub_translator_for(eqn)
 
         # Create the state into which the equation should be translated
         last_term_state: dace.SDFGState = self.get_terminal_sdfg_state()  # noqa: F841 # Will be used later
         eqn_state = self.append_new_state(
             label=f"{eqn.primitive.name}_{out_var_names[0]}",
-            prev_state=None,
+            prev_state=None,  # forces terminal state
         )
 
         # Now perform the actual translation of the equation.
         new_sdfg_term_state = subtranslator.translate_jaxeqn(
             driver=self,
             in_var_names=in_var_names,
-            out_var_names=out_var_names,  # Might be modified by subtranslator!
+            out_var_names=out_var_names,  # Might be modified by the subtranslator!
             eqn=eqn,
             eqn_state=eqn_state,
         )
diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
index f03144e..4a02ea2 100644
--- a/src/jace/translator/sub_translators/__init__.py
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -77,13 +77,9 @@ def _get_subtranslators_cls(
         If the externally defined subtranslators are requested they will be
             first and ordered as FILO order.
     """
-    # It is important that the externally defined are ordered before the builtins
-    #  and are ordered in FILO order, especuially if multiple subtranslator per
-    #  primitive are registered. Because this way they are inserted first
-    #  into the internal list of the driver, and furthermore since `sorted()`
-    #  is stable they will tend to end up more to the front.
     ret: list[type[jtrans.JaCeSubTranslatorInterface]] = []
     if with_external:
+        # Guarantees that we get them in FIFO order.
         ret.extend(reversed(_EXTERNAL_SUBTRANSLATORS.keys()))
     if builtins:
         ret.extend(_BUILTIN_SUBTRANSLATORS)
diff --git a/src/jace/translator/util/__init__.py b/src/jace/translator/util/__init__.py
index 38ce344..910589e 100644
--- a/src/jace/translator/util/__init__.py
+++ b/src/jace/translator/util/__init__.py
@@ -11,7 +11,6 @@
 
 from .jace_translation_memento import JaCeTranslationMemento
 from .revision_counter import RevisionCounterManager
-from .subtranslator_helper_order import sort_subtranslators
 from .util import list_to_dict
 
 
@@ -20,5 +19,4 @@
     "JaCeTranslationMemento",
     "RevisionCounterManager",
     "list_to_dict",
-    "sort_subtranslators",
 ]
diff --git a/src/jace/translator/util/subtranslator_helper_order.py b/src/jace/translator/util/subtranslator_helper_order.py
deleted file mode 100644
index 767521a..0000000
--- a/src/jace/translator/util/subtranslator_helper_order.py
+++ /dev/null
@@ -1,80 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-from __future__ import annotations
-
-from collections.abc import Sequence
-
-from jace import translator
-
-
-def sort_subtranslators(
-    subtranslators: Sequence[translator.JaCeSubTranslatorInterface],
-) -> Sequence[translator.JaCeSubTranslatorInterface]:
-    """Orders the subtranslators according to their priorities.
-
-    The function ensures the following:
-    - All subtranslators that have default priority are at the end.
-    - All subtranslators whose `get_priority()` returns `NotImplemented`
-        are at the begin of the list. These subtranslators are ordered according
-        to their `__lt__()` function.
-    - All subtranslators whose `get_priority()` function returns an integer are
-        in the middle, ordered according to this value.
-    """
-    if len(subtranslators) <= 1:
-        return subtranslators
-    subtranslators = sorted(subtranslators, key=_SubtranslatorOrderingHelper)
-    assert (len(subtranslators) <= 1) or all(
-        subtranslators[i - 1].has_default_priority() <= subtranslators[i].has_default_priority()
-        for i in range(1, len(subtranslators))
-    )
-    return subtranslators
-
-
-class _SubtranslatorOrderingHelper:
-    """Helper class used by `JaxprTranslationDriver` to bring the subtranslators in the correct order.
-
-    Essentially it is a wrapper that contains the additional logic that is
-    needed for sorting. This way subclasses does not need to implement it themselves.
-
-    Notes:
-        This class does not implement the other comparison function as requested by PEP8.
-    """
-
-    def __init__(self, subtranslator: translator.JaCeSubTranslatorInterface):
-        assert isinstance(subtranslator, translator.JaCeSubTranslatorInterface)
-        self._sub = subtranslator
-
-    def get(self) -> translator.JaCeSubTranslatorInterface:
-        return self._sub
-
-    def __lt__(
-        self,
-        other: _SubtranslatorOrderingHelper,
-    ) -> bool:
-        # Default priority means that it will always go to the end.
-        if self._sub.has_default_priority():
-            return False  # `self` has default priority, so it must go to the end.
-        if other._sub.has_default_priority():
-            return True  # `self` does not have default prio, thus it _must_ go before `other`.
-        prio_self = self._sub.get_priority()  # Get the priorities of the subtranslators.
-        prio_other = other._sub.get_priority()
-        if all(prio is NotImplemented for prio in (prio_self, prio_other)):
-            # None has a prio, `self` should decide if it should go first.
-            x = self._sub.__lt__(other._sub)
-            assert isinstance(x, bool)
-            return x
-        # In case only one has a priority, we change the order such that the one that implements
-        #  a `__lt__()` goes first.
-        if prio_self is NotImplemented:
-            assert isinstance(prio_other, int)
-            return True
-        if prio_other is NotImplemented:
-            assert isinstance(prio_self, int)
-            return False
-        assert all(isinstance(prio, int) for prio in (prio_other, prio_self))
-        return prio_self < prio_other
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 386786a..3af1038 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -17,137 +17,6 @@
 from jace import translator as jtrans
 
 
-def test_subtranslatior_order_simple():
-    """Tests if the ordering of subtranslators works correctly.
-
-    Simple version that only uses priorities.
-    """
-    from jace.translator.util.subtranslator_helper_order import sort_subtranslators
-
-    class SimpleSubTrans1(jtrans.JaCeSubTranslatorInterface):
-        _EXP_ORDER = 0
-
-        def __init__(self, *args, **kwargs):
-            super().__init__(*args, **kwargs)
-
-        def get_priority(self):
-            return 1
-
-    class SimpleSubTrans2(jtrans.JaCeSubTranslatorInterface):
-        _EXP_ORDER = 1  # Not last because, default prio is always last.
-
-        def __init__(self, *args, **kwargs):
-            super().__init__(*args, **kwargs)
-
-        def get_priority(self):
-            return jtrans.JaCeSubTranslatorInterface.DEFAULT_PRIORITY + 1
-
-    class SimpleSubTrans3(jtrans.JaCeSubTranslatorInterface):
-        _EXP_ORDER = 2
-
-        def __init__(self, *args, **kwargs):
-            super().__init__(*args, **kwargs)
-
-    initial_order = [
-        SimpleSubTrans3(),
-        SimpleSubTrans2(),
-        SimpleSubTrans1(),
-    ]
-
-    # Now call the function.
-    sorted_translators = sort_subtranslators(initial_order)
-
-    # Now we bring the list in expected order.
-    expected_order = sorted(initial_order, key=lambda st: st._EXP_ORDER)
-
-    assert all(
-        got_ord is exp_ord
-        for got_ord, exp_ord in zip(sorted_translators, expected_order, strict=False)
-    ), f"Expected order was `{[type(x).__name__  for x in expected_order]}`, but got `{[type(x).__name__  for x in sorted_translators]}`."
-    return True
-
-
-def test_subtranslatior_order_custom1():
-    """Tests if the ordering of subtranslators works correctly.
-
-    Interaction of priorities and custom `__lt__()`.
-    """
-    from jace.translator.util.subtranslator_helper_order import sort_subtranslators
-
-    class SimpleSubTrans1(jtrans.JaCeSubTranslatorInterface):
-        _EXP_ORDER = 0
-
-        def __init__(self, *args, **kwargs):
-            super().__init__(*args, **kwargs)
-
-        def get_priority(self):
-            return NotImplemented
-
-        def __lt__(self, other):
-            return isinstance(other, SimpleSubTrans2)
-
-    class SimpleSubTrans2(jtrans.JaCeSubTranslatorInterface):
-        _EXP_ORDER = 1
-
-        def __init__(self, *args, **kwargs):
-            super().__init__(*args, **kwargs)
-
-        def get_priority(self):
-            return NotImplemented
-
-        def __lt__(self, other):
-            return True
-
-    class SimpleSubTrans3(jtrans.JaCeSubTranslatorInterface):
-        _EXP_ORDER = 2
-
-        def __init__(self, *args, **kwargs):
-            super().__init__(*args, **kwargs)
-
-        def get_priority(self):
-            return NotImplemented
-
-        def __lt__(self, other):
-            return False
-
-    class SimpleSubTrans4(jtrans.JaCeSubTranslatorInterface):
-        _EXP_ORDER = 3
-
-        def __init__(self, *args, **kwargs):
-            super().__init__(*args, **kwargs)
-
-        def get_priority(self):
-            return jtrans.JaCeSubTranslatorInterface.DEFAULT_PRIORITY + 1
-
-    class SimpleSubTrans5(jtrans.JaCeSubTranslatorInterface):
-        _EXP_ORDER = 4
-
-        def __init__(self, *args, **kwargs):
-            super().__init__(*args, **kwargs)
-
-    assert SimpleSubTrans2() < SimpleSubTrans1()
-
-    initial_order = [
-        SimpleSubTrans5(),
-        SimpleSubTrans4(),
-        SimpleSubTrans3(),
-        SimpleSubTrans2(),
-        SimpleSubTrans1(),
-    ]
-
-    # Now call the function.
-    sorted_translators = sort_subtranslators(initial_order)
-
-    # Now we bring the list in expected order.
-    expected_order = sorted(initial_order, key=lambda st: st._EXP_ORDER)
-
-    assert all(
-        got_ord is exp_ord
-        for got_ord, exp_ord in zip(sorted_translators, expected_order, strict=False)
-    ), f"Expected order was `{[type(x).__name__  for x in expected_order]}`, but got `{[type(x).__name__  for x in sorted_translators]}`."
-    return True
-
-
 def test_subtranslatior_managing():
     """Ensures the functionality of the subtranslator managing."""
     from jace.translator.sub_translators import (
@@ -262,6 +131,4 @@ def __gt__(self, other: Any) -> bool:
 
 
 if __name__ == "__main__":
-    test_subtranslatior_order_simple()
-    test_subtranslatior_order_custom1()
     test_subtranslatior_managing()

From ee9d7b3c9230bb255043a04df867b3105de01d42 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 23 Apr 2024 11:16:35 +0200
Subject: [PATCH 039/458] Added some better functions to help with the Jax
 integration.

---
 src/jace/util/__init__.py |  6 +++-
 src/jace/util/jax.py      | 75 ++++++++++++++++++++++++++++++++++++++-
 2 files changed, 79 insertions(+), 2 deletions(-)

diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 80de0e3..0bd9a15 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -9,11 +9,15 @@
 
 from __future__ import annotations
 
-from .jax import get_jax_var_name
+from .jax import JaCeVar, get_jax_var_dtype, get_jax_var_name, get_jax_var_shape, translate_dtype
 from .util import ensure_iterability
 
 
 __all__ = [
     "get_jax_var_name",
+    "get_jax_var_shape",
+    "get_jax_var_dtype",
     "ensure_iterability",
+    "translate_dtype",
+    "JaCeVar",
 ]
diff --git a/src/jace/util/jax.py b/src/jace/util/jax.py
index 3a7ed06..755e6a3 100644
--- a/src/jace/util/jax.py
+++ b/src/jace/util/jax.py
@@ -13,10 +13,33 @@
 
 from __future__ import annotations
 
+from dataclasses import dataclass
+from typing import Any
+
+import dace
+import jax
 import jax.core as jcore
 
 
-def get_jax_var_name(jax_var: jcore.Atom | str) -> str:
+@dataclass(init=True, repr=True, eq=True, frozen=True, slots=True)
+class JaCeVar:
+    """Substitute class for Jax' `Var` instance.
+
+    This class is similar to a `jax.core.Var` class, but much simpler.
+    It is only a container for a name, shape and a datatype.
+    All extractor functions `get_jax_var{name, shape, dtype}()` will accept it,
+    as well as multiple functions of the driver.
+
+    Notes:
+        Main intention is to test functionality.
+    """
+
+    name: str
+    shape: tuple[int | dace.symbol | str, ...] | int | dace.symbol | str | tuple[()]
+    dtype: dace.typeclass
+
+
+def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
     """Returns the name of the Jax variable as a string.
 
     Args:
@@ -27,6 +50,8 @@ def get_jax_var_name(jax_var: jcore.Atom | str) -> str:
     """
     if isinstance(jax_var, jcore.DropVar):
         return "_"
+    if isinstance(jax_var, JaCeVar):
+        return jax_var.name
     if isinstance(jax_var, jcore.Atom):
         jax_name = str(jax_var)  # This only works up to some version
     elif isinstance(jax_var, str):
@@ -42,3 +67,51 @@ def get_jax_var_name(jax_var: jcore.Atom | str) -> str:
             f"Failed to translate the Jax variable '{jax_var}' into a name, the result was empty."
         )
     return jax_var
+
+
+def get_jax_var_shape(jax_var: jcore.Atom) -> tuple[int, ...]:
+    """Returns the shape of a Jax variable.
+
+    Args:
+        jax_var:     The variable to process
+    """
+    if isinstance(jax_var, jcore.Atom):
+        return jax_var.aval.shape
+    if isinstance(jax_var, JaCeVar):
+        assert isinstance(jax_var.shape, tuple)
+        return jax_var.shape
+    raise TypeError(f"'get_jax_var_shape()` is not implemented for '{type(jax_var)}'.")
+
+
+def get_jax_var_dtype(jax_var: jcore.Atom) -> dace.typeclass:
+    """Returns the DaCe equivalent of `jax_var`s datatype."""
+    if isinstance(jax_var, jcore.Atom):
+        return translate_dtype(jax_var.aval.dtype)
+    if isinstance(jax_var, JaCeVar):
+        return translate_dtype(jax_var.dtype)
+    raise TypeError(f"'get_jax_var_dtype()` is not implemented for '{type(jax_var)}'.")
+
+
+def translate_dtype(dtype: Any) -> dace.typeclass:
+    """Turns a Jax datatype into a DaCe datatype."""
+
+    if isinstance(dtype, dace.typeclass):
+        return dtype
+
+    # Make some basic checks if the datatype is okay
+    name_of_dtype = str(dtype)
+    if (not jax.config.read("jax_enable_x64")) and (name_of_dtype == "float64"):
+        raise ValueError("Found a 'float64' type but 'x64' support is disabled.")
+    if name_of_dtype.startswith("complex"):
+        raise NotImplementedError("Support for complecx computation is not implemented yet.")
+
+    # Now extract the datatype from dace, this is extremely ugly.
+    if not hasattr(dace.dtypes, name_of_dtype):
+        raise TypeError(f"Could not find '{name_of_dtype}' ({type(dtype).__name__}) in 'dace'.")
+    dcd_type = getattr(dace.dtypes, name_of_dtype)
+
+    if not isinstance(dcd_type, dace.dtypes.typeclass):
+        raise TypeError(
+            f"'{name_of_dtype}' does not map to a 'dace.typeclass' but to a '{type(dcd_type).__name__}'."
+        )
+    return dcd_type

From 54b55e1798014ea9c4fbe84ffe1105d847bd60d9 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 23 Apr 2024 11:17:05 +0200
Subject: [PATCH 040/458] Removed the functionality that would allow multiple
 translators for a single primitive.

---
 .../jace_subtranslator_interface.py           | 160 +-----------------
 .../translator/jaxpr_translator_driver.py     |  74 ++------
 .../util/subtranslator_helper_order.py        |  80 ---------
 3 files changed, 25 insertions(+), 289 deletions(-)
 delete mode 100644 src/jace/translator/util/subtranslator_helper_order.py

diff --git a/src/jace/translator/jace_subtranslator_interface.py b/src/jace/translator/jace_subtranslator_interface.py
index 0178755..5f58375 100644
--- a/src/jace/translator/jace_subtranslator_interface.py
+++ b/src/jace/translator/jace_subtranslator_interface.py
@@ -8,7 +8,7 @@
 from __future__ import annotations
 
 from collections.abc import Collection, Sequence
-from typing import TYPE_CHECKING, Any, Final, final
+from typing import TYPE_CHECKING, Any
 
 import dace
 from jax import core as jcore
@@ -36,40 +36,13 @@ class JaCeSubTranslatorInterface:
     In the end this implements the delegation pattern.
 
     A subtranslator uses its `get_handled_primitives()` function to indicate
-    for which Jax primitives it want to register. It is important that a
-    subtranslator can register for as many primitive it wants. At the same
-    time, it is possible that multiple subtranslators have registered for a
-    single primitive.
-
-    If multiple subtranslator have registered for the same primitive they
-    will be ordered by driver. There are two ways how a subtranslator can
-    influence this order. The first one is by implementing `get_priority()`,
-    the driver will then put them in ascending order.
-    I.e. the lower its priority the earlier a subtranslator is checked.
-    However, if a subtranslator returns the special value
-    `JaCeSubTranslatorInterface.DEFAULT_PRIORITY` it will be always put at the
-    end, in unspecific order if multiple translator are involved.
-
-    The second possibility is to override the '__lt__()' function,
-    and establish a strict weak order. If a subtranslator overrides this
-    function it should also override `get_priority()` to return `NotImplemented`.
-
-    To decide which subtranslator should be used for a specific equation
-    the driver will use their 'can_translate_jaxeqn()' function.
-    The first subtranslator that returns 'True' will then be used.
-
-    Todo:
-        Also come up with a way how to avoid that instances are allowed to access
-            some private members of the driver; Possibly by composition.
-        Come up with a better way of ordering; maybe introduce fixed priority level.
-            And then allows to sort them according to `__lt__()` within the level.
+    for which Jax primitives it want to register. It is important that there
+    is no limits on the number of primitives a subtranslator can register itself.
+    However, only one subtranslator can be registered for a primitive.
     """
 
     __slots__ = ()
 
-    # Default value for the priority of primitive translators.
-    DEFAULT_PRIORITY: Final = int("1" * 64, base=2)
-
     def __init__(
         self,
         *args: Any,
@@ -84,11 +57,7 @@ def get_handled_primitives(self) -> Collection[str] | str:
         """Returns the names of all Jax primitives that `self` is able to handle.
 
         There is no limit on the number of primitives for which a subtranslator
-        can register. It is possible that several translators can be registered
-        for the same name.
-
-        See Also:
-            `self.can_translate_jaxeqn()` and `self.get_priority()`.
+        can register.
 
         Notes:
             In case a string is returned it is interpreted as 1 element collection.
@@ -97,35 +66,6 @@ def get_handled_primitives(self) -> Collection[str] | str:
             "Class '{type(self).__name__}' does not implement 'get_handled_primitives()'."
         )
 
-    def can_translate_jaxeqn(
-        self,
-        driver: JaxprTranslationDriver,
-        in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
-        eqn: jcore.JaxprEqn,
-    ) -> bool:
-        """Tests if `self` is able to translate the Jax primitive passed as `eqn`.
-
-        This function is used by the driver to determine which of the subtranslators,
-        that have registered for a certain type of primitive, should be used.
-        For a more detailed description of the arguments see
-        `self.translate_jaxeqn()` function.
-
-        Args:
-            driver:         The driver object of the translation.
-            in_var_names:   Names of the SDFG variables used as inputs for the primitive.
-            out_var_names:  Names of the SDFG variables used as outputs for the primitive.
-            eqn:            The `jcore.JaxprEqn` instance that is currently being handled.
-
-        Notes:
-            In case there is only one subtranslator registered for a certain primitive,
-                it is unspecific if this function will be called at all `self.translate_jaxeqn()`.
-            This function will never be called for a primitive for which it has not registered itself.
-        """
-        raise NotImplementedError(
-            "Class '{type(self).__name__}' does not implement 'can_translate_jaxeqn()'."
-        )
-
     def translate_jaxeqn(
         self,
         driver: JaxprTranslationDriver,
@@ -152,7 +92,7 @@ def translate_jaxeqn(
             `translator.get_terminal_sdfg_state() is eqn_state` holds.
 
         Then the subtranslator is called. Usually a subtranslator should
-        construct the dataflow graph inside it. It is allowed that the
+        construct the dataflow graph inside `eqn_state`. It is allowed that the
         subtranslators creates more states if needed, but this state machine
         has to have a single terminal state, which must be returned
         and reachable from `eqn_state`.
@@ -185,55 +125,6 @@ def translate_jaxeqn(
             "Class '{type(self).__name__}' does not implement 'translate_jaxeqn()'."
         )
 
-    def get_priority(self) -> int:
-        """Returns the priority of this translator.
-
-        The value returned by this function is used by the driver to order the
-        subtranslators that have registered for the same primitive.
-        The _smaller_ the value the earlier it is checked.
-
-        See Also:
-            `self.can_translate_jaxeqn()` and `self.get_handled_primitives()`.
-
-        Notes:
-            By default the function returns `self.DEFAULT_PRIORITY`, which is
-                handled specially, i.e. it is put at the end.
-            If a subtranslator instead overrides `__lt__()` this function
-                should return `NotImplemented`.
-        """
-        return self.DEFAULT_PRIORITY
-
-    def has_default_priority(self) -> bool:
-        """Checks if `self` has default priority.
-
-        Notes:
-            It is allowed, but not advised to override this function.
-                However, it has to be consistent with `self.get_priority()`.
-        """
-        try:
-            x = self.get_priority()
-        except NotImplementedError:
-            return False
-        if x is NotImplemented:
-            return False
-        return x == self.DEFAULT_PRIORITY
-
-    def __lt__(
-        self,
-        other: JaCeSubTranslatorInterface,
-    ) -> bool:
-        """Tests if `self` should be checked before `other` in the selection process.
-
-        As outlined in the class description this is the second possibility to
-        influence the order of the subtranslator. This function should return
-        `True` if `self` should be checked for applicability _before_ `other`.
-
-        Notes:
-            If this function is overridden `get_priority()` should return `NotImplemented`.
-            This function is never called if either `self` or `other` have default priority.
-        """
-        return self.get_priority() < other.get_priority()
-
     def __eq__(
         self,
         other: Any,
@@ -241,12 +132,7 @@ def __eq__(
         """Tests if two subtranslators are equal.
 
         The default implementation checks if `self` and `other` have the same
-        type. However, if the behaviour of a subtranslator strongly depend on
-        its configuration this function should be overridden.
-
-        Notes:
-            If you override this function you should also override
-                `self.__hash__()` to make the two consistent.
+        type.
         """
         if not isinstance(other, JaCeSubTranslatorInterface):
             return NotImplemented
@@ -258,37 +144,5 @@ def __hash__(self) -> int:
         The default implementation return a hash that is based on the class.
         Thus all instances of a particular subtranslator will have the same
         hash value.
-
-        Notes:
-            If you override this function you should also override
-                `self.__eq__()` to make the two consistent.
         """
         return id(self.__class__)
-
-    @final
-    def __ne__(
-        self,
-        other: Any,
-    ) -> bool:
-        return NotImplemented
-
-    @final
-    def __le__(
-        self,
-        other: Any,
-    ) -> bool:
-        return NotImplemented
-
-    @final
-    def __ge__(
-        self,
-        other: Any,
-    ) -> bool:
-        return NotImplemented
-
-    @final
-    def __gt__(
-        self,
-        other: Any,
-    ) -> bool:
-        return NotImplemented
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 2c2c807..7be5636 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -102,10 +102,9 @@ def __init__(
 
         # Contains all the subtranslators that we need.
         #  They are partitioned by the names of the primitive they have registered for.
-        #  Inside a partition they are ordered by priority, lowest first, more important.
         #  This member is allocated by '_init_sub_translators()' and remains allocated
         #  during the lifetime of the object.
-        self._sub_translators: dict[str, list[jtrans.JaCeSubTranslatorInterface]] = None  # type: ignore[assignment]
+        self._sub_translators: dict[str, jtrans.JaCeSubTranslatorInterface] = None  # type: ignore[assignment]
 
         # The SDFG object that we are currently constructing.
         #  Only allocated during an ongoing translation.
@@ -923,36 +922,29 @@ def _allocate_translation_ctx(
 
     def _init_sub_translators(
         self,
-        kwargs: Mapping[str, Any],
+        subtrans_args: Mapping[str, Any],
     ) -> JaxprTranslationDriver:
         """This function initializes the subtranslator.
 
         The function forwards `kwargs` to the constructor of the subtranslators.
         However, it will remove all arguments starting with an underscore.
         """
-        if isinstance(self._sub_translators, dict):
-            raise RuntimeError("Tried to allocate the internal subtranslators twice.")
-        assert self._sub_translators is None  # type: ignore[unreachable]
+        assert self._sub_translators is None
 
-        kwargs = {k: v for k, v in kwargs.items() if not k.startswith("_")}
+        subtrans_args = {k: v for k, v in subtrans_args.items() if not k.startswith("_")}  # type: ignore[unreachable]
 
-        # First we will create all subtranslators and partition them.
-        subtranslators: dict[str, list[jtrans.JaCeSubTranslatorInterface]] = {}
-        for subtranslator_cls in jtsubt._get_subtranslators_cls():
-            subtranslator: jtrans.JaCeSubTranslatorInterface = subtranslator_cls(**kwargs)
+        sub_translators: dict[str, jtrans.JaCeSubTranslatorInterface] = {}
+        for sub_translator_cls in jtsubt._get_subtranslators_cls():
+            sub_translator: jtrans.JaCeSubTranslatorInterface = sub_translator_cls(**subtrans_args)
             handled_primitives: Iterable[str] = jutil.ensure_iterability(
-                subtranslator.get_handled_primitives()
+                sub_translator.get_handled_primitives()
             )
-
-            # Now add the subtranslator to the primitives it requests, we will sort them later into the correct order.
             for handled_primitive in handled_primitives:
-                subtranslators.setdefault(handled_primitive, []).append(subtranslator)
+                if handled_primitive in sub_translators:
+                    raise RuntimeError(f"Multiple sub_translators for '{handled_primitive}' found.")
+                sub_translators[handled_primitive] = sub_translator
+        self._sub_translators = sub_translators
 
-        # Now we order the subtranslators for the primitives.
-        self._sub_translators = {
-            prim_name: jtrutil.sort_subtranslators(primSubTranslators)
-            for prim_name, primSubTranslators in subtranslators.items()
-        }
         return self
 
     def _clear_translation_ctx(self) -> JaxprTranslationDriver:
@@ -992,41 +984,16 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
 
     def _find_sub_translator_for(
         self,
-        in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
         eqn: jcore.JaxprEqn,
     ) -> jtrans.JaCeSubTranslatorInterface:
-        """Returns the appropriate subtranslator for equation `eqn`.
-
-        The subtranslators are checked for applicability in the order of their priority.
-        The fist one that accepts the translation will be taken.
-
-        Notes:
-            The arguments are the same as for `JaCeSubTranslatorInterface.can_translate_jaxeqn()`.
-        """
+        """Returns the appropriate subtranslator for equation `eqn`."""
         assert self._sub_translators is not None
 
         prim_name: str = eqn.primitive.name
         if prim_name not in self._sub_translators:
             raise NotImplementedError(f"No subtranslators known to handle '{prim_name}'.")
-        subtranslator_canidates = self._sub_translators[prim_name]
-        assert len(subtranslator_canidates) > 0
-
-        subtranslator: jtrans.JaCeSubTranslatorInterface = None  # type: ignore[assignment]
-        if len(subtranslator_canidates) == 1:
-            subtranslator = next(iter(subtranslator_canidates))
-            assert subtranslator.can_translate_jaxeqn(
-                in_var_names=in_var_names, out_var_names=out_var_names, driver=self, eqn=eqn
-            )
-        else:
-            for subtranslatorCanidate in subtranslator_canidates:
-                if subtranslatorCanidate.can_translate_jaxeqn(
-                    driver=self, in_var_names=in_var_names, out_var_names=out_var_names, eqn=eqn
-                ):
-                    subtranslator = subtranslatorCanidate
-            else:
-                raise NotImplementedError(f"No subtranslator found for handling '{eqn}'.")
-        return subtranslator
+
+        return self._sub_translators[prim_name]
 
     def _translate_single_eqn(
         self,
@@ -1044,7 +1011,6 @@ def _translate_single_eqn(
         Returns:
             The SDFG names that were used as input and output are returned.
             The inputs might contain `None` which indicates that that input was a Jax Literal.
-            For more information see `JaCeSubTranslatorInterface.can_translate_jaxeqn()`.
 
         Notes:
             While `jaxpr` must be a `ClosedJaxpr`, `eqn` must come from the unclosed instance.
@@ -1070,24 +1036,20 @@ def _translate_single_eqn(
         )
 
         # Find the subtranslator
-        subtranslator: jtrans.JaCeSubTranslatorInterface = self._find_sub_translator_for(
-            in_var_names=in_var_names,
-            out_var_names=out_var_names,
-            eqn=eqn,
-        )
+        subtranslator: jtrans.JaCeSubTranslatorInterface = self._find_sub_translator_for(eqn)
 
         # Create the state into which the equation should be translated
         last_term_state: dace.SDFGState = self.get_terminal_sdfg_state()  # noqa: F841 # Will be used later
         eqn_state = self.append_new_state(
             label=f"{eqn.primitive.name}_{out_var_names[0]}",
-            prev_state=None,
+            prev_state=None,  # forces terminal state
         )
 
         # Now perform the actual translation of the equation.
         new_sdfg_term_state = subtranslator.translate_jaxeqn(
             driver=self,
             in_var_names=in_var_names,
-            out_var_names=out_var_names,  # Might be modified by subtranslator!
+            out_var_names=out_var_names,  # Might be modified by the subtranslator!
             eqn=eqn,
             eqn_state=eqn_state,
         )
diff --git a/src/jace/translator/util/subtranslator_helper_order.py b/src/jace/translator/util/subtranslator_helper_order.py
deleted file mode 100644
index 767521a..0000000
--- a/src/jace/translator/util/subtranslator_helper_order.py
+++ /dev/null
@@ -1,80 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-from __future__ import annotations
-
-from collections.abc import Sequence
-
-from jace import translator
-
-
-def sort_subtranslators(
-    subtranslators: Sequence[translator.JaCeSubTranslatorInterface],
-) -> Sequence[translator.JaCeSubTranslatorInterface]:
-    """Orders the subtranslators according to their priorities.
-
-    The function ensures the following:
-    - All subtranslators that have default priority are at the end.
-    - All subtranslators whose `get_priority()` returns `NotImplemented`
-        are at the begin of the list. These subtranslators are ordered according
-        to their `__lt__()` function.
-    - All subtranslators whose `get_priority()` function returns an integer are
-        in the middle, ordered according to this value.
-    """
-    if len(subtranslators) <= 1:
-        return subtranslators
-    subtranslators = sorted(subtranslators, key=_SubtranslatorOrderingHelper)
-    assert (len(subtranslators) <= 1) or all(
-        subtranslators[i - 1].has_default_priority() <= subtranslators[i].has_default_priority()
-        for i in range(1, len(subtranslators))
-    )
-    return subtranslators
-
-
-class _SubtranslatorOrderingHelper:
-    """Helper class used by `JaxprTranslationDriver` to bring the subtranslators in the correct order.
-
-    Essentially it is a wrapper that contains the additional logic that is
-    needed for sorting. This way subclasses does not need to implement it themselves.
-
-    Notes:
-        This class does not implement the other comparison function as requested by PEP8.
-    """
-
-    def __init__(self, subtranslator: translator.JaCeSubTranslatorInterface):
-        assert isinstance(subtranslator, translator.JaCeSubTranslatorInterface)
-        self._sub = subtranslator
-
-    def get(self) -> translator.JaCeSubTranslatorInterface:
-        return self._sub
-
-    def __lt__(
-        self,
-        other: _SubtranslatorOrderingHelper,
-    ) -> bool:
-        # Default priority means that it will always go to the end.
-        if self._sub.has_default_priority():
-            return False  # `self` has default priority, so it must go to the end.
-        if other._sub.has_default_priority():
-            return True  # `self` does not have default prio, thus it _must_ go before `other`.
-        prio_self = self._sub.get_priority()  # Get the priorities of the subtranslators.
-        prio_other = other._sub.get_priority()
-        if all(prio is NotImplemented for prio in (prio_self, prio_other)):
-            # None has a prio, `self` should decide if it should go first.
-            x = self._sub.__lt__(other._sub)
-            assert isinstance(x, bool)
-            return x
-        # In case only one has a priority, we change the order such that the one that implements
-        #  a `__lt__()` goes first.
-        if prio_self is NotImplemented:
-            assert isinstance(prio_other, int)
-            return True
-        if prio_other is NotImplemented:
-            assert isinstance(prio_self, int)
-            return False
-        assert all(isinstance(prio, int) for prio in (prio_other, prio_self))
-        return prio_self < prio_other

From 6dd0bf6239bf86c3ee3862a028d7edcf7418ce1d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 23 Apr 2024 11:20:14 +0200
Subject: [PATCH 041/458] Forgot to update some small part.

---
 src/jace/translator/sub_translators/__init__.py | 6 +-----
 1 file changed, 1 insertion(+), 5 deletions(-)

diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
index c9e1557..dc81752 100644
--- a/src/jace/translator/sub_translators/__init__.py
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -73,13 +73,9 @@ def _get_subtranslators_cls(
         If the externally defined subtranslators are requested they will be
             first and ordered as FILO order.
     """
-    # It is important that the externally defined are ordered before the builtins
-    #  and are ordered in FILO order, especuially if multiple subtranslator per
-    #  primitive are registered. Because this way they are inserted first
-    #  into the internal list of the driver, and furthermore since `sorted()`
-    #  is stable they will tend to end up more to the front.
     ret: list[type[jtrans.JaCeSubTranslatorInterface]] = []
     if with_external:
+        # Guarantees that we get them in FIFO order.
         ret.extend(reversed(_EXTERNAL_SUBTRANSLATORS.keys()))
     if builtins:
         ret.extend(_BUILTIN_SUBTRANSLATORS)

From c01f068b772ee2f0e0b19ea9542b09e597463b8c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 23 Apr 2024 13:02:12 +0200
Subject: [PATCH 042/458] Made the ALU translator more compatible.

But we should split that thing and make it nicer.
---
 .../sub_translators/alu_translator.py         | 43 -------------------
 1 file changed, 43 deletions(-)

diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index 78ef172..cec080d 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -74,54 +74,11 @@ def __init__(self, **kwargs: Any) -> None:
         """Initialize the `ALUTranslator`."""
         super().__init__(**kwargs)
 
-    # end def: __init__
-
     @override
     def get_handled_primitives(self) -> Collection[str] | str:
         """Returns the list of all known primitives."""
         return set(self._unary_ops.keys()).union(self._binary_ops.keys())
 
-    @override
-    def can_translate_jaxeqn(
-        self,
-        driver: jtranslator.JaxprTranslationDriver,
-        in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
-        eqn: jcore.JaxprEqn,
-    ) -> bool:
-        """Tests if the translator can handle the primitive.
-
-        Notes:
-            A user can generally expect that this function returns `True`.
-        """
-        is_scalar: bool = len(eqn.outvars[0].aval.shape) == 0
-        prim_name: str = eqn.primitive.name
-        if len(eqn.invars) == 1:
-            if prim_name not in self._unary_ops:
-                return False
-        elif len(eqn.invars) == 2:
-            if prim_name not in self._binary_ops:
-                return False
-        else:
-            return False
-        if out_var_names[0] is None:
-            raise RuntimeError(f"Encountered a literal output '{eqn}'.")
-        if len(eqn.outvars) != 1:
-            return False
-        if (not is_scalar) and all(x is None for x in in_var_names):
-            # Only literals as input are only allowed if we are scalar.
-            return False
-        if len(eqn.effects) != 0:
-            return False
-        if not all(
-            invar.aval.shape == ()
-            for invar, inname in zip(eqn.invars, in_var_names)
-            if inname is None
-        ):
-            # All literals must be scalars
-            return False
-        return True
-
     @override
     def translate_jaxeqn(
         self,

From 30ce4f2a0e374ee5cb1aad1ddfdbb8b4ceee8839 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 23 Apr 2024 13:06:07 +0200
Subject: [PATCH 043/458] Fixed a bug in the `ALUTranslator`.

The output memlet for the scalar case was not handled correctly.
---
 .../translator/sub_translators/alu_translator.py    | 13 ++++++++-----
 1 file changed, 8 insertions(+), 5 deletions(-)

diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index cec080d..039c44a 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -26,7 +26,7 @@ class ALUTranslator(jtranslator.JaCeSubTranslatorInterface):
 
     __slots__ = ()
 
-    # Contains all translation templates for unarry operations.
+    # Contains all translation templates for unary operations.
     _unary_ops: Final[dict[str, str]] = {
         "pos": "__out0 = +(__in0)",
         "neg": "__out0 = -(__in0)",
@@ -187,10 +187,13 @@ def translate_jaxeqn(
             tskl_inputs.append((f"__in{i}", i_memlet))
 
         # Now generate the Memlets for the output
-        tskl_output = (
-            "__out0",
-            dace.Memlet.simple(out_var_names[0], ", ".join([X[0] for X in tskl_map_ranges])),
-        )
+        if is_scalar:
+            tskl_output = ("__out0", dace.Memlet.simple(out_var_names[0], "0"))
+        else:
+            tskl_output = (
+                "__out0",
+                dace.Memlet.simple(out_var_names[0], ", ".join([X[0] for X in tskl_map_ranges])),
+            )
 
         if is_scalar:
             tskl_tasklet = eqn_state.add_tasklet(

From e4bdef078da3792f8c68c7d924843b0893dceffd Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 23 Apr 2024 15:18:44 +0200
Subject: [PATCH 044/458] Added a function that allows to run a
 `JaCeTranslationMemento`.

It is only for debugging.
---
 src/jace/translator/util/debug.py | 68 +++++++++++++++++++++++++++++++
 1 file changed, 68 insertions(+)
 create mode 100644 src/jace/translator/util/debug.py

diff --git a/src/jace/translator/util/debug.py b/src/jace/translator/util/debug.py
new file mode 100644
index 0000000..4b77071
--- /dev/null
+++ b/src/jace/translator/util/debug.py
@@ -0,0 +1,68 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""This module contains functions for debugging the translator."""
+
+from __future__ import annotations
+
+from typing import Any
+
+import dace
+
+from jace.translator import util as jtrutil
+
+
+def run_memento(
+    memento: jtrutil.JaCeTranslationMemento,
+    *args: Any,
+) -> tuple[Any, ...] | Any:
+    """Calls the SDFG with the supplied arguments.
+
+    Notes:
+        Currently the SDFG must not have any undefined symbols, i.e. no undefined sizes.
+        The function either returns a value or a tuple of values, i.e. no tree.
+    """
+    from dace.data import Data, Scalar, make_array_from_descriptor
+
+    # This is a simplification that makes our life simply
+    if len(memento.sdfg.used_symbols) != 0:
+        raise ValueError("No externally defined symbols are allowed.")
+    if len(memento.inp_names) != len(args):
+        raise ValueError(
+            f"Wrong numbers of arguments expected {len(memento.inp_names)} got {len(args)}."
+        )
+
+    # We use a return by reference approach, for calling the SDFG
+    call_args: dict[str, Any] = {}
+    for in_name, in_val in zip(memento.inp_names, args):
+        call_args[in_name] = in_val
+    for out_name in memento.out_names:
+        sarray: Data = memento.sdfg.arrays[out_name]
+        if isinstance(sarray, Scalar):
+            raise NotImplementedError("Do not support non array in return value.")
+        assert out_name not in call_args
+        call_args[out_name] = make_array_from_descriptor(sarray)
+
+    # Canonical SDFGs do not have global memory, so we must transform it.
+    #  We will afterwards undo it.
+    for glob_name in memento.inp_names + memento.out_names:  # type: ignore[operator]  # concatenation
+        memento.sdfg.arrays[glob_name].transient = True
+
+    try:
+        csdfg: dace.CompiledSDFG = memento.sdfg.compile()
+        csdfg(**call_args)
+
+        if len(memento.out_names) == 0:
+            return None
+        ret_val: tuple[Any] = tuple(call_args[out_name] for out_name in memento.out_names)
+        if len(memento.out_names) == 1:
+            return ret_val[0]
+        return ret_val
+
+    finally:
+        for name, tstate in memento.inp_names + memento.out_names:  # type: ignore[operator]  # concatenation
+            memento.sdfg.arrays[name].transient = tstate

From 85303e2f254b425b8634a0393fa2658f0e971089 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 23 Apr 2024 15:26:12 +0200
Subject: [PATCH 045/458] Added a function that allows to fire the
 trabnsformation pipeline in one go.

This function is highly internal and should not be used.
---
 src/jace/translator/util/__init__.py |  3 +++
 src/jace/translator/util/debug.py    | 27 ++++++++++++++++++++++-----
 2 files changed, 25 insertions(+), 5 deletions(-)

diff --git a/src/jace/translator/util/__init__.py b/src/jace/translator/util/__init__.py
index 910589e..da9c1d4 100644
--- a/src/jace/translator/util/__init__.py
+++ b/src/jace/translator/util/__init__.py
@@ -9,6 +9,7 @@
 
 from __future__ import annotations
 
+from .debug import _jace_run, run_memento
 from .jace_translation_memento import JaCeTranslationMemento
 from .revision_counter import RevisionCounterManager
 from .util import list_to_dict
@@ -19,4 +20,6 @@
     "JaCeTranslationMemento",
     "RevisionCounterManager",
     "list_to_dict",
+    "run_memento",
+    "_jace_run",
 ]
diff --git a/src/jace/translator/util/debug.py b/src/jace/translator/util/debug.py
index 4b77071..69724c4 100644
--- a/src/jace/translator/util/debug.py
+++ b/src/jace/translator/util/debug.py
@@ -9,9 +9,11 @@
 
 from __future__ import annotations
 
+from collections.abc import Callable
 from typing import Any
 
 import dace
+import jax
 
 from jace.translator import util as jtrutil
 
@@ -29,7 +31,7 @@ def run_memento(
     from dace.data import Data, Scalar, make_array_from_descriptor
 
     # This is a simplification that makes our life simply
-    if len(memento.sdfg.used_symbols) != 0:
+    if len(memento.sdfg.free_symbols) != 0:
         raise ValueError("No externally defined symbols are allowed.")
     if len(memento.inp_names) != len(args):
         raise ValueError(
@@ -50,11 +52,13 @@ def run_memento(
     # Canonical SDFGs do not have global memory, so we must transform it.
     #  We will afterwards undo it.
     for glob_name in memento.inp_names + memento.out_names:  # type: ignore[operator]  # concatenation
-        memento.sdfg.arrays[glob_name].transient = True
+        memento.sdfg.arrays[glob_name].transient = False
 
     try:
         csdfg: dace.CompiledSDFG = memento.sdfg.compile()
-        csdfg(**call_args)
+        with dace.config.temporary_config():
+            dace.Config.set("compiler", "allow_view_arguments", value=True)
+            csdfg(**call_args)
 
         if len(memento.out_names) == 0:
             return None
@@ -64,5 +68,18 @@ def run_memento(
         return ret_val
 
     finally:
-        for name, tstate in memento.inp_names + memento.out_names:  # type: ignore[operator]  # concatenation
-            memento.sdfg.arrays[name].transient = tstate
+        for name in memento.inp_names + memento.out_names:  # type: ignore[operator]  # concatenation
+            memento.sdfg.arrays[name].transient = True
+
+
+def _jace_run(
+    fun: Callable,
+    *args: Any,
+) -> Any:
+    """Traces and run function `fun` using `Jax | DaCe`."""
+    from jace.translator import JaxprTranslationDriver
+
+    jaxpr = jax.make_jaxpr(fun)(*args)
+    driver = JaxprTranslationDriver()
+    memento = driver.translate_jaxpr(jaxpr)
+    return run_memento(memento, *args)

From 68b4d3463339114e08202e26086ab8cdf23d00d7 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 23 Apr 2024 15:53:00 +0200
Subject: [PATCH 046/458] Made some small fixes.

---
 .gitignore                                      |  3 +++
 src/jace/translator/jaxpr_translator_driver.py  |  6 +++---
 .../sub_translators/alu_translator.py           |  6 +++---
 src/jace/util/jax.py                            | 17 ++++++-----------
 4 files changed, 15 insertions(+), 17 deletions(-)

diff --git a/.gitignore b/.gitignore
index 25cf9a4..15604f3 100644
--- a/.gitignore
+++ b/.gitignore
@@ -153,6 +153,9 @@ src/*/_version.py
 ehthumbs.db
 Thumbs.db
 
+# DaCe
+.dacecache/
+
 # Common editor files
 *~
 *.swp
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 7be5636..f9eba29 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -621,7 +621,9 @@ def add_array(
                 )
             alt_name = jutil.get_jax_var_name(arg)
         if alt_name is not None:
-            assert isinstance(alt_name, str)
+            assert isinstance(
+                alt_name, str
+            ), f"Got '{type(alt_name)}' instead of 'str' for 'alt_name'."
             find_new_name = False  # If a name was given, then use it no matter what.
             if len(alt_name) == 0:
                 raise ValueError("Passed an empty 'alt_name'.")
@@ -629,8 +631,6 @@ def add_array(
                 raise ValueError("'alt_name' is a forbidden name.")
             if not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", alt_name):
                 raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
-            if force_jax_name:
-                raise ValueError("Specified 'force_jax_name' but passed 'alt_name'.")
             if name_prefix is not None:
                 raise ValueError(
                     f"Specified 'name_prefix' ('{name_prefix}') but passed '{alt_name}' as 'alt_name'."
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index 039c44a..f1c1946 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -164,7 +164,7 @@ def translate_jaxeqn(
         tskl_map_ranges: list[tuple[str, str]] = [
             (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
         ]
-        tskl_outputs: tuple[str, dace.Memlet] = None
+        tskl_output: tuple[str, dace.Memlet] = None
         tskl_inputs: list[tuple[str, dace.Memlet] | tuple[None, None]] = []
 
         # Generate the Memlets for the input.
@@ -199,7 +199,7 @@ def translate_jaxeqn(
             tskl_tasklet = eqn_state.add_tasklet(
                 tskl_name,
                 jtutil.list_to_dict(tskl_inputs).keys(),
-                jtutil.list_to_dict([tskl_outputs]).keys(),
+                jtutil.list_to_dict([tskl_output]).keys(),
                 tskl_code,
             )
             for in_var, (in_connector, in_memlet) in zip(in_var_names, tskl_inputs, strict=False):
@@ -225,7 +225,7 @@ def translate_jaxeqn(
                 map_ranges=jtutil.list_to_dict(tskl_map_ranges),
                 inputs=jtutil.list_to_dict(tskl_inputs),
                 code=tskl_code,
-                outputs=jtutil.list_to_dict([tskl_outputs]),
+                outputs=jtutil.list_to_dict([tskl_output]),
                 external_edges=True,
             )
 
diff --git a/src/jace/util/jax.py b/src/jace/util/jax.py
index 755e6a3..845ba16 100644
--- a/src/jace/util/jax.py
+++ b/src/jace/util/jax.py
@@ -13,6 +13,7 @@
 
 from __future__ import annotations
 
+import re
 from dataclasses import dataclass
 from typing import Any
 
@@ -44,15 +45,12 @@ def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
 
     Args:
         jax_var:     The variable to stringify.
-
-    Todos:
-        Implement a regex check for the name.
     """
     if isinstance(jax_var, jcore.DropVar):
         return "_"
     if isinstance(jax_var, JaCeVar):
-        return jax_var.name
-    if isinstance(jax_var, jcore.Atom):
+        jax_name = jax_var.name
+    elif isinstance(jax_var, jcore.Atom):
         jax_name = str(jax_var)  # This only works up to some version
     elif isinstance(jax_var, str):
         jax_name = jax_var
@@ -60,13 +58,10 @@ def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
         raise TypeError(
             f"Does not know how to transform '{jax_var}' (type: '{type(jax_var).__name__}') into a string."
         )
-    # TODO(phimuell): Add regex to ensure that the name is legit.
     assert isinstance(jax_name, str)
-    if len(jax_name) == 0:
-        raise ValueError(
-            f"Failed to translate the Jax variable '{jax_var}' into a name, the result was empty."
-        )
-    return jax_var
+    if not re.fullmatch("[a-zA-Z_][a-zA-Z_]*", jax_name):
+        raise ValueError(f"Deduced Jax name '{jax_name}' is invalid.")
+    return jax_name
 
 
 def get_jax_var_shape(jax_var: jcore.Atom) -> tuple[int, ...]:

From 34b525a664f73297c33dc044311328fe21a376a2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 23 Apr 2024 16:01:21 +0200
Subject: [PATCH 047/458] Added a new test to test the ALU.

---
 tests/test_sub_translators_alu.py | 35 +++++++++++++++++++++++++++++++
 1 file changed, 35 insertions(+)
 create mode 100644 tests/test_sub_translators_alu.py

diff --git a/tests/test_sub_translators_alu.py b/tests/test_sub_translators_alu.py
new file mode 100644
index 0000000..006d4b3
--- /dev/null
+++ b/tests/test_sub_translators_alu.py
@@ -0,0 +1,35 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements tests for the ALU translator."""
+
+from __future__ import annotations
+
+import jax
+import numpy as np
+
+from jace.translator.util import debug as jtrudebug
+
+
+def test_add():
+    """Simple add function."""
+    jax.config.update("jax_enable_x64", True)
+
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A + B
+
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    ref = testee(A, B)
+    res = jtrudebug._jace_run(testee, A, B)
+
+    assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
+
+
+if __name__ == "__main__":
+    test_add()

From 0eb8cb1650abefe15c646cbde04b2a8aa81d192f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 26 Apr 2024 08:35:08 +0200
Subject: [PATCH 048/458] Fixed the `get_jax_var_name()` function.

The function is now able to handle more recent Jax functions, however, it now produces very starnge names.
I think we should have some kind of context, similar to the one used by Jax itself.
---
 src/jace/util/jax.py | 16 ++++++++++++----
 1 file changed, 12 insertions(+), 4 deletions(-)

diff --git a/src/jace/util/jax.py b/src/jace/util/jax.py
index 845ba16..2a1a2aa 100644
--- a/src/jace/util/jax.py
+++ b/src/jace/util/jax.py
@@ -50,16 +50,24 @@ def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
         return "_"
     if isinstance(jax_var, JaCeVar):
         jax_name = jax_var.name
-    elif isinstance(jax_var, jcore.Atom):
-        jax_name = str(jax_var)  # This only works up to some version
+    elif isinstance(jax_var, jcore.Var):
+        # This stopped working after version 0.20.4, because of some changes in Jax
+        #  See `https://github.com/google/jax/pull/10573` for more information.
+        #  The following implementation will generate stable names, but decouples
+        #  them from pretty printed Jaxpr, we maybe need a pretty print context somewhere.
+        jax_name = f"jax{jax_var.count}{jax_var.suffix}"
+    elif isinstance(jax_var, jcore.Literal):
+        raise TypeError("Can not translate a Jax Literal to a variable name.")
     elif isinstance(jax_var, str):
         jax_name = jax_var
     else:
         raise TypeError(
-            f"Does not know how to transform '{jax_var}' (type: '{type(jax_var).__name__}') into a string."
+            f"Can not transform '{jax_var}' (type: '{type(jax_var).__name__}') not a name."
         )
     assert isinstance(jax_name, str)
-    if not re.fullmatch("[a-zA-Z_][a-zA-Z_]*", jax_name):
+    if not (
+        re.fullmatch("jax[1-9][0-9]*", jax_name) or re.fullmatch("[a-zA-Z][a-zA-Z]*", jax_name)
+    ):
         raise ValueError(f"Deduced Jax name '{jax_name}' is invalid.")
     return jax_name
 

From 529c291732b7b8fd09824565d3432d8330a563ae Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 26 Apr 2024 08:39:52 +0200
Subject: [PATCH 049/458] Reorganized the `jace.util` package.

---
 src/jace/util/__init__.py                 | 19 +++++++---
 src/jace/util/{dace.py => dace_helper.py} |  0
 src/jace/util/{jax.py => jax_helper.py}   | 43 +++++++++++++++++++++++
 src/jace/util/util.py                     | 14 ++++++++
 4 files changed, 72 insertions(+), 4 deletions(-)
 rename src/jace/util/{dace.py => dace_helper.py} (100%)
 rename src/jace/util/{jax.py => jax_helper.py} (75%)

diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 0bd9a15..20b0f50 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -9,15 +9,26 @@
 
 from __future__ import annotations
 
-from .jax import JaCeVar, get_jax_var_dtype, get_jax_var_name, get_jax_var_shape, translate_dtype
-from .util import ensure_iterability
+from .jax_helper import (
+    JaCeVar,
+    get_jax_var_dtype,
+    get_jax_var_name,
+    get_jax_var_shape,
+    is_jaxified,
+    is_tracing_ongoing,
+    translate_dtype,
+)
+from .util import ensure_iterability, is_jaceified
 
 
 __all__ = [
+    "ensure_iterability",
+    "is_tracing_ongoing",
+    "is_jaceified",
+    "is_jaxified",
+    "JaCeVar",
     "get_jax_var_name",
     "get_jax_var_shape",
     "get_jax_var_dtype",
-    "ensure_iterability",
     "translate_dtype",
-    "JaCeVar",
 ]
diff --git a/src/jace/util/dace.py b/src/jace/util/dace_helper.py
similarity index 100%
rename from src/jace/util/dace.py
rename to src/jace/util/dace_helper.py
diff --git a/src/jace/util/jax.py b/src/jace/util/jax_helper.py
similarity index 75%
rename from src/jace/util/jax.py
rename to src/jace/util/jax_helper.py
index 2a1a2aa..dccfda3 100644
--- a/src/jace/util/jax.py
+++ b/src/jace/util/jax_helper.py
@@ -9,11 +9,14 @@
 
 Most of the functions defined here allow an unified access to Jax' internals
 in a consistent and stable way.
+It is important that this module is different from the `jace.jax` module, which
+mimics the full `jax` package itself.
 """
 
 from __future__ import annotations
 
 import re
+from collections.abc import Sequence
 from dataclasses import dataclass
 from typing import Any
 
@@ -95,6 +98,46 @@ def get_jax_var_dtype(jax_var: jcore.Atom) -> dace.typeclass:
     raise TypeError(f"'get_jax_var_dtype()` is not implemented for '{type(jax_var)}'.")
 
 
+def is_tracing_ongoing(
+    *args: Any,
+    **kwargs: Any,
+) -> bool:
+    """Test if tracing is ongoing.
+
+    While a return value `True` guarantees that a translation is ongoing,
+    a value of `False` does not guarantees that no tracing is active.
+
+    Raises:
+        RuntimeError: If the function fails to make a detection.
+    """
+    from itertools import chain
+
+    # The current implementation only checks the arguments if it contains tracers.
+    if (len(args) == 0) and (len(kwargs) == 0):
+        raise RuntimeError("Failed to determine if tracing is ongoing.")
+    return any(isinstance(x, jcore.Tracer) for x in chain(args, kwargs.values()))
+
+
+def is_jaxified(obj: Any) -> bool:
+    """Tests if `obj` is a "jaxified" object.
+
+    A "jexified" object is an object that was processed by Jax.
+    While a return value of `True` guarantees a jaxified object,
+    `False` might not proof the contrary.
+    """
+    from jax._src import pjit as jaxpjit
+    import jaxlib
+
+    # These are all types we consider as jaxify
+    jaxify_types: Sequence[type] = (
+        jcore.Primitive,
+        # jstage.Wrapped, # Not runtime chakable
+        jaxpjit.JitWrapped,
+        jaxlib.xla_extension.PjitFunction
+    )
+    return isinstance(obj, jaxify_types)
+
+
 def translate_dtype(dtype: Any) -> dace.typeclass:
     """Turns a Jax datatype into a DaCe datatype."""
 
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index d728be5..c58a691 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -28,3 +28,17 @@ def ensure_iterability(
     elif isinstance(x, Iterable):
         pass
     return x
+
+
+def is_jaceified(obj: Any) -> bool:
+    """Tests if `obj` is decorated by JaCe.
+
+    Similar to `jace.util.is_jaxified`, but for JaCe object.
+    """
+    from jace import jax as jjax, util as jutil
+
+    if jutil.is_jaxified(obj):
+        return False
+    # Currently it is quite simple because we can just check if `obj`
+    #  is derived from `jace.jax.JitWrapped`, might become harder in the future.
+    return isinstance(obj, jjax.JitWrapped)

From 11a2f57ca8636bfe4852ff9564422b12255d413d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 26 Apr 2024 08:41:35 +0200
Subject: [PATCH 050/458] Started with a `jace.jax` package that can be used as
 a better drop in replacement.

I think that we will need it in the future, for example it is, in my view, currently the best place to put `jace.jit`.
Another idea that could be worthwhile to consider is to mimick the `jace` package after `jax`.
---
 src/jace/jax/__init__.py | 8 ++++++++
 1 file changed, 8 insertions(+)
 create mode 100644 src/jace/jax/__init__.py

diff --git a/src/jace/jax/__init__.py b/src/jace/jax/__init__.py
new file mode 100644
index 0000000..b7aa000
--- /dev/null
+++ b/src/jace/jax/__init__.py
@@ -0,0 +1,8 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""This package mimics parts of the interface of the `jax` package that is supported by JaCe."""

From 998a529630b8b5fbca53374bacb39401f2e4455d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 26 Apr 2024 10:28:51 +0200
Subject: [PATCH 051/458] Updated `_jace_run()` to also accept arguments for
 the driver.

---
 src/jace/translator/util/debug.py | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/src/jace/translator/util/debug.py b/src/jace/translator/util/debug.py
index 69724c4..6ba8ff2 100644
--- a/src/jace/translator/util/debug.py
+++ b/src/jace/translator/util/debug.py
@@ -75,11 +75,17 @@ def run_memento(
 def _jace_run(
     fun: Callable,
     *args: Any,
+    **kwargs: Any,
 ) -> Any:
-    """Traces and run function `fun` using `Jax | DaCe`."""
+    """Traces and run function `fun` using `Jax | DaCe`.
+
+    Args:
+        *args:      Forwarded to the tracing and final execution of the SDFG.
+        **kwargs:   Used to construct the driver.
+    """
     from jace.translator import JaxprTranslationDriver
 
     jaxpr = jax.make_jaxpr(fun)(*args)
-    driver = JaxprTranslationDriver()
+    driver = JaxprTranslationDriver(**kwargs)
     memento = driver.translate_jaxpr(jaxpr)
     return run_memento(memento, *args)

From 3b40e1802edfb3a246b2ddbf21703de7f4f03439 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 26 Apr 2024 10:43:43 +0200
Subject: [PATCH 052/458] Made it poissible to now jit from Jace directly.

However, it does not cache the compiled code yet.
And it is not tested yet.
---
 src/jace/__init__.py       |  5 ++
 src/jace/jax/__init__.py   | 14 ++++++
 src/jace/jax/api.py        | 98 ++++++++++++++++++++++++++++++++++++++
 src/jace/jax/api_helper.py | 84 ++++++++++++++++++++++++++++++++
 4 files changed, 201 insertions(+)
 create mode 100644 src/jace/jax/api.py
 create mode 100644 src/jace/jax/api_helper.py

diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 5e0595b..5d8ec9e 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -10,11 +10,16 @@
 from __future__ import annotations
 
 from .__about__ import __author__, __copyright__, __license__, __version__, __version_info__
+from .jax import grad, jacfwd, jacrev, jit
 
 
 __all__ = [
     "__author__",
     "__copyright__",
+    "grad",
+    "jit",
+    "jacfwd",
+    "jacrev",
     "__license__",
     "__version__",
     "__version_info__",
diff --git a/src/jace/jax/__init__.py b/src/jace/jax/__init__.py
index b7aa000..de56d5d 100644
--- a/src/jace/jax/__init__.py
+++ b/src/jace/jax/__init__.py
@@ -6,3 +6,17 @@
 # SPDX-License-Identifier: BSD-3-Clause
 
 """This package mimics parts of the interface of the `jax` package that is supported by JaCe."""
+
+from __future__ import annotations
+
+from .api import grad, jacfwd, jacrev, jit
+from .api_helper import JitWrapped
+
+
+__all__ = [
+    "JitWrapped",
+    "jit",
+    "jacfwd",
+    "jacrev",
+    "grad",
+]
diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
new file mode 100644
index 0000000..4915d98
--- /dev/null
+++ b/src/jace/jax/api.py
@@ -0,0 +1,98 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Contains the implementation of the jit functioanlity of JaCe."""
+
+from __future__ import annotations
+
+from collections.abc import Callable
+from typing import Any, cast
+
+from jace import jax as jjax, util as jutil
+
+
+def jit(
+    fun: Callable | None = None,
+    /,
+    **kwargs: Any,
+) -> jjax.JitWrapped:
+    """Creates a jit wrapper instance."""
+    import jax
+
+    if fun is None:
+        assert len(kwargs) > 0
+
+        def wrapper(f: Callable) -> jjax.JitWrapped:
+            return jit(f, **kwargs)
+
+        return wrapper  # type: ignore[return-value]
+
+    # in case we are dealing with a JaCe object, we first unwrap it.
+    #  Recursion to handle arbitrary deep nestings.
+    if jutil.is_jaceified(fun):
+        fun = cast(jjax.JitWrapped, fun)
+        return jit(fun.__wrapped__)
+
+    # Prevents the creation of a level of unnecessary jit.
+    #  Probably better solution by using the `disable_jit()`?
+    if len(kwargs) == 0:
+        return jjax.JitWrapped(fun)
+    return jjax.JitWrapped(jax.jit(fun, **kwargs))
+
+
+def grad(
+    fun: Callable | None = None,
+    /,
+    **kwargs: Any,
+) -> jjax.JitWrapped:
+    """The gradient transformation."""
+    import jax
+
+    if fun is None:
+
+        def wrapper(f: Callable) -> jjax.JitWrapped:
+            return grad(f, **kwargs)
+
+        return wrapper  # type: ignore[return-value]
+
+    return jjax.JitWrapped(jax.grad(fun, **kwargs))
+
+
+def jacfwd(
+    fun: Callable | None = None,
+    /,
+    **kwargs: Any,
+) -> jjax.JitWrapped:
+    """Returns the Jacobian of `fun` in forward differentiation mode."""
+    import jax
+
+    if fun is None:
+
+        def wrapper(f: Callable) -> jjax.JitWrapped:
+            return jacfwd(f, **kwargs)
+
+        return wrapper  # type: ignore[return-value]
+
+    return jjax.JitWrapped(jax.jacfwd(fun, **kwargs))
+
+
+def jacrev(
+    fun: Callable | None = None,
+    /,
+    **kwargs: Any,
+) -> jjax.JitWrapped:
+    """Returns the Jacobian of `fun` in reverse differentiation mode."""
+    import jax
+
+    if fun is None:
+
+        def wrapper(f: Callable) -> jjax.JitWrapped:
+            return jacrev(f, **kwargs)
+
+        return wrapper  # type: ignore[return-value]
+
+    return jjax.JitWrapped(jax.jacrev(fun, **kwargs))
diff --git a/src/jace/jax/api_helper.py b/src/jace/jax/api_helper.py
new file mode 100644
index 0000000..72bcdb8
--- /dev/null
+++ b/src/jace/jax/api_helper.py
@@ -0,0 +1,84 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Helper functionality for `jace.jax.jit()`."""
+
+from __future__ import annotations
+
+from typing import Any
+
+from jace import util as jutil
+
+
+class JitWrapped:
+    """Result class of all jited functions.
+
+    It is essentially a wrapper around an already jited, i.e. passed to a Jax primitive function.
+    The function is then able to compile it if needed.
+    However, the wrapped object is itself again tracable, thus it does not break anything.
+
+    Todo:
+        Implement a compile cache (shape, data type, strides, location).
+        Turn this into a primitive.
+        Handles pytrees.
+    """
+
+    def __init__(
+        self,
+        jax_prim: Any,  # No idea if there is a better type.
+    ) -> None:
+        """Creates a wrapped jace jitable object of `jax_prim`."""
+        assert jax_prim is not None
+        self._fun = jax_prim
+
+    def __call__(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> Any:
+        """Compile and run the wrapped function.
+
+        In case `self` is called by Jax during a trace, the call will
+        transparently forwarded to the wrapped function.
+        This guarantees that `self` itself is traceable.
+        """
+
+        if jutil.is_tracing_ongoing(*args, **kwargs):
+            return self._forward_trace(*args, **kwargs)
+        return self._call_sdfg(*args, **kwargs)
+
+    def _forward_trace(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> Any:
+        """Is called by `self.__call__` if a trace operation was detected.
+
+        I.e. it will simply forward the call to the wrapped function.
+        """
+        if len(kwargs) != 0:
+            raise RuntimeError("Passed kwargs, which are not allowed in tracing.")
+        return self._fun(*args, **kwargs)
+
+    def _call_sdfg(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> Any:
+        """Compiles and run the wrapped function.
+
+        Notes:
+            Currently no caching of the compiled object is done.
+        """
+        from jace.translator.util import debug as jtrudebug
+
+        return jtrudebug._jace_run(self._fun, *args, **kwargs)
+
+    @property
+    def __wrapped__(self) -> Any:
+        """Returns the wrapped object."""
+        return self._fun

From 7317a996aa16545e0385820e504ddf61fd4aac1e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 26 Apr 2024 13:34:22 +0200
Subject: [PATCH 053/458] Updated the function to run mementos.

There is still the problem of scalars as return values.
However, even DaCe turns them into arrays.
---
 src/jace/translator/util/debug.py | 18 +++++++++++++-----
 1 file changed, 13 insertions(+), 5 deletions(-)

diff --git a/src/jace/translator/util/debug.py b/src/jace/translator/util/debug.py
index 6ba8ff2..a28c9d8 100644
--- a/src/jace/translator/util/debug.py
+++ b/src/jace/translator/util/debug.py
@@ -28,11 +28,13 @@ def run_memento(
         Currently the SDFG must not have any undefined symbols, i.e. no undefined sizes.
         The function either returns a value or a tuple of values, i.e. no tree.
     """
-    from dace.data import Data, Scalar, make_array_from_descriptor
+    from dace.data import Array, Data, Scalar, make_array_from_descriptor
 
     # This is a simplification that makes our life simply
     if len(memento.sdfg.free_symbols) != 0:
-        raise ValueError("No externally defined symbols are allowed.")
+        raise ValueError(
+            f"No externally defined symbols are allowed, found: {memento.sdfg.free_symbols}"
+        )
     if len(memento.inp_names) != len(args):
         raise ValueError(
             f"Wrong numbers of arguments expected {len(memento.inp_names)} got {len(args)}."
@@ -44,10 +46,16 @@ def run_memento(
         call_args[in_name] = in_val
     for out_name in memento.out_names:
         sarray: Data = memento.sdfg.arrays[out_name]
-        if isinstance(sarray, Scalar):
-            raise NotImplementedError("Do not support non array in return value.")
         assert out_name not in call_args
-        call_args[out_name] = make_array_from_descriptor(sarray)
+
+        if (out_name == "__return") or (out_name.startswith("__return_")):
+            continue
+        if isinstance(sarray, Scalar):
+            raise NotImplementedError("Scalars as return values are not supported.")
+        if isinstance(sarray, Array):
+            call_args[out_name] = make_array_from_descriptor(sarray)
+        else:
+            raise NotImplementedError(f"Can not handle '{type(sarray).__name__}' as output.")
 
     # Canonical SDFGs do not have global memory, so we must transform it.
     #  We will afterwards undo it.

From f24f2981182953dc9f58777aecfca6c373f89421 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 26 Apr 2024 13:36:26 +0200
Subject: [PATCH 054/458] Fixed an error in the ALU Transformator.

---
 src/jace/translator/sub_translators/alu_translator.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index f1c1946..86d6e5e 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -164,11 +164,11 @@ def translate_jaxeqn(
         tskl_map_ranges: list[tuple[str, str]] = [
             (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
         ]
-        tskl_output: tuple[str, dace.Memlet] = None
+        tskl_output: tuple[str, dace.Memlet] = None  # type: ignore[assignment]
         tskl_inputs: list[tuple[str, dace.Memlet] | tuple[None, None]] = []
 
         # Generate the Memlets for the input.
-        for i, dims_to_bcast in enumerate([dims_to_bcastl, dims_to_bcastr]):
+        for i, dims_to_bcast in zip(range(len(in_var_names)), [dims_to_bcastl, dims_to_bcastr]):
             if in_var_names[i] is None:  # Literal: No input needed.
                 tskl_inputs.append((None, None))
                 continue

From c1db33f94782a876392a5115f7848d0fbdda7ddb Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 26 Apr 2024 14:03:26 +0200
Subject: [PATCH 055/458] Added a test for the jitting and composition.

However, it is not yet cached.
---
 tests/test_jax_api.py | 123 ++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 123 insertions(+)
 create mode 100644 tests/test_jax_api.py

diff --git a/tests/test_jax_api.py b/tests/test_jax_api.py
new file mode 100644
index 0000000..a48022c
--- /dev/null
+++ b/tests/test_jax_api.py
@@ -0,0 +1,123 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Tests the compability of the JaCe api to Jax."""
+
+from __future__ import annotations
+
+import jax
+import numpy as np
+import pytest
+from jax import numpy as jnp
+
+import jace
+from jace import util as jutil
+
+
+np.random.seed(42)
+
+
+def test_jit():
+    """Simple add function."""
+    jax.config.update("jax_enable_x64", True)
+
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A + B
+
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    jax_testee = jax.jit(testee)
+    jace_testee = jace.jit(testee)
+
+    assert jutil.is_jaxified(jax_testee)
+    assert not jutil.is_jaxified(jace_testee)
+    assert not jutil.is_jaceified(jax_testee)
+    assert jutil.is_jaceified(jace_testee)
+
+    ref = jax_testee(A, B)
+    res = jace_testee(A, B)
+
+    assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
+
+
+@pytest.mark.skip(reason="Scalar return values are not handled.")
+def test_composition1():
+    jax.config.update("jax_enable_x64", True)
+
+    def f_(x):
+        return jnp.sin(x)
+
+    def df_(x):
+        return jnp.cos(x)
+
+    def ddf_(x):
+        return -jnp.sin(x)
+
+    x = 1.0
+
+    # Jacify it.
+    f = jace.jit(f_)
+    assert jutil.is_jaceified(f)
+    assert not jutil.is_jaxified(f)
+
+    ref = f_(x)
+    res = f(x)
+    assert np.allclose(ref, res), f"f: Expected '{ref}', got '{res}'."
+
+    # Now apply a Jax transformation to the jaceified function.
+    df = jax.grad(f)
+
+    ref = df_(x)
+    res = df(x)
+    assert np.allclose(ref, res), f"df: Expected '{ref}', got '{res}'."
+
+    # Now apply a jace transformation around a jaxified transformation.
+    ddf = jace.grad(df)
+
+    ref = ddf_(x)
+    res = ddf(x)
+    assert np.allclose(ref, res), f"ddf: Expected '{ref}', got '{res}'."
+
+
+def test_composition2():
+    jax.config.update("jax_enable_x64", True)
+
+    def f1_(A, B):
+        return A + B
+
+    f1 = jax.jit(f1_)
+
+    def f2_(A, B, C):
+        return f1(A, B) - C
+
+    f2 = jace.jit(f2_)
+
+    def f3_(A, B, C, D):
+        return f2(A, B, C) * D
+
+    f3_jax = jax.jit(f3_)
+    f3_jace = jace.jit(f3_)
+
+    A, B, C, D = (np.random.random((10, 3, 50)) for _ in range(4))
+
+    ref = ((A + B) - C) * D
+
+    # We have to disable it, because currently there is no `pjit` instruction
+    #  that can handle the nesting.
+    with jax.disable_jit():
+        res_jax = f3_jax(A, B, C, D)
+        res_jace = f3_jace(A, B, C, D)
+
+    assert np.allclose(ref, res_jax), "Jax failed."
+    assert np.allclose(ref, res_jace), "JaCe Failed."
+
+
+if __name__ == "__main__":
+    test_jit()
+    # test_composition1()
+    test_composition2()

From 97a35beaeffb9f873484803c436f834f58d85686 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 26 Apr 2024 15:35:32 +0200
Subject: [PATCH 056/458] WIP: Started with a caching mechanism for teh Jiting.

However, I have to think more.
There are some things that I do not like, especially that we have to chache the "abstract input data" but must also use value.

I think that this should be solved a bit differently.
---
 src/jace/jax/api_helper.py | 115 ++++++++++++++++++++++++++++++++++++-
 1 file changed, 114 insertions(+), 1 deletion(-)

diff --git a/src/jace/jax/api_helper.py b/src/jace/jax/api_helper.py
index 72bcdb8..526b7f3 100644
--- a/src/jace/jax/api_helper.py
+++ b/src/jace/jax/api_helper.py
@@ -9,9 +9,14 @@
 
 from __future__ import annotations
 
+from functools import lru_cache
 from typing import Any
 
+import dace
+import jax
+
 from jace import util as jutil
+from jace.translator import util as jtrutil
 
 
 class JitWrapped:
@@ -34,6 +39,7 @@ def __init__(
         """Creates a wrapped jace jitable object of `jax_prim`."""
         assert jax_prim is not None
         self._fun = jax_prim
+        self._tran_count = 0
 
     def __call__(
         self,
@@ -76,9 +82,116 @@ def _call_sdfg(
         """
         from jace.translator.util import debug as jtrudebug
 
-        return jtrudebug._jace_run(self._fun, *args, **kwargs)
+        memento: jtrutil.JaCeTranslationMemento = self._get_memento(*args, **kwargs)
+        return jtrudebug.run_memento(memento, *args)
+
+    def _get_memento(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> jtrutil.JaCeTranslationMemento:
+        """This function returns the Memento.
+
+        The function will transform its arguments into `_ArgInfo` versions.
+        This is needed since Jax only cares about the information stored inside it.
+        The positional only arguments are used to cache the settings important for Jax
+        and the kwonly arguments are used to influence the Jaxpr to SDFG translator.
+
+        Notes:
+            It is forbidden to permanently modify the returned memento.
+                Doing so results in undefined behaviour.
+        """
+        return self._get_memento_cached(
+            *(_ArgInfo.from_value(v) for v in args),
+            **kwargs,
+        )
+
+    @lru_cache
+    def _get_memento_cached(
+        self,
+        *args: _ArgInfo,
+        **kwargs: Any,
+    ) -> jtrutil.JaCeTranslationMemento:
+        """Generates the SDFG from
+
+        Todo:
+            Also make the SDFG compiled and permanent also in the memento
+            Implement a better cache that avoids using this strange way to pass values around.
+
+        Notes:
+            It is forbidden to permanently modify the returned memento.
+                Doing so results in undefined behaviour.
+        """
+        from jace.translator import JaxprTranslationDriver
+
+        real_args: tuple[Any, ...] = tuple(x._get_val_once() for x in args)
+        jaxpr = jax.make_jaxpr(self.__wrapped__)(*real_args)
+        driver = JaxprTranslationDriver(**kwargs)
+        return driver.translate_jaxpr(jaxpr)
 
     @property
     def __wrapped__(self) -> Any:
         """Returns the wrapped object."""
         return self._fun
+
+    def __hash__(self) -> int:
+        """Hash based on the wrapped function (needed for caching)."""
+        return hash(self.__wrapped__)
+
+    def __eq__(self, other: Any) -> bool:
+        """Wrapped function based equality testing (needed for caching)."""
+        if not isinstance(other, JitWrapped):
+            return False
+        return self.__wrapped__ == other.__wrapped__
+
+
+class _ArgInfo:
+    """Abstracts argument for the case of the `JitWrapped` object.
+
+    Essentially represents a single argument.
+    To construct it use the `from_value()` function.
+
+    Notes:
+        An `_ArgInfo` instance also keeps a reference to the value that was used to construct it.
+            However this value can only retrieved once and is removed afterwards.
+            Conceptionally it should be a weak reerence, but several classes (especially `int`
+            and `float` can not be weakly referenced.
+    """
+
+    shape: tuple[int, ...]
+    strides: tuple[int, ...]
+    dtype: dace.typeclass
+    location: dace.StorageType  # We only need CPU and GPU.
+    _val: Any | None  # May not be allocated.
+
+    def __init__(self, *args: Any, **kwargs: Any) -> None:
+        """To construct an `_ArgInfo` instance use `from_val()`."""
+        raise NotImplementedError("Use '_ArgInfo.from_value()' to construct an instance.")
+
+    def __hash__(self) -> int:
+        return hash((self.shape, self.strides, self.dtype, self.location))
+
+    def __eq__(self, other: Any) -> bool:
+        if not isinstance(other, _ArgInfo):
+            return False
+        return (self.shape, self.strides, self.dtype, self.location) == (
+            (other.shape, other.strides, other.dtype, other.location)
+        )
+
+    def _get_val_once(self) -> Any:
+        """Returns the wrapped object.
+
+        This function only works for a single time.
+        Calling it will null the reference of `self`.
+        """
+        if self._val is None:
+            raise RuntimeError("Value was already consumed.")
+        val = self._val
+        self._val = None
+        return val
+
+    @classmethod
+    def from_value(cls, val: Any) -> _ArgInfo:
+        """Constructs an `_ArgInfo` instance from `val`."""
+        arginfo: _ArgInfo = cls.__new__(cls)
+        raise NotImplementedError("'_ArgInfo.from_value()' is not implemented.")

From 78e55fb5ee8d272df7260f88018b92298538b869 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Philip=20M=C3=BCller?=
 <147368808+philip-paul-mueller@users.noreply.github.com>
Date: Mon, 29 Apr 2024 11:28:45 +0200
Subject: [PATCH 057/458] Update src/jace/__init__.py
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Co-authored-by: Enrique González Paredes <enriqueg@cscs.ch>
---
 src/jace/__init__.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 5e0595b..9b44225 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Python library for translating Jax programs into SDFG."""
+"""JaCe - JAX Just-In-Time compilation using DaCe."""
 
 from __future__ import annotations
 

From 6c0e2c1e7022e4df1bd35bfc6b569607e80d8b21 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 29 Apr 2024 08:53:37 +0200
Subject: [PATCH 058/458] First batch of first review.

---
 .../jace_subtranslator_interface.py           | 57 +++++--------------
 .../translator/jaxpr_translator_driver.py     |  2 +-
 .../sub_translators/alu_translator.py         |  6 +-
 3 files changed, 19 insertions(+), 46 deletions(-)

diff --git a/src/jace/translator/jace_subtranslator_interface.py b/src/jace/translator/jace_subtranslator_interface.py
index 5f58375..6cf02d4 100644
--- a/src/jace/translator/jace_subtranslator_interface.py
+++ b/src/jace/translator/jace_subtranslator_interface.py
@@ -7,7 +7,7 @@
 
 from __future__ import annotations
 
-from collections.abc import Collection, Sequence
+from collections.abc import Sequence
 from typing import TYPE_CHECKING, Any
 
 import dace
@@ -19,26 +19,25 @@
 
 
 class JaCeSubTranslatorInterface:
-    """Interface for all Jax primitive/intrinsic subtranslators.
+    """Interface for all Jax primitive subtranslators.
 
-    A translator for a primitive, sometimes also called intrinsic, translates
-    a single equation of a Jaxpr into its SDFG equivalent. A type that
-    implements this interface must fulfil the following properties:
+    A translator for a primitive translates a single equation of a Jaxpr into its SDFG equivalent.
+    A type that implements this interface must fulfil the following properties:
     - It must be stateless.
         It is still possible and explicitly allowed to have an
         immutable configuration state.
     - All subclasses has to accept `**kwargs` arguments and must
         forward all unconsumed arguments to the base.
 
-    Subtranslators are rather simple objects that only have to perform
-    the translation. The translation process itself is managed by a driver
-    object, which owns and manage the subtranslators.
+    Subtranslators are simple, but highly specialized objects that are only able to perform the translation of a single primitive.
+    The overall translation process itself is managed by a driver object, which also owns and manage the subtranslators.
     In the end this implements the delegation pattern.
 
-    A subtranslator uses its `get_handled_primitives()` function to indicate
-    for which Jax primitives it want to register. It is important that there
-    is no limits on the number of primitives a subtranslator can register itself.
-    However, only one subtranslator can be registered for a primitive.
+    After instantiation a driver calls the subtranslator's `get_handled_primitive()` method.
+    This function returns the name of the Jax primitive the subtranslator is able to handle.
+    In case a subtranslator is able to handle multiple primitives, it should return a list with their names.
+    While there is no limit to the numbers of primitive a subtranslator can register itself for,
+    only one subtranslator can be register for any primitive.
     """
 
     __slots__ = ()
@@ -53,17 +52,13 @@ def __init__(
         It is required that subclasses calls this method during initialization.
         """
 
-    def get_handled_primitives(self) -> Collection[str] | str:
-        """Returns the names of all Jax primitives that `self` is able to handle.
+    def get_handled_primitive(self) -> str | Sequence[str]:
+        """Returns the names of the Jax primitive that `self` is able to handle.
 
-        There is no limit on the number of primitives for which a subtranslator
-        can register.
-
-        Notes:
-            In case a string is returned it is interpreted as 1 element collection.
+        In case `self` can handle multiple primitives, it should return a list with these names.
         """
         raise NotImplementedError(
-            "Class '{type(self).__name__}' does not implement 'get_handled_primitives()'."
+            "Class '{type(self).__name__}' does not implement 'get_handled_primitive()'."
         )
 
     def translate_jaxeqn(
@@ -124,25 +119,3 @@ def translate_jaxeqn(
         raise NotImplementedError(
             "Class '{type(self).__name__}' does not implement 'translate_jaxeqn()'."
         )
-
-    def __eq__(
-        self,
-        other: Any,
-    ) -> bool:
-        """Tests if two subtranslators are equal.
-
-        The default implementation checks if `self` and `other` have the same
-        type.
-        """
-        if not isinstance(other, JaCeSubTranslatorInterface):
-            return NotImplemented
-        return type(self) == type(other)
-
-    def __hash__(self) -> int:
-        """Computes the hash of the subtranslator.
-
-        The default implementation return a hash that is based on the class.
-        Thus all instances of a particular subtranslator will have the same
-        hash value.
-        """
-        return id(self.__class__)
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index f9eba29..0187360 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -937,7 +937,7 @@ def _init_sub_translators(
         for sub_translator_cls in jtsubt._get_subtranslators_cls():
             sub_translator: jtrans.JaCeSubTranslatorInterface = sub_translator_cls(**subtrans_args)
             handled_primitives: Iterable[str] = jutil.ensure_iterability(
-                sub_translator.get_handled_primitives()
+                sub_translator.get_handled_primitive()
             )
             for handled_primitive in handled_primitives:
                 if handled_primitive in sub_translators:
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index f1c1946..d0df6d4 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -9,7 +9,7 @@
 
 from __future__ import annotations
 
-from collections.abc import Collection, Sequence
+from collections.abc import Sequence
 from typing import Any, Final, cast
 
 import dace
@@ -75,9 +75,9 @@ def __init__(self, **kwargs: Any) -> None:
         super().__init__(**kwargs)
 
     @override
-    def get_handled_primitives(self) -> Collection[str] | str:
+    def get_handled_primitive(self) -> Sequence[str]:
         """Returns the list of all known primitives."""
-        return set(self._unary_ops.keys()).union(self._binary_ops.keys())
+        return list(self._unary_ops.keys()) + list(self._binary_ops.keys())
 
     @override
     def translate_jaxeqn(

From 789df78662b28df6b3d7525688eadbc758a77882 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 29 Apr 2024 09:10:26 +0200
Subject: [PATCH 059/458] First round: Relocated the util package.

---
 src/jace/translator/__init__.py               |  2 ++
 .../{util => }/jace_translation_memento.py    |  0
 .../translator/jaxpr_translator_driver.py     | 14 +++++------
 .../sub_translators/alu_translator.py         | 13 +++++-----
 src/jace/translator/util/__init__.py          | 25 -------------------
 src/jace/translator/util/util.py              | 21 ----------------
 src/jace/util/__init__.py                     | 10 ++++++--
 src/jace/{translator => }/util/debug.py       |  4 +--
 .../{translator => }/util/revision_counter.py |  0
 src/jace/util/util.py                         | 10 +++++++-
 tests/test_sub_translators_alu.py             |  4 +--
 11 files changed, 36 insertions(+), 67 deletions(-)
 rename src/jace/translator/{util => }/jace_translation_memento.py (100%)
 delete mode 100644 src/jace/translator/util/__init__.py
 delete mode 100644 src/jace/translator/util/util.py
 rename src/jace/{translator => }/util/debug.py (96%)
 rename src/jace/{translator => }/util/revision_counter.py (100%)

diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 71b567b..78c9095 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -10,10 +10,12 @@
 from __future__ import annotations
 
 from .jace_subtranslator_interface import JaCeSubTranslatorInterface
+from .jace_translation_memento import JaCeTranslationMemento
 from .jaxpr_translator_driver import JaxprTranslationDriver
 
 
 __all__ = [
     "JaCeSubTranslatorInterface",
     "JaxprTranslationDriver",
+    "JaCeTranslationMemento",
 ]
diff --git a/src/jace/translator/util/jace_translation_memento.py b/src/jace/translator/jace_translation_memento.py
similarity index 100%
rename from src/jace/translator/util/jace_translation_memento.py
rename to src/jace/translator/jace_translation_memento.py
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 0187360..0c3e5c1 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -17,7 +17,7 @@
 from jax import core as jcore
 
 from jace import translator as jtrans, util as jutil
-from jace.translator import sub_translators as jtsubt, util as jtrutil
+from jace.translator import sub_translators as jtsubt
 
 
 class JaxprTranslationDriver:
@@ -137,7 +137,7 @@ def __init__(
         # This is the manager for the revision counter.
         #  It is shared among all children.
         #  Might be overwritten if we are in the context of 'fork()'.
-        self._rev_manager: jtrutil.RevisionCounterManager = jtrutil.RevisionCounterManager()
+        self._rev_manager: jutil.RevisionCounterManager = jutil.RevisionCounterManager()
 
         # This is the revision of self.
         #  Unlike the manager it is not shared and private.
@@ -158,7 +158,7 @@ def translate_jaxpr(
         reserved_names: str | Collection[str] | None = None,
         allow_empty_jaxpr: bool = False,
         **kwargs: Any,
-    ) -> jtrutil.JaCeTranslationMemento:
+    ) -> jtrans.JaCeTranslationMemento:
         """Perform the translation of a Jaxpr description into a SDFG.
 
         Returns:
@@ -208,7 +208,7 @@ def translate_jaxpr(
         self._create_constants(
             jaxpr=jaxpr,
         )
-        memento: jtrutil.JaCeTranslationMemento = self._translate_jaxpr_internal(jaxpr)
+        memento: jtrans.JaCeTranslationMemento = self._translate_jaxpr_internal(jaxpr)
 
         # If the translation context is not cleared `self` and `memento` will share the same data.
         #  There is some legitimate use for that.
@@ -1109,7 +1109,7 @@ def _translate_single_eqn(
     def _translate_jaxpr_internal(
         self,
         jaxpr: jcore.ClosedJaxpr,
-    ) -> jtrutil.JaCeTranslationMemento:
+    ) -> jtrans.JaCeTranslationMemento:
         """Performs the actual translation of the Jaxpr into an SDFG.
 
         The function assumes that the context is already allocated and the initial
@@ -1151,7 +1151,7 @@ def _translate_jaxpr_internal(
 
         return self._export_memento()
 
-    def _export_memento(self) -> jtrutil.JaCeTranslationMemento:
+    def _export_memento(self) -> jtrans.JaCeTranslationMemento:
         """Encapsulate the translation context of `self` into a memento.
 
         This function will not deallocate the internal context of `self`.
@@ -1161,7 +1161,7 @@ def _export_memento(self) -> jtrutil.JaCeTranslationMemento:
         assert all((isinstance(x, str) and (len(x) > 0)) for x in self._sdfg_in_names)
         assert all((isinstance(x, str) and (len(x) > 0)) for x in self._sdfg_out_names)
 
-        return jtrutil.JaCeTranslationMemento(
+        return jtrans.JaCeTranslationMemento(
             sdfg=self._sdfg,
             start_state=self._init_sdfg_state,
             terminal_state=self._term_sdfg_state,
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index d0df6d4..3dad14a 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -17,8 +17,7 @@
 from jax import core as jcore
 from typing_extensions import override
 
-from jace import translator as jtranslator
-from jace.translator import util as jtutil
+from jace import translator as jtranslator, util as jutil
 
 
 class ALUTranslator(jtranslator.JaCeSubTranslatorInterface):
@@ -198,8 +197,8 @@ def translate_jaxeqn(
         if is_scalar:
             tskl_tasklet = eqn_state.add_tasklet(
                 tskl_name,
-                jtutil.list_to_dict(tskl_inputs).keys(),
-                jtutil.list_to_dict([tskl_output]).keys(),
+                jutil.list_to_dict(tskl_inputs).keys(),
+                jutil.list_to_dict([tskl_output]).keys(),
                 tskl_code,
             )
             for in_var, (in_connector, in_memlet) in zip(in_var_names, tskl_inputs, strict=False):
@@ -222,10 +221,10 @@ def translate_jaxeqn(
         else:
             eqn_state.add_mapped_tasklet(
                 name=tskl_name,
-                map_ranges=jtutil.list_to_dict(tskl_map_ranges),
-                inputs=jtutil.list_to_dict(tskl_inputs),
+                map_ranges=jutil.list_to_dict(tskl_map_ranges),
+                inputs=jutil.list_to_dict(tskl_inputs),
                 code=tskl_code,
-                outputs=jtutil.list_to_dict([tskl_output]),
+                outputs=jutil.list_to_dict([tskl_output]),
                 external_edges=True,
             )
 
diff --git a/src/jace/translator/util/__init__.py b/src/jace/translator/util/__init__.py
deleted file mode 100644
index da9c1d4..0000000
--- a/src/jace/translator/util/__init__.py
+++ /dev/null
@@ -1,25 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Subpackage containing all utilities related to the translators."""
-
-from __future__ import annotations
-
-from .debug import _jace_run, run_memento
-from .jace_translation_memento import JaCeTranslationMemento
-from .revision_counter import RevisionCounterManager
-from .util import list_to_dict
-
-
-# Q: Is there a way to import everything from `.util` and put it into `__all__` without writing it manually?
-__all__ = [
-    "JaCeTranslationMemento",
-    "RevisionCounterManager",
-    "list_to_dict",
-    "run_memento",
-    "_jace_run",
-]
diff --git a/src/jace/translator/util/util.py b/src/jace/translator/util/util.py
deleted file mode 100644
index 484b4ef..0000000
--- a/src/jace/translator/util/util.py
+++ /dev/null
@@ -1,21 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Contains all general helper functions needed inside the translator."""
-
-from __future__ import annotations
-
-from collections.abc import Sequence
-from typing import Any
-
-
-def list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
-    """This method turns a `list` of pairs into a `dict` and applies a `None` filter.
-
-    The function will only include pairs whose key, i.e. first element is not `None`.
-    """
-    return {k: v for k, v in inp if k is not None}
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 0bd9a15..933aee1 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -9,15 +9,21 @@
 
 from __future__ import annotations
 
+from .debug import _jace_run, run_memento
 from .jax import JaCeVar, get_jax_var_dtype, get_jax_var_name, get_jax_var_shape, translate_dtype
-from .util import ensure_iterability
+from .revision_counter import RevisionCounterManager
+from .util import ensure_iterability, list_to_dict
 
 
 __all__ = [
+    "RevisionCounterManager",
+    "JaCeVar",
     "get_jax_var_name",
     "get_jax_var_shape",
     "get_jax_var_dtype",
     "ensure_iterability",
     "translate_dtype",
-    "JaCeVar",
+    "list_to_dict",
+    "run_memento",
+    "_jace_run",
 ]
diff --git a/src/jace/translator/util/debug.py b/src/jace/util/debug.py
similarity index 96%
rename from src/jace/translator/util/debug.py
rename to src/jace/util/debug.py
index 69724c4..92ab0f5 100644
--- a/src/jace/translator/util/debug.py
+++ b/src/jace/util/debug.py
@@ -15,11 +15,11 @@
 import dace
 import jax
 
-from jace.translator import util as jtrutil
+from jace import translator as jtrans
 
 
 def run_memento(
-    memento: jtrutil.JaCeTranslationMemento,
+    memento: jtrans.JaCeTranslationMemento,
     *args: Any,
 ) -> tuple[Any, ...] | Any:
     """Calls the SDFG with the supplied arguments.
diff --git a/src/jace/translator/util/revision_counter.py b/src/jace/util/revision_counter.py
similarity index 100%
rename from src/jace/translator/util/revision_counter.py
rename to src/jace/util/revision_counter.py
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index d728be5..7a71bc2 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -7,7 +7,7 @@
 
 from __future__ import annotations
 
-from collections.abc import Iterable
+from collections.abc import Iterable, Sequence
 from typing import Any
 
 
@@ -28,3 +28,11 @@ def ensure_iterability(
     elif isinstance(x, Iterable):
         pass
     return x
+
+
+def list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
+    """This method turns a `list` of pairs into a `dict` and applies a `None` filter.
+
+    The function will only include pairs whose key, i.e. first element is not `None`.
+    """
+    return {k: v for k, v in inp if k is not None}
diff --git a/tests/test_sub_translators_alu.py b/tests/test_sub_translators_alu.py
index 006d4b3..c7910f7 100644
--- a/tests/test_sub_translators_alu.py
+++ b/tests/test_sub_translators_alu.py
@@ -12,7 +12,7 @@
 import jax
 import numpy as np
 
-from jace.translator.util import debug as jtrudebug
+from jace import util as jutil
 
 
 def test_add():
@@ -26,7 +26,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     B = np.full((4, 3), 10, dtype=np.float64)
 
     ref = testee(A, B)
-    res = jtrudebug._jace_run(testee, A, B)
+    res = jutil._jace_run(testee, A, B)
 
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
 

From c8a9b62cd91cb89c8c43e9994a1e1ec735ef652d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 29 Apr 2024 09:34:01 +0200
Subject: [PATCH 060/458] First round: Updated the Memento.

---
 src/jace/translator/jace_translation_memento.py | 15 ---------------
 1 file changed, 15 deletions(-)

diff --git a/src/jace/translator/jace_translation_memento.py b/src/jace/translator/jace_translation_memento.py
index d551082..a4a34e7 100644
--- a/src/jace/translator/jace_translation_memento.py
+++ b/src/jace/translator/jace_translation_memento.py
@@ -59,18 +59,3 @@ def __getitem__(self, idx: str) -> Any:
         if not hasattr(self, idx):
             raise KeyError(f"The key '{idx}' is not known.")
         return getattr(self, idx)
-
-    def __hash__(self) -> int:
-        """Computes the hash of the underlying SDFG object."""
-        return hash(self.sdfg)
-
-    def __eq__(self, other: Any) -> bool:
-        """Compares the underlying SDFG object with 'rhs'."""
-        if isinstance(other, JaCeTranslationMemento):
-            return bool(self.sdfg == other.sdfg)
-        if hasattr(other, "__sdfg__"):
-            other = other.__sdfg__()
-        elif not isinstance(other, dace.SDFG):
-            return NotImplemented
-        x: bool = self.sdfg.__eq__(other)
-        return x

From 24f6a3dac9281013d18bae51eb079ac5a3a8d5ec Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 29 Apr 2024 09:54:24 +0200
Subject: [PATCH 061/458] First round: Removed the revision counter manager and
 replaced it with `itertools.count()`.

---
 .../translator/jaxpr_translator_driver.py     | 27 ++++++++++++-------
 src/jace/util/__init__.py                     |  2 --
 tests/test_jaxpr_translator_driver.py         |  1 -
 3 files changed, 17 insertions(+), 13 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 0c3e5c1..33b58a1 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -7,6 +7,7 @@
 
 from __future__ import annotations
 
+import itertools
 import re
 from collections.abc import Collection, Iterable, Mapping, Sequence
 from typing import Any, Final, cast, overload
@@ -134,21 +135,25 @@ def __init__(
         self._sdfg_in_names: Sequence[str] = None  # type: ignore[assignment]
         self._sdfg_out_names: Sequence[str] = None  # type: ignore[assignment]
 
-        # This is the manager for the revision counter.
-        #  It is shared among all children.
-        #  Might be overwritten if we are in the context of 'fork()'.
-        self._rev_manager: jutil.RevisionCounterManager = jutil.RevisionCounterManager()
+        # Shared revision counter manager.
+        #  This object produces the revision indexes we need for the children.
+        #  It is only allocated for head translators and shared between
+        self._rev_manager: itertools.count[int] = None  # type: ignore[assignment]
 
         # This is the revision of self.
         #  Unlike the manager it is not shared and private.
-        #  Might be overwritten in the context of a fork.
-        self._rev_idx: int = self._rev_manager.assign_revision()
-        assert self.is_head_translator()
+        self._rev_idx: int = None  # type: ignore[assignment]
 
         # If requested we will now allocate some internal state
         if allocate_shared_parts:
+            # Creating of the subtranslators.
             self._init_sub_translators(kwargs)
 
+            # Creating of the revision indexes and manager.
+            self._rev_manager = itertools.count(0, 1)
+            self._rev_idx = next(self._rev_manager)
+            assert self.is_head_translator()
+
     def translate_jaxpr(
         self,
         jaxpr: jcore.ClosedJaxpr,
@@ -249,7 +254,7 @@ def fork(self) -> JaxprTranslationDriver:
             setattr(dolly, slot_name, getattr(self, slot_name))
 
         # Handle the special members and initialize them.
-        dolly._rev_idx = dolly._rev_manager.assign_revision()
+        dolly._rev_idx = next(self._rev_manager)
         assert not dolly.is_head_translator()
 
         # We will now copy the reserved name list
@@ -429,7 +434,9 @@ def is_head_translator(self) -> bool:
         A head translator is a translator/driver that was created explicitly,
         i.e. not by `self.fork()`.
         """
-        return self._rev_manager.is_root_revision(self._rev_idx)
+        assert self._rev_manager is not None
+        assert self._rev_idx is not None
+        return self._rev_idx == 0
 
     def same_family(
         self,
@@ -974,7 +981,7 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
             #  Since this function is only called at the very end, we know that the translation
             #  process as a whole has finished. We reset the state that the numbers are small
             #  again when we start anew.
-            self._rev_manager._reset_state()
+            self._rev_manager = itertools.count(0, 1)
 
             # Freeing the reserved names only for heads make it more safe in case a child
             #  translator is reused.c On the other hand reusing a child translator is
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 933aee1..84eb0f2 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -11,12 +11,10 @@
 
 from .debug import _jace_run, run_memento
 from .jax import JaCeVar, get_jax_var_dtype, get_jax_var_name, get_jax_var_shape, translate_dtype
-from .revision_counter import RevisionCounterManager
 from .util import ensure_iterability, list_to_dict
 
 
 __all__ = [
-    "RevisionCounterManager",
     "JaCeVar",
     "get_jax_var_name",
     "get_jax_var_shape",
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index ad70e05..d826706 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -107,7 +107,6 @@ def test_driver_fork() -> None:
     driver._clear_translation_ctx()
     assert not driver.is_allocated()
     assert driver.is_head_translator()
-    assert driver._rev_manager._next_revision == dolly_rev
     assert driver._reserved_names is None
 
 
From 1056187d8ca0f4988e3b92443d0399f600016478 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 29 Apr 2024 10:01:22 +0200
Subject: [PATCH 062/458] Moved the `list_to_dict()` function to the ALU
 Translator.

As Enrique pointed out it has a bad name for beeing so prominently.
It is also not used in that many translators in the prototype, less thabn I remember.
---
 .../sub_translators/alu_translator.py         | 22 +++++++++++++------
 src/jace/util/__init__.py                     |  3 +--
 src/jace/util/util.py                         | 10 +--------
 3 files changed, 17 insertions(+), 18 deletions(-)

diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index 3dad14a..e411f28 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -17,7 +17,7 @@
 from jax import core as jcore
 from typing_extensions import override
 
-from jace import translator as jtranslator, util as jutil
+from jace import translator as jtranslator
 
 
 class ALUTranslator(jtranslator.JaCeSubTranslatorInterface):
@@ -163,7 +163,7 @@ def translate_jaxeqn(
         tskl_map_ranges: list[tuple[str, str]] = [
             (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
         ]
-        tskl_output: tuple[str, dace.Memlet] = None
+        tskl_output: tuple[str, dace.Memlet] = None  # type: ignore[assignment]
         tskl_inputs: list[tuple[str, dace.Memlet] | tuple[None, None]] = []
 
         # Generate the Memlets for the input.
@@ -197,8 +197,8 @@ def translate_jaxeqn(
         if is_scalar:
             tskl_tasklet = eqn_state.add_tasklet(
                 tskl_name,
-                jutil.list_to_dict(tskl_inputs).keys(),
-                jutil.list_to_dict([tskl_output]).keys(),
+                _list_to_dict(tskl_inputs).keys(),
+                _list_to_dict([tskl_output]).keys(),
                 tskl_code,
             )
             for in_var, (in_connector, in_memlet) in zip(in_var_names, tskl_inputs, strict=False):
@@ -221,10 +221,10 @@ def translate_jaxeqn(
         else:
             eqn_state.add_mapped_tasklet(
                 name=tskl_name,
-                map_ranges=jutil.list_to_dict(tskl_map_ranges),
-                inputs=jutil.list_to_dict(tskl_inputs),
+                map_ranges=_list_to_dict(tskl_map_ranges),
+                inputs=_list_to_dict(tskl_inputs),
                 code=tskl_code,
-                outputs=jutil.list_to_dict([tskl_output]),
+                outputs=_list_to_dict([tskl_output]),
                 external_edges=True,
             )
 
@@ -289,3 +289,11 @@ def _writeTaskletCode(
             t_code = t_code.format(**eqn.params)
 
         return t_code
+
+
+def _list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
+    """This method turns a `list` of pairs into a `dict` and applies a `None` filter.
+
+    The function will only include pairs whose key, i.e. first element is not `None`.
+    """
+    return {k: v for k, v in inp if k is not None}
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 84eb0f2..4e1d951 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -11,7 +11,7 @@
 
 from .debug import _jace_run, run_memento
 from .jax import JaCeVar, get_jax_var_dtype, get_jax_var_name, get_jax_var_shape, translate_dtype
-from .util import ensure_iterability, list_to_dict
+from .util import ensure_iterability
 
 
 __all__ = [
@@ -21,7 +21,6 @@
     "get_jax_var_dtype",
     "ensure_iterability",
     "translate_dtype",
-    "list_to_dict",
     "run_memento",
     "_jace_run",
 ]
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index 7a71bc2..d728be5 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -7,7 +7,7 @@
 
 from __future__ import annotations
 
-from collections.abc import Iterable, Sequence
+from collections.abc import Iterable
 from typing import Any
 
 
@@ -28,11 +28,3 @@ def ensure_iterability(
     elif isinstance(x, Iterable):
         pass
     return x
-
-
-def list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
-    """This method turns a `list` of pairs into a `dict` and applies a `None` filter.
-
-    The function will only include pairs whose key, i.e. first element is not `None`.
-    """
-    return {k: v for k, v in inp if k is not None}

From e0ca8a55d19aa75ced118790ef8540070aaac956 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 29 Apr 2024 10:56:55 +0200
Subject: [PATCH 063/458] First round: Updated the `util.jax` module.

---
 src/jace/util/jax.py | 97 +++++++++++++++++++++++---------------------
 1 file changed, 51 insertions(+), 46 deletions(-)

diff --git a/src/jace/util/jax.py b/src/jace/util/jax.py
index 845ba16..9739db5 100644
--- a/src/jace/util/jax.py
+++ b/src/jace/util/jax.py
@@ -18,10 +18,13 @@
 from typing import Any
 
 import dace
-import jax
 import jax.core as jcore
 
 
+# Used by `get_jax_var_name()` to test if a name for a jax variable is valid.
+_VALID_JAX_NAME_PATTERN: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")
+
+
 @dataclass(init=True, repr=True, eq=True, frozen=True, slots=True)
 class JaCeVar:
     """Substitute class for Jax' `Var` instance.
@@ -46,67 +49,69 @@ def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
     Args:
         jax_var:     The variable to stringify.
     """
-    if isinstance(jax_var, jcore.DropVar):
-        return "_"
-    if isinstance(jax_var, JaCeVar):
-        jax_name = jax_var.name
-    elif isinstance(jax_var, jcore.Atom):
-        jax_name = str(jax_var)  # This only works up to some version
-    elif isinstance(jax_var, str):
-        jax_name = jax_var
-    else:
-        raise TypeError(
-            f"Does not know how to transform '{jax_var}' (type: '{type(jax_var).__name__}') into a string."
-        )
+    match jax_var:
+        case jcore.DropVar():
+            return "_"
+
+        case JaCeVar():
+            jax_name = jax_var.name
+
+        case jcore.Var():
+            # Does only work for jax 0.4.20; will be reworked later.
+            jax_name = str(jax_var)
+
+        case jcore.Literal():
+            raise TypeError("Can not derive a name from a Jax Literal.")
+
+        case str():
+            jax_name = jax_var
+
+        case _:
+            raise TypeError(
+                f"Does not know how to transform '{jax_var}' (type: '{type(jax_var).__name__}') into a string."
+            )
     assert isinstance(jax_name, str)
-    if not re.fullmatch("[a-zA-Z_][a-zA-Z_]*", jax_name):
+
+    if not _VALID_JAX_NAME_PATTERN.fullmatch(jax_name):
         raise ValueError(f"Deduced Jax name '{jax_name}' is invalid.")
     return jax_name
 
 
-def get_jax_var_shape(jax_var: jcore.Atom) -> tuple[int, ...]:
+def get_jax_var_shape(jax_var: jcore.Atom | JaCeVar) -> tuple[int, ...]:
     """Returns the shape of a Jax variable.
 
     Args:
         jax_var:     The variable to process
     """
-    if isinstance(jax_var, jcore.Atom):
-        return jax_var.aval.shape
-    if isinstance(jax_var, JaCeVar):
-        assert isinstance(jax_var.shape, tuple)
-        return jax_var.shape
-    raise TypeError(f"'get_jax_var_shape()` is not implemented for '{type(jax_var)}'.")
+    match jax_var:
+        case jcore.Var() | jcore.Literal():
+            return jax_var.aval.shape
+
+        case JaCeVar():
+            return jax_var.shape
 
+        case _:
+            raise TypeError(f"'get_jax_var_shape()` is not implemented for '{type(jax_var)}'.")
 
-def get_jax_var_dtype(jax_var: jcore.Atom) -> dace.typeclass:
+
+def get_jax_var_dtype(jax_var: jcore.Atom | JaCeVar) -> dace.typeclass:
     """Returns the DaCe equivalent of `jax_var`s datatype."""
-    if isinstance(jax_var, jcore.Atom):
-        return translate_dtype(jax_var.aval.dtype)
-    if isinstance(jax_var, JaCeVar):
-        return translate_dtype(jax_var.dtype)
-    raise TypeError(f"'get_jax_var_dtype()` is not implemented for '{type(jax_var)}'.")
+    match jax_var:
+        case jcore.Var() | jcore.Literal():
+            return translate_dtype(jax_var.aval.dtype)
+
+        case JaCeVar():
+            return translate_dtype(jax_var.dtype)
+
+        case _:
+            raise TypeError(f"'get_jax_var_dtype()` is not implemented for '{type(jax_var)}'.")
 
 
 def translate_dtype(dtype: Any) -> dace.typeclass:
     """Turns a Jax datatype into a DaCe datatype."""
-
     if isinstance(dtype, dace.typeclass):
         return dtype
-
-    # Make some basic checks if the datatype is okay
-    name_of_dtype = str(dtype)
-    if (not jax.config.read("jax_enable_x64")) and (name_of_dtype == "float64"):
-        raise ValueError("Found a 'float64' type but 'x64' support is disabled.")
-    if name_of_dtype.startswith("complex"):
-        raise NotImplementedError("Support for complecx computation is not implemented yet.")
-
-    # Now extract the datatype from dace, this is extremely ugly.
-    if not hasattr(dace.dtypes, name_of_dtype):
-        raise TypeError(f"Could not find '{name_of_dtype}' ({type(dtype).__name__}) in 'dace'.")
-    dcd_type = getattr(dace.dtypes, name_of_dtype)
-
-    if not isinstance(dcd_type, dace.dtypes.typeclass):
-        raise TypeError(
-            f"'{name_of_dtype}' does not map to a 'dace.typeclass' but to a '{type(dcd_type).__name__}'."
-        )
-    return dcd_type
+    if dtype is None:
+        # Special behaviour of `dtype_to_typeclass()`
+        raise NotImplementedError()
+    return dace.dtype_to_typeclass(dtype)

From ccea3d9003b69206fee10130090c446f2402a33e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 29 Apr 2024 11:07:41 +0200
Subject: [PATCH 064/458] First round: Updated the naming of the subtranslator
 interface to the one Enrique suggested.

I have to say that I like it more than the old one, but I have not changed the terminology yet.
Thus I still use the world subtranslator and I think we should keep it because I still think that it is the best name.

However, I do not like the name because it suggests that it is able to already translate everything.
---
 src/jace/translator/__init__.py                    |  4 ++--
 src/jace/translator/jaxpr_translator_driver.py     | 12 ++++++------
 ...slator_interface.py => primitive_translator.py} |  5 +++--
 src/jace/translator/sub_translators/__init__.py    | 14 +++++++-------
 .../translator/sub_translators/alu_translator.py   |  2 +-
 tests/test_subtranslator_helper.py                 |  4 ++--
 6 files changed, 21 insertions(+), 20 deletions(-)
 rename src/jace/translator/{jace_subtranslator_interface.py => primitive_translator.py} (97%)

diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 78c9095..66bba54 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -9,13 +9,13 @@
 
 from __future__ import annotations
 
-from .jace_subtranslator_interface import JaCeSubTranslatorInterface
+from .primitive_translator import PrimitiveTranslator
 from .jace_translation_memento import JaCeTranslationMemento
 from .jaxpr_translator_driver import JaxprTranslationDriver
 
 
 __all__ = [
-    "JaCeSubTranslatorInterface",
+    "PrimitiveTranslator",
     "JaxprTranslationDriver",
     "JaCeTranslationMemento",
 ]
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 33b58a1..9ef8ef9 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -43,7 +43,7 @@ class JaxprTranslationDriver:
     The actual translation is not handled by the driver instead a so called
     subtranslator object is used. A subtranslator is specialized to translate
     one type of primitive. For more information on the subtranslators see the
-    documentation of `JaCeSubTranslatorInterface`.
+    documentation of `PrimitiveTranslator`.
 
     To support nested Jaxpr expressions the driver provides the possibility to
     clone/fork itself, see `self.fork()` for more. Every clone, i.e. return
@@ -105,7 +105,7 @@ def __init__(
         #  They are partitioned by the names of the primitive they have registered for.
         #  This member is allocated by '_init_sub_translators()' and remains allocated
         #  during the lifetime of the object.
-        self._sub_translators: dict[str, jtrans.JaCeSubTranslatorInterface] = None  # type: ignore[assignment]
+        self._sub_translators: dict[str, jtrans.PrimitiveTranslator] = None  # type: ignore[assignment]
 
         # The SDFG object that we are currently constructing.
         #  Only allocated during an ongoing translation.
@@ -940,9 +940,9 @@ def _init_sub_translators(
 
         subtrans_args = {k: v for k, v in subtrans_args.items() if not k.startswith("_")}  # type: ignore[unreachable]
 
-        sub_translators: dict[str, jtrans.JaCeSubTranslatorInterface] = {}
+        sub_translators: dict[str, jtrans.PrimitiveTranslator] = {}
         for sub_translator_cls in jtsubt._get_subtranslators_cls():
-            sub_translator: jtrans.JaCeSubTranslatorInterface = sub_translator_cls(**subtrans_args)
+            sub_translator: jtrans.PrimitiveTranslator = sub_translator_cls(**subtrans_args)
             handled_primitives: Iterable[str] = jutil.ensure_iterability(
                 sub_translator.get_handled_primitive()
             )
@@ -992,7 +992,7 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
     def _find_sub_translator_for(
         self,
         eqn: jcore.JaxprEqn,
-    ) -> jtrans.JaCeSubTranslatorInterface:
+    ) -> jtrans.PrimitiveTranslator:
         """Returns the appropriate subtranslator for equation `eqn`."""
         assert self._sub_translators is not None
 
@@ -1043,7 +1043,7 @@ def _translate_single_eqn(
         )
 
         # Find the subtranslator
-        subtranslator: jtrans.JaCeSubTranslatorInterface = self._find_sub_translator_for(eqn)
+        subtranslator: jtrans.PrimitiveTranslator = self._find_sub_translator_for(eqn)
 
         # Create the state into which the equation should be translated
         last_term_state: dace.SDFGState = self.get_terminal_sdfg_state()  # noqa: F841 # Will be used later
diff --git a/src/jace/translator/jace_subtranslator_interface.py b/src/jace/translator/primitive_translator.py
similarity index 97%
rename from src/jace/translator/jace_subtranslator_interface.py
rename to src/jace/translator/primitive_translator.py
index 6cf02d4..8472a66 100644
--- a/src/jace/translator/jace_subtranslator_interface.py
+++ b/src/jace/translator/primitive_translator.py
@@ -8,7 +8,7 @@
 from __future__ import annotations
 
 from collections.abc import Sequence
-from typing import TYPE_CHECKING, Any
+from typing import TYPE_CHECKING, Any, Protocol, runtime_checkable
 
 import dace
 from jax import core as jcore
@@ -18,7 +18,8 @@
     from .jaxpr_translator_driver import JaxprTranslationDriver
 
 
-class JaCeSubTranslatorInterface:
+@runtime_checkable
+class PrimitiveTranslator(Protocol):
     """Interface for all Jax primitive subtranslators.
 
     A translator for a primitive translates a single equation of a Jaxpr into its SDFG equivalent.
diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
index 4a02ea2..d5eb640 100644
--- a/src/jace/translator/sub_translators/__init__.py
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -18,18 +18,18 @@
 
 
 # List of all subtranslators that ships with JaCe.
-_BUILTIN_SUBTRANSLATORS: Final[list[type[jtrans.JaCeSubTranslatorInterface]]] = [
+_BUILTIN_SUBTRANSLATORS: Final[list[type[jtrans.PrimitiveTranslator]]] = [
     ALUTranslator,
 ]
 
 # All externally supplied subtranslator implementation.
 #  It is a `dict` to do fast access and remember the order, value is always `None`.
 #  The list is manipulated through `{add,rm}_subtranslator()`.
-_EXTERNAL_SUBTRANSLATORS: dict[type[jtrans.JaCeSubTranslatorInterface], None] = {}
+_EXTERNAL_SUBTRANSLATORS: dict[type[jtrans.PrimitiveTranslator], None] = {}
 
 
 def add_subtranslator(
-    subtrans: type[jtrans.JaCeSubTranslatorInterface],
+    subtrans: type[jtrans.PrimitiveTranslator],
 ) -> bool:
     """Add `subtrans` to the externally defined subtranslators.
 
@@ -41,14 +41,14 @@ def add_subtranslator(
         return False
     if not isclass(subtrans):
         return False
-    if not issubclass(subtrans, jtrans.JaCeSubTranslatorInterface):
+    if not issubclass(subtrans, jtrans.PrimitiveTranslator):
         return False
     _EXTERNAL_SUBTRANSLATORS[subtrans] = None
     return True
 
 
 def rm_subtranslator(
-    subtrans: type[jtrans.JaCeSubTranslatorInterface],
+    subtrans: type[jtrans.PrimitiveTranslator],
     strict: bool = False,
 ) -> bool:
     """Remove `subtrans` as externally defined subtranslators.
@@ -66,7 +66,7 @@ def rm_subtranslator(
 def _get_subtranslators_cls(
     with_external: bool = True,
     builtins: bool = True,
-) -> Sequence[type[jtrans.JaCeSubTranslatorInterface]]:
+) -> Sequence[type[jtrans.PrimitiveTranslator]]:
     """Returns the list of all subtranslator known to JaCe.
 
     Args:
@@ -77,7 +77,7 @@ def _get_subtranslators_cls(
         If the externally defined subtranslators are requested they will be
             first and ordered as FILO order.
     """
-    ret: list[type[jtrans.JaCeSubTranslatorInterface]] = []
+    ret: list[type[jtrans.PrimitiveTranslator]] = []
     if with_external:
         # Guarantees that we get them in FIFO order.
         ret.extend(reversed(_EXTERNAL_SUBTRANSLATORS.keys()))
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index e411f28..6313f68 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -20,7 +20,7 @@
 from jace import translator as jtranslator
 
 
-class ALUTranslator(jtranslator.JaCeSubTranslatorInterface):
+class ALUTranslator(jtranslator.PrimitiveTranslator):
     """This translator handles all arithmetic and logical operations."""
 
     __slots__ = ()
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 3af1038..92b0669 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -25,11 +25,11 @@ def test_subtranslatior_managing():
         rm_subtranslator,
     )
 
-    class ValidSubTrans(jtrans.JaCeSubTranslatorInterface):
+    class ValidSubTrans(jtrans.PrimitiveTranslator):
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
 
-    class ValidSubTrans2(jtrans.JaCeSubTranslatorInterface):
+    class ValidSubTrans2(jtrans.PrimitiveTranslator):
         def __init__(self, *args, **kwargs):
             super().__init__(*args, **kwargs)
 

From 7f47ebcde0559fcf3243a9b7f3b4c2bf6fb3ab81 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 29 Apr 2024 11:38:01 +0200
Subject: [PATCH 065/458] Small modification.

---
 src/jace/util/jax_helper.py | 15 ++++++++-------
 1 file changed, 8 insertions(+), 7 deletions(-)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 56c31c8..52a5e17 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -16,7 +16,6 @@
 from __future__ import annotations
 
 import re
-from collections.abc import Sequence
 from dataclasses import dataclass
 from typing import Any
 
@@ -144,13 +143,15 @@ def is_jaxified(obj: Any) -> bool:
     from jax._src import pjit as jaxpjit
 
     # These are all types we consider as jaxify
-    jaxify_types: Sequence[type] = (
-        jcore.Primitive,
-        # jstage.Wrapped, # Not runtime chakable
-        jaxpjit.JitWrapped,
-        jaxlib.xla_extension.PjitFunction,
+    return isinstance(
+        obj,
+        (
+            jcore.Primitive,
+            # jstage.Wrapped, # Not runtime chakable
+            jaxpjit.JitWrapped,
+            jaxlib.xla_extension.PjitFunction,
+        ),
     )
-    return isinstance(obj, jaxify_types)
 
 
 def translate_dtype(dtype: Any) -> dace.typeclass:

From 960482b5d1aa9810d5d40dfce510991810ee65f1 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 29 Apr 2024 12:49:05 +0200
Subject: [PATCH 066/458] This should take care of all import loops.

---
 src/jace/jax/api_helper.py                           | 12 +++++-------
 src/jace/translator/jaxpr_translator_driver.py       |  6 +++---
 src/jace/translator/sub_translators/__init__.py      | 10 +++++++---
 .../translator/sub_translators/alu_translator.py     |  4 ++++
 src/jace/util/debug.py                               |  6 ++++--
 5 files changed, 23 insertions(+), 15 deletions(-)

diff --git a/src/jace/jax/api_helper.py b/src/jace/jax/api_helper.py
index 526b7f3..28d3485 100644
--- a/src/jace/jax/api_helper.py
+++ b/src/jace/jax/api_helper.py
@@ -15,8 +15,7 @@
 import dace
 import jax
 
-from jace import util as jutil
-from jace.translator import util as jtrutil
+from jace import translator as jtrans, util as jutil
 
 
 class JitWrapped:
@@ -80,16 +79,15 @@ def _call_sdfg(
         Notes:
             Currently no caching of the compiled object is done.
         """
-        from jace.translator.util import debug as jtrudebug
 
-        memento: jtrutil.JaCeTranslationMemento = self._get_memento(*args, **kwargs)
-        return jtrudebug.run_memento(memento, *args)
+        memento: jtrans.JaCeTranslationMemento = self._get_memento(*args, **kwargs)
+        return jutil.run_memento(memento, *args)
 
     def _get_memento(
         self,
         *args: Any,
         **kwargs: Any,
-    ) -> jtrutil.JaCeTranslationMemento:
+    ) -> jtrans.JaCeTranslationMemento:
         """This function returns the Memento.
 
         The function will transform its arguments into `_ArgInfo` versions.
@@ -111,7 +109,7 @@ def _get_memento_cached(
         self,
         *args: _ArgInfo,
         **kwargs: Any,
-    ) -> jtrutil.JaCeTranslationMemento:
+    ) -> jtrans.JaCeTranslationMemento:
         """Generates the SDFG from
 
         Todo:
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 9ef8ef9..44a0e7d 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -18,7 +18,6 @@
 from jax import core as jcore
 
 from jace import translator as jtrans, util as jutil
-from jace.translator import sub_translators as jtsubt
 
 
 class JaxprTranslationDriver:
@@ -936,12 +935,13 @@ def _init_sub_translators(
         The function forwards `kwargs` to the constructor of the subtranslators.
         However, it will remove all arguments starting with an underscore.
         """
+        from jace.translator.sub_translators import _get_subtranslators_cls  # Avoid import cycle
+
         assert self._sub_translators is None
 
         subtrans_args = {k: v for k, v in subtrans_args.items() if not k.startswith("_")}  # type: ignore[unreachable]
-
         sub_translators: dict[str, jtrans.PrimitiveTranslator] = {}
-        for sub_translator_cls in jtsubt._get_subtranslators_cls():
+        for sub_translator_cls in _get_subtranslators_cls():
             sub_translator: jtrans.PrimitiveTranslator = sub_translator_cls(**subtrans_args)
             handled_primitives: Iterable[str] = jutil.ensure_iterability(
                 sub_translator.get_handled_primitive()
diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
index d5eb640..5812dbb 100644
--- a/src/jace/translator/sub_translators/__init__.py
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -10,9 +10,11 @@
 from __future__ import annotations
 
 from collections.abc import Sequence
-from typing import Final
+from typing import TYPE_CHECKING, Final
 
-from jace import translator as jtrans
+
+if TYPE_CHECKING:
+    from jace import translator as jtrans
 
 from .alu_translator import ALUTranslator
 
@@ -37,11 +39,13 @@ def add_subtranslator(
     """
     from inspect import isclass
 
+    from jace.translator import PrimitiveTranslator  # Import cycle
+
     if subtrans in _EXTERNAL_SUBTRANSLATORS:
         return False
     if not isclass(subtrans):
         return False
-    if not issubclass(subtrans, jtrans.PrimitiveTranslator):
+    if not issubclass(subtrans, PrimitiveTranslator):
         return False
     _EXTERNAL_SUBTRANSLATORS[subtrans] = None
     return True
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index 22b6d8d..21aa1ba 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -20,7 +20,11 @@
 from jace import translator as jtranslator
 
 
+# from ..primitive_translator import PrimitiveTranslator
+
+
 class ALUTranslator(jtranslator.PrimitiveTranslator):
+    # class ALUTranslator(PrimitiveTranslator):
     """This translator handles all arithmetic and logical operations."""
 
     __slots__ = ()
diff --git a/src/jace/util/debug.py b/src/jace/util/debug.py
index e6e79db..e50185f 100644
--- a/src/jace/util/debug.py
+++ b/src/jace/util/debug.py
@@ -10,12 +10,14 @@
 from __future__ import annotations
 
 from collections.abc import Callable
-from typing import Any
+from typing import TYPE_CHECKING, Any
 
 import dace
 import jax
 
-from jace import translator as jtrans
+
+if TYPE_CHECKING:
+    from jace import translator as jtrans
 
 
 def run_memento(

From 19974a3b11326630721f0186972950677a2586a0 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 29 Apr 2024 13:10:30 +0200
Subject: [PATCH 067/458] Fixed some error in the conversion of the dtype.

---
 src/jace/util/jax_helper.py | 17 ++++++++++++++++-
 1 file changed, 16 insertions(+), 1 deletion(-)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 52a5e17..08f73cc 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -21,6 +21,7 @@
 
 import dace
 import jax.core as jcore
+import numpy as np
 
 
 # Used by `get_jax_var_name()` to test if a name for a jax variable is valid.
@@ -161,4 +162,18 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
     if dtype is None:
         # Special behaviour of `dtype_to_typeclass()`
         raise NotImplementedError()
-    return dace.dtype_to_typeclass(dtype)
+
+    # For reasons unknown to me we have to do the dtype conversion this way.
+    #  It is not possible to simply call `dace.typeclass(dtype)` or pass it to
+    #  `dace.dtype_to_typeclass()`, it will generate an error.
+    #  We keep the `dtype_to_typeclass()` function call, in order to handle
+    #  NumPy types as DaCe intended them to be handled.
+    try:
+        return dace.dtype_to_typeclass(dtype)
+    except KeyError:
+        dtype_name = str(dtype)
+        if hasattr(dace.dtypes, dtype_name):
+            return getattr(dace.dtypes, dtype_name)
+        if hasattr(np, dtype_name):
+            dtype = getattr(np, dtype)
+            return dace.dtype_to_typeclass(dtype)

From 82b5e56e6df9bf99dae4c6fb95501bcc9a8542a4 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 29 Apr 2024 13:12:45 +0200
Subject: [PATCH 068/458] Added a proper variable naming for Jax variables.

This is not the final one, however, it allows the code to run.
---
 src/jace/util/jax.py | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/src/jace/util/jax.py b/src/jace/util/jax.py
index 9739db5..3ee2cb9 100644
--- a/src/jace/util/jax.py
+++ b/src/jace/util/jax.py
@@ -57,8 +57,11 @@ def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
             jax_name = jax_var.name
 
         case jcore.Var():
-            # Does only work for jax 0.4.20; will be reworked later.
-            jax_name = str(jax_var)
+            # This stopped working after version 0.20.4, because of some changes in Jax
+            #  See `https://github.com/google/jax/pull/10573` for more information.
+            #  The following implementation will generate stable names, but decouples
+            #  them from pretty printed Jaxpr, we maybe need a pretty print context somewhere.
+            jax_name = f"jax{jax_var.count}{jax_var.suffix}"
 
         case jcore.Literal():
             raise TypeError("Can not derive a name from a Jax Literal.")

From 2080ef5a6aaa2161b071ad8bf4721879f797c628 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 29 Apr 2024 13:14:00 +0200
Subject: [PATCH 069/458] Updated the data type conversion.

For reasons I do not understand we have to do the variable conversion this way.
All other ways I tried/were suggested fails.
---
 src/jace/util/jax.py | 17 ++++++++++++++++-
 1 file changed, 16 insertions(+), 1 deletion(-)

diff --git a/src/jace/util/jax.py b/src/jace/util/jax.py
index 3ee2cb9..1d0f3ea 100644
--- a/src/jace/util/jax.py
+++ b/src/jace/util/jax.py
@@ -19,6 +19,7 @@
 
 import dace
 import jax.core as jcore
+import numpy as np
 
 
 # Used by `get_jax_var_name()` to test if a name for a jax variable is valid.
@@ -117,4 +118,18 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
     if dtype is None:
         # Special behaviour of `dtype_to_typeclass()`
         raise NotImplementedError()
-    return dace.dtype_to_typeclass(dtype)
+
+    # For reasons unknown to me we have to do the dtype conversion this way.
+    #  It is not possible to simply call `dace.typeclass(dtype)` or pass it to
+    #  `dace.dtype_to_typeclass()`, it will generate an error.
+    #  We keep the `dtype_to_typeclass()` function call, in order to handle
+    #  NumPy types as DaCe intended them to be handled.
+    try:
+        return dace.dtype_to_typeclass(dtype)
+    except KeyError:
+        dtype_name = str(dtype)
+        if hasattr(dace.dtypes, dtype_name):
+            return getattr(dace.dtypes, dtype_name)
+        if hasattr(np, dtype_name):
+            dtype = getattr(np, dtype)
+            return dace.dtype_to_typeclass(dtype)

From 04de0869bf57d79c244af2734dff887cdc57be6b Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 29 Apr 2024 13:26:12 +0200
Subject: [PATCH 070/458] The constants are now created before the initial
 arguments.

This is consistant with how they are processed in Jax.
If you look at a pretty printed Jaxpr you see that constants are shown first.
---
 src/jace/translator/jaxpr_translator_driver.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 44a0e7d..51805ed 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -205,12 +205,12 @@ def translate_jaxpr(
             name=name,
             reserved_names=reserved_names,
         )
-        self._create_initial_input(
+        self._create_constants(
             jaxpr=jaxpr,
-            inp_scalar_as_array=inp_scalar_as_array,
         )
-        self._create_constants(
+        self._create_initial_input(
             jaxpr=jaxpr,
+            inp_scalar_as_array=inp_scalar_as_array,
         )
         memento: jtrans.JaCeTranslationMemento = self._translate_jaxpr_internal(jaxpr)
 

From b05d1d4b8bee767286626c6cc312d511c0d589b5 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 29 Apr 2024 16:13:58 +0200
Subject: [PATCH 071/458] WIP: Some modification to the whole thing.

I now did some stuff on the variable naming, that it more aligns with what Jax produces.
Probably the wrong choice, working on the jiting was probably the better call.
---
 .../translator/jaxpr_translator_driver.py     | 115 ++++++++++++------
 src/jace/util/__init__.py                     |   4 +
 src/jace/util/jax_helper.py                   |  86 ++++++++++++-
 3 files changed, 159 insertions(+), 46 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 51805ed..0ec054d 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -118,9 +118,11 @@ def __init__(
         #  Only allocated during an ongoing translation.
         self._init_sdfg_state: dace.SDFGState = None
 
-        # This is the mapping, that maps the Jax name to the name that is used inside the SDFG.
+        # Maps a Jax variable to the name of its SDFG equivalent.
+        #  As an extension it is also able to map JaCe Variables.
+        #  In case the key (Jax Variable) is a Literal, the mapped value is None.
         #  Only allocated during an ongoing translation.
-        self._jax_name_map: dict[str, str] = None  # type: ignore[assignment]
+        self._jax_name_map: dict[jcore.Var | jutil.JaCeVar, str | None] = None  # type: ignore[assignment]
 
         # These names can not be used for the automatic naming of Jax variables.
         #  They differ from the forbidden names, that they denote valid SDFG names.
@@ -340,15 +342,14 @@ def get_array(
         assert self._sdfg is not None
 
         if isinstance(name, str):
-            pass
-        elif isinstance(name, (jcore.Atom, jutil.JaCeVar)):
-            name = self.map_jax_var_to_sdfg(name)
+            sdfg_name: str = name
+        elif isinstance(name, (jcore.Var, jutil.JaCeVar)):
+            sdfg_name = self.map_jax_var_to_sdfg(name)
         else:
             raise TypeError(f"Does not know how to handle '{type(name).__name__}'.")
-        if name not in self._sdfg.arrays:
+        if sdfg_name not in self._sdfg.arrays:
             raise KeyError(f"Requested the SDFG array '{name}' but it is not known.")
-
-        return self._sdfg.arrays[name]
+        return self._sdfg.arrays[sdfg_name]
 
     @overload
     def map_jax_var_to_sdfg(
@@ -368,22 +369,37 @@ def map_jax_var_to_sdfg(
         jax_var: str | jcore.Atom | jutil.JaCeVar,
         allow_fail: bool = False,
     ) -> str | None:
-        """Returns the name of the SDFG variable that the Jax variable `jax_var` is referring to.
+        """Get the _name_ of the SDFG variable to which `jax_var` is referring to.
+
+        For convenient this function will consider a string as input to be already an SDFG variable name.
 
         Args:
             jax_var:        The Jax variable to look up.
             allow_fail:     If mapping is not known return `None` instead of raise `KeyError`.
+
+        Notes:
+            Despite the fact that Jax literals can be added to the internal variable mapping 
+                it is an error to pass a Jax `Literal` object as `jax_var`.
         """
         assert self._jax_name_map is not None
         assert isinstance(jax_var, (jcore.Atom, str, jutil.JaCeVar))
 
-        jax_var = jutil.get_jax_var_name(jax_var)
-        if jax_var not in self._jax_name_map:
-            if allow_fail:
-                return None
+        if(isinstance(jax_var, str)):
+            sdfg_name: str = jax_var
+        elif(isinstance(jax_var, jcore.Literal)):
+            raise RuntimeError("There is no SDFG variable for literal '{jax_var}'.")
+        elif(jax_var in self._jax_name_map):
+            sdfg_name: str = self._jax_name_map[jax_var]
+            assert isinstance(sdfg_name, str)
+        elif(allow_fail):
+            return None
+        else:
             KeyError(f"The Jax variable '{jax_var}' was never registered.")
 
-        return self._jax_name_map[jax_var]
+        if(sdfg_name not in self._sdfg.arrays):
+            raise KeyError(f"Jax variable '{jax_var}' was supposed to map to '{sdfg_name}',"
+                            "but no such SDFG variable is known.")
+        return sdfg_name
 
     def get_sdfg(self) -> dace.SDFG:
         """Returns the SDFG that is currently constructed.
@@ -430,8 +446,7 @@ def is_allocated(self) -> bool:
     def is_head_translator(self) -> bool:
         """Tests if `self` is a head translator.
 
-        A head translator is a translator/driver that was created explicitly,
-        i.e. not by `self.fork()`.
+        A head translator is a translator/driver that was created explicitly, i.e. not by `self.fork()`.
         """
         assert self._rev_manager is not None
         assert self._rev_idx is not None
@@ -443,10 +458,8 @@ def same_family(
     ) -> bool:
         """Test if `self` and `other` belongs to the same family of driver/translators.
 
-        A driver is either explicitly created, i.e. head translator, or created
-        by a call to `fork()`. All drivers that descend from the same head translator
-        from a family.
-
+        A driver is either explicitly created, i.e. head translator, or created by a call to `fork()`.
+        All drivers that descend from the same head translator from a family.
         """
         if not isinstance(other, JaxprTranslationDriver):
             return NotImplemented  # type: ignore[unreachable]
@@ -459,16 +472,31 @@ def same_family(
     def get_rev_idx(self) -> int:
         """Returns the revision index of `self`.
 
-        To distinguish members of same family every diver has a unique identifier,
-        known as revision. However, the revision is only unique within a single
-        family and during an ongoing translation.
+        To distinguish members of same family every diver has a unique identifier, known as revision.
+        However, the revision is only unique within a single family and during an ongoing translation.
         """
         return self._rev_idx
 
+    @overload
     def add_jax_name_mapping(
         self,
-        jax_var: str | jcore.Atom | jutil.JaCeVar,
+        jax_var: jcore.Var | jutil.JaCeVar,
         sdfg_name: str,
+    ) -> JaxprTranslationDriver:
+        ...
+
+    @overload
+    def add_jax_name_mapping(
+        self,
+        jax_var: jcore.Literal,
+        sdfg_name: None,
+    ) -> JaxprTranslationDriver:
+        ...
+
+    def add_jax_name_mapping(
+        self,
+        jax_var: jcore.Atom | jutil.JaCeVar,
+        sdfg_name: str | None,
     ) -> JaxprTranslationDriver:
         """Creates a mapping between `jax_var` to `sdfg_name`.
 
@@ -482,12 +510,20 @@ def add_jax_name_mapping(
             sdfg_name:   The name of the corresponding SDFG variable.
         """
         assert self._jax_name_map is not None
-        assert isinstance(jax_var, (jcore.Atom, str, jutil.JaCeVar))
-        assert isinstance(sdfg_name, str)
+        assert isinstance(jax_var, (jcore.Atom, jutil.JaCeVar))
+
+        # Adding literals to the variable map.
+        #  The only reason why we allow to add literals to the map is because
+        #  we need them in the proposing of Jax names, see `_propose_jax_name()`.
+        if(isinstance(jax_var, jcore.Literal)):
+            assert sdfg_name is None
+            self._jax_name_map[jax_var] = None
+            return self
+
+        assert isinstance(sdfg_name, str) and (len(sdfg_name) > 0)
 
-        jax_name = jutil.get_jax_var_name(jax_var)
-        if jax_name in self._jax_name_map:
-            if self._jax_name_map[jax_name] == sdfg_name:  # We consider this as no ops.
+        if jax_var in self._jax_name_map:
+            if self._jax_name_map[jax_var] == sdfg_name:  # noops.
                 return self
             raise ValueError(
                 f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but '{jax_name}'"
@@ -498,7 +534,7 @@ def add_jax_name_mapping(
         if sdfg_name in self._forbidden_names:
             raise NameError(f"Mapping '{jax_name} -> {sdfg_name}': Forbidden name.")
 
-        self._jax_name_map[jax_name] = sdfg_name
+        self._jax_name_map[jax_var] = sdfg_name
         return self
 
     def add_reserved_names(
@@ -596,8 +632,6 @@ def add_array(
                 a new new, thus if the name is unavailable an error is generated.
                 However, this excluds variable names that are known.
             Specifying `alt_name` implies `find_new_name=False`.
-            The effect of specifying `force_jax_name` is as passing
-                `jutil.get_jax_var_name(arg)` as `alt_name`.
             If you need to create a special array, you can use `jace.util.JaCeVar`
                 to create a pseudo Jax variable.
         """
@@ -625,7 +659,7 @@ def add_array(
                 raise ValueError(
                     f"Specified 'force_jax_name', but passed '{name_prefix}' as 'name_prefix'."
                 )
-            alt_name = jutil.get_jax_var_name(arg)
+            alt_name = jutil._propose_jax_name(arg, self._jax_name_map)
         if alt_name is not None:
             assert isinstance(
                 alt_name, str
@@ -669,7 +703,7 @@ def add_array(
         if alt_name is not None:
             prop_name = alt_name  # Just for completion: will be ignored later
         elif isinstance(arg, (jcore.Var, jutil.JaCeVar)):
-            prop_name = jutil.get_jax_var_name(arg)
+            prop_name = jutil._propose_jax_name(arg, self._jax_name_map)
             if prop_name.startswith("__"):
                 raise ValueError(
                     f"You tried to create the variable '{prop_name}' which"
@@ -779,11 +813,10 @@ def create_jax_var_list(
     ) -> list[None | str]:
         """Creates SDFG variables for the listed Jax variables and returns their SDFG names.
 
-        Before the function will create a variable, by using `add_array()` with
-        `update_var_mapping=True`, it will check if the variable is known and if
-        so no new variable is created. Instead the name of the previously created
-        variable is added to the list. In case the Jax Atom denotes a Jax Literal,
-        no variable will be created, instead `None` will be added to the list.
+        Before the function will create a variable, by using `add_array()` with `update_var_mapping=True`,
+        it will check if the variable is known and if so no new variable is created.
+        Instead the name of the previously created variable is added to the list.
+        In case the Jax Atom denotes a Jax Literal, no variable will be created, instead `None` will be added to the list.
 
         Args:
             jax_var_list:       The list of Jax variables that should be transformed to SDFG names.
@@ -793,9 +826,10 @@ def create_jax_var_list(
 
         Notes:
             If `only_creation` is set, then literals will cause an error.
-            It is an error to pass the `update_var_mapping` argument.
+            It is an error to pass the `update_var_mapping` argument to this function.
         """
         assert self._jax_name_map is not None
+        assert "update_var_mapping" in kwargs
         if only_creation and prevent_creation:
             raise ValueError("Specified both 'only_creation' and 'prevent_creation'.")
 
@@ -804,6 +838,7 @@ def create_jax_var_list(
             if isinstance(jax_var, jcore.Literal):
                 if only_creation:
                     raise ValueError(f"Requested 'only_creation', but '{jax_var}' is a 'Literal'.")
+                # SOMEHOW TO UPDATE
                 ret_list.append(None)
             elif isinstance(jax_var, (jcore.Var, jutil.JaCeVar)):
                 mapped_sdfg_name: str | None = self.map_jax_var_to_sdfg(jax_var, allow_fail=True)
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index ad4b268..fcbe0fc 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -18,12 +18,15 @@
     is_jaxified,
     is_tracing_ongoing,
     translate_dtype,
+    is_drop_var,
+    _propose_jax_name,
 )
 from .util import ensure_iterability, is_jaceified
 
 
 __all__ = [
     "ensure_iterability",
+    "is_drop_var",
     "is_tracing_ongoing",
     "is_jaceified",
     "is_jaxified",
@@ -34,4 +37,5 @@
     "translate_dtype",
     "run_memento",
     "_jace_run",
+    "_propose_jax_name",
 ]
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 08f73cc..86c1e16 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -17,7 +17,7 @@
 
 import re
 from dataclasses import dataclass
-from typing import Any
+from typing import Any, Mapping, Optional
 
 import dace
 import jax.core as jcore
@@ -28,29 +28,45 @@
 _VALID_JAX_NAME_PATTERN: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")
 
 
-@dataclass(init=True, repr=True, eq=True, frozen=True, slots=True)
+@dataclass(init=True, repr=True, frozen=True, slots=True)
 class JaCeVar:
     """Substitute class for Jax' `Var` instance.
 
     This class is similar to a `jax.core.Var` class, but much simpler.
     It is only a container for a name, shape and a datatype.
-    All extractor functions `get_jax_var{name, shape, dtype}()` will accept it,
-    as well as multiple functions of the driver.
+    All extractor functions `get_jax_var{name, shape, dtype}()` will accept it, as well as multiple functions of the driver.
 
     Notes:
         Main intention is to test functionality.
+        While for a Jax `Var` object the name is rather irrelevant, `JaCeVar` use their name.
     """
 
     name: str
     shape: tuple[int | dace.symbol | str, ...] | int | dace.symbol | str | tuple[()]
     dtype: dace.typeclass
 
+    def __hash__(self) -> int:
+        return hash(self.name)
+
+    def __eq__(
+        self,
+        other: Any
+    ) -> bool:
+        if(not isinstance(other, JaCeVar)):
+            return NotImplemented
+        return self.name == other.name
+
+
 
 def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
     """Returns the name of the Jax variable as a string.
 
     Args:
         jax_var:     The variable to stringify.
+
+    Notes:
+        Due to some modification in Jax itself, this function is unable to return "proper" variable names.
+        This function is subject for removal.
     """
     match jax_var:
         case jcore.DropVar():
@@ -62,8 +78,8 @@ def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
         case jcore.Var():
             # This stopped working after version 0.20.4, because of some changes in Jax
             #  See `https://github.com/google/jax/pull/10573` for more information.
-            #  The following implementation will generate stable names, but decouples
-            #  them from pretty printed Jaxpr, we maybe need a pretty print context somewhere.
+            #  The following implementation will generate stable names, however, they will be decoupled
+            #  from output of the pretty printed Jaxpr
             jax_name = f"jax{jax_var.count}{jax_var.suffix}"
 
         case jcore.Literal():
@@ -177,3 +193,61 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
         if hasattr(np, dtype_name):
             dtype = getattr(np, dtype)
             return dace.dtype_to_typeclass(dtype)
+
+
+def is_drop_var(jax_var: jcore.Atom | JaCeVar) -> bool:
+    """Tests if `jax_var` is a drop variable.
+    """
+
+    if(isinstance(jax_var, jcore.DropVar)):
+        return True
+    if(isinstance(jax_var, JaCeVar)):
+        return jax_var.name == '_'
+    return False
+
+
+def _propose_jax_name(
+        jax_var: jcore.Atom | JaCeVar,
+        jax_name_map: Optional[Mapping[jcore.Var | JaCeVar, Any]] = None,
+) -> str:
+    """Proposes a variable name for `jax_var`.
+
+    There are two modes for proposing new names.
+    In the first mode, `get_jax_var_name()` is used to derive a name.
+    The second mode, proposes a name based on all names that are already known,
+    this leads to names similar to the ones used by Jax.
+
+    Args:
+        jax_var:        The variable for which a name to propose.
+        jax_name_map:   A mapping of all Jax variables that were already named.
+
+    Notes:
+        The second mode is activated by passing `jax_name_map` as argument.
+        The naming of variables are only consistent with the inner most Jaxpr a variable is defined in.
+        Dropped variables will always be named `'_'`.
+    """
+    if(is_drop_var(jax_var)):
+        return "_"
+    if(isinstance(jax_var, jcore.Literal)):
+        raise TypeError(f"Can not propose a name for literal '{jax_var}'.")
+    if(jax_var in jax_name_map):
+        raise RuntimeError(
+            f"Can not propose a second name for '{jax_var}', it already known as '{jax_name_map[jax_var]}'."
+        )
+    if(jax_name_map is None):
+        return get_jax_var_name(jax_var)
+    if(isinstance(jax_var, JaCeVar)):
+        return jax_var.name
+    assert isinstance(jax_var, jcore.Atom)
+
+    c = len(jax_name_map)
+    jax_name = ""
+    while len(jax_name) == 0 or c == 0:
+        c, i = c // 26, c % 26
+        jax_name = chr(97 + i % 26) + jax_name
+    return jax_name
+
+
+
+
+

From c338f88cef06e8c5910da91e4c6ef2ef3fbda99f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 30 Apr 2024 12:48:34 +0200
Subject: [PATCH 072/458] Updated the driver.

Now fixed the variable naming.
They now should have proper Jax variables at least in one Jaxpr.
Also why did I happened with the Literals.
---
 .../translator/jace_translation_memento.py    |   5 +-
 .../translator/jaxpr_translator_driver.py     | 110 ++++++++----------
 src/jace/util/jax_helper.py                   |  43 +++----
 3 files changed, 67 insertions(+), 91 deletions(-)

diff --git a/src/jace/translator/jace_translation_memento.py b/src/jace/translator/jace_translation_memento.py
index a4a34e7..e996bf9 100644
--- a/src/jace/translator/jace_translation_memento.py
+++ b/src/jace/translator/jace_translation_memento.py
@@ -12,6 +12,9 @@
 from typing import Any
 
 import dace
+from jax import core as jcore
+
+from jace import util as jutil
 
 
 @dataclass(init=True, repr=True, eq=False, frozen=True, kw_only=True, slots=True)
@@ -32,7 +35,7 @@ class JaCeTranslationMemento:
     sdfg: dace.SDFG
     start_state: dace.SDFGState
     terminal_state: dace.SDFGState
-    jax_name_map: Mapping[str, str]
+    jax_name_map: Mapping[jcore.Var | jutil.JaCeVar, str]
     inp_names: Sequence[str]
     out_names: Sequence[str]
 
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 0ec054d..2499315 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -120,9 +120,8 @@ def __init__(
 
         # Maps a Jax variable to the name of its SDFG equivalent.
         #  As an extension it is also able to map JaCe Variables.
-        #  In case the key (Jax Variable) is a Literal, the mapped value is None.
         #  Only allocated during an ongoing translation.
-        self._jax_name_map: dict[jcore.Var | jutil.JaCeVar, str | None] = None  # type: ignore[assignment]
+        self._jax_name_map: dict[jcore.Var | jutil.JaCeVar, str] = None  # type: ignore[assignment]
 
         # These names can not be used for the automatic naming of Jax variables.
         #  They differ from the forbidden names, that they denote valid SDFG names.
@@ -376,29 +375,27 @@ def map_jax_var_to_sdfg(
         Args:
             jax_var:        The Jax variable to look up.
             allow_fail:     If mapping is not known return `None` instead of raise `KeyError`.
-
-        Notes:
-            Despite the fact that Jax literals can be added to the internal variable mapping 
-                it is an error to pass a Jax `Literal` object as `jax_var`.
         """
         assert self._jax_name_map is not None
         assert isinstance(jax_var, (jcore.Atom, str, jutil.JaCeVar))
 
-        if(isinstance(jax_var, str)):
+        if isinstance(jax_var, str):
             sdfg_name: str = jax_var
-        elif(isinstance(jax_var, jcore.Literal)):
+        elif isinstance(jax_var, jcore.Literal):
             raise RuntimeError("There is no SDFG variable for literal '{jax_var}'.")
-        elif(jax_var in self._jax_name_map):
-            sdfg_name: str = self._jax_name_map[jax_var]
+        elif jax_var in self._jax_name_map:
+            sdfg_name = self._jax_name_map[jax_var]
             assert isinstance(sdfg_name, str)
-        elif(allow_fail):
+        elif allow_fail:
             return None
         else:
             KeyError(f"The Jax variable '{jax_var}' was never registered.")
 
-        if(sdfg_name not in self._sdfg.arrays):
-            raise KeyError(f"Jax variable '{jax_var}' was supposed to map to '{sdfg_name}',"
-                            "but no such SDFG variable is known.")
+        if sdfg_name not in self._sdfg.arrays:
+            raise KeyError(
+                f"Jax variable '{jax_var}' was supposed to map to '{sdfg_name}',"
+                "but no such SDFG variable is known."
+            )
         return sdfg_name
 
     def get_sdfg(self) -> dace.SDFG:
@@ -477,26 +474,10 @@ def get_rev_idx(self) -> int:
         """
         return self._rev_idx
 
-    @overload
     def add_jax_name_mapping(
         self,
         jax_var: jcore.Var | jutil.JaCeVar,
         sdfg_name: str,
-    ) -> JaxprTranslationDriver:
-        ...
-
-    @overload
-    def add_jax_name_mapping(
-        self,
-        jax_var: jcore.Literal,
-        sdfg_name: None,
-    ) -> JaxprTranslationDriver:
-        ...
-
-    def add_jax_name_mapping(
-        self,
-        jax_var: jcore.Atom | jutil.JaCeVar,
-        sdfg_name: str | None,
     ) -> JaxprTranslationDriver:
         """Creates a mapping between `jax_var` to `sdfg_name`.
 
@@ -510,29 +491,20 @@ def add_jax_name_mapping(
             sdfg_name:   The name of the corresponding SDFG variable.
         """
         assert self._jax_name_map is not None
-        assert isinstance(jax_var, (jcore.Atom, jutil.JaCeVar))
-
-        # Adding literals to the variable map.
-        #  The only reason why we allow to add literals to the map is because
-        #  we need them in the proposing of Jax names, see `_propose_jax_name()`.
-        if(isinstance(jax_var, jcore.Literal)):
-            assert sdfg_name is None
-            self._jax_name_map[jax_var] = None
-            return self
-
-        assert isinstance(sdfg_name, str) and (len(sdfg_name) > 0)
+        assert isinstance(jax_var, (jcore.Var, jutil.JaCeVar))
+        assert isinstance(sdfg_name, str) and (len(sdfg_name) > 0)  # noqa: PT018  # Should be one assertion.
 
         if jax_var in self._jax_name_map:
             if self._jax_name_map[jax_var] == sdfg_name:  # noops.
                 return self
             raise ValueError(
-                f"Tried to create the mapping '{jax_name} -> {sdfg_name}', but '{jax_name}'"
-                f" already points to '{self.map_jax_var_to_sdfg(jax_name)}'."
+                f"Tried to create the mapping '{jax_var} -> {sdfg_name}', but '{jax_var}'"
+                f" already points to '{self.map_jax_var_to_sdfg(jax_var)}'."
             )
         if sdfg_name not in self.get_arrays():
-            raise KeyError(f"Mapping '{jax_name} -> {sdfg_name}': SDFG target unknown.")
+            raise KeyError(f"Mapping '{jax_var} -> {sdfg_name}': SDFG target unknown.")
         if sdfg_name in self._forbidden_names:
-            raise NameError(f"Mapping '{jax_name} -> {sdfg_name}': Forbidden name.")
+            raise NameError(f"Mapping '{jax_var} -> {sdfg_name}': Forbidden name.")
 
         self._jax_name_map[jax_var] = sdfg_name
         return self
@@ -809,49 +781,57 @@ def create_jax_var_list(
         jax_var_list: Sequence[jcore.Atom | jutil.JaCeVar],
         prevent_creation: bool = False,
         only_creation: bool = False,
+        handle_literals: bool = False,
         **kwargs: Any,
     ) -> list[None | str]:
         """Creates SDFG variables for the listed Jax variables and returns their SDFG names.
 
-        Before the function will create a variable, by using `add_array()` with `update_var_mapping=True`,
-        it will check if the variable is known and if so no new variable is created.
-        Instead the name of the previously created variable is added to the list.
-        In case the Jax Atom denotes a Jax Literal, no variable will be created, instead `None` will be added to the list.
+        If a Jax variable already has a SDFG equivalent then the function will use this variable.
+        If no SDFG variable is known the function will create one using `add_array()`, with `update_var_mapping` set to `True`.
+
+        By setting `prevent_creation` the function will not create any new SDFG variables.
+        This mode is used to indicate that all variables already have to exists already.
+        By setting `only_creation` the function will only create new SDFG variables.
+        If a Jax variable already has a known SDFG equivalent an error is generated.
+
+        By default literals cause an error.
+        However, by setting `handle_literals` to `True` literals will will be included in the output with the value `None`.
 
         Args:
             jax_var_list:       The list of Jax variables that should be transformed to SDFG names.
-            prevent_creation:   Never create a variable, indicates that all variables must exists.
-            only_creation:      Variables must be generated, generate an error instead of using it.
-            kwargs:             Will be forwarded to `self.add_array()` if a variable as to be created.
-
-        Notes:
-            If `only_creation` is set, then literals will cause an error.
-            It is an error to pass the `update_var_mapping` argument to this function.
+            prevent_creation:   Never create a variable, all must already be known.
+            only_creation:      Always create a variable, it is an error if one already exist.
+            handle_literals:    Allow the processing of literals.
+            kwargs:             Will be forwarded to `self.add_array()` if a variable as to be created,
         """
         assert self._jax_name_map is not None
-        assert "update_var_mapping" in kwargs
+        assert "update_var_mapping" not in kwargs
         if only_creation and prevent_creation:
             raise ValueError("Specified both 'only_creation' and 'prevent_creation'.")
 
         ret_list: list[None | str] = []
         for jax_var in jax_var_list:
             if isinstance(jax_var, jcore.Literal):
-                if only_creation:
-                    raise ValueError(f"Requested 'only_creation', but '{jax_var}' is a 'Literal'.")
-                # SOMEHOW TO UPDATE
-                ret_list.append(None)
+                if not handle_literals:
+                    raise ValueError("Encountered a literal but `handle_literals` was `False`.")
+                sdfg_name = None
             elif isinstance(jax_var, (jcore.Var, jutil.JaCeVar)):
                 mapped_sdfg_name: str | None = self.map_jax_var_to_sdfg(jax_var, allow_fail=True)
                 if (mapped_sdfg_name is None) and prevent_creation:
-                    raise ValueError(f"prevent_creation' given but have to create '{jax_var}'.")
+                    raise ValueError(f"'prevent_creation' given but have to create '{jax_var}'.")
                 if mapped_sdfg_name is None:
-                    ret_list.append(self.add_array(arg=jax_var, update_var_mapping=True, **kwargs))
+                    sdfg_name = self.add_array(arg=jax_var, update_var_mapping=True, **kwargs)
                 elif only_creation:
                     raise ValueError(f"'only_creation' given '{jax_var}' already exists.")
                 else:
-                    ret_list.append(mapped_sdfg_name)
+                    sdfg_name = mapped_sdfg_name
+                # `add_jax_name_mapping` is save, because if the mapping does already exists it is a no ops.
+                self.add_jax_name_mapping(jax_var, sdfg_name)
             else:
                 raise TypeError(f"Does not know how to handle '{type(jax_var).__name__}'")
+
+            ret_list.append(sdfg_name)
+
         return ret_list
 
     def _create_initial_input(
@@ -884,6 +864,7 @@ def _create_initial_input(
             jax_var_list=jaxpr.jaxpr.invars,
             only_creation=True,
             as_transient=True,  # Explicit transient; no error!
+            handle_literals=False,  # Initial arguments are never literals
             force_array=inp_scalar_as_array,
             force_jax_name=self.is_head_translator(),  # Ensure head get pure Jax names.
         )
@@ -1070,6 +1051,7 @@ def _translate_single_eqn(
             self.create_jax_var_list(
                 eqn.invars,
                 prevent_creation=True,  # Inputs must already exists.
+                handle_literals=True,  #  but they can be literals.
             )
         )
         out_var_names: Sequence[str] = self.create_jax_var_list(  # type: ignore[assignment]
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 86c1e16..c60ac71 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -16,8 +16,9 @@
 from __future__ import annotations
 
 import re
+from collections.abc import Mapping
 from dataclasses import dataclass
-from typing import Any, Mapping, Optional
+from typing import Any
 
 import dace
 import jax.core as jcore
@@ -48,16 +49,12 @@ class JaCeVar:
     def __hash__(self) -> int:
         return hash(self.name)
 
-    def __eq__(
-        self,
-        other: Any
-    ) -> bool:
-        if(not isinstance(other, JaCeVar)):
+    def __eq__(self, other: Any) -> bool:
+        if not isinstance(other, JaCeVar):
             return NotImplemented
         return self.name == other.name
 
 
-
 def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
     """Returns the name of the Jax variable as a string.
 
@@ -196,19 +193,18 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
 
 
 def is_drop_var(jax_var: jcore.Atom | JaCeVar) -> bool:
-    """Tests if `jax_var` is a drop variable.
-    """
+    """Tests if `jax_var` is a drop variable."""
 
-    if(isinstance(jax_var, jcore.DropVar)):
+    if isinstance(jax_var, jcore.DropVar):
         return True
-    if(isinstance(jax_var, JaCeVar)):
-        return jax_var.name == '_'
+    if isinstance(jax_var, JaCeVar):
+        return jax_var.name == "_"
     return False
 
 
 def _propose_jax_name(
-        jax_var: jcore.Atom | JaCeVar,
-        jax_name_map: Optional[Mapping[jcore.Var | JaCeVar, Any]] = None,
+    jax_var: jcore.Atom | JaCeVar,
+    jax_name_map: Mapping[jcore.Var | JaCeVar, Any] | None = None,
 ) -> str:
     """Proposes a variable name for `jax_var`.
 
@@ -226,28 +222,23 @@ def _propose_jax_name(
         The naming of variables are only consistent with the inner most Jaxpr a variable is defined in.
         Dropped variables will always be named `'_'`.
     """
-    if(is_drop_var(jax_var)):
+    if is_drop_var(jax_var):
         return "_"
-    if(isinstance(jax_var, jcore.Literal)):
+    if isinstance(jax_var, jcore.Literal):
         raise TypeError(f"Can not propose a name for literal '{jax_var}'.")
-    if(jax_var in jax_name_map):
+    if jax_name_map is None:
+        return get_jax_var_name(jax_var)
+    if jax_var in jax_name_map:
         raise RuntimeError(
             f"Can not propose a second name for '{jax_var}', it already known as '{jax_name_map[jax_var]}'."
         )
-    if(jax_name_map is None):
-        return get_jax_var_name(jax_var)
-    if(isinstance(jax_var, JaCeVar)):
+    if isinstance(jax_var, JaCeVar):
         return jax_var.name
     assert isinstance(jax_var, jcore.Atom)
 
     c = len(jax_name_map)
     jax_name = ""
-    while len(jax_name) == 0 or c == 0:
+    while len(jax_name) == 0 or c != 0:
         c, i = c // 26, c % 26
         jax_name = chr(97 + i % 26) + jax_name
     return jax_name
-
-
-
-
-

From 87483043d5f22632eed32d5a4ee16b20336b0d6e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 30 Apr 2024 12:52:01 +0200
Subject: [PATCH 073/458] Added a new test this time with literals.

---
 tests/test_sub_translators_alu.py | 20 ++++++++++++++++++++
 1 file changed, 20 insertions(+)

diff --git a/tests/test_sub_translators_alu.py b/tests/test_sub_translators_alu.py
index c7910f7..d6bc7b9 100644
--- a/tests/test_sub_translators_alu.py
+++ b/tests/test_sub_translators_alu.py
@@ -31,5 +31,25 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
 
 
+def test_add2():
+    """Simple add function, with literal."""
+    jax.config.update("jax_enable_x64", True)
+
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        c = A + 0.01
+        d = B * 0.6
+        e = c / 1.0
+        f = d - 0.1
+        return e + f * d
+
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    ref = testee(A, B)
+    res = jutil._jace_run(testee, A, B)
+
+    assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
+
+
 if __name__ == "__main__":
     test_add()

From 70ec73b186166058835b52c60c507ddbc5bbbea5 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 2 May 2024 09:36:28 +0200
Subject: [PATCH 074/458] Made some small modifications.

---
 src/jace/translator/jace_translation_memento.py | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/src/jace/translator/jace_translation_memento.py b/src/jace/translator/jace_translation_memento.py
index e996bf9..110f5a0 100644
--- a/src/jace/translator/jace_translation_memento.py
+++ b/src/jace/translator/jace_translation_memento.py
@@ -25,11 +25,11 @@ class JaCeTranslationMemento:
     - `sdfg` the SDFG object that was created.
     - `start_state` the first state in the SDFG state machine.
     - `terminal_state` the last state in the state machine.
-    - `jax_name_map` a `dict` that maps every Jax name to its corresponding SDFG variable name.
-    - `inp_names` a `list` of the SDFG variables that are used as input,
-            in the same order as `Jaxpr.invars`.
-    - `out_names` a `list` of the SDFG variables that are used as output,
-            in the same order as `Jaxpr.outvars`.
+    - `jax_name_map` a `dict` that maps every Jax variable to its corresponding SDFG variable _name_.
+    - `inp_names` a `list` of the SDFG variables that are used as input, in the same order as `Jaxpr.invars`.
+    - `out_names` a `list` of the SDFG variables that are used as output, in the same order as `Jaxpr.outvars`.
+
+    Note that `inp_names` and `out_names` may not be disjunct.
     """
 
     sdfg: dace.SDFG

From 903d694172f09410b349894d8782604ff5342c8e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 2 May 2024 09:59:24 +0200
Subject: [PATCH 075/458] The proposed name now also takes the suffix into
 consideration.

---
 src/jace/util/jax_helper.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index c60ac71..f4e469f 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -229,6 +229,7 @@ def _propose_jax_name(
     if jax_name_map is None:
         return get_jax_var_name(jax_var)
     if jax_var in jax_name_map:
+        # Should be turned into a lookup?
         raise RuntimeError(
             f"Can not propose a second name for '{jax_var}', it already known as '{jax_name_map[jax_var]}'."
         )
@@ -241,4 +242,4 @@ def _propose_jax_name(
     while len(jax_name) == 0 or c != 0:
         c, i = c // 26, c % 26
         jax_name = chr(97 + i % 26) + jax_name
-    return jax_name
+    return jax_name + jax_var.suffix

From de591729b4608987f1182cfbe0a0de16104379cd Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 2 May 2024 10:33:48 +0200
Subject: [PATCH 076/458] Subtranslators are now created by a classmethod that
 acts as factory.

---
 .../translator/jaxpr_translator_driver.py     |  2 +-
 src/jace/translator/primitive_translator.py   | 20 ++++++++-----------
 .../sub_translators/alu_translator.py         | 12 ++++++++---
 3 files changed, 18 insertions(+), 16 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 2499315..133357c 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -958,7 +958,7 @@ def _init_sub_translators(
         subtrans_args = {k: v for k, v in subtrans_args.items() if not k.startswith("_")}  # type: ignore[unreachable]
         sub_translators: dict[str, jtrans.PrimitiveTranslator] = {}
         for sub_translator_cls in _get_subtranslators_cls():
-            sub_translator: jtrans.PrimitiveTranslator = sub_translator_cls(**subtrans_args)
+            sub_translator: jtrans.PrimitiveTranslator = sub_translator_cls.CREATE(**subtrans_args)
             handled_primitives: Iterable[str] = jutil.ensure_iterability(
                 sub_translator.get_handled_primitive()
             )
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index 8472a66..3d9cb5d 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -24,11 +24,8 @@ class PrimitiveTranslator(Protocol):
 
     A translator for a primitive translates a single equation of a Jaxpr into its SDFG equivalent.
     A type that implements this interface must fulfil the following properties:
-    - It must be stateless.
-        It is still possible and explicitly allowed to have an
-        immutable configuration state.
-    - All subclasses has to accept `**kwargs` arguments and must
-        forward all unconsumed arguments to the base.
+    - It must be immutable after construction.
+    - All subclass must implement the class method `CREATE()` to construct an instance.
 
     Subtranslators are simple, but highly specialized objects that are only able to perform the translation of a single primitive.
     The overall translation process itself is managed by a driver object, which also owns and manage the subtranslators.
@@ -43,15 +40,14 @@ class PrimitiveTranslator(Protocol):
 
     __slots__ = ()
 
-    def __init__(
-        self,
+    @classmethod
+    def CREATE(
+        cls,
         *args: Any,
         **kwargs: Any,
-    ) -> None:
-        """Initialize the interface.
-
-        It is required that subclasses calls this method during initialization.
-        """
+    ) -> PrimitiveTranslator:
+        """Creates an instance of a subtranslator."""
+        raise NotImplementedError("Class '{type(self).__name__}' does not implement 'CREATE()'.")
 
     def get_handled_primitive(self) -> str | Sequence[str]:
         """Returns the names of the Jax primitive that `self` is able to handle.
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index 21aa1ba..bbaf469 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -20,9 +20,6 @@
 from jace import translator as jtranslator
 
 
-# from ..primitive_translator import PrimitiveTranslator
-
-
 class ALUTranslator(jtranslator.PrimitiveTranslator):
     # class ALUTranslator(PrimitiveTranslator):
     """This translator handles all arithmetic and logical operations."""
@@ -73,6 +70,15 @@ class ALUTranslator(jtranslator.PrimitiveTranslator):
         "lt": "__out0 = __in0 < __in1",
     }
 
+    @classmethod
+    def CREATE(
+        cls,
+        *args: Any,
+        **kwargs: Any,
+    ) -> ALUTranslator:
+        """Creates an `ALUTranslator` instance."""
+        return cls(*args, **kwargs)
+
     def __init__(self, **kwargs: Any) -> None:
         """Initialize the `ALUTranslator`."""
         super().__init__(**kwargs)

From f1a53cce38fcf6ce9e2285b0cfac3617bb0759d4 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 2 May 2024 10:35:10 +0200
Subject: [PATCH 077/458] Smaller fixes.

---
 src/jace/util/jax_helper.py | 23 ++++++-----------------
 1 file changed, 6 insertions(+), 17 deletions(-)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index f4e469f..44304f1 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -68,23 +68,18 @@ def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
     match jax_var:
         case jcore.DropVar():
             return "_"
-
         case JaCeVar():
             jax_name = jax_var.name
-
         case jcore.Var():
             # This stopped working after version 0.20.4, because of some changes in Jax
             #  See `https://github.com/google/jax/pull/10573` for more information.
             #  The following implementation will generate stable names, however, they will be decoupled
             #  from output of the pretty printed Jaxpr
             jax_name = f"jax{jax_var.count}{jax_var.suffix}"
-
         case jcore.Literal():
             raise TypeError("Can not derive a name from a Jax Literal.")
-
         case str():
             jax_name = jax_var
-
         case _:
             raise TypeError(
                 f"Does not know how to transform '{jax_var}' (type: '{type(jax_var).__name__}') into a string."
@@ -105,10 +100,8 @@ def get_jax_var_shape(jax_var: jcore.Atom | JaCeVar) -> tuple[int, ...]:
     match jax_var:
         case jcore.Var() | jcore.Literal():
             return jax_var.aval.shape
-
         case JaCeVar():
             return jax_var.shape
-
         case _:
             raise TypeError(f"'get_jax_var_shape()` is not implemented for '{type(jax_var)}'.")
 
@@ -118,10 +111,8 @@ def get_jax_var_dtype(jax_var: jcore.Atom | JaCeVar) -> dace.typeclass:
     match jax_var:
         case jcore.Var() | jcore.Literal():
             return translate_dtype(jax_var.aval.dtype)
-
         case JaCeVar():
             return translate_dtype(jax_var.dtype)
-
         case _:
             raise TypeError(f"'get_jax_var_dtype()` is not implemented for '{type(jax_var)}'.")
 
@@ -157,15 +148,13 @@ def is_jaxified(obj: Any) -> bool:
     from jax._src import pjit as jaxpjit
 
     # These are all types we consider as jaxify
-    return isinstance(
-        obj,
-        (
-            jcore.Primitive,
-            # jstage.Wrapped, # Not runtime chakable
-            jaxpjit.JitWrapped,
-            jaxlib.xla_extension.PjitFunction,
-        ),
+    jaxifyed_types = (
+        jcore.Primitive,
+        # jstage.Wrapped is not runtime chakable
+        jaxpjit.JitWrapped,
+        jaxlib.xla_extension.PjitFunction,
     )
+    return isinstance(obj, jaxifyed_types)
 
 
 def translate_dtype(dtype: Any) -> dace.typeclass:

From 48641a2c66c8377174e4de97b0abaa3a4d32f017 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 2 May 2024 10:59:02 +0200
Subject: [PATCH 078/458] Renamed the Memento to `TranslatedJaxprSDFG`.

I am not sure if I should use this class also as context object.
SInce I want to keep it simple and user facing.
---
 src/jace/jax/api_helper.py                    | 23 +++++-----
 src/jace/translator/__init__.py               |  4 +-
 .../translator/jaxpr_translator_driver.py     | 36 +++++++--------
 ...on_memento.py => translated_jaxpr_sdfg.py} |  2 +-
 src/jace/util/__init__.py                     |  8 ++--
 src/jace/util/debug.py                        | 46 ++++++++++---------
 6 files changed, 60 insertions(+), 59 deletions(-)
 rename src/jace/translator/{jace_translation_memento.py => translated_jaxpr_sdfg.py} (98%)

diff --git a/src/jace/jax/api_helper.py b/src/jace/jax/api_helper.py
index 28d3485..1932b5b 100644
--- a/src/jace/jax/api_helper.py
+++ b/src/jace/jax/api_helper.py
@@ -79,16 +79,15 @@ def _call_sdfg(
         Notes:
             Currently no caching of the compiled object is done.
         """
+        jsdfg: jtrans.TranslatedJaxprSDFG = self._get_translated_sdfg(*args, **kwargs)
+        return jutil.run_jax_sdfg(jsdfg, *args)
 
-        memento: jtrans.JaCeTranslationMemento = self._get_memento(*args, **kwargs)
-        return jutil.run_memento(memento, *args)
-
-    def _get_memento(
+    def _get_translated_sdfg(
         self,
         *args: Any,
         **kwargs: Any,
-    ) -> jtrans.JaCeTranslationMemento:
-        """This function returns the Memento.
+    ) -> jtrans.TranslatedJaxprSDFG:
+        """This function returns the `TranslatedJaxprSDFG` object.
 
         The function will transform its arguments into `_ArgInfo` versions.
         This is needed since Jax only cares about the information stored inside it.
@@ -96,28 +95,28 @@ def _get_memento(
         and the kwonly arguments are used to influence the Jaxpr to SDFG translator.
 
         Notes:
-            It is forbidden to permanently modify the returned memento.
+            It is forbidden to permanently modify the returned translated SDFG.
                 Doing so results in undefined behaviour.
         """
-        return self._get_memento_cached(
+        return self._get_translated_sdfg_cached(
             *(_ArgInfo.from_value(v) for v in args),
             **kwargs,
         )
 
     @lru_cache
-    def _get_memento_cached(
+    def _get_translated_sdfg_cached(
         self,
         *args: _ArgInfo,
         **kwargs: Any,
-    ) -> jtrans.JaCeTranslationMemento:
+    ) -> jtrans.TranslatedJaxprSDFG:
         """Generates the SDFG from
 
         Todo:
-            Also make the SDFG compiled and permanent also in the memento
+            Also make the SDFG compiled and permanent also in the translated SDFG object; maybe.
             Implement a better cache that avoids using this strange way to pass values around.
 
         Notes:
-            It is forbidden to permanently modify the returned memento.
+            It is forbidden to permanently modify the returned translated SDFG.
                 Doing so results in undefined behaviour.
         """
         from jace.translator import JaxprTranslationDriver
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 49b9808..8ca5476 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -9,13 +9,13 @@
 
 from __future__ import annotations
 
-from .jace_translation_memento import JaCeTranslationMemento
 from .jaxpr_translator_driver import JaxprTranslationDriver
 from .primitive_translator import PrimitiveTranslator
+from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
 
 __all__ = [
     "PrimitiveTranslator",
     "JaxprTranslationDriver",
-    "JaCeTranslationMemento",
+    "TranslatedJaxprSDFG",
 ]
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 133357c..faea557 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -163,14 +163,13 @@ def translate_jaxpr(
         reserved_names: str | Collection[str] | None = None,
         allow_empty_jaxpr: bool = False,
         **kwargs: Any,
-    ) -> jtrans.JaCeTranslationMemento:
+    ) -> jtrans.TranslatedJaxprSDFG:
         """Perform the translation of a Jaxpr description into a SDFG.
 
         Returns:
             The function will translate the passed Jaxpr object into an SDFG.
-            However, the SDFG will be in canonical form and needs further
-            processing. The SDFG is encapsulated inside a `JaCeTranslationMemento`,
-            that contains additional metadata for further manipulation.
+            However, the SDFG will be in canonical form and needs further processing.
+            The SDFG is encapsulated inside a `TranslatedJaxprSDFG`, that contains additional metadata.
 
         Args:
             inp_scalar_as_array:    Translate scalar _input_ arguments to arrays of length 1.
@@ -181,7 +180,7 @@ def translate_jaxpr(
 
         Returns:
             The function will not return the SDFG directly.
-            Instead it will be wrapped inside a `JaCeTranslationMemento` instance.
+            Instead it will be wrapped inside a `TranslatedJaxprSDFG` instance.
             That contains the SDFG and some meta data needed for further processing.
         """
         if self.is_allocated():
@@ -213,14 +212,14 @@ def translate_jaxpr(
             jaxpr=jaxpr,
             inp_scalar_as_array=inp_scalar_as_array,
         )
-        memento: jtrans.JaCeTranslationMemento = self._translate_jaxpr_internal(jaxpr)
+        jsdfg: jtrans.TranslatedJaxprSDFG = self._translate_jaxpr_internal(jaxpr)
 
-        # If the translation context is not cleared `self` and `memento` will share the same data.
+        # If the translation context is not cleared `self` and `jsdfg` will share the same data.
         #  There is some legitimate use for that.
         if _clear_translation_ctx:
             self._clear_translation_ctx()
 
-        return memento
+        return jsdfg
 
     def fork(self) -> JaxprTranslationDriver:
         """Return a child of `self` ready for transformation.
@@ -1133,14 +1132,12 @@ def _translate_single_eqn(
     def _translate_jaxpr_internal(
         self,
         jaxpr: jcore.ClosedJaxpr,
-    ) -> jtrans.JaCeTranslationMemento:
+    ) -> jtrans.TranslatedJaxprSDFG:
         """Performs the actual translation of the Jaxpr into an SDFG.
 
-        The function assumes that the context is already allocated and the initial
-        input variables were already created. The function will store the internal
-        state of `self` into a memento and return it.
-        However, it will not deallocate the translation context, thus `self`
-        and the memento share the same context in memory.
+        The function assumes that the context is allocated as well as initial variables.
+        The function will return the internal state of `self` as a `TranslatedJaxprSDFG` object.
+        However, it will not deallocate the translation context, thus `self` and the return value share the same memory.
 
         Args:
             jaxpr:      The Jaxpr to translate.
@@ -1173,19 +1170,20 @@ def _translate_jaxpr_internal(
             out_var_names = self._handle_null_jaxpr(jaxpr)
         self._sdfg_out_names = tuple(out_var_names)
 
-        return self._export_memento()
+        return self._export_context()
 
-    def _export_memento(self) -> jtrans.JaCeTranslationMemento:
-        """Encapsulate the translation context of `self` into a memento.
+    def _export_context(self) -> jtrans.TranslatedJaxprSDFG:
+        """Encapsulate the translation context of `self` into a `TranslatedJaxprSDFG` object..
 
         This function will not deallocate the internal context of `self`.
-        Thus the memento and `self` share the same context in memory.
+        Thus `self` and the return value will share the same context in memory.
+        To free the context of `self` use `self._clear_translation_ctx()`.
         """
         assert self.is_allocated()
         assert all((isinstance(x, str) and (len(x) > 0)) for x in self._sdfg_in_names)
         assert all((isinstance(x, str) and (len(x) > 0)) for x in self._sdfg_out_names)
 
-        return jtrans.JaCeTranslationMemento(
+        return jtrans.TranslatedJaxprSDFG(
             sdfg=self._sdfg,
             start_state=self._init_sdfg_state,
             terminal_state=self._term_sdfg_state,
diff --git a/src/jace/translator/jace_translation_memento.py b/src/jace/translator/translated_jaxpr_sdfg.py
similarity index 98%
rename from src/jace/translator/jace_translation_memento.py
rename to src/jace/translator/translated_jaxpr_sdfg.py
index 110f5a0..b0562e6 100644
--- a/src/jace/translator/jace_translation_memento.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -18,7 +18,7 @@
 
 
 @dataclass(init=True, repr=True, eq=False, frozen=True, kw_only=True, slots=True)
-class JaCeTranslationMemento:
+class TranslatedJaxprSDFG:
     """Encapsulates the result of a translation run of the `JaxprTranslationDriver` object.
 
     It defines the following members:
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index fcbe0fc..29c5276 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -9,17 +9,17 @@
 
 from __future__ import annotations
 
-from .debug import _jace_run, run_memento
+from .debug import _jace_run, run_jax_sdfg
 from .jax_helper import (
     JaCeVar,
+    _propose_jax_name,
     get_jax_var_dtype,
     get_jax_var_name,
     get_jax_var_shape,
+    is_drop_var,
     is_jaxified,
     is_tracing_ongoing,
     translate_dtype,
-    is_drop_var,
-    _propose_jax_name,
 )
 from .util import ensure_iterability, is_jaceified
 
@@ -35,7 +35,7 @@
     "get_jax_var_shape",
     "get_jax_var_dtype",
     "translate_dtype",
-    "run_memento",
+    "run_jax_sdfg",
     "_jace_run",
     "_propose_jax_name",
 ]
diff --git a/src/jace/util/debug.py b/src/jace/util/debug.py
index e50185f..b3a84f3 100644
--- a/src/jace/util/debug.py
+++ b/src/jace/util/debug.py
@@ -5,7 +5,10 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""This module contains functions for debugging the translator."""
+"""This module contains functions for debugging the translator.
+
+Everything in this module is experimental and might vanish anytime.
+"""
 
 from __future__ import annotations
 
@@ -20,34 +23,35 @@
     from jace import translator as jtrans
 
 
-def run_memento(
-    memento: jtrans.JaCeTranslationMemento,
+def run_jax_sdfg(
+    jsdfg: jtrans.TranslatedJaxprSDFG,
     *args: Any,
 ) -> tuple[Any, ...] | Any:
-    """Calls the SDFG with the supplied arguments.
+    """Calls the SDFG that is encapsulated with the supplied arguments.
 
     Notes:
         Currently the SDFG must not have any undefined symbols, i.e. no undefined sizes.
+        Currently denoted arguments are not fully respected.
         The function either returns a value or a tuple of values, i.e. no tree.
     """
     from dace.data import Array, Data, Scalar, make_array_from_descriptor
 
     # This is a simplification that makes our life simply
-    if len(memento.sdfg.free_symbols) != 0:
+    if len(jsdfg.sdfg.free_symbols) != 0:
         raise ValueError(
-            f"No externally defined symbols are allowed, found: {memento.sdfg.free_symbols}"
+            f"No externally defined symbols are allowed, found: {jsdfg.sdfg.free_symbols}"
         )
-    if len(memento.inp_names) != len(args):
+    if len(jsdfg.inp_names) != len(args):
         raise ValueError(
-            f"Wrong numbers of arguments expected {len(memento.inp_names)} got {len(args)}."
+            f"Wrong numbers of arguments expected {len(jsdfg.inp_names)} got {len(args)}."
         )
 
     # We use a return by reference approach, for calling the SDFG
     call_args: dict[str, Any] = {}
-    for in_name, in_val in zip(memento.inp_names, args):
+    for in_name, in_val in zip(jsdfg.inp_names, args):
         call_args[in_name] = in_val
-    for out_name in memento.out_names:
-        sarray: Data = memento.sdfg.arrays[out_name]
+    for out_name in jsdfg.out_names:
+        sarray: Data = jsdfg.sdfg.arrays[out_name]
         assert out_name not in call_args
 
         if (out_name == "__return") or (out_name.startswith("__return_")):
@@ -61,25 +65,25 @@ def run_memento(
 
     # Canonical SDFGs do not have global memory, so we must transform it.
     #  We will afterwards undo it.
-    for glob_name in memento.inp_names + memento.out_names:  # type: ignore[operator]  # concatenation
-        memento.sdfg.arrays[glob_name].transient = False
+    for glob_name in jsdfg.inp_names + jsdfg.out_names:  # type: ignore[operator]  # concatenation
+        jsdfg.sdfg.arrays[glob_name].transient = False
 
     try:
-        csdfg: dace.CompiledSDFG = memento.sdfg.compile()
+        csdfg: dace.CompiledSDFG = jsdfg.sdfg.compile()
         with dace.config.temporary_config():
             dace.Config.set("compiler", "allow_view_arguments", value=True)
             csdfg(**call_args)
 
-        if len(memento.out_names) == 0:
+        if len(jsdfg.out_names) == 0:
             return None
-        ret_val: tuple[Any] = tuple(call_args[out_name] for out_name in memento.out_names)
-        if len(memento.out_names) == 1:
+        ret_val: tuple[Any] = tuple(call_args[out_name] for out_name in jsdfg.out_names)
+        if len(jsdfg.out_names) == 1:
             return ret_val[0]
         return ret_val
 
     finally:
-        for name in memento.inp_names + memento.out_names:  # type: ignore[operator]  # concatenation
-            memento.sdfg.arrays[name].transient = True
+        for name in jsdfg.inp_names + jsdfg.out_names:  # type: ignore[operator]  # concatenation
+            jsdfg.sdfg.arrays[name].transient = True
 
 
 def _jace_run(
@@ -97,5 +101,5 @@ def _jace_run(
 
     jaxpr = jax.make_jaxpr(fun)(*args)
     driver = JaxprTranslationDriver(**kwargs)
-    memento = driver.translate_jaxpr(jaxpr)
-    return run_memento(memento, *args)
+    jsdfg = driver.translate_jaxpr(jaxpr)
+    return run_jax_sdfg(jsdfg, *args)

From b8799917c1195f0b336dc9677051e8f85d227f80 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 2 May 2024 14:53:13 +0200
Subject: [PATCH 079/458] Now we have a translation conext and stacking.

---
 src/jace/translator/_translation_context.py   | 157 ++++++
 .../translator/jaxpr_translator_driver.py     | 459 ++++++------------
 src/jace/translator/translated_jaxpr_sdfg.py  |   6 +-
 3 files changed, 322 insertions(+), 300 deletions(-)
 create mode 100644 src/jace/translator/_translation_context.py

diff --git a/src/jace/translator/_translation_context.py b/src/jace/translator/_translation_context.py
new file mode 100644
index 0000000..4858f3c
--- /dev/null
+++ b/src/jace/translator/_translation_context.py
@@ -0,0 +1,157 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""This module contains the translation context for the `JaxprTranslationDriver`."""
+
+from __future__ import annotations
+
+from collections.abc import MutableMapping, Sequence
+from typing import TYPE_CHECKING
+
+import dace
+from jax import core as jcore
+
+from jace import util as jutil
+
+
+if TYPE_CHECKING:
+    from jace import translator as jtrans
+
+
+class _TranslationContext:
+    """Represents the context of a `JaxprTranslationDriver`.
+
+    Essentially it contains the following variables:
+    - `sdfg`:
+        The SDFG object that is under construction.
+    - `start_state`:
+        The first state in the SDFG state machine.
+    - `terminal_state`:
+        The current terminal state of the SDFG state machine.
+    - `jax_name_map`:
+        A `dict` that maps every Jax variable to its corresponding SDFG variable _name_.
+    - `inp_names`:
+        A `list` of the SDFG variable names that are used for input.
+        Their order is the same as in `Jaxpr.invars`.
+        Filled at the very beginning.
+    - `out_names`:
+        A `list` of the SDFG variables names that are used for output,
+        Their order is the same as in `Jaxpr.outvars`.
+        Only filled at the very end.
+    - `rev_idx`:
+        The revision index (used to generate unique names in the translation.
+
+    Notes:
+        It might be that a name appears in both the `inp_names` and `out_names` list.
+            This happens if the corresponding variable is used as both input and output.
+            In Jax this is called argument donation.
+        This class is similar to but different to `TranslatedJaxprSDFG`.
+            This class is used to represent the dynamic state of the translation object,
+            `TranslatedJaxprSDFG` is used to result the end.
+    """
+
+    __slots__ = (
+        "_sdfg",
+        "_start_state",
+        "_terminal_state",
+        "_jax_name_map",
+        "_inp_names",
+        "_out_names",
+        "_rev_idx",
+    )
+
+    def __init__(
+        self,
+        rev_idx: int,
+        name: str | None = None,
+    ) -> None:
+        """Initializes the context.
+
+        Args:
+            rev_idx:    The revision index of the context.
+            name:       Name of the SDFG object.
+        """
+
+        self._sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
+        self._start_state: dace.SDFGState = self._sdfg.add_state(
+            label="initial_state", is_start_block=True
+        )
+        self._terminal_state: dace.SDFGState = self._start_state
+        self._jax_name_map: MutableMapping[jcore.Var | jutil.JaCeVar, str] = {}
+        self._inp_names: tuple[str, ...] = ()
+        self._out_names: tuple[str, ...] = ()
+        self._rev_idx: int = rev_idx
+
+    def to_translated_jaxpr_sdfg(self) -> jtrans.TranslatedJaxprSDFG:
+        """Transforms `self` into a `TranslatedJaxprSDFG`."""
+        return jtrans.TranslatedJaxprSDFG(
+            sdfg=self._sdfg,
+            start_state=self._start_state,
+            terminal_state=self._terminal_state,
+            jax_name_map=self._jax_name_map,
+            inp_names=self._inp_names,
+            out_names=self._out_names,
+        )
+
+    @property
+    def sdfg(self) -> dace.SDFG:
+        return self._sdfg
+
+    @property
+    def start_state(self) -> dace.SDFGState:
+        return self._start_state
+
+    @property
+    def terminal_state(self) -> dace.SDFGState:
+        return self._terminal_state
+
+    @terminal_state.setter
+    def terminal_state(
+        self,
+        new_term_state: dace.SDFGState,
+    ) -> None:
+        self._terminal_state = new_term_state
+
+    @property
+    def jax_name_map(self) -> MutableMapping[jcore.Var | jutil.JaCeVar, str]:
+        return self._jax_name_map
+
+    @property
+    def inp_names(self) -> tuple[str, ...]:
+        return self._inp_names
+
+    @inp_names.setter
+    def inp_names(
+        self,
+        inp_names: Sequence[str],
+    ) -> None:
+        if isinstance(inp_names, str):
+            self._inp_names = (inp_names,)
+        elif isinstance(inp_names, tuple):
+            self._inp_names = inp_names
+        else:
+            self._inp_names = tuple(inp_names)
+
+    @property
+    def out_names(self) -> tuple[str, ...]:
+        return self._out_names
+
+    @out_names.setter
+    def out_names(
+        self,
+        out_names: Sequence[str],
+    ) -> None:
+        if isinstance(out_names, str):
+            self._out_names = (out_names,)
+        elif isinstance(out_names, tuple):
+            self._out_names = out_names
+        else:
+            self._out_names = tuple(out_names)
+
+    @property
+    def rev_idx(self) -> int:
+        return self._rev_idx
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index faea557..a336946 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -23,15 +23,16 @@
 class JaxprTranslationDriver:
     """Internal driver class for creating an SDFG equivalent of a `Jaxpr` instance.
 
-    This class builds an SDFG of a very particular form, which for us is
-    canonical, which is not directly usable. Thus this class should not be
-    directly used, instead a user should use TBA.
-    The canonical form is characterized by the following:
+    The SDFG that is created by this class has a very particular form, which we consider canonical.
+    The main feature of a canonical SDFG are:
     - the SDFG is a list of states, ideally each state corresponds to single Jax primitive,
     - all variable names are derived from Jax names,
-    - there are no global variables inside the SDFG,
-    - It lacks the special `__return` variable.
-    - The argument names are not set.
+    - there are only transient variables inside the SDFG,
+    - It lacks the special `__return` variable,
+    - the `arg_names` parameter is not set.
+
+    For these reasons the SDFG is not directly usable, and further manipulations have to be performed.
+    TBA where to look for them.
 
     The idea of the translator is extremely simple. Since Jaxpr is a list
     consisting of more or less simple instructions/equations, they get processed
@@ -39,45 +40,25 @@ class JaxprTranslationDriver:
     is appended to the SDFG, thus the SDFG is a long list of states. In certain
     cases it might be that an equation needs more states, but this is an exception.
 
-    The actual translation is not handled by the driver instead a so called
-    subtranslator object is used. A subtranslator is specialized to translate
-    one type of primitive. For more information on the subtranslators see the
-    documentation of `PrimitiveTranslator`.
-
-    To support nested Jaxpr expressions the driver provides the possibility to
-    clone/fork itself, see `self.fork()` for more. Every clone, i.e. return
-    value of `self.fork()`, of a driver, which is also known as child, has
-    a unique identifier. This identifier is used for example to generate
-    unique SDFG variable names during a translation process,
-    see `self.same_family() for more.
-
-    If no translation is ongoing the only function that makes sense to call
-    is `translate_jaxpr()` which starts a translation.
+    The actual translation of the equation is not handled by the driver.
+    Instead the request is forwarded to a `PrimitiveTranslator` object, also known as subtranslator.
+    This is a highly specialized object that is able to handle one kind of primitive.
+    For more information on the subtranslators see the documentation of `PrimitiveTranslator`.
 
-    Todos:
-        Find a better way than to allow giving access to protected functions.
-            Probably using composition with the higher level instance.
+    To start a translation the `translate_jaxpr()` function should be called,
+    if this happens it is said that the driver has an ongoing translation.
+    If `translate_jaxpr()` is called on driver that has an ongoing translation, a new translation context will be set up.
+    Thus the driver will then translate the supplied (nested) Jaxpr and return the result.
+    However, this will have no influence on the translation process that is already going.
     """
 
-    # Member variables private to an instance, i.e. they are not passed on to the children.
-    #  By definition all of them belongs to the translation context but not all variable of
-    #  the translation context are private, some are actually shared.
-    __private_slots__ = (
-        "_sdfg",
-        "_term_sdfg_state",
-        "_init_sdfg_state",
-        "_jax_name_map",
-        "_sdfg_in_names",
-        "_sdfg_out_names",
-        "_rev_idx",
-    )
-    # Variables that are shared among the instances of a family.
-    __shared_slots__ = (
+    __slots__ = (
+        "_ctx_stack",  # Stack of all contexts
+        "_ctx",  # Current top of the context stack.
         "_reserved_names",  # Part of the context, but is copied.
         "_sub_translators",
-        "_rev_manager",  # This is the revision counter manager
+        "_rev_manager",
     )
-    __slot__ = __private_slots__ + __shared_slots__
 
     def __init__(
         self,
@@ -88,9 +69,6 @@ def __init__(
         All arguments that does not start with an underscore are used as
         arguments to construct the subtranslators.
 
-        Args:
-            _no_shared_alloc (bool):     If set then all allocation will be avoided (internal)
-
         Notes:
             This function will not allocate the translation context of `self`
                 but will only allocate the shared members.
@@ -98,7 +76,7 @@ def __init__(
                 the shared part. This flag is provided only for implementing
                 `self.fork()` using it is an error and undefined behaviour.
         """
-        allocate_shared_parts: bool = not kwargs.pop("_no_shared_alloc", False)
+        from ._translation_context import _TranslationContext
 
         # Contains all the subtranslators that we need.
         #  They are partitioned by the names of the primitive they have registered for.
@@ -106,53 +84,24 @@ def __init__(
         #  during the lifetime of the object.
         self._sub_translators: dict[str, jtrans.PrimitiveTranslator] = None  # type: ignore[assignment]
 
-        # The SDFG object that we are currently constructing.
-        #  Only allocated during an ongoing translation.
-        self._sdfg: dace.SDFG = None
-
-        # This is the HEAD SDFG state, i.e. the last state in which we translated an equation.
-        #  Only allocated during an ongoing translation.
-        self._term_sdfg_state: dace.SDFGState = None
-
-        # This is the beginning of the SDFG, i.e. the original SDFG HEAD.
-        #  Only allocated during an ongoing translation.
-        self._init_sdfg_state: dace.SDFGState = None
-
-        # Maps a Jax variable to the name of its SDFG equivalent.
-        #  As an extension it is also able to map JaCe Variables.
-        #  Only allocated during an ongoing translation.
-        self._jax_name_map: dict[jcore.Var | jutil.JaCeVar, str] = None  # type: ignore[assignment]
-
         # These names can not be used for the automatic naming of Jax variables.
         #  They differ from the forbidden names, that they denote valid SDFG names.
         #  An example would be names of the function arguments.
         #  Only allocated during an ongoing translation.
         self._reserved_names: set[str] = None  # type: ignore[assignment]
 
-        # These are the names of the SDFG variables that serves as input and output.
-        #  They have the same order as in the Jaxpr.
-        #  Only allocated during an ongoing translation.
-        self._sdfg_in_names: Sequence[str] = None  # type: ignore[assignment]
-        self._sdfg_out_names: Sequence[str] = None  # type: ignore[assignment]
-
         # Shared revision counter manager.
-        #  This object produces the revision indexes we need for the children.
-        #  It is only allocated for head translators and shared between
-        self._rev_manager: itertools.count[int] = None  # type: ignore[assignment]
-
-        # This is the revision of self.
-        #  Unlike the manager it is not shared and private.
-        self._rev_idx: int = None  # type: ignore[assignment]
+        #  Generates the revision numbers we need.
+        #  Is reset after every translation.
+        self._rev_manager: itertools.count[int] = itertools.count(0, 1)
 
-        # If requested we will now allocate some internal state
-        if allocate_shared_parts:
-            # Creating of the subtranslators.
-            self._init_sub_translators(kwargs)
+        # Context stack and current context.
+        #  Only allocated during an ongoing translation
+        self._ctx_stack: list[_TranslationContext] = []
+        self._ctx: _TranslationContext = None  # type: ignore[assignment]
 
-            # Creating of the revision indexes and manager.
-            self._rev_manager = itertools.count(0, 1)
-            self._rev_idx = next(self._rev_manager)
-            assert self.is_head_translator()
+        # Creating of the subtranslators.
+        self._init_sub_translators(kwargs)
 
     def translate_jaxpr(
         self,
@@ -164,12 +113,15 @@ def translate_jaxpr(
         allow_empty_jaxpr: bool = False,
         **kwargs: Any,
     ) -> jtrans.TranslatedJaxprSDFG:
-        """Perform the translation of a Jaxpr description into a SDFG.
+        """Perform the translation of a Jaxpr into a SDFG.
+
+        In case this function is called and `self` has an ongoing translation process, a new translation context will be created.
+        This means the Jaxpr will be translated independently from the previous one.
 
         Returns:
-            The function will translate the passed Jaxpr object into an SDFG.
-            However, the SDFG will be in canonical form and needs further processing.
-            The SDFG is encapsulated inside a `TranslatedJaxprSDFG`, that contains additional metadata.
+            The function will translate the passed Jaxpr object into an SDFG in canonical form.
+            This SDFG together with additional meta data, that is needed for further processing
+            is encapsulated inside a `TranslatedJaxprSDFG` object.
 
         Args:
             inp_scalar_as_array:    Translate scalar _input_ arguments to arrays of length 1.
@@ -178,15 +130,9 @@ def translate_jaxpr(
                                         see `self.add_array()` for more.
             allow_empty_jaxpr:      Allows empty Jaxpr.
 
-        Returns:
-            The function will not return the SDFG directly.
-            Instead it will be wrapped inside a `TranslatedJaxprSDFG` instance.
-            That contains the SDFG and some meta data needed for further processing.
+        Notes:
+            Every time this function is called a new revision index is generated.
         """
-        if self.is_allocated():
-            raise RuntimeError(
-                "The translator driver is already allocated, you should resort to 'fork()'."
-            )
         if (len(jaxpr.eqns) == 0) and (not allow_empty_jaxpr):
             raise ValueError("Passed an empty Jaxpr, but did not allow for empty Jaxpr.")
         if not isinstance(jaxpr, jcore.ClosedJaxpr):
@@ -201,6 +147,11 @@ def translate_jaxpr(
         # Consume the hidden flags
         _clear_translation_ctx: bool = kwargs.pop("_clear_translation_ctx", True)
 
+        # NOTE: If `self` is already allocated, i.e. has an ongoing translation process
+        #       This function will create a new translation context. Thus the driver
+        #       will start to translate a second (nested) SDFG.
+        #       Also note that there is no mechanism that forces the integration of the
+        #       nested SDFG/Jaxpr.
         self._allocate_translation_ctx(
             name=name,
             reserved_names=reserved_names,
@@ -221,48 +172,6 @@ def translate_jaxpr(
 
         return jsdfg
 
-    def fork(self) -> JaxprTranslationDriver:
-        """Return a child of `self` ready for transformation.
-
-        The returned object should be seen as a partial clone if `self`. It will
-        have an unallocated translation context, but all other variables are schared.
-        To distinguish children all have a unique identifier, see `self.same_family()`.
-
-        The main reason for its function is to implement nested Jaxpr. If
-        `self.translate_jaxpr()` is called on the returned object it will behave
-        the exact same way as its parent would, with a different Jaxpr argument.
-
-        Notes:
-            A user has to ensure that the lifetime of a child ends before the
-                lifetime of its direct parent. In case of a head translator,
-                the lifetime of its children have to end before the translation
-                process finishes.
-            It is important that a clone instance should not be reused,
-                instead you should fork it again.
-        """
-        from copy import copy as scpy
-
-        if not self.is_allocated():
-            raise RuntimeError("Only allocated driver can fork.")
-
-        # Create a new (empty) driver instance; prevent allocation to make it cheep
-        dolly: JaxprTranslationDriver = JaxprTranslationDriver(_no_shared_alloc=True)
-
-        # Copy the shared members from parent to fork.
-        for slot_name in self.__shared_slots__:
-            setattr(dolly, slot_name, getattr(self, slot_name))
-
-        # Handle the special members and initialize them.
-        dolly._rev_idx = next(self._rev_manager)
-        assert not dolly.is_head_translator()
-
-        # We will now copy the reserved name list
-        #  Although they are shared, only their content is shared.
-        #  This prevents a feedback from the child to the parent.
-        dolly._reserved_names = scpy(self._reserved_names)
-
-        return dolly
-
     def append_new_state(
         self,
         label: str | None = None,
@@ -286,36 +195,24 @@ def append_new_state(
             assignments:    Symbol assignments that should be done during the transition.
             prev_state:     Alternative `SDFGState` at which we should append the new state.
 
-        Notes:
-            In case no `SDFGState` exists yet, an initial SDFGState will be created first.
         """
-        assert self._sdfg is not None
-
-        # Test if we must create a start state.
-        if self._sdfg.start_block is None:
-            assert all(
-                x is None for x in (self._init_sub_translators, self._term_sdfg_state, prev_state)
-            )
-            self._init_sdfg_state = self._sdfg.add_state(label="initial_state", is_start_block=True)
-            self._term_sdfg_state = self._init_sdfg_state
-
         # Decide if appending to that state will modify the terminal state.
         modify_term_state: bool = False
-        if (prev_state is self._term_sdfg_state) or (prev_state is None):
+        if (prev_state is self._ctx.terminal_state) or (prev_state is None):
             modify_term_state = True
-            app_state = self._term_sdfg_state
+            app_state = self._ctx.terminal_state
         else:
             app_state = prev_state
 
-        new_state = self._sdfg.add_state(label, is_start_block=False)
-        self._sdfg.add_edge(
+        new_state = self._ctx.sdfg.add_state(label, is_start_block=False)
+        self._ctx.sdfg.add_edge(
             app_state,
             new_state,
             dace.sdfg.InterstateEdge(condition=condition, assignments=assignments),
         )
 
         if modify_term_state:
-            self._term_sdfg_state = new_state
+            self._ctx.terminal_state = new_state
         return new_state
 
     def get_arrays(self) -> Mapping[str, ddata.Data]:
@@ -325,8 +222,7 @@ def get_arrays(self) -> Mapping[str, ddata.Data]:
             Essentially a shorthand and preferred way for `self.get_sdfg().arrays`.
             For getting a specific data descriptor use `self.get_array()`.
         """
-        assert self._sdfg is not None
-        return cast(Mapping[str, ddata.Data], self._sdfg.arrays)
+        return cast(Mapping[str, ddata.Data], self._ctx.sdfg.arrays)
 
     def get_array(
         self,
@@ -337,17 +233,15 @@ def get_array(
         If `name` is a string it is directly interpreted as the name of an SDFG variable.
         In case it is a `jax.core.Atom` it is first translated, see `self.map_jax_var_to_sdfg()`.
         """
-        assert self._sdfg is not None
-
         if isinstance(name, str):
             sdfg_name: str = name
         elif isinstance(name, (jcore.Var, jutil.JaCeVar)):
             sdfg_name = self.map_jax_var_to_sdfg(name)
         else:
             raise TypeError(f"Does not know how to handle '{type(name).__name__}'.")
-        if sdfg_name not in self._sdfg.arrays:
-            raise KeyError(f"Requested the SDFG array '{name}' but it is not known.")
-        return self._sdfg.arrays[sdfg_name]
+        if sdfg_name not in self._ctx.sdfg.arrays:
+            raise KeyError(f"Requested SDFG array '{name}' but it is not known.")
+        return self._ctx.sdfg.arrays[sdfg_name]
 
     @overload
     def map_jax_var_to_sdfg(
@@ -375,25 +269,20 @@ def map_jax_var_to_sdfg(
             jax_var:        The Jax variable to look up.
             allow_fail:     If mapping is not known return `None` instead of raise `KeyError`.
         """
-        assert self._jax_name_map is not None
-        assert isinstance(jax_var, (jcore.Atom, str, jutil.JaCeVar))
-
         if isinstance(jax_var, str):
             sdfg_name: str = jax_var
         elif isinstance(jax_var, jcore.Literal):
             raise RuntimeError("There is no SDFG variable for literal '{jax_var}'.")
-        elif jax_var in self._jax_name_map:
-            sdfg_name = self._jax_name_map[jax_var]
-            assert isinstance(sdfg_name, str)
+        elif jax_var in self._ctx.jax_name_map:
+            sdfg_name = self._ctx.jax_name_map[jax_var]
         elif allow_fail:
             return None
         else:
             KeyError(f"The Jax variable '{jax_var}' was never registered.")
-
-        if sdfg_name not in self._sdfg.arrays:
+        if sdfg_name not in self._ctx.sdfg.arrays:
             raise KeyError(
                 f"Jax variable '{jax_var}' was supposed to map to '{sdfg_name}',"
-                "but no such SDFG variable is known."
+                " but no such SDFG variable is known."
             )
         return sdfg_name
 
@@ -402,9 +291,7 @@ def get_sdfg(self) -> dace.SDFG:
 
         If you want access to the arrays of the SDFG use `self.get_arrays()`/`self.get_array()`.
         """
-        assert self._sdfg is not None
-        assert (self._init_sdfg_state is None) or (self._init_sdfg_state is self._sdfg.start_block)
-        return self._sdfg
+        return self._ctx.sdfg
 
     def get_terminal_sdfg_state(self) -> dace.SDFGState:
         """Returns the current terminal state of the SDFG under construction.
@@ -413,65 +300,37 @@ def get_terminal_sdfg_state(self) -> dace.SDFGState:
         New states are appended at the current terminal/end state and becoming the new terminal state.
         This function returns the current terminal state.
         """
-        assert all(x is not None for x in (self._sdfg, self._term_sdfg_state))
-        return self._term_sdfg_state
+        return self._ctx.terminal_state
 
     def is_allocated(self) -> bool:
-        """Tests if the translation context of `self` is allocated.
+        """Tests if `self` has an allocated context.
 
-        Notes:
-            It is safe to call this function any time.
-            If this function returns `True` it means that an allocation is ongoing.
+        If `self` is allocated then there is also an ongoing translation process.
         """
-        small_ctx: Sequence[Any] = [
-            # for the proper implementation of forking the reserved names are handled special.
-            getattr(self, x)
-            for x in self.__private_slots__
-            if x != "_rev_idx"
-        ]
-        assert isinstance(self._rev_idx, int)
         assert isinstance(self._sub_translators, dict)
-        if all((x is not None) for x in small_ctx):
-            if self._reserved_names is None:
-                raise RuntimeError("Invalid allocation state: Reserved names not allocated.")
+        if self._ctx is not None:
+            assert self._ctx_stack[-1] is self._ctx
             return True
-        if all((x is None) for x in small_ctx):
-            return False
-        raise RuntimeError("Invalid allocation state: Translation context partially allocated.")
+        assert len(self._ctx_stack) == 0  # type: ignore[unreachable]
+        return False
 
-    def is_head_translator(self) -> bool:
-        """Tests if `self` is a head translator.
+    def is_root_translator(self) -> bool:
+        """Tests if `self` is a root translator.
 
-        A head translator is a translator/driver that was created explicitly, i.e. not by `self.fork()`.
+        The root translator (context) is the very first translator process that was started.
         """
-        assert self._rev_manager is not None
-        assert self._rev_idx is not None
-        return self._rev_idx == 0
-
-    def same_family(
-        self,
-        other: JaxprTranslationDriver,
-    ) -> bool:
-        """Test if `self` and `other` belongs to the same family of driver/translators.
-
-        A driver is either explicitly created, i.e. head translator, or created by a call to `fork()`.
-        All drivers that descend from the same head translator from a family.
-        """
-        if not isinstance(other, JaxprTranslationDriver):
-            return NotImplemented  # type: ignore[unreachable]
-        if all(getattr(self, x) is getattr(self, x) for x in self.__shared_slots__):
+        if not self.is_allocated():
+            raise RuntimeError("Driver is not allocated.")
+        if self._ctx.rev_idx == 0:
+            assert len(self._ctx_stack) == 1
             return True
-        assert not any(getattr(self, x) is getattr(self, x) for x in self.__shared_slots__)
-
         return False
 
     def get_rev_idx(self) -> int:
-        """Returns the revision index of `self`.
-
-        To distinguish members of same family every diver has a unique identifier, known as revision.
-        However, the revision is only unique within a single family and during an ongoing translation.
-        """
-        return self._rev_idx
+        """Returns the revision index of `self`."""
+        if not self.is_allocated():
+            raise RuntimeError("Driver is not allocated.")
+        return self._ctx.rev_idx
 
     def add_jax_name_mapping(
         self,
@@ -489,12 +348,10 @@ def add_jax_name_mapping(
             jax_var:     The Jax variable.
             sdfg_name:   The name of the corresponding SDFG variable.
         """
-        assert self._jax_name_map is not None
-        assert isinstance(jax_var, (jcore.Var, jutil.JaCeVar))
         assert isinstance(sdfg_name, str) and (len(sdfg_name) > 0)  # noqa: PT018  # Should be one assertion.
 
-        if jax_var in self._jax_name_map:
-            if self._jax_name_map[jax_var] == sdfg_name:  # noops.
+        if jax_var in self._ctx.jax_name_map:
+            if self._ctx.jax_name_map[jax_var] == sdfg_name:  # noops.
                 return self
             raise ValueError(
                 f"Tried to create the mapping '{jax_var} -> {sdfg_name}', but '{jax_var}'"
@@ -505,7 +362,7 @@ def add_jax_name_mapping(
         if sdfg_name in self._forbidden_names:
             raise NameError(f"Mapping '{jax_var} -> {sdfg_name}': Forbidden name.")
 
-        self._jax_name_map[jax_var] = sdfg_name
+        self._ctx.jax_name_map[jax_var] = sdfg_name
         return self
 
     def add_reserved_names(
@@ -630,7 +487,7 @@ def add_array(
                 raise ValueError(
                     f"Specified 'force_jax_name', but passed '{name_prefix}' as 'name_prefix'."
                 )
-            alt_name = jutil._propose_jax_name(arg, self._jax_name_map)
+            alt_name = jutil._propose_jax_name(arg, self._ctx.jax_name_map)
         if alt_name is not None:
             assert isinstance(
                 alt_name, str
@@ -646,7 +503,7 @@ def add_array(
                 raise ValueError(
                     f"Specified 'name_prefix' ('{name_prefix}') but passed '{alt_name}' as 'alt_name'."
                 )
-            if alt_name in self._sdfg.arrays:
+            if alt_name in self._ctx.sdfg.arrays:
                 raise ValueError(f"Variable '{alt_name}' already exists.")
         if name_prefix is not None:
             assert isinstance(name_prefix, str)
@@ -674,7 +531,7 @@ def add_array(
         if alt_name is not None:
             prop_name = alt_name  # Just for completion: will be ignored later
         elif isinstance(arg, (jcore.Var, jutil.JaCeVar)):
-            prop_name = jutil._propose_jax_name(arg, self._jax_name_map)
+            prop_name = jutil._propose_jax_name(arg, self._ctx.jax_name_map)
             if prop_name.startswith("__"):
                 raise ValueError(
                     f"You tried to create the variable '{prop_name}' which"
@@ -692,7 +549,9 @@ def add_array(
         if alt_name is None:
             # If we are the root translator, then we will use `prop_name` directly;
             #  otherwise we will append the revision of `self` to the name.
-            arg_name = prop_name + ("" if self.is_head_translator() else f"_rev_idx{self._rev_idx}")
+            arg_name = prop_name + (
+                "" if self.is_root_translator() else f"_rev_idx{self._ctx.rev_idx}"
+            )
         else:
             arg_name = str(alt_name)
 
@@ -711,7 +570,7 @@ def add_array(
                 if (
                     (_arg_name in self._forbidden_names)
                     or (_arg_name in self._reserved_names)
-                    or (_arg_name in self._sdfg.arrays)
+                    or (_arg_name in self._ctx.sdfg.arrays)
                 ):
                     continue  # The proposed variable is known, so try next value.
                 arg_name = _arg_name  # We found a name that we can use.
@@ -723,7 +582,7 @@ def add_array(
         # Final name check
         if arg_name in self._forbidden_names:
             raise ValueError(f"Can't create variable '{arg_name}', name is forbidden.")
-        if arg_name in self._sdfg.arrays:
+        if arg_name in self._ctx.sdfg.arrays:
             raise ValueError(f"Can't create variable '{arg_name}', variable is already created.")
         if not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", arg_name):
             raise ValueError(f"The requested variable name '{arg_name}' is invalid.")
@@ -747,11 +606,11 @@ def add_array(
             ]
 
         if is_scalar:
-            self._sdfg.add_scalar(
+            self._ctx.sdfg.add_scalar(
                 name=arg_name, storage=storage, dtype=dtype, transient=as_transient
             )
         elif as_view:
-            self._sdfg.add_view(
+            self._ctx.sdfg.add_view(
                 name=arg_name,
                 shape=shape,
                 strides=strides,
@@ -760,7 +619,7 @@ def add_array(
                 dtype=dtype,
             )
         else:
-            self._sdfg.add_array(
+            self._ctx.sdfg.add_array(
                 name=arg_name,
                 shape=shape,
                 strides=strides,
@@ -803,10 +662,9 @@ def create_jax_var_list(
             handle_literals:    Allow the processing of literals.
             kwargs:             Will be forwarded to `self.add_array()` if a variable as to be created,
         """
-        assert self._jax_name_map is not None
-        assert "update_var_mapping" not in kwargs
         if only_creation and prevent_creation:
             raise ValueError("Specified both 'only_creation' and 'prevent_creation'.")
+        assert "update_var_mapping" not in kwargs
 
         ret_list: list[None | str] = []
         for jax_var in jax_var_list:
@@ -850,28 +708,28 @@ def _create_initial_input(
         Notes:
             This function will fill the internal list of inputs.
         """
-        assert self.is_allocated()
-        assert len(jaxpr.jaxpr.invars)
 
-        if len(self._sdfg_in_names) != 0:
+        if not self.is_allocated():
+            raise RuntimeError("Driver is not allocated, can not create constants.")
+        if len(self._ctx.inp_names) != 0:
             raise RuntimeError("Called '_create_initial_input()' twice?")
-        assert len(self._sdfg_out_names) == 0
+        assert len(self._ctx.out_names) == 0
 
         # Handle the initial input arguments
-        sdfg: dace.SDFG = self._sdfg
+        sdfg: dace.SDFG = self._ctx.sdfg
         init_in_var_names: Sequence[str] = self.create_jax_var_list(  # type: ignore[assignment]
             jax_var_list=jaxpr.jaxpr.invars,
             only_creation=True,
             as_transient=True,  # Explicit transient; no error!
             handle_literals=False,  # Initial arguments are never literals
             force_array=inp_scalar_as_array,
-            force_jax_name=self.is_head_translator(),  # Ensure head get pure Jax names.
+            force_jax_name=self.is_root_translator(),  # Ensure root get pure Jax names.
         )
         sdfg.arg_names.extend(init_in_var_names)
 
         # Store the list of inputs in self; this is done to simplify exporting.
         #  The output list is populated by `self._translate_jaxpr_internal()`
-        self._sdfg_in_names = tuple(init_in_var_names)
+        self._ctx.inp_names = tuple(init_in_var_names)
 
         return init_in_var_names
 
@@ -889,7 +747,8 @@ def _create_constants(
         """
         from copy import deepcopy
 
-        assert self.is_allocated()
+        if not self.is_allocated():
+            raise RuntimeError("Driver is not allocated, can not create constants.")
         if not len(jaxpr.consts):
             return []
 
@@ -904,7 +763,9 @@ def _create_constants(
                 update_var_mapping=True,
             )
             # We have to pass the data descriptor to `add_constant()`, otherwise a new one would be created.
-            self._sdfg.add_constant(c_sdfg_name, deepcopy(cValue), self._sdfg.arrays[c_sdfg_name])
+            self._ctx.sdfg.add_constant(
+                c_sdfg_name, deepcopy(cValue), self._ctx.sdfg.arrays[c_sdfg_name]
+            )
             const_names.append(c_sdfg_name)
         return const_names
 
@@ -915,31 +776,39 @@ def _allocate_translation_ctx(
     ) -> JaxprTranslationDriver:
         """This function allocates and initialize the members of the translation context of `self`.
 
-        After this function is called, `self` is said to have an ongoing translation process.
+        If this function is called and `self` is already allocated, the function will create a new context.
+        This allows the driver to handle nested Jaxpr.
+        The first context that is created is also known as root translator.
 
         Args:
             name:               The name of the SDFG.
             reserved_names:     Add these name to the set of resered names of `self`.
         """
-        if self.is_allocated():
-            raise RuntimeError("The translator is already allocated.")
+        from ._translation_context import _TranslationContext
+
         if name and (not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", name)):
             raise ValueError(f"The provided name '{name}' for the SDFG is invalid.")
 
-        self._sdfg = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
-        self._init_sdfg_state = self._sdfg.add_state(label="initial_state", is_start_block=True)
-        self._term_sdfg_state = self._init_sdfg_state
-        self._jax_name_map = {}
-        self._sdfg_in_names = ()
-        self._sdfg_out_names = ()
-
-        # If the reserved names are already allocated then keep them.
-        #  This is needed to preserve them among forks.
-        if self._reserved_names is None:
-            self._reserved_names = set()  # type: ignore[unreachable]
-        elif not isinstance(self._reserved_names, set):
-            raise RuntimeError("The reserved names are allocated incorrectly.")
-        return self.add_reserved_names(reserved_names)
+        # Create a new translation context and put it on the stack.
+        self._ctx = _TranslationContext(
+            rev_idx=next(self._rev_manager),
+            name=name,
+        )
+        self._ctx_stack.append(self._ctx)
+
+        if self.is_root_translator():
+            # The root translation, i.e. the very first context allocation
+            #  Thus we also have to allocate the additional members
+            #  which are shared among all contexts.
+            self._reserved_names = set()
+            self.add_reserved_names(reserved_names)
+
+        else:
+            # We are in a nested context.
+            #  We might have to update the reserved names.
+            self.add_reserved_names(reserved_names)
+
+        return self
 
     def _init_sub_translators(
         self,
@@ -975,33 +844,25 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
         Notes:
             While it is allowed for outside code to call this explicitly function,
                 it is is most likely an error.
-            If this function is called on a head translator, then the translation
-                process ends. This implies that all direct and indirect children,
-                i.e. output of `self.fork()` must already be deallocated. A further
-                side effect is that now revision indexes might be reused.
             If `self` is not allocated this function acts as a noops.
-            The reserved names are only deallocated if `self` is a head translator.
+            The reserved names are only deallocated if `self` is a root translator.
         """
         if not self.is_allocated():
             return self
-        self._sdfg = None
-        self._init_sdfg_state = None
-        self._term_sdfg_state = None
-        self._jax_name_map = None  # type: ignore[assignment]
-        self._sdfg_in_names = None  # type: ignore[assignment]
-        self._sdfg_out_names = None  # type: ignore[assignment]
-
-        if self.is_head_translator():
-            # We are the head translator thus we reset the revision manager.
-            #  Since this function is only called at the very end, we know that the translation
-            #  process as a whole has finished. We reset the state that the numbers are small
-            #  again when we start anew.
-            self._rev_manager = itertools.count(0, 1)
 
-            # Freeing the reserved names only for heads make it more safe in case a child
-            #  translator is reused.c On the other hand reusing a child translator is
-            #  discouraged, but not forbidden.
+        assert self._ctx is self._ctx_stack[-1], "Inconsistent stack detected."
+        if self.is_root_translator():
+            self._rev_manager = itertools.count(0, 1)
             self._reserved_names = None  # type: ignore[assignment]
+
+            self._ctx = None  # type: ignore[assignment]
+            self._ctx_stack.pop()
+
+        else:
+            # Restore the previous state
+            assert len(self._ctx_stack) > 1
+            self._ctx_stack.pop()
+            self._ctx = self._ctx_stack[-1]
         return self
 
     def _find_sub_translator_for(
@@ -1079,7 +940,7 @@ def _translate_single_eqn(
 
         # Determine the new (tentative) terminal state of the SDFG we are building.
         if new_sdfg_term_state is None:
-            if eqn_state is not self._term_sdfg_state:
+            if eqn_state is not self._ctx.terminal_state:
                 raise RuntimeError("Inconsistent terminal state was detected.")
             new_sdfg_term_state = eqn_state
         elif isinstance(new_sdfg_term_state, dace.SDFGState):
@@ -1124,8 +985,8 @@ def _translate_single_eqn(
                     f" is of type '{type(sdfg_var).__name__}' which I does not know how to handle."
                 )
 
-        # Modify terminal head state of 'self'
-        self._term_sdfg_state = new_sdfg_term_state
+        # Modify terminal root state of 'self'
+        self._ctx.terminal_state = new_sdfg_term_state
 
         return (in_var_names, out_var_names)
 
@@ -1168,7 +1029,7 @@ def _translate_jaxpr_internal(
         if nb_translated_eqn == 0:
             # There were no equation, so handle the copying of input to output.
             out_var_names = self._handle_null_jaxpr(jaxpr)
-        self._sdfg_out_names = tuple(out_var_names)
+        self._ctx.out_names = tuple(out_var_names)
 
         return self._export_context()
 
@@ -1180,16 +1041,16 @@ def _export_context(self) -> jtrans.TranslatedJaxprSDFG:
         To free the context of `self` use `self._clear_translation_ctx()`.
         """
         assert self.is_allocated()
-        assert all((isinstance(x, str) and (len(x) > 0)) for x in self._sdfg_in_names)
-        assert all((isinstance(x, str) and (len(x) > 0)) for x in self._sdfg_out_names)
+        assert all((isinstance(x, str) and (len(x) > 0)) for x in self._ctx.inp_names)
+        assert all((isinstance(x, str) and (len(x) > 0)) for x in self._ctx.out_names)
 
         return jtrans.TranslatedJaxprSDFG(
-            sdfg=self._sdfg,
-            start_state=self._init_sdfg_state,
-            terminal_state=self._term_sdfg_state,
-            jax_name_map=self._jax_name_map,
-            inp_names=self._sdfg_in_names,
-            out_names=self._sdfg_out_names,
+            sdfg=self._ctx.sdfg,
+            start_state=self._ctx.start_state,
+            terminal_state=self._ctx.terminal_state,
+            jax_name_map=self._ctx.jax_name_map,
+            inp_names=self._ctx.inp_names,
+            out_names=self._ctx.out_names,
         )
 
     def _handle_null_jaxpr(
@@ -1211,9 +1072,9 @@ def _handle_null_jaxpr(
         if len(jaxpr.out_avals) == 0:
             # There is not output so we do not have to copy anything around.
             return ()
-        assert self._term_sdfg_state is self._init_sdfg_state
-        assert len(self._sdfg_in_names) > 0
-        assert len(self._sdfg_out_names) == 0
+        assert self._ctx.terminal_state is self._ctx.start_state
+        assert len(self._ctx.inp_names) > 0
+        assert len(self._ctx.out_names) == 0
 
         # We will use this list to build the list of output names.
         #  This is important for the exporter.
@@ -1247,9 +1108,9 @@ def _handle_null_jaxpr(
             out_var_names.append(jax_out_name)
 
             # Now copy the input into the fake output variable.
-            inp_acc = self._init_sdfg_state.add_read(self.map_jax_var_to_sdfg(jax_inp_name))
-            out_acc = self._init_sdfg_state.add_write(self.map_jax_var_to_sdfg(jax_out_var))
-            self._init_sdfg_state.add_nedge(
+            inp_acc = self._ctx.start_state.add_read(self.map_jax_var_to_sdfg(jax_inp_name))
+            out_acc = self._ctx.start_state.add_write(self.map_jax_var_to_sdfg(jax_out_var))
+            self._ctx.start_state.add_nedge(
                 src=inp_acc,
                 dst=out_acc,
                 data=dace.Memlet.from_array(
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index b0562e6..8e6fb78 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -29,7 +29,11 @@ class TranslatedJaxprSDFG:
     - `inp_names` a `list` of the SDFG variables that are used as input, in the same order as `Jaxpr.invars`.
     - `out_names` a `list` of the SDFG variables that are used as output, in the same order as `Jaxpr.outvars`.
 
-    Note that `inp_names` and `out_names` may not be disjunct.
+    The SDFG is in a so called canonical form, that is not directly usable, see `JaxprTranslationDriver` for more.
+
+    It might be that a name appears in both the `inp_names` and `out_names` list.
+    This happens if the corresponding variable is used as both input and output.
+    In Jax this is called argument donation.
     """
 
     sdfg: dace.SDFG

From f3368124225eb1cf47bcffe061d0c7f6e43fb805 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 2 May 2024 14:58:59 +0200
Subject: [PATCH 080/458] Updated the translated SDFG object.

It is no longer frozen and some attributes are no loger requiered.
This is because the SDFG has to be modified anyway later.
Furthermore it made it distinct from the context.
---
 src/jace/translator/translated_jaxpr_sdfg.py | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 8e6fb78..b2b7dc8 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -17,15 +17,15 @@
 from jace import util as jutil
 
 
-@dataclass(init=True, repr=True, eq=False, frozen=True, kw_only=True, slots=True)
+@dataclass(init=True, repr=True, eq=False, frozen=False, kw_only=True, slots=True)
 class TranslatedJaxprSDFG:
     """Encapsulates the result of a translation run of the `JaxprTranslationDriver` object.
 
     It defines the following members:
     - `sdfg` the SDFG object that was created.
+    - `jax_name_map` a `dict` that maps every Jax variable to its corresponding SDFG variable _name_.
     - `start_state` the first state in the SDFG state machine.
     - `terminal_state` the last state in the state machine.
-    - `jax_name_map` a `dict` that maps every Jax variable to its corresponding SDFG variable _name_.
     - `inp_names` a `list` of the SDFG variables that are used as input, in the same order as `Jaxpr.invars`.
     - `out_names` a `list` of the SDFG variables that are used as output, in the same order as `Jaxpr.outvars`.
 
@@ -37,11 +37,11 @@ class TranslatedJaxprSDFG:
     """
 
     sdfg: dace.SDFG
-    start_state: dace.SDFGState
-    terminal_state: dace.SDFGState
     jax_name_map: Mapping[jcore.Var | jutil.JaCeVar, str]
-    inp_names: Sequence[str]
-    out_names: Sequence[str]
+    start_state: dace.SDFGState | None = None
+    terminal_state: dace.SDFGState | None = None
+    inp_names: Sequence[str] | None = None
+    out_names: Sequence[str] | None = None
 
     def validate(self) -> bool:
         """Validate the underlying SDFG."""

From 67d963a125920b4d805c5bbf8719d3f327892cfa Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 2 May 2024 15:34:27 +0200
Subject: [PATCH 081/458] Implemented Enrique's suggestions about the type
 traits.

---
 .../translator/jaxpr_translator_driver.py     |  2 +-
 src/jace/util/__init__.py                     |  6 ++--
 src/jace/util/traits.py                       | 20 +++++++++++
 src/jace/util/util.py                         | 36 ++++++++++---------
 4 files changed, 45 insertions(+), 19 deletions(-)
 create mode 100644 src/jace/util/traits.py

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index a336946..5a9003a 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -827,7 +827,7 @@ def _init_sub_translators(
         sub_translators: dict[str, jtrans.PrimitiveTranslator] = {}
         for sub_translator_cls in _get_subtranslators_cls():
             sub_translator: jtrans.PrimitiveTranslator = sub_translator_cls.CREATE(**subtrans_args)
-            handled_primitives: Iterable[str] = jutil.ensure_iterability(
+            handled_primitives: Iterable[str] = jutil.as_sequence(
                 sub_translator.get_handled_primitive()
             )
             for handled_primitive in handled_primitives:
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 29c5276..f6aa78f 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -21,15 +21,17 @@
     is_tracing_ongoing,
     translate_dtype,
 )
-from .util import ensure_iterability, is_jaceified
+from .traits import is_non_string_iterable
+from .util import as_sequence, is_jaceified
 
 
 __all__ = [
-    "ensure_iterability",
+    "as_sequence",
     "is_drop_var",
     "is_tracing_ongoing",
     "is_jaceified",
     "is_jaxified",
+    "is_non_string_iterable",
     "JaCeVar",
     "get_jax_var_name",
     "get_jax_var_shape",
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
new file mode 100644
index 0000000..0ec5909
--- /dev/null
+++ b/src/jace/util/traits.py
@@ -0,0 +1,20 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Contains all traits function needed inside JaCe."""
+
+from __future__ import annotations
+
+from collections.abc import Iterable
+from typing import Any, TypeGuard
+
+
+class NonStringIterable(Iterable): ...
+
+
+def is_non_string_iterable(val: Any) -> TypeGuard[NonStringIterable]:
+    return isinstance(val, Iterable) and not isinstance(val, str)
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index c58a691..cc575ab 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -8,26 +8,30 @@
 from __future__ import annotations
 
 from collections.abc import Iterable
-from typing import Any
+from typing import Any, TypeVar, cast, overload
 
 
-def ensure_iterability(
-    x: Any,
-    ign_str: bool = True,
-) -> Iterable[Any]:
-    """Ensures that `x` is iterable.
+_T = TypeVar("_T")
 
-    By default strings are _not_ considered iterable.
 
-    Args:
-        x:          To test.
-        ign_str:    Ignore that a string is iterabile.
-    """
-    if ign_str and isinstance(x, str):
-        x = [x]
-    elif isinstance(x, Iterable):
-        pass
-    return x
+@overload
+def as_sequence(value: str) -> Iterable[str]: ...
+
+
+@overload
+def as_sequence(value: Iterable[_T]) -> Iterable[_T]: ...
+
+
+@overload
+def as_sequence(value: _T) -> Iterable[_T]: ...
+
+
+def as_sequence(value: _T | Iterable[_T]) -> Iterable[_T]:
+    from jace.util.traits import is_non_string_iterable
+
+    if is_non_string_iterable(value):
+        return value
+    return cast(Iterable[_T], [value])
 
 
 def is_jaceified(obj: Any) -> bool:

From 253b948af39c5ffa9e758f3435988d49a98e00a1 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 2 May 2024 15:43:28 +0200
Subject: [PATCH 082/458] Remodeled the type trait part of teh util package.

---
 src/jace/util/__init__.py   |  6 ++---
 src/jace/util/jax_helper.py | 32 ++-----------------------
 src/jace/util/traits.py     | 48 +++++++++++++++++++++++++++++++++++++
 src/jace/util/util.py       | 16 +------------
 4 files changed, 53 insertions(+), 49 deletions(-)

diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index f6aa78f..a161184 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -16,13 +16,11 @@
     get_jax_var_dtype,
     get_jax_var_name,
     get_jax_var_shape,
-    is_drop_var,
-    is_jaxified,
     is_tracing_ongoing,
     translate_dtype,
 )
-from .traits import is_non_string_iterable
-from .util import as_sequence, is_jaceified
+from .traits import is_drop_var, is_jaceified, is_jaxified, is_non_string_iterable
+from .util import as_sequence
 
 
 __all__ = [
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 44304f1..b02a7de 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -137,26 +137,6 @@ def is_tracing_ongoing(
     return any(isinstance(x, jcore.Tracer) for x in chain(args, kwargs.values()))
 
 
-def is_jaxified(obj: Any) -> bool:
-    """Tests if `obj` is a "jaxified" object.
-
-    A "jexified" object is an object that was processed by Jax.
-    While a return value of `True` guarantees a jaxified object,
-    `False` might not proof the contrary.
-    """
-    import jaxlib
-    from jax._src import pjit as jaxpjit
-
-    # These are all types we consider as jaxify
-    jaxifyed_types = (
-        jcore.Primitive,
-        # jstage.Wrapped is not runtime chakable
-        jaxpjit.JitWrapped,
-        jaxlib.xla_extension.PjitFunction,
-    )
-    return isinstance(obj, jaxifyed_types)
-
-
 def translate_dtype(dtype: Any) -> dace.typeclass:
     """Turns a Jax datatype into a DaCe datatype."""
     if isinstance(dtype, dace.typeclass):
@@ -181,16 +161,6 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
             return dace.dtype_to_typeclass(dtype)
 
 
-def is_drop_var(jax_var: jcore.Atom | JaCeVar) -> bool:
-    """Tests if `jax_var` is a drop variable."""
-
-    if isinstance(jax_var, jcore.DropVar):
-        return True
-    if isinstance(jax_var, JaCeVar):
-        return jax_var.name == "_"
-    return False
-
-
 def _propose_jax_name(
     jax_var: jcore.Atom | JaCeVar,
     jax_name_map: Mapping[jcore.Var | JaCeVar, Any] | None = None,
@@ -211,6 +181,8 @@ def _propose_jax_name(
         The naming of variables are only consistent with the inner most Jaxpr a variable is defined in.
         Dropped variables will always be named `'_'`.
     """
+    from jace.util.traits import is_drop_var
+
     if is_drop_var(jax_var):
         return "_"
     if isinstance(jax_var, jcore.Literal):
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 0ec5909..417cdcb 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -12,9 +12,57 @@
 from collections.abc import Iterable
 from typing import Any, TypeGuard
 
+from jax import core as jcore
+
+from jace import util as jutil
+
 
 class NonStringIterable(Iterable): ...
 
 
 def is_non_string_iterable(val: Any) -> TypeGuard[NonStringIterable]:
     return isinstance(val, Iterable) and not isinstance(val, str)
+
+
+def is_jaceified(obj: Any) -> bool:
+    """Tests if `obj` is decorated by JaCe.
+
+    Similar to `jace.util.is_jaxified`, but for JaCe object.
+    """
+    from jace import jax as jjax, util as jutil
+
+    if jutil.is_jaxified(obj):
+        return False
+    # Currently it is quite simple because we can just check if `obj`
+    #  is derived from `jace.jax.JitWrapped`, might become harder in the future.
+    return isinstance(obj, jjax.JitWrapped)
+
+
+def is_drop_var(jax_var: jcore.Atom | jutil.JaCeVar) -> bool:
+    """Tests if `jax_var` is a drop variable."""
+
+    if isinstance(jax_var, jcore.DropVar):
+        return True
+    if isinstance(jax_var, jutil.JaCeVar):
+        return jax_var.name == "_"
+    return False
+
+
+def is_jaxified(obj: Any) -> bool:
+    """Tests if `obj` is a "jaxified" object.
+
+    A "jexified" object is an object that was processed by Jax.
+    While a return value of `True` guarantees a jaxified object,
+    `False` might not proof the contrary.
+    """
+    import jaxlib
+    from jax._src import pjit as jaxpjit
+
+    # These are all types we consider as jaxify
+    jaxifyed_types = (
+        jcore.Primitive,
+        # jstage.Wrapped is not runtime chakable
+        jaxpjit.JitWrapped,
+        jaxlib.xla_extension.PjitFunction,
+    )
+    return isinstance(obj, jaxifyed_types)
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index cc575ab..3943743 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -8,7 +8,7 @@
 from __future__ import annotations
 
 from collections.abc import Iterable
-from typing import Any, TypeVar, cast, overload
+from typing import TypeVar, cast, overload
 
 
 _T = TypeVar("_T")
@@ -32,17 +32,3 @@ def as_sequence(value: _T | Iterable[_T]) -> Iterable[_T]:
     if is_non_string_iterable(value):
         return value
     return cast(Iterable[_T], [value])
-
-
-def is_jaceified(obj: Any) -> bool:
-    """Tests if `obj` is decorated by JaCe.
-
-    Similar to `jace.util.is_jaxified`, but for JaCe object.
-    """
-    from jace import jax as jjax, util as jutil
-
-    if jutil.is_jaxified(obj):
-        return False
-    # Currently it is quite simple because we can just check if `obj`
-    #  is derived from `jace.jax.JitWrapped`, might become harder in the future.
-    return isinstance(obj, jjax.JitWrapped)

From 75ca97e8d8051ce4f4db24dd935363891ed88722 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 2 May 2024 15:45:10 +0200
Subject: [PATCH 083/458] Updated some checks in the driver.

---
 src/jace/translator/jaxpr_translator_driver.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 5a9003a..2b8da49 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -1018,9 +1018,9 @@ def _translate_jaxpr_internal(
             assert len(eqn.effects) == 0
             if len(eqn.outvars) == 0:  # Do we need this special case.
                 continue  #  Looks more like internal Jax error.
-            if any(jutil.get_jax_var_name(outVar) == "_" for outVar in eqn.outvars):
+            if any(jutil.is_drop_var(outVar) for outVar in eqn.outvars):
                 assert (len(eqn.outvars) == 1) or all(
-                    jutil.get_jax_var_name(outVar) == "_" for outVar in eqn.outvars
+                    jutil.is_drop_var(outVar) for outVar in eqn.outvars
                 )
                 continue
             _, out_var_names = self._translate_single_eqn(jaxpr=jaxpr, eqn=eqn)

From f9d76f4bd6b7f16dcdfa7186ca453838c37560bc Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 3 May 2024 08:07:22 +0200
Subject: [PATCH 084/458] Updated the primitive translator interface.

The primitivs that are handled are now implemented as a property.
The methods are now abstract.
---
 src/jace/translator/jaxpr_translator_driver.py  |  5 ++---
 src/jace/translator/primitive_translator.py     | 17 +++++++++--------
 .../sub_translators/alu_translator.py           |  3 ++-
 3 files changed, 13 insertions(+), 12 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 2b8da49..0dbb257 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -827,9 +827,8 @@ def _init_sub_translators(
         sub_translators: dict[str, jtrans.PrimitiveTranslator] = {}
         for sub_translator_cls in _get_subtranslators_cls():
             sub_translator: jtrans.PrimitiveTranslator = sub_translator_cls.CREATE(**subtrans_args)
-            handled_primitives: Iterable[str] = jutil.as_sequence(
-                sub_translator.get_handled_primitive()
-            )
+            handled_primitives: Iterable[str] = jutil.as_sequence(sub_translator.primitive)
+
             for handled_primitive in handled_primitives:
                 if handled_primitive in sub_translators:
                     raise RuntimeError(f"Multiple sub_translators for '{handled_primitive}' found.")
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index 3d9cb5d..816b709 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -7,6 +7,7 @@
 
 from __future__ import annotations
 
+from abc import abstractmethod
 from collections.abc import Sequence
 from typing import TYPE_CHECKING, Any, Protocol, runtime_checkable
 
@@ -41,23 +42,25 @@ class PrimitiveTranslator(Protocol):
     __slots__ = ()
 
     @classmethod
+    @abstractmethod
     def CREATE(
         cls,
         *args: Any,
         **kwargs: Any,
     ) -> PrimitiveTranslator:
         """Creates an instance of a subtranslator."""
-        raise NotImplementedError("Class '{type(self).__name__}' does not implement 'CREATE()'.")
+        ...
 
-    def get_handled_primitive(self) -> str | Sequence[str]:
+    @property
+    @abstractmethod
+    def primitive(self) -> str | Sequence[str]:
         """Returns the names of the Jax primitive that `self` is able to handle.
 
         In case `self` can handle multiple primitives, it should return a list with these names.
         """
-        raise NotImplementedError(
-            "Class '{type(self).__name__}' does not implement 'get_handled_primitive()'."
-        )
+        ...
 
+    @abstractmethod
     def translate_jaxeqn(
         self,
         driver: JaxprTranslationDriver,
@@ -113,6 +116,4 @@ def translate_jaxeqn(
             eqn_state:      State into which the primitive`s SDFG representation
                                 should be constructed.
         """
-        raise NotImplementedError(
-            "Class '{type(self).__name__}' does not implement 'translate_jaxeqn()'."
-        )
+        ...
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index bbaf469..b08e474 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -83,8 +83,9 @@ def __init__(self, **kwargs: Any) -> None:
         """Initialize the `ALUTranslator`."""
         super().__init__(**kwargs)
 
+    @property
     @override
-    def get_handled_primitive(self) -> Sequence[str]:
+    def primitive(self) -> Sequence[str]:
         """Returns the list of all known primitives."""
         return list(self._unary_ops.keys()) + list(self._binary_ops.keys())
 

From b1e8459c47d70e02da43acd2a2f03b9b754dc543 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 3 May 2024 08:27:19 +0200
Subject: [PATCH 085/458] Updated the sub translator module.

Removed the functions.
---
 .../translator/sub_translators/__init__.py    | 66 ++++---------------
 1 file changed, 11 insertions(+), 55 deletions(-)

diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
index 5812dbb..ec3be8d 100644
--- a/src/jace/translator/sub_translators/__init__.py
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -10,25 +10,17 @@
 from __future__ import annotations
 
 from collections.abc import Sequence
-from typing import TYPE_CHECKING, Final
 
-
-if TYPE_CHECKING:
-    from jace import translator as jtrans
+from jace import translator as jtrans
 
 from .alu_translator import ALUTranslator
 
 
 # List of all subtranslators that ships with JaCe.
-_BUILTIN_SUBTRANSLATORS: Final[list[type[jtrans.PrimitiveTranslator]]] = [
+_KNOWN_SUBTRANSLATORS: list[type[jtrans.PrimitiveTranslator]] = [
     ALUTranslator,
 ]
 
-# All externally supplied subtranslator implementation.
-#  It is a `dict` to do fast access and remember the order, value is always `None`.
-#  The list is manipulated through `{add,rm}_subtranslator()`.
-_EXTERNAL_SUBTRANSLATORS: dict[type[jtrans.PrimitiveTranslator], None] = {}
-
 
 def add_subtranslator(
     subtrans: type[jtrans.PrimitiveTranslator],
@@ -37,60 +29,24 @@ def add_subtranslator(
 
     The function returns `True` if it was added and `False` is not.
     """
-    from inspect import isclass
-
-    from jace.translator import PrimitiveTranslator  # Import cycle
-
-    if subtrans in _EXTERNAL_SUBTRANSLATORS:
+    # NOTE: Because `PrimitiveTranslator` has a property, it is not possible to use
+    #         `issubclass()` here, to check if the interface is ready implemented.
+    if subtrans in _KNOWN_SUBTRANSLATORS:
+        # TODO: Consider moving `subtrans` to the front (last element).
         return False
-    if not isclass(subtrans):
-        return False
-    if not issubclass(subtrans, PrimitiveTranslator):
-        return False
-    _EXTERNAL_SUBTRANSLATORS[subtrans] = None
+    _KNOWN_SUBTRANSLATORS.append(subtrans)
     return True
 
 
-def rm_subtranslator(
-    subtrans: type[jtrans.PrimitiveTranslator],
-    strict: bool = False,
-) -> bool:
-    """Remove `subtrans` as externally defined subtranslators.
-
-    If `subtrans` is not known no error is generated unless `strict` is set to `True`.
-    """
-    if subtrans not in _EXTERNAL_SUBTRANSLATORS:
-        if strict:
-            raise KeyError(f"Subtranslator '{type(subtrans)}' is not known.")
-        return False
-    del _EXTERNAL_SUBTRANSLATORS[subtrans]
-    return True
-
-
-def _get_subtranslators_cls(
-    with_external: bool = True,
-    builtins: bool = True,
-) -> Sequence[type[jtrans.PrimitiveTranslator]]:
+def _get_subtranslators_cls() -> Sequence[type[jtrans.PrimitiveTranslator]]:
     """Returns the list of all subtranslator known to JaCe.
 
-    Args:
-        with_external:  Include the translators that were externally supplied.
-        builtins:       Include the build in translators.
-
-    Notes:
-        If the externally defined subtranslators are requested they will be
-            first and ordered as FILO order.
+    The translators are returned in FIFO order.
     """
-    ret: list[type[jtrans.PrimitiveTranslator]] = []
-    if with_external:
-        # Guarantees that we get them in FIFO order.
-        ret.extend(reversed(_EXTERNAL_SUBTRANSLATORS.keys()))
-    if builtins:
-        ret.extend(_BUILTIN_SUBTRANSLATORS)
-    return ret
+    return list(reversed(_KNOWN_SUBTRANSLATORS))
 
 
 __all__ = [
+    "ALUTranslator",
     "add_subtranslator",
-    "rm_subtranslator",
 ]

From 87c43f6d7baaf6d112bbaf1f1d69dd6b35a96f3d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 3 May 2024 08:55:43 +0200
Subject: [PATCH 086/458] Updated some tests.

---
 tests/test_subtranslator_helper.py | 151 ++++++++---------------------
 1 file changed, 42 insertions(+), 109 deletions(-)

diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 92b0669..4c7ddd8 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -9,11 +9,6 @@
 
 from __future__ import annotations
 
-from collections.abc import Collection
-from typing import Any
-
-import pytest
-
 from jace import translator as jtrans
 
 
@@ -22,112 +17,50 @@ def test_subtranslatior_managing():
     from jace.translator.sub_translators import (
         _get_subtranslators_cls,
         add_subtranslator,
-        rm_subtranslator,
     )
 
-    class ValidSubTrans(jtrans.PrimitiveTranslator):
-        def __init__(self, *args, **kwargs):
-            super().__init__(*args, **kwargs)
-
-    class ValidSubTrans2(jtrans.PrimitiveTranslator):
-        def __init__(self, *args, **kwargs):
-            super().__init__(*args, **kwargs)
-
-    class InvalidSubTrans:
-        def __init__(self): ...
-        def get_handled_primitives(self) -> Collection[str] | str:
-            return "add"
-
-        def can_translate_jaxeqn(self, *args: Any, **kwargs: Any):  # noqa: ARG002  # Unused arguments
-            return False
-
-        def translate_jaxeqn(self, *args: Any, **kwargs: Any):
-            raise NotImplementedError()
-
-        def get_priority(self) -> int:
-            return 0
-
-        def has_default_priority(self) -> bool:
-            return False
-
-        def __lt__(self, other: Any) -> bool:
-            return NotImplemented
-
-        def __eq__(self, other: Any) -> bool:
-            return id(self) == id(other)
-
-        def __hash__(self) -> int:
-            return id(self)
-
-        def __ne__(self, other: Any) -> bool:
-            return NotImplemented
-
-        def __le__(self, other: Any) -> bool:
-            return NotImplemented
-
-        def __ge__(self, other: Any) -> bool:
-            return NotImplemented
-
-        def __gt__(self, other: Any) -> bool:
-            return NotImplemented
-
-    #
-
-    # Test the initial conditions
-    builtin_subtrans = _get_subtranslators_cls(with_external=False)
-    curr_external_subtrans = _get_subtranslators_cls(builtins=False)
-    exp_curr_external_subtrans = []
-    assert (
-        curr_external_subtrans == exp_curr_external_subtrans
-    ), f"Expected no external subtranslators but found: {builtin_subtrans}"
-    assert (
-        len(builtin_subtrans) != 0
-    ), "Expected to have some builtin subtranslator, but there were none."
-    assert builtin_subtrans is not _get_subtranslators_cls()  # Ensures no sharing
-
-    # Add a subtranslator to the internal list
-    assert add_subtranslator(ValidSubTrans), "Failed to add 'ValidSubTrans'"
-    exp_curr_external_subtrans = [ValidSubTrans]
-    curr_external_subtrans = _get_subtranslators_cls(builtins=False)
-    assert (
-        curr_external_subtrans == exp_curr_external_subtrans
-    ), f"Wrong subtranslator order, expected '{exp_curr_external_subtrans}' got '{curr_external_subtrans}'."
-    assert builtin_subtrans == _get_subtranslators_cls(with_external=False)
-    assert _get_subtranslators_cls() == exp_curr_external_subtrans + builtin_subtrans
-
-    # Add a second translator
-    assert add_subtranslator(ValidSubTrans2), "Failed to add 'ValidSubTrans2'"
-    exp_curr_external_subtrans = [ValidSubTrans2, ValidSubTrans]  # FILO order
-    curr_external_subtrans = _get_subtranslators_cls(builtins=False)
-    assert (
-        exp_curr_external_subtrans == curr_external_subtrans
-    ), f"Wrong subtranslator order, expected '{exp_curr_external_subtrans}' got '{curr_external_subtrans}'."
-    assert exp_curr_external_subtrans + builtin_subtrans == _get_subtranslators_cls()
-
-    # Now we try to add some translators that will be rejected.
-    assert not add_subtranslator(ValidSubTrans)  # Already known
-    assert not add_subtranslator(ValidSubTrans2)  # Already known
-    assert not add_subtranslator(ValidSubTrans())  # Is an instance
-    assert not add_subtranslator(InvalidSubTrans)  # Not implementing interface
-    assert exp_curr_external_subtrans + builtin_subtrans == _get_subtranslators_cls()
-
-    # Now we remove a translator from the list.
-    assert rm_subtranslator(ValidSubTrans), "Failed to remove 'ValidSubTrans'"
-    exp_curr_external_subtrans = [ValidSubTrans2]
-    curr_external_subtrans = _get_subtranslators_cls(builtins=False)
-    assert (
-        curr_external_subtrans == exp_curr_external_subtrans
-    ), f"Wrong subtranslator order, expected '{exp_curr_external_subtrans}' got '{curr_external_subtrans}'."
-    assert builtin_subtrans == _get_subtranslators_cls(with_external=False)
-    assert _get_subtranslators_cls() == exp_curr_external_subtrans + builtin_subtrans
-
-    # Now try to remove it again.
-    assert not rm_subtranslator(ValidSubTrans), "Was allowed to remove 'ValidSubTrans' again!"
-    with pytest.raises(
-        expected_exception=KeyError, match=f"Subtranslator '{type(ValidSubTrans)}' is not known."
-    ):
-        rm_subtranslator(ValidSubTrans, strict=True)
-    #
+    # These are all initial subtranslators
+    builtin_subtrans_cls = _get_subtranslators_cls()
+
+    # Definitions of some classes to help.
+    class SubTrans1(jtrans.PrimitiveTranslator):
+        @classmethod
+        def CREATE(cls) -> SubTrans1:
+            return SubTrans1()
+
+        @property
+        def primitive(self):
+            return "non_existing_primitive1"
+
+        def translate_jaxeqn(self) -> None:  # type: ignore[override]  # Arguments
+            return None
+
+    class SubTrans2(jtrans.PrimitiveTranslator):
+        @classmethod
+        def CREATE(cls) -> SubTrans2:
+            return SubTrans2()
+
+        @property
+        def primitive(self):
+            return "non_existing_primitive2"
+
+        def translate_jaxeqn(self) -> None:  # type: ignore[override]  # Arguments
+            return None
+
+    # Adding the first subtranslator to the list.
+    assert add_subtranslator(SubTrans1)
+
+    curr_subtrans_cls = _get_subtranslators_cls()
+    assert len(curr_subtrans_cls) == len(builtin_subtrans_cls) + 1
+    assert [SubTrans1, *builtin_subtrans_cls] == curr_subtrans_cls
+
+    # Now adding the second subtranslator
+    assert add_subtranslator(SubTrans2)
+
+    curr_subtrans_cls2 = _get_subtranslators_cls()
+    assert len(curr_subtrans_cls2) == len(builtin_subtrans_cls) + 2
+    assert [SubTrans2, SubTrans1, *builtin_subtrans_cls] == curr_subtrans_cls2
+    assert curr_subtrans_cls2 is not curr_subtrans_cls
 
 
 if __name__ == "__main__":

From 6ec08b51589ca57cb5f63d84282cd0624af4916f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 3 May 2024 09:18:30 +0200
Subject: [PATCH 087/458] Created a central place for all patterns that are
 needed.

---
 src/jace/translator/_translation_context.py   |  2 ++
 .../translator/jaxpr_translator_driver.py     | 19 +++++++++-------
 src/jace/util/__init__.py                     |  4 ++++
 src/jace/util/jax_helper.py                   |  7 ++----
 src/jace/util/re_pattern.py                   | 22 +++++++++++++++++++
 5 files changed, 41 insertions(+), 13 deletions(-)
 create mode 100644 src/jace/util/re_pattern.py

diff --git a/src/jace/translator/_translation_context.py b/src/jace/translator/_translation_context.py
index 4858f3c..075892f 100644
--- a/src/jace/translator/_translation_context.py
+++ b/src/jace/translator/_translation_context.py
@@ -75,6 +75,8 @@ def __init__(
             rev_idx:    The revision index of the context.
             name:       Name of the SDFG object.
         """
+        if isinstance(name, str) and not jutil._VALID_SDFG_OBJ_NAME.fullmatch(name):
+            raise ValueError(f"'{name}' is not a valid SDFG name.")
 
         self._sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
         self._start_state: dace.SDFGState = self._sdfg.add_state(
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 0dbb257..b1ca609 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -8,7 +8,6 @@
 from __future__ import annotations
 
 import itertools
-import re
 from collections.abc import Collection, Iterable, Mapping, Sequence
 from typing import Any, Final, cast, overload
 
@@ -196,6 +195,9 @@ def append_new_state(
             prev_state:     Alternative `SDFGState` at which we should append the new state.
 
         """
+        if isinstance(label, str) and (not jutil._VALID_SDFG_OBJ_NAME.fullmatch(label)):
+            raise ValueError(f"Can not create state with label '{label}' since it is invalid.")
+
         # Decide if appending to that state will modify the terminal state.
         modify_term_state: bool = False
         if (prev_state is self._ctx.terminal_state) or (prev_state is None):
@@ -380,8 +382,12 @@ def add_reserved_names(
             pass
         else:
             raise TypeError(f"Does not know how to handle the type '{type(reserved_names)}'.")
-        if not all(isinstance(x, str) and (len(x) != 0) for x in reserved_names):
-            raise TypeError("Reserved names must all be non empty strings.")
+        for rev_name in reserved_names:
+            assert isinstance(rev_name, str)
+            if not jutil._VALID_SDFG_VAR_NAME.fullmatch(rev_name):
+                raise ValueError(
+                    f"Can not use '{rev_name}' as reserved name as it is not a valid SDFG name."
+                )
         self._reserved_names.update(reserved_names)
         return self
 
@@ -497,7 +503,7 @@ def add_array(
                 raise ValueError("Passed an empty 'alt_name'.")
             if alt_name in self._forbidden_names:
                 raise ValueError("'alt_name' is a forbidden name.")
-            if not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", alt_name):
+            if not jutil._VALID_SDFG_VAR_NAME.fullmatch(alt_name):
                 raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
             if name_prefix is not None:
                 raise ValueError(
@@ -584,7 +590,7 @@ def add_array(
             raise ValueError(f"Can't create variable '{arg_name}', name is forbidden.")
         if arg_name in self._ctx.sdfg.arrays:
             raise ValueError(f"Can't create variable '{arg_name}', variable is already created.")
-        if not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", arg_name):
+        if not jutil._VALID_SDFG_VAR_NAME.fullmatch(arg_name):
             raise ValueError(f"The requested variable name '{arg_name}' is invalid.")
 
         # Promotion of scalar to array.
@@ -786,9 +792,6 @@ def _allocate_translation_ctx(
         """
         from ._translation_context import _TranslationContext
 
-        if name and (not re.fullmatch("[a-zA-Z_][a-zA-Z0-9_]*", name)):
-            raise ValueError(f"The provided name '{name}' for the SDFG is invalid.")
-
         # Create a new translation context and put it on the stack.
         self._ctx = _TranslationContext(
             rev_idx=next(self._rev_manager),
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index a161184..b9865b9 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -19,6 +19,7 @@
     is_tracing_ongoing,
     translate_dtype,
 )
+from .re_pattern import _VALID_JAX_VAR_NAME, _VALID_SDFG_OBJ_NAME, _VALID_SDFG_VAR_NAME
 from .traits import is_drop_var, is_jaceified, is_jaxified, is_non_string_iterable
 from .util import as_sequence
 
@@ -38,4 +39,7 @@
     "run_jax_sdfg",
     "_jace_run",
     "_propose_jax_name",
+    "_VALID_JAX_VAR_NAME",
+    "_VALID_SDFG_OBJ_NAME",
+    "_VALID_SDFG_VAR_NAME",
 ]
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index b02a7de..f85e812 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -15,7 +15,6 @@
 
 from __future__ import annotations
 
-import re
 from collections.abc import Mapping
 from dataclasses import dataclass
 from typing import Any
@@ -24,9 +23,7 @@
 import jax.core as jcore
 import numpy as np
 
-
-# Used by `get_jax_var_name()` to test if a name for a jax variable is valid.
-_VALID_JAX_NAME_PATTERN: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")
+from jace import util
 
 
 @dataclass(init=True, repr=True, frozen=True, slots=True)
@@ -86,7 +83,7 @@ def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
             )
     assert isinstance(jax_name, str)
 
-    if not _VALID_JAX_NAME_PATTERN.fullmatch(jax_name):
+    if not util._VALID_JAX_VAR_NAME.fullmatch(jax_name):
         raise ValueError(f"Deduced Jax name '{jax_name}' is invalid.")
     return jax_name
 
diff --git a/src/jace/util/re_pattern.py b/src/jace/util/re_pattern.py
new file mode 100644
index 0000000..99fb71a
--- /dev/null
+++ b/src/jace/util/re_pattern.py
@@ -0,0 +1,22 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Module containing all regex pattern that we need inside JaCe."""
+
+from __future__ import annotations
+
+import re
+
+
+# Valid name for a jax variable.
+_VALID_JAX_VAR_NAME: re.Pattern = re.compile("(jax[0-9]+_?)|([a-z]+_?)")
+
+# Valid name for an SDFG variable.
+_VALID_SDFG_VAR_NAME: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")
+
+# Valid name for an SDFG itself, includes `SDFGState` objects.
+_VALID_SDFG_OBJ_NAME: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")

From cfda8f3300ad35b2df581fa852d6d804de3ecddd Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 3 May 2024 10:32:54 +0200
Subject: [PATCH 088/458] Updated the driver test to make it work again.

---
 tests/test_jaxpr_translator_driver.py | 99 ++++++++++-----------------
 1 file changed, 36 insertions(+), 63 deletions(-)

diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index d826706..25b32bf 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -12,8 +12,12 @@
 import dace
 import pytest
 
-from jace import translator as jtrans
+import re
+
+from dace.data import Array, Data, Scalar
 
+from jace import translator as jtrans
+from jace.util import JaCeVar
 
 @pytest.fixture(scope="module")
 def alloc_driver():
@@ -28,6 +32,8 @@ def test_driver_alloc() -> None:
     """Tests the state right after allocation."""
     driver = jtrans.JaxprTranslationDriver()
     assert not driver.is_allocated(), "Driver was created allocated."
+    assert driver._ctx is None
+    assert len(driver._ctx_stack) == 0
 
     # The reserved names will be tested in `test_driver_fork()`.
     sdfg_name = "qwertzuiopasdfghjkl"
@@ -35,79 +41,51 @@ def test_driver_alloc() -> None:
 
     sdfg: dace.SDFG = driver.get_sdfg()
 
+    assert driver._ctx.sdfg is sdfg
     assert driver.get_sdfg().name == sdfg_name
     assert sdfg.number_of_nodes() == 1
     assert sdfg.number_of_edges() == 0
-    assert sdfg.start_block is driver._init_sdfg_state
-    assert driver.get_terminal_sdfg_state() is driver._init_sdfg_state
+    assert sdfg.start_block is driver._ctx.start_state
+    assert driver.get_terminal_sdfg_state() is driver._ctx.start_state
+
 
+def test_driver_nested() -> None:
+    """Tests the ability of the nesting of the driver.
 
-def test_driver_fork() -> None:
-    """Tests the fork ability of the driver."""
+    Note this test does the creation of subcontext manually, which is not recommended.
+    """
 
     # This is the parent driver.
     driver = jtrans.JaxprTranslationDriver()
     assert not driver.is_allocated(), "Driver should not be allocated."
 
-    with pytest.raises(expected_exception=RuntimeError, match="Only allocated driver can fork."):
-        _ = driver.fork()
-    #
-
     # We allocate the driver directly, because we need to set some internals.
     #  This is also the reason why we do not use the fixture.
     org_res_names = {"a", "b"}
     driver._allocate_translation_ctx("driver", reserved_names=org_res_names)
+    driver._ctx.inp_names = ("a", "b")
+    driver._ctx.out_names = ("c", "d")
     assert driver.is_allocated()
+    assert len(driver._ctx_stack) == 1
     assert driver._reserved_names == org_res_names
 
-    # Now we allocate a child
-    dolly = driver.fork()
-    dolly_rev = dolly.get_rev_idx()
-    assert not dolly.is_allocated()
-    assert not dolly.is_head_translator()
-    assert driver.is_head_translator()
-    assert dolly.same_family(driver)
-    assert driver.same_family(dolly)
-    assert driver._sub_translators is dolly._sub_translators
-    assert driver._rev_manager is dolly._rev_manager
-    assert dolly._reserved_names == driver._reserved_names
-    assert dolly._reserved_names is not driver._reserved_names
-
-    # Test if allocation of fork works properly
-    dolly_only_res_names = ["c"]  # reserved names that are only known to dolly; Added latter
-    dolly_full_res_names = org_res_names.union(dolly_only_res_names)
-    dolly._allocate_translation_ctx(
-        "dolly",
-    )
-
-    assert dolly.is_allocated()
-    assert dolly._reserved_names == org_res_names
-    assert driver._reserved_names == org_res_names
-
-    # Now adding reserved names to dolly after construction.
-    dolly.add_reserved_names(None)
-    assert dolly._reserved_names == org_res_names
-    dolly.add_reserved_names(dolly_only_res_names)
-    assert dolly._reserved_names == dolly_full_res_names
-    assert driver._reserved_names == org_res_names
-
-    # Now we deallocate dolly
-    dolly._clear_translation_ctx()
-    assert not dolly.is_allocated()
-    assert dolly._reserved_names is not None
-    assert dolly._reserved_names == dolly_full_res_names
+    # Now we increase the stack by one.
+    org_ctx = driver._ctx
+    driver._allocate_translation_ctx("driver2")
+    driver._ctx.inp_names = ("e", "f")
+    driver._ctx.out_names = ("g", "h")
+    assert driver.is_allocated()
+    assert len(driver._ctx_stack) == 2
+    assert driver._ctx is driver._ctx_stack[-1]
+    assert driver._ctx is not driver._ctx_stack[0]
+    assert org_ctx is driver._ctx_stack[0]
 
-    # Now we test if the revision index is again increased properly.
-    dolly2 = driver.fork()
-    assert dolly_rev < dolly2.get_rev_idx()
-    assert dolly2.same_family(dolly)
-    assert dolly2.same_family(driver)
+    for member_name in driver._ctx.__slots__:
+        org = getattr(org_ctx, member_name)
+        nest = getattr(driver._ctx, member_name)
+        assert org is not nest, f"Detected sharing for '{member_name}'"
 
-    # Deallocate the driver
-    driver._clear_translation_ctx()
-    assert not driver.is_allocated()
-    assert driver.is_head_translator()
-    assert driver._reserved_names is None
+    assert org_ctx.rev_idx < driver._ctx.rev_idx
 
 
 def test_driver_append_state(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
@@ -118,9 +96,9 @@ def test_driver_append_state(alloc_driver: jtrans.JaxprTranslationDriver) -> Non
     assert sdfg.number_of_nodes() == 2
     assert sdfg.number_of_edges() == 1
     assert terminal_state_1 is alloc_driver.get_terminal_sdfg_state()
-    assert alloc_driver.get_terminal_sdfg_state() is alloc_driver._term_sdfg_state
-    assert alloc_driver._init_sdfg_state is sdfg.start_block
-    assert alloc_driver._init_sdfg_state is not terminal_state_1
+    assert alloc_driver.get_terminal_sdfg_state() is alloc_driver._ctx.terminal_state
+    assert alloc_driver._ctx.start_state is sdfg.start_block
+    assert alloc_driver._ctx.start_state is not terminal_state_1
     assert next(iter(sdfg.edges())).src is sdfg.start_block
     assert next(iter(sdfg.edges())).dst is terminal_state_1
 
@@ -151,10 +129,6 @@ def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
 
     However, it does so without using Jax variables.
     """
-    from dace.data import Array, Data, Scalar
-
-    from jace.util import JaCeVar
-
     # Since we do not have Jax variables, we are using JaCe substitute for it.
 
     # Creating a scalar.
@@ -293,4 +267,3 @@ def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
 
 if __name__ == "__main__":
     test_driver_alloc()
-    test_driver_fork()

From 16a3bdfdf9db0f42a1f66d6c17d961213a5b3f4c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 3 May 2024 10:38:37 +0200
Subject: [PATCH 089/458] Updated the handling of JaCe variables.

Updated how the `__hash__` and `__eq__` works.
Before they only considered the name, which was not good.
There was also a short period, where all members were considered.
However, this commit changes them such that they only consider the `id()` value.
This is more in line with what Jax is doing.

Furthrmore if the name of a `JaCeVar` is empyt then the toolchain will consider them more like Jax variables.
---
 src/jace/util/jax_helper.py | 29 ++++++++++++++++++++++-------
 1 file changed, 22 insertions(+), 7 deletions(-)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index f85e812..3bd2b32 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -37,6 +37,9 @@ class JaCeVar:
     Notes:
         Main intention is to test functionality.
         While for a Jax `Var` object the name is rather irrelevant, `JaCeVar` use their name.
+        If the name of a `JaCeVar` is '_' it is considered a drop variable.
+        If the name of a `JaCeVar` is empty, the automatic naming will consider it as a Jax variable.
+        The definition of `__hash__` and `__eq__` is in accordance how Jax variable works.
     """
 
     name: str
@@ -44,12 +47,16 @@ class JaCeVar:
     dtype: dace.typeclass
 
     def __hash__(self) -> int:
-        return hash(self.name)
+        return id(self)
 
     def __eq__(self, other: Any) -> bool:
         if not isinstance(other, JaCeVar):
             return NotImplemented
-        return self.name == other.name
+        return id(self) == id(other)
+
+    def __post_init__(self) -> None:
+        if not isinstance(self.shape, tuple):
+            raise ValueError("The 'shape' member of a 'JaCeVar' must be a tuple.")
 
 
 def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
@@ -66,7 +73,9 @@ def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
         case jcore.DropVar():
             return "_"
         case JaCeVar():
-            jax_name = jax_var.name
+            # In case of an empty name consider the jace variable as a Jax variable.
+            #  This is mostly for testing.
+            jax_name = f"jax{id(jax_var)}" if jax_var.name == "" else jax_var.name
         case jcore.Var():
             # This stopped working after version 0.20.4, because of some changes in Jax
             #  See `https://github.com/google/jax/pull/10573` for more information.
@@ -191,13 +200,19 @@ def _propose_jax_name(
         raise RuntimeError(
             f"Can not propose a second name for '{jax_var}', it already known as '{jax_name_map[jax_var]}'."
         )
-    if isinstance(jax_var, JaCeVar):
-        return jax_var.name
-    assert isinstance(jax_var, jcore.Atom)
+    if isinstance(jax_var, jcore.Var):
+        pass
+    elif isinstance(jax_var, JaCeVar):
+        # If the name of the JaCe variable is empty, then use the name proposing
+        #  technique used for Jax variables; Mostly used for debugging.
+        if jax_var.name != "":
+            return jax_var.name
+    else:
+        raise TypeError(f"Can not propose a name for '{jax_var}'")
 
     c = len(jax_name_map)
     jax_name = ""
     while len(jax_name) == 0 or c != 0:
         c, i = c // 26, c % 26
         jax_name = chr(97 + i % 26) + jax_name
-    return jax_name + jax_var.suffix
+    return jax_name + getattr(jax_var, "suffix", "")

From 4fe04ae62a67fa0c636548127ab3b733a5347f46 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 3 May 2024 10:59:38 +0200
Subject: [PATCH 090/458] Made a reminder.

---
 src/jace/translator/jaxpr_translator_driver.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index b1ca609..c6fdb46 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -667,6 +667,9 @@ def create_jax_var_list(
             only_creation:      Always create a variable, it is an error if one already exist.
             handle_literals:    Allow the processing of literals.
             kwargs:             Will be forwarded to `self.add_array()` if a variable as to be created,
+
+        Todo:
+            Rollback if the creation fails.
         """
         if only_creation and prevent_creation:
             raise ValueError("Specified both 'only_creation' and 'prevent_creation'.")

From 37f9acc60cde3449516a999621c8152a9872e088 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 3 May 2024 11:02:01 +0200
Subject: [PATCH 091/458] Updated the test for teh driver again.

---
 tests/test_jaxpr_translator_driver.py | 83 +++++++++++++++++++++++++--
 1 file changed, 79 insertions(+), 4 deletions(-)

diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 25b32bf..46ea10b 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -9,16 +9,16 @@
 
 from __future__ import annotations
 
-import dace
-import pytest
-
 import re
 
+import dace
+import pytest
 from dace.data import Array, Data, Scalar
 
 from jace import translator as jtrans
 from jace.util import JaCeVar
 
+
 @pytest.fixture(scope="module")
 def alloc_driver():
     """Returns an allocated driver instance."""
@@ -33,7 +33,7 @@ def test_driver_alloc() -> None:
     driver = jtrans.JaxprTranslationDriver()
     assert not driver.is_allocated(), "Driver was created allocated."
     assert driver._ctx is None
-    assert len(driver._ctx_stack) == 0
+    assert len(driver._ctx_stack) == 0  # type: ignore[unreachable]
 
     # The reserved names will be tested in `test_driver_fork()`.
     sdfg_name = "qwertzuiopasdfghjkl"
@@ -87,6 +87,18 @@ def test_driver_nested() -> None:
 
     assert org_ctx.rev_idx < driver._ctx.rev_idx
 
+    # Now we go back one state, i.e. pretend that we are done with translating the nested jaxpr.
+    driver._clear_translation_ctx()
+    assert driver._ctx is org_ctx
+    assert len(driver._ctx_stack) == 1
+    assert driver._reserved_names == org_res_names
+
+    # Now if we fully deallocate then we expect that it is fully deallocated.
+    driver._clear_translation_ctx()
+    assert driver._ctx is None
+    assert len(driver._ctx_stack) == 0  # type: ignore[unreachable]
+    assert driver._reserved_names is None
+
 
 def test_driver_append_state(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
     """Tests the functionality of appending states."""
@@ -265,5 +277,68 @@ def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
             assert isinstance(stri, (str, dace.symbol))
 
 
+def test_driver_array2() -> None:
+    """This function tests the array creation routine with respect to the automatic naming.
+
+    Todo:
+        - Literals.
+    """
+    # This is the parent driver.
+    driver = jtrans.JaxprTranslationDriver()
+    assert not driver.is_allocated(), "Driver should not be allocated."
+
+    # Creating JaCe Variables with empty names, forces the driver to use the
+    #  Jax naming algorithm.
+    var_a = JaCeVar("", (10, 19), dace.int64)
+    var_b = JaCeVar("", (10, 909), dace.float16)
+
+    # These are the reserved names, so `a` should be named as is, but `b` should have another name.
+    org_res_names = {"b"}
+    driver._allocate_translation_ctx("driver", reserved_names=org_res_names)
+
+    # These are the expected names
+    exp_names = [
+        "a",
+        "_jax_variable__b__0",
+    ]
+    res_names = driver.create_jax_var_list(
+        [var_a, var_b],
+        only_creation=True,
+    )
+    assert res_names == exp_names, f"Expected names '{exp_names}' but got '{res_names}'."
+    assert len(driver._ctx.jax_name_map) == 2
+
+    # Try to create variable `c` and `a`, however, since variable `a` already exists it will fail.
+    #  However, currently the variable `c` will be created, this might change in the future.
+    var_c = JaCeVar("", (10, 19), dace.int64)
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=re.escape(f"'only_creation' given '{var_a}' already exists."),
+    ):
+        res_names = driver.create_jax_var_list(
+            [var_c, var_a],
+            only_creation=True,
+        )
+    assert len(driver._ctx.jax_name_map) == 3, f"{driver._ctx.jax_name_map}"
+    assert driver._ctx.jax_name_map[var_c] == "c"
+
+    # Now we test the only collection mode
+    res_names = driver.create_jax_var_list(
+        [var_c, var_a],
+        prevent_creation=True,
+    )
+    assert len(driver._ctx.jax_name_map) == 3, f"{driver._ctx.jax_name_map}"
+    assert res_names == ["c", "a"]
+
+    # Now also the mixed mode, i.e. between collecting and creating.
+    var_d = JaCeVar("", (10, 19), dace.int64)
+    exp_names = ["c", "d", "a"]
+    res_names = driver.create_jax_var_list(
+        [var_c, var_d, var_a],
+    )
+    assert len(driver._ctx.jax_name_map) == 4
+    assert exp_names == res_names
+
+
 if __name__ == "__main__":
     test_driver_alloc()

From 8effc52a6f00cc9351b0eab141ae7626ba2aa58d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 3 May 2024 11:33:39 +0200
Subject: [PATCH 092/458] Made the API tests pass again.

The hack is not nice but it works.
---
 src/jace/jax/api_helper.py | 16 ++++++++++++----
 tests/test_package.py      |  3 +++
 2 files changed, 15 insertions(+), 4 deletions(-)

diff --git a/src/jace/jax/api_helper.py b/src/jace/jax/api_helper.py
index 1932b5b..65f4266 100644
--- a/src/jace/jax/api_helper.py
+++ b/src/jace/jax/api_helper.py
@@ -98,10 +98,18 @@ def _get_translated_sdfg(
             It is forbidden to permanently modify the returned translated SDFG.
                 Doing so results in undefined behaviour.
         """
-        return self._get_translated_sdfg_cached(
-            *(_ArgInfo.from_value(v) for v in args),
-            **kwargs,
-        )
+        from jace.translator import JaxprTranslationDriver
+
+        # TODO(phimuell): This is only to make the API tests pass with the half implemented cache.
+        try:
+            return self._get_translated_sdfg_cached(
+                *(_ArgInfo.from_value(v) for v in args),
+                **kwargs,
+            )
+        except NotImplementedError:
+            jaxpr = jax.make_jaxpr(self.__wrapped__)(*args)
+            driver = JaxprTranslationDriver(**kwargs)
+            return driver.translate_jaxpr(jaxpr)
 
     @lru_cache
     def _get_translated_sdfg_cached(
diff --git a/tests/test_package.py b/tests/test_package.py
index bf92c00..5237aeb 100644
--- a/tests/test_package.py
+++ b/tests/test_package.py
@@ -9,8 +9,11 @@
 
 import importlib.metadata
 
+import pytest
+
 import jace as m
 
 
+@pytest.mark.skip(reason="This does not work yet.")
 def test_version():
     assert importlib.metadata.version("jace") == m.__version__

From 686db6a075c7bfe03349cf97c98151221bceaf8b Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 3 May 2024 12:59:48 +0200
Subject: [PATCH 093/458] For merging.


From 66da7a12160e49994f1d0ed76c96900632305103 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 3 May 2024 14:45:46 +0200
Subject: [PATCH 094/458] Made some fixes to the verification function of the
 `TranslatedJaxprSDFG`.

---
 src/jace/translator/translated_jaxpr_sdfg.py | 12 +++++++++---
 1 file changed, 9 insertions(+), 3 deletions(-)

diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index b2b7dc8..bc1ffab 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -46,12 +46,18 @@ class TranslatedJaxprSDFG:
     def validate(self) -> bool:
         """Validate the underlying SDFG."""
 
-        # To prevent the 'non initialized' data warnings we have to temporary promote the
-        #  input arguments as global.
+        # To prevent the 'non initialized' data warnings we have to temporary
+        #  promote input and output arguments to globals
+        promote_to_glob: set[str] = set()
         org_trans_state: dict[str, bool] = {}
-        for var in self.inp_names:
+        if self.inp_names:
+            promote_to_glob.update(self.inp_names)
+        if self.out_names:
+            promote_to_glob.update(self.out_names)
+        for var in promote_to_glob:
             org_trans_state[var] = self.sdfg.arrays[var].transient
             self.sdfg.arrays[var].transient = False
+
         try:
             self.sdfg.validate()
         finally:

From 15520e48d7e372aeee8d149e1fae6b0e9a5e5dc9 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 3 May 2024 14:40:42 +0200
Subject: [PATCH 095/458] Fixing some import names.

---
 src/jace/jax/api.py                           |   4 +-
 src/jace/jax/api_helper.py                    |  18 +--
 src/jace/translator/__init__.py               |   2 -
 src/jace/translator/_translation_context.py   |  14 +--
 .../translator/jaxpr_translator_driver.py     | 119 +++++++++---------
 .../translator/sub_translators/__init__.py    |  12 +-
 .../a_primitive_translator.py}                |  14 ++-
 .../sub_translators/alu_translator.py         |  15 ++-
 src/jace/translator/translated_jaxpr_sdfg.py  |   6 +-
 src/jace/util/debug.py                        |  12 +-
 src/jace/util/jax_helper.py                   |  50 ++++----
 src/jace/util/traits.py                       |  20 +--
 src/jace/util/util.py                         |   6 +-
 13 files changed, 152 insertions(+), 140 deletions(-)
 rename src/jace/translator/{primitive_translator.py => sub_translators/a_primitive_translator.py} (90%)

diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
index 4915d98..c7f1a2a 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/jax/api.py
@@ -12,7 +12,7 @@
 from collections.abc import Callable
 from typing import Any, cast
 
-from jace import jax as jjax, util as jutil
+from jace import jax as jjax, util
 
 
 def jit(
@@ -33,7 +33,7 @@ def wrapper(f: Callable) -> jjax.JitWrapped:
 
     # in case we are dealing with a JaCe object, we first unwrap it.
     #  Recursion to handle arbitrary deep nestings.
-    if jutil.is_jaceified(fun):
+    if util.is_jaceified(fun):
         fun = cast(jjax.JitWrapped, fun)
         return jit(fun.__wrapped__)
 
diff --git a/src/jace/jax/api_helper.py b/src/jace/jax/api_helper.py
index 65f4266..936f5ee 100644
--- a/src/jace/jax/api_helper.py
+++ b/src/jace/jax/api_helper.py
@@ -10,12 +10,16 @@
 from __future__ import annotations
 
 from functools import lru_cache
-from typing import Any
+from typing import TYPE_CHECKING, Any
 
 import dace
 import jax
 
-from jace import translator as jtrans, util as jutil
+from jace import util
+
+
+if TYPE_CHECKING:
+    from jace import translator
 
 
 class JitWrapped:
@@ -52,7 +56,7 @@ def __call__(
         This guarantees that `self` itself is traceable.
         """
 
-        if jutil.is_tracing_ongoing(*args, **kwargs):
+        if util.is_tracing_ongoing(*args, **kwargs):
             return self._forward_trace(*args, **kwargs)
         return self._call_sdfg(*args, **kwargs)
 
@@ -79,14 +83,14 @@ def _call_sdfg(
         Notes:
             Currently no caching of the compiled object is done.
         """
-        jsdfg: jtrans.TranslatedJaxprSDFG = self._get_translated_sdfg(*args, **kwargs)
-        return jutil.run_jax_sdfg(jsdfg, *args)
+        jsdfg: translator.TranslatedJaxprSDFG = self._get_translated_sdfg(*args, **kwargs)
+        return util.run_jax_sdfg(jsdfg, *args)
 
     def _get_translated_sdfg(
         self,
         *args: Any,
         **kwargs: Any,
-    ) -> jtrans.TranslatedJaxprSDFG:
+    ) -> translator.TranslatedJaxprSDFG:
         """This function returns the `TranslatedJaxprSDFG` object.
 
         The function will transform its arguments into `_ArgInfo` versions.
@@ -116,7 +120,7 @@ def _get_translated_sdfg_cached(
         self,
         *args: _ArgInfo,
         **kwargs: Any,
-    ) -> jtrans.TranslatedJaxprSDFG:
+    ) -> translator.TranslatedJaxprSDFG:
         """Generates the SDFG from
 
         Todo:
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 8ca5476..d6bb0c7 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -10,12 +10,10 @@
 from __future__ import annotations
 
 from .jaxpr_translator_driver import JaxprTranslationDriver
-from .primitive_translator import PrimitiveTranslator
 from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
 
 __all__ = [
-    "PrimitiveTranslator",
     "JaxprTranslationDriver",
     "TranslatedJaxprSDFG",
 ]
diff --git a/src/jace/translator/_translation_context.py b/src/jace/translator/_translation_context.py
index a0c1854..6d9c43f 100644
--- a/src/jace/translator/_translation_context.py
+++ b/src/jace/translator/_translation_context.py
@@ -12,9 +12,9 @@
 from collections.abc import MutableMapping, Sequence
 
 import dace
-from jax import core as jcore
+from jax import core as jax_core
 
-from jace import translator as jtrans, util as jutil
+from jace import translator, util
 
 
 class _TranslationContext:
@@ -70,7 +70,7 @@ def __init__(
             rev_idx:    The revision index of the context.
             name:       Name of the SDFG object.
         """
-        if isinstance(name, str) and not jutil._VALID_SDFG_OBJ_NAME.fullmatch(name):
+        if isinstance(name, str) and not util._VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
         self._sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
@@ -78,14 +78,14 @@ def __init__(
             label="initial_state", is_start_block=True
         )
         self._terminal_state: dace.SDFGState = self._start_state
-        self._jax_name_map: MutableMapping[jcore.Var | jutil.JaCeVar, str] = {}
+        self._jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str] = {}
         self._inp_names: tuple[str, ...] = ()
         self._out_names: tuple[str, ...] = ()
         self._rev_idx: int = rev_idx
 
-    def to_translated_jaxpr_sdfg(self) -> jtrans.TranslatedJaxprSDFG:
+    def to_translated_jaxpr_sdfg(self) -> translator.TranslatedJaxprSDFG:
         """Transforms `self` into a `TranslatedJaxprSDFG`."""
-        return jtrans.TranslatedJaxprSDFG(
+        return translator.TranslatedJaxprSDFG(
             sdfg=self._sdfg,
             start_state=self._start_state,
             terminal_state=self._terminal_state,
@@ -114,7 +114,7 @@ def terminal_state(
         self._terminal_state = new_term_state
 
     @property
-    def jax_name_map(self) -> MutableMapping[jcore.Var | jutil.JaCeVar, str]:
+    def jax_name_map(self) -> MutableMapping[jax_core.Var | util.JaCeVar, str]:
         return self._jax_name_map
 
     @property
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index c6fdb46..5b01fd2 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -14,9 +14,10 @@
 import dace
 import jax
 from dace import data as ddata, properties as dprop
-from jax import core as jcore
+from jax import core as jax_core
 
-from jace import translator as jtrans, util as jutil
+from jace import translator, util
+from jace.translator import sub_translators
 
 
 class JaxprTranslationDriver:
@@ -81,7 +82,7 @@ def __init__(
         #  They are partitioned by the names of the primitive they have registered for.
         #  This member is allocated by '_init_sub_translators()' and remains allocated
         #  during the lifetime of the object.
-        self._sub_translators: dict[str, jtrans.PrimitiveTranslator] = None  # type: ignore[assignment]
+        self._sub_translators: dict[str, translator.PrimitiveTranslator] = None  # type: ignore[assignment]
 
         # These names can not be used for the automatic naming of Jax variables.
         #  They differ from the forbidden names, that they denote valid SDFG names.
@@ -104,14 +105,14 @@ def __init__(
 
     def translate_jaxpr(
         self,
-        jaxpr: jcore.ClosedJaxpr,
+        jaxpr: jax_core.ClosedJaxpr,
         *,
         inp_scalar_as_array: bool = False,
         name: str | None = None,
         reserved_names: str | Collection[str] | None = None,
         allow_empty_jaxpr: bool = False,
         **kwargs: Any,
-    ) -> jtrans.TranslatedJaxprSDFG:
+    ) -> translator.TranslatedJaxprSDFG:
         """Perform the translation of a Jaxpr into a SDFG.
 
         In case this function is called and `self` has an ongoing translation process, a new translation context will be created.
@@ -134,7 +135,7 @@ def translate_jaxpr(
         """
         if (len(jaxpr.eqns) == 0) and (not allow_empty_jaxpr):
             raise ValueError("Passed an empty Jaxpr, but did not allow for empty Jaxpr.")
-        if not isinstance(jaxpr, jcore.ClosedJaxpr):
+        if not isinstance(jaxpr, jax_core.ClosedJaxpr):
             raise TypeError(f"Expected a 'jax.core.ClosedJaxp' instance but got '{type(jaxpr)}'")
         if len(jaxpr.effects) != 0:
             raise NotImplementedError("'Jaxpr' with side effects are not supported.")
@@ -162,7 +163,7 @@ def translate_jaxpr(
             jaxpr=jaxpr,
             inp_scalar_as_array=inp_scalar_as_array,
         )
-        jsdfg: jtrans.TranslatedJaxprSDFG = self._translate_jaxpr_internal(jaxpr)
+        jsdfg: translator.TranslatedJaxprSDFG = self._translate_jaxpr_internal(jaxpr)
 
         # If the translation context is not cleared `self` and `jsdfg` will share the same data.
         #  There is some legitimate use for that.
@@ -195,7 +196,7 @@ def append_new_state(
             prev_state:     Alternative `SDFGState` at which we should append the new state.
 
         """
-        if isinstance(label, str) and (not jutil._VALID_SDFG_OBJ_NAME.fullmatch(label)):
+        if isinstance(label, str) and (not util._VALID_SDFG_OBJ_NAME.fullmatch(label)):
             raise ValueError(f"Can not create state with label '{label}' since it is invalid.")
 
         # Decide if appending to that state will modify the terminal state.
@@ -228,7 +229,7 @@ def get_arrays(self) -> Mapping[str, ddata.Data]:
 
     def get_array(
         self,
-        name: str | jcore.Atom | jutil.JaCeVar,
+        name: str | jax_core.Atom | util.JaCeVar,
     ) -> ddata.Data:
         """Returns the SDFG `Data` object `name` referees to.
 
@@ -237,7 +238,7 @@ def get_array(
         """
         if isinstance(name, str):
             sdfg_name: str = name
-        elif isinstance(name, (jcore.Var, jutil.JaCeVar)):
+        elif isinstance(name, (jax_core.Var, util.JaCeVar)):
             sdfg_name = self.map_jax_var_to_sdfg(name)
         else:
             raise TypeError(f"Does not know how to handle '{type(name).__name__}'.")
@@ -248,19 +249,19 @@ def get_array(
     @overload
     def map_jax_var_to_sdfg(
         self,
-        jax_var: str | jcore.Atom | jutil.JaCeVar,
+        jax_var: str | jax_core.Atom | util.JaCeVar,
     ) -> str: ...
 
     @overload
     def map_jax_var_to_sdfg(
         self,
-        jax_var: str | jcore.Atom | jutil.JaCeVar,
+        jax_var: str | jax_core.Atom | util.JaCeVar,
         allow_fail: bool,
     ) -> str | None: ...
 
     def map_jax_var_to_sdfg(
         self,
-        jax_var: str | jcore.Atom | jutil.JaCeVar,
+        jax_var: str | jax_core.Atom | util.JaCeVar,
         allow_fail: bool = False,
     ) -> str | None:
         """Get the _name_ of the SDFG variable to which `jax_var` is referring to.
@@ -273,7 +274,7 @@ def map_jax_var_to_sdfg(
         """
         if isinstance(jax_var, str):
             sdfg_name: str = jax_var
-        elif isinstance(jax_var, jcore.Literal):
+        elif isinstance(jax_var, jax_core.Literal):
             raise RuntimeError("There is no SDFG variable for literal '{jax_var}'.")
         elif jax_var in self._ctx.jax_name_map:
             sdfg_name = self._ctx.jax_name_map[jax_var]
@@ -336,7 +337,7 @@ def get_rev_idx(self) -> int:
 
     def add_jax_name_mapping(
         self,
-        jax_var: jcore.Var | jutil.JaCeVar,
+        jax_var: jax_core.Var | util.JaCeVar,
         sdfg_name: str,
     ) -> JaxprTranslationDriver:
         """Creates a mapping between `jax_var` to `sdfg_name`.
@@ -384,7 +385,7 @@ def add_reserved_names(
             raise TypeError(f"Does not know how to handle the type '{type(reserved_names)}'.")
         for rev_name in reserved_names:
             assert isinstance(rev_name, str)
-            if not jutil._VALID_SDFG_VAR_NAME.fullmatch(rev_name):
+            if not util._VALID_SDFG_VAR_NAME.fullmatch(rev_name):
                 raise ValueError(
                     f"Can not use '{rev_name}' as reserved name as it is not a valid SDFG name."
                 )
@@ -393,7 +394,7 @@ def add_reserved_names(
 
     def add_array(
         self,
-        arg: jcore.Atom | jutil.JaCeVar,
+        arg: jax_core.Atom | util.JaCeVar,
         *,
         as_transient: bool = True,
         alt_name: str | None = None,
@@ -471,8 +472,8 @@ def add_array(
         """
         assert self.is_allocated()
 
-        shape: Sequence[int] = jutil.get_jax_var_shape(arg)
-        dtype = jutil.get_jax_var_dtype(arg)
+        shape: Sequence[int] = util.get_jax_var_shape(arg)
+        dtype = util.get_jax_var_dtype(arg)
         offset = None  # i.e. no offset
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
         is_scalar: bool = shape == ()
@@ -493,7 +494,7 @@ def add_array(
                 raise ValueError(
                     f"Specified 'force_jax_name', but passed '{name_prefix}' as 'name_prefix'."
                 )
-            alt_name = jutil._propose_jax_name(arg, self._ctx.jax_name_map)
+            alt_name = util._propose_jax_name(arg, self._ctx.jax_name_map)
         if alt_name is not None:
             assert isinstance(
                 alt_name, str
@@ -503,7 +504,7 @@ def add_array(
                 raise ValueError("Passed an empty 'alt_name'.")
             if alt_name in self._forbidden_names:
                 raise ValueError("'alt_name' is a forbidden name.")
-            if not jutil._VALID_SDFG_VAR_NAME.fullmatch(alt_name):
+            if not util._VALID_SDFG_VAR_NAME.fullmatch(alt_name):
                 raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
             if name_prefix is not None:
                 raise ValueError(
@@ -536,8 +537,8 @@ def add_array(
         #  Depending on the situation, we will further manipulate it.
         if alt_name is not None:
             prop_name = alt_name  # Just for completion: will be ignored later
-        elif isinstance(arg, (jcore.Var, jutil.JaCeVar)):
-            prop_name = jutil._propose_jax_name(arg, self._ctx.jax_name_map)
+        elif isinstance(arg, (jax_core.Var, util.JaCeVar)):
+            prop_name = util._propose_jax_name(arg, self._ctx.jax_name_map)
             if prop_name.startswith("__"):
                 raise ValueError(
                     f"You tried to create the variable '{prop_name}' which"
@@ -545,7 +546,7 @@ def add_array(
                 )
             if name_prefix is not None:
                 prop_name = name_prefix + prop_name
-        elif isinstance(arg, jcore.Literal):  # type: ignore[unreachable]
+        elif isinstance(arg, jax_core.Literal):  # type: ignore[unreachable]
             if not allow_literals:
                 raise NotImplementedError("Jax Literals are not supported.")
             if alt_name is None:
@@ -590,7 +591,7 @@ def add_array(
             raise ValueError(f"Can't create variable '{arg_name}', name is forbidden.")
         if arg_name in self._ctx.sdfg.arrays:
             raise ValueError(f"Can't create variable '{arg_name}', variable is already created.")
-        if not jutil._VALID_SDFG_VAR_NAME.fullmatch(arg_name):
+        if not util._VALID_SDFG_VAR_NAME.fullmatch(arg_name):
             raise ValueError(f"The requested variable name '{arg_name}' is invalid.")
 
         # Promotion of scalar to array.
@@ -642,7 +643,7 @@ def add_array(
 
     def create_jax_var_list(
         self,
-        jax_var_list: Sequence[jcore.Atom | jutil.JaCeVar],
+        jax_var_list: Sequence[jax_core.Atom | util.JaCeVar],
         prevent_creation: bool = False,
         only_creation: bool = False,
         handle_literals: bool = False,
@@ -677,11 +678,11 @@ def create_jax_var_list(
 
         ret_list: list[None | str] = []
         for jax_var in jax_var_list:
-            if isinstance(jax_var, jcore.Literal):
+            if isinstance(jax_var, jax_core.Literal):
                 if not handle_literals:
                     raise ValueError("Encountered a literal but `handle_literals` was `False`.")
                 sdfg_name = None
-            elif isinstance(jax_var, (jcore.Var, jutil.JaCeVar)):
+            elif isinstance(jax_var, (jax_core.Var, util.JaCeVar)):
                 mapped_sdfg_name: str | None = self.map_jax_var_to_sdfg(jax_var, allow_fail=True)
                 if (mapped_sdfg_name is None) and prevent_creation:
                     raise ValueError(f"'prevent_creation' given but have to create '{jax_var}'.")
@@ -702,7 +703,7 @@ def create_jax_var_list(
 
     def _create_initial_input(
         self,
-        jaxpr: jcore.ClosedJaxpr,
+        jaxpr: jax_core.ClosedJaxpr,
         inp_scalar_as_array: bool,
     ) -> Sequence[str]:
         """This function will create the internal input variables that are used for the SDFG.
@@ -744,7 +745,7 @@ def _create_initial_input(
 
     def _create_constants(
         self,
-        jaxpr: jcore.ClosedJaxpr,
+        jaxpr: jax_core.ClosedJaxpr,
     ) -> Sequence[str]:
         """Creates all constants requested by the `jaxpr`.
 
@@ -825,21 +826,21 @@ def _init_sub_translators(
         The function forwards `kwargs` to the constructor of the subtranslators.
         However, it will remove all arguments starting with an underscore.
         """
-        from jace.translator.sub_translators import _get_subtranslators_cls  # Avoid import cycle
-
         assert self._sub_translators is None
 
         subtrans_args = {k: v for k, v in subtrans_args.items() if not k.startswith("_")}  # type: ignore[unreachable]
-        sub_translators: dict[str, jtrans.PrimitiveTranslator] = {}
-        for sub_translator_cls in _get_subtranslators_cls():
-            sub_translator: jtrans.PrimitiveTranslator = sub_translator_cls.CREATE(**subtrans_args)
-            handled_primitives: Iterable[str] = jutil.as_sequence(sub_translator.primitive)
+        prim_translators: dict[str, translator.PrimitiveTranslator] = {}
+        for prim_translator_cls in sub_translators._get_subtranslators_cls():
+            prim_translator: translator.PrimitiveTranslator = prim_translator_cls.CREATE(
+                **subtrans_args
+            )
+            handled_primitives: Iterable[str] = util.as_sequence(prim_translator.primitive)
 
             for handled_primitive in handled_primitives:
-                if handled_primitive in sub_translators:
-                    raise RuntimeError(f"Multiple sub_translators for '{handled_primitive}' found.")
-                sub_translators[handled_primitive] = sub_translator
-        self._sub_translators = sub_translators
+                if handled_primitive in prim_translators:
+                    raise RuntimeError(f"Multiple sub translators for '{handled_primitive}' found.")
+                prim_translators[handled_primitive] = prim_translator
+        self._sub_translators = prim_translators
 
         return self
 
@@ -872,8 +873,8 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
 
     def _find_sub_translator_for(
         self,
-        eqn: jcore.JaxprEqn,
-    ) -> jtrans.PrimitiveTranslator:
+        eqn: jax_core.JaxprEqn,
+    ) -> translator.PrimitiveTranslator:
         """Returns the appropriate subtranslator for equation `eqn`."""
         assert self._sub_translators is not None
 
@@ -885,8 +886,8 @@ def _find_sub_translator_for(
 
     def _translate_single_eqn(
         self,
-        jaxpr: jcore.ClosedJaxpr,
-        eqn: jcore.JaxprEqn,
+        jaxpr: jax_core.ClosedJaxpr,
+        eqn: jax_core.JaxprEqn,
     ) -> tuple[Sequence[str | None], Sequence[str]]:
         """Translate `eqn` into its SDFG equivalent.
 
@@ -904,8 +905,8 @@ def _translate_single_eqn(
             While `jaxpr` must be a `ClosedJaxpr`, `eqn` must come from the unclosed instance.
             The function will perform some consistency checking after the subtranslator was called.
         """
-        assert isinstance(eqn, jcore.JaxprEqn)
-        assert isinstance(jaxpr, jcore.ClosedJaxpr)
+        assert isinstance(eqn, jax_core.JaxprEqn)
+        assert isinstance(jaxpr, jax_core.ClosedJaxpr)
 
         if len(eqn.effects) != 0:
             raise NotImplementedError(f"Equation '{eqn}' has side effects.")
@@ -925,7 +926,7 @@ def _translate_single_eqn(
         )
 
         # Find the subtranslator
-        subtranslator: jtrans.PrimitiveTranslator = self._find_sub_translator_for(eqn)
+        subtranslator: translator.PrimitiveTranslator = self._find_sub_translator_for(eqn)
 
         # Create the state into which the equation should be translated
         last_term_state: dace.SDFGState = self.get_terminal_sdfg_state()  # noqa: F841 # Will be used later
@@ -963,7 +964,7 @@ def _translate_single_eqn(
             )
         for expectedSDFGName, jax_var in zip(out_var_names, eqn.outvars, strict=True):
             mapped_sdfg_name = self.map_jax_var_to_sdfg(jax_var)
-            jax_name = jutil.get_jax_var_name(jax_var)
+            jax_name = util.get_jax_var_name(jax_var)
             if mapped_sdfg_name != expectedSDFGName:
                 raise ValueError(
                     f"Mapping inconsistency detected, expected that Jax variable"
@@ -980,13 +981,13 @@ def _translate_single_eqn(
                 pass
             elif isinstance(sdfg_var, dace.data.View):
                 raise TypeError(
-                    f"For Jax variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}'),"
+                    f"For Jax variable '{util.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}'),"
                     f" which is an output, you used a View, which is not possible."
                     " It must either be an array or a scalar."
                 )
             else:
                 raise NotImplementedError(
-                    f"Output variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}')"
+                    f"Output variable '{util.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}')"
                     f" is of type '{type(sdfg_var).__name__}' which I does not know how to handle."
                 )
 
@@ -997,8 +998,8 @@ def _translate_single_eqn(
 
     def _translate_jaxpr_internal(
         self,
-        jaxpr: jcore.ClosedJaxpr,
-    ) -> jtrans.TranslatedJaxprSDFG:
+        jaxpr: jax_core.ClosedJaxpr,
+    ) -> translator.TranslatedJaxprSDFG:
         """Performs the actual translation of the Jaxpr into an SDFG.
 
         The function assumes that the context is allocated as well as initial variables.
@@ -1014,7 +1015,7 @@ def _translate_jaxpr_internal(
                 this is used by Jax to indicate that they are never read.
                 Such variables are included by some transformations such as `grad()`.
         """
-        assert isinstance(jaxpr, jcore.ClosedJaxpr)
+        assert isinstance(jaxpr, jax_core.ClosedJaxpr)
         assert self.is_allocated()
 
         nb_translated_eqn: int = 0
@@ -1023,9 +1024,9 @@ def _translate_jaxpr_internal(
             assert len(eqn.effects) == 0
             if len(eqn.outvars) == 0:  # Do we need this special case.
                 continue  #  Looks more like internal Jax error.
-            if any(jutil.is_drop_var(outVar) for outVar in eqn.outvars):
+            if any(util.is_drop_var(outVar) for outVar in eqn.outvars):
                 assert (len(eqn.outvars) == 1) or all(
-                    jutil.is_drop_var(outVar) for outVar in eqn.outvars
+                    util.is_drop_var(outVar) for outVar in eqn.outvars
                 )
                 continue
             _, out_var_names = self._translate_single_eqn(jaxpr=jaxpr, eqn=eqn)
@@ -1038,7 +1039,7 @@ def _translate_jaxpr_internal(
 
         return self._export_context()
 
-    def _export_context(self) -> jtrans.TranslatedJaxprSDFG:
+    def _export_context(self) -> translator.TranslatedJaxprSDFG:
         """Encapsulate the translation context of `self` into a `TranslatedJaxprSDFG` object..
 
         This function will not deallocate the internal context of `self`.
@@ -1049,7 +1050,7 @@ def _export_context(self) -> jtrans.TranslatedJaxprSDFG:
         assert all((isinstance(x, str) and (len(x) > 0)) for x in self._ctx.inp_names)
         assert all((isinstance(x, str) and (len(x) > 0)) for x in self._ctx.out_names)
 
-        return jtrans.TranslatedJaxprSDFG(
+        return translator.TranslatedJaxprSDFG(
             sdfg=self._ctx.sdfg,
             start_state=self._ctx.start_state,
             terminal_state=self._ctx.terminal_state,
@@ -1060,7 +1061,7 @@ def _export_context(self) -> jtrans.TranslatedJaxprSDFG:
 
     def _handle_null_jaxpr(
         self,
-        jaxpr: jcore.ClosedJaxpr,
+        jaxpr: jax_core.ClosedJaxpr,
     ) -> Sequence[str]:
         """This function is called in case a `Jaxpr` with zero equations is encountered.
 
@@ -1092,7 +1093,7 @@ def _handle_null_jaxpr(
         #  Thus we have to introduce a some fake output name and explicitly copy the data around.
         #  Once DaCe will inline the nested SDFG it will remove this intermediate copy.
         for jax_out_var in jaxpr.jaxpr.outvars:
-            jax_inp_name = jutil.get_jax_var_name(
+            jax_inp_name = util.get_jax_var_name(
                 jax_out_var
             )  # Since output == input their names must be the same.
             assert self.map_jax_var_to_sdfg(jax_inp_name, allow_fail=True)
diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
index 7019076..88c239c 100644
--- a/src/jace/translator/sub_translators/__init__.py
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -4,25 +4,24 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
-
 """Module collecting all built-in subtranslators."""
 
 from __future__ import annotations
 
 from collections.abc import Sequence
 
-from jace import translator as jtrans
-from jace.translator.sub_translators.alu_translator import ALUTranslator
+from .a_primitive_translator import PrimitiveTranslator  # has to be the first import.
+from .alu_translator import ALUTranslator
 
 
 # List of all subtranslators that ships with JaCe.
-_KNOWN_SUBTRANSLATORS: list[type[jtrans.PrimitiveTranslator]] = [
+_KNOWN_SUBTRANSLATORS: list[type[PrimitiveTranslator]] = [
     ALUTranslator,
 ]
 
 
 def add_subtranslator(
-    subtrans: type[jtrans.PrimitiveTranslator],
+    subtrans: type[PrimitiveTranslator],
 ) -> bool:
     """Add `subtrans` to the externally defined subtranslators.
 
@@ -37,7 +36,7 @@ def add_subtranslator(
     return True
 
 
-def _get_subtranslators_cls() -> Sequence[type[jtrans.PrimitiveTranslator]]:
+def _get_subtranslators_cls() -> Sequence[type[PrimitiveTranslator]]:
     """Returns the list of all subtranslator known to JaCe.
 
     The translators are returned in FIFO order.
@@ -48,4 +47,5 @@ def _get_subtranslators_cls() -> Sequence[type[jtrans.PrimitiveTranslator]]:
 __all__ = [
     "ALUTranslator",
     "add_subtranslator",
+    "PrimitiveTranslator",
 ]
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/sub_translators/a_primitive_translator.py
similarity index 90%
rename from src/jace/translator/primitive_translator.py
rename to src/jace/translator/sub_translators/a_primitive_translator.py
index 816b709..16d2d4b 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/sub_translators/a_primitive_translator.py
@@ -4,6 +4,14 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
+"""Contains the interface for all primitive subtranslators.
+
+Note the name of this file is because it has to be the first that is imported in the `__init__.py` file.
+If not, we would get a cyclic import error.
+However, all attempts to prevent ruff from mindlessly (rule abiding) destroying this orders failed.
+Thus the name was changed to enforce this.
+If you have the solution, feel free to implement it.
+"""
 
 from __future__ import annotations
 
@@ -12,7 +20,7 @@
 from typing import TYPE_CHECKING, Any, Protocol, runtime_checkable
 
 import dace
-from jax import core as jcore
+from jax import core as jax_core
 
 
 if TYPE_CHECKING:
@@ -21,7 +29,7 @@
 
 @runtime_checkable
 class PrimitiveTranslator(Protocol):
-    """Interface for all Jax primitive subtranslators.
+    """Interface for all Jax primitive translators, also known as subtranslator.
 
     A translator for a primitive translates a single equation of a Jaxpr into its SDFG equivalent.
     A type that implements this interface must fulfil the following properties:
@@ -66,7 +74,7 @@ def translate_jaxeqn(
         driver: JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
         out_var_names: Sequence[str],
-        eqn: jcore.JaxprEqn,
+        eqn: jax_core.JaxprEqn,
         eqn_state: dace.SDFGState,
     ) -> dace.SDFGState | None:
         """Translates the Jax primitive into its SDFG equivalent.
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index b08e474..f397bb3 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -14,14 +14,13 @@
 
 import dace
 import numpy as np
-from jax import core as jcore
+from jax import core as jax_core
 from typing_extensions import override
 
-from jace import translator as jtranslator
+from jace.translator import sub_translators
 
 
-class ALUTranslator(jtranslator.PrimitiveTranslator):
-    # class ALUTranslator(PrimitiveTranslator):
+class ALUTranslator(sub_translators.PrimitiveTranslator):
     """This translator handles all arithmetic and logical operations."""
 
     __slots__ = ()
@@ -92,10 +91,10 @@ def primitive(self) -> Sequence[str]:
     @override
     def translate_jaxeqn(
         self,
-        driver: jtranslator.JaxprTranslationDriver,
+        driver: sub_translators.JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
         out_var_names: Sequence[str],
-        eqn: jcore.JaxprEqn,
+        eqn: jax_core.JaxprEqn,
         eqn_state: dace.SDFGState,
     ) -> None:
         """Perform the translation.
@@ -244,7 +243,7 @@ def translate_jaxeqn(
     def _writeTaskletCode(
         self,
         in_var_names: Sequence[str | None],
-        eqn: jcore.JaxprEqn,
+        eqn: jax_core.JaxprEqn,
     ) -> str:
         """This function generates the Tasklet code based on a primitive.
 
@@ -284,7 +283,7 @@ def _writeTaskletCode(
             if in_var_name is not None:
                 continue
 
-            jax_in_var: jcore.Literal = cast(jcore.Literal, eqn.invars[i])
+            jax_in_var: jax_core.Literal = cast(jax_core.Literal, eqn.invars[i])
             if jax_in_var.aval.shape == ():
                 t_val = jax_in_var.val
                 if isinstance(t_val, np.ndarray):
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index bc1ffab..3a3bb6b 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -12,9 +12,9 @@
 from typing import Any
 
 import dace
-from jax import core as jcore
+from jax import core as jax_core
 
-from jace import util as jutil
+from jace import util
 
 
 @dataclass(init=True, repr=True, eq=False, frozen=False, kw_only=True, slots=True)
@@ -37,7 +37,7 @@ class TranslatedJaxprSDFG:
     """
 
     sdfg: dace.SDFG
-    jax_name_map: Mapping[jcore.Var | jutil.JaCeVar, str]
+    jax_name_map: Mapping[jax_core.Var | util.JaCeVar, str]
     start_state: dace.SDFGState | None = None
     terminal_state: dace.SDFGState | None = None
     inp_names: Sequence[str] | None = None
diff --git a/src/jace/util/debug.py b/src/jace/util/debug.py
index b3a84f3..27c57aa 100644
--- a/src/jace/util/debug.py
+++ b/src/jace/util/debug.py
@@ -13,18 +13,16 @@
 from __future__ import annotations
 
 from collections.abc import Callable
-from typing import TYPE_CHECKING, Any
+from typing import Any
 
 import dace
 import jax
 
-
-if TYPE_CHECKING:
-    from jace import translator as jtrans
+from jace import translator
 
 
 def run_jax_sdfg(
-    jsdfg: jtrans.TranslatedJaxprSDFG,
+    jsdfg: translator.TranslatedJaxprSDFG,
     *args: Any,
 ) -> tuple[Any, ...] | Any:
     """Calls the SDFG that is encapsulated with the supplied arguments.
@@ -97,9 +95,7 @@ def _jace_run(
         *args:      Forwarded to the tracing and final execution of the SDFG.
         **kwargs:   Used to construct the driver.
     """
-    from jace.translator import JaxprTranslationDriver
-
     jaxpr = jax.make_jaxpr(fun)(*args)
-    driver = JaxprTranslationDriver(**kwargs)
+    driver = translator.JaxprTranslationDriver(**kwargs)
     jsdfg = driver.translate_jaxpr(jaxpr)
     return run_jax_sdfg(jsdfg, *args)
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 3bd2b32..f6f5347 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -15,12 +15,13 @@
 
 from __future__ import annotations
 
+import itertools
 from collections.abc import Mapping
 from dataclasses import dataclass
-from typing import Any
+from typing import Any, overload
 
 import dace
-import jax.core as jcore
+import jax.core as jax_core
 import numpy as np
 
 from jace import util
@@ -36,14 +37,13 @@ class JaCeVar:
 
     Notes:
         Main intention is to test functionality.
-        While for a Jax `Var` object the name is rather irrelevant, `JaCeVar` use their name.
         If the name of a `JaCeVar` is '_' it is considered a drop variable.
         If the name of a `JaCeVar` is empty, the automatic naming will consider it as a Jax variable.
         The definition of `__hash__` and `__eq__` is in accordance how Jax variable works.
     """
 
     name: str
-    shape: tuple[int | dace.symbol | str, ...] | int | dace.symbol | str | tuple[()]
+    shape: tuple[int | dace.symbol | str, ...] | tuple[()]
     dtype: dace.typeclass
 
     def __hash__(self) -> int:
@@ -59,7 +59,7 @@ def __post_init__(self) -> None:
             raise ValueError("The 'shape' member of a 'JaCeVar' must be a tuple.")
 
 
-def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
+def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar | str) -> str:
     """Returns the name of the Jax variable as a string.
 
     Args:
@@ -70,19 +70,19 @@ def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
         This function is subject for removal.
     """
     match jax_var:
-        case jcore.DropVar():
+        case jax_core.DropVar():
             return "_"
         case JaCeVar():
             # In case of an empty name consider the jace variable as a Jax variable.
             #  This is mostly for testing.
             jax_name = f"jax{id(jax_var)}" if jax_var.name == "" else jax_var.name
-        case jcore.Var():
+        case jax_core.Var():
             # This stopped working after version 0.20.4, because of some changes in Jax
             #  See `https://github.com/google/jax/pull/10573` for more information.
             #  The following implementation will generate stable names, however, they will be decoupled
             #  from output of the pretty printed Jaxpr
             jax_name = f"jax{jax_var.count}{jax_var.suffix}"
-        case jcore.Literal():
+        case jax_core.Literal():
             raise TypeError("Can not derive a name from a Jax Literal.")
         case str():
             jax_name = jax_var
@@ -97,14 +97,24 @@ def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
     return jax_name
 
 
-def get_jax_var_shape(jax_var: jcore.Atom | JaCeVar) -> tuple[int, ...]:
+@overload
+def get_jax_var_shape(jax_var: JaCeVar) -> tuple[int | dace.symbol | str, ...] | tuple[()]: ...
+
+
+@overload
+def get_jax_var_shape(jax_var: jax_core.Atom) -> tuple[int, ...] | tuple[()]: ...
+
+
+def get_jax_var_shape(
+    jax_var: jax_core.Atom | JaCeVar,
+) -> tuple[int | dace.symbol | str, ...] | tuple[()]:
     """Returns the shape of a Jax variable.
 
     Args:
         jax_var:     The variable to process
     """
     match jax_var:
-        case jcore.Var() | jcore.Literal():
+        case jax_core.Var() | jax_core.Literal():
             return jax_var.aval.shape
         case JaCeVar():
             return jax_var.shape
@@ -112,10 +122,10 @@ def get_jax_var_shape(jax_var: jcore.Atom | JaCeVar) -> tuple[int, ...]:
             raise TypeError(f"'get_jax_var_shape()` is not implemented for '{type(jax_var)}'.")
 
 
-def get_jax_var_dtype(jax_var: jcore.Atom | JaCeVar) -> dace.typeclass:
+def get_jax_var_dtype(jax_var: jax_core.Atom | JaCeVar) -> dace.typeclass:
     """Returns the DaCe equivalent of `jax_var`s datatype."""
     match jax_var:
-        case jcore.Var() | jcore.Literal():
+        case jax_core.Var() | jax_core.Literal():
             return translate_dtype(jax_var.aval.dtype)
         case JaCeVar():
             return translate_dtype(jax_var.dtype)
@@ -135,12 +145,10 @@ def is_tracing_ongoing(
     Raises:
         RuntimeError: If the function fails to make a detection.
     """
-    from itertools import chain
-
     # The current implementation only checks the arguments if it contains tracers.
     if (len(args) == 0) and (len(kwargs) == 0):
         raise RuntimeError("Failed to determine if tracing is ongoing.")
-    return any(isinstance(x, jcore.Tracer) for x in chain(args, kwargs.values()))
+    return any(isinstance(x, jax_core.Tracer) for x in itertools.chain(args, kwargs.values()))
 
 
 def translate_dtype(dtype: Any) -> dace.typeclass:
@@ -168,8 +176,8 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
 
 
 def _propose_jax_name(
-    jax_var: jcore.Atom | JaCeVar,
-    jax_name_map: Mapping[jcore.Var | JaCeVar, Any] | None = None,
+    jax_var: jax_core.Atom | JaCeVar,
+    jax_name_map: Mapping[jax_core.Var | JaCeVar, Any] | None = None,
 ) -> str:
     """Proposes a variable name for `jax_var`.
 
@@ -187,11 +195,9 @@ def _propose_jax_name(
         The naming of variables are only consistent with the inner most Jaxpr a variable is defined in.
         Dropped variables will always be named `'_'`.
     """
-    from jace.util.traits import is_drop_var
-
-    if is_drop_var(jax_var):
+    if util.traits.is_drop_var(jax_var):
         return "_"
-    if isinstance(jax_var, jcore.Literal):
+    if isinstance(jax_var, jax_core.Literal):
         raise TypeError(f"Can not propose a name for literal '{jax_var}'.")
     if jax_name_map is None:
         return get_jax_var_name(jax_var)
@@ -200,7 +206,7 @@ def _propose_jax_name(
         raise RuntimeError(
             f"Can not propose a second name for '{jax_var}', it already known as '{jax_name_map[jax_var]}'."
         )
-    if isinstance(jax_var, jcore.Var):
+    if isinstance(jax_var, jax_core.Var):
         pass
     elif isinstance(jax_var, JaCeVar):
         # If the name of the JaCe variable is empty, then use the name proposing
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 417cdcb..8d3eecc 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -12,9 +12,9 @@
 from collections.abc import Iterable
 from typing import Any, TypeGuard
 
-from jax import core as jcore
+from jax import core as jax_core
 
-from jace import util as jutil
+from jace import util
 
 
 class NonStringIterable(Iterable): ...
@@ -29,21 +29,21 @@ def is_jaceified(obj: Any) -> bool:
 
     Similar to `jace.util.is_jaxified`, but for JaCe object.
     """
-    from jace import jax as jjax, util as jutil
+    from jace import jax as jjax
 
-    if jutil.is_jaxified(obj):
+    if util.is_jaxified(obj):
         return False
     # Currently it is quite simple because we can just check if `obj`
     #  is derived from `jace.jax.JitWrapped`, might become harder in the future.
     return isinstance(obj, jjax.JitWrapped)
 
 
-def is_drop_var(jax_var: jcore.Atom | jutil.JaCeVar) -> bool:
+def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> bool:
     """Tests if `jax_var` is a drop variable."""
 
-    if isinstance(jax_var, jcore.DropVar):
+    if isinstance(jax_var, jax_core.DropVar):
         return True
-    if isinstance(jax_var, jutil.JaCeVar):
+    if isinstance(jax_var, util.JaCeVar):
         return jax_var.name == "_"
     return False
 
@@ -56,13 +56,13 @@ def is_jaxified(obj: Any) -> bool:
     `False` might not proof the contrary.
     """
     import jaxlib
-    from jax._src import pjit as jaxpjit
+    from jax import _src as jax_src
 
     # These are all types we consider as jaxify
     jaxifyed_types = (
-        jcore.Primitive,
+        jax_core.Primitive,
         # jstage.Wrapped is not runtime chakable
-        jaxpjit.JitWrapped,
+        jax_src.pjit.JitWrapped,
         jaxlib.xla_extension.PjitFunction,
     )
     return isinstance(obj, jaxifyed_types)
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index 3943743..96bfa20 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -10,6 +10,8 @@
 from collections.abc import Iterable
 from typing import TypeVar, cast, overload
 
+from jace.util import traits
+
 
 _T = TypeVar("_T")
 
@@ -27,8 +29,6 @@ def as_sequence(value: _T) -> Iterable[_T]: ...
 
 
 def as_sequence(value: _T | Iterable[_T]) -> Iterable[_T]:
-    from jace.util.traits import is_non_string_iterable
-
-    if is_non_string_iterable(value):
+    if traits.is_non_string_iterable(value):
         return value
     return cast(Iterable[_T], [value])

From e2b496fa99ded0842d930a84f6c7ca62ce37b97d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 3 May 2024 14:45:46 +0200
Subject: [PATCH 096/458] Made some fixes to the verification function of the
 `TranslatedJaxprSDFG`.

---
 src/jace/translator/translated_jaxpr_sdfg.py | 12 +++++++++---
 1 file changed, 9 insertions(+), 3 deletions(-)

diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index b2b7dc8..bc1ffab 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -46,12 +46,18 @@ class TranslatedJaxprSDFG:
     def validate(self) -> bool:
         """Validate the underlying SDFG."""
 
-        # To prevent the 'non initialized' data warnings we have to temporary promote the
-        #  input arguments as global.
+        # To prevent the 'non initialized' data warnings we have to temporary
+        #  promote input and output arguments to globals
+        promote_to_glob: set[str] = set()
         org_trans_state: dict[str, bool] = {}
-        for var in self.inp_names:
+        if self.inp_names:
+            promote_to_glob.update(self.inp_names)
+        if self.out_names:
+            promote_to_glob.update(self.out_names)
+        for var in promote_to_glob:
             org_trans_state[var] = self.sdfg.arrays[var].transient
             self.sdfg.arrays[var].transient = False
+
         try:
             self.sdfg.validate()
         finally:

From c185444b4038b29cbbb0747d11c5f26b879a042a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 3 May 2024 14:40:42 +0200
Subject: [PATCH 097/458] Fixing some import names.

---
 src/jace/translator/__init__.py               |   2 -
 src/jace/translator/_translation_context.py   |  14 +--
 .../translator/jaxpr_translator_driver.py     | 119 +++++++++---------
 .../translator/sub_translators/__init__.py    |  12 +-
 .../a_primitive_translator.py}                |  14 ++-
 .../sub_translators/alu_translator.py         |  15 ++-
 src/jace/translator/translated_jaxpr_sdfg.py  |   6 +-
 src/jace/util/debug.py                        |  12 +-
 src/jace/util/jax_helper.py                   |  45 ++++---
 src/jace/util/traits.py                       |  10 +-
 src/jace/util/util.py                         |   6 +-
 11 files changed, 132 insertions(+), 123 deletions(-)
 rename src/jace/translator/{primitive_translator.py => sub_translators/a_primitive_translator.py} (90%)

diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 8ca5476..d6bb0c7 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -10,12 +10,10 @@
 from __future__ import annotations
 
 from .jaxpr_translator_driver import JaxprTranslationDriver
-from .primitive_translator import PrimitiveTranslator
 from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
 
 __all__ = [
-    "PrimitiveTranslator",
     "JaxprTranslationDriver",
     "TranslatedJaxprSDFG",
 ]
diff --git a/src/jace/translator/_translation_context.py b/src/jace/translator/_translation_context.py
index a0c1854..6d9c43f 100644
--- a/src/jace/translator/_translation_context.py
+++ b/src/jace/translator/_translation_context.py
@@ -12,9 +12,9 @@
 from collections.abc import MutableMapping, Sequence
 
 import dace
-from jax import core as jcore
+from jax import core as jax_core
 
-from jace import translator as jtrans, util as jutil
+from jace import translator, util
 
 
 class _TranslationContext:
@@ -70,7 +70,7 @@ def __init__(
             rev_idx:    The revision index of the context.
             name:       Name of the SDFG object.
         """
-        if isinstance(name, str) and not jutil._VALID_SDFG_OBJ_NAME.fullmatch(name):
+        if isinstance(name, str) and not util._VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
         self._sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
@@ -78,14 +78,14 @@ def __init__(
             label="initial_state", is_start_block=True
         )
         self._terminal_state: dace.SDFGState = self._start_state
-        self._jax_name_map: MutableMapping[jcore.Var | jutil.JaCeVar, str] = {}
+        self._jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str] = {}
         self._inp_names: tuple[str, ...] = ()
         self._out_names: tuple[str, ...] = ()
         self._rev_idx: int = rev_idx
 
-    def to_translated_jaxpr_sdfg(self) -> jtrans.TranslatedJaxprSDFG:
+    def to_translated_jaxpr_sdfg(self) -> translator.TranslatedJaxprSDFG:
         """Transforms `self` into a `TranslatedJaxprSDFG`."""
-        return jtrans.TranslatedJaxprSDFG(
+        return translator.TranslatedJaxprSDFG(
             sdfg=self._sdfg,
             start_state=self._start_state,
             terminal_state=self._terminal_state,
@@ -114,7 +114,7 @@ def terminal_state(
         self._terminal_state = new_term_state
 
     @property
-    def jax_name_map(self) -> MutableMapping[jcore.Var | jutil.JaCeVar, str]:
+    def jax_name_map(self) -> MutableMapping[jax_core.Var | util.JaCeVar, str]:
         return self._jax_name_map
 
     @property
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index c6fdb46..5b01fd2 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -14,9 +14,10 @@
 import dace
 import jax
 from dace import data as ddata, properties as dprop
-from jax import core as jcore
+from jax import core as jax_core
 
-from jace import translator as jtrans, util as jutil
+from jace import translator, util
+from jace.translator import sub_translators
 
 
 class JaxprTranslationDriver:
@@ -81,7 +82,7 @@ def __init__(
         #  They are partitioned by the names of the primitive they have registered for.
         #  This member is allocated by '_init_sub_translators()' and remains allocated
         #  during the lifetime of the object.
-        self._sub_translators: dict[str, jtrans.PrimitiveTranslator] = None  # type: ignore[assignment]
+        self._sub_translators: dict[str, translator.PrimitiveTranslator] = None  # type: ignore[assignment]
 
         # These names can not be used for the automatic naming of Jax variables.
         #  They differ from the forbidden names, that they denote valid SDFG names.
@@ -104,14 +105,14 @@ def __init__(
 
     def translate_jaxpr(
         self,
-        jaxpr: jcore.ClosedJaxpr,
+        jaxpr: jax_core.ClosedJaxpr,
         *,
         inp_scalar_as_array: bool = False,
         name: str | None = None,
         reserved_names: str | Collection[str] | None = None,
         allow_empty_jaxpr: bool = False,
         **kwargs: Any,
-    ) -> jtrans.TranslatedJaxprSDFG:
+    ) -> translator.TranslatedJaxprSDFG:
         """Perform the translation of a Jaxpr into a SDFG.
 
         In case this function is called and `self` has an ongoing translation process, a new translation context will be created.
@@ -134,7 +135,7 @@ def translate_jaxpr(
         """
         if (len(jaxpr.eqns) == 0) and (not allow_empty_jaxpr):
             raise ValueError("Passed an empty Jaxpr, but did not allow for empty Jaxpr.")
-        if not isinstance(jaxpr, jcore.ClosedJaxpr):
+        if not isinstance(jaxpr, jax_core.ClosedJaxpr):
             raise TypeError(f"Expected a 'jax.core.ClosedJaxp' instance but got '{type(jaxpr)}'")
         if len(jaxpr.effects) != 0:
             raise NotImplementedError("'Jaxpr' with side effects are not supported.")
@@ -162,7 +163,7 @@ def translate_jaxpr(
             jaxpr=jaxpr,
             inp_scalar_as_array=inp_scalar_as_array,
         )
-        jsdfg: jtrans.TranslatedJaxprSDFG = self._translate_jaxpr_internal(jaxpr)
+        jsdfg: translator.TranslatedJaxprSDFG = self._translate_jaxpr_internal(jaxpr)
 
         # If the translation context is not cleared `self` and `jsdfg` will share the same data.
         #  There is some legitimate use for that.
@@ -195,7 +196,7 @@ def append_new_state(
             prev_state:     Alternative `SDFGState` at which we should append the new state.
 
         """
-        if isinstance(label, str) and (not jutil._VALID_SDFG_OBJ_NAME.fullmatch(label)):
+        if isinstance(label, str) and (not util._VALID_SDFG_OBJ_NAME.fullmatch(label)):
             raise ValueError(f"Can not create state with label '{label}' since it is invalid.")
 
         # Decide if appending to that state will modify the terminal state.
@@ -228,7 +229,7 @@ def get_arrays(self) -> Mapping[str, ddata.Data]:
 
     def get_array(
         self,
-        name: str | jcore.Atom | jutil.JaCeVar,
+        name: str | jax_core.Atom | util.JaCeVar,
     ) -> ddata.Data:
         """Returns the SDFG `Data` object `name` referees to.
 
@@ -237,7 +238,7 @@ def get_array(
         """
         if isinstance(name, str):
             sdfg_name: str = name
-        elif isinstance(name, (jcore.Var, jutil.JaCeVar)):
+        elif isinstance(name, (jax_core.Var, util.JaCeVar)):
             sdfg_name = self.map_jax_var_to_sdfg(name)
         else:
             raise TypeError(f"Does not know how to handle '{type(name).__name__}'.")
@@ -248,19 +249,19 @@ def get_array(
     @overload
     def map_jax_var_to_sdfg(
         self,
-        jax_var: str | jcore.Atom | jutil.JaCeVar,
+        jax_var: str | jax_core.Atom | util.JaCeVar,
     ) -> str: ...
 
     @overload
     def map_jax_var_to_sdfg(
         self,
-        jax_var: str | jcore.Atom | jutil.JaCeVar,
+        jax_var: str | jax_core.Atom | util.JaCeVar,
         allow_fail: bool,
     ) -> str | None: ...
 
     def map_jax_var_to_sdfg(
         self,
-        jax_var: str | jcore.Atom | jutil.JaCeVar,
+        jax_var: str | jax_core.Atom | util.JaCeVar,
         allow_fail: bool = False,
     ) -> str | None:
         """Get the _name_ of the SDFG variable to which `jax_var` is referring to.
@@ -273,7 +274,7 @@ def map_jax_var_to_sdfg(
         """
         if isinstance(jax_var, str):
             sdfg_name: str = jax_var
-        elif isinstance(jax_var, jcore.Literal):
+        elif isinstance(jax_var, jax_core.Literal):
             raise RuntimeError("There is no SDFG variable for literal '{jax_var}'.")
         elif jax_var in self._ctx.jax_name_map:
             sdfg_name = self._ctx.jax_name_map[jax_var]
@@ -336,7 +337,7 @@ def get_rev_idx(self) -> int:
 
     def add_jax_name_mapping(
         self,
-        jax_var: jcore.Var | jutil.JaCeVar,
+        jax_var: jax_core.Var | util.JaCeVar,
         sdfg_name: str,
     ) -> JaxprTranslationDriver:
         """Creates a mapping between `jax_var` to `sdfg_name`.
@@ -384,7 +385,7 @@ def add_reserved_names(
             raise TypeError(f"Does not know how to handle the type '{type(reserved_names)}'.")
         for rev_name in reserved_names:
             assert isinstance(rev_name, str)
-            if not jutil._VALID_SDFG_VAR_NAME.fullmatch(rev_name):
+            if not util._VALID_SDFG_VAR_NAME.fullmatch(rev_name):
                 raise ValueError(
                     f"Can not use '{rev_name}' as reserved name as it is not a valid SDFG name."
                 )
@@ -393,7 +394,7 @@ def add_reserved_names(
 
     def add_array(
         self,
-        arg: jcore.Atom | jutil.JaCeVar,
+        arg: jax_core.Atom | util.JaCeVar,
         *,
         as_transient: bool = True,
         alt_name: str | None = None,
@@ -471,8 +472,8 @@ def add_array(
         """
         assert self.is_allocated()
 
-        shape: Sequence[int] = jutil.get_jax_var_shape(arg)
-        dtype = jutil.get_jax_var_dtype(arg)
+        shape: Sequence[int] = util.get_jax_var_shape(arg)
+        dtype = util.get_jax_var_dtype(arg)
         offset = None  # i.e. no offset
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
         is_scalar: bool = shape == ()
@@ -493,7 +494,7 @@ def add_array(
                 raise ValueError(
                     f"Specified 'force_jax_name', but passed '{name_prefix}' as 'name_prefix'."
                 )
-            alt_name = jutil._propose_jax_name(arg, self._ctx.jax_name_map)
+            alt_name = util._propose_jax_name(arg, self._ctx.jax_name_map)
         if alt_name is not None:
             assert isinstance(
                 alt_name, str
@@ -503,7 +504,7 @@ def add_array(
                 raise ValueError("Passed an empty 'alt_name'.")
             if alt_name in self._forbidden_names:
                 raise ValueError("'alt_name' is a forbidden name.")
-            if not jutil._VALID_SDFG_VAR_NAME.fullmatch(alt_name):
+            if not util._VALID_SDFG_VAR_NAME.fullmatch(alt_name):
                 raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
             if name_prefix is not None:
                 raise ValueError(
@@ -536,8 +537,8 @@ def add_array(
         #  Depending on the situation, we will further manipulate it.
         if alt_name is not None:
             prop_name = alt_name  # Just for completion: will be ignored later
-        elif isinstance(arg, (jcore.Var, jutil.JaCeVar)):
-            prop_name = jutil._propose_jax_name(arg, self._ctx.jax_name_map)
+        elif isinstance(arg, (jax_core.Var, util.JaCeVar)):
+            prop_name = util._propose_jax_name(arg, self._ctx.jax_name_map)
             if prop_name.startswith("__"):
                 raise ValueError(
                     f"You tried to create the variable '{prop_name}' which"
@@ -545,7 +546,7 @@ def add_array(
                 )
             if name_prefix is not None:
                 prop_name = name_prefix + prop_name
-        elif isinstance(arg, jcore.Literal):  # type: ignore[unreachable]
+        elif isinstance(arg, jax_core.Literal):  # type: ignore[unreachable]
             if not allow_literals:
                 raise NotImplementedError("Jax Literals are not supported.")
             if alt_name is None:
@@ -590,7 +591,7 @@ def add_array(
             raise ValueError(f"Can't create variable '{arg_name}', name is forbidden.")
         if arg_name in self._ctx.sdfg.arrays:
             raise ValueError(f"Can't create variable '{arg_name}', variable is already created.")
-        if not jutil._VALID_SDFG_VAR_NAME.fullmatch(arg_name):
+        if not util._VALID_SDFG_VAR_NAME.fullmatch(arg_name):
             raise ValueError(f"The requested variable name '{arg_name}' is invalid.")
 
         # Promotion of scalar to array.
@@ -642,7 +643,7 @@ def add_array(
 
     def create_jax_var_list(
         self,
-        jax_var_list: Sequence[jcore.Atom | jutil.JaCeVar],
+        jax_var_list: Sequence[jax_core.Atom | util.JaCeVar],
         prevent_creation: bool = False,
         only_creation: bool = False,
         handle_literals: bool = False,
@@ -677,11 +678,11 @@ def create_jax_var_list(
 
         ret_list: list[None | str] = []
         for jax_var in jax_var_list:
-            if isinstance(jax_var, jcore.Literal):
+            if isinstance(jax_var, jax_core.Literal):
                 if not handle_literals:
                     raise ValueError("Encountered a literal but `handle_literals` was `False`.")
                 sdfg_name = None
-            elif isinstance(jax_var, (jcore.Var, jutil.JaCeVar)):
+            elif isinstance(jax_var, (jax_core.Var, util.JaCeVar)):
                 mapped_sdfg_name: str | None = self.map_jax_var_to_sdfg(jax_var, allow_fail=True)
                 if (mapped_sdfg_name is None) and prevent_creation:
                     raise ValueError(f"'prevent_creation' given but have to create '{jax_var}'.")
@@ -702,7 +703,7 @@ def create_jax_var_list(
 
     def _create_initial_input(
         self,
-        jaxpr: jcore.ClosedJaxpr,
+        jaxpr: jax_core.ClosedJaxpr,
         inp_scalar_as_array: bool,
     ) -> Sequence[str]:
         """This function will create the internal input variables that are used for the SDFG.
@@ -744,7 +745,7 @@ def _create_initial_input(
 
     def _create_constants(
         self,
-        jaxpr: jcore.ClosedJaxpr,
+        jaxpr: jax_core.ClosedJaxpr,
     ) -> Sequence[str]:
         """Creates all constants requested by the `jaxpr`.
 
@@ -825,21 +826,21 @@ def _init_sub_translators(
         The function forwards `kwargs` to the constructor of the subtranslators.
         However, it will remove all arguments starting with an underscore.
         """
-        from jace.translator.sub_translators import _get_subtranslators_cls  # Avoid import cycle
-
         assert self._sub_translators is None
 
         subtrans_args = {k: v for k, v in subtrans_args.items() if not k.startswith("_")}  # type: ignore[unreachable]
-        sub_translators: dict[str, jtrans.PrimitiveTranslator] = {}
-        for sub_translator_cls in _get_subtranslators_cls():
-            sub_translator: jtrans.PrimitiveTranslator = sub_translator_cls.CREATE(**subtrans_args)
-            handled_primitives: Iterable[str] = jutil.as_sequence(sub_translator.primitive)
+        prim_translators: dict[str, translator.PrimitiveTranslator] = {}
+        for prim_translator_cls in sub_translators._get_subtranslators_cls():
+            prim_translator: translator.PrimitiveTranslator = prim_translator_cls.CREATE(
+                **subtrans_args
+            )
+            handled_primitives: Iterable[str] = util.as_sequence(prim_translator.primitive)
 
             for handled_primitive in handled_primitives:
-                if handled_primitive in sub_translators:
-                    raise RuntimeError(f"Multiple sub_translators for '{handled_primitive}' found.")
-                sub_translators[handled_primitive] = sub_translator
-        self._sub_translators = sub_translators
+                if handled_primitive in prim_translators:
+                    raise RuntimeError(f"Multiple sub translators for '{handled_primitive}' found.")
+                prim_translators[handled_primitive] = prim_translator
+        self._sub_translators = prim_translators
 
         return self
 
@@ -872,8 +873,8 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
 
     def _find_sub_translator_for(
         self,
-        eqn: jcore.JaxprEqn,
-    ) -> jtrans.PrimitiveTranslator:
+        eqn: jax_core.JaxprEqn,
+    ) -> translator.PrimitiveTranslator:
         """Returns the appropriate subtranslator for equation `eqn`."""
         assert self._sub_translators is not None
 
@@ -885,8 +886,8 @@ def _find_sub_translator_for(
 
     def _translate_single_eqn(
         self,
-        jaxpr: jcore.ClosedJaxpr,
-        eqn: jcore.JaxprEqn,
+        jaxpr: jax_core.ClosedJaxpr,
+        eqn: jax_core.JaxprEqn,
     ) -> tuple[Sequence[str | None], Sequence[str]]:
         """Translate `eqn` into its SDFG equivalent.
 
@@ -904,8 +905,8 @@ def _translate_single_eqn(
             While `jaxpr` must be a `ClosedJaxpr`, `eqn` must come from the unclosed instance.
             The function will perform some consistency checking after the subtranslator was called.
         """
-        assert isinstance(eqn, jcore.JaxprEqn)
-        assert isinstance(jaxpr, jcore.ClosedJaxpr)
+        assert isinstance(eqn, jax_core.JaxprEqn)
+        assert isinstance(jaxpr, jax_core.ClosedJaxpr)
 
         if len(eqn.effects) != 0:
             raise NotImplementedError(f"Equation '{eqn}' has side effects.")
@@ -925,7 +926,7 @@ def _translate_single_eqn(
         )
 
         # Find the subtranslator
-        subtranslator: jtrans.PrimitiveTranslator = self._find_sub_translator_for(eqn)
+        subtranslator: translator.PrimitiveTranslator = self._find_sub_translator_for(eqn)
 
         # Create the state into which the equation should be translated
         last_term_state: dace.SDFGState = self.get_terminal_sdfg_state()  # noqa: F841 # Will be used later
@@ -963,7 +964,7 @@ def _translate_single_eqn(
             )
         for expectedSDFGName, jax_var in zip(out_var_names, eqn.outvars, strict=True):
             mapped_sdfg_name = self.map_jax_var_to_sdfg(jax_var)
-            jax_name = jutil.get_jax_var_name(jax_var)
+            jax_name = util.get_jax_var_name(jax_var)
             if mapped_sdfg_name != expectedSDFGName:
                 raise ValueError(
                     f"Mapping inconsistency detected, expected that Jax variable"
@@ -980,13 +981,13 @@ def _translate_single_eqn(
                 pass
             elif isinstance(sdfg_var, dace.data.View):
                 raise TypeError(
-                    f"For Jax variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}'),"
+                    f"For Jax variable '{util.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}'),"
                     f" which is an output, you used a View, which is not possible."
                     " It must either be an array or a scalar."
                 )
             else:
                 raise NotImplementedError(
-                    f"Output variable '{jutil.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}')"
+                    f"Output variable '{util.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}')"
                     f" is of type '{type(sdfg_var).__name__}' which I does not know how to handle."
                 )
 
@@ -997,8 +998,8 @@ def _translate_single_eqn(
 
     def _translate_jaxpr_internal(
         self,
-        jaxpr: jcore.ClosedJaxpr,
-    ) -> jtrans.TranslatedJaxprSDFG:
+        jaxpr: jax_core.ClosedJaxpr,
+    ) -> translator.TranslatedJaxprSDFG:
         """Performs the actual translation of the Jaxpr into an SDFG.
 
         The function assumes that the context is allocated as well as initial variables.
@@ -1014,7 +1015,7 @@ def _translate_jaxpr_internal(
                 this is used by Jax to indicate that they are never read.
                 Such variables are included by some transformations such as `grad()`.
         """
-        assert isinstance(jaxpr, jcore.ClosedJaxpr)
+        assert isinstance(jaxpr, jax_core.ClosedJaxpr)
         assert self.is_allocated()
 
         nb_translated_eqn: int = 0
@@ -1023,9 +1024,9 @@ def _translate_jaxpr_internal(
             assert len(eqn.effects) == 0
             if len(eqn.outvars) == 0:  # Do we need this special case.
                 continue  #  Looks more like internal Jax error.
-            if any(jutil.is_drop_var(outVar) for outVar in eqn.outvars):
+            if any(util.is_drop_var(outVar) for outVar in eqn.outvars):
                 assert (len(eqn.outvars) == 1) or all(
-                    jutil.is_drop_var(outVar) for outVar in eqn.outvars
+                    util.is_drop_var(outVar) for outVar in eqn.outvars
                 )
                 continue
             _, out_var_names = self._translate_single_eqn(jaxpr=jaxpr, eqn=eqn)
@@ -1038,7 +1039,7 @@ def _translate_jaxpr_internal(
 
         return self._export_context()
 
-    def _export_context(self) -> jtrans.TranslatedJaxprSDFG:
+    def _export_context(self) -> translator.TranslatedJaxprSDFG:
         """Encapsulate the translation context of `self` into a `TranslatedJaxprSDFG` object..
 
         This function will not deallocate the internal context of `self`.
@@ -1049,7 +1050,7 @@ def _export_context(self) -> jtrans.TranslatedJaxprSDFG:
         assert all((isinstance(x, str) and (len(x) > 0)) for x in self._ctx.inp_names)
         assert all((isinstance(x, str) and (len(x) > 0)) for x in self._ctx.out_names)
 
-        return jtrans.TranslatedJaxprSDFG(
+        return translator.TranslatedJaxprSDFG(
             sdfg=self._ctx.sdfg,
             start_state=self._ctx.start_state,
             terminal_state=self._ctx.terminal_state,
@@ -1060,7 +1061,7 @@ def _export_context(self) -> jtrans.TranslatedJaxprSDFG:
 
     def _handle_null_jaxpr(
         self,
-        jaxpr: jcore.ClosedJaxpr,
+        jaxpr: jax_core.ClosedJaxpr,
     ) -> Sequence[str]:
         """This function is called in case a `Jaxpr` with zero equations is encountered.
 
@@ -1092,7 +1093,7 @@ def _handle_null_jaxpr(
         #  Thus we have to introduce a some fake output name and explicitly copy the data around.
         #  Once DaCe will inline the nested SDFG it will remove this intermediate copy.
         for jax_out_var in jaxpr.jaxpr.outvars:
-            jax_inp_name = jutil.get_jax_var_name(
+            jax_inp_name = util.get_jax_var_name(
                 jax_out_var
             )  # Since output == input their names must be the same.
             assert self.map_jax_var_to_sdfg(jax_inp_name, allow_fail=True)
diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
index 7019076..88c239c 100644
--- a/src/jace/translator/sub_translators/__init__.py
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -4,25 +4,24 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
-
 """Module collecting all built-in subtranslators."""
 
 from __future__ import annotations
 
 from collections.abc import Sequence
 
-from jace import translator as jtrans
-from jace.translator.sub_translators.alu_translator import ALUTranslator
+from .a_primitive_translator import PrimitiveTranslator  # has to be the first import.
+from .alu_translator import ALUTranslator
 
 
 # List of all subtranslators that ships with JaCe.
-_KNOWN_SUBTRANSLATORS: list[type[jtrans.PrimitiveTranslator]] = [
+_KNOWN_SUBTRANSLATORS: list[type[PrimitiveTranslator]] = [
     ALUTranslator,
 ]
 
 
 def add_subtranslator(
-    subtrans: type[jtrans.PrimitiveTranslator],
+    subtrans: type[PrimitiveTranslator],
 ) -> bool:
     """Add `subtrans` to the externally defined subtranslators.
 
@@ -37,7 +36,7 @@ def add_subtranslator(
     return True
 
 
-def _get_subtranslators_cls() -> Sequence[type[jtrans.PrimitiveTranslator]]:
+def _get_subtranslators_cls() -> Sequence[type[PrimitiveTranslator]]:
     """Returns the list of all subtranslator known to JaCe.
 
     The translators are returned in FIFO order.
@@ -48,4 +47,5 @@ def _get_subtranslators_cls() -> Sequence[type[jtrans.PrimitiveTranslator]]:
 __all__ = [
     "ALUTranslator",
     "add_subtranslator",
+    "PrimitiveTranslator",
 ]
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/sub_translators/a_primitive_translator.py
similarity index 90%
rename from src/jace/translator/primitive_translator.py
rename to src/jace/translator/sub_translators/a_primitive_translator.py
index 816b709..16d2d4b 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/sub_translators/a_primitive_translator.py
@@ -4,6 +4,14 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
+"""Contains the interface for all primitive subtranslators.
+
+Note the name of this file is because it has to be the first that is imported in the `__init__.py` file.
+If not, we would get a cyclic import error.
+However, all attempts to prevent ruff from mindlessly (rule abiding) destroying this orders failed.
+Thus the name was changed to enforce this.
+If you have the solution, feel free to implement it.
+"""
 
 from __future__ import annotations
 
@@ -12,7 +20,7 @@
 from typing import TYPE_CHECKING, Any, Protocol, runtime_checkable
 
 import dace
-from jax import core as jcore
+from jax import core as jax_core
 
 
 if TYPE_CHECKING:
@@ -21,7 +29,7 @@
 
 @runtime_checkable
 class PrimitiveTranslator(Protocol):
-    """Interface for all Jax primitive subtranslators.
+    """Interface for all Jax primitive translators, also known as subtranslator.
 
     A translator for a primitive translates a single equation of a Jaxpr into its SDFG equivalent.
     A type that implements this interface must fulfil the following properties:
@@ -66,7 +74,7 @@ def translate_jaxeqn(
         driver: JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
         out_var_names: Sequence[str],
-        eqn: jcore.JaxprEqn,
+        eqn: jax_core.JaxprEqn,
         eqn_state: dace.SDFGState,
     ) -> dace.SDFGState | None:
         """Translates the Jax primitive into its SDFG equivalent.
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index b08e474..f397bb3 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -14,14 +14,13 @@
 
 import dace
 import numpy as np
-from jax import core as jcore
+from jax import core as jax_core
 from typing_extensions import override
 
-from jace import translator as jtranslator
+from jace.translator import sub_translators
 
 
-class ALUTranslator(jtranslator.PrimitiveTranslator):
-    # class ALUTranslator(PrimitiveTranslator):
+class ALUTranslator(sub_translators.PrimitiveTranslator):
     """This translator handles all arithmetic and logical operations."""
 
     __slots__ = ()
@@ -92,10 +91,10 @@ def primitive(self) -> Sequence[str]:
     @override
     def translate_jaxeqn(
         self,
-        driver: jtranslator.JaxprTranslationDriver,
+        driver: sub_translators.JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
         out_var_names: Sequence[str],
-        eqn: jcore.JaxprEqn,
+        eqn: jax_core.JaxprEqn,
         eqn_state: dace.SDFGState,
     ) -> None:
         """Perform the translation.
@@ -244,7 +243,7 @@ def translate_jaxeqn(
     def _writeTaskletCode(
         self,
         in_var_names: Sequence[str | None],
-        eqn: jcore.JaxprEqn,
+        eqn: jax_core.JaxprEqn,
     ) -> str:
         """This function generates the Tasklet code based on a primitive.
 
@@ -284,7 +283,7 @@ def _writeTaskletCode(
             if in_var_name is not None:
                 continue
 
-            jax_in_var: jcore.Literal = cast(jcore.Literal, eqn.invars[i])
+            jax_in_var: jax_core.Literal = cast(jax_core.Literal, eqn.invars[i])
             if jax_in_var.aval.shape == ():
                 t_val = jax_in_var.val
                 if isinstance(t_val, np.ndarray):
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index bc1ffab..3a3bb6b 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -12,9 +12,9 @@
 from typing import Any
 
 import dace
-from jax import core as jcore
+from jax import core as jax_core
 
-from jace import util as jutil
+from jace import util
 
 
 @dataclass(init=True, repr=True, eq=False, frozen=False, kw_only=True, slots=True)
@@ -37,7 +37,7 @@ class TranslatedJaxprSDFG:
     """
 
     sdfg: dace.SDFG
-    jax_name_map: Mapping[jcore.Var | jutil.JaCeVar, str]
+    jax_name_map: Mapping[jax_core.Var | util.JaCeVar, str]
     start_state: dace.SDFGState | None = None
     terminal_state: dace.SDFGState | None = None
     inp_names: Sequence[str] | None = None
diff --git a/src/jace/util/debug.py b/src/jace/util/debug.py
index b3a84f3..27c57aa 100644
--- a/src/jace/util/debug.py
+++ b/src/jace/util/debug.py
@@ -13,18 +13,16 @@
 from __future__ import annotations
 
 from collections.abc import Callable
-from typing import TYPE_CHECKING, Any
+from typing import Any
 
 import dace
 import jax
 
-
-if TYPE_CHECKING:
-    from jace import translator as jtrans
+from jace import translator
 
 
 def run_jax_sdfg(
-    jsdfg: jtrans.TranslatedJaxprSDFG,
+    jsdfg: translator.TranslatedJaxprSDFG,
     *args: Any,
 ) -> tuple[Any, ...] | Any:
     """Calls the SDFG that is encapsulated with the supplied arguments.
@@ -97,9 +95,7 @@ def _jace_run(
         *args:      Forwarded to the tracing and final execution of the SDFG.
         **kwargs:   Used to construct the driver.
     """
-    from jace.translator import JaxprTranslationDriver
-
     jaxpr = jax.make_jaxpr(fun)(*args)
-    driver = JaxprTranslationDriver(**kwargs)
+    driver = translator.JaxprTranslationDriver(**kwargs)
     jsdfg = driver.translate_jaxpr(jaxpr)
     return run_jax_sdfg(jsdfg, *args)
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 5bd7596..80018fc 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -17,10 +17,10 @@
 
 from collections.abc import Mapping
 from dataclasses import dataclass
-from typing import Any
+from typing import Any, overload
 
 import dace
-import jax.core as jcore
+import jax.core as jax_core
 import numpy as np
 
 from jace import util
@@ -36,14 +36,13 @@ class JaCeVar:
 
     Notes:
         Main intention is to test functionality.
-        While for a Jax `Var` object the name is rather irrelevant, `JaCeVar` use their name.
         If the name of a `JaCeVar` is '_' it is considered a drop variable.
         If the name of a `JaCeVar` is empty, the automatic naming will consider it as a Jax variable.
         The definition of `__hash__` and `__eq__` is in accordance how Jax variable works.
     """
 
     name: str
-    shape: tuple[int | dace.symbol | str, ...] | int | dace.symbol | str | tuple[()]
+    shape: tuple[int | dace.symbol | str, ...] | tuple[()]
     dtype: dace.typeclass
 
     def __hash__(self) -> int:
@@ -59,7 +58,7 @@ def __post_init__(self) -> None:
             raise ValueError("The 'shape' member of a 'JaCeVar' must be a tuple.")
 
 
-def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
+def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar | str) -> str:
     """Returns the name of the Jax variable as a string.
 
     Args:
@@ -70,19 +69,19 @@ def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
         This function is subject for removal.
     """
     match jax_var:
-        case jcore.DropVar():
+        case jax_core.DropVar():
             return "_"
         case JaCeVar():
             # In case of an empty name consider the jace variable as a Jax variable.
             #  This is mostly for testing.
             jax_name = f"jax{id(jax_var)}" if jax_var.name == "" else jax_var.name
-        case jcore.Var():
+        case jax_core.Var():
             # This stopped working after version 0.20.4, because of some changes in Jax
             #  See `https://github.com/google/jax/pull/10573` for more information.
             #  The following implementation will generate stable names, however, they will be decoupled
             #  from output of the pretty printed Jaxpr
             jax_name = f"jax{jax_var.count}{jax_var.suffix}"
-        case jcore.Literal():
+        case jax_core.Literal():
             raise TypeError("Can not derive a name from a Jax Literal.")
         case str():
             jax_name = jax_var
@@ -97,14 +96,24 @@ def get_jax_var_name(jax_var: jcore.Atom | JaCeVar | str) -> str:
     return jax_name
 
 
-def get_jax_var_shape(jax_var: jcore.Atom | JaCeVar) -> tuple[int, ...]:
+@overload
+def get_jax_var_shape(jax_var: JaCeVar) -> tuple[int | dace.symbol | str, ...] | tuple[()]: ...
+
+
+@overload
+def get_jax_var_shape(jax_var: jax_core.Atom) -> tuple[int, ...] | tuple[()]: ...
+
+
+def get_jax_var_shape(
+    jax_var: jax_core.Atom | JaCeVar,
+) -> tuple[int | dace.symbol | str, ...] | tuple[()]:
     """Returns the shape of a Jax variable.
 
     Args:
         jax_var:     The variable to process
     """
     match jax_var:
-        case jcore.Var() | jcore.Literal():
+        case jax_core.Var() | jax_core.Literal():
             return jax_var.aval.shape
         case JaCeVar():
             return jax_var.shape
@@ -112,10 +121,10 @@ def get_jax_var_shape(jax_var: jcore.Atom | JaCeVar) -> tuple[int, ...]:
             raise TypeError(f"'get_jax_var_shape()` is not implemented for '{type(jax_var)}'.")
 
 
-def get_jax_var_dtype(jax_var: jcore.Atom | JaCeVar) -> dace.typeclass:
+def get_jax_var_dtype(jax_var: jax_core.Atom | JaCeVar) -> dace.typeclass:
     """Returns the DaCe equivalent of `jax_var`s datatype."""
     match jax_var:
-        case jcore.Var() | jcore.Literal():
+        case jax_core.Var() | jax_core.Literal():
             return translate_dtype(jax_var.aval.dtype)
         case JaCeVar():
             return translate_dtype(jax_var.dtype)
@@ -148,8 +157,8 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
 
 
 def _propose_jax_name(
-    jax_var: jcore.Atom | JaCeVar,
-    jax_name_map: Mapping[jcore.Var | JaCeVar, Any] | None = None,
+    jax_var: jax_core.Atom | JaCeVar,
+    jax_name_map: Mapping[jax_core.Var | JaCeVar, Any] | None = None,
 ) -> str:
     """Proposes a variable name for `jax_var`.
 
@@ -167,11 +176,9 @@ def _propose_jax_name(
         The naming of variables are only consistent with the inner most Jaxpr a variable is defined in.
         Dropped variables will always be named `'_'`.
     """
-    from jace.util.traits import is_drop_var
-
-    if is_drop_var(jax_var):
+    if util.traits.is_drop_var(jax_var):
         return "_"
-    if isinstance(jax_var, jcore.Literal):
+    if isinstance(jax_var, jax_core.Literal):
         raise TypeError(f"Can not propose a name for literal '{jax_var}'.")
     if jax_name_map is None:
         return get_jax_var_name(jax_var)
@@ -180,7 +187,7 @@ def _propose_jax_name(
         raise RuntimeError(
             f"Can not propose a second name for '{jax_var}', it already known as '{jax_name_map[jax_var]}'."
         )
-    if isinstance(jax_var, jcore.Var):
+    if isinstance(jax_var, jax_core.Var):
         pass
     elif isinstance(jax_var, JaCeVar):
         # If the name of the JaCe variable is empty, then use the name proposing
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 247c999..1e063c8 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -12,9 +12,9 @@
 from collections.abc import Iterable
 from typing import Any, TypeGuard
 
-from jax import core as jcore
+from jax import core as jax_core
 
-from jace import util as jutil
+from jace import util
 
 
 class NonStringIterable(Iterable): ...
@@ -24,11 +24,11 @@ def is_non_string_iterable(val: Any) -> TypeGuard[NonStringIterable]:
     return isinstance(val, Iterable) and not isinstance(val, str)
 
 
-def is_drop_var(jax_var: jcore.Atom | jutil.JaCeVar) -> bool:
+def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> bool:
     """Tests if `jax_var` is a drop variable."""
 
-    if isinstance(jax_var, jcore.DropVar):
+    if isinstance(jax_var, jax_core.DropVar):
         return True
-    if isinstance(jax_var, jutil.JaCeVar):
+    if isinstance(jax_var, util.JaCeVar):
         return jax_var.name == "_"
     return False
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index 3943743..96bfa20 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -10,6 +10,8 @@
 from collections.abc import Iterable
 from typing import TypeVar, cast, overload
 
+from jace.util import traits
+
 
 _T = TypeVar("_T")
 
@@ -27,8 +29,6 @@ def as_sequence(value: _T) -> Iterable[_T]: ...
 
 
 def as_sequence(value: _T | Iterable[_T]) -> Iterable[_T]:
-    from jace.util.traits import is_non_string_iterable
-
-    if is_non_string_iterable(value):
+    if traits.is_non_string_iterable(value):
         return value
     return cast(Iterable[_T], [value])

From f139a180a7e15f373602f2d1f8f445fc870a8df0 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 6 May 2024 07:19:58 +0200
Subject: [PATCH 098/458] Updated the translation context class.

It is now less complex.
---
 src/jace/translator/_translation_context.py | 101 ++++----------------
 1 file changed, 21 insertions(+), 80 deletions(-)

diff --git a/src/jace/translator/_translation_context.py b/src/jace/translator/_translation_context.py
index 6d9c43f..15dd47f 100644
--- a/src/jace/translator/_translation_context.py
+++ b/src/jace/translator/_translation_context.py
@@ -9,7 +9,7 @@
 
 from __future__ import annotations
 
-from collections.abc import MutableMapping, Sequence
+from collections.abc import MutableMapping
 
 import dace
 from jax import core as jax_core
@@ -50,13 +50,13 @@ class _TranslationContext:
     """
 
     __slots__ = (
-        "_sdfg",
-        "_start_state",
-        "_terminal_state",
-        "_jax_name_map",
-        "_inp_names",
-        "_out_names",
-        "_rev_idx",
+        "sdfg",
+        "start_state",
+        "terminal_state",
+        "jax_name_map",
+        "inp_names",
+        "out_names",
+        "rev_idx",
     )
 
     def __init__(
@@ -73,82 +73,23 @@ def __init__(
         if isinstance(name, str) and not util._VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
-        self._sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
-        self._start_state: dace.SDFGState = self._sdfg.add_state(
+        self.sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
+        self.start_state: dace.SDFGState = self.sdfg.add_state(
             label="initial_state", is_start_block=True
         )
-        self._terminal_state: dace.SDFGState = self._start_state
-        self._jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str] = {}
-        self._inp_names: tuple[str, ...] = ()
-        self._out_names: tuple[str, ...] = ()
-        self._rev_idx: int = rev_idx
+        self.terminal_state: dace.SDFGState = self.start_state
+        self.jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str] = {}
+        self.inp_names: tuple[str, ...] = ()
+        self.out_names: tuple[str, ...] = ()
+        self.rev_idx: int = rev_idx
 
     def to_translated_jaxpr_sdfg(self) -> translator.TranslatedJaxprSDFG:
         """Transforms `self` into a `TranslatedJaxprSDFG`."""
         return translator.TranslatedJaxprSDFG(
-            sdfg=self._sdfg,
-            start_state=self._start_state,
-            terminal_state=self._terminal_state,
-            jax_name_map=self._jax_name_map,
-            inp_names=self._inp_names,
-            out_names=self._out_names,
+            sdfg=self.sdfg,
+            start_state=self.start_state,
+            terminal_state=self.terminal_state,
+            jax_name_map=self.jax_name_map,
+            inp_names=self.inp_names,
+            out_names=self.out_names,
         )
-
-    @property
-    def sdfg(self) -> dace.SDFG:
-        return self._sdfg
-
-    @property
-    def start_state(self) -> dace.SDFGState:
-        return self._start_state
-
-    @property
-    def terminal_state(self) -> dace.SDFGState:
-        return self._terminal_state
-
-    @terminal_state.setter
-    def terminal_state(
-        self,
-        new_term_state: dace.SDFGState,
-    ) -> None:
-        self._terminal_state = new_term_state
-
-    @property
-    def jax_name_map(self) -> MutableMapping[jax_core.Var | util.JaCeVar, str]:
-        return self._jax_name_map
-
-    @property
-    def inp_names(self) -> tuple[str, ...]:
-        return self._inp_names
-
-    @inp_names.setter
-    def inp_names(
-        self,
-        inp_names: Sequence[str],
-    ) -> None:
-        if isinstance(inp_names, str):
-            self._inp_names = (inp_names,)
-        elif isinstance(inp_names, tuple):
-            self._inp_names = inp_names
-        else:
-            self._inp_names = tuple(inp_names)
-
-    @property
-    def out_names(self) -> tuple[str, ...]:
-        return self._out_names
-
-    @out_names.setter
-    def out_names(
-        self,
-        out_names: Sequence[str],
-    ) -> None:
-        if isinstance(out_names, str):
-            self._out_names = (out_names,)
-        elif isinstance(out_names, tuple):
-            self._out_names = out_names
-        else:
-            self._out_names = tuple(out_names)
-
-    @property
-    def rev_idx(self) -> int:
-        return self._rev_idx

From aa4516badaea7e450f5f05286e00d7ee1b8f5068 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 6 May 2024 07:19:58 +0200
Subject: [PATCH 099/458] Updated the translation context class.

It is now less complex.
---
 src/jace/translator/_translation_context.py | 101 ++++----------------
 1 file changed, 21 insertions(+), 80 deletions(-)

diff --git a/src/jace/translator/_translation_context.py b/src/jace/translator/_translation_context.py
index 6d9c43f..15dd47f 100644
--- a/src/jace/translator/_translation_context.py
+++ b/src/jace/translator/_translation_context.py
@@ -9,7 +9,7 @@
 
 from __future__ import annotations
 
-from collections.abc import MutableMapping, Sequence
+from collections.abc import MutableMapping
 
 import dace
 from jax import core as jax_core
@@ -50,13 +50,13 @@ class _TranslationContext:
     """
 
     __slots__ = (
-        "_sdfg",
-        "_start_state",
-        "_terminal_state",
-        "_jax_name_map",
-        "_inp_names",
-        "_out_names",
-        "_rev_idx",
+        "sdfg",
+        "start_state",
+        "terminal_state",
+        "jax_name_map",
+        "inp_names",
+        "out_names",
+        "rev_idx",
     )
 
     def __init__(
@@ -73,82 +73,23 @@ def __init__(
         if isinstance(name, str) and not util._VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
-        self._sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
-        self._start_state: dace.SDFGState = self._sdfg.add_state(
+        self.sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
+        self.start_state: dace.SDFGState = self.sdfg.add_state(
             label="initial_state", is_start_block=True
         )
-        self._terminal_state: dace.SDFGState = self._start_state
-        self._jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str] = {}
-        self._inp_names: tuple[str, ...] = ()
-        self._out_names: tuple[str, ...] = ()
-        self._rev_idx: int = rev_idx
+        self.terminal_state: dace.SDFGState = self.start_state
+        self.jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str] = {}
+        self.inp_names: tuple[str, ...] = ()
+        self.out_names: tuple[str, ...] = ()
+        self.rev_idx: int = rev_idx
 
     def to_translated_jaxpr_sdfg(self) -> translator.TranslatedJaxprSDFG:
         """Transforms `self` into a `TranslatedJaxprSDFG`."""
         return translator.TranslatedJaxprSDFG(
-            sdfg=self._sdfg,
-            start_state=self._start_state,
-            terminal_state=self._terminal_state,
-            jax_name_map=self._jax_name_map,
-            inp_names=self._inp_names,
-            out_names=self._out_names,
+            sdfg=self.sdfg,
+            start_state=self.start_state,
+            terminal_state=self.terminal_state,
+            jax_name_map=self.jax_name_map,
+            inp_names=self.inp_names,
+            out_names=self.out_names,
         )
-
-    @property
-    def sdfg(self) -> dace.SDFG:
-        return self._sdfg
-
-    @property
-    def start_state(self) -> dace.SDFGState:
-        return self._start_state
-
-    @property
-    def terminal_state(self) -> dace.SDFGState:
-        return self._terminal_state
-
-    @terminal_state.setter
-    def terminal_state(
-        self,
-        new_term_state: dace.SDFGState,
-    ) -> None:
-        self._terminal_state = new_term_state
-
-    @property
-    def jax_name_map(self) -> MutableMapping[jax_core.Var | util.JaCeVar, str]:
-        return self._jax_name_map
-
-    @property
-    def inp_names(self) -> tuple[str, ...]:
-        return self._inp_names
-
-    @inp_names.setter
-    def inp_names(
-        self,
-        inp_names: Sequence[str],
-    ) -> None:
-        if isinstance(inp_names, str):
-            self._inp_names = (inp_names,)
-        elif isinstance(inp_names, tuple):
-            self._inp_names = inp_names
-        else:
-            self._inp_names = tuple(inp_names)
-
-    @property
-    def out_names(self) -> tuple[str, ...]:
-        return self._out_names
-
-    @out_names.setter
-    def out_names(
-        self,
-        out_names: Sequence[str],
-    ) -> None:
-        if isinstance(out_names, str):
-            self._out_names = (out_names,)
-        elif isinstance(out_names, tuple):
-            self._out_names = out_names
-        else:
-            self._out_names = tuple(out_names)
-
-    @property
-    def rev_idx(self) -> int:
-        return self._rev_idx

From 458c72139270ff7bc8000d8bd4e9a92d529f7239 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 6 May 2024 07:41:27 +0200
Subject: [PATCH 100/458] Updated the function to translate a dtype from Jax to
 DaCe.

I found this function `canonicalize_dtype()` function in Jax.
However, it does not realy worked.
Nevertheless I tried to keep the code to keel it as kind of documentation.
---
 src/jace/util/jax_helper.py | 22 ++++++++++++++++------
 1 file changed, 16 insertions(+), 6 deletions(-)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index f6f5347..ef5e91a 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -22,6 +22,7 @@
 
 import dace
 import jax.core as jax_core
+import jax.dtypes as jax_dtypes
 import numpy as np
 
 from jace import util
@@ -167,12 +168,21 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
     try:
         return dace.dtype_to_typeclass(dtype)
     except KeyError:
-        dtype_name = str(dtype)
-        if hasattr(dace.dtypes, dtype_name):
-            return getattr(dace.dtypes, dtype_name)
-        if hasattr(np, dtype_name):
-            dtype = getattr(np, dtype)
-            return dace.dtype_to_typeclass(dtype)
+        pass
+
+    try:
+        dtype_ = jax_dtypes.canonicalize_dtype(dtype)
+        return dace.dtype_to_typeclass(dtype_)
+    except Exception:
+        pass
+
+    dtype_name = str(dtype)
+    if hasattr(dace.dtypes, dtype_name):
+        return getattr(dace.dtypes, dtype_name)
+    if hasattr(np, dtype_name):
+        dtype = getattr(np, dtype)
+        return dace.dtype_to_typeclass(dtype)
+    raise ValueError(f"Unable to translate '{dtype}' ino a DaCe dtype.")
 
 
 def _propose_jax_name(

From a817bf4c9450c3b31d5a847819b1e8d027731d1a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 6 May 2024 13:39:52 +0200
Subject: [PATCH 101/458] The `TranslatedJaxprSDFG` object now also has a field
 to store the compiled SDFG object.

---
 src/jace/translator/translated_jaxpr_sdfg.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 3a3bb6b..d5ddd6f 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -28,6 +28,7 @@ class TranslatedJaxprSDFG:
     - `terminal_state` the last state in the state machine.
     - `inp_names` a `list` of the SDFG variables that are used as input, in the same order as `Jaxpr.invars`.
     - `out_names` a `list` of the SDFG variables that are used as output, in the same order as `Jaxpr.outvars`.
+    - `csdfg` a compiled SDFG object; Optional might be empyt.
 
     The SDFG is in a so called canonical form, that is not directly usable, see `JaxprTranslationDriver` for more.
 
@@ -42,6 +43,7 @@ class TranslatedJaxprSDFG:
     terminal_state: dace.SDFGState | None = None
     inp_names: Sequence[str] | None = None
     out_names: Sequence[str] | None = None
+    csdfg: dace.CompiledSDFG | None = None
 
     def validate(self) -> bool:
         """Validate the underlying SDFG."""

From d8e8f1c953c457a605d1fea857b48532b638ffb1 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 6 May 2024 13:47:16 +0200
Subject: [PATCH 102/458] Updated the `debug` module.

The function now make use of the new `csdfg` field of the `TranslatedJaxprSDFG` object.
Furthermore, the compilation and run part are now split into separate functions.
---
 src/jace/util/__init__.py |   3 +-
 src/jace/util/debug.py    | 168 +++++++++++++++++++++++++++++---------
 2 files changed, 130 insertions(+), 41 deletions(-)

diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index b9865b9..9da254b 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -9,7 +9,7 @@
 
 from __future__ import annotations
 
-from .debug import _jace_run, run_jax_sdfg
+from .debug import _jace_run, compile_jax_sdfg, run_jax_sdfg
 from .jax_helper import (
     JaCeVar,
     _propose_jax_name,
@@ -26,6 +26,7 @@
 
 __all__ = [
     "as_sequence",
+    "compile_jax_sdfg",
     "is_drop_var",
     "is_tracing_ongoing",
     "is_jaceified",
diff --git a/src/jace/util/debug.py b/src/jace/util/debug.py
index 27c57aa..80b281d 100644
--- a/src/jace/util/debug.py
+++ b/src/jace/util/debug.py
@@ -12,7 +12,8 @@
 
 from __future__ import annotations
 
-from collections.abc import Callable
+from collections.abc import Callable, Sequence
+from functools import singledispatch
 from typing import Any
 
 import dace
@@ -21,39 +22,129 @@
 from jace import translator
 
 
-def run_jax_sdfg(
-    jsdfg: translator.TranslatedJaxprSDFG,
-    *args: Any,
-) -> tuple[Any, ...] | Any:
-    """Calls the SDFG that is encapsulated with the supplied arguments.
+def compile_jax_sdfg(
+    jsdfg: translator.TranslatedJaxprSDFG, force: bool = False, save: bool = True
+) -> dace.CompiledSDFG:
+    """This function compiles the embedded SDFG and return it.
+
+    The SDFG is compiled in a very special way, i.e. all arguments and return values have to be passed as arguments.
+
+    Before doing anything the function will inspect the `csdfg` filed of the `TranslatedJaxprSDFG`.
+    If it is not `None` the function will return this value.
+    This can be disabled by setting `focre` to `True`.
+    If the SDFG is compiled the function will store the compiled SDFG inside the `TranslatedJaxprSDFG` object's `csdfg` field.
+    However, by setting `save` to `False` the field will not be modified.
+
+    Args:
+        force:      Force compilation even if the `csdfg` field is already set.
+        save:       Store the compiled SDFG inside the `TranslatedJaxprSDFG` object's `csdfg` field.
 
     Notes:
         Currently the SDFG must not have any undefined symbols, i.e. no undefined sizes.
-        Currently denoted arguments are not fully respected.
         The function either returns a value or a tuple of values, i.e. no tree.
     """
-    from dace.data import Array, Data, Scalar, make_array_from_descriptor
-
-    # This is a simplification that makes our life simply
+    if not jsdfg.inp_names:
+        raise ValueError("The passed SDFG did not had any input arguments.")
+    if not jsdfg.out_names:
+        raise ValueError("The passed SDFG did not had any output arguments.")
+    if any(out_name.startswith("__return") for out_name in jsdfg.out_names):
+        raise NotImplementedError("No return statement is supported yet.")
+
+    if (not force) and (jsdfg.csdfg is not None):
+        assert isinstance(jsdfg.csdfg, dace.CompiledSDFG)
+        return jsdfg.csdfg
+
+    # This is a simplification that makes our life simply.
+    #  However, we should consider lifting it at some point.
     if len(jsdfg.sdfg.free_symbols) != 0:
         raise ValueError(
             f"No externally defined symbols are allowed, found: {jsdfg.sdfg.free_symbols}"
         )
-    if len(jsdfg.inp_names) != len(args):
-        raise ValueError(
-            f"Wrong numbers of arguments expected {len(jsdfg.inp_names)} got {len(args)}."
-        )
 
-    # We use a return by reference approach, for calling the SDFG
+    # Canonical SDFGs do not have global memory, so we must transform it; undo afterwards
+    prev_trans_state: dict[str, bool] = {}
+    for glob_name in jsdfg.inp_names + jsdfg.out_names:  # type: ignore[operator]  # concatenation
+        if glob_name in prev_trans_state:  # Donated arguments
+            continue
+        prev_trans_state[glob_name] = jsdfg.sdfg.arrays[glob_name].transient
+        jsdfg.sdfg.arrays[glob_name].transient = False
+
+    try:
+        csdfg: dace.CompiledSDFG = jsdfg.sdfg.compile()
+        if save:
+            jsdfg.csdfg = csdfg
+        return csdfg
+
+    finally:
+        # Restore the initial transient state
+        for var_name, trans_state in prev_trans_state.items():
+            jsdfg.sdfg.arrays[var_name].transient = trans_state
+
+
+@singledispatch
+def run_jax_sdfg(
+    jsdfg: translator.TranslatedJaxprSDFG,
+    /,
+    *args: Any,
+    **kwargs: Any,
+) -> tuple[Any, ...] | Any:
+    """Run the `TranslatedJaxprSDFG` object.
+
+    If the `TranslatedJaxprSDFG` object does not contain a precompiled SDFG object the function will compile it.
+    However, the compiled SDFG will not be cached in the `TranslatedJaxprSDFG` object.
+    """
+    if jsdfg.inp_names is None:
+        raise ValueError("Input names are not specified.")
+    if jsdfg.out_names is None:
+        raise ValueError("Output names are not specified.")
+
+    if jsdfg.csdfg is not None:
+        csdfg: dace.CompiledSDFG = jsdfg.csdfg
+    else:
+        csdfg = compile_jax_sdfg(jsdfg, save=False)
+    return run_jax_sdfg(
+        csdfg,
+        jsdfg.inp_names,
+        jsdfg.out_names,
+        *args,
+        **kwargs,
+    )
+
+
+@run_jax_sdfg.register(dace.CompiledSDFG)
+def _(
+    csdfg: dace.CompiledSDFG,
+    inp_names: Sequence[str],
+    out_names: Sequence[str],
+    /,
+    *args: Any,
+    **kwargs: Any,
+) -> tuple[Any, ...] | Any:
+    """Call the compiled SDFG.
+
+    The function assumes that the SDFG was compiled in accordance with `compile_jax_sdfg()`
+    """
+    from dace.data import Array, Data, Scalar, make_array_from_descriptor
+
+    if len(inp_names) != len(args):
+        raise RuntimeError("Wrong number of arguments.")
+    if len(kwargs) != 0:
+        raise NotImplementedError("No kwargs are supported yet.")
+
+    sdfg: dace.SDFG = csdfg.sdfg
+
+    # Build the argument list that we will pass to the compiled object.
     call_args: dict[str, Any] = {}
-    for in_name, in_val in zip(jsdfg.inp_names, args):
+    for in_name, in_val in zip(inp_names, args):
         call_args[in_name] = in_val
-    for out_name in jsdfg.out_names:
-        sarray: Data = jsdfg.sdfg.arrays[out_name]
-        assert out_name not in call_args
+    for out_name in out_names:
+        assert not ((out_name == "__return") or (out_name.startswith("__return_")))  # noqa: PT018 # Assert split
 
-        if (out_name == "__return") or (out_name.startswith("__return_")):
+        if out_name in call_args:  # Donated arguments
+            assert out_name in inp_names
             continue
+
+        sarray: Data = sdfg.arrays[out_name]
         if isinstance(sarray, Scalar):
             raise NotImplementedError("Scalars as return values are not supported.")
         if isinstance(sarray, Array):
@@ -61,27 +152,24 @@ def run_jax_sdfg(
         else:
             raise NotImplementedError(f"Can not handle '{type(sarray).__name__}' as output.")
 
-    # Canonical SDFGs do not have global memory, so we must transform it.
-    #  We will afterwards undo it.
-    for glob_name in jsdfg.inp_names + jsdfg.out_names:  # type: ignore[operator]  # concatenation
-        jsdfg.sdfg.arrays[glob_name].transient = False
-
-    try:
-        csdfg: dace.CompiledSDFG = jsdfg.sdfg.compile()
-        with dace.config.temporary_config():
-            dace.Config.set("compiler", "allow_view_arguments", value=True)
-            csdfg(**call_args)
-
-        if len(jsdfg.out_names) == 0:
-            return None
-        ret_val: tuple[Any] = tuple(call_args[out_name] for out_name in jsdfg.out_names)
-        if len(jsdfg.out_names) == 1:
-            return ret_val[0]
-        return ret_val
+    if len(call_args) != len(csdfg.argnames):
+        raise ValueError(
+            "Failed to construct the call arguments,"
+            f" expected {len(csdfg.argnames)} but got {len(call_args)}."
+        )
 
-    finally:
-        for name in jsdfg.inp_names + jsdfg.out_names:  # type: ignore[operator]  # concatenation
-            jsdfg.sdfg.arrays[name].transient = True
+    # Calling the SDFG
+    with dace.config.temporary_config():
+        dace.Config.set("compiler", "allow_view_arguments", value=True)
+        csdfg(**call_args)
+
+    # Handling the output (pytrees are missing)
+    if len(out_names) == 0:
+        return None
+    ret_val: tuple[Any] = tuple(call_args[out_name] for out_name in out_names)
+    if len(out_names) == 1:
+        return ret_val[0]
+    return ret_val
 
 
 def _jace_run(

From 7d0eb2a29e12e3ee8085ca7362ab1c3f301b0885 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 6 May 2024 14:17:22 +0200
Subject: [PATCH 103/458] Blocked all static arguments.

---
 src/jace/jax/api.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
index c7f1a2a..337b564 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/jax/api.py
@@ -23,6 +23,11 @@ def jit(
     """Creates a jit wrapper instance."""
     import jax
 
+    if any(
+        kwargs.get(static, None) is not None for static in ["static_argnums", "static_argnames"]
+    ):
+        raise NotImplementedError("Static arguments are not yet supported.")
+
     if fun is None:
         assert len(kwargs) > 0
 

From 160e9ccab17a5abe8d7b5a4fd8a0e74cf78df388 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 6 May 2024 14:18:52 +0200
Subject: [PATCH 104/458] Updated the whole stage stuff in jace.

It is now a copy of Jax and I must say it is much cleaner now.
However, the imports are not that nice yet, since actually everything should be in the same package, however, I do not like the idea.
---
 src/jace/jax/__init__.py                     |  18 +-
 src/jace/jax/api.py                          |  28 +--
 src/jace/jax/api_helper.py                   | 206 -------------------
 src/jace/jax/jace_compiled.py                |  61 ++++++
 src/jace/jax/jace_jitted.py                  |  69 +++++++
 src/jace/jax/jace_lowered.py                 |  73 +++++++
 src/jace/jax/stages.py                       | 182 ++++++++++++++++
 src/jace/translator/translated_jaxpr_sdfg.py |   3 +-
 src/jace/util/dace_helper.py                 |   8 +
 src/jace/util/debug.py                       |  34 +--
 src/jace/util/traits.py                      |   4 +-
 11 files changed, 449 insertions(+), 237 deletions(-)
 delete mode 100644 src/jace/jax/api_helper.py
 create mode 100644 src/jace/jax/jace_compiled.py
 create mode 100644 src/jace/jax/jace_jitted.py
 create mode 100644 src/jace/jax/jace_lowered.py
 create mode 100644 src/jace/jax/stages.py

diff --git a/src/jace/jax/__init__.py b/src/jace/jax/__init__.py
index de56d5d..ea2c0ff 100644
--- a/src/jace/jax/__init__.py
+++ b/src/jace/jax/__init__.py
@@ -10,11 +10,25 @@
 from __future__ import annotations
 
 from .api import grad, jacfwd, jacrev, jit
-from .api_helper import JitWrapped
+from .jace_compiled import JaceCompiled
+from .jace_jitted import JaceWrapped
+from .jace_lowered import JaceLowered
+from .stages import (  # type: ignore[attr-defined] # not explicit exported
+    Compiled,
+    CompilerOptions,
+    Lowered,
+    Wrapped,
+)
 
 
 __all__ = [
-    "JitWrapped",
+    "Compiled",
+    "CompilerOptions",
+    "JaceWrapped",
+    "JaceLowered",
+    "JaceCompiled",
+    "Lowered",
+    "Wrapped",
     "jit",
     "jacfwd",
     "jacrev",
diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
index 337b564..cdb154e 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/jax/api.py
@@ -19,7 +19,7 @@ def jit(
     fun: Callable | None = None,
     /,
     **kwargs: Any,
-) -> jjax.JitWrapped:
+) -> jjax.JaceWrapped:
     """Creates a jit wrapper instance."""
     import jax
 
@@ -31,7 +31,7 @@ def jit(
     if fun is None:
         assert len(kwargs) > 0
 
-        def wrapper(f: Callable) -> jjax.JitWrapped:
+        def wrapper(f: Callable) -> jjax.JaceWrapped:
             return jit(f, **kwargs)
 
         return wrapper  # type: ignore[return-value]
@@ -39,65 +39,65 @@ def wrapper(f: Callable) -> jjax.JitWrapped:
     # in case we are dealing with a JaCe object, we first unwrap it.
     #  Recursion to handle arbitrary deep nestings.
     if util.is_jaceified(fun):
-        fun = cast(jjax.JitWrapped, fun)
+        fun = cast(jjax.JaceWrapped, fun)
         return jit(fun.__wrapped__)
 
     # Prevents the creation of a level of unnecessary jit.
     #  Probably better solution by using the `disable_jit()`?
     if len(kwargs) == 0:
-        return jjax.JitWrapped(fun)
-    return jjax.JitWrapped(jax.jit(fun, **kwargs))
+        return jjax.JaceWrapped(fun)
+    return jjax.JaceWrapped(jax.jit(fun, **kwargs))
 
 
 def grad(
     fun: Callable | None = None,
     /,
     **kwargs: Any,
-) -> jjax.JitWrapped:
+) -> jjax.JaceWrapped:
     """The gradient transformation."""
     import jax
 
     if fun is None:
 
-        def wrapper(f: Callable) -> jjax.JitWrapped:
+        def wrapper(f: Callable) -> jjax.JaceWrapped:
             return grad(f, **kwargs)
 
         return wrapper  # type: ignore[return-value]
 
-    return jjax.JitWrapped(jax.grad(fun, **kwargs))
+    return jjax.JaceWrapped(jax.grad(fun, **kwargs))
 
 
 def jacfwd(
     fun: Callable | None = None,
     /,
     **kwargs: Any,
-) -> jjax.JitWrapped:
+) -> jjax.JaceWrapped:
     """Returns the Jacobian of `fun` in forward differentiation mode."""
     import jax
 
     if fun is None:
 
-        def wrapper(f: Callable) -> jjax.JitWrapped:
+        def wrapper(f: Callable) -> jjax.JaceWrapped:
             return jacfwd(f, **kwargs)
 
         return wrapper  # type: ignore[return-value]
 
-    return jjax.JitWrapped(jax.jacfwd(fun, **kwargs))
+    return jjax.JaceWrapped(jax.jacfwd(fun, **kwargs))
 
 
 def jacrev(
     fun: Callable | None = None,
     /,
     **kwargs: Any,
-) -> jjax.JitWrapped:
+) -> jjax.JaceWrapped:
     """Returns the Jacobian of `fun` in reverse differentiation mode."""
     import jax
 
     if fun is None:
 
-        def wrapper(f: Callable) -> jjax.JitWrapped:
+        def wrapper(f: Callable) -> jjax.JaceWrapped:
             return jacrev(f, **kwargs)
 
         return wrapper  # type: ignore[return-value]
 
-    return jjax.JitWrapped(jax.jacrev(fun, **kwargs))
+    return jjax.JaceWrapped(jax.jacrev(fun, **kwargs))
diff --git a/src/jace/jax/api_helper.py b/src/jace/jax/api_helper.py
deleted file mode 100644
index 936f5ee..0000000
--- a/src/jace/jax/api_helper.py
+++ /dev/null
@@ -1,206 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Helper functionality for `jace.jax.jit()`."""
-
-from __future__ import annotations
-
-from functools import lru_cache
-from typing import TYPE_CHECKING, Any
-
-import dace
-import jax
-
-from jace import util
-
-
-if TYPE_CHECKING:
-    from jace import translator
-
-
-class JitWrapped:
-    """Result class of all jited functions.
-
-    It is essentially a wrapper around an already jited, i.e. passed to a Jax primitive function.
-    The function is then able to compile it if needed.
-    However, the wrapped object is itself again tracable, thus it does not break anything.
-
-    Todo:
-        Implement a compile cache (shape, data type, strides, location).
-        Turn this into a primitive.
-        Handles pytrees.
-    """
-
-    def __init__(
-        self,
-        jax_prim: Any,  # No idea if there is a better type.
-    ) -> None:
-        """Creates a wrapped jace jitable object of `jax_prim`."""
-        assert jax_prim is not None
-        self._fun = jax_prim
-        self._tran_count = 0
-
-    def __call__(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> Any:
-        """Compile and run the wrapped function.
-
-        In case `self` is called by Jax during a trace, the call will
-        transparently forwarded to the wrapped function.
-        This guarantees that `self` itself is traceable.
-        """
-
-        if util.is_tracing_ongoing(*args, **kwargs):
-            return self._forward_trace(*args, **kwargs)
-        return self._call_sdfg(*args, **kwargs)
-
-    def _forward_trace(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> Any:
-        """Is called by `self.__call__` if a trace operation was detected.
-
-        I.e. it will simply forward the call to the wrapped function.
-        """
-        if len(kwargs) != 0:
-            raise RuntimeError("Passed kwargs, which are not allowed in tracing.")
-        return self._fun(*args, **kwargs)
-
-    def _call_sdfg(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> Any:
-        """Compiles and run the wrapped function.
-
-        Notes:
-            Currently no caching of the compiled object is done.
-        """
-        jsdfg: translator.TranslatedJaxprSDFG = self._get_translated_sdfg(*args, **kwargs)
-        return util.run_jax_sdfg(jsdfg, *args)
-
-    def _get_translated_sdfg(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> translator.TranslatedJaxprSDFG:
-        """This function returns the `TranslatedJaxprSDFG` object.
-
-        The function will transform its arguments into `_ArgInfo` versions.
-        This is needed since Jax only cares about the information stored inside it.
-        The positional only arguments are used to cache the settings important for Jax
-        and the kwonly arguments are used to influence the Jaxpr to SDFG translator.
-
-        Notes:
-            It is forbidden to permanently modify the returned translated SDFG.
-                Doing so results in undefined behaviour.
-        """
-        from jace.translator import JaxprTranslationDriver
-
-        # TODO(phimuell): This is only to make the API tests pass with the half implemented cache.
-        try:
-            return self._get_translated_sdfg_cached(
-                *(_ArgInfo.from_value(v) for v in args),
-                **kwargs,
-            )
-        except NotImplementedError:
-            jaxpr = jax.make_jaxpr(self.__wrapped__)(*args)
-            driver = JaxprTranslationDriver(**kwargs)
-            return driver.translate_jaxpr(jaxpr)
-
-    @lru_cache
-    def _get_translated_sdfg_cached(
-        self,
-        *args: _ArgInfo,
-        **kwargs: Any,
-    ) -> translator.TranslatedJaxprSDFG:
-        """Generates the SDFG from
-
-        Todo:
-            Also make the SDFG compiled and permanent also in the translated SDFG object; maybe.
-            Implement a better cache that avoids using this strange way to pass values around.
-
-        Notes:
-            It is forbidden to permanently modify the returned translated SDFG.
-                Doing so results in undefined behaviour.
-        """
-        from jace.translator import JaxprTranslationDriver
-
-        real_args: tuple[Any, ...] = tuple(x._get_val_once() for x in args)
-        jaxpr = jax.make_jaxpr(self.__wrapped__)(*real_args)
-        driver = JaxprTranslationDriver(**kwargs)
-        return driver.translate_jaxpr(jaxpr)
-
-    @property
-    def __wrapped__(self) -> Any:
-        """Returns the wrapped object."""
-        return self._fun
-
-    def __hash__(self) -> int:
-        """Hash based on the wrapped function (needed for caching)."""
-        return hash(self.__wrapped__)
-
-    def __eq__(self, other: Any) -> bool:
-        """Wrapped function based equality testing (needed for caching)."""
-        if not isinstance(other, JitWrapped):
-            return False
-        return self.__wrapped__ == other.__wrapped__
-
-
-class _ArgInfo:
-    """Abstracts argument for the case of the `JitWrapped` object.
-
-    Essentially represents a single argument.
-    To construct it use the `from_value()` function.
-
-    Notes:
-        An `_ArgInfo` instance also keeps a reference to the value that was used to construct it.
-            However this value can only retrieved once and is removed afterwards.
-            Conceptionally it should be a weak reerence, but several classes (especially `int`
-            and `float` can not be weakly referenced.
-    """
-
-    shape: tuple[int, ...]
-    strides: tuple[int, ...]
-    dtype: dace.typeclass
-    location: dace.StorageType  # We only need CPU and GPU.
-    _val: Any | None  # May not be allocated.
-
-    def __init__(self, *args: Any, **kwargs: Any) -> None:
-        """To construct an `_ArgInfo` instance use `from_val()`."""
-        raise NotImplementedError("Use '_ArgInfo.from_value()' to construct an instance.")
-
-    def __hash__(self) -> int:
-        return hash((self.shape, self.strides, self.dtype, self.location))
-
-    def __eq__(self, other: Any) -> bool:
-        if not isinstance(other, _ArgInfo):
-            return False
-        return (self.shape, self.strides, self.dtype, self.location) == (
-            (other.shape, other.strides, other.dtype, other.location)
-        )
-
-    def _get_val_once(self) -> Any:
-        """Returns the wrapped object.
-
-        This function only works for a single time.
-        Calling it will null the reference of `self`.
-        """
-        if self._val is None:
-            raise RuntimeError("Value was already consumed.")
-        val = self._val
-        self._val = None
-        return val
-
-    @classmethod
-    def from_value(cls, val: Any) -> _ArgInfo:
-        """Constructs an `_ArgInfo` instance from `val`."""
-        arginfo: _ArgInfo = cls.__new__(cls)
-        raise NotImplementedError("'_ArgInfo.from_value()' is not implemented.")
diff --git a/src/jace/jax/jace_compiled.py b/src/jace/jax/jace_compiled.py
new file mode 100644
index 0000000..4d64db9
--- /dev/null
+++ b/src/jace/jax/jace_compiled.py
@@ -0,0 +1,61 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implementation of the `jace.jax.stages.Compiled` stage for Jace."""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+from typing import Any
+
+from jace import util
+from jace.jax import stages
+from jace.util import dace_helper as jdace
+
+
+class JaceCompiled(stages.Compiled):
+    """Compiled version of the SDFG.
+
+    Todo:
+        Handle pytrees.
+    """
+
+    __slots__ = (
+        "_csdfg",
+        "_inp_names",
+        "_out_names",
+    )
+
+    _csdfg: jdace.CompiledSDFG  # The compiled SDFG object.
+    _inp_names: tuple[str, ...]  # Name of all input arguments.
+    _out_names: tuple[str, ...]  # Name of all output arguments.
+
+    def __init__(
+        self,
+        csdfg: jdace.CompiledSDFG,
+        inp_names: Sequence[str],
+        out_names: Sequence[str],
+    ) -> None:
+        if (len(inp_names) == 0) or (len(out_names) == 0):
+            raise ValueError("Input and output can not be empty.")
+        self._csdfg = csdfg
+        self._inp_names = tuple(inp_names)
+        self._out_names = tuple(out_names)
+
+    def __call__(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> Any:
+        """Calls the embedded computation."""
+        return util.run_jax_sdfg(
+            self._csdfg,
+            self._inp_names,
+            self._out_names,
+            *args,
+            **kwargs,
+        )
diff --git a/src/jace/jax/jace_jitted.py b/src/jace/jax/jace_jitted.py
new file mode 100644
index 0000000..d8f5bce
--- /dev/null
+++ b/src/jace/jax/jace_jitted.py
@@ -0,0 +1,69 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implementation of the `jace.jax.stages.Wrapped` protocol."""
+
+from __future__ import annotations
+
+from collections.abc import Callable
+from typing import Any
+
+from jace import jax as jjax, translator
+from jace.jax import stages
+
+
+class JaceWrapped(stages.Wrapped):
+    """Result class of all jited functions in Jace.
+
+    It is essentially a wrapper around an already jited, i.e. passed to a Jax primitive function.
+    The function is then able to compile it if needed.
+    However, the wrapped object is itself again tracable, thus it does not break anything.
+
+    Todo:
+        Handles pytrees.
+        Configuration of the driver?
+        Copy the `jax._src.pjit.make_jit()` functionality to remove `jax.make_jaxpr()`.
+    """
+
+    __slots__ = ("fun_",)
+
+    _fun: Callable
+
+    def __init__(
+        self,
+        fun: Callable,
+    ) -> None:
+        """Creates a wrapped jace jitable object of `jax_prim`."""
+        assert fun is not None
+        self._fun: Callable = fun
+
+    def lower(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> jjax.Lowered:
+        """Lower this function explicitly for the given arguments.
+
+        Performs the first two steps of the AOT steps described above,
+        i.e. transformation into Jaxpr and then to SDFG.
+        The result is encapsulated into a `Lowered` object.
+        """
+        import jax as jax_jax
+
+        if len(kwargs) != 0:
+            raise NotImplementedError("Currently only positional arguments are supported.")
+        # TODO(phimuell): Handle pytrees.
+        real_args: tuple[Any, ...] = args
+        jaxpr = jax_jax.make_jaxpr(self._fun)(*real_args)
+        driver = translator.JaxprTranslationDriver()
+        translated_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
+        return jjax.JaceLowered(translated_sdfg)
+
+    @property
+    def __wrapped__(self) -> Any:
+        """Returns the wrapped object."""
+        return self._fun
diff --git a/src/jace/jax/jace_lowered.py b/src/jace/jax/jace_lowered.py
new file mode 100644
index 0000000..3a27e8e
--- /dev/null
+++ b/src/jace/jax/jace_lowered.py
@@ -0,0 +1,73 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implementation of the `jace.jax.stages.Lowered` stage for Jace."""
+
+from __future__ import annotations
+
+from typing import Any
+
+from typing_extensions import override
+
+from jace import jax as jjax, translator, util
+from jace.jax import stages
+from jace.util import dace_helper as jdace
+
+
+class JaceLowered(stages.Lowered):
+    """Represents the original computation that was lowered to SDFG."""
+
+    __slots__ = ("_translated_sdfg",)
+
+    _translated_sdfg: translator.TranslatedJaxprSDFG
+
+    def __init__(
+        self,
+        translated_sdfg: translator.TranslatedJaxprSDFG,
+    ) -> None:
+        """Constructs the wrapper."""
+        if translated_sdfg.inp_names is None:
+            raise ValueError("Input names must be defined.")
+        if translated_sdfg.out_names is None:
+            raise ValueError("Output names must be defined.")
+        self._translated_sdfg = translated_sdfg
+
+    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
+        if (dialect is None) or (dialect.upper() == "SDFG"):
+            return self._translated_sdfg
+        raise ValueError(f"Unknown dialect '{dialect}'.")
+
+    @override
+    def optimize(
+        self,
+        **kwargs: Any,
+    ) -> jjax.JaceLowered:
+        """Perform optimization _inplace_ and return `self`.
+
+        Currently no optimization is done, thus `self` is returned unmodified.
+        """
+        return self
+
+    @override
+    def compile(
+        self,
+        compiler_options: jjax.CompilerOptions | None = None,
+    ) -> jjax.JaceCompiled:
+        """Compile the SDFG.
+
+        Returns an Object that encapsulates a
+        """
+        csdfg: jdace.CompiledSDFG = util.compile_jax_sdfg(
+            self._translated_sdfg,
+            force=True,
+            save=False,
+        )
+        return jjax.JaceCompiled(
+            csdfg=csdfg,
+            inp_names=self._translated_sdfg.inp_names,  # type: ignore[arg-type]  # init guarantees this
+            out_names=self._translated_sdfg.out_names,  # type: ignore[arg-type]
+        )
diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
new file mode 100644
index 0000000..d323327
--- /dev/null
+++ b/src/jace/jax/stages.py
@@ -0,0 +1,182 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Reimplementation of the `jax.stages` module.
+
+The module either imports or reimplements Jax classes.
+In case classes/functions are reimplemented they might be slightly different to fit their usage within Jace.
+
+As in Jax Jace has different stages, the terminology is taken from [Jax' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
+- Stage out:
+    In this phase we translate an executable python function into Jaxpr.
+- Lower:
+    This will transform the Jaxpr into an SDFG equivalent.
+    As a implementation note, currently this and the previous step are handled as a single step.
+- Compile:
+    This will turn the SDFG into an executable object, see `dace.codegen.CompiledSDFG`.
+- Execution:
+    This is the actual running of the computation.
+"""
+
+from __future__ import annotations
+
+import json
+from abc import abstractmethod
+from collections.abc import Callable
+from typing import Any, Protocol
+
+from jax._src import stages as jax_stages
+from jax.stages import CompilerOptions
+
+from jace import translator, util
+
+
+class Stage(jax_stages.Stage):
+    """A distinct step in the compilation chain, see module description.
+
+    This class inherent from its Jax counterpart.
+    """
+
+
+class Wrapped(Protocol):
+    """A function ready to be specialized, lowered, and compiled.
+
+    This protocol reflects the output of functions such as `jax.jit`.
+    Calling it results in jit (just-in-time) lowering, compilation, and execution.
+    It can also be explicitly lowered prior to compilation, and the result compiled prior to execution.
+
+    Notes:
+        Reimplementation of `jax.stages.Wrapped` protocol.
+    """
+
+    def __call__(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> Any:
+        """Executes the wrapped function, lowering and compiling as needed in one step."""
+
+        # This allows us to be composable with Jax transformations.
+        if util.is_tracing_ongoing(*args, **kwargs):
+            return self.__wrapped__(*args, **kwargs)
+
+        # TODO(phimuell): Handle static arguments correctly
+        #                   https://jax.readthedocs.io/en/latest/aot.html#lowering-with-static-arguments
+        return self.lower(*args, **kwargs).optimize().compile()(*args, **kwargs)
+
+    @abstractmethod
+    def lower(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> Lowered:
+        """Lower this function explicitly for the given arguments.
+
+        Performs the first two steps of the AOT steps described above,
+        i.e. stage the computation out to Jaxpr and then translate it to SDFG.
+        The result is encapsulated into a `Lowered` object.
+        """
+        ...
+
+    @property
+    @abstractmethod
+    def __wrapped__(self) -> Callable:
+        """Returns the wrapped function.
+
+        This is a Jace extension.
+        """
+        ...
+
+
+class Lowered(Stage):
+    """A lowered version of a Python function.
+
+    Essentially this object represents an _unoptimized_ SDFG.
+    In addition it contains all meta data that is necessary to compile and run it.
+
+    Notes:
+        Partial reimplementation of `jax._src.stages.Lowered`.
+    """
+
+    def compile(
+        self,
+        compiler_options: CompilerOptions | None = None,
+    ) -> Compiled:
+        """Returns a compiled version of the lowered SDFG.
+
+        The SDFG is compiled as-is, i.e. no transformation or optimizations are applied to it.
+        For optimization use the `self.optimize()` function to perform _in-place_ optimization.
+        """
+        raise NotImplementedError
+
+    def optimize(
+        self,
+        **kwargs: Any,  # noqa: ARG002  # unused arguments
+    ) -> Lowered:
+        """Perform optimization _inplace_ and return `self`."""
+        return self
+
+    def as_text(self, dialect: str | None = None) -> str:
+        """Textual representation of the SDFG.
+
+        By default, the function will return the Json representation of the SDFG.
+        However, by specifying `'html'` as `dialect` the function will call `view()` on the underlying SDFG.
+
+        Notes:
+            You should prefer `self.as_html()` instead of this function.
+        """
+        if (dialect is None) or (dialect.upper() == "JSON"):
+            return json.dumps(self.compiler_ir().sdfg.to_json())
+        if dialect.upper() == "HTML":
+            self.as_html()
+            return ""  # For the interface
+        raise ValueError(f"Unknown dialect '{dialect}'.")
+
+    def as_html(self, filename: str | None = None) -> None:
+        """Runs the `view()` method of the underlying SDFG function.
+
+        This is a Jace extension.
+        """
+        self.compiler_ir().sdfg.view(filename=filename, verbose=False)
+
+    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
+        """An arbitrary object representation of this lowering.
+
+        The class will return a `TranslatedJaxprSDFG` object.
+        Modifying the returned object is undefined behaviour.
+
+        Args:
+            dialect: Optional string specifying a lowering dialect (e.g. "SDFG")
+
+        Notes:
+            The Jax documentation points out this function is mainly for debugging.
+            The Jax version of this function might return `None`, however, in Jace
+                it will always succeed.
+        """
+        raise NotImplementedError()
+
+    def cost_analysis(self) -> Any | None:
+        """A summary of execution cost estimates.
+
+        Not implemented use the DaCe [instrumentation API](https://spcldace.readthedocs.io/en/latest/optimization/profiling.html) directly.
+        """
+        raise NotImplementedError()
+
+
+class Compiled(Stage):
+    """A compiled version of the computation.
+
+    It contains all necessary information to actually run the computation.
+    """
+
+    def __call__(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> Any:
+        """Executes the wrapped computation."""
+        raise NotImplementedError
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index d5ddd6f..2c99156 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -15,6 +15,7 @@
 from jax import core as jax_core
 
 from jace import util
+from jace.util import dace_helper as jdace
 
 
 @dataclass(init=True, repr=True, eq=False, frozen=False, kw_only=True, slots=True)
@@ -43,7 +44,7 @@ class TranslatedJaxprSDFG:
     terminal_state: dace.SDFGState | None = None
     inp_names: Sequence[str] | None = None
     out_names: Sequence[str] | None = None
-    csdfg: dace.CompiledSDFG | None = None
+    csdfg: jdace.CompiledSDFG | None = None
 
     def validate(self) -> bool:
         """Validate the underlying SDFG."""
diff --git a/src/jace/util/dace_helper.py b/src/jace/util/dace_helper.py
index 1c75a55..ee23ca7 100644
--- a/src/jace/util/dace_helper.py
+++ b/src/jace/util/dace_helper.py
@@ -12,3 +12,11 @@
 """
 
 from __future__ import annotations
+
+# The compiled SDFG is not aviable in the dace namespace or anywhere else
+#  Thus we import it here directly
+from dace.codegen.compiled_sdfg import CompiledSDFG as CompiledSDFG
+
+
+
+
diff --git a/src/jace/util/debug.py b/src/jace/util/debug.py
index 80b281d..463e99e 100644
--- a/src/jace/util/debug.py
+++ b/src/jace/util/debug.py
@@ -20,11 +20,12 @@
 import jax
 
 from jace import translator
+from jace.util import dace_helper as jdace
 
 
 def compile_jax_sdfg(
     jsdfg: translator.TranslatedJaxprSDFG, force: bool = False, save: bool = True
-) -> dace.CompiledSDFG:
+) -> jdace.CompiledSDFG:
     """This function compiles the embedded SDFG and return it.
 
     The SDFG is compiled in a very special way, i.e. all arguments and return values have to be passed as arguments.
@@ -51,7 +52,7 @@ def compile_jax_sdfg(
         raise NotImplementedError("No return statement is supported yet.")
 
     if (not force) and (jsdfg.csdfg is not None):
-        assert isinstance(jsdfg.csdfg, dace.CompiledSDFG)
+        assert isinstance(jsdfg.csdfg, jdace.CompiledSDFG)
         return jsdfg.csdfg
 
     # This is a simplification that makes our life simply.
@@ -63,14 +64,21 @@ def compile_jax_sdfg(
 
     # Canonical SDFGs do not have global memory, so we must transform it; undo afterwards
     prev_trans_state: dict[str, bool] = {}
-    for glob_name in jsdfg.inp_names + jsdfg.out_names:  # type: ignore[operator]  # concatenation
-        if glob_name in prev_trans_state:  # Donated arguments
-            continue
-        prev_trans_state[glob_name] = jsdfg.sdfg.arrays[glob_name].transient
-        jsdfg.sdfg.arrays[glob_name].transient = False
-
+    org_arg_names: Any = jsdfg.sdfg.arg_names
+    sdfg_arg_names: list[str] = []
     try:
-        csdfg: dace.CompiledSDFG = jsdfg.sdfg.compile()
+        for glob_name in jsdfg.inp_names + jsdfg.out_names:  # type: ignore[operator]  # concatenation
+            if glob_name in prev_trans_state:  # Donated arguments
+                continue
+            prev_trans_state[glob_name] = jsdfg.sdfg.arrays[glob_name].transient
+            jsdfg.sdfg.arrays[glob_name].transient = False
+            sdfg_arg_names.append(glob_name)
+
+        # This forces the signature of the SDFG to include all arguments in order they appear.
+        jsdfg.sdfg.arg_names = sdfg_arg_names
+
+        # Actual compiling the stuff
+        csdfg: jdace.CompiledSDFG = jsdfg.sdfg.compile()
         if save:
             jsdfg.csdfg = csdfg
         return csdfg
@@ -79,6 +87,7 @@ def compile_jax_sdfg(
         # Restore the initial transient state
         for var_name, trans_state in prev_trans_state.items():
             jsdfg.sdfg.arrays[var_name].transient = trans_state
+        jsdfg.sdfg.arg_names = org_arg_names
 
 
 @singledispatch
@@ -99,7 +108,7 @@ def run_jax_sdfg(
         raise ValueError("Output names are not specified.")
 
     if jsdfg.csdfg is not None:
-        csdfg: dace.CompiledSDFG = jsdfg.csdfg
+        csdfg: jdace.CompiledSDFG = jsdfg.csdfg
     else:
         csdfg = compile_jax_sdfg(jsdfg, save=False)
     return run_jax_sdfg(
@@ -111,9 +120,9 @@ def run_jax_sdfg(
     )
 
 
-@run_jax_sdfg.register(dace.CompiledSDFG)
+@run_jax_sdfg.register(jdace.CompiledSDFG)
 def _(
-    csdfg: dace.CompiledSDFG,
+    csdfg: jdace.CompiledSDFG,
     inp_names: Sequence[str],
     out_names: Sequence[str],
     /,
@@ -156,6 +165,7 @@ def _(
         raise ValueError(
             "Failed to construct the call arguments,"
             f" expected {len(csdfg.argnames)} but got {len(call_args)}."
+            f"\nExpected: {csdfg.argnames}\nGot: {list(call_args.keys())}"
         )
 
     # Calling the SDFG
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 8d3eecc..24cd945 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -34,8 +34,8 @@ def is_jaceified(obj: Any) -> bool:
     if util.is_jaxified(obj):
         return False
     # Currently it is quite simple because we can just check if `obj`
-    #  is derived from `jace.jax.JitWrapped`, might become harder in the future.
-    return isinstance(obj, jjax.JitWrapped)
+    #  is derived from `jace.jax.JaceWrapped`, might become harder in the future.
+    return isinstance(obj, jjax.JaceWrapped)
 
 
 def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> bool:

From f52c14def38d83e3503b98e7d15b5fa72330b7f3 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 6 May 2024 15:13:49 +0200
Subject: [PATCH 105/458] Fixed the driver.

The description of the canonical SDFG is clearly stating that the `arg_names` parameter is not set on the SDFG.
However, for some (probaly copy past) reason this was still set.
---
 src/jace/translator/jaxpr_translator_driver.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 5b01fd2..dfd6695 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -735,7 +735,8 @@ def _create_initial_input(
             force_array=inp_scalar_as_array,
             force_jax_name=self.is_root_translator(),  # Ensure root get pure Jax names.
         )
-        sdfg.arg_names.extend(init_in_var_names)
+        # This forces the code to only accept kwargs
+        sdfg.arg_names = []
 
         # Store the list of inputs in self; this is done to simplify exporting.
         #  The output list is populated by `self._translate_jaxpr_internal()`

From 583311f8133712447ae41ee4f27bf2b5a8e14860 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 6 May 2024 15:38:47 +0200
Subject: [PATCH 106/458] Added a tests for the stage compilation.

---
 tests/test_decorator.py | 57 +++++++++++++++++++++++++++++++++++++++++
 1 file changed, 57 insertions(+)
 create mode 100644 tests/test_decorator.py

diff --git a/tests/test_decorator.py b/tests/test_decorator.py
new file mode 100644
index 0000000..2ef6c2d
--- /dev/null
+++ b/tests/test_decorator.py
@@ -0,0 +1,57 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements tests for the jit decorator.
+
+Also see the `test_jax_api.py` test file, that tests composability.
+."""
+
+from __future__ import annotations
+
+import jax
+import numpy as np
+
+import jace
+
+
+def test_decorator_individually():
+    """Tests the compilation steps individually."""
+    jax.config.update("jax_enable_x64", True)
+
+    def testee_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A + B
+
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    testee = jace.jit(testee_)
+    lowered = testee.lower(A, B)
+    optimized = lowered.optimize()
+    compiled = optimized.compile()
+
+    ref = testee_(A, B)
+    res = compiled(A, B)
+
+    assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
+
+
+def test_decorator_one_go():
+    """Tests the compilation steps in one go."""
+    jax.config.update("jax_enable_x64", True)
+
+    def testee_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A + B
+
+    testee = jace.jit(testee_)
+
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    ref = testee_(A, B)
+    res = testee(A, B)
+
+    assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."

From 11eb76cdc453af869101331416ee2c707331096c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 6 May 2024 16:00:24 +0200
Subject: [PATCH 107/458] PEP8 compatibility.

---
 src/jace/jax/{jace_jitted.py => jace_wrapped.py} | 0
 src/jace/jax/stages.py                           | 8 ++++++--
 2 files changed, 6 insertions(+), 2 deletions(-)
 rename src/jace/jax/{jace_jitted.py => jace_wrapped.py} (100%)

diff --git a/src/jace/jax/jace_jitted.py b/src/jace/jax/jace_wrapped.py
similarity index 100%
rename from src/jace/jax/jace_jitted.py
rename to src/jace/jax/jace_wrapped.py
diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
index d323327..6cfb128 100644
--- a/src/jace/jax/stages.py
+++ b/src/jace/jax/stages.py
@@ -36,7 +36,7 @@
 
 
 class Stage(jax_stages.Stage):
-    """A distinct step in the compilation chain, see module description.
+    """A distinct step in the compilation chain, see module description for more.
 
     This class inherent from its Jax counterpart.
     """
@@ -45,7 +45,7 @@ class Stage(jax_stages.Stage):
 class Wrapped(Protocol):
     """A function ready to be specialized, lowered, and compiled.
 
-    This protocol reflects the output of functions such as `jax.jit`.
+    This protocol reflects the output of functions such as `jace.jit`.
     Calling it results in jit (just-in-time) lowering, compilation, and execution.
     It can also be explicitly lowered prior to compilation, and the result compiled prior to execution.
 
@@ -79,6 +79,10 @@ def lower(
         Performs the first two steps of the AOT steps described above,
         i.e. stage the computation out to Jaxpr and then translate it to SDFG.
         The result is encapsulated into a `Lowered` object.
+
+        Note:
+            As a Jace extension this this function might be change such that it just performs
+                the staging out of the Jaxpr, i.e. lowering to SDFG might become a separate step.
         """
         ...
 

From 7f799e77df2b32ad8e350cf4b245cf6b9142fcfb Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 7 May 2024 09:58:41 +0200
Subject: [PATCH 108/458] Also made `jaxlib` a known third party library.

---
 pyproject.toml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/pyproject.toml b/pyproject.toml
index 4d551f1..e4786e2 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -129,6 +129,7 @@ known-third-party = [
   'cupy',
   'dace',
   'jax',
+  'jaxlib',
   'numpy',
   'pytest',
   'typing_extensions'

From f9cae92b5d92783c4ba3a13b73fc20f6ea0f30a9 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 7 May 2024 10:00:35 +0200
Subject: [PATCH 109/458] Updated the traits header.

It now makes use of the `TypeGuard`.
---
 src/jace/util/traits.py | 29 +++++++++++++++--------------
 1 file changed, 15 insertions(+), 14 deletions(-)

diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 24cd945..58881fa 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -12,9 +12,10 @@
 from collections.abc import Iterable
 from typing import Any, TypeGuard
 
-from jax import core as jax_core
+from jax import _src as jax_src, core as jax_core
+from jaxlib import xla_extension as jax_xe
 
-from jace import util
+from jace import jax as jjax, util
 
 
 class NonStringIterable(Iterable): ...
@@ -24,13 +25,11 @@ def is_non_string_iterable(val: Any) -> TypeGuard[NonStringIterable]:
     return isinstance(val, Iterable) and not isinstance(val, str)
 
 
-def is_jaceified(obj: Any) -> bool:
+def is_jaceified(obj: Any) -> TypeGuard[jjax.JaceWrapped]:
     """Tests if `obj` is decorated by JaCe.
 
     Similar to `jace.util.is_jaxified`, but for JaCe object.
     """
-    from jace import jax as jjax
-
     if util.is_jaxified(obj):
         return False
     # Currently it is quite simple because we can just check if `obj`
@@ -38,31 +37,33 @@ def is_jaceified(obj: Any) -> bool:
     return isinstance(obj, jjax.JaceWrapped)
 
 
-def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> bool:
-    """Tests if `jax_var` is a drop variable."""
+def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.Dorp]:
+    """Tests if `jax_var` is a drop variable, i.e. a variable that is not read from in a Jaxpr."""
 
     if isinstance(jax_var, jax_core.DropVar):
         return True
     if isinstance(jax_var, util.JaCeVar):
+        # We type narrow it to a pure jax DropVar, because essentially
+        #  you can not do anything with it.
         return jax_var.name == "_"
     return False
 
 
-def is_jaxified(obj: Any) -> bool:
+def is_jaxified(
+    obj: Any,
+) -> TypeGuard[jax_core.Primitive | jax_src.pjit.JitWrapped | jax_xe.PjitFunction]:
     """Tests if `obj` is a "jaxified" object.
 
-    A "jexified" object is an object that was processed by Jax.
-    While a return value of `True` guarantees a jaxified object,
-    `False` might not proof the contrary.
+    A "jaxified" object is an object that was processed by Jax.
+    While a return value of `True` guarantees a jaxified object, `False` might not proof the contrary.
+    See also `jace.util.is_jaceified()` to tests if something is a Jace object.
     """
-    import jaxlib
-    from jax import _src as jax_src
 
     # These are all types we consider as jaxify
     jaxifyed_types = (
         jax_core.Primitive,
         # jstage.Wrapped is not runtime chakable
         jax_src.pjit.JitWrapped,
-        jaxlib.xla_extension.PjitFunction,
+        jax_xe.PjitFunction,
     )
     return isinstance(obj, jaxifyed_types)

From 9445c7f0b755e4f25ccc8152c37ebe17b3a9e098 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 7 May 2024 11:23:23 +0200
Subject: [PATCH 110/458] Fixed the dace helper module.

---
 src/jace/util/dace_helper.py | 6 +-----
 1 file changed, 1 insertion(+), 5 deletions(-)

diff --git a/src/jace/util/dace_helper.py b/src/jace/util/dace_helper.py
index ee23ca7..a380272 100644
--- a/src/jace/util/dace_helper.py
+++ b/src/jace/util/dace_helper.py
@@ -13,10 +13,6 @@
 
 from __future__ import annotations
 
-# The compiled SDFG is not aviable in the dace namespace or anywhere else
+# The compiled SDFG is not available in the dace namespace or anywhere else
 #  Thus we import it here directly
 from dace.codegen.compiled_sdfg import CompiledSDFG as CompiledSDFG
-
-
-
-

From 13686497d882aedb178894708aad1bf31db96100 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 7 May 2024 11:37:37 +0200
Subject: [PATCH 111/458] Updated `jace.jax.stages`.

It is now a package, which allows better organization.
Furthermore, the interfaces where removed, since they where pretty much useless.
---
 src/jace/jax/__init__.py                   |  11 +-
 src/jace/jax/jace_wrapped.py               |  69 --------
 src/jace/jax/stages.py                     | 186 ---------------------
 src/jace/jax/stages/__init__.py            |  41 +++++
 src/jace/jax/{ => stages}/jace_compiled.py |   6 +-
 src/jace/jax/{ => stages}/jace_lowered.py  |  62 +++++--
 src/jace/jax/stages/jace_wrapped.py        |  96 +++++++++++
 src/jace/jax/stages/stage.py               |  22 +++
 8 files changed, 212 insertions(+), 281 deletions(-)
 delete mode 100644 src/jace/jax/jace_wrapped.py
 delete mode 100644 src/jace/jax/stages.py
 create mode 100644 src/jace/jax/stages/__init__.py
 rename src/jace/jax/{ => stages}/jace_compiled.py (90%)
 rename src/jace/jax/{ => stages}/jace_lowered.py (53%)
 create mode 100644 src/jace/jax/stages/jace_wrapped.py
 create mode 100644 src/jace/jax/stages/stage.py

diff --git a/src/jace/jax/__init__.py b/src/jace/jax/__init__.py
index ea2c0ff..fe908a2 100644
--- a/src/jace/jax/__init__.py
+++ b/src/jace/jax/__init__.py
@@ -10,14 +10,11 @@
 from __future__ import annotations
 
 from .api import grad, jacfwd, jacrev, jit
-from .jace_compiled import JaceCompiled
-from .jace_jitted import JaceWrapped
-from .jace_lowered import JaceLowered
-from .stages import (  # type: ignore[attr-defined] # not explicit exported
-    Compiled,
+from .stages import (
     CompilerOptions,
-    Lowered,
-    Wrapped,
+    JaceCompiled,
+    JaceLowered,
+    JaceWrapped,
 )
 
 
diff --git a/src/jace/jax/jace_wrapped.py b/src/jace/jax/jace_wrapped.py
deleted file mode 100644
index d8f5bce..0000000
--- a/src/jace/jax/jace_wrapped.py
+++ /dev/null
@@ -1,69 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Implementation of the `jace.jax.stages.Wrapped` protocol."""
-
-from __future__ import annotations
-
-from collections.abc import Callable
-from typing import Any
-
-from jace import jax as jjax, translator
-from jace.jax import stages
-
-
-class JaceWrapped(stages.Wrapped):
-    """Result class of all jited functions in Jace.
-
-    It is essentially a wrapper around an already jited, i.e. passed to a Jax primitive function.
-    The function is then able to compile it if needed.
-    However, the wrapped object is itself again tracable, thus it does not break anything.
-
-    Todo:
-        Handles pytrees.
-        Configuration of the driver?
-        Copy the `jax._src.pjit.make_jit()` functionality to remove `jax.make_jaxpr()`.
-    """
-
-    __slots__ = ("fun_",)
-
-    _fun: Callable
-
-    def __init__(
-        self,
-        fun: Callable,
-    ) -> None:
-        """Creates a wrapped jace jitable object of `jax_prim`."""
-        assert fun is not None
-        self._fun: Callable = fun
-
-    def lower(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> jjax.Lowered:
-        """Lower this function explicitly for the given arguments.
-
-        Performs the first two steps of the AOT steps described above,
-        i.e. transformation into Jaxpr and then to SDFG.
-        The result is encapsulated into a `Lowered` object.
-        """
-        import jax as jax_jax
-
-        if len(kwargs) != 0:
-            raise NotImplementedError("Currently only positional arguments are supported.")
-        # TODO(phimuell): Handle pytrees.
-        real_args: tuple[Any, ...] = args
-        jaxpr = jax_jax.make_jaxpr(self._fun)(*real_args)
-        driver = translator.JaxprTranslationDriver()
-        translated_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
-        return jjax.JaceLowered(translated_sdfg)
-
-    @property
-    def __wrapped__(self) -> Any:
-        """Returns the wrapped object."""
-        return self._fun
diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
deleted file mode 100644
index 6cfb128..0000000
--- a/src/jace/jax/stages.py
+++ /dev/null
@@ -1,186 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Reimplementation of the `jax.stages` module.
-
-The module either imports or reimplements Jax classes.
-In case classes/functions are reimplemented they might be slightly different to fit their usage within Jace.
-
-As in Jax Jace has different stages, the terminology is taken from [Jax' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
-- Stage out:
-    In this phase we translate an executable python function into Jaxpr.
-- Lower:
-    This will transform the Jaxpr into an SDFG equivalent.
-    As a implementation note, currently this and the previous step are handled as a single step.
-- Compile:
-    This will turn the SDFG into an executable object, see `dace.codegen.CompiledSDFG`.
-- Execution:
-    This is the actual running of the computation.
-"""
-
-from __future__ import annotations
-
-import json
-from abc import abstractmethod
-from collections.abc import Callable
-from typing import Any, Protocol
-
-from jax._src import stages as jax_stages
-from jax.stages import CompilerOptions
-
-from jace import translator, util
-
-
-class Stage(jax_stages.Stage):
-    """A distinct step in the compilation chain, see module description for more.
-
-    This class inherent from its Jax counterpart.
-    """
-
-
-class Wrapped(Protocol):
-    """A function ready to be specialized, lowered, and compiled.
-
-    This protocol reflects the output of functions such as `jace.jit`.
-    Calling it results in jit (just-in-time) lowering, compilation, and execution.
-    It can also be explicitly lowered prior to compilation, and the result compiled prior to execution.
-
-    Notes:
-        Reimplementation of `jax.stages.Wrapped` protocol.
-    """
-
-    def __call__(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> Any:
-        """Executes the wrapped function, lowering and compiling as needed in one step."""
-
-        # This allows us to be composable with Jax transformations.
-        if util.is_tracing_ongoing(*args, **kwargs):
-            return self.__wrapped__(*args, **kwargs)
-
-        # TODO(phimuell): Handle static arguments correctly
-        #                   https://jax.readthedocs.io/en/latest/aot.html#lowering-with-static-arguments
-        return self.lower(*args, **kwargs).optimize().compile()(*args, **kwargs)
-
-    @abstractmethod
-    def lower(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> Lowered:
-        """Lower this function explicitly for the given arguments.
-
-        Performs the first two steps of the AOT steps described above,
-        i.e. stage the computation out to Jaxpr and then translate it to SDFG.
-        The result is encapsulated into a `Lowered` object.
-
-        Note:
-            As a Jace extension this this function might be change such that it just performs
-                the staging out of the Jaxpr, i.e. lowering to SDFG might become a separate step.
-        """
-        ...
-
-    @property
-    @abstractmethod
-    def __wrapped__(self) -> Callable:
-        """Returns the wrapped function.
-
-        This is a Jace extension.
-        """
-        ...
-
-
-class Lowered(Stage):
-    """A lowered version of a Python function.
-
-    Essentially this object represents an _unoptimized_ SDFG.
-    In addition it contains all meta data that is necessary to compile and run it.
-
-    Notes:
-        Partial reimplementation of `jax._src.stages.Lowered`.
-    """
-
-    def compile(
-        self,
-        compiler_options: CompilerOptions | None = None,
-    ) -> Compiled:
-        """Returns a compiled version of the lowered SDFG.
-
-        The SDFG is compiled as-is, i.e. no transformation or optimizations are applied to it.
-        For optimization use the `self.optimize()` function to perform _in-place_ optimization.
-        """
-        raise NotImplementedError
-
-    def optimize(
-        self,
-        **kwargs: Any,  # noqa: ARG002  # unused arguments
-    ) -> Lowered:
-        """Perform optimization _inplace_ and return `self`."""
-        return self
-
-    def as_text(self, dialect: str | None = None) -> str:
-        """Textual representation of the SDFG.
-
-        By default, the function will return the Json representation of the SDFG.
-        However, by specifying `'html'` as `dialect` the function will call `view()` on the underlying SDFG.
-
-        Notes:
-            You should prefer `self.as_html()` instead of this function.
-        """
-        if (dialect is None) or (dialect.upper() == "JSON"):
-            return json.dumps(self.compiler_ir().sdfg.to_json())
-        if dialect.upper() == "HTML":
-            self.as_html()
-            return ""  # For the interface
-        raise ValueError(f"Unknown dialect '{dialect}'.")
-
-    def as_html(self, filename: str | None = None) -> None:
-        """Runs the `view()` method of the underlying SDFG function.
-
-        This is a Jace extension.
-        """
-        self.compiler_ir().sdfg.view(filename=filename, verbose=False)
-
-    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
-        """An arbitrary object representation of this lowering.
-
-        The class will return a `TranslatedJaxprSDFG` object.
-        Modifying the returned object is undefined behaviour.
-
-        Args:
-            dialect: Optional string specifying a lowering dialect (e.g. "SDFG")
-
-        Notes:
-            The Jax documentation points out this function is mainly for debugging.
-            The Jax version of this function might return `None`, however, in Jace
-                it will always succeed.
-        """
-        raise NotImplementedError()
-
-    def cost_analysis(self) -> Any | None:
-        """A summary of execution cost estimates.
-
-        Not implemented use the DaCe [instrumentation API](https://spcldace.readthedocs.io/en/latest/optimization/profiling.html) directly.
-        """
-        raise NotImplementedError()
-
-
-class Compiled(Stage):
-    """A compiled version of the computation.
-
-    It contains all necessary information to actually run the computation.
-    """
-
-    def __call__(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> Any:
-        """Executes the wrapped computation."""
-        raise NotImplementedError
diff --git a/src/jace/jax/stages/__init__.py b/src/jace/jax/stages/__init__.py
new file mode 100644
index 0000000..cf597f7
--- /dev/null
+++ b/src/jace/jax/stages/__init__.py
@@ -0,0 +1,41 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Reimplementation of the `jax.stages` module.
+
+The module either imports or reimplements Jax classes.
+In case classes/functions are reimplemented they might be slightly different to fit their usage within Jace.
+
+As in Jax Jace has different stages, the terminology is taken from [Jax' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
+- Stage out:
+    In this phase we translate an executable python function into Jaxpr.
+- Lower:
+    This will transform the Jaxpr into an SDFG equivalent.
+    As a implementation note, currently this and the previous step are handled as a single step.
+- Compile:
+    This will turn the SDFG into an executable object, see `dace.codegen.CompiledSDFG`.
+- Execution:
+    This is the actual running of the computation.
+"""
+
+from __future__ import annotations
+
+from jax.stages import CompilerOptions
+
+from .jace_compiled import JaceCompiled
+from .jace_lowered import JaceLowered
+from .jace_wrapped import JaceWrapped
+from .stage import Stage
+
+
+__all__ = [
+    "Stage",
+    "CompilerOptions",
+    "JaceWrapped",
+    "JaceLowered",
+    "JaceCompiled",
+]
diff --git a/src/jace/jax/jace_compiled.py b/src/jace/jax/stages/jace_compiled.py
similarity index 90%
rename from src/jace/jax/jace_compiled.py
rename to src/jace/jax/stages/jace_compiled.py
index 4d64db9..5d4e888 100644
--- a/src/jace/jax/jace_compiled.py
+++ b/src/jace/jax/stages/jace_compiled.py
@@ -17,9 +17,11 @@
 from jace.util import dace_helper as jdace
 
 
-class JaceCompiled(stages.Compiled):
+class JaceCompiled(stages.Stage):
     """Compiled version of the SDFG.
 
+    Contains all the information to run the associated computation.
+
     Todo:
         Handle pytrees.
     """
@@ -40,7 +42,7 @@ def __init__(
         inp_names: Sequence[str],
         out_names: Sequence[str],
     ) -> None:
-        if (len(inp_names) == 0) or (len(out_names) == 0):
+        if (not inp_names) or (not out_names):
             raise ValueError("Input and output can not be empty.")
         self._csdfg = csdfg
         self._inp_names = tuple(inp_names)
diff --git a/src/jace/jax/jace_lowered.py b/src/jace/jax/stages/jace_lowered.py
similarity index 53%
rename from src/jace/jax/jace_lowered.py
rename to src/jace/jax/stages/jace_lowered.py
index 3a27e8e..e3475be 100644
--- a/src/jace/jax/jace_lowered.py
+++ b/src/jace/jax/stages/jace_lowered.py
@@ -9,16 +9,15 @@
 
 from __future__ import annotations
 
+import json
 from typing import Any
 
-from typing_extensions import override
-
-from jace import jax as jjax, translator, util
+from jace import translator, util
 from jace.jax import stages
 from jace.util import dace_helper as jdace
 
 
-class JaceLowered(stages.Lowered):
+class JaceLowered(stages.Stage):
     """Represents the original computation that was lowered to SDFG."""
 
     __slots__ = ("_translated_sdfg",)
@@ -36,27 +35,21 @@ def __init__(
             raise ValueError("Output names must be defined.")
         self._translated_sdfg = translated_sdfg
 
-    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
-        if (dialect is None) or (dialect.upper() == "SDFG"):
-            return self._translated_sdfg
-        raise ValueError(f"Unknown dialect '{dialect}'.")
-
-    @override
     def optimize(
         self,
-        **kwargs: Any,
-    ) -> jjax.JaceLowered:
+        **kwargs: Any,  # noqa: ARG002  # Unused agument
+    ) -> JaceLowered:
         """Perform optimization _inplace_ and return `self`.
 
-        Currently no optimization is done, thus `self` is returned unmodified.
+        Notes:
+            Currently no optimization is performed.
         """
         return self
 
-    @override
     def compile(
         self,
-        compiler_options: jjax.CompilerOptions | None = None,
-    ) -> jjax.JaceCompiled:
+        compiler_options: stages.CompilerOptions | None = None,  # noqa: ARG002  # Unused arguments
+    ) -> stages.JaceCompiled:
         """Compile the SDFG.
 
         Returns an Object that encapsulates a
@@ -66,8 +59,43 @@ def compile(
             force=True,
             save=False,
         )
-        return jjax.JaceCompiled(
+        return stages.JaceCompiled(
             csdfg=csdfg,
             inp_names=self._translated_sdfg.inp_names,  # type: ignore[arg-type]  # init guarantees this
             out_names=self._translated_sdfg.out_names,  # type: ignore[arg-type]
         )
+
+    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
+        if (dialect is None) or (dialect.upper() == "SDFG"):
+            return self._translated_sdfg
+        raise ValueError(f"Unknown dialect '{dialect}'.")
+
+    def as_html(self, filename: str | None = None) -> None:
+        """Runs the `view()` method of the underlying SDFG.
+
+        This is a Jace extension.
+        """
+        self.compiler_ir().sdfg.view(filename=filename, verbose=False)
+
+    def as_text(self, dialect: str | None = None) -> str:
+        """Textual representation of the SDFG.
+
+        By default, the function will return the Json representation of the SDFG.
+        However, by specifying `'html'` as `dialect` the function will call `view()` on the underlying SDFG.
+
+        Notes:
+            You should prefer `self.as_html()` instead of this function.
+        """
+        if (dialect is None) or (dialect.upper() == "JSON"):
+            return json.dumps(self.compiler_ir().sdfg.to_json())
+        if dialect.upper() == "HTML":
+            self.as_html()
+            return ""  # For the interface
+        raise ValueError(f"Unknown dialect '{dialect}'.")
+
+    def cost_analysis(self) -> Any | None:
+        """A summary of execution cost estimates.
+
+        Not implemented use the DaCe [instrumentation API](https://spcldace.readthedocs.io/en/latest/optimization/profiling.html) directly.
+        """
+        raise NotImplementedError()
diff --git a/src/jace/jax/stages/jace_wrapped.py b/src/jace/jax/stages/jace_wrapped.py
new file mode 100644
index 0000000..28aa58c
--- /dev/null
+++ b/src/jace/jax/stages/jace_wrapped.py
@@ -0,0 +1,96 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implementation of the `jace.jax.stages.Wrapped` protocol."""
+
+from __future__ import annotations
+
+from collections.abc import Callable
+from typing import Any
+
+import jax as jax_jax
+
+from jace import translator, util
+from jace.jax import stages
+
+
+class JaceWrapped(stages.Stage):
+    """A function ready to be specialized, lowered, and compiled.
+
+    This class represents the output of functions such as `jace.jit()`.
+    Calling it results in jit (just-in-time) lowering, compilation, and execution.
+    It can also be explicitly lowered prior to compilation, and the result compiled prior to execution.
+
+    Notes:
+        Reimplementation of `jax.stages.Wrapped` protocol.
+        Function wrapped by this class are again tracable by Jax.
+
+    Todo:
+        Handles pytrees.
+        Configuration of the driver?
+        Copy the `jax._src.pjit.make_jit()` functionality to remove `jax.make_jaxpr()`.
+    """
+
+    __slots__ = ("fun_",)
+
+    _fun: Callable
+
+    def __init__(
+        self,
+        fun: Callable,
+    ) -> None:
+        """Creates a wrapped jace jitable object of `jax_prim`."""
+        assert fun is not None
+        self._fun: Callable = fun
+
+    def __call__(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> Any:
+        """Executes the wrapped function, lowering and compiling as needed in one step."""
+
+        # This allows us to be composable with Jax transformations.
+        if util.is_tracing_ongoing(*args, **kwargs):
+            return self.__wrapped__(*args, **kwargs)
+        # TODO(phimuell): Handle the case of gradients:
+        #                   It seems that this one uses special tracers, since they can handle comparisons.
+        #                   https://jax.readthedocs.io/en/latest/notebooks/Common_Gotchas_in_JAX.html#python-control-flow-autodiff
+
+        # TODO(phimuell): Handle static arguments correctly
+        #                   https://jax.readthedocs.io/en/latest/aot.html#lowering-with-static-arguments
+        return self.lower(*args, **kwargs).optimize().compile()(*args, **kwargs)
+
+    def lower(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> stages.JaceLowered:
+        """Lower this function explicitly for the given arguments.
+
+        Performs the first two steps of the AOT steps described above,
+        i.e. transformation into Jaxpr and then to SDFG.
+        The result is encapsulated into a `Lowered` object.
+        """
+        if len(kwargs) != 0:
+            raise NotImplementedError("Currently only positional arguments are supported.")
+
+        # TODO(phimuell): Handle pytrees.
+        real_args: tuple[Any, ...] = args
+
+        jaxpr = jax_jax.make_jaxpr(self._fun)(*real_args)
+        driver = translator.JaxprTranslationDriver()
+        translated_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
+        return stages.JaceLowered(translated_sdfg)
+
+    @property
+    def __wrapped__(self) -> Callable:
+        """Returns the wrapped function.
+
+        This is a Jace extension.
+        """
+        return self._fun
diff --git a/src/jace/jax/stages/stage.py b/src/jace/jax/stages/stage.py
new file mode 100644
index 0000000..0608c0a
--- /dev/null
+++ b/src/jace/jax/stages/stage.py
@@ -0,0 +1,22 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+
+from __future__ import annotations
+
+from jax._src import stages as jax_stages
+
+
+class Stage(jax_stages.Stage):
+    """A distinct step in the compilation chain, see module description for more.
+
+    This class inherent from its Jax counterpart.
+    The concrete steps are implemented in:
+    - JaceWrapped
+    - JaceLowered
+    - JaceCompiled
+    """

From e71c234fc3c188779e9802bbd17bdffd4ac21651 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 7 May 2024 12:06:52 +0200
Subject: [PATCH 112/458] Fixed a problem caused by ruff.

---
 src/jace/jax/stages/__init__.py              | 2 +-
 src/jace/jax/stages/{stage.py => a_stage.py} | 5 +++++
 2 files changed, 6 insertions(+), 1 deletion(-)
 rename src/jace/jax/stages/{stage.py => a_stage.py} (68%)

diff --git a/src/jace/jax/stages/__init__.py b/src/jace/jax/stages/__init__.py
index cf597f7..49f13bd 100644
--- a/src/jace/jax/stages/__init__.py
+++ b/src/jace/jax/stages/__init__.py
@@ -26,10 +26,10 @@
 
 from jax.stages import CompilerOptions
 
+from .a_stage import Stage
 from .jace_compiled import JaceCompiled
 from .jace_lowered import JaceLowered
 from .jace_wrapped import JaceWrapped
-from .stage import Stage
 
 
 __all__ = [
diff --git a/src/jace/jax/stages/stage.py b/src/jace/jax/stages/a_stage.py
similarity index 68%
rename from src/jace/jax/stages/stage.py
rename to src/jace/jax/stages/a_stage.py
index 0608c0a..80c3c9f 100644
--- a/src/jace/jax/stages/stage.py
+++ b/src/jace/jax/stages/a_stage.py
@@ -4,7 +4,12 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
+"""Interface of the Stages.
 
+In `jace.jax.stages.__init__.py` this file must be imported first.
+However, isort/ruff fail to do that and can not be convinced otherwise. 
+For that reason this file was renamed to ensure that it comes at first.
+"""
 
 from __future__ import annotations
 

From 3b56a0b776e5b43a6c7b1f6ae472add9b30d49e8 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 7 May 2024 13:04:08 +0200
Subject: [PATCH 113/458] Updated the api.

The function now blocks a lot more of the functionality that is not yet supported.
---
 src/jace/jax/api.py | 51 ++++++++++++++++++++++++++++-----------------
 1 file changed, 32 insertions(+), 19 deletions(-)

diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
index cdb154e..3b173b0 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/jax/api.py
@@ -10,7 +10,7 @@
 from __future__ import annotations
 
 from collections.abc import Callable
-from typing import Any, cast
+from typing import Any
 
 from jace import jax as jjax, util
 
@@ -22,29 +22,38 @@ def jit(
 ) -> jjax.JaceWrapped:
     """Creates a jit wrapper instance."""
     import jax
+    from jax._src import sharding_impls
 
+    if any(kwargs.get(arg, None) is not None for arg in ["static_argnums", "static_argnames"]):
+        raise NotImplementedError("Static arguments are not yet supported.")
+    if any(kwargs.get(arg, None) is not None for arg in ["donate_argnums", "donate_argnames"]):
+        # Donated arguments are not yet (fully) supported, since they are more like a "hint"
+        #  to jax we will silently ignore them.
+        kwargs["donate_argnums"] = None
+        kwargs["donate_argnames"] = None
     if any(
-        kwargs.get(static, None) is not None for static in ["static_argnums", "static_argnames"]
+        kwargs.get(x, sharding_impls.UNSPECIFIED) is not sharding_impls.UNSPECIFIED
+        for x in ["in_shardings", "out_shardings"]
     ):
-        raise NotImplementedError("Static arguments are not yet supported.")
+        raise NotImplementedError("Sharding is not yet supported.")
+    if kwargs.get("device", None) is not None:
+        raise NotImplementedError("Selecting of device is not yet supported.")
+    if kwargs.get("backend", None) is not None:
+        raise NotImplementedError("Selecting of backend is not yet supported.")
 
+    # fmt: off
     if fun is None:
         assert len(kwargs) > 0
-
         def wrapper(f: Callable) -> jjax.JaceWrapped:
             return jit(f, **kwargs)
-
         return wrapper  # type: ignore[return-value]
+    # fmt: on
 
-    # in case we are dealing with a JaCe object, we first unwrap it.
-    #  Recursion to handle arbitrary deep nestings.
     if util.is_jaceified(fun):
-        fun = cast(jjax.JaceWrapped, fun)
-        return jit(fun.__wrapped__)
-
-    # Prevents the creation of a level of unnecessary jit.
-    #  Probably better solution by using the `disable_jit()`?
+        return jit(fun.__wrapped__, **kwargs)
     if len(kwargs) == 0:
+        # Prevents the creation of a level of unnecessary jit.
+        #  TODO(philmuell): Find a better way, probably better hijacking or `inline`.
         return jjax.JaceWrapped(fun)
     return jjax.JaceWrapped(jax.jit(fun, **kwargs))
 
@@ -54,15 +63,19 @@ def grad(
     /,
     **kwargs: Any,
 ) -> jjax.JaceWrapped:
-    """The gradient transformation."""
+    """The gradient transformation.
+
+    Todo:
+        Handle controlflow properly (https://jax.readthedocs.io/en/latest/notebooks/Common_Gotchas_in_JAX.html#python-control-flow-autodiff)
+    """
     import jax
 
+    # fmt: off
     if fun is None:
-
         def wrapper(f: Callable) -> jjax.JaceWrapped:
             return grad(f, **kwargs)
-
         return wrapper  # type: ignore[return-value]
+    # fmt: on
 
     return jjax.JaceWrapped(jax.grad(fun, **kwargs))
 
@@ -75,12 +88,12 @@ def jacfwd(
     """Returns the Jacobian of `fun` in forward differentiation mode."""
     import jax
 
+    # fmt: off
     if fun is None:
-
         def wrapper(f: Callable) -> jjax.JaceWrapped:
             return jacfwd(f, **kwargs)
-
         return wrapper  # type: ignore[return-value]
+    # fmt: on
 
     return jjax.JaceWrapped(jax.jacfwd(fun, **kwargs))
 
@@ -93,11 +106,11 @@ def jacrev(
     """Returns the Jacobian of `fun` in reverse differentiation mode."""
     import jax
 
+    # fmt: off
     if fun is None:
-
         def wrapper(f: Callable) -> jjax.JaceWrapped:
             return jacrev(f, **kwargs)
-
         return wrapper  # type: ignore[return-value]
+    # fmt: on
 
     return jjax.JaceWrapped(jax.jacrev(fun, **kwargs))

From 4402ae68dc67dc207c41ebd7a14fca49654b6f40 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 7 May 2024 15:15:36 +0200
Subject: [PATCH 114/458] Updated the api interface.

It is now cleaner.
---
 src/jace/jax/__init__.py   |   2 +
 src/jace/jax/api.py        | 104 +++++++++++++++++++++++--------------
 src/jace/jax/api_helper.py |  37 +++++++++++++
 tests/test_decorator.py    |   5 ++
 4 files changed, 110 insertions(+), 38 deletions(-)
 create mode 100644 src/jace/jax/api_helper.py

diff --git a/src/jace/jax/__init__.py b/src/jace/jax/__init__.py
index fe908a2..46ec45a 100644
--- a/src/jace/jax/__init__.py
+++ b/src/jace/jax/__init__.py
@@ -9,6 +9,7 @@
 
 from __future__ import annotations
 
+from . import api_helper
 from .api import grad, jacfwd, jacrev, jit
 from .stages import (
     CompilerOptions,
@@ -26,6 +27,7 @@
     "JaceCompiled",
     "Lowered",
     "Wrapped",
+    "api_helper",
     "jit",
     "jacfwd",
     "jacrev",
diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
index 3b173b0..dd3973e 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/jax/api.py
@@ -12,15 +12,26 @@
 from collections.abc import Callable
 from typing import Any
 
+import jax as _jax_jax
+
 from jace import jax as jjax, util
+from jace.jax import api_helper
 
 
+@api_helper.jax_wrapper(_jax_jax.jit)
 def jit(
     fun: Callable | None = None,
     /,
     **kwargs: Any,
 ) -> jjax.JaceWrapped:
-    """Creates a jit wrapper instance."""
+    """Jace wrapper for `jax.jit`.
+
+    Wraps the computation `fun` into a wrapped instance, that can either be traced or compiled.
+    For more information see `jace.jax.stages`.
+
+    Notes:
+        The function can either be used as decorator or as a command.
+    """
     import jax
     from jax._src import sharding_impls
 
@@ -58,59 +69,76 @@ def wrapper(f: Callable) -> jjax.JaceWrapped:
     return jjax.JaceWrapped(jax.jit(fun, **kwargs))
 
 
-def grad(
-    fun: Callable | None = None,
+@api_helper.jax_wrapper(_jax_jax.pmap)
+def pmap(
+    fun: Callable | None = None,  # noqa: ARG001  # Unused argument
     /,
-    **kwargs: Any,
+    **kwargs: Any,  # noqa: ARG001 # Unused argument.
 ) -> jjax.JaceWrapped:
-    """The gradient transformation.
+    """Jace wrapper around `jax.pmap`.
 
-    Todo:
-        Handle controlflow properly (https://jax.readthedocs.io/en/latest/notebooks/Common_Gotchas_in_JAX.html#python-control-flow-autodiff)
+    Notes:
+        Will be supported in a very late state.
     """
-    import jax
+    raise NotImplementedError("Currently Jace is not able to run in multi resource mode.")
 
-    # fmt: off
-    if fun is None:
-        def wrapper(f: Callable) -> jjax.JaceWrapped:
-            return grad(f, **kwargs)
-        return wrapper  # type: ignore[return-value]
-    # fmt: on
 
-    return jjax.JaceWrapped(jax.grad(fun, **kwargs))
+@api_helper.jax_wrapper(_jax_jax.vmap)
+def vmap(
+    fun: Callable,
+    /,
+    **kwargs: Any,
+) -> jjax.JaceWrapped:
+    """Jace wrapper around `jax.vmap`.
 
+    Notes:
+        Currently that is an untested extension.
+    """
+    import warnings
 
-def jacfwd(
+    warnings.warn(
+        "You are using the highly untested 'vamp' interface.",
+        stacklevel=2,
+    )
+    return jit(
+        _jax_jax.vmap(
+            fun,
+            **kwargs,
+        ),
+    )
+
+
+@api_helper.jax_wrapper(_jax_jax.grad)
+def grad(
     fun: Callable | None = None,
     /,
     **kwargs: Any,
-) -> jjax.JaceWrapped:
-    """Returns the Jacobian of `fun` in forward differentiation mode."""
-    import jax
+) -> Callable:
+    """Jace wrapper for `jax.grad`.
 
-    # fmt: off
-    if fun is None:
-        def wrapper(f: Callable) -> jjax.JaceWrapped:
-            return jacfwd(f, **kwargs)
-        return wrapper  # type: ignore[return-value]
-    # fmt: on
-
-    return jjax.JaceWrapped(jax.jacfwd(fun, **kwargs))
+    Notes:
+        Note we can not put it into a `JaceWrapped` object because in autodiff mode
+            control primitives, such as `if` are allowed, but not in `jit`.
+            Thus there need to be this extra layer.
+    """
+    return _jax_jax.grad(fun, **kwargs)
 
 
-def jacrev(
+@api_helper.jax_wrapper(_jax_jax.jacfwd)
+def jacfwd(
     fun: Callable | None = None,
     /,
     **kwargs: Any,
-) -> jjax.JaceWrapped:
-    """Returns the Jacobian of `fun` in reverse differentiation mode."""
-    import jax
+) -> Callable:
+    """Jace wrapper around `jax.jacfwd`."""
+    return _jax_jax.jacfwd(fun, **kwargs)
 
-    # fmt: off
-    if fun is None:
-        def wrapper(f: Callable) -> jjax.JaceWrapped:
-            return jacrev(f, **kwargs)
-        return wrapper  # type: ignore[return-value]
-    # fmt: on
 
-    return jjax.JaceWrapped(jax.jacrev(fun, **kwargs))
+@api_helper.jax_wrapper(_jax_jax.jacrev)
+def jacrev(
+    fun: Callable | None = None,
+    /,
+    **kwargs: Any,
+) -> Callable:
+    """Jace wrapper around `jax.jacrev`."""
+    return _jax_jax.jacrev(fun, **kwargs)
diff --git a/src/jace/jax/api_helper.py b/src/jace/jax/api_helper.py
new file mode 100644
index 0000000..fbc441f
--- /dev/null
+++ b/src/jace/jax/api_helper.py
@@ -0,0 +1,37 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Helper function for the api."""
+
+from __future__ import annotations
+
+import functools as ft
+from collections.abc import Callable
+from typing import Any
+
+
+def jax_wrapper(
+    jax_fun: Callable,
+    fun: Callable | None = None,
+    /,
+    **kwargs: Any,
+) -> Callable:
+    """Creates a wrapper function for"""
+
+    # fmt: off
+    if fun is None:
+        def _inner_jax_wrapper(fun: Callable) -> Callable:
+            return jax_wrapper(jax_fun, fun, **kwargs)
+        return _inner_jax_wrapper
+    # fmt: on
+
+    ft.update_wrapper(
+        wrapper=fun,
+        wrapped=jax_fun,
+        **kwargs,
+    )
+    return fun
diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index 2ef6c2d..4a35774 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -18,6 +18,11 @@
 import jace
 
 
+def test_decorator_annotation():
+    """Tests the annotation, essential `jace.jax.api_helper.jax_wrapper`."""
+    assert jax.jit.__doc__ == jace.jit.__doc__
+
+
 def test_decorator_individually():
     """Tests the compilation steps individually."""
     jax.config.update("jax_enable_x64", True)

From b2dafe03f4775ea4c9c24c8e44a11d6954d7faa3 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 7 May 2024 15:26:57 +0200
Subject: [PATCH 115/458] Updated the tests.

The test ensure that the gradient is correctly working, i.e. can handle control flow.
---
 tests/test_jax_api.py | 28 +++++++++++++++++++++++-----
 1 file changed, 23 insertions(+), 5 deletions(-)

diff --git a/tests/test_jax_api.py b/tests/test_jax_api.py
index a48022c..1e7b911 100644
--- a/tests/test_jax_api.py
+++ b/tests/test_jax_api.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Tests the compability of the JaCe api to Jax."""
+"""Tests the compatibility of the JaCe api to Jax."""
 
 from __future__ import annotations
 
@@ -117,7 +117,25 @@ def f3_(A, B, C, D):
     assert np.allclose(ref, res_jace), "JaCe Failed."
 
 
-if __name__ == "__main__":
-    test_jit()
-    # test_composition1()
-    test_composition2()
+@pytest.mark.skip(reason="Scalar return values are not handled.")
+def test_grad_control_flow():
+    """Tests if `grad` and controlflow works.
+
+    This requirement is mentioned in `https://jax.readthedocs.io/en/latest/notebooks/Common_Gotchas_in_JAX.html#python-control-flow-autodiff`.
+    """
+    jax.config.update("jax_enable_x64", True)
+
+    def f(x):
+        if x < 3:
+            return 3.0 * x**2
+        return -4 * x
+
+    df = jace.grad(f)
+
+    x1 = 2.0
+    df_x1 = 6 * x1
+    x2 = 4.0
+    df_x2 = -4.0
+
+    assert (res := df(x1)) == df_x1, f"Failed lower branch, expected '{df_x1}', got '{res}'."
+    assert (res := df(x2)) == df_x2, f"Failed upper branch, expected '{df_x2}', got '{res}'."

From 4dc68dcf8027363bda7a98fa84783c05e40b6da9 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 7 May 2024 15:27:20 +0200
Subject: [PATCH 116/458] Updated the `pyproject.toml` file.

The tests allow now assignements in asserts.
I think this is good because it allows to write a bit shorter tests.
---
 pyproject.toml | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/pyproject.toml b/pyproject.toml
index e4786e2..ad44121 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -149,4 +149,8 @@ section-order = [
 [tool.ruff.lint.per-file-ignores]
 "!tests/**.py" = ["PT"]  # Ignore `flake8-pytest-style` everywhere except in `tests/`
 "noxfile.py" = ["T20"]  # Ignore `flake8-print`
-"tests/**" = ["T10", "T20"]  # Ignore `flake8-debugger` and `flake8-print`
+"tests/**" = [
+  "T10",
+  "T20",  # Ignore `flake8-debugger` and `flake8-print`
+  "RUF018"  # Ignore assignment in `assert`s; for printing
+]

From a2c63032db9dd1e81e309c6023ba10c8602e7695 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 8 May 2024 07:12:06 +0200
Subject: [PATCH 117/458] Updated a test a little bit to make it more
 copatible.

---
 tests/test_decorator.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index 4a35774..940e1f6 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -30,10 +30,13 @@ def test_decorator_individually():
     def testee_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
+    @jace.jit
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return testee_(A, B)
+
     A = np.arange(12, dtype=np.float64).reshape((4, 3))
     B = np.full((4, 3), 10, dtype=np.float64)
 
-    testee = jace.jit(testee_)
     lowered = testee.lower(A, B)
     optimized = lowered.optimize()
     compiled = optimized.compile()

From 2d2cf570963ba853c9b9f368e43860edbb2b1a57 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 8 May 2024 11:07:52 +0200
Subject: [PATCH 118/458] Added a function to create a special dataclass.

The class essentially allows to create some preprocessing step before calling the actuall init.
This way more arguments can be accepted.
---
 src/jace/util/__init__.py |  3 ++-
 src/jace/util/util.py     | 47 +++++++++++++++++++++++++++++++++++++--
 2 files changed, 47 insertions(+), 3 deletions(-)

diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 9da254b..afe61a6 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -21,12 +21,13 @@
 )
 from .re_pattern import _VALID_JAX_VAR_NAME, _VALID_SDFG_OBJ_NAME, _VALID_SDFG_VAR_NAME
 from .traits import is_drop_var, is_jaceified, is_jaxified, is_non_string_iterable
-from .util import as_sequence
+from .util import as_sequence, dataclass_with_default_init
 
 
 __all__ = [
     "as_sequence",
     "compile_jax_sdfg",
+    "dataclass_with_default_init",
     "is_drop_var",
     "is_tracing_ongoing",
     "is_jaceified",
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index 96bfa20..f3dbdd4 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -7,8 +7,8 @@
 
 from __future__ import annotations
 
-from collections.abc import Iterable
-from typing import TypeVar, cast, overload
+from collections.abc import Callable, Iterable
+from typing import Any, TypeVar, cast, overload
 
 from jace.util import traits
 
@@ -32,3 +32,46 @@ def as_sequence(value: _T | Iterable[_T]) -> Iterable[_T]:
     if traits.is_non_string_iterable(value):
         return value
     return cast(Iterable[_T], [value])
+
+
+def dataclass_with_default_init(
+    _cls: type | None = None,
+    *args: Any,
+    **kwargs: Any,
+) -> type | Callable[[type], type]:
+    """The dataclasses `__init__` will now be made available as `__default_init__` if `_cls` define `__init__`.
+
+    Adapted from `https://stackoverflow.com/a/58336722`
+    """
+    from dataclasses import dataclass
+
+    def wrap(cls: type) -> type:
+        # Save the current __init__ and remove it so dataclass will create the default __init__.
+        #  But only do something if the class has an `__init__` function.
+        has_user_init = hasattr(cls, "__init__")
+        if has_user_init:
+            user_init = getattr(cls, "__init__", None)
+            delattr(cls, "__init__")
+
+        # let dataclass process our class.
+        result = dataclass(cls, *args, **kwargs)  # type: ignore[var-annotated]
+
+        # If there is no init function in the original class then, we are done.
+        if not has_user_init:
+            return result
+
+        # Restore the user's __init__ save the default init to __default_init__.
+        result.__default_init__ = result.__init__
+        result.__init__ = user_init
+
+        # Just in case that dataclass will return a new instance,
+        # (currently, does not happen), restore cls's __init__.
+        if result is not cls:
+            cls.__init__ = user_init  # type: ignore[misc]
+
+        return result
+
+    # Support both dataclass_with_default_init() and dataclass_with_default_init
+    if _cls is None:
+        return wrap
+    return wrap(_cls)

From b77dfccf7adcd78ee2ff4e97fe76af70d570ac15 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 8 May 2024 11:11:39 +0200
Subject: [PATCH 119/458] Updated the trait functions.

---
 src/jace/util/__init__.py | 13 ++++++++++++-
 src/jace/util/traits.py   | 40 ++++++++++++++++++++++++++++++++++++++-
 2 files changed, 51 insertions(+), 2 deletions(-)

diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index afe61a6..eec5d57 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -20,7 +20,15 @@
     translate_dtype,
 )
 from .re_pattern import _VALID_JAX_VAR_NAME, _VALID_SDFG_OBJ_NAME, _VALID_SDFG_VAR_NAME
-from .traits import is_drop_var, is_jaceified, is_jaxified, is_non_string_iterable
+from .traits import (
+    is_drop_var,
+    is_fully_addressable,
+    is_jaceified,
+    is_jax_array,
+    is_jaxified,
+    is_non_string_iterable,
+    is_on_device,
+)
 from .util import as_sequence, dataclass_with_default_init
 
 
@@ -32,7 +40,10 @@
     "is_tracing_ongoing",
     "is_jaceified",
     "is_jaxified",
+    "is_jax_array",
+    "is_fully_addressable",
     "is_non_string_iterable",
+    "is_on_device",
     "JaCeVar",
     "get_jax_var_name",
     "get_jax_var_shape",
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 58881fa..750b7bb 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -37,7 +37,7 @@ def is_jaceified(obj: Any) -> TypeGuard[jjax.JaceWrapped]:
     return isinstance(obj, jjax.JaceWrapped)
 
 
-def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.Dorp]:
+def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVarp]:
     """Tests if `jax_var` is a drop variable, i.e. a variable that is not read from in a Jaxpr."""
 
     if isinstance(jax_var, jax_core.DropVar):
@@ -67,3 +67,41 @@ def is_jaxified(
         jax_xe.PjitFunction,
     )
     return isinstance(obj, jaxifyed_types)
+
+
+def is_jax_array(
+    obj: Any,
+) -> bool:
+    """Tests if `obj` is a jax array.
+
+    Todo:
+        Find the Jax type for `TypeGuard`.
+    """
+    # Currently this seams to be the besst way to identify Jax arrays.
+    return all(hasattr(obj, x) for x in ["sharding", "is_fully_addressable"])
+
+
+def is_on_device(
+    obj: Any,
+) -> bool:
+    """Tests if `obj` is on a device."""
+    # The problem is, that we can not test if `__cuda_array_interface__` exists.
+    #  because Jax array have that even on CPU, thus it is a bit mnore complex.
+    # TODO(phimuell): Hip
+    if is_jax_array(obj):
+        obj = obj.__array__()
+    return hasattr(obj, "__cuda_array_interface__")
+
+
+def is_fully_addressable(
+    obj: Any,
+) -> bool:
+    """Tests if `obj` is fully addreassable, i.e. is only on this host.
+
+    Notes:
+        The function (currently) assumes that everything that is not a distributed
+            Jax array is on this host.
+    """
+    if is_jax_array(obj):
+        return obj.is_fully_addressable()
+    return True

From dc2d9baf854151a39bff31be88d35ed4492d3724 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 8 May 2024 11:19:55 +0200
Subject: [PATCH 120/458] Added an import.

Let's hope that it is a good idea.
---
 src/jace/translator/__init__.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index d6bb0c7..b643776 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -10,10 +10,12 @@
 from __future__ import annotations
 
 from .jaxpr_translator_driver import JaxprTranslationDriver
+from .sub_translators import PrimitiveTranslator
 from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
 
 __all__ = [
     "JaxprTranslationDriver",
+    "PrimitiveTranslator",
     "TranslatedJaxprSDFG",
 ]

From 22064ab22413b45295acde47205cd169f958754b Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 8 May 2024 11:20:51 +0200
Subject: [PATCH 121/458] Explicitly exporting the `jace.jax.stages` interface.

---
 src/jace/jax/__init__.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/jace/jax/__init__.py b/src/jace/jax/__init__.py
index 46ec45a..bb826a1 100644
--- a/src/jace/jax/__init__.py
+++ b/src/jace/jax/__init__.py
@@ -9,7 +9,7 @@
 
 from __future__ import annotations
 
-from . import api_helper
+from . import api_helper, stages
 from .api import grad, jacfwd, jacrev, jit
 from .stages import (
     CompilerOptions,
@@ -20,6 +20,7 @@
 
 
 __all__ = [
+    "stages",
     "Compiled",
     "CompilerOptions",
     "JaceWrapped",

From d28ec0e4967ab4e718668e9860a9923dfe0831b0 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 8 May 2024 11:27:30 +0200
Subject: [PATCH 122/458] Updated the `JaCeVar` class.

It now uses the new kind of dataclass, thus it has now a decent constructor.
Furthermore, it now also has a storage property, which the Jax stuff does not have.
Probably it also misses strides, who knows.
---
 .../translator/jaxpr_translator_driver.py     |  5 +++
 src/jace/util/jax_helper.py                   | 44 ++++++++++++++-----
 src/jace/util/traits.py                       |  9 +++-
 3 files changed, 46 insertions(+), 12 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index dfd6695..910a0ae 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -478,6 +478,11 @@ def add_array(
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
         is_scalar: bool = shape == ()
 
+        # Use the storage if passed in the variable.
+        #  Note that this is a bad idea, since one should always specialize later.
+        if isinstance(arg, util.JaCeVar):
+            storage = arg.storage
+
         if (alt_name is None) and (self.map_jax_var_to_sdfg(arg, allow_fail=True) is not None):
             # Maybe the test could be more robust, but it will check if we try to create
             #  a variable for a second time. It is, however, okay to use one as template,
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index ef5e91a..f7015bb 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -16,8 +16,7 @@
 from __future__ import annotations
 
 import itertools
-from collections.abc import Mapping
-from dataclasses import dataclass
+from collections.abc import Mapping, Sequence
 from typing import Any, overload
 
 import dace
@@ -26,26 +25,53 @@
 import numpy as np
 
 from jace import util
+from jace.util import util as dcutil  # Partially initialized module
 
 
-@dataclass(init=True, repr=True, frozen=True, slots=True)
+@dcutil.dataclass_with_default_init(init=True, repr=True, frozen=True, slots=True)
 class JaCeVar:
     """Substitute class for Jax' `Var` instance.
 
-    This class is similar to a `jax.core.Var` class, but much simpler.
-    It is only a container for a name, shape and a datatype.
-    All extractor functions `get_jax_var{name, shape, dtype}()` will accept it, as well as multiple functions of the driver.
+    This class can be seen as some kind of substitute `jax.core.Var`.
+    The main intention of this class is as an internal representation of values,
+    as they are used in Jax, but without the Jax machinery.
+    The main differences to Jax variable is, that this class has a name and also a storage type.
 
     Notes:
         Main intention is to test functionality.
         If the name of a `JaCeVar` is '_' it is considered a drop variable.
         If the name of a `JaCeVar` is empty, the automatic naming will consider it as a Jax variable.
         The definition of `__hash__` and `__eq__` is in accordance how Jax variable works.
+
+    Todo:
+        Do we need strides for caching; I would say so.
     """
 
     name: str
     shape: tuple[int | dace.symbol | str, ...] | tuple[()]
     dtype: dace.typeclass
+    storage: dace.StorageType = dace.StorageType.Default
+
+    def __init__(
+        self,
+        name: str,
+        shape: Sequence[int | dace.symbol | str] | int | dace.symbol | str,
+        dtype: Any,
+        storage: dace.StorageType = dace.StorageType.Default,
+    ) -> None:
+        if name == "":
+            pass  # Explicit allowed in the interface, but a bit strange.
+        elif (name != "_") and (not util._VALID_SDFG_VAR_NAME.fullmatch(name)):
+            raise ValueError(f"Passed an invalid name '{name}'.")
+        if isinstance(shape, (int, dace.symbol, str)):
+            shape = (shape,)
+        elif not isinstance(shape, tuple):
+            shape = tuple(shape)
+        if not isinstance(dtype, dace.typeclass):
+            dtype = translate_dtype(dtype)
+        assert all(isinstance(x, (int, dace.symbol, str)) for x in shape)
+        assert isinstance(storage, dace.StorageType)
+        self.__default_init__(name=name, shape=shape, dtype=dtype, storage=storage)  # type: ignore[attr-defined]  # __default_init__ is existing.
 
     def __hash__(self) -> int:
         return id(self)
@@ -55,10 +81,6 @@ def __eq__(self, other: Any) -> bool:
             return NotImplemented
         return id(self) == id(other)
 
-    def __post_init__(self) -> None:
-        if not isinstance(self.shape, tuple):
-            raise ValueError("The 'shape' member of a 'JaCeVar' must be a tuple.")
-
 
 def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar | str) -> str:
     """Returns the name of the Jax variable as a string.
@@ -99,7 +121,7 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar | str) -> str:
 
 
 @overload
-def get_jax_var_shape(jax_var: JaCeVar) -> tuple[int | dace.symbol | str, ...] | tuple[()]: ...
+def get_jax_var_shape(jax_var: JaCeVar) -> tuple[int | dace.symbol | str, ...] | tuple[()]: ...  # type: ignore[overload-overlap]
 
 
 @overload
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 750b7bb..91def43 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -12,6 +12,7 @@
 from collections.abc import Iterable
 from typing import Any, TypeGuard
 
+import dace
 from jax import _src as jax_src, core as jax_core
 from jaxlib import xla_extension as jax_xe
 
@@ -84,7 +85,13 @@ def is_jax_array(
 def is_on_device(
     obj: Any,
 ) -> bool:
-    """Tests if `obj` is on a device."""
+    """Tests if `obj` is on a device.
+
+    The function will recognize and correctly handle `JaCeVar` objects.
+    """
+    if isinstance(obj, util.JaCeVar):
+        return obj.storage in [dace.StorageType.GPU_Global, dace.StorageType.GPU_Shared]
+
     # The problem is, that we can not test if `__cuda_array_interface__` exists.
     #  because Jax array have that even on CPU, thus it is a bit mnore complex.
     # TODO(phimuell): Hip

From 9b029618833a192779bcc81d85197f85a5bb0a40 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 8 May 2024 12:01:11 +0200
Subject: [PATCH 123/458] Added a cache for the stages.

However, it is not yet integrated.
---
 src/jace/util/__init__.py          |   2 +-
 src/jace/util/translation_cache.py | 252 +++++++++++++++++++++++++++++
 2 files changed, 253 insertions(+), 1 deletion(-)
 create mode 100644 src/jace/util/translation_cache.py

diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index eec5d57..d9f8476 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -33,6 +33,7 @@
 
 
 __all__ = [
+    "JaCeVar",
     "as_sequence",
     "compile_jax_sdfg",
     "dataclass_with_default_init",
@@ -44,7 +45,6 @@
     "is_fully_addressable",
     "is_non_string_iterable",
     "is_on_device",
-    "JaCeVar",
     "get_jax_var_name",
     "get_jax_var_shape",
     "get_jax_var_dtype",
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
new file mode 100644
index 0000000..5a3af02
--- /dev/null
+++ b/src/jace/util/translation_cache.py
@@ -0,0 +1,252 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""This module contains the functionality related to the compilation cache of the stages.
+
+Actually there are two different caches:
+- The lowering cache.
+- And the compilation cache.
+
+Both are implemented as a singleton.
+"""
+
+from __future__ import annotations
+
+from collections import OrderedDict
+from collections.abc import Callable
+from dataclasses import dataclass
+from typing import Any
+
+import dace
+from jax import core as jax_core
+
+from jace import util
+from jace.jax import stages
+
+
+def get_cache(
+    name: str,
+    size: int = 128,
+) -> TranslationCache:
+    """Returns the cache associated to `name`.
+
+    If called for the first time, the cache sizes will be set to `size`.
+    In all later calls this value is ignored.
+    """
+    # Get the caches and if not present, create them.
+    if not hasattr(get_cache, "_caches"):
+        _caches: dict[str, TranslationCache] = {}
+        _caches["lowering"] = TranslationCache(size=size)
+        _caches["compiling"] = TranslationCache(size=size)
+        get_cache._caches = _caches  # type: ignore[attr-defined]  # ruff removes the `getattr()` calls
+    _caches = get_cache._caches  # type: ignore[attr-defined]
+
+    if name not in _caches:
+        raise ValueError(f"The cache '{name}' is unknown.")
+    return _caches[name]
+
+
+@util.dataclass_with_default_init(init=True, repr=True, frozen=True, slots=True)
+class _JaCeVarWrapper:
+    """Wrapper class around `JaCeVar` for use in `_CacheKey`.
+
+    It essentially makes the hash depend on the content, with the exception of name.
+    """
+
+    _slots__ = ("var", "_hash")
+    var: util.JaCeVar
+    _hash: int
+
+    def __init__(self, var: util.JaCeVar) -> None:
+        _hash: int = hash((var.shape, var.dtype, var.storage))
+        if var.name != "":
+            raise ValueError("Key can not have a name.")
+        self.__default_init__(var=var, _hash=_hash)  # type: ignore[attr-defined]
+
+    def __hash__(self) -> int:
+        return self._hash
+
+    def __eq__(self, other: Any) -> bool:
+        if not isinstance(other, _JaCeVarWrapper):
+            return NotImplemented
+        return (self.var.shape, self.var.dtype, self.var.storage) == (
+            other.var.shape,
+            other.var.dtype,
+            other.var.storage,
+        )
+
+    @classmethod
+    def from_value(
+        cls,
+        val: Any,
+    ) -> _JaCeVarWrapper:
+        """Returns a `JaCe` variable constructed from `val`.
+
+        If `val` is on the device, its storage type will be `GPU_Global` otherwise the default.
+
+        Todo:
+            Improve, such that NumPy arrays are on CPU, CuPy on GPU and so on.
+        """
+        if not util.is_fully_addressable(val):
+            raise NotImplementedError("Distributed arrays are not addressed yet.")
+
+        if isinstance(val, util.JaCeVar):
+            return cls(var=val)
+
+        # Define the storage as given by on device.
+        storage: dace.StorageType | None = (
+            dace.StorageType.GPU_Global if util.is_on_device(val) else None
+        )
+
+        if isinstance(val, jax_core.Var):
+            val = val.aval
+        if isinstance(val, jax_core.Literal):
+            raise TypeError("Jax Literals are not supported as cache keys.")
+
+        # We need at least a shaped array
+        if isinstance(val, jax_core.ShpedArray):
+            return cls(
+                util.JaCeVar(
+                    name="",
+                    shape=val.aval.shape,
+                    dtype=val,
+                    storage=storage,
+                ),
+            )
+        if isinstance(val, jax_core.AbstractValue):
+            raise TypeError(f"Can not make 'JaCeVar' from '{type(val).__name__}', too abstract.")
+
+        # If we are here, then we where not able, thus we will will now try Jax
+        #  This is inefficient and we should make it better.
+        return cls.from_value(jax_core.get_aval(val))
+
+
+@dataclass(init=True, eq=True, frozen=True, unsafe_hash=True)
+class _CacheKey:
+    """Wrapper around the arguments"""
+
+    __slots__ = ("fun", "sdfg_hash", "vars", "_hash")
+
+    # Note that either `_fun` or `_sdfg_hash` are not `None`.
+    fun: Callable | None
+    sdfg_hash: int | None
+    fargs: tuple[_JaCeVarWrapper, ...]
+
+    @classmethod
+    def Create(
+        cls,
+        stage: stages.Stage,
+        *args: Any,
+        **kwargs: Any,
+    ) -> _CacheKey:
+        """Creates a cache key for the stage object `stage` that was called to advance."""
+        if len(kwargs) != 0:
+            raise NotImplementedError("kwargs are not implemented.")
+
+        if isinstance(stage, stages.JaceWrapped):
+            fun = stage.__wrapped__
+            sdfg_hash = None
+        elif isinstance(stage, stages.JaceLowered):
+            fun = None
+            sdfg_hash = int(stage.compiler_ir().sdfg.hash_sdfg, 16)
+        else:
+            raise TypeError(f"Can not make key from '{type(stage).__name__}'.")
+
+        fargs = tuple(_JaCeVarWrapper.from_value(x) for x in args)
+
+        return cls(fun=fun, sdfg_hash=sdfg_hash, fargs=fargs)
+
+
+class TranslationCache:
+    """The _internal_ cache object.
+
+    It implements a simple LRU cache.
+
+    Todo:
+        Also handle abstract values.
+    """
+
+    __slots__ = ["_memory", "_size"]
+
+    _memory: OrderedDict[_CacheKey, stages.Stage]
+    _size: int
+
+    def __init__(
+        self,
+        size: int = 128,
+    ) -> None:
+        """Creates a cache instance of size `size`."""
+        if size <= 0:
+            raise ValueError(f"Invalid cache size of '{size}'")
+        self._memory: OrderedDict[_CacheKey, stages.Stage] = OrderedDict()
+        self._size = size
+
+    @staticmethod
+    def make_key(
+        stage: stages.Stage,
+        *args: Any,
+        **kwargs: Any,
+    ) -> _CacheKey:
+        """Create a key object for `stage`."""
+        if len(kwargs) != 0:
+            raise NotImplementedError
+        return _CacheKey.Create(stage, *args, **kwargs)
+
+    def has(
+        self,
+        key: _CacheKey,
+    ) -> bool:
+        """Check if `self` have a record of `key`.
+
+        To generate `key` use the `make_key` function.
+        """
+        return key in self._memory
+
+    def get(
+        self,
+        key: _CacheKey,
+    ) -> stages.Stage:
+        """Get the next stage associated with `key`.
+
+        It is an error if `key` does not exists.
+        This function will move `key` to front of `self`.
+        """
+        if not self.has(key):
+            raise KeyError(f"Key '{key}' is unknown.")
+        self._memory.move_to_end(key, last=False)
+        return self._memory.get(key)  # type: ignore[return-value]  # type confusion
+
+    def add(
+        self,
+        key: _CacheKey,
+        res: stages.Stage,
+    ) -> TranslationCache:
+        """Adds `res` under `key` to `self`.
+
+        In case `key` is already known, it will first be eviceted and then reinserted.
+        If `self` is larger than specified the oldest one will be evicted.
+        """
+        self._evict(key)
+        while len(self._memory) >= self._size:
+            self._memory.popitem(last=True)
+        self._memory[key] = res
+        self._memory.move_to_end(key, last=False)
+        return self
+
+    def _evict(
+        self,
+        key: _CacheKey,
+    ) -> bool:
+        """Evict `key` from `self`.
+
+        Returns if it was evicted or not.
+        """
+        if not self.has(key):
+            return False
+        self._memory.move_to_end(key, last=True)
+        self._memory.popitem(last=True)
+        return True

From a5b593a17b44b3e0df29069eb4863e5025fe4f88 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 8 May 2024 15:03:13 +0200
Subject: [PATCH 124/458] WIP: Starting to integrate the caching, however,
 nothing is tested yet, it will probably not work.

---
 src/jace/jax/stages/jace_wrapped.py |  9 ++++++++-
 src/jace/util/translation_cache.py  | 25 +++++++++++++++++++++++++
 2 files changed, 33 insertions(+), 1 deletion(-)

diff --git a/src/jace/jax/stages/jace_wrapped.py b/src/jace/jax/stages/jace_wrapped.py
index 28aa58c..72a5971 100644
--- a/src/jace/jax/stages/jace_wrapped.py
+++ b/src/jace/jax/stages/jace_wrapped.py
@@ -16,6 +16,7 @@
 
 from jace import translator, util
 from jace.jax import stages
+from jace.util import translation_cache as tcache
 
 
 class JaceWrapped(stages.Stage):
@@ -35,9 +36,13 @@ class JaceWrapped(stages.Stage):
         Copy the `jax._src.pjit.make_jit()` functionality to remove `jax.make_jaxpr()`.
     """
 
-    __slots__ = ("fun_",)
+    __slots__ = (
+        "fun_",
+        "_cache",
+    )
 
     _fun: Callable
+    _cache: tcache.TranslationCache
 
     def __init__(
         self,
@@ -46,6 +51,7 @@ def __init__(
         """Creates a wrapped jace jitable object of `jax_prim`."""
         assert fun is not None
         self._fun: Callable = fun
+        self._cache: tcache.TranslationCache = tcache.get_cache("lowering")
 
     def __call__(
         self,
@@ -65,6 +71,7 @@ def __call__(
         #                   https://jax.readthedocs.io/en/latest/aot.html#lowering-with-static-arguments
         return self.lower(*args, **kwargs).optimize().compile()(*args, **kwargs)
 
+    @tcache.cached_translation
     def lower(
         self,
         *args: Any,
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 5a3af02..057507b 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -16,6 +16,7 @@
 
 from __future__ import annotations
 
+import functools as ft
 from collections import OrderedDict
 from collections.abc import Callable
 from dataclasses import dataclass
@@ -50,6 +51,30 @@ def get_cache(
     return _caches[name]
 
 
+def cached_translation(
+    action: Callable,
+) -> Callable:
+    """Decorator for making the function cacheable."""
+
+    @ft.wraps(action)
+    def _action_wrapper(
+        self: stages.Stage,
+        *args: Any,
+        **kwargs: Any,
+    ) -> stages.Stage:
+        assert hasattr(self, "_cache")
+        cache: TranslationCache = self._cache
+        key: _CacheKey = self.make_key(self, *args, **kwargs)
+        if cache.has(key):
+            return cache.get(key)
+
+        next_stage: stages.Stage = action(*args, **kwargs)
+        cache.add(key, next_stage)
+        return next_stage
+
+    return _action_wrapper
+
+
 @util.dataclass_with_default_init(init=True, repr=True, frozen=True, slots=True)
 class _JaCeVarWrapper:
     """Wrapper class around `JaCeVar` for use in `_CacheKey`.

From 1ae6f3a1d1c7ff8ac31234dcf43082dbd194b658 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 07:14:23 +0200
Subject: [PATCH 125/458] Relocated the variable Patterns.

---
 src/jace/translator/_translation_context.py   |  2 +-
 .../translator/jaxpr_translator_driver.py     |  8 +++----
 src/jace/util/__init__.py                     | 15 ++++++++-----
 src/jace/util/jax_helper.py                   |  4 ++--
 src/jace/util/re_pattern.py                   | 22 -------------------
 src/jace/util/util.py                         | 11 ++++++++++
 6 files changed, 28 insertions(+), 34 deletions(-)
 delete mode 100644 src/jace/util/re_pattern.py

diff --git a/src/jace/translator/_translation_context.py b/src/jace/translator/_translation_context.py
index 15dd47f..6253118 100644
--- a/src/jace/translator/_translation_context.py
+++ b/src/jace/translator/_translation_context.py
@@ -70,7 +70,7 @@ def __init__(
             rev_idx:    The revision index of the context.
             name:       Name of the SDFG object.
         """
-        if isinstance(name, str) and not util._VALID_SDFG_OBJ_NAME.fullmatch(name):
+        if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
         self.sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 910a0ae..11af050 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -196,7 +196,7 @@ def append_new_state(
             prev_state:     Alternative `SDFGState` at which we should append the new state.
 
         """
-        if isinstance(label, str) and (not util._VALID_SDFG_OBJ_NAME.fullmatch(label)):
+        if isinstance(label, str) and (not util.VALID_SDFG_OBJ_NAME.fullmatch(label)):
             raise ValueError(f"Can not create state with label '{label}' since it is invalid.")
 
         # Decide if appending to that state will modify the terminal state.
@@ -385,7 +385,7 @@ def add_reserved_names(
             raise TypeError(f"Does not know how to handle the type '{type(reserved_names)}'.")
         for rev_name in reserved_names:
             assert isinstance(rev_name, str)
-            if not util._VALID_SDFG_VAR_NAME.fullmatch(rev_name):
+            if not util.VALID_SDFG_VAR_NAME.fullmatch(rev_name):
                 raise ValueError(
                     f"Can not use '{rev_name}' as reserved name as it is not a valid SDFG name."
                 )
@@ -509,7 +509,7 @@ def add_array(
                 raise ValueError("Passed an empty 'alt_name'.")
             if alt_name in self._forbidden_names:
                 raise ValueError("'alt_name' is a forbidden name.")
-            if not util._VALID_SDFG_VAR_NAME.fullmatch(alt_name):
+            if not util.VALID_SDFG_VAR_NAME.fullmatch(alt_name):
                 raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
             if name_prefix is not None:
                 raise ValueError(
@@ -596,7 +596,7 @@ def add_array(
             raise ValueError(f"Can't create variable '{arg_name}', name is forbidden.")
         if arg_name in self._ctx.sdfg.arrays:
             raise ValueError(f"Can't create variable '{arg_name}', variable is already created.")
-        if not util._VALID_SDFG_VAR_NAME.fullmatch(arg_name):
+        if not util.VALID_SDFG_VAR_NAME.fullmatch(arg_name):
             raise ValueError(f"The requested variable name '{arg_name}' is invalid.")
 
         # Promotion of scalar to array.
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index d9f8476..3a85f98 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -19,7 +19,6 @@
     is_tracing_ongoing,
     translate_dtype,
 )
-from .re_pattern import _VALID_JAX_VAR_NAME, _VALID_SDFG_OBJ_NAME, _VALID_SDFG_VAR_NAME
 from .traits import (
     is_drop_var,
     is_fully_addressable,
@@ -29,7 +28,13 @@
     is_non_string_iterable,
     is_on_device,
 )
-from .util import as_sequence, dataclass_with_default_init
+from .util import (
+    VALID_JAX_VAR_NAME,
+    VALID_SDFG_OBJ_NAME,
+    VALID_SDFG_VAR_NAME,
+    as_sequence,
+    dataclass_with_default_init,
+)
 
 
 __all__ = [
@@ -52,7 +57,7 @@
     "run_jax_sdfg",
     "_jace_run",
     "_propose_jax_name",
-    "_VALID_JAX_VAR_NAME",
-    "_VALID_SDFG_OBJ_NAME",
-    "_VALID_SDFG_VAR_NAME",
+    "VALID_JAX_VAR_NAME",
+    "VALID_SDFG_OBJ_NAME",
+    "VALID_SDFG_VAR_NAME",
 ]
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index f7015bb..3d27e24 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -61,7 +61,7 @@ def __init__(
     ) -> None:
         if name == "":
             pass  # Explicit allowed in the interface, but a bit strange.
-        elif (name != "_") and (not util._VALID_SDFG_VAR_NAME.fullmatch(name)):
+        elif (name != "_") and (not util.VALID_SDFG_VAR_NAME.fullmatch(name)):
             raise ValueError(f"Passed an invalid name '{name}'.")
         if isinstance(shape, (int, dace.symbol, str)):
             shape = (shape,)
@@ -115,7 +115,7 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar | str) -> str:
             )
     assert isinstance(jax_name, str)
 
-    if not util._VALID_JAX_VAR_NAME.fullmatch(jax_name):
+    if not util.VALID_JAX_VAR_NAME.fullmatch(jax_name):
         raise ValueError(f"Deduced Jax name '{jax_name}' is invalid.")
     return jax_name
 
diff --git a/src/jace/util/re_pattern.py b/src/jace/util/re_pattern.py
deleted file mode 100644
index 99fb71a..0000000
--- a/src/jace/util/re_pattern.py
+++ /dev/null
@@ -1,22 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Module containing all regex pattern that we need inside JaCe."""
-
-from __future__ import annotations
-
-import re
-
-
-# Valid name for a jax variable.
-_VALID_JAX_VAR_NAME: re.Pattern = re.compile("(jax[0-9]+_?)|([a-z]+_?)")
-
-# Valid name for an SDFG variable.
-_VALID_SDFG_VAR_NAME: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")
-
-# Valid name for an SDFG itself, includes `SDFGState` objects.
-_VALID_SDFG_OBJ_NAME: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index f3dbdd4..72e3ee6 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -7,6 +7,7 @@
 
 from __future__ import annotations
 
+import re
 from collections.abc import Callable, Iterable
 from typing import Any, TypeVar, cast, overload
 
@@ -75,3 +76,13 @@ def wrap(cls: type) -> type:
     if _cls is None:
         return wrap
     return wrap(_cls)
+
+
+# Valid name for a jax variable.
+VALID_JAX_VAR_NAME: re.Pattern = re.compile("(jax[0-9]+_?)|([a-z]+_?)")
+
+# Valid name for an SDFG variable.
+VALID_SDFG_VAR_NAME: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")
+
+# Valid name for an SDFG itself, includes `SDFGState` objects.
+VALID_SDFG_OBJ_NAME: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")

From 27fa2bf607b68a629280da5f4fcf5c31e7840298 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 07:29:41 +0200
Subject: [PATCH 126/458] Updated the `JaCeVar` class.

It is now simpler again.
However, we have to change the cache mechanism again.
---
 .../translator/jaxpr_translator_driver.py     |  5 ---
 src/jace/util/jax_helper.py                   | 45 ++++++++++---------
 2 files changed, 25 insertions(+), 25 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 11af050..92ca8be 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -478,11 +478,6 @@ def add_array(
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
         is_scalar: bool = shape == ()
 
-        # Use the storage if passed in the variable.
-        #  Note that this is a bad idea, since one should always specialize later.
-        if isinstance(arg, util.JaCeVar):
-            storage = arg.storage
-
         if (alt_name is None) and (self.map_jax_var_to_sdfg(arg, allow_fail=True) is not None):
             # Maybe the test could be more robust, but it will check if we try to create
             #  a variable for a second time. It is, however, okay to use one as template,
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 3d27e24..72ff85d 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -17,6 +17,7 @@
 
 import itertools
 from collections.abc import Mapping, Sequence
+from dataclasses import dataclass
 from typing import Any, overload
 
 import dace
@@ -25,40 +26,53 @@
 import numpy as np
 
 from jace import util
-from jace.util import util as dcutil  # Partially initialized module
 
 
-@dcutil.dataclass_with_default_init(init=True, repr=True, frozen=True, slots=True)
+@dataclass(init=True, repr=True, frozen=True, eq=False)
 class JaCeVar:
     """Substitute class for Jax' `Var` instance.
 
     This class can be seen as some kind of substitute `jax.core.Var`.
     The main intention of this class is as an internal representation of values,
     as they are used in Jax, but without the Jax machinery.
-    The main differences to Jax variable is, that this class has a name and also a storage type.
+    The main differences to Jax variable is that this class has a name.
 
     Notes:
         Main intention is to test functionality.
         If the name of a `JaCeVar` is '_' it is considered a drop variable.
         If the name of a `JaCeVar` is empty, the automatic naming will consider it as a Jax variable.
         The definition of `__hash__` and `__eq__` is in accordance how Jax variable works.
-
-    Todo:
-        Do we need strides for caching; I would say so.
     """
 
     name: str
     shape: tuple[int | dace.symbol | str, ...] | tuple[()]
     dtype: dace.typeclass
-    storage: dace.StorageType = dace.StorageType.Default
 
-    def __init__(
-        self,
+    def __hash__(self) -> int:
+        return id(self)
+
+    def __eq__(self, other: Any) -> bool:
+        if not isinstance(other, JaCeVar):
+            return NotImplemented
+        return id(self) == id(other)
+
+    @classmethod
+    def Create(
+        cls,
         name: str,
         shape: Sequence[int | dace.symbol | str] | int | dace.symbol | str,
         dtype: Any,
-        storage: dace.StorageType = dace.StorageType.Default,
     ) -> None:
+        """Creates a `JaCeVar` object.
+
+        Performs some sanity checks on the input.
+        It is also possible that `shape` can be an integer or symbol, that is then translated into an tuple.
+
+        Args:
+            name:       Name of the variable, might be empty.
+            shape:      The shape of the array.
+            dtype:      The datatype, will be transformed into a dace datatype.
+        """
         if name == "":
             pass  # Explicit allowed in the interface, but a bit strange.
         elif (name != "_") and (not util.VALID_SDFG_VAR_NAME.fullmatch(name)):
@@ -70,16 +84,7 @@ def __init__(
         if not isinstance(dtype, dace.typeclass):
             dtype = translate_dtype(dtype)
         assert all(isinstance(x, (int, dace.symbol, str)) for x in shape)
-        assert isinstance(storage, dace.StorageType)
-        self.__default_init__(name=name, shape=shape, dtype=dtype, storage=storage)  # type: ignore[attr-defined]  # __default_init__ is existing.
-
-    def __hash__(self) -> int:
-        return id(self)
-
-    def __eq__(self, other: Any) -> bool:
-        if not isinstance(other, JaCeVar):
-            return NotImplemented
-        return id(self) == id(other)
+        return cls(name=name, shape=shape, dtype=dtype)
 
 
 def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar | str) -> str:

From 07fd08681b7fdd94a6a2499b0f216d35cf2f100e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 07:31:35 +0200
Subject: [PATCH 127/458] Removed the `dataclass_with_default_init` function.

Note that this commit renders the caching mechanism unusable.
---
 src/jace/util/__init__.py |  1 -
 src/jace/util/util.py     | 47 ++-------------------------------------
 2 files changed, 2 insertions(+), 46 deletions(-)

diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 3a85f98..b1f9255 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -33,7 +33,6 @@
     VALID_SDFG_OBJ_NAME,
     VALID_SDFG_VAR_NAME,
     as_sequence,
-    dataclass_with_default_init,
 )
 
 
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index 72e3ee6..4e97e8c 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -8,8 +8,8 @@
 from __future__ import annotations
 
 import re
-from collections.abc import Callable, Iterable
-from typing import Any, TypeVar, cast, overload
+from collections.abc import Iterable
+from typing import TypeVar, cast, overload
 
 from jace.util import traits
 
@@ -35,49 +35,6 @@ def as_sequence(value: _T | Iterable[_T]) -> Iterable[_T]:
     return cast(Iterable[_T], [value])
 
 
-def dataclass_with_default_init(
-    _cls: type | None = None,
-    *args: Any,
-    **kwargs: Any,
-) -> type | Callable[[type], type]:
-    """The dataclasses `__init__` will now be made available as `__default_init__` if `_cls` define `__init__`.
-
-    Adapted from `https://stackoverflow.com/a/58336722`
-    """
-    from dataclasses import dataclass
-
-    def wrap(cls: type) -> type:
-        # Save the current __init__ and remove it so dataclass will create the default __init__.
-        #  But only do something if the class has an `__init__` function.
-        has_user_init = hasattr(cls, "__init__")
-        if has_user_init:
-            user_init = getattr(cls, "__init__", None)
-            delattr(cls, "__init__")
-
-        # let dataclass process our class.
-        result = dataclass(cls, *args, **kwargs)  # type: ignore[var-annotated]
-
-        # If there is no init function in the original class then, we are done.
-        if not has_user_init:
-            return result
-
-        # Restore the user's __init__ save the default init to __default_init__.
-        result.__default_init__ = result.__init__
-        result.__init__ = user_init
-
-        # Just in case that dataclass will return a new instance,
-        # (currently, does not happen), restore cls's __init__.
-        if result is not cls:
-            cls.__init__ = user_init  # type: ignore[misc]
-
-        return result
-
-    # Support both dataclass_with_default_init() and dataclass_with_default_init
-    if _cls is None:
-        return wrap
-    return wrap(_cls)
-
-
 # Valid name for a jax variable.
 VALID_JAX_VAR_NAME: re.Pattern = re.compile("(jax[0-9]+_?)|([a-z]+_?)")
 

From b6d92758a92bb745161118f16f680990f470552e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 08:02:56 +0200
Subject: [PATCH 128/458] Updated some traits functions.

---
 src/jace/util/__init__.py |  2 ++
 src/jace/util/traits.py   | 20 +++++++++++---------
 2 files changed, 13 insertions(+), 9 deletions(-)

diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index b1f9255..11469fc 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -20,6 +20,7 @@
     translate_dtype,
 )
 from .traits import (
+    is_array,
     is_drop_var,
     is_fully_addressable,
     is_jaceified,
@@ -41,6 +42,7 @@
     "as_sequence",
     "compile_jax_sdfg",
     "dataclass_with_default_init",
+    "is_array",
     "is_drop_var",
     "is_tracing_ongoing",
     "is_jaceified",
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 91def43..779a8dd 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -82,22 +82,24 @@ def is_jax_array(
     return all(hasattr(obj, x) for x in ["sharding", "is_fully_addressable"])
 
 
-def is_on_device(
+def is_array(
     obj: Any,
 ) -> bool:
-    """Tests if `obj` is on a device.
+    """Identifies arrays, this also includes Jax arrays."""
+    if is_jax_array(obj):
+        return True
+    return dace.is_array(obj)
 
-    The function will recognize and correctly handle `JaCeVar` objects.
-    """
-    if isinstance(obj, util.JaCeVar):
-        return obj.storage in [dace.StorageType.GPU_Global, dace.StorageType.GPU_Shared]
 
+def is_on_device(
+    obj: Any,
+) -> bool:
+    """Tests if `obj` is on a device."""
     # The problem is, that we can not test if `__cuda_array_interface__` exists.
     #  because Jax array have that even on CPU, thus it is a bit mnore complex.
-    # TODO(phimuell): Hip
     if is_jax_array(obj):
-        obj = obj.__array__()
-    return hasattr(obj, "__cuda_array_interface__")
+        obj = obj.__array__(copy=False)
+    return dace.is_gpu_array(obj)
 
 
 def is_fully_addressable(

From 311f1f6bf7ac1fc4065955ad02e839c048bad56a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 08:19:25 +0200
Subject: [PATCH 129/458] Updated the cache implementation.

It no longer builds on the `JaCeVar` but makes it itself.
This commit also introduces the ability to cache the compiled result.

However, IT IS NOT TESTED!
---
 src/jace/jax/stages/jace_compiled.py |   1 +
 src/jace/jax/stages/jace_lowered.py  |  22 +++--
 src/jace/jax/stages/jace_wrapped.py  |   2 +-
 src/jace/util/translation_cache.py   | 136 +++++++++++++--------------
 4 files changed, 82 insertions(+), 79 deletions(-)

diff --git a/src/jace/jax/stages/jace_compiled.py b/src/jace/jax/stages/jace_compiled.py
index 5d4e888..7b7e089 100644
--- a/src/jace/jax/stages/jace_compiled.py
+++ b/src/jace/jax/stages/jace_compiled.py
@@ -35,6 +35,7 @@ class JaceCompiled(stages.Stage):
     _csdfg: jdace.CompiledSDFG  # The compiled SDFG object.
     _inp_names: tuple[str, ...]  # Name of all input arguments.
     _out_names: tuple[str, ...]  # Name of all output arguments.
+    # TODO(phimuell): Also store description of output, such that we do not have to rely on internal sdfg.
 
     def __init__(
         self,
diff --git a/src/jace/jax/stages/jace_lowered.py b/src/jace/jax/stages/jace_lowered.py
index e3475be..581cefe 100644
--- a/src/jace/jax/stages/jace_lowered.py
+++ b/src/jace/jax/stages/jace_lowered.py
@@ -14,15 +14,19 @@
 
 from jace import translator, util
 from jace.jax import stages
-from jace.util import dace_helper as jdace
+from jace.util import dace_helper as jdace, translation_cache as tcache
 
 
 class JaceLowered(stages.Stage):
     """Represents the original computation that was lowered to SDFG."""
 
-    __slots__ = ("_translated_sdfg",)
+    __slots__ = (
+        "_translated_sdfg",
+        "_cache",
+    )
 
     _translated_sdfg: translator.TranslatedJaxprSDFG
+    _cache: tcache.TranslationCache
 
     def __init__(
         self,
@@ -34,10 +38,11 @@ def __init__(
         if translated_sdfg.out_names is None:
             raise ValueError("Output names must be defined.")
         self._translated_sdfg = translated_sdfg
+        self._cache: tcache.TranslationCache = tcache.get_cache(self)
 
     def optimize(
         self,
-        **kwargs: Any,  # noqa: ARG002  # Unused agument
+        **kwargs: Any,  # noqa: ARG002  # Unused argument
     ) -> JaceLowered:
         """Perform optimization _inplace_ and return `self`.
 
@@ -46,6 +51,7 @@ def optimize(
         """
         return self
 
+    @tcache.cached_translation
     def compile(
         self,
         compiler_options: stages.CompilerOptions | None = None,  # noqa: ARG002  # Unused arguments
@@ -54,15 +60,11 @@ def compile(
 
         Returns an Object that encapsulates a
         """
-        csdfg: jdace.CompiledSDFG = util.compile_jax_sdfg(
-            self._translated_sdfg,
-            force=True,
-            save=False,
-        )
+        csdfg: jdace.CompiledSDFG = util.compile_jax_sdfg(self._translated_sdfg)
         return stages.JaceCompiled(
             csdfg=csdfg,
-            inp_names=self._translated_sdfg.inp_names,  # type: ignore[arg-type]  # init guarantees this
-            out_names=self._translated_sdfg.out_names,  # type: ignore[arg-type]
+            inp_names=self._translated_sdfg.inp_names,
+            out_names=self._translated_sdfg.out_names,
         )
 
     def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
diff --git a/src/jace/jax/stages/jace_wrapped.py b/src/jace/jax/stages/jace_wrapped.py
index 72a5971..526b165 100644
--- a/src/jace/jax/stages/jace_wrapped.py
+++ b/src/jace/jax/stages/jace_wrapped.py
@@ -51,7 +51,7 @@ def __init__(
         """Creates a wrapped jace jitable object of `jax_prim`."""
         assert fun is not None
         self._fun: Callable = fun
-        self._cache: tcache.TranslationCache = tcache.get_cache("lowering")
+        self._cache: tcache.TranslationCache = tcache.get_cache(self)
 
     def __call__(
         self,
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 057507b..2ca78dc 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -30,7 +30,7 @@
 
 
 def get_cache(
-    name: str,
+    self: stages.Stage,
     size: int = 128,
 ) -> TranslationCache:
     """Returns the cache associated to `name`.
@@ -40,15 +40,14 @@ def get_cache(
     """
     # Get the caches and if not present, create them.
     if not hasattr(get_cache, "_caches"):
-        _caches: dict[str, TranslationCache] = {}
-        _caches["lowering"] = TranslationCache(size=size)
-        _caches["compiling"] = TranslationCache(size=size)
+        _caches: dict[type[stages.Stage], TranslationCache] = {}
         get_cache._caches = _caches  # type: ignore[attr-defined]  # ruff removes the `getattr()` calls
     _caches = get_cache._caches  # type: ignore[attr-defined]
 
-    if name not in _caches:
-        raise ValueError(f"The cache '{name}' is unknown.")
-    return _caches[name]
+    if type(self) not in _caches:
+        _caches[type(self)] = TranslationCache(size=size)
+
+    return _caches[type(self)]
 
 
 def cached_translation(
@@ -62,86 +61,69 @@ def _action_wrapper(
         *args: Any,
         **kwargs: Any,
     ) -> stages.Stage:
-        assert hasattr(self, "_cache")
+        assert hasattr(self, "_cache"), f"Type '{type(self).__name__}' does not have `_cache`."
         cache: TranslationCache = self._cache
-        key: _CacheKey = self.make_key(self, *args, **kwargs)
+        key: _CacheKey = cache.make_key(self, *args, **kwargs)
         if cache.has(key):
             return cache.get(key)
-
-        next_stage: stages.Stage = action(*args, **kwargs)
+        next_stage: stages.Stage = action(self, *args, **kwargs)
         cache.add(key, next_stage)
         return next_stage
 
     return _action_wrapper
 
 
-@util.dataclass_with_default_init(init=True, repr=True, frozen=True, slots=True)
-class _JaCeVarWrapper:
-    """Wrapper class around `JaCeVar` for use in `_CacheKey`.
-
-    It essentially makes the hash depend on the content, with the exception of name.
-    """
-
-    _slots__ = ("var", "_hash")
-    var: util.JaCeVar
-    _hash: int
-
-    def __init__(self, var: util.JaCeVar) -> None:
-        _hash: int = hash((var.shape, var.dtype, var.storage))
-        if var.name != "":
-            raise ValueError("Key can not have a name.")
-        self.__default_init__(var=var, _hash=_hash)  # type: ignore[attr-defined]
+@dataclass(init=True, eq=True, frozen=True)
+class _AbstarctCallArgument:
+    """Class to represent the call arguments used in the cache."""
 
-    def __hash__(self) -> int:
-        return self._hash
-
-    def __eq__(self, other: Any) -> bool:
-        if not isinstance(other, _JaCeVarWrapper):
-            return NotImplemented
-        return (self.var.shape, self.var.dtype, self.var.storage) == (
-            other.var.shape,
-            other.var.dtype,
-            other.var.storage,
-        )
+    shape: tuple[int, ...] | tuple[()]
+    dtype: dace.typeclass
+    strides: tuple[int, ...] | tuple[()] | None
+    storage: dace.StorageType
 
     @classmethod
     def from_value(
         cls,
         val: Any,
-    ) -> _JaCeVarWrapper:
-        """Returns a `JaCe` variable constructed from `val`.
-
-        If `val` is on the device, its storage type will be `GPU_Global` otherwise the default.
+    ) -> _AbstarctCallArgument:
+        """Construct an `_AbstarctCallArgument` from a value.
 
         Todo:
             Improve, such that NumPy arrays are on CPU, CuPy on GPU and so on.
+            This function also probably fails for scalars.
         """
         if not util.is_fully_addressable(val):
             raise NotImplementedError("Distributed arrays are not addressed yet.")
+        if isinstance(val, jax_core.Literal):
+            raise TypeError("Jax Literals are not supported as cache keys.")
 
-        if isinstance(val, util.JaCeVar):
-            return cls(var=val)
+        # TODO(phimuell): is `CPU_Heap` okay?
 
-        # Define the storage as given by on device.
-        storage: dace.StorageType | None = (
-            dace.StorageType.GPU_Global if util.is_on_device(val) else None
-        )
+        if util.is_array(val):
+            if util.is_jax_array(val):
+                val = val.__array__(copy=False)
+            shape = val.shape
+            dtype = util.translate_dtype(val.dtype)
+            strides = getattr(val, "strides", None)
+            storage = (
+                dace.StorageType.GPU_Global if util.is_on_device(val) else dace.StorageType.CPU_Heap
+            )
 
-        if isinstance(val, jax_core.Var):
-            val = val.aval
-        if isinstance(val, jax_core.Literal):
-            raise TypeError("Jax Literals are not supported as cache keys.")
+            return cls(shape=shape, dtype=dtype, strides=strides, storage=storage)
 
-        # We need at least a shaped array
         if isinstance(val, jax_core.ShpedArray):
-            return cls(
-                util.JaCeVar(
-                    name="",
-                    shape=val.aval.shape,
-                    dtype=val,
-                    storage=storage,
-                ),
+            shape = val.aval.shape
+            dtype = val.aval.dtype
+            strides = None
+            storage = (
+                dace.StorageType.GPU_Global
+                if util.is_on_device(val.val)
+                else dace.StorageType.CPU_Heap
             )
+
+            return cls(shape=shape, dtype=dtype, strides=strides, storage=storage)
+
         if isinstance(val, jax_core.AbstractValue):
             raise TypeError(f"Can not make 'JaCeVar' from '{type(val).__name__}', too abstract.")
 
@@ -154,15 +136,14 @@ def from_value(
 class _CacheKey:
     """Wrapper around the arguments"""
 
-    __slots__ = ("fun", "sdfg_hash", "vars", "_hash")
-
     # Note that either `_fun` or `_sdfg_hash` are not `None`.
+    # TODO(phimuell): Static arguments.
     fun: Callable | None
     sdfg_hash: int | None
-    fargs: tuple[_JaCeVarWrapper, ...]
+    fargs: tuple[_AbstarctCallArgument, ...] | tuple[tuple[str, Any], ...]
 
     @classmethod
-    def Create(
+    def make_key(
         cls,
         stage: stages.Stage,
         *args: Any,
@@ -175,14 +156,33 @@ def Create(
         if isinstance(stage, stages.JaceWrapped):
             fun = stage.__wrapped__
             sdfg_hash = None
+            fargs: Any = tuple(  # Any is here to prevent typeconfusion in mypy.
+                _AbstarctCallArgument.from_value(x) for x in args
+            )
+
         elif isinstance(stage, stages.JaceLowered):
             fun = None
-            sdfg_hash = int(stage.compiler_ir().sdfg.hash_sdfg, 16)
+            sdfg_hash = int(stage.compiler_ir().sdfg.hash_sdfg(), 16)
+
+            # In this mode the inputs are compiler options, which are encapsulated in
+            #  `CompilerOptions` (aka. `dict`), or it is None.
+            assert len(args) <= 1
+            comp_ops: stages.CompilerOptions = (
+                stages.CompilerOptions() if len(args) == 0 else args[0]
+            )
+            assert isinstance(comp_ops, dict)
+
+            # Make `(argname, value)` pairs and sort them to get a concrete key
+            fargs = tuple(
+                sorted(
+                    ((k, v) for k, v in comp_ops.items()),
+                    key=lambda X: X[0],
+                )
+            )
+
         else:
             raise TypeError(f"Can not make key from '{type(stage).__name__}'.")
 
-        fargs = tuple(_JaCeVarWrapper.from_value(x) for x in args)
-
         return cls(fun=fun, sdfg_hash=sdfg_hash, fargs=fargs)
 
 
@@ -219,7 +219,7 @@ def make_key(
         """Create a key object for `stage`."""
         if len(kwargs) != 0:
             raise NotImplementedError
-        return _CacheKey.Create(stage, *args, **kwargs)
+        return _CacheKey.make_key(stage, *args, **kwargs)
 
     def has(
         self,

From 9930cdb153ec9e7754279fbed5838ace8c4fc9a8 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 10:53:02 +0200
Subject: [PATCH 130/458] Updated the translator interfaces.

This commit fixes some import errors, but it also marks the `out_var_names` argument of the translator function as `MutableSequence`.
This is because it is explicitly allowed to modify it.
---
 .../sub_translators/a_primitive_translator.py | 45 ++++++++-----------
 .../sub_translators/alu_translator.py         |  7 +--
 2 files changed, 23 insertions(+), 29 deletions(-)

diff --git a/src/jace/translator/sub_translators/a_primitive_translator.py b/src/jace/translator/sub_translators/a_primitive_translator.py
index 16d2d4b..a1f34e6 100644
--- a/src/jace/translator/sub_translators/a_primitive_translator.py
+++ b/src/jace/translator/sub_translators/a_primitive_translator.py
@@ -16,15 +16,13 @@
 from __future__ import annotations
 
 from abc import abstractmethod
-from collections.abc import Sequence
-from typing import TYPE_CHECKING, Any, Protocol, runtime_checkable
+from collections.abc import MutableSequence, Sequence
+from typing import Any, Protocol, runtime_checkable
 
 import dace
 from jax import core as jax_core
 
-
-if TYPE_CHECKING:
-    from .jaxpr_translator_driver import JaxprTranslationDriver
+from jace import translator
 
 
 @runtime_checkable
@@ -71,9 +69,9 @@ def primitive(self) -> str | Sequence[str]:
     @abstractmethod
     def translate_jaxeqn(
         self,
-        driver: JaxprTranslationDriver,
+        driver: translator.JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
+        out_var_names: MutableSequence[str],
         eqn: jax_core.JaxprEqn,
         eqn_state: dace.SDFGState,
     ) -> dace.SDFGState | None:
@@ -94,25 +92,20 @@ def translate_jaxeqn(
             `eqn_state` argument. This state is guaranteed to be empty and
             `translator.get_terminal_sdfg_state() is eqn_state` holds.
 
-        Then the subtranslator is called. Usually a subtranslator should
-        construct the dataflow graph inside `eqn_state`. It is allowed that the
-        subtranslators creates more states if needed, but this state machine
-        has to have a single terminal state, which must be returned
-        and reachable from `eqn_state`.
-        If the function returns `None` the driver will assume that
-        subtranslator was able to fully construct the dataflow graph
-        within `eqn_state`.
-
-        While a subtranslator is forbidden from meddling with the input
-        variables mentioned in `in_var_names` in any way, it is allowed to
-        modify the output variables. For example he could create a new
-        SDFG variable, with different strides. But in that case the
-        subtranslator must update the internal mapping of the driver TBA HOW,
-        and modify the mapping in `out_var_names`.
-        However, the subtranslator is allowed to create internal temporary
-        variables. It just have to ensure that no name collision will occur,
-        a way to do this is to use a passed variable name as prefix.
-
+        Then the subtranslator is called.
+        Usually a subtranslator should construct the dataflow graph inside `eqn_state`.
+        It is allowed that the subtranslators creates more states if needed, but this state machinery
+        has to have a single terminal state, which must be returned and reachable from `eqn_state`.
+        If the function returns `None` the driver will assume that subtranslator was able to
+        fully construct the dataflow graph within `eqn_state`.
+
+        While a subtranslator is forbidden from meddling with the input variables mentioned in
+        `in_var_names` in any way, it is allowed to modify the output variables.
+        For example it could create a new SDFG variable, with different strides.
+        But in that case the subtranslator must update the internal mapping of the driver TBA HOW,
+        and modify the mapping specified by `out_var_names`.
+        However, the subtranslator is allowed to create internal temporary variables.
+        It just have to ensure that no name collision will occur, a way to do this is to use a passed variable name as prefix.
 
         Args:
             driver:         The driver object of the translation.
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index f397bb3..8cc2466 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -9,7 +9,7 @@
 
 from __future__ import annotations
 
-from collections.abc import Sequence
+from collections.abc import MutableSequence, Sequence
 from typing import Any, Final, cast
 
 import dace
@@ -17,6 +17,7 @@
 from jax import core as jax_core
 from typing_extensions import override
 
+from jace import translator
 from jace.translator import sub_translators
 
 
@@ -91,9 +92,9 @@ def primitive(self) -> Sequence[str]:
     @override
     def translate_jaxeqn(
         self,
-        driver: sub_translators.JaxprTranslationDriver,
+        driver: translator.JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
+        out_var_names: MutableSequence[str],
         eqn: jax_core.JaxprEqn,
         eqn_state: dace.SDFGState,
     ) -> None:

From bb4a3a3620ea1beaa13efa2f871d3b1c31dab6cd Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 11:03:17 +0200
Subject: [PATCH 131/458] First update to the driver.

This is just a first step in the update process.
- "Simplifies" the `add_array()` function.
- Makes some changes to the general structure of the code, i.e. "Simplifies"
- Make `JaxprTranslatorDriver._ctx` a property.
- Updates some tests.

Todo:
- Unify return value, i.e. translated Jaxpr, and inner context.
---
 pyproject.toml                                |   1 +
 .../translator/jaxpr_translator_driver.py     | 323 +++++++-----------
 tests/test_jaxpr_translator_driver.py         | 144 ++++----
 tests/test_sub_translators_alu.py             |  15 +-
 4 files changed, 218 insertions(+), 265 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index ad44121..a2a1a90 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -152,5 +152,6 @@ section-order = [
 "tests/**" = [
   "T10",
   "T20",  # Ignore `flake8-debugger` and `flake8-print`
+  "F841",  # Ignore assigned but not used; inside `with` to test if throw.
   "RUF018"  # Ignore assignment in `assert`s; for printing
 ]
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 92ca8be..7d2012f 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -8,7 +8,7 @@
 from __future__ import annotations
 
 import itertools
-from collections.abc import Collection, Iterable, Mapping, Sequence
+from collections.abc import Collection, Iterable, Mapping, MutableSequence, Sequence
 from typing import Any, Final, cast, overload
 
 import dace
@@ -54,7 +54,6 @@ class JaxprTranslationDriver:
 
     __slots__ = (
         "_ctx_stack",  # Stack of all contexts
-        "_ctx",  # Current top of the context stack.
         "_reserved_names",  # Part of the context, but is copied.
         "_sub_translators",
         "_rev_manager",
@@ -98,7 +97,6 @@ def __init__(
         # Context stack and current context.
         #  Only allocated during an ongoing translation
         self._ctx_stack: list[_TranslationContext] = []
-        self._ctx: _TranslationContext = None  # type: ignore[assignment]
 
         # Creating of the subtranslators.
         self._init_sub_translators(kwargs)
@@ -261,22 +259,18 @@ def map_jax_var_to_sdfg(
 
     def map_jax_var_to_sdfg(
         self,
-        jax_var: str | jax_core.Atom | util.JaCeVar,
+        jax_var: jax_core.Atom | util.JaCeVar,
         allow_fail: bool = False,
     ) -> str | None:
         """Get the _name_ of the SDFG variable to which `jax_var` is referring to.
 
-        For convenient this function will consider a string as input to be already an SDFG variable name.
-
         Args:
             jax_var:        The Jax variable to look up.
             allow_fail:     If mapping is not known return `None` instead of raise `KeyError`.
         """
-        if isinstance(jax_var, str):
-            sdfg_name: str = jax_var
-        elif isinstance(jax_var, jax_core.Literal):
+        if isinstance(jax_var, jax_core.Literal):
             raise RuntimeError("There is no SDFG variable for literal '{jax_var}'.")
-        elif jax_var in self._ctx.jax_name_map:
+        if jax_var in self._ctx.jax_name_map:
             sdfg_name = self._ctx.jax_name_map[jax_var]
         elif allow_fail:
             return None
@@ -310,11 +304,8 @@ def is_allocated(self) -> bool:
 
         If `self` is allocated then there is also an ongoing translation process.
         """
-        assert isinstance(self._sub_translators, dict)
-        if self._ctx is not None:
-            assert self._ctx_stack[-1] is self._ctx
+        if len(self._ctx_stack) != 0:
             return True
-        assert len(self._ctx_stack) == 0  # type: ignore[unreachable]
         return False
 
     def is_root_translator(self) -> bool:
@@ -383,12 +374,6 @@ def add_reserved_names(
             pass
         else:
             raise TypeError(f"Does not know how to handle the type '{type(reserved_names)}'.")
-        for rev_name in reserved_names:
-            assert isinstance(rev_name, str)
-            if not util.VALID_SDFG_VAR_NAME.fullmatch(rev_name):
-                raise ValueError(
-                    f"Can not use '{rev_name}' as reserved name as it is not a valid SDFG name."
-                )
         self._reserved_names.update(reserved_names)
         return self
 
@@ -399,42 +384,31 @@ def add_array(
         as_transient: bool = True,
         alt_name: str | None = None,
         name_prefix: str | None = None,
+        find_new_name: bool | None = None,
         force_array: bool = False,
-        as_view: bool = False,
         strides: Sequence[int | dace.symbol | str] | None = None,
-        symb_strides: bool | None = None,
-        find_new_name: bool | None = None,
         allow_literals: bool = False,
         force_jax_name: bool = False,
         update_var_mapping: bool = False,
     ) -> str:
         """Creates an SDFG variable for the Jax variable `arg` and returns its SDFG name.
 
-        By default the function will create a transient, use `as_transient` to
-        change that. By default the function will honor if the Jax variable is
-        a scalar or an array. However, by setting `force_array` the function
-        will always generate an array.
+        By default the function will create a transient, use `as_transient=True` to change that.
+        By default the function will honor if the Jax variable is a scalar or an array.
+        However, by setting `force_array` the function will always generate an array.
 
         By default the name for the SDFG variable is derived from the Jax variable.
-        It is guaranteed that this name is unique in the SDFG, even in the presence
-        of nested SDFGs. By specifying `alt_name` it is possible to force a certain
-        name on a variable. It is important that if `alt_name` is specified the function
-        will either generate the variable or fail.
+        It is guaranteed that this name is unique in the SDFG, even in the presence of nested SDFGs.
+        By specifying `alt_name` it is possible to force a certain name on a variable.
+        It is important that if `alt_name` is specified the function will either generate the variable or fail.
 
         The  driver distinguishes between two kinds of "bad (SDFG) variable names".
         The first category are the forbidden names, which the function refuses to generate.
-        The second type are the so called reserved names, which were set at the beginning.
-        These names can be used if they are specified through `alt_name` but are not used
-        in automatic naming.
-
-        If nothing is specified, the strides of the data are determined by DaCe, which is
-        continuous C order. There are two ways to change that.
-        The first way is to specify the `strides` argument, which are then forwarded
-        to the underlying DaCe function. The second way is to set `symb_strides`
-        to `True` in which case the function will generate symbols and use them.
-        However, even if symbolic strides are activated, arrays with just one
-        dimensions have always a non symbolic stride of 1. Furthermore, dimensions
-        with shape 1 will always have stride 0.
+        The second type are the so called reserved names, which were set at the beginning, or by `self.add_reserved_names()`.
+        These names can be used if the name is specified through `alt_name` but are not used in automatic naming.
+
+        If nothing is specified, the strides of the data are determined by DaCe, which is continuous C order.
+        It is possible to set a certain values by setting `strides` appropriate.
 
         By default this function does not update the internal variable map.
         However, by setting `update_var_mapping` to `True` the function will
@@ -445,14 +419,9 @@ def add_array(
             as_transient:       If set, the SDFG variable is a transient, `True` by default.
             alt_name:           Try to create the variable with this name; either succeed or fail.
             name_prefix:        If given and in automatic naming mode, add this prefix to the name.
+            find_new_name:      The translator will try to find a new name if the designated is already occupied.
             force_array:        Instead of a `dace.Scalar` create a `dace.Array` with one element.
-            as_view:            Creates a view instead of an array, if it is a scalar
-                                    it is silently ignored.
             strides:            Instead of the default strides use these values.
-            symb_strides:       Create symbols and use them for fully symbolic strides.
-            find_new_name:      The translator will try to find a new name if the designated
-                                    is already occupied. This does not work if the name
-                                    was supplied by `alt_name`.
             allow_literals:     If `True` then also allows JaxLiterals as `arg`.
             force_jax_name:     If `True` then, the verbatim Jax name will be used.
             update_var_mapping: Update the internal variable mapping; by default `False`.
@@ -460,13 +429,6 @@ def add_array(
         Notes:
             If this function is used directly a user is advised to always set
                 `update_var_mapping` to `True`.
-            If `find_new_name` is `None` the default, the function will only
-                look for a new name if there is a need for it. If it is `True`
-                the function will always look for a new name, even if the initial
-                name was fine. If it is `False` the function will never look for
-                a new new, thus if the name is unavailable an error is generated.
-                However, this excluds variable names that are known.
-            Specifying `alt_name` implies `find_new_name=False`.
             If you need to create a special array, you can use `jace.util.JaCeVar`
                 to create a pseudo Jax variable.
         """
@@ -483,7 +445,7 @@ def add_array(
             #  a variable for a second time. It is, however, okay to use one as template,
             #  if another name is specified from the beginning.
             raise ValueError(
-                f"Tried to create variable '{arg}' again, without specifying an alternative name.."
+                f"Tried to create variable '{arg}' again, without specifying an alternative name."
             )
         if force_jax_name:
             if alt_name is not None:
@@ -494,11 +456,12 @@ def add_array(
                 raise ValueError(
                     f"Specified 'force_jax_name', but passed '{name_prefix}' as 'name_prefix'."
                 )
+            if find_new_name:
+                raise ValueError("Specified `force_jax_name` but also wanted a new name.")
+            find_new_name = False
             alt_name = util._propose_jax_name(arg, self._ctx.jax_name_map)
         if alt_name is not None:
-            assert isinstance(
-                alt_name, str
-            ), f"Got '{type(alt_name)}' instead of 'str' for 'alt_name'."
+            assert isinstance(alt_name, str)
             find_new_name = False  # If a name was given, then use it no matter what.
             if len(alt_name) == 0:
                 raise ValueError("Passed an empty 'alt_name'.")
@@ -506,32 +469,30 @@ def add_array(
                 raise ValueError("'alt_name' is a forbidden name.")
             if not util.VALID_SDFG_VAR_NAME.fullmatch(alt_name):
                 raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
+            if update_var_mapping and arg in self._ctx.jax_name_map:
+                raise ValueError(f"Variable '{alt_name}' already registered.")
+            if alt_name in self._ctx.sdfg.arrays:
+                raise ValueError(f"Variable '{alt_name}' already exists.")
             if name_prefix is not None:
                 raise ValueError(
                     f"Specified 'name_prefix' ('{name_prefix}') but passed '{alt_name}' as 'alt_name'."
                 )
-            if alt_name in self._ctx.sdfg.arrays:
-                raise ValueError(f"Variable '{alt_name}' already exists.")
         if name_prefix is not None:
             assert isinstance(name_prefix, str)
             if len(name_prefix) == 0:
                 raise ValueError("Specified an empty 'name_prefix'.")
-        if as_view and (not as_transient):
-            raise ValueError("You tried to create a global view, which is not allowed.")
 
         # Checking the strides.
-        if (symb_strides is None) and (strides is None):
-            def_symb_stride = False  # default value for symbolic strides
-            symb_strides = False if (len(shape) <= 1) else def_symb_stride  # Keep for the future
-        elif (symb_strides is not None) and (strides is not None):
-            raise ValueError("Specified 'symb_strides' and 'stride at the same time.")
-        elif strides is not None:
+        if strides is not None:
+            if is_scalar:
+                raise ValueError("Specified a stride for a scalar.")
+            if isinstance(strides, (str, dace.symbol, int)):
+                strides = (strides,)
+            assert isinstance(strides, tuple)
             if len(strides) != len(shape):
                 raise ValueError(
                     f"'strides' has length {len(strides)}, but array rank is {len(shape)}."
                 )
-        else:
-            assert isinstance(symb_strides, bool)
 
         # Now we determine the proposed name of the variable.
         #  Depending on the situation, we will further manipulate it.
@@ -539,20 +500,17 @@ def add_array(
             prop_name = alt_name  # Just for completion: will be ignored later
         elif isinstance(arg, (jax_core.Var, util.JaCeVar)):
             prop_name = util._propose_jax_name(arg, self._ctx.jax_name_map)
-            if prop_name.startswith("__"):
-                raise ValueError(
-                    f"You tried to create the variable '{prop_name}' which"
-                    "starts with two underscores, use 'alt_name' for that."
-                )
+            assert not prop_name.startswith("__")
             if name_prefix is not None:
                 prop_name = name_prefix + prop_name
         elif isinstance(arg, jax_core.Literal):  # type: ignore[unreachable]
-            if not allow_literals:
+            if not allow_literals:  # Allows to use a literal as template.
                 raise NotImplementedError("Jax Literals are not supported.")
             if alt_name is None:
                 raise ValueError(f"Passed literal '{arg}', but not specified a name to use.")
         else:
             raise TypeError(f"Does not know how to handle '{type(arg).__name__}'.")
+
         if alt_name is None:
             # If we are the root translator, then we will use `prop_name` directly;
             #  otherwise we will append the revision of `self` to the name.
@@ -560,6 +518,7 @@ def add_array(
                 "" if self.is_root_translator() else f"_rev_idx{self._ctx.rev_idx}"
             )
         else:
+            # Use the supplied name directly.
             arg_name = str(alt_name)
 
         # Determine if we should look for a new name or not, if nothing was specified
@@ -567,10 +526,10 @@ def add_array(
             if arg_name in self._reserved_names:
                 find_new_name = True
             if arg_name in self._forbidden_names:
+                # This is not an error, but happens if we handle Jax variable `if`.
                 find_new_name = True
 
         if find_new_name:
-            # We have to find a new name.
             name_tmpl = "_jax_variable__" + arg_name + "__{}"
             for iCounter in range(1000):
                 _arg_name = name_tmpl.format(iCounter)
@@ -597,34 +556,13 @@ def add_array(
         # Promotion of scalar to array.
         if is_scalar and force_array:
             shape = (1,)
-            symb_strides = False
             strides = None
             is_scalar = False
 
-        # Set the stride if we have to change.
-        if strides is not None:
-            strides = tuple(strides)
-            assert len(strides) == len(shape)
-
-        elif (symb_strides is True) and (not is_scalar):
-            strides = [
-                dace.symbol(f"{arg_name}_stride{dim}", dace.int64) if size >= 2 else 0
-                for dim, size in enumerate(shape)
-            ]
-
         if is_scalar:
             self._ctx.sdfg.add_scalar(
                 name=arg_name, storage=storage, dtype=dtype, transient=as_transient
             )
-        elif as_view:
-            self._ctx.sdfg.add_view(
-                name=arg_name,
-                shape=shape,
-                strides=strides,
-                offset=offset,
-                storage=storage,
-                dtype=dtype,
-            )
         else:
             self._ctx.sdfg.add_array(
                 name=arg_name,
@@ -641,7 +579,27 @@ def add_array(
 
         return arg_name
 
+    @overload
     def create_jax_var_list(
+        self,
+        jax_var_list: Sequence[jax_core.Atom | util.JaCeVar],
+        prevent_creation: bool = False,
+        only_creation: bool = True,
+        handle_literals: bool = False,
+        **kwargs: Any,
+    ) -> list[str]: ...
+
+    @overload
+    def create_jax_var_list(  # type: ignore[misc]
+        self,
+        jax_var_list: Sequence[jax_core.Atom | util.JaCeVar],
+        prevent_creation: bool = False,
+        only_creation: bool = False,
+        handle_literals: bool = False,
+        **kwargs: Any,
+    ) -> list[None | str]: ...
+
+    def create_jax_var_list(  # type: ignore[misc]
         self,
         jax_var_list: Sequence[jax_core.Atom | util.JaCeVar],
         prevent_creation: bool = False,
@@ -655,7 +613,7 @@ def create_jax_var_list(
         If no SDFG variable is known the function will create one using `add_array()`, with `update_var_mapping` set to `True`.
 
         By setting `prevent_creation` the function will not create any new SDFG variables.
-        This mode is used to indicate that all variables already have to exists already.
+        This mode is used to indicate that all variables have to exists already.
         By setting `only_creation` the function will only create new SDFG variables.
         If a Jax variable already has a known SDFG equivalent an error is generated.
 
@@ -692,7 +650,7 @@ def create_jax_var_list(
                     raise ValueError(f"'only_creation' given '{jax_var}' already exists.")
                 else:
                     sdfg_name = mapped_sdfg_name
-                # `add_jax_name_mapping` is save, because if the mapping does already exists it is a no ops.
+                # Calling `add_jax_name_mapping` is save, because if the mapping does already exists it is a no ops.
                 self.add_jax_name_mapping(jax_var, sdfg_name)
             else:
                 raise TypeError(f"Does not know how to handle '{type(jax_var).__name__}'")
@@ -727,7 +685,7 @@ def _create_initial_input(
 
         # Handle the initial input arguments
         sdfg: dace.SDFG = self._ctx.sdfg
-        init_in_var_names: Sequence[str] = self.create_jax_var_list(  # type: ignore[assignment]
+        init_in_var_names: Sequence[str] = self.create_jax_var_list(
             jax_var_list=jaxpr.jaxpr.invars,
             only_creation=True,
             as_transient=True,  # Explicit transient; no error!
@@ -736,10 +694,10 @@ def _create_initial_input(
             force_jax_name=self.is_root_translator(),  # Ensure root get pure Jax names.
         )
         # This forces the code to only accept kwargs
+        #  Is also part of "what a canonical sdfg" is.
         sdfg.arg_names = []
 
-        # Store the list of inputs in self; this is done to simplify exporting.
-        #  The output list is populated by `self._translate_jaxpr_internal()`
+        # The output list is populated by `self._translate_jaxpr_internal()`
         self._ctx.inp_names = tuple(init_in_var_names)
 
         return init_in_var_names
@@ -760,25 +718,22 @@ def _create_constants(
 
         if not self.is_allocated():
             raise RuntimeError("Driver is not allocated, can not create constants.")
-        if not len(jaxpr.consts):
+        if len(jaxpr.consts) == 0:
             return []
 
-        const_names: list[str] = []
-        for cJaxVar, cValue in zip(jaxpr.jaxpr.constvars, jaxpr.consts, strict=False):
-            c_sdfg_name = self.add_array(
-                arg=cJaxVar,
-                name_prefix="__const_",
-                as_transient=True,
-                symb_strides=False,
-                strides=None,
-                update_var_mapping=True,
-            )
+        sdfg_const_names: Sequence[str] = self.create_jax_var_list(
+            jax_var_list=jaxpr.jaxpr.constvars,
+            only_creation=True,
+            strides=None,
+            name_prefix="__const_",
+        )
+
+        for sdfg_name, const_value in zip(sdfg_const_names, jaxpr.consts, strict=True):
             # We have to pass the data descriptor to `add_constant()`, otherwise a new one would be created.
             self._ctx.sdfg.add_constant(
-                c_sdfg_name, deepcopy(cValue), self._ctx.sdfg.arrays[c_sdfg_name]
+                sdfg_name, deepcopy(const_value), self._ctx.sdfg.arrays[sdfg_name]
             )
-            const_names.append(c_sdfg_name)
-        return const_names
+        return sdfg_const_names
 
     def _allocate_translation_ctx(
         self,
@@ -798,11 +753,12 @@ def _allocate_translation_ctx(
         from ._translation_context import _TranslationContext
 
         # Create a new translation context and put it on the stack.
-        self._ctx = _TranslationContext(
-            rev_idx=next(self._rev_manager),
-            name=name,
+        self._ctx_stack.append(
+            _TranslationContext(
+                rev_idx=next(self._rev_manager),
+                name=name,
+            )
         )
-        self._ctx_stack.append(self._ctx)
 
         if self.is_root_translator():
             # The root translation, i.e. the very first context allocation
@@ -818,6 +774,12 @@ def _allocate_translation_ctx(
 
         return self
 
+    @property
+    def _ctx(self) -> _TranslationContext:
+        """Returns the currently active translation context."""
+        assert len(self._ctx_stack) != 0, "No context is active."
+        return self._ctx_stack[-1]
+
     def _init_sub_translators(
         self,
         subtrans_args: Mapping[str, Any],
@@ -839,7 +801,7 @@ def _init_sub_translators(
 
             for handled_primitive in handled_primitives:
                 if handled_primitive in prim_translators:
-                    raise RuntimeError(f"Multiple sub translators for '{handled_primitive}' found.")
+                    raise RuntimeError(f"Multiple translators for '{handled_primitive}' found.")
                 prim_translators[handled_primitive] = prim_translator
         self._sub_translators = prim_translators
 
@@ -849,7 +811,7 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
         """This function deallocate the translation context of `self`.
 
         Notes:
-            While it is allowed for outside code to call this explicitly function,
+            While it is allowed for outside code to call this function explicit
                 it is is most likely an error.
             If `self` is not allocated this function acts as a noops.
             The reserved names are only deallocated if `self` is a root translator.
@@ -857,19 +819,14 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
         if not self.is_allocated():
             return self
 
-        assert self._ctx is self._ctx_stack[-1], "Inconsistent stack detected."
         if self.is_root_translator():
             self._rev_manager = itertools.count(0, 1)
             self._reserved_names = None  # type: ignore[assignment]
-
-            self._ctx = None  # type: ignore[assignment]
             self._ctx_stack.pop()
 
         else:
             # Restore the previous state
-            assert len(self._ctx_stack) > 1
             self._ctx_stack.pop()
-            self._ctx = self._ctx_stack[-1]
         return self
 
     def _find_sub_translator_for(
@@ -877,8 +834,6 @@ def _find_sub_translator_for(
         eqn: jax_core.JaxprEqn,
     ) -> translator.PrimitiveTranslator:
         """Returns the appropriate subtranslator for equation `eqn`."""
-        assert self._sub_translators is not None
-
         prim_name: str = eqn.primitive.name
         if prim_name not in self._sub_translators:
             raise NotImplementedError(f"No subtranslators known to handle '{prim_name}'.")
@@ -887,7 +842,6 @@ def _find_sub_translator_for(
 
     def _translate_single_eqn(
         self,
-        jaxpr: jax_core.ClosedJaxpr,
         eqn: jax_core.JaxprEqn,
     ) -> tuple[Sequence[str | None], Sequence[str]]:
         """Translate `eqn` into its SDFG equivalent.
@@ -903,17 +857,14 @@ def _translate_single_eqn(
             The inputs might contain `None` which indicates that that input was a Jax Literal.
 
         Notes:
-            While `jaxpr` must be a `ClosedJaxpr`, `eqn` must come from the unclosed instance.
+            The equation, `eqn` must come from the unclosed jaxpr instance.
             The function will perform some consistency checking after the subtranslator was called.
         """
-        assert isinstance(eqn, jax_core.JaxprEqn)
-        assert isinstance(jaxpr, jax_core.ClosedJaxpr)
-
         if len(eqn.effects) != 0:
             raise NotImplementedError(f"Equation '{eqn}' has side effects.")
 
         # Input/Output variables
-        #  Using a tuple for the input ensures that it is not modified.
+        #  Using a tuple for the input ensures that it cannot be modified.
         in_var_names: Sequence[str | None] = tuple(
             self.create_jax_var_list(
                 eqn.invars,
@@ -921,7 +872,7 @@ def _translate_single_eqn(
                 handle_literals=True,  #  but they can be literals.
             )
         )
-        out_var_names: Sequence[str] = self.create_jax_var_list(  # type: ignore[assignment]
+        out_var_names: MutableSequence[str] = self.create_jax_var_list(
             eqn.outvars,
             only_creation=True,  # Output must not exist yet.
         )
@@ -933,7 +884,7 @@ def _translate_single_eqn(
         last_term_state: dace.SDFGState = self.get_terminal_sdfg_state()  # noqa: F841 # Will be used later
         eqn_state = self.append_new_state(
             label=f"{eqn.primitive.name}_{out_var_names[0]}",
-            prev_state=None,  # forces terminal state
+            prev_state=None,  # forces terminal state to use
         )
 
         # Now perform the actual translation of the equation.
@@ -958,40 +909,15 @@ def _translate_single_eqn(
 
         # In case a subtranslator decided to not use the variables we created for it, which is allowed
         #  but he must update the `out_var_names` list correctly, we will now verify this.
-        if len(out_var_names) != len(eqn.outvars):
-            raise RuntimeError(
-                f"Modified 'out_var_names'! Expected {len(eqn.outvars)} variables."
-                f" but found {len(out_var_names)}"
-            )
         for expectedSDFGName, jax_var in zip(out_var_names, eqn.outvars, strict=True):
             mapped_sdfg_name = self.map_jax_var_to_sdfg(jax_var)
-            jax_name = util.get_jax_var_name(jax_var)
             if mapped_sdfg_name != expectedSDFGName:
                 raise ValueError(
                     f"Mapping inconsistency detected, expected that Jax variable"
-                    f" '{jax_name}' maps to '{expectedSDFGName}' but it actually"
+                    f" '{jax_var}' maps to '{expectedSDFGName}' but it actually"
                     f" maps to '{mapped_sdfg_name}'."
                 )
 
-        # Views can only be used if there is a direct connection, between source,
-        #  view and destination (place of usage). Because of the way how Jax works,
-        #  it is impossible that an output variable is a View.
-        for outVarName, jax_var in zip(out_var_names, eqn.outvars, strict=True):
-            sdfg_var = self.get_array(outVarName)
-            if isinstance(sdfg_var, (dace.data.Array, dace.data.Scalar)):
-                pass
-            elif isinstance(sdfg_var, dace.data.View):
-                raise TypeError(
-                    f"For Jax variable '{util.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}'),"
-                    f" which is an output, you used a View, which is not possible."
-                    " It must either be an array or a scalar."
-                )
-            else:
-                raise NotImplementedError(
-                    f"Output variable '{util.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}')"
-                    f" is of type '{type(sdfg_var).__name__}' which I does not know how to handle."
-                )
-
         # Modify terminal root state of 'self'
         self._ctx.terminal_state = new_sdfg_term_state
 
@@ -1021,21 +947,21 @@ def _translate_jaxpr_internal(
 
         nb_translated_eqn: int = 0
         out_var_names: Sequence[str] = []
-        for eqn in jaxpr.jaxpr.eqns:  # Translate the equations one by one.
+
+        # Translate the equations one by one.
+        for eqn in jaxpr.jaxpr.eqns:
             assert len(eqn.effects) == 0
-            if len(eqn.outvars) == 0:  # Do we need this special case.
-                continue  #  Looks more like internal Jax error.
             if any(util.is_drop_var(outVar) for outVar in eqn.outvars):
-                assert (len(eqn.outvars) == 1) or all(
-                    util.is_drop_var(outVar) for outVar in eqn.outvars
-                )
+                assert all(util.is_drop_var(outVar) for outVar in eqn.outvars)
                 continue
-            _, out_var_names = self._translate_single_eqn(jaxpr=jaxpr, eqn=eqn)
+            _, out_var_names = self._translate_single_eqn(eqn=eqn)
             nb_translated_eqn += 1
 
+        # There were no equation, so handle the copying of input to output.
         if nb_translated_eqn == 0:
-            # There were no equation, so handle the copying of input to output.
             out_var_names = self._handle_null_jaxpr(jaxpr)
+
+        # Set the output names inside the context.
         self._ctx.out_names = tuple(out_var_names)
 
         return self._export_context()
@@ -1066,9 +992,9 @@ def _handle_null_jaxpr(
     ) -> Sequence[str]:
         """This function is called in case a `Jaxpr` with zero equations is encountered.
 
-        A function with zero equation might still have output, in which case an
-        input is copied to an output. This function will handle the copying from
-        the input into the corresponding output variable.
+        A function with zero equation might still have output, in which case an input is copied to an output.
+        This function will handle the copying from the input into the corresponding output variable.
+        It is important that the function will remove the input and output variables from the internal mapping.
 
         Returns:
             The function returns a list denoting the SDFG variables that refers to the output.
@@ -1083,47 +1009,46 @@ def _handle_null_jaxpr(
         assert len(self._ctx.inp_names) > 0
         assert len(self._ctx.out_names) == 0
 
-        # We will use this list to build the list of output names.
-        #  This is important for the exporter.
+        # List of the output variables.
         out_var_names: list[str] = []
 
         # If we are here then we are dealing with a nested SDFG/Jaxpr.
-        #  Because an input also serves as output, the nested SDFG will have connector pairs
-        #  with the same name, one serving as input the other as output, with the same name.
+        #  Because an input also serves as output, the nested SDFG will have a connector for the
+        #  input and one for the output, but both with the same name.
         #  This will make node validation fail.
-        #  Thus we have to introduce a some fake output name and explicitly copy the data around.
-        #  Once DaCe will inline the nested SDFG it will remove this intermediate copy.
+        #  We have to work around by introducing some fake copies, which will be removed by DaCe later.
         for jax_out_var in jaxpr.jaxpr.outvars:
-            jax_inp_name = util.get_jax_var_name(
-                jax_out_var
-            )  # Since output == input their names must be the same.
-            assert self.map_jax_var_to_sdfg(jax_inp_name, allow_fail=True)
+            # Since the output is also used as an input the variable mapping must be known.
+            sdfg_in_name: str = self.map_jax_var_to_sdfg(jax_out_var)
 
-            # This is the name we give to fictive Jax variable serving as output.
-            jax_out_name = f"_zero_equation_output_{self.map_jax_var_to_sdfg(jax_out_var)}"
-
-            # Now create the SDFG variable for it, give it a unique name.
+            # Now we create a variable that serves as true output, however, since the Jax variable
+            #  is already known we can not update the variable mapping.
             sdfg_out_name = self.add_array(
                 jax_out_var,
                 as_transient=True,
                 name_prefix="_zero_equation_output_for_",
                 update_var_mapping=False,
             )
+            out_var_names.append(sdfg_out_name)
 
-            # We now create a new mapping, we do this that we will later find the variable again.
-            self.add_jax_name_mapping(jax_var=jax_out_name, sdfg_name=sdfg_out_name)
-            out_var_names.append(jax_out_name)
-
-            # Now copy the input into the fake output variable.
-            inp_acc = self._ctx.start_state.add_read(self.map_jax_var_to_sdfg(jax_inp_name))
-            out_acc = self._ctx.start_state.add_write(self.map_jax_var_to_sdfg(jax_out_var))
+            # Now we perform the copy from the input variable in the newly created output variable.
+            inp_acc = self._ctx.start_state.add_read(sdfg_in_name)
+            out_acc = self._ctx.start_state.add_write(sdfg_out_name)
             self._ctx.start_state.add_nedge(
                 src=inp_acc,
                 dst=out_acc,
                 data=dace.Memlet.from_array(
-                    jax_inp_name, self.get_array(self.map_jax_var_to_sdfg(jax_inp_name))
+                    sdfg_in_name, self.get_array(self.map_jax_var_to_sdfg(sdfg_in_name))
                 ),
             )
+
+            # A Jax variable now has two SDFG equivalent, the input, that was previously created by
+            #  `self._create_initial_input()` and the `sdfg_out_name` we just created.
+            #  But we can not add this to the mapping, because of this situation we will now remove
+            #  the variable from the mapping. I am open for different approaches.
+            #  Note that input variables that are not used, will remain in the mapping.
+            self._ctx.jax_name_map.pop(jax_out_var)
+
         return tuple(out_var_names)
 
     # fmt: off
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 46ea10b..1570471 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -32,8 +32,7 @@ def test_driver_alloc() -> None:
     """Tests the state right after allocation."""
     driver = jtrans.JaxprTranslationDriver()
     assert not driver.is_allocated(), "Driver was created allocated."
-    assert driver._ctx is None
-    assert len(driver._ctx_stack) == 0  # type: ignore[unreachable]
+    assert len(driver._ctx_stack) == 0
 
     # The reserved names will be tested in `test_driver_fork()`.
     sdfg_name = "qwertzuiopasdfghjkl"
@@ -78,7 +77,6 @@ def test_driver_nested() -> None:
     assert len(driver._ctx_stack) == 2
     assert driver._ctx is driver._ctx_stack[-1]
     assert driver._ctx is not driver._ctx_stack[0]
-    assert org_ctx is driver._ctx_stack[0]
 
     for member_name in driver._ctx.__slots__:
         org = getattr(org_ctx, member_name)
@@ -95,8 +93,7 @@ def test_driver_nested() -> None:
 
     # Now if we fully deallocate then we expect that it is fully deallocated.
     driver._clear_translation_ctx()
-    assert driver._ctx is None
-    assert len(driver._ctx_stack) == 0  # type: ignore[unreachable]
+    assert len(driver._ctx_stack) == 0
     assert driver._reserved_names is None
 
 
@@ -136,8 +133,8 @@ def test_driver_append_state(alloc_driver: jtrans.JaxprTranslationDriver) -> Non
     assert next(iter(sdfg.in_edges(non_terminal_state))).src is terminal_state_1
 
 
-def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
-    """This function tests the array creation routines.
+def test_driver_scalar(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
+    """This function tests the array creation routines, especially the scalar part.
 
     However, it does so without using Jax variables.
     """
@@ -169,41 +166,91 @@ def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
     assert scal2.strides == (1,)
     assert scal2.dtype == scal2_j.dtype
 
-    # Create a scalar force it as an array and use symbolic strides.
+    # Using a special name for the variable
     scal3_j = JaCeVar("scal3", (), dace.int64)
+    scal3_n = "scal3_special_name"
     scal3_: str = alloc_driver.add_array(
         arg=scal3_j,
-        force_array=True,
-        symb_strides=True,  # Will have no effect.
+        alt_name=scal3_n,
+        update_var_mapping=True,
     )
-    scal3: Data = alloc_driver.get_array(scal3_)
-    assert isinstance(scal2, Array)
-    assert scal3_ == scal3_j.name
-    assert scal3.shape == (1,)
-    assert scal3.strides == (1,)
-    assert scal3.dtype == scal3_j.dtype
+    assert scal3_ == scal3_n
+    assert scal3_ == alloc_driver.map_jax_var_to_sdfg(scal3_j)
 
-    # Using a special name for the variable
-    scal4_j = scal3_j
-    scal4_n = "scal4_special_name"
-    scal4_: str = alloc_driver.add_array(
+    # Test the prefix functionality
+    scal4_j = JaCeVar("scal4", (), dace.float64)
+    scal4_p = "my_prefix"
+    scal4_n = "scal4_unused_name"
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=re.escape(
+            f"Specified 'name_prefix' ('{scal4_p}') but passed '{scal4_n}' as 'alt_name'."
+        ),
+    ):
+        scal4_: str = alloc_driver.add_array(
+            arg=scal4_j,
+            alt_name=scal4_n,
+            name_prefix=scal4_p,
+        )
+    # Now create it correctly
+    scal4_ = alloc_driver.add_array(
         arg=scal4_j,
-        alt_name=scal4_n,
-        update_var_mapping=True,
+        name_prefix=scal4_p,
     )
-    assert scal4_ == scal4_n
-    assert scal4_ == alloc_driver.map_jax_var_to_sdfg(scal4_j)
+    assert scal4_.startswith(scal4_p)
+    assert scal4_j.name in scal4_
 
-    # Test the prefix functionality
+    # Test the strides, or the inability to use it.
     scal5_j = JaCeVar("scal5", (), dace.float64)
-    scal5_p = "my_prefix"
-    scal5_: str = alloc_driver.add_array(
-        arg=scal5_j,
-        name_prefix=scal5_p,
+    with pytest.raises(
+        expected_exception=ValueError,
+        match="Specified a stride for a scalar.",
+    ):
+        scal5_: str = alloc_driver.add_array(arg=scal5_j, strides=(3,))
+
+    # test the force jax name feature
+    scal6_j = JaCeVar("scal6", (), dace.float64)
+    scal6_n: str = "scal6_name"
+    scal6_np: str = "scal6_name_prefix"
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=f"Specified 'force_jax_name', but passed '{scal6_n}' as 'alt_name'.",
+    ):
+        scal6_: str = alloc_driver.add_array(
+            arg=scal6_j,
+            alt_name=scal6_n,
+            force_jax_name=True,
+        )
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=f"Specified 'force_jax_name', but passed '{scal6_np}' as 'name_prefix'.",
+    ):
+        scal6_ = alloc_driver.add_array(
+            arg=scal6_j,
+            name_prefix=scal6_np,
+            force_jax_name=True,
+        )
+    with pytest.raises(
+        expected_exception=ValueError,
+        match="Specified `force_jax_name` but also wanted a new name.",
+    ):
+        scal6_ = alloc_driver.add_array(
+            arg=scal6_j,
+            force_jax_name=True,
+            find_new_name=True,
+        )
+    scal6_ = alloc_driver.add_array(
+        arg=scal6_j,
+        force_jax_name=True,
     )
-    assert scal5_.startswith(scal5_p)
-    assert scal5_j.name in scal5_
+    assert scal6_ == scal6_j.name
+
 
+def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
+    """This function tests the array creation routines.
+
+    However, it does so without using Jax variables.
+    """
     # Allocating an array
     arr1_j = JaCeVar("arr1", (5, 3), dace.float32)
     arr1_: str = alloc_driver.add_array(
@@ -216,7 +263,7 @@ def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
     assert arr1.strides == (3, 1)
     assert arr1.dtype == arr1_j.dtype
 
-    # Create a variable that has a name that is already known.
+    # Create a variable that has a sdfg name that is already known.
     arr2_j = JaCeVar(arr1_, (10,), dace.float64)
     with pytest.raises(
         expected_exception=ValueError,
@@ -224,10 +271,9 @@ def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
     ):
         arr2_: str = alloc_driver.add_array(arg=arr2_j)
     with pytest.raises(expected_exception=ValueError, match=f"Variable '{arr1_}' already exists."):
-        # `alt_name` will not work because variable still exists.
+        # `alt_name` will not work because name still exists.
         arr2_ = alloc_driver.add_array(arg=arr2_j, alt_name=arr2_j.name)
     # However, specifying `find_new_name` will solve this issue
-    #  NOTE: Doing this is not a good idea.
     arr2_ = alloc_driver.add_array(
         arg=arr2_j,
         find_new_name=True,
@@ -246,36 +292,6 @@ def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
     assert arr3.shape == arr3_j.shape
     assert arr3.strides == arr3_st
 
-    # Test if specifying `symb_strides` and a stride at the same time is an error.
-    arr4_j = JaCeVar("arr4", arr3_j.shape, dace.uintp)
-    arr4_st = arr3_st
-    with pytest.raises(
-        expected_exception=ValueError,
-        match="Specified 'symb_strides' and 'stride at the same time.",
-    ):
-        arr4_: str = alloc_driver.add_array(
-            arg=arr4_j,
-            symb_strides=True,
-            strides=arr4_st,
-        )
-
-    # Test if specifying the symbolic stride alone works.
-    #  Because a shape is `1` there should be no symbolic for it.
-    arr4_ = alloc_driver.add_array(
-        arg=arr4_j,
-        symb_strides=True,
-    )
-    arr4: Data = alloc_driver.get_array(arr4_)
-    assert isinstance(arr4, Array)
-    assert arr4.shape == arr4_j.shape
-
-    for shp, stri in zip(arr4.shape, arr4.strides):
-        if shp == 1:
-            assert isinstance(stri, int)
-            assert stri == 0, f"Expected a stride of 0, but got '{stri}'."
-        else:
-            assert isinstance(stri, (str, dace.symbol))
-
 
 def test_driver_array2() -> None:
     """This function tests the array creation routine with respect to the automatic naming.
diff --git a/tests/test_sub_translators_alu.py b/tests/test_sub_translators_alu.py
index d6bc7b9..50128e8 100644
--- a/tests/test_sub_translators_alu.py
+++ b/tests/test_sub_translators_alu.py
@@ -51,5 +51,16 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
 
 
-if __name__ == "__main__":
-    test_add()
+def test_add3():
+    """Simple add function, with constant."""
+    jax.config.update("jax_enable_x64", True)
+
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A + jax.numpy.array([[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]])
+
+    A = np.ones((3, 3), dtype=np.float64)
+
+    ref = testee(A)
+    res = jutil._jace_run(testee, A)
+
+    assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."

From af9db463f3322f9fe7bae238c0ce824e2dedaaeb Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 12:30:31 +0200
Subject: [PATCH 132/458] Reworked how compilation works.

This commit removes the `csdfg` member of the `TranslatedJaxprSDFG` object, thus it is not cached anymore.
More importantly however, is the changes made to the compilation itself.
Before the SDFG was modified (global variables, arg_names) and then compiled, and then restored.
However, since the SDFG is part of teh CompiledSDFG this is inconsistent, for that reason the SDFG is deepcopied before processing.
This is surely not the best solution, but should prevent some nasty bugs.
---
 src/jace/translator/translated_jaxpr_sdfg.py |  3 -
 src/jace/util/debug.py                       | 81 ++++++++------------
 2 files changed, 33 insertions(+), 51 deletions(-)

diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 2c99156..3a3bb6b 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -15,7 +15,6 @@
 from jax import core as jax_core
 
 from jace import util
-from jace.util import dace_helper as jdace
 
 
 @dataclass(init=True, repr=True, eq=False, frozen=False, kw_only=True, slots=True)
@@ -29,7 +28,6 @@ class TranslatedJaxprSDFG:
     - `terminal_state` the last state in the state machine.
     - `inp_names` a `list` of the SDFG variables that are used as input, in the same order as `Jaxpr.invars`.
     - `out_names` a `list` of the SDFG variables that are used as output, in the same order as `Jaxpr.outvars`.
-    - `csdfg` a compiled SDFG object; Optional might be empyt.
 
     The SDFG is in a so called canonical form, that is not directly usable, see `JaxprTranslationDriver` for more.
 
@@ -44,7 +42,6 @@ class TranslatedJaxprSDFG:
     terminal_state: dace.SDFGState | None = None
     inp_names: Sequence[str] | None = None
     out_names: Sequence[str] | None = None
-    csdfg: jdace.CompiledSDFG | None = None
 
     def validate(self) -> bool:
         """Validate the underlying SDFG."""
diff --git a/src/jace/util/debug.py b/src/jace/util/debug.py
index 463e99e..799f882 100644
--- a/src/jace/util/debug.py
+++ b/src/jace/util/debug.py
@@ -24,26 +24,17 @@
 
 
 def compile_jax_sdfg(
-    jsdfg: translator.TranslatedJaxprSDFG, force: bool = False, save: bool = True
+    jsdfg: translator.TranslatedJaxprSDFG,
 ) -> jdace.CompiledSDFG:
     """This function compiles the embedded SDFG and return it.
 
     The SDFG is compiled in a very special way, i.e. all arguments and return values have to be passed as arguments.
 
-    Before doing anything the function will inspect the `csdfg` filed of the `TranslatedJaxprSDFG`.
-    If it is not `None` the function will return this value.
-    This can be disabled by setting `focre` to `True`.
-    If the SDFG is compiled the function will store the compiled SDFG inside the `TranslatedJaxprSDFG` object's `csdfg` field.
-    However, by setting `save` to `False` the field will not be modified.
-
-    Args:
-        force:      Force compilation even if the `csdfg` field is already set.
-        save:       Store the compiled SDFG inside the `TranslatedJaxprSDFG` object's `csdfg` field.
-
     Notes:
         Currently the SDFG must not have any undefined symbols, i.e. no undefined sizes.
-        The function either returns a value or a tuple of values, i.e. no tree.
     """
+    from copy import deepcopy
+
     if not jsdfg.inp_names:
         raise ValueError("The passed SDFG did not had any input arguments.")
     if not jsdfg.out_names:
@@ -51,10 +42,6 @@ def compile_jax_sdfg(
     if any(out_name.startswith("__return") for out_name in jsdfg.out_names):
         raise NotImplementedError("No return statement is supported yet.")
 
-    if (not force) and (jsdfg.csdfg is not None):
-        assert isinstance(jsdfg.csdfg, jdace.CompiledSDFG)
-        return jsdfg.csdfg
-
     # This is a simplification that makes our life simply.
     #  However, we should consider lifting it at some point.
     if len(jsdfg.sdfg.free_symbols) != 0:
@@ -62,32 +49,26 @@ def compile_jax_sdfg(
             f"No externally defined symbols are allowed, found: {jsdfg.sdfg.free_symbols}"
         )
 
-    # Canonical SDFGs do not have global memory, so we must transform it; undo afterwards
-    prev_trans_state: dict[str, bool] = {}
-    org_arg_names: Any = jsdfg.sdfg.arg_names
+    # We will now deepcopy the SDFG.
+    #  We do this because the SDFG is also a member of the `CompiledSDFG` object.
+    #  And currently we rely on the integrity of this object in the run function,
+    #  i.e. in the allocation of the return values as well as `arg_names`.
+    sdfg: dace.SDFG = deepcopy(jsdfg.sdfg)
+
+    # Canonical SDFGs do not have global memory, so we must transform it
     sdfg_arg_names: list[str] = []
-    try:
-        for glob_name in jsdfg.inp_names + jsdfg.out_names:  # type: ignore[operator]  # concatenation
-            if glob_name in prev_trans_state:  # Donated arguments
-                continue
-            prev_trans_state[glob_name] = jsdfg.sdfg.arrays[glob_name].transient
-            jsdfg.sdfg.arrays[glob_name].transient = False
-            sdfg_arg_names.append(glob_name)
-
-        # This forces the signature of the SDFG to include all arguments in order they appear.
-        jsdfg.sdfg.arg_names = sdfg_arg_names
-
-        # Actual compiling the stuff
-        csdfg: jdace.CompiledSDFG = jsdfg.sdfg.compile()
-        if save:
-            jsdfg.csdfg = csdfg
-        return csdfg
-
-    finally:
-        # Restore the initial transient state
-        for var_name, trans_state in prev_trans_state.items():
-            jsdfg.sdfg.arrays[var_name].transient = trans_state
-        jsdfg.sdfg.arg_names = org_arg_names
+    for glob_name in jsdfg.inp_names + jsdfg.out_names:
+        if glob_name in sdfg_arg_names:  # Donated arguments
+            continue
+        sdfg.arrays[glob_name].transient = False
+        sdfg_arg_names.append(glob_name)
+
+    # This forces the signature of the SDFG to include all arguments in order they appear.
+    sdfg.arg_names = sdfg_arg_names
+
+    # Actual compiling the stuff
+    csdfg: jdace.CompiledSDFG = sdfg.compile()
+    return csdfg
 
 
 @singledispatch
@@ -99,18 +80,16 @@ def run_jax_sdfg(
 ) -> tuple[Any, ...] | Any:
     """Run the `TranslatedJaxprSDFG` object.
 
-    If the `TranslatedJaxprSDFG` object does not contain a precompiled SDFG object the function will compile it.
-    However, the compiled SDFG will not be cached in the `TranslatedJaxprSDFG` object.
+    Notes:
+        The function either returns a value or a tuple of values, i.e. no tree.
+        There is an overload of this function that accepts an already compiled SDFG and runs it.
     """
     if jsdfg.inp_names is None:
         raise ValueError("Input names are not specified.")
     if jsdfg.out_names is None:
         raise ValueError("Output names are not specified.")
+    csdfg: jdace.CompiledSDFG = compile_jax_sdfg(jsdfg)
 
-    if jsdfg.csdfg is not None:
-        csdfg: jdace.CompiledSDFG = jsdfg.csdfg
-    else:
-        csdfg = compile_jax_sdfg(jsdfg, save=False)
     return run_jax_sdfg(
         csdfg,
         jsdfg.inp_names,
@@ -140,11 +119,14 @@ def _(
     if len(kwargs) != 0:
         raise NotImplementedError("No kwargs are supported yet.")
 
+    # We need the SDFG to construct/allocate the memory for the return values.
+    #  Actually, we would only need the descriptors, but this is currently the only way to get them.
+    #  Note that this is safe to do, because in the compile function we decoupled the SDFG from all.
     sdfg: dace.SDFG = csdfg.sdfg
 
     # Build the argument list that we will pass to the compiled object.
     call_args: dict[str, Any] = {}
-    for in_name, in_val in zip(inp_names, args):
+    for in_name, in_val in zip(inp_names, args, strict=True):
         call_args[in_name] = in_val
     for out_name in out_names:
         assert not ((out_name == "__return") or (out_name.startswith("__return_")))  # noqa: PT018 # Assert split
@@ -192,6 +174,9 @@ def _jace_run(
     Args:
         *args:      Forwarded to the tracing and final execution of the SDFG.
         **kwargs:   Used to construct the driver.
+
+    Notes:
+        This function will be removed soon.
     """
     jaxpr = jax.make_jaxpr(fun)(*args)
     driver = translator.JaxprTranslationDriver(**kwargs)

From 8ca36d35bf1528ff59cb45d35e9fd633eb332cb5 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 12:56:58 +0200
Subject: [PATCH 133/458] Removed the `TranslationContext` object.

The job of the context and the return value will now be done by the `TranslatedJaxprSDFG` object in "Personalunion".
---
 src/jace/translator/_translation_context.py   | 95 -------------------
 .../translator/jaxpr_translator_driver.py     | 21 +---
 src/jace/translator/translated_jaxpr_sdfg.py  | 87 +++++++++++------
 3 files changed, 64 insertions(+), 139 deletions(-)
 delete mode 100644 src/jace/translator/_translation_context.py

diff --git a/src/jace/translator/_translation_context.py b/src/jace/translator/_translation_context.py
deleted file mode 100644
index 6253118..0000000
--- a/src/jace/translator/_translation_context.py
+++ /dev/null
@@ -1,95 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""This module contains the translation context for the `JaxprTranslationDriver`."""
-
-from __future__ import annotations
-
-from collections.abc import MutableMapping
-
-import dace
-from jax import core as jax_core
-
-from jace import translator, util
-
-
-class _TranslationContext:
-    """Represents the context of a `JaxprTranslationDriver`.
-
-    Essentially it contains the following variables:
-    - `sdfg`:
-        The SDFG object that is under construction.
-    - `start_state`:
-        The first state in the SDFG state machine.
-    - `terminal_state`:
-        The current terminal state of the SDFG state machine.
-    - `jax_name_map`:
-        A `dict` that maps every Jax variable to its corresponding SDFG variable _name_.
-    - `inp_names`:
-        A `list` of the SDFG variable names that are used for input.
-        Their order is the same as in `Jaxpr.invars`.
-        Filled at the very beginning.
-    - `out_names`:
-        A `list` of the SDFG variables names that are used for output,
-        Their order is the same as in `Jaxpr.outvars`.
-        Only filled at the very end.
-    - `rev_idx`:
-        The revision index (used to generate unique names in the translation.
-
-    Notes:
-        It might be that a name appears in both the `inp_names` and `out_names` list.
-            This happens if the corresponding variable is used as both input and output.
-            In Jax this is called argument donation.
-        This class is similar to but different to `TranslatedJaxprSDFG`.
-            This class is used to represent the dynamic state of the translation object,
-            `TranslatedJaxprSDFG` is used to result the end.
-    """
-
-    __slots__ = (
-        "sdfg",
-        "start_state",
-        "terminal_state",
-        "jax_name_map",
-        "inp_names",
-        "out_names",
-        "rev_idx",
-    )
-
-    def __init__(
-        self,
-        rev_idx: int,
-        name: str | None = None,
-    ) -> None:
-        """Initializes the context.
-
-        Args:
-            rev_idx:    The revision index of the context.
-            name:       Name of the SDFG object.
-        """
-        if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
-            raise ValueError(f"'{name}' is not a valid SDFG name.")
-
-        self.sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
-        self.start_state: dace.SDFGState = self.sdfg.add_state(
-            label="initial_state", is_start_block=True
-        )
-        self.terminal_state: dace.SDFGState = self.start_state
-        self.jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str] = {}
-        self.inp_names: tuple[str, ...] = ()
-        self.out_names: tuple[str, ...] = ()
-        self.rev_idx: int = rev_idx
-
-    def to_translated_jaxpr_sdfg(self) -> translator.TranslatedJaxprSDFG:
-        """Transforms `self` into a `TranslatedJaxprSDFG`."""
-        return translator.TranslatedJaxprSDFG(
-            sdfg=self.sdfg,
-            start_state=self.start_state,
-            terminal_state=self.terminal_state,
-            jax_name_map=self.jax_name_map,
-            inp_names=self.inp_names,
-            out_names=self.out_names,
-        )
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 7d2012f..99c92f2 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -75,8 +75,6 @@ def __init__(
                 the shared part. This flag is provided only for implementing
                 `self.fork()` using it is an error and undefined behaviour.
         """
-        from ._translation_context import _TranslationContext
-
         # Contains all the subtranslators that we need.
         #  They are partitioned by the names of the primitive they have registered for.
         #  This member is allocated by '_init_sub_translators()' and remains allocated
@@ -96,7 +94,7 @@ def __init__(
 
         # Context stack and current context.
         #  Only allocated during an ongoing translation
-        self._ctx_stack: list[_TranslationContext] = []
+        self._ctx_stack: list[translator.TranslatedJaxprSDFG] = []
 
         # Creating of the subtranslators.
         self._init_sub_translators(kwargs)
@@ -676,7 +674,6 @@ def _create_initial_input(
         Notes:
             This function will fill the internal list of inputs.
         """
-
         if not self.is_allocated():
             raise RuntimeError("Driver is not allocated, can not create constants.")
         if len(self._ctx.inp_names) != 0:
@@ -750,11 +747,9 @@ def _allocate_translation_ctx(
             name:               The name of the SDFG.
             reserved_names:     Add these name to the set of resered names of `self`.
         """
-        from ._translation_context import _TranslationContext
-
         # Create a new translation context and put it on the stack.
         self._ctx_stack.append(
-            _TranslationContext(
+            translator.TranslatedJaxprSDFG(
                 rev_idx=next(self._rev_manager),
                 name=name,
             )
@@ -775,7 +770,7 @@ def _allocate_translation_ctx(
         return self
 
     @property
-    def _ctx(self) -> _TranslationContext:
+    def _ctx(self) -> translator.TranslatedJaxprSDFG:
         """Returns the currently active translation context."""
         assert len(self._ctx_stack) != 0, "No context is active."
         return self._ctx_stack[-1]
@@ -976,15 +971,7 @@ def _export_context(self) -> translator.TranslatedJaxprSDFG:
         assert self.is_allocated()
         assert all((isinstance(x, str) and (len(x) > 0)) for x in self._ctx.inp_names)
         assert all((isinstance(x, str) and (len(x) > 0)) for x in self._ctx.out_names)
-
-        return translator.TranslatedJaxprSDFG(
-            sdfg=self._ctx.sdfg,
-            start_state=self._ctx.start_state,
-            terminal_state=self._ctx.terminal_state,
-            jax_name_map=self._ctx.jax_name_map,
-            inp_names=self._ctx.inp_names,
-            out_names=self._ctx.out_names,
-        )
+        return self._ctx
 
     def _handle_null_jaxpr(
         self,
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 3a3bb6b..369572c 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -7,9 +7,8 @@
 
 from __future__ import annotations
 
-from collections.abc import Mapping, Sequence
+from collections.abc import MutableMapping
 from dataclasses import dataclass
-from typing import Any
 
 import dace
 from jax import core as jax_core
@@ -17,11 +16,14 @@
 from jace import util
 
 
-@dataclass(init=True, repr=True, eq=False, frozen=False, kw_only=True, slots=True)
+@dataclass(slots=True)
 class TranslatedJaxprSDFG:
     """Encapsulates the result of a translation run of the `JaxprTranslationDriver` object.
 
-    It defines the following members:
+    This class is also used to represent the internal state of the `JaxprTranslationDriver` during the translation.
+    For that reason the object defines some fields that only have a meaning during the actually translation.
+
+    The fields used to store the result are:
     - `sdfg` the SDFG object that was created.
     - `jax_name_map` a `dict` that maps every Jax variable to its corresponding SDFG variable _name_.
     - `start_state` the first state in the SDFG state machine.
@@ -29,32 +31,71 @@ class TranslatedJaxprSDFG:
     - `inp_names` a `list` of the SDFG variables that are used as input, in the same order as `Jaxpr.invars`.
     - `out_names` a `list` of the SDFG variables that are used as output, in the same order as `Jaxpr.outvars`.
 
-    The SDFG is in a so called canonical form, that is not directly usable, see `JaxprTranslationDriver` for more.
+    Please consider the following important points:
+    - The SDFG is in canonical form, which means that it is not directly usable, see `JaxprTranslationDriver` for more.
+    - It might be that a name appears in both the `inp_names` and `out_names` list.
+        This happens if the corresponding variable is used as both input and output.
+        In Jax this is called argument donation.
+
+    During the translation the following members are also allocated:
+    - `rev_idx` the revision index, used for name mangling.
 
-    It might be that a name appears in both the `inp_names` and `out_names` list.
-    This happens if the corresponding variable is used as both input and output.
-    In Jax this is called argument donation.
+    While they remain allocated, accessing them is considered an error.
     """
 
     sdfg: dace.SDFG
-    jax_name_map: Mapping[jax_core.Var | util.JaCeVar, str]
-    start_state: dace.SDFGState | None = None
-    terminal_state: dace.SDFGState | None = None
-    inp_names: Sequence[str] | None = None
-    out_names: Sequence[str] | None = None
+    jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str]
+    start_state: dace.SDFGState
+    terminal_state: dace.SDFGState
+    inp_names: tuple[str, ...]
+    out_names: tuple[str, ...]
+    rev_idx: int
+
+    def __init__(
+        self,
+        rev_idx: int,
+        name: str | None = None,
+    ) -> None:
+        """Initializes the context.
+
+        The function allocates the SDFG and initializes the members properly.
+
+        Args:
+            rev_idx:    The revision index of the context.
+            name:       Name of the SDFG object.
+        """
+        if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
+            raise ValueError(f"'{name}' is not a valid SDFG name.")
+
+        self.sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
+        self.start_state: dace.SDFGState = self.sdfg.add_state(
+            label="initial_state", is_start_block=True
+        )
+        self.terminal_state: dace.SDFGState = self.start_state
+        self.jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str] = {}
+        self.inp_names: tuple[str, ...] = ()
+        self.out_names: tuple[str, ...] = ()
+        self.rev_idx: int = rev_idx
 
     def validate(self) -> bool:
         """Validate the underlying SDFG."""
 
         # To prevent the 'non initialized' data warnings we have to temporary
         #  promote input and output arguments to globals
-        promote_to_glob: set[str] = set()
         org_trans_state: dict[str, bool] = {}
-        if self.inp_names:
-            promote_to_glob.update(self.inp_names)
-        if self.out_names:
-            promote_to_glob.update(self.out_names)
-        for var in promote_to_glob:
+        if not self.inp_names:
+            raise dace.sdfg.InvalidSDFGError(
+                "There are no input arguments.",
+                self.sdfg,
+                self.sdfg.node_id(self.start_state),
+            )
+        if not self.out_names:
+            raise dace.sdfg.InvalidSDFGError(
+                "There are no output arguments.",
+                self.sdfg,
+                self.sdfg.node_id(self.start_state),
+            )
+        for var in set(self.inp_names + self.out_names):  # set is needed for donated args.
             org_trans_state[var] = self.sdfg.arrays[var].transient
             self.sdfg.arrays[var].transient = False
 
@@ -64,11 +105,3 @@ def validate(self) -> bool:
             for var, orgValue in org_trans_state.items():
                 self.sdfg.arrays[var].transient = orgValue
         return True
-
-    def __getitem__(self, idx: str) -> Any:
-        """Allows member access using brackets."""
-        if not isinstance(idx, str):
-            raise TypeError(f"Expected 'idx' as 'str' but got '{type(str)}'")
-        if not hasattr(self, idx):
-            raise KeyError(f"The key '{idx}' is not known.")
-        return getattr(self, idx)

From c54c7e41143e6937d609a01a033ac11fea72b70f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 13:54:17 +0200
Subject: [PATCH 134/458] Removed the `TranslationContext` object.

The job of the context and the return value will now be done by the `TranslatedJaxprSDFG` object in "Personalunion".
---
 .../translator/jaxpr_translator_driver.py     | 33 +++++++------------
 1 file changed, 12 insertions(+), 21 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 99c92f2..e319389 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -80,6 +80,7 @@ def __init__(
         #  This member is allocated by '_init_sub_translators()' and remains allocated
         #  during the lifetime of the object.
         self._sub_translators: dict[str, translator.PrimitiveTranslator] = None  # type: ignore[assignment]
+        self._init_sub_translators(kwargs)
 
         # These names can not be used for the automatic naming of Jax variables.
         #  They differ from the forbidden names, that they denote valid SDFG names.
@@ -96,9 +97,6 @@ def __init__(
         #  Only allocated during an ongoing translation
         self._ctx_stack: list[translator.TranslatedJaxprSDFG] = []
 
-        # Creating of the subtranslators.
-        self._init_sub_translators(kwargs)
-
     def translate_jaxpr(
         self,
         jaxpr: jax_core.ClosedJaxpr,
@@ -122,8 +120,7 @@ def translate_jaxpr(
         Args:
             inp_scalar_as_array:    Translate scalar _input_ arguments to arrays of length 1.
             name:                   Use this name for the SDFG instead some generated one.
-            reserved_names:         Prevent the generation of variables with these names,
-                                        see `self.add_array()` for more.
+            reserved_names:         Prevent the generation of variables with these names, see `self.add_array()` for more.
             allow_empty_jaxpr:      Allows empty Jaxpr.
 
         Notes:
@@ -140,14 +137,15 @@ def translate_jaxpr(
         if not jax.config.read("jax_enable_x64"):
             raise NotImplementedError("The translation only works if 'jax_enable_x64' is enabled.")
 
-        # Consume the hidden flags
+        # The point of this flag is, that one can have the translator, but still have access
+        #  the the function of self, such as `add_array()` (is needed in later stages).
         _clear_translation_ctx: bool = kwargs.pop("_clear_translation_ctx", True)
 
-        # NOTE: If `self` is already allocated, i.e. has an ongoing translation process
-        #       This function will create a new translation context. Thus the driver
-        #       will start to translate a second (nested) SDFG.
-        #       Also note that there is no mechanism that forces the integration of the
-        #       nested SDFG/Jaxpr.
+        # NOTE: If `self` is already allocated, i.e. has an ongoing translation process,
+        #       the `_allocate_translation_ctx()` function will start a new context.
+        #       Thus the driver will start to translate a second (nested) SDFG.
+        #       Also note that there is no mechanism that forces the integration of the nested SDFG/Jaxpr,
+        #       this must be done manually.
         self._allocate_translation_ctx(
             name=name,
             reserved_names=reserved_names,
@@ -159,10 +157,8 @@ def translate_jaxpr(
             jaxpr=jaxpr,
             inp_scalar_as_array=inp_scalar_as_array,
         )
+        # Note that `self` and `jsdfg` still share the same underlying memory, i.e. context.
         jsdfg: translator.TranslatedJaxprSDFG = self._translate_jaxpr_internal(jaxpr)
-
-        # If the translation context is not cleared `self` and `jsdfg` will share the same data.
-        #  There is some legitimate use for that.
         if _clear_translation_ctx:
             self._clear_translation_ctx()
 
@@ -362,7 +358,6 @@ def add_reserved_names(
         reserved_names: None | str | Collection[str],
     ) -> JaxprTranslationDriver:
         """Adds the names listed in `reserved_names` to the internal list."""
-        assert isinstance(self._reserved_names, set)
 
         if reserved_names is None:
             return self
@@ -784,9 +779,9 @@ def _init_sub_translators(
         The function forwards `kwargs` to the constructor of the subtranslators.
         However, it will remove all arguments starting with an underscore.
         """
-        assert self._sub_translators is None
+        from jace.translator import sub_translators  # Cyclic import
 
-        subtrans_args = {k: v for k, v in subtrans_args.items() if not k.startswith("_")}  # type: ignore[unreachable]
+        subtrans_args = {k: v for k, v in subtrans_args.items() if not k.startswith("_")}
         prim_translators: dict[str, translator.PrimitiveTranslator] = {}
         for prim_translator_cls in sub_translators._get_subtranslators_cls():
             prim_translator: translator.PrimitiveTranslator = prim_translator_cls.CREATE(
@@ -937,15 +932,11 @@ def _translate_jaxpr_internal(
                 this is used by Jax to indicate that they are never read.
                 Such variables are included by some transformations such as `grad()`.
         """
-        assert isinstance(jaxpr, jax_core.ClosedJaxpr)
-        assert self.is_allocated()
-
         nb_translated_eqn: int = 0
         out_var_names: Sequence[str] = []
 
         # Translate the equations one by one.
         for eqn in jaxpr.jaxpr.eqns:
-            assert len(eqn.effects) == 0
             if any(util.is_drop_var(outVar) for outVar in eqn.outvars):
                 assert all(util.is_drop_var(outVar) for outVar in eqn.outvars)
                 continue

From 9b0338be3b7a03ef74363b8a18e3121288e84440 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 13:40:02 +0200
Subject: [PATCH 135/458] Updated some package importing stuff.

---
 src/jace/translator/__init__.py                          | 2 +-
 src/jace/translator/jaxpr_translator_driver.py           | 1 -
 ...a_primitive_translator.py => primitive_translator.py} | 0
 src/jace/translator/sub_translators/__init__.py          | 9 +++++----
 src/jace/translator/sub_translators/alu_translator.py    | 3 +--
 5 files changed, 7 insertions(+), 8 deletions(-)
 rename src/jace/translator/{sub_translators/a_primitive_translator.py => primitive_translator.py} (100%)

diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index b643776..042f82a 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -10,7 +10,7 @@
 from __future__ import annotations
 
 from .jaxpr_translator_driver import JaxprTranslationDriver
-from .sub_translators import PrimitiveTranslator
+from .primitive_translator import PrimitiveTranslator
 from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
 
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index e319389..6ce6e4c 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -17,7 +17,6 @@
 from jax import core as jax_core
 
 from jace import translator, util
-from jace.translator import sub_translators
 
 
 class JaxprTranslationDriver:
diff --git a/src/jace/translator/sub_translators/a_primitive_translator.py b/src/jace/translator/primitive_translator.py
similarity index 100%
rename from src/jace/translator/sub_translators/a_primitive_translator.py
rename to src/jace/translator/primitive_translator.py
diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
index 88c239c..7e52b28 100644
--- a/src/jace/translator/sub_translators/__init__.py
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -10,18 +10,19 @@
 
 from collections.abc import Sequence
 
-from .a_primitive_translator import PrimitiveTranslator  # has to be the first import.
+from jace import translator
+
 from .alu_translator import ALUTranslator
 
 
 # List of all subtranslators that ships with JaCe.
-_KNOWN_SUBTRANSLATORS: list[type[PrimitiveTranslator]] = [
+_KNOWN_SUBTRANSLATORS: list[type[translator.PrimitiveTranslator]] = [
     ALUTranslator,
 ]
 
 
 def add_subtranslator(
-    subtrans: type[PrimitiveTranslator],
+    subtrans: type[translator.PrimitiveTranslator],
 ) -> bool:
     """Add `subtrans` to the externally defined subtranslators.
 
@@ -36,7 +37,7 @@ def add_subtranslator(
     return True
 
 
-def _get_subtranslators_cls() -> Sequence[type[PrimitiveTranslator]]:
+def _get_subtranslators_cls() -> Sequence[type[translator.PrimitiveTranslator]]:
     """Returns the list of all subtranslator known to JaCe.
 
     The translators are returned in FIFO order.
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index 8cc2466..23f0cb3 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -18,10 +18,9 @@
 from typing_extensions import override
 
 from jace import translator
-from jace.translator import sub_translators
 
 
-class ALUTranslator(sub_translators.PrimitiveTranslator):
+class ALUTranslator(translator.PrimitiveTranslator):
     """This translator handles all arithmetic and logical operations."""
 
     __slots__ = ()

From 4e5eab97c515ed2964223ef59f3736a818557427 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 07:14:23 +0200
Subject: [PATCH 136/458] Relocated the variable Patterns.

---
 src/jace/translator/_translation_context.py   |  2 +-
 .../translator/jaxpr_translator_driver.py     |  8 +++----
 src/jace/util/__init__.py                     | 14 +++++++-----
 src/jace/util/jax_helper.py                   |  2 +-
 src/jace/util/re_pattern.py                   | 22 -------------------
 src/jace/util/util.py                         | 11 ++++++++++
 6 files changed, 26 insertions(+), 33 deletions(-)
 delete mode 100644 src/jace/util/re_pattern.py

diff --git a/src/jace/translator/_translation_context.py b/src/jace/translator/_translation_context.py
index 15dd47f..6253118 100644
--- a/src/jace/translator/_translation_context.py
+++ b/src/jace/translator/_translation_context.py
@@ -70,7 +70,7 @@ def __init__(
             rev_idx:    The revision index of the context.
             name:       Name of the SDFG object.
         """
-        if isinstance(name, str) and not util._VALID_SDFG_OBJ_NAME.fullmatch(name):
+        if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
         self.sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 5b01fd2..e34975a 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -196,7 +196,7 @@ def append_new_state(
             prev_state:     Alternative `SDFGState` at which we should append the new state.
 
         """
-        if isinstance(label, str) and (not util._VALID_SDFG_OBJ_NAME.fullmatch(label)):
+        if isinstance(label, str) and (not util.VALID_SDFG_OBJ_NAME.fullmatch(label)):
             raise ValueError(f"Can not create state with label '{label}' since it is invalid.")
 
         # Decide if appending to that state will modify the terminal state.
@@ -385,7 +385,7 @@ def add_reserved_names(
             raise TypeError(f"Does not know how to handle the type '{type(reserved_names)}'.")
         for rev_name in reserved_names:
             assert isinstance(rev_name, str)
-            if not util._VALID_SDFG_VAR_NAME.fullmatch(rev_name):
+            if not util.VALID_SDFG_VAR_NAME.fullmatch(rev_name):
                 raise ValueError(
                     f"Can not use '{rev_name}' as reserved name as it is not a valid SDFG name."
                 )
@@ -504,7 +504,7 @@ def add_array(
                 raise ValueError("Passed an empty 'alt_name'.")
             if alt_name in self._forbidden_names:
                 raise ValueError("'alt_name' is a forbidden name.")
-            if not util._VALID_SDFG_VAR_NAME.fullmatch(alt_name):
+            if not util.VALID_SDFG_VAR_NAME.fullmatch(alt_name):
                 raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
             if name_prefix is not None:
                 raise ValueError(
@@ -591,7 +591,7 @@ def add_array(
             raise ValueError(f"Can't create variable '{arg_name}', name is forbidden.")
         if arg_name in self._ctx.sdfg.arrays:
             raise ValueError(f"Can't create variable '{arg_name}', variable is already created.")
-        if not util._VALID_SDFG_VAR_NAME.fullmatch(arg_name):
+        if not util.VALID_SDFG_VAR_NAME.fullmatch(arg_name):
             raise ValueError(f"The requested variable name '{arg_name}' is invalid.")
 
         # Promotion of scalar to array.
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 81988ed..bfc449b 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -18,9 +18,13 @@
     get_jax_var_shape,
     translate_dtype,
 )
-from .re_pattern import _VALID_JAX_VAR_NAME, _VALID_SDFG_OBJ_NAME, _VALID_SDFG_VAR_NAME
 from .traits import is_drop_var, is_non_string_iterable
-from .util import as_sequence
+from .util import (
+    VALID_JAX_VAR_NAME,
+    VALID_SDFG_OBJ_NAME,
+    VALID_SDFG_VAR_NAME,
+    as_sequence,
+)
 
 
 __all__ = [
@@ -35,7 +39,7 @@
     "run_jax_sdfg",
     "_jace_run",
     "_propose_jax_name",
-    "_VALID_JAX_VAR_NAME",
-    "_VALID_SDFG_OBJ_NAME",
-    "_VALID_SDFG_VAR_NAME",
+    "VALID_JAX_VAR_NAME",
+    "VALID_SDFG_OBJ_NAME",
+    "VALID_SDFG_VAR_NAME",
 ]
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 80018fc..fb4619a 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -91,7 +91,7 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar | str) -> str:
             )
     assert isinstance(jax_name, str)
 
-    if not util._VALID_JAX_VAR_NAME.fullmatch(jax_name):
+    if not util.VALID_JAX_VAR_NAME.fullmatch(jax_name):
         raise ValueError(f"Deduced Jax name '{jax_name}' is invalid.")
     return jax_name
 
diff --git a/src/jace/util/re_pattern.py b/src/jace/util/re_pattern.py
deleted file mode 100644
index 99fb71a..0000000
--- a/src/jace/util/re_pattern.py
+++ /dev/null
@@ -1,22 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Module containing all regex pattern that we need inside JaCe."""
-
-from __future__ import annotations
-
-import re
-
-
-# Valid name for a jax variable.
-_VALID_JAX_VAR_NAME: re.Pattern = re.compile("(jax[0-9]+_?)|([a-z]+_?)")
-
-# Valid name for an SDFG variable.
-_VALID_SDFG_VAR_NAME: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")
-
-# Valid name for an SDFG itself, includes `SDFGState` objects.
-_VALID_SDFG_OBJ_NAME: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index 96bfa20..4e97e8c 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -7,6 +7,7 @@
 
 from __future__ import annotations
 
+import re
 from collections.abc import Iterable
 from typing import TypeVar, cast, overload
 
@@ -32,3 +33,13 @@ def as_sequence(value: _T | Iterable[_T]) -> Iterable[_T]:
     if traits.is_non_string_iterable(value):
         return value
     return cast(Iterable[_T], [value])
+
+
+# Valid name for a jax variable.
+VALID_JAX_VAR_NAME: re.Pattern = re.compile("(jax[0-9]+_?)|([a-z]+_?)")
+
+# Valid name for an SDFG variable.
+VALID_SDFG_VAR_NAME: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")
+
+# Valid name for an SDFG itself, includes `SDFGState` objects.
+VALID_SDFG_OBJ_NAME: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")

From 4f6e91bcbc45bcd32fa40ca94e747b4149a57411 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 14:49:04 +0200
Subject: [PATCH 137/458] Updated the translator interfaces.

This commit fixes some import errors, but it also marks the `out_var_names` argument of the translator function as `MutableSequence`.
This is because it is explicitly allowed to modify it.
---
 .../sub_translators/a_primitive_translator.py | 45 ++++++++-----------
 .../sub_translators/alu_translator.py         |  7 +--
 2 files changed, 23 insertions(+), 29 deletions(-)

diff --git a/src/jace/translator/sub_translators/a_primitive_translator.py b/src/jace/translator/sub_translators/a_primitive_translator.py
index 16d2d4b..a1f34e6 100644
--- a/src/jace/translator/sub_translators/a_primitive_translator.py
+++ b/src/jace/translator/sub_translators/a_primitive_translator.py
@@ -16,15 +16,13 @@
 from __future__ import annotations
 
 from abc import abstractmethod
-from collections.abc import Sequence
-from typing import TYPE_CHECKING, Any, Protocol, runtime_checkable
+from collections.abc import MutableSequence, Sequence
+from typing import Any, Protocol, runtime_checkable
 
 import dace
 from jax import core as jax_core
 
-
-if TYPE_CHECKING:
-    from .jaxpr_translator_driver import JaxprTranslationDriver
+from jace import translator
 
 
 @runtime_checkable
@@ -71,9 +69,9 @@ def primitive(self) -> str | Sequence[str]:
     @abstractmethod
     def translate_jaxeqn(
         self,
-        driver: JaxprTranslationDriver,
+        driver: translator.JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
+        out_var_names: MutableSequence[str],
         eqn: jax_core.JaxprEqn,
         eqn_state: dace.SDFGState,
     ) -> dace.SDFGState | None:
@@ -94,25 +92,20 @@ def translate_jaxeqn(
             `eqn_state` argument. This state is guaranteed to be empty and
             `translator.get_terminal_sdfg_state() is eqn_state` holds.
 
-        Then the subtranslator is called. Usually a subtranslator should
-        construct the dataflow graph inside `eqn_state`. It is allowed that the
-        subtranslators creates more states if needed, but this state machine
-        has to have a single terminal state, which must be returned
-        and reachable from `eqn_state`.
-        If the function returns `None` the driver will assume that
-        subtranslator was able to fully construct the dataflow graph
-        within `eqn_state`.
-
-        While a subtranslator is forbidden from meddling with the input
-        variables mentioned in `in_var_names` in any way, it is allowed to
-        modify the output variables. For example he could create a new
-        SDFG variable, with different strides. But in that case the
-        subtranslator must update the internal mapping of the driver TBA HOW,
-        and modify the mapping in `out_var_names`.
-        However, the subtranslator is allowed to create internal temporary
-        variables. It just have to ensure that no name collision will occur,
-        a way to do this is to use a passed variable name as prefix.
-
+        Then the subtranslator is called.
+        Usually a subtranslator should construct the dataflow graph inside `eqn_state`.
+        It is allowed that the subtranslators creates more states if needed, but this state machinery
+        has to have a single terminal state, which must be returned and reachable from `eqn_state`.
+        If the function returns `None` the driver will assume that subtranslator was able to
+        fully construct the dataflow graph within `eqn_state`.
+
+        While a subtranslator is forbidden from meddling with the input variables mentioned in
+        `in_var_names` in any way, it is allowed to modify the output variables.
+        For example it could create a new SDFG variable, with different strides.
+        But in that case the subtranslator must update the internal mapping of the driver TBA HOW,
+        and modify the mapping specified by `out_var_names`.
+        However, the subtranslator is allowed to create internal temporary variables.
+        It just have to ensure that no name collision will occur, a way to do this is to use a passed variable name as prefix.
 
         Args:
             driver:         The driver object of the translation.
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index f397bb3..8cc2466 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -9,7 +9,7 @@
 
 from __future__ import annotations
 
-from collections.abc import Sequence
+from collections.abc import MutableSequence, Sequence
 from typing import Any, Final, cast
 
 import dace
@@ -17,6 +17,7 @@
 from jax import core as jax_core
 from typing_extensions import override
 
+from jace import translator
 from jace.translator import sub_translators
 
 
@@ -91,9 +92,9 @@ def primitive(self) -> Sequence[str]:
     @override
     def translate_jaxeqn(
         self,
-        driver: sub_translators.JaxprTranslationDriver,
+        driver: translator.JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
+        out_var_names: MutableSequence[str],
         eqn: jax_core.JaxprEqn,
         eqn_state: dace.SDFGState,
     ) -> None:

From 9dc817e81de18f7cc00a2a2cffe5612365786e87 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 11:03:17 +0200
Subject: [PATCH 138/458] First update to the driver.

This is just a first step in the update process.
- "Simplifies" the `add_array()` function.
- Makes some changes to the general structure of the code, i.e. "Simplifies"
- Make `JaxprTranslatorDriver._ctx` a property.
- Updates some tests.

Todo:
- Unify return value, i.e. translated Jaxpr, and inner context.
---
 pyproject.toml                                |   6 +-
 .../translator/jaxpr_translator_driver.py     | 359 +++++++-----------
 tests/test_jaxpr_translator_driver.py         | 144 +++----
 tests/test_sub_translators_alu.py             |  15 +-
 4 files changed, 236 insertions(+), 288 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index 4d551f1..f05b72a 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -148,4 +148,8 @@ section-order = [
 [tool.ruff.lint.per-file-ignores]
 "!tests/**.py" = ["PT"]  # Ignore `flake8-pytest-style` everywhere except in `tests/`
 "noxfile.py" = ["T20"]  # Ignore `flake8-print`
-"tests/**" = ["T10", "T20"]  # Ignore `flake8-debugger` and `flake8-print`
+"tests/**" = [
+  "T10",
+  "T20",  # Ignore `flake8-debugger` and `flake8-print`
+  "F841",  # Ignore assigned but not used; inside `with` to test if throw.
+]
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index e34975a..09329e1 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -8,7 +8,7 @@
 from __future__ import annotations
 
 import itertools
-from collections.abc import Collection, Iterable, Mapping, Sequence
+from collections.abc import Collection, Iterable, Mapping, MutableSequence, Sequence
 from typing import Any, Final, cast, overload
 
 import dace
@@ -54,7 +54,6 @@ class JaxprTranslationDriver:
 
     __slots__ = (
         "_ctx_stack",  # Stack of all contexts
-        "_ctx",  # Current top of the context stack.
         "_reserved_names",  # Part of the context, but is copied.
         "_sub_translators",
         "_rev_manager",
@@ -83,6 +82,7 @@ def __init__(
         #  This member is allocated by '_init_sub_translators()' and remains allocated
         #  during the lifetime of the object.
         self._sub_translators: dict[str, translator.PrimitiveTranslator] = None  # type: ignore[assignment]
+        self._init_sub_translators(kwargs)
 
         # These names can not be used for the automatic naming of Jax variables.
         #  They differ from the forbidden names, that they denote valid SDFG names.
@@ -98,10 +98,6 @@ def __init__(
         # Context stack and current context.
         #  Only allocated during an ongoing translation
         self._ctx_stack: list[_TranslationContext] = []
-        self._ctx: _TranslationContext = None  # type: ignore[assignment]
-
-        # Creating of the subtranslators.
-        self._init_sub_translators(kwargs)
 
     def translate_jaxpr(
         self,
@@ -126,8 +122,7 @@ def translate_jaxpr(
         Args:
             inp_scalar_as_array:    Translate scalar _input_ arguments to arrays of length 1.
             name:                   Use this name for the SDFG instead some generated one.
-            reserved_names:         Prevent the generation of variables with these names,
-                                        see `self.add_array()` for more.
+            reserved_names:         Prevent the generation of variables with these names, see `self.add_array()` for more.
             allow_empty_jaxpr:      Allows empty Jaxpr.
 
         Notes:
@@ -144,14 +139,15 @@ def translate_jaxpr(
         if not jax.config.read("jax_enable_x64"):
             raise NotImplementedError("The translation only works if 'jax_enable_x64' is enabled.")
 
-        # Consume the hidden flags
+        # The point of this flag is, that one can have the translator, but still have access
+        #  the the function of self, such as `add_array()` (is needed in later stages).
         _clear_translation_ctx: bool = kwargs.pop("_clear_translation_ctx", True)
 
-        # NOTE: If `self` is already allocated, i.e. has an ongoing translation process
-        #       This function will create a new translation context. Thus the driver
-        #       will start to translate a second (nested) SDFG.
-        #       Also note that there is no mechanism that forces the integration of the
-        #       nested SDFG/Jaxpr.
+        # NOTE: If `self` is already allocated, i.e. has an ongoing translation process,
+        #       the `_allocate_translation_ctx()` function will start a new context.
+        #       Thus the driver will start to translate a second (nested) SDFG.
+        #       Also note that there is no mechanism that forces the integration of the nested SDFG/Jaxpr,
+        #       this must be done manually.
         self._allocate_translation_ctx(
             name=name,
             reserved_names=reserved_names,
@@ -163,10 +159,8 @@ def translate_jaxpr(
             jaxpr=jaxpr,
             inp_scalar_as_array=inp_scalar_as_array,
         )
+        # Note that `self` and `jsdfg` still share the same underlying memory, i.e. context.
         jsdfg: translator.TranslatedJaxprSDFG = self._translate_jaxpr_internal(jaxpr)
-
-        # If the translation context is not cleared `self` and `jsdfg` will share the same data.
-        #  There is some legitimate use for that.
         if _clear_translation_ctx:
             self._clear_translation_ctx()
 
@@ -261,22 +255,18 @@ def map_jax_var_to_sdfg(
 
     def map_jax_var_to_sdfg(
         self,
-        jax_var: str | jax_core.Atom | util.JaCeVar,
+        jax_var: jax_core.Atom | util.JaCeVar,
         allow_fail: bool = False,
     ) -> str | None:
         """Get the _name_ of the SDFG variable to which `jax_var` is referring to.
 
-        For convenient this function will consider a string as input to be already an SDFG variable name.
-
         Args:
             jax_var:        The Jax variable to look up.
             allow_fail:     If mapping is not known return `None` instead of raise `KeyError`.
         """
-        if isinstance(jax_var, str):
-            sdfg_name: str = jax_var
-        elif isinstance(jax_var, jax_core.Literal):
+        if isinstance(jax_var, jax_core.Literal):
             raise RuntimeError("There is no SDFG variable for literal '{jax_var}'.")
-        elif jax_var in self._ctx.jax_name_map:
+        if jax_var in self._ctx.jax_name_map:
             sdfg_name = self._ctx.jax_name_map[jax_var]
         elif allow_fail:
             return None
@@ -310,11 +300,8 @@ def is_allocated(self) -> bool:
 
         If `self` is allocated then there is also an ongoing translation process.
         """
-        assert isinstance(self._sub_translators, dict)
-        if self._ctx is not None:
-            assert self._ctx_stack[-1] is self._ctx
+        if len(self._ctx_stack) != 0:
             return True
-        assert len(self._ctx_stack) == 0  # type: ignore[unreachable]
         return False
 
     def is_root_translator(self) -> bool:
@@ -373,7 +360,6 @@ def add_reserved_names(
         reserved_names: None | str | Collection[str],
     ) -> JaxprTranslationDriver:
         """Adds the names listed in `reserved_names` to the internal list."""
-        assert isinstance(self._reserved_names, set)
 
         if reserved_names is None:
             return self
@@ -383,12 +369,6 @@ def add_reserved_names(
             pass
         else:
             raise TypeError(f"Does not know how to handle the type '{type(reserved_names)}'.")
-        for rev_name in reserved_names:
-            assert isinstance(rev_name, str)
-            if not util.VALID_SDFG_VAR_NAME.fullmatch(rev_name):
-                raise ValueError(
-                    f"Can not use '{rev_name}' as reserved name as it is not a valid SDFG name."
-                )
         self._reserved_names.update(reserved_names)
         return self
 
@@ -399,42 +379,31 @@ def add_array(
         as_transient: bool = True,
         alt_name: str | None = None,
         name_prefix: str | None = None,
+        find_new_name: bool | None = None,
         force_array: bool = False,
-        as_view: bool = False,
         strides: Sequence[int | dace.symbol | str] | None = None,
-        symb_strides: bool | None = None,
-        find_new_name: bool | None = None,
         allow_literals: bool = False,
         force_jax_name: bool = False,
         update_var_mapping: bool = False,
     ) -> str:
         """Creates an SDFG variable for the Jax variable `arg` and returns its SDFG name.
 
-        By default the function will create a transient, use `as_transient` to
-        change that. By default the function will honor if the Jax variable is
-        a scalar or an array. However, by setting `force_array` the function
-        will always generate an array.
+        By default the function will create a transient, use `as_transient=True` to change that.
+        By default the function will honor if the Jax variable is a scalar or an array.
+        However, by setting `force_array` the function will always generate an array.
 
         By default the name for the SDFG variable is derived from the Jax variable.
-        It is guaranteed that this name is unique in the SDFG, even in the presence
-        of nested SDFGs. By specifying `alt_name` it is possible to force a certain
-        name on a variable. It is important that if `alt_name` is specified the function
-        will either generate the variable or fail.
+        It is guaranteed that this name is unique in the SDFG, even in the presence of nested SDFGs.
+        By specifying `alt_name` it is possible to force a certain name on a variable.
+        It is important that if `alt_name` is specified the function will either generate the variable or fail.
 
         The  driver distinguishes between two kinds of "bad (SDFG) variable names".
         The first category are the forbidden names, which the function refuses to generate.
-        The second type are the so called reserved names, which were set at the beginning.
-        These names can be used if they are specified through `alt_name` but are not used
-        in automatic naming.
-
-        If nothing is specified, the strides of the data are determined by DaCe, which is
-        continuous C order. There are two ways to change that.
-        The first way is to specify the `strides` argument, which are then forwarded
-        to the underlying DaCe function. The second way is to set `symb_strides`
-        to `True` in which case the function will generate symbols and use them.
-        However, even if symbolic strides are activated, arrays with just one
-        dimensions have always a non symbolic stride of 1. Furthermore, dimensions
-        with shape 1 will always have stride 0.
+        The second type are the so called reserved names, which were set at the beginning, or by `self.add_reserved_names()`.
+        These names can be used if the name is specified through `alt_name` but are not used in automatic naming.
+
+        If nothing is specified, the strides of the data are determined by DaCe, which is continuous C order.
+        It is possible to set a certain values by setting `strides` appropriate.
 
         By default this function does not update the internal variable map.
         However, by setting `update_var_mapping` to `True` the function will
@@ -445,14 +414,9 @@ def add_array(
             as_transient:       If set, the SDFG variable is a transient, `True` by default.
             alt_name:           Try to create the variable with this name; either succeed or fail.
             name_prefix:        If given and in automatic naming mode, add this prefix to the name.
+            find_new_name:      The translator will try to find a new name if the designated is already occupied.
             force_array:        Instead of a `dace.Scalar` create a `dace.Array` with one element.
-            as_view:            Creates a view instead of an array, if it is a scalar
-                                    it is silently ignored.
             strides:            Instead of the default strides use these values.
-            symb_strides:       Create symbols and use them for fully symbolic strides.
-            find_new_name:      The translator will try to find a new name if the designated
-                                    is already occupied. This does not work if the name
-                                    was supplied by `alt_name`.
             allow_literals:     If `True` then also allows JaxLiterals as `arg`.
             force_jax_name:     If `True` then, the verbatim Jax name will be used.
             update_var_mapping: Update the internal variable mapping; by default `False`.
@@ -460,13 +424,6 @@ def add_array(
         Notes:
             If this function is used directly a user is advised to always set
                 `update_var_mapping` to `True`.
-            If `find_new_name` is `None` the default, the function will only
-                look for a new name if there is a need for it. If it is `True`
-                the function will always look for a new name, even if the initial
-                name was fine. If it is `False` the function will never look for
-                a new new, thus if the name is unavailable an error is generated.
-                However, this excluds variable names that are known.
-            Specifying `alt_name` implies `find_new_name=False`.
             If you need to create a special array, you can use `jace.util.JaCeVar`
                 to create a pseudo Jax variable.
         """
@@ -483,7 +440,7 @@ def add_array(
             #  a variable for a second time. It is, however, okay to use one as template,
             #  if another name is specified from the beginning.
             raise ValueError(
-                f"Tried to create variable '{arg}' again, without specifying an alternative name.."
+                f"Tried to create variable '{arg}' again, without specifying an alternative name."
             )
         if force_jax_name:
             if alt_name is not None:
@@ -494,11 +451,12 @@ def add_array(
                 raise ValueError(
                     f"Specified 'force_jax_name', but passed '{name_prefix}' as 'name_prefix'."
                 )
+            if find_new_name:
+                raise ValueError("Specified `force_jax_name` but also wanted a new name.")
+            find_new_name = False
             alt_name = util._propose_jax_name(arg, self._ctx.jax_name_map)
         if alt_name is not None:
-            assert isinstance(
-                alt_name, str
-            ), f"Got '{type(alt_name)}' instead of 'str' for 'alt_name'."
+            assert isinstance(alt_name, str)
             find_new_name = False  # If a name was given, then use it no matter what.
             if len(alt_name) == 0:
                 raise ValueError("Passed an empty 'alt_name'.")
@@ -506,32 +464,30 @@ def add_array(
                 raise ValueError("'alt_name' is a forbidden name.")
             if not util.VALID_SDFG_VAR_NAME.fullmatch(alt_name):
                 raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
+            if update_var_mapping and arg in self._ctx.jax_name_map:
+                raise ValueError(f"Variable '{alt_name}' already registered.")
+            if alt_name in self._ctx.sdfg.arrays:
+                raise ValueError(f"Variable '{alt_name}' already exists.")
             if name_prefix is not None:
                 raise ValueError(
                     f"Specified 'name_prefix' ('{name_prefix}') but passed '{alt_name}' as 'alt_name'."
                 )
-            if alt_name in self._ctx.sdfg.arrays:
-                raise ValueError(f"Variable '{alt_name}' already exists.")
         if name_prefix is not None:
             assert isinstance(name_prefix, str)
             if len(name_prefix) == 0:
                 raise ValueError("Specified an empty 'name_prefix'.")
-        if as_view and (not as_transient):
-            raise ValueError("You tried to create a global view, which is not allowed.")
 
         # Checking the strides.
-        if (symb_strides is None) and (strides is None):
-            def_symb_stride = False  # default value for symbolic strides
-            symb_strides = False if (len(shape) <= 1) else def_symb_stride  # Keep for the future
-        elif (symb_strides is not None) and (strides is not None):
-            raise ValueError("Specified 'symb_strides' and 'stride at the same time.")
-        elif strides is not None:
+        if strides is not None:
+            if is_scalar:
+                raise ValueError("Specified a stride for a scalar.")
+            if isinstance(strides, (str, dace.symbol, int)):
+                strides = (strides,)
+            assert isinstance(strides, tuple)
             if len(strides) != len(shape):
                 raise ValueError(
                     f"'strides' has length {len(strides)}, but array rank is {len(shape)}."
                 )
-        else:
-            assert isinstance(symb_strides, bool)
 
         # Now we determine the proposed name of the variable.
         #  Depending on the situation, we will further manipulate it.
@@ -539,20 +495,17 @@ def add_array(
             prop_name = alt_name  # Just for completion: will be ignored later
         elif isinstance(arg, (jax_core.Var, util.JaCeVar)):
             prop_name = util._propose_jax_name(arg, self._ctx.jax_name_map)
-            if prop_name.startswith("__"):
-                raise ValueError(
-                    f"You tried to create the variable '{prop_name}' which"
-                    "starts with two underscores, use 'alt_name' for that."
-                )
+            assert not prop_name.startswith("__")
             if name_prefix is not None:
                 prop_name = name_prefix + prop_name
         elif isinstance(arg, jax_core.Literal):  # type: ignore[unreachable]
-            if not allow_literals:
+            if not allow_literals:  # Allows to use a literal as template.
                 raise NotImplementedError("Jax Literals are not supported.")
             if alt_name is None:
                 raise ValueError(f"Passed literal '{arg}', but not specified a name to use.")
         else:
             raise TypeError(f"Does not know how to handle '{type(arg).__name__}'.")
+
         if alt_name is None:
             # If we are the root translator, then we will use `prop_name` directly;
             #  otherwise we will append the revision of `self` to the name.
@@ -560,6 +513,7 @@ def add_array(
                 "" if self.is_root_translator() else f"_rev_idx{self._ctx.rev_idx}"
             )
         else:
+            # Use the supplied name directly.
             arg_name = str(alt_name)
 
         # Determine if we should look for a new name or not, if nothing was specified
@@ -567,10 +521,10 @@ def add_array(
             if arg_name in self._reserved_names:
                 find_new_name = True
             if arg_name in self._forbidden_names:
+                # This is not an error, but happens if we handle Jax variable `if`.
                 find_new_name = True
 
         if find_new_name:
-            # We have to find a new name.
             name_tmpl = "_jax_variable__" + arg_name + "__{}"
             for iCounter in range(1000):
                 _arg_name = name_tmpl.format(iCounter)
@@ -597,34 +551,13 @@ def add_array(
         # Promotion of scalar to array.
         if is_scalar and force_array:
             shape = (1,)
-            symb_strides = False
             strides = None
             is_scalar = False
 
-        # Set the stride if we have to change.
-        if strides is not None:
-            strides = tuple(strides)
-            assert len(strides) == len(shape)
-
-        elif (symb_strides is True) and (not is_scalar):
-            strides = [
-                dace.symbol(f"{arg_name}_stride{dim}", dace.int64) if size >= 2 else 0
-                for dim, size in enumerate(shape)
-            ]
-
         if is_scalar:
             self._ctx.sdfg.add_scalar(
                 name=arg_name, storage=storage, dtype=dtype, transient=as_transient
             )
-        elif as_view:
-            self._ctx.sdfg.add_view(
-                name=arg_name,
-                shape=shape,
-                strides=strides,
-                offset=offset,
-                storage=storage,
-                dtype=dtype,
-            )
         else:
             self._ctx.sdfg.add_array(
                 name=arg_name,
@@ -641,7 +574,27 @@ def add_array(
 
         return arg_name
 
+    @overload
     def create_jax_var_list(
+        self,
+        jax_var_list: Sequence[jax_core.Atom | util.JaCeVar],
+        prevent_creation: bool = False,
+        only_creation: bool = True,
+        handle_literals: bool = False,
+        **kwargs: Any,
+    ) -> list[str]: ...
+
+    @overload
+    def create_jax_var_list(  # type: ignore[misc]
+        self,
+        jax_var_list: Sequence[jax_core.Atom | util.JaCeVar],
+        prevent_creation: bool = False,
+        only_creation: bool = False,
+        handle_literals: bool = False,
+        **kwargs: Any,
+    ) -> list[None | str]: ...
+
+    def create_jax_var_list(  # type: ignore[misc]
         self,
         jax_var_list: Sequence[jax_core.Atom | util.JaCeVar],
         prevent_creation: bool = False,
@@ -655,7 +608,7 @@ def create_jax_var_list(
         If no SDFG variable is known the function will create one using `add_array()`, with `update_var_mapping` set to `True`.
 
         By setting `prevent_creation` the function will not create any new SDFG variables.
-        This mode is used to indicate that all variables already have to exists already.
+        This mode is used to indicate that all variables have to exists already.
         By setting `only_creation` the function will only create new SDFG variables.
         If a Jax variable already has a known SDFG equivalent an error is generated.
 
@@ -692,7 +645,7 @@ def create_jax_var_list(
                     raise ValueError(f"'only_creation' given '{jax_var}' already exists.")
                 else:
                     sdfg_name = mapped_sdfg_name
-                # `add_jax_name_mapping` is save, because if the mapping does already exists it is a no ops.
+                # Calling `add_jax_name_mapping` is save, because if the mapping does already exists it is a no ops.
                 self.add_jax_name_mapping(jax_var, sdfg_name)
             else:
                 raise TypeError(f"Does not know how to handle '{type(jax_var).__name__}'")
@@ -727,7 +680,7 @@ def _create_initial_input(
 
         # Handle the initial input arguments
         sdfg: dace.SDFG = self._ctx.sdfg
-        init_in_var_names: Sequence[str] = self.create_jax_var_list(  # type: ignore[assignment]
+        init_in_var_names: Sequence[str] = self.create_jax_var_list(
             jax_var_list=jaxpr.jaxpr.invars,
             only_creation=True,
             as_transient=True,  # Explicit transient; no error!
@@ -735,10 +688,11 @@ def _create_initial_input(
             force_array=inp_scalar_as_array,
             force_jax_name=self.is_root_translator(),  # Ensure root get pure Jax names.
         )
-        sdfg.arg_names.extend(init_in_var_names)
+        # This forces the code to only accept kwargs
+        #  Is also part of "what a canonical sdfg" is.
+        sdfg.arg_names = []
 
-        # Store the list of inputs in self; this is done to simplify exporting.
-        #  The output list is populated by `self._translate_jaxpr_internal()`
+        # The output list is populated by `self._translate_jaxpr_internal()`
         self._ctx.inp_names = tuple(init_in_var_names)
 
         return init_in_var_names
@@ -759,25 +713,22 @@ def _create_constants(
 
         if not self.is_allocated():
             raise RuntimeError("Driver is not allocated, can not create constants.")
-        if not len(jaxpr.consts):
+        if len(jaxpr.consts) == 0:
             return []
 
-        const_names: list[str] = []
-        for cJaxVar, cValue in zip(jaxpr.jaxpr.constvars, jaxpr.consts, strict=False):
-            c_sdfg_name = self.add_array(
-                arg=cJaxVar,
-                name_prefix="__const_",
-                as_transient=True,
-                symb_strides=False,
-                strides=None,
-                update_var_mapping=True,
-            )
+        sdfg_const_names: Sequence[str] = self.create_jax_var_list(
+            jax_var_list=jaxpr.jaxpr.constvars,
+            only_creation=True,
+            strides=None,
+            name_prefix="__const_",
+        )
+
+        for sdfg_name, const_value in zip(sdfg_const_names, jaxpr.consts, strict=True):
             # We have to pass the data descriptor to `add_constant()`, otherwise a new one would be created.
             self._ctx.sdfg.add_constant(
-                c_sdfg_name, deepcopy(cValue), self._ctx.sdfg.arrays[c_sdfg_name]
+                sdfg_name, deepcopy(const_value), self._ctx.sdfg.arrays[sdfg_name]
             )
-            const_names.append(c_sdfg_name)
-        return const_names
+        return sdfg_const_names
 
     def _allocate_translation_ctx(
         self,
@@ -797,11 +748,12 @@ def _allocate_translation_ctx(
         from ._translation_context import _TranslationContext
 
         # Create a new translation context and put it on the stack.
-        self._ctx = _TranslationContext(
-            rev_idx=next(self._rev_manager),
-            name=name,
+        self._ctx_stack.append(
+            _TranslationContext(
+                rev_idx=next(self._rev_manager),
+                name=name,
+            )
         )
-        self._ctx_stack.append(self._ctx)
 
         if self.is_root_translator():
             # The root translation, i.e. the very first context allocation
@@ -817,6 +769,12 @@ def _allocate_translation_ctx(
 
         return self
 
+    @property
+    def _ctx(self) -> _TranslationContext:
+        """Returns the currently active translation context."""
+        assert len(self._ctx_stack) != 0, "No context is active."
+        return self._ctx_stack[-1]
+
     def _init_sub_translators(
         self,
         subtrans_args: Mapping[str, Any],
@@ -826,9 +784,9 @@ def _init_sub_translators(
         The function forwards `kwargs` to the constructor of the subtranslators.
         However, it will remove all arguments starting with an underscore.
         """
-        assert self._sub_translators is None
+        from jace.translator import sub_translators  # Cyclic import
 
-        subtrans_args = {k: v for k, v in subtrans_args.items() if not k.startswith("_")}  # type: ignore[unreachable]
+        subtrans_args = {k: v for k, v in subtrans_args.items() if not k.startswith("_")}
         prim_translators: dict[str, translator.PrimitiveTranslator] = {}
         for prim_translator_cls in sub_translators._get_subtranslators_cls():
             prim_translator: translator.PrimitiveTranslator = prim_translator_cls.CREATE(
@@ -838,7 +796,7 @@ def _init_sub_translators(
 
             for handled_primitive in handled_primitives:
                 if handled_primitive in prim_translators:
-                    raise RuntimeError(f"Multiple sub translators for '{handled_primitive}' found.")
+                    raise RuntimeError(f"Multiple translators for '{handled_primitive}' found.")
                 prim_translators[handled_primitive] = prim_translator
         self._sub_translators = prim_translators
 
@@ -848,7 +806,7 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
         """This function deallocate the translation context of `self`.
 
         Notes:
-            While it is allowed for outside code to call this explicitly function,
+            While it is allowed for outside code to call this function explicit
                 it is is most likely an error.
             If `self` is not allocated this function acts as a noops.
             The reserved names are only deallocated if `self` is a root translator.
@@ -856,19 +814,14 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
         if not self.is_allocated():
             return self
 
-        assert self._ctx is self._ctx_stack[-1], "Inconsistent stack detected."
         if self.is_root_translator():
             self._rev_manager = itertools.count(0, 1)
             self._reserved_names = None  # type: ignore[assignment]
-
-            self._ctx = None  # type: ignore[assignment]
             self._ctx_stack.pop()
 
         else:
             # Restore the previous state
-            assert len(self._ctx_stack) > 1
             self._ctx_stack.pop()
-            self._ctx = self._ctx_stack[-1]
         return self
 
     def _find_sub_translator_for(
@@ -876,8 +829,6 @@ def _find_sub_translator_for(
         eqn: jax_core.JaxprEqn,
     ) -> translator.PrimitiveTranslator:
         """Returns the appropriate subtranslator for equation `eqn`."""
-        assert self._sub_translators is not None
-
         prim_name: str = eqn.primitive.name
         if prim_name not in self._sub_translators:
             raise NotImplementedError(f"No subtranslators known to handle '{prim_name}'.")
@@ -886,7 +837,6 @@ def _find_sub_translator_for(
 
     def _translate_single_eqn(
         self,
-        jaxpr: jax_core.ClosedJaxpr,
         eqn: jax_core.JaxprEqn,
     ) -> tuple[Sequence[str | None], Sequence[str]]:
         """Translate `eqn` into its SDFG equivalent.
@@ -902,17 +852,14 @@ def _translate_single_eqn(
             The inputs might contain `None` which indicates that that input was a Jax Literal.
 
         Notes:
-            While `jaxpr` must be a `ClosedJaxpr`, `eqn` must come from the unclosed instance.
+            The equation, `eqn` must come from the unclosed jaxpr instance.
             The function will perform some consistency checking after the subtranslator was called.
         """
-        assert isinstance(eqn, jax_core.JaxprEqn)
-        assert isinstance(jaxpr, jax_core.ClosedJaxpr)
-
         if len(eqn.effects) != 0:
             raise NotImplementedError(f"Equation '{eqn}' has side effects.")
 
         # Input/Output variables
-        #  Using a tuple for the input ensures that it is not modified.
+        #  Using a tuple for the input ensures that it cannot be modified.
         in_var_names: Sequence[str | None] = tuple(
             self.create_jax_var_list(
                 eqn.invars,
@@ -920,7 +867,7 @@ def _translate_single_eqn(
                 handle_literals=True,  #  but they can be literals.
             )
         )
-        out_var_names: Sequence[str] = self.create_jax_var_list(  # type: ignore[assignment]
+        out_var_names: MutableSequence[str] = self.create_jax_var_list(
             eqn.outvars,
             only_creation=True,  # Output must not exist yet.
         )
@@ -932,7 +879,7 @@ def _translate_single_eqn(
         last_term_state: dace.SDFGState = self.get_terminal_sdfg_state()  # noqa: F841 # Will be used later
         eqn_state = self.append_new_state(
             label=f"{eqn.primitive.name}_{out_var_names[0]}",
-            prev_state=None,  # forces terminal state
+            prev_state=None,  # forces terminal state to use
         )
 
         # Now perform the actual translation of the equation.
@@ -957,40 +904,15 @@ def _translate_single_eqn(
 
         # In case a subtranslator decided to not use the variables we created for it, which is allowed
         #  but he must update the `out_var_names` list correctly, we will now verify this.
-        if len(out_var_names) != len(eqn.outvars):
-            raise RuntimeError(
-                f"Modified 'out_var_names'! Expected {len(eqn.outvars)} variables."
-                f" but found {len(out_var_names)}"
-            )
         for expectedSDFGName, jax_var in zip(out_var_names, eqn.outvars, strict=True):
             mapped_sdfg_name = self.map_jax_var_to_sdfg(jax_var)
-            jax_name = util.get_jax_var_name(jax_var)
             if mapped_sdfg_name != expectedSDFGName:
                 raise ValueError(
                     f"Mapping inconsistency detected, expected that Jax variable"
-                    f" '{jax_name}' maps to '{expectedSDFGName}' but it actually"
+                    f" '{jax_var}' maps to '{expectedSDFGName}' but it actually"
                     f" maps to '{mapped_sdfg_name}'."
                 )
 
-        # Views can only be used if there is a direct connection, between source,
-        #  view and destination (place of usage). Because of the way how Jax works,
-        #  it is impossible that an output variable is a View.
-        for outVarName, jax_var in zip(out_var_names, eqn.outvars, strict=True):
-            sdfg_var = self.get_array(outVarName)
-            if isinstance(sdfg_var, (dace.data.Array, dace.data.Scalar)):
-                pass
-            elif isinstance(sdfg_var, dace.data.View):
-                raise TypeError(
-                    f"For Jax variable '{util.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}'),"
-                    f" which is an output, you used a View, which is not possible."
-                    " It must either be an array or a scalar."
-                )
-            else:
-                raise NotImplementedError(
-                    f"Output variable '{util.get_jax_var_name(jax_var)}' (SDFG: '{outVarName}')"
-                    f" is of type '{type(sdfg_var).__name__}' which I does not know how to handle."
-                )
-
         # Modify terminal root state of 'self'
         self._ctx.terminal_state = new_sdfg_term_state
 
@@ -1015,26 +937,22 @@ def _translate_jaxpr_internal(
                 this is used by Jax to indicate that they are never read.
                 Such variables are included by some transformations such as `grad()`.
         """
-        assert isinstance(jaxpr, jax_core.ClosedJaxpr)
-        assert self.is_allocated()
-
         nb_translated_eqn: int = 0
         out_var_names: Sequence[str] = []
-        for eqn in jaxpr.jaxpr.eqns:  # Translate the equations one by one.
-            assert len(eqn.effects) == 0
-            if len(eqn.outvars) == 0:  # Do we need this special case.
-                continue  #  Looks more like internal Jax error.
+
+        # Translate the equations one by one.
+        for eqn in jaxpr.jaxpr.eqns:
             if any(util.is_drop_var(outVar) for outVar in eqn.outvars):
-                assert (len(eqn.outvars) == 1) or all(
-                    util.is_drop_var(outVar) for outVar in eqn.outvars
-                )
+                assert all(util.is_drop_var(outVar) for outVar in eqn.outvars)
                 continue
-            _, out_var_names = self._translate_single_eqn(jaxpr=jaxpr, eqn=eqn)
+            _, out_var_names = self._translate_single_eqn(eqn=eqn)
             nb_translated_eqn += 1
 
+        # There were no equation, so handle the copying of input to output.
         if nb_translated_eqn == 0:
-            # There were no equation, so handle the copying of input to output.
             out_var_names = self._handle_null_jaxpr(jaxpr)
+
+        # Set the output names inside the context.
         self._ctx.out_names = tuple(out_var_names)
 
         return self._export_context()
@@ -1065,9 +983,9 @@ def _handle_null_jaxpr(
     ) -> Sequence[str]:
         """This function is called in case a `Jaxpr` with zero equations is encountered.
 
-        A function with zero equation might still have output, in which case an
-        input is copied to an output. This function will handle the copying from
-        the input into the corresponding output variable.
+        A function with zero equation might still have output, in which case an input is copied to an output.
+        This function will handle the copying from the input into the corresponding output variable.
+        It is important that the function will remove the input and output variables from the internal mapping.
 
         Returns:
             The function returns a list denoting the SDFG variables that refers to the output.
@@ -1082,47 +1000,46 @@ def _handle_null_jaxpr(
         assert len(self._ctx.inp_names) > 0
         assert len(self._ctx.out_names) == 0
 
-        # We will use this list to build the list of output names.
-        #  This is important for the exporter.
+        # List of the output variables.
         out_var_names: list[str] = []
 
         # If we are here then we are dealing with a nested SDFG/Jaxpr.
-        #  Because an input also serves as output, the nested SDFG will have connector pairs
-        #  with the same name, one serving as input the other as output, with the same name.
+        #  Because an input also serves as output, the nested SDFG will have a connector for the
+        #  input and one for the output, but both with the same name.
         #  This will make node validation fail.
-        #  Thus we have to introduce a some fake output name and explicitly copy the data around.
-        #  Once DaCe will inline the nested SDFG it will remove this intermediate copy.
+        #  We have to work around by introducing some fake copies, which will be removed by DaCe later.
         for jax_out_var in jaxpr.jaxpr.outvars:
-            jax_inp_name = util.get_jax_var_name(
-                jax_out_var
-            )  # Since output == input their names must be the same.
-            assert self.map_jax_var_to_sdfg(jax_inp_name, allow_fail=True)
+            # Since the output is also used as an input the variable mapping must be known.
+            sdfg_in_name: str = self.map_jax_var_to_sdfg(jax_out_var)
 
-            # This is the name we give to fictive Jax variable serving as output.
-            jax_out_name = f"_zero_equation_output_{self.map_jax_var_to_sdfg(jax_out_var)}"
-
-            # Now create the SDFG variable for it, give it a unique name.
+            # Now we create a variable that serves as true output, however, since the Jax variable
+            #  is already known we can not update the variable mapping.
             sdfg_out_name = self.add_array(
                 jax_out_var,
                 as_transient=True,
                 name_prefix="_zero_equation_output_for_",
                 update_var_mapping=False,
             )
+            out_var_names.append(sdfg_out_name)
 
-            # We now create a new mapping, we do this that we will later find the variable again.
-            self.add_jax_name_mapping(jax_var=jax_out_name, sdfg_name=sdfg_out_name)
-            out_var_names.append(jax_out_name)
-
-            # Now copy the input into the fake output variable.
-            inp_acc = self._ctx.start_state.add_read(self.map_jax_var_to_sdfg(jax_inp_name))
-            out_acc = self._ctx.start_state.add_write(self.map_jax_var_to_sdfg(jax_out_var))
+            # Now we perform the copy from the input variable in the newly created output variable.
+            inp_acc = self._ctx.start_state.add_read(sdfg_in_name)
+            out_acc = self._ctx.start_state.add_write(sdfg_out_name)
             self._ctx.start_state.add_nedge(
                 src=inp_acc,
                 dst=out_acc,
                 data=dace.Memlet.from_array(
-                    jax_inp_name, self.get_array(self.map_jax_var_to_sdfg(jax_inp_name))
+                    sdfg_in_name, self.get_array(self.map_jax_var_to_sdfg(sdfg_in_name))
                 ),
             )
+
+            # A Jax variable now has two SDFG equivalent, the input, that was previously created by
+            #  `self._create_initial_input()` and the `sdfg_out_name` we just created.
+            #  But we can not add this to the mapping, because of this situation we will now remove
+            #  the variable from the mapping. I am open for different approaches.
+            #  Note that input variables that are not used, will remain in the mapping.
+            self._ctx.jax_name_map.pop(jax_out_var)
+
         return tuple(out_var_names)
 
     # fmt: off
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 46ea10b..1570471 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -32,8 +32,7 @@ def test_driver_alloc() -> None:
     """Tests the state right after allocation."""
     driver = jtrans.JaxprTranslationDriver()
     assert not driver.is_allocated(), "Driver was created allocated."
-    assert driver._ctx is None
-    assert len(driver._ctx_stack) == 0  # type: ignore[unreachable]
+    assert len(driver._ctx_stack) == 0
 
     # The reserved names will be tested in `test_driver_fork()`.
     sdfg_name = "qwertzuiopasdfghjkl"
@@ -78,7 +77,6 @@ def test_driver_nested() -> None:
     assert len(driver._ctx_stack) == 2
     assert driver._ctx is driver._ctx_stack[-1]
     assert driver._ctx is not driver._ctx_stack[0]
-    assert org_ctx is driver._ctx_stack[0]
 
     for member_name in driver._ctx.__slots__:
         org = getattr(org_ctx, member_name)
@@ -95,8 +93,7 @@ def test_driver_nested() -> None:
 
     # Now if we fully deallocate then we expect that it is fully deallocated.
     driver._clear_translation_ctx()
-    assert driver._ctx is None
-    assert len(driver._ctx_stack) == 0  # type: ignore[unreachable]
+    assert len(driver._ctx_stack) == 0
     assert driver._reserved_names is None
 
 
@@ -136,8 +133,8 @@ def test_driver_append_state(alloc_driver: jtrans.JaxprTranslationDriver) -> Non
     assert next(iter(sdfg.in_edges(non_terminal_state))).src is terminal_state_1
 
 
-def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
-    """This function tests the array creation routines.
+def test_driver_scalar(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
+    """This function tests the array creation routines, especially the scalar part.
 
     However, it does so without using Jax variables.
     """
@@ -169,41 +166,91 @@ def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
     assert scal2.strides == (1,)
     assert scal2.dtype == scal2_j.dtype
 
-    # Create a scalar force it as an array and use symbolic strides.
+    # Using a special name for the variable
     scal3_j = JaCeVar("scal3", (), dace.int64)
+    scal3_n = "scal3_special_name"
     scal3_: str = alloc_driver.add_array(
         arg=scal3_j,
-        force_array=True,
-        symb_strides=True,  # Will have no effect.
+        alt_name=scal3_n,
+        update_var_mapping=True,
     )
-    scal3: Data = alloc_driver.get_array(scal3_)
-    assert isinstance(scal2, Array)
-    assert scal3_ == scal3_j.name
-    assert scal3.shape == (1,)
-    assert scal3.strides == (1,)
-    assert scal3.dtype == scal3_j.dtype
+    assert scal3_ == scal3_n
+    assert scal3_ == alloc_driver.map_jax_var_to_sdfg(scal3_j)
 
-    # Using a special name for the variable
-    scal4_j = scal3_j
-    scal4_n = "scal4_special_name"
-    scal4_: str = alloc_driver.add_array(
+    # Test the prefix functionality
+    scal4_j = JaCeVar("scal4", (), dace.float64)
+    scal4_p = "my_prefix"
+    scal4_n = "scal4_unused_name"
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=re.escape(
+            f"Specified 'name_prefix' ('{scal4_p}') but passed '{scal4_n}' as 'alt_name'."
+        ),
+    ):
+        scal4_: str = alloc_driver.add_array(
+            arg=scal4_j,
+            alt_name=scal4_n,
+            name_prefix=scal4_p,
+        )
+    # Now create it correctly
+    scal4_ = alloc_driver.add_array(
         arg=scal4_j,
-        alt_name=scal4_n,
-        update_var_mapping=True,
+        name_prefix=scal4_p,
     )
-    assert scal4_ == scal4_n
-    assert scal4_ == alloc_driver.map_jax_var_to_sdfg(scal4_j)
+    assert scal4_.startswith(scal4_p)
+    assert scal4_j.name in scal4_
 
-    # Test the prefix functionality
+    # Test the strides, or the inability to use it.
     scal5_j = JaCeVar("scal5", (), dace.float64)
-    scal5_p = "my_prefix"
-    scal5_: str = alloc_driver.add_array(
-        arg=scal5_j,
-        name_prefix=scal5_p,
+    with pytest.raises(
+        expected_exception=ValueError,
+        match="Specified a stride for a scalar.",
+    ):
+        scal5_: str = alloc_driver.add_array(arg=scal5_j, strides=(3,))
+
+    # test the force jax name feature
+    scal6_j = JaCeVar("scal6", (), dace.float64)
+    scal6_n: str = "scal6_name"
+    scal6_np: str = "scal6_name_prefix"
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=f"Specified 'force_jax_name', but passed '{scal6_n}' as 'alt_name'.",
+    ):
+        scal6_: str = alloc_driver.add_array(
+            arg=scal6_j,
+            alt_name=scal6_n,
+            force_jax_name=True,
+        )
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=f"Specified 'force_jax_name', but passed '{scal6_np}' as 'name_prefix'.",
+    ):
+        scal6_ = alloc_driver.add_array(
+            arg=scal6_j,
+            name_prefix=scal6_np,
+            force_jax_name=True,
+        )
+    with pytest.raises(
+        expected_exception=ValueError,
+        match="Specified `force_jax_name` but also wanted a new name.",
+    ):
+        scal6_ = alloc_driver.add_array(
+            arg=scal6_j,
+            force_jax_name=True,
+            find_new_name=True,
+        )
+    scal6_ = alloc_driver.add_array(
+        arg=scal6_j,
+        force_jax_name=True,
     )
-    assert scal5_.startswith(scal5_p)
-    assert scal5_j.name in scal5_
+    assert scal6_ == scal6_j.name
+
 
+def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
+    """This function tests the array creation routines.
+
+    However, it does so without using Jax variables.
+    """
     # Allocating an array
     arr1_j = JaCeVar("arr1", (5, 3), dace.float32)
     arr1_: str = alloc_driver.add_array(
@@ -216,7 +263,7 @@ def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
     assert arr1.strides == (3, 1)
     assert arr1.dtype == arr1_j.dtype
 
-    # Create a variable that has a name that is already known.
+    # Create a variable that has a sdfg name that is already known.
     arr2_j = JaCeVar(arr1_, (10,), dace.float64)
     with pytest.raises(
         expected_exception=ValueError,
@@ -224,10 +271,9 @@ def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
     ):
         arr2_: str = alloc_driver.add_array(arg=arr2_j)
     with pytest.raises(expected_exception=ValueError, match=f"Variable '{arr1_}' already exists."):
-        # `alt_name` will not work because variable still exists.
+        # `alt_name` will not work because name still exists.
         arr2_ = alloc_driver.add_array(arg=arr2_j, alt_name=arr2_j.name)
     # However, specifying `find_new_name` will solve this issue
-    #  NOTE: Doing this is not a good idea.
     arr2_ = alloc_driver.add_array(
         arg=arr2_j,
         find_new_name=True,
@@ -246,36 +292,6 @@ def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
     assert arr3.shape == arr3_j.shape
     assert arr3.strides == arr3_st
 
-    # Test if specifying `symb_strides` and a stride at the same time is an error.
-    arr4_j = JaCeVar("arr4", arr3_j.shape, dace.uintp)
-    arr4_st = arr3_st
-    with pytest.raises(
-        expected_exception=ValueError,
-        match="Specified 'symb_strides' and 'stride at the same time.",
-    ):
-        arr4_: str = alloc_driver.add_array(
-            arg=arr4_j,
-            symb_strides=True,
-            strides=arr4_st,
-        )
-
-    # Test if specifying the symbolic stride alone works.
-    #  Because a shape is `1` there should be no symbolic for it.
-    arr4_ = alloc_driver.add_array(
-        arg=arr4_j,
-        symb_strides=True,
-    )
-    arr4: Data = alloc_driver.get_array(arr4_)
-    assert isinstance(arr4, Array)
-    assert arr4.shape == arr4_j.shape
-
-    for shp, stri in zip(arr4.shape, arr4.strides):
-        if shp == 1:
-            assert isinstance(stri, int)
-            assert stri == 0, f"Expected a stride of 0, but got '{stri}'."
-        else:
-            assert isinstance(stri, (str, dace.symbol))
-
 
 def test_driver_array2() -> None:
     """This function tests the array creation routine with respect to the automatic naming.
diff --git a/tests/test_sub_translators_alu.py b/tests/test_sub_translators_alu.py
index d6bc7b9..50128e8 100644
--- a/tests/test_sub_translators_alu.py
+++ b/tests/test_sub_translators_alu.py
@@ -51,5 +51,16 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
 
 
-if __name__ == "__main__":
-    test_add()
+def test_add3():
+    """Simple add function, with constant."""
+    jax.config.update("jax_enable_x64", True)
+
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A + jax.numpy.array([[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]])
+
+    A = np.ones((3, 3), dtype=np.float64)
+
+    ref = testee(A)
+    res = jutil._jace_run(testee, A)
+
+    assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."

From a0bcfbb71aedada614fc9224cc8a19b456a60e27 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 12:56:58 +0200
Subject: [PATCH 139/458] Removed the `TranslationContext` object.

The job of the context and the return value will now be done by the `TranslatedJaxprSDFG` object in "Personalunion".
---
 src/jace/translator/_translation_context.py   | 95 -------------------
 .../translator/jaxpr_translator_driver.py     | 21 +---
 src/jace/translator/translated_jaxpr_sdfg.py  | 87 +++++++++++------
 3 files changed, 64 insertions(+), 139 deletions(-)
 delete mode 100644 src/jace/translator/_translation_context.py

diff --git a/src/jace/translator/_translation_context.py b/src/jace/translator/_translation_context.py
deleted file mode 100644
index 6253118..0000000
--- a/src/jace/translator/_translation_context.py
+++ /dev/null
@@ -1,95 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""This module contains the translation context for the `JaxprTranslationDriver`."""
-
-from __future__ import annotations
-
-from collections.abc import MutableMapping
-
-import dace
-from jax import core as jax_core
-
-from jace import translator, util
-
-
-class _TranslationContext:
-    """Represents the context of a `JaxprTranslationDriver`.
-
-    Essentially it contains the following variables:
-    - `sdfg`:
-        The SDFG object that is under construction.
-    - `start_state`:
-        The first state in the SDFG state machine.
-    - `terminal_state`:
-        The current terminal state of the SDFG state machine.
-    - `jax_name_map`:
-        A `dict` that maps every Jax variable to its corresponding SDFG variable _name_.
-    - `inp_names`:
-        A `list` of the SDFG variable names that are used for input.
-        Their order is the same as in `Jaxpr.invars`.
-        Filled at the very beginning.
-    - `out_names`:
-        A `list` of the SDFG variables names that are used for output,
-        Their order is the same as in `Jaxpr.outvars`.
-        Only filled at the very end.
-    - `rev_idx`:
-        The revision index (used to generate unique names in the translation.
-
-    Notes:
-        It might be that a name appears in both the `inp_names` and `out_names` list.
-            This happens if the corresponding variable is used as both input and output.
-            In Jax this is called argument donation.
-        This class is similar to but different to `TranslatedJaxprSDFG`.
-            This class is used to represent the dynamic state of the translation object,
-            `TranslatedJaxprSDFG` is used to result the end.
-    """
-
-    __slots__ = (
-        "sdfg",
-        "start_state",
-        "terminal_state",
-        "jax_name_map",
-        "inp_names",
-        "out_names",
-        "rev_idx",
-    )
-
-    def __init__(
-        self,
-        rev_idx: int,
-        name: str | None = None,
-    ) -> None:
-        """Initializes the context.
-
-        Args:
-            rev_idx:    The revision index of the context.
-            name:       Name of the SDFG object.
-        """
-        if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
-            raise ValueError(f"'{name}' is not a valid SDFG name.")
-
-        self.sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
-        self.start_state: dace.SDFGState = self.sdfg.add_state(
-            label="initial_state", is_start_block=True
-        )
-        self.terminal_state: dace.SDFGState = self.start_state
-        self.jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str] = {}
-        self.inp_names: tuple[str, ...] = ()
-        self.out_names: tuple[str, ...] = ()
-        self.rev_idx: int = rev_idx
-
-    def to_translated_jaxpr_sdfg(self) -> translator.TranslatedJaxprSDFG:
-        """Transforms `self` into a `TranslatedJaxprSDFG`."""
-        return translator.TranslatedJaxprSDFG(
-            sdfg=self.sdfg,
-            start_state=self.start_state,
-            terminal_state=self.terminal_state,
-            jax_name_map=self.jax_name_map,
-            inp_names=self.inp_names,
-            out_names=self.out_names,
-        )
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 09329e1..e319389 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -75,8 +75,6 @@ def __init__(
                 the shared part. This flag is provided only for implementing
                 `self.fork()` using it is an error and undefined behaviour.
         """
-        from ._translation_context import _TranslationContext
-
         # Contains all the subtranslators that we need.
         #  They are partitioned by the names of the primitive they have registered for.
         #  This member is allocated by '_init_sub_translators()' and remains allocated
@@ -97,7 +95,7 @@ def __init__(
 
         # Context stack and current context.
         #  Only allocated during an ongoing translation
-        self._ctx_stack: list[_TranslationContext] = []
+        self._ctx_stack: list[translator.TranslatedJaxprSDFG] = []
 
     def translate_jaxpr(
         self,
@@ -671,7 +669,6 @@ def _create_initial_input(
         Notes:
             This function will fill the internal list of inputs.
         """
-
         if not self.is_allocated():
             raise RuntimeError("Driver is not allocated, can not create constants.")
         if len(self._ctx.inp_names) != 0:
@@ -745,11 +742,9 @@ def _allocate_translation_ctx(
             name:               The name of the SDFG.
             reserved_names:     Add these name to the set of resered names of `self`.
         """
-        from ._translation_context import _TranslationContext
-
         # Create a new translation context and put it on the stack.
         self._ctx_stack.append(
-            _TranslationContext(
+            translator.TranslatedJaxprSDFG(
                 rev_idx=next(self._rev_manager),
                 name=name,
             )
@@ -770,7 +765,7 @@ def _allocate_translation_ctx(
         return self
 
     @property
-    def _ctx(self) -> _TranslationContext:
+    def _ctx(self) -> translator.TranslatedJaxprSDFG:
         """Returns the currently active translation context."""
         assert len(self._ctx_stack) != 0, "No context is active."
         return self._ctx_stack[-1]
@@ -967,15 +962,7 @@ def _export_context(self) -> translator.TranslatedJaxprSDFG:
         assert self.is_allocated()
         assert all((isinstance(x, str) and (len(x) > 0)) for x in self._ctx.inp_names)
         assert all((isinstance(x, str) and (len(x) > 0)) for x in self._ctx.out_names)
-
-        return translator.TranslatedJaxprSDFG(
-            sdfg=self._ctx.sdfg,
-            start_state=self._ctx.start_state,
-            terminal_state=self._ctx.terminal_state,
-            jax_name_map=self._ctx.jax_name_map,
-            inp_names=self._ctx.inp_names,
-            out_names=self._ctx.out_names,
-        )
+        return self._ctx
 
     def _handle_null_jaxpr(
         self,
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 3a3bb6b..369572c 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -7,9 +7,8 @@
 
 from __future__ import annotations
 
-from collections.abc import Mapping, Sequence
+from collections.abc import MutableMapping
 from dataclasses import dataclass
-from typing import Any
 
 import dace
 from jax import core as jax_core
@@ -17,11 +16,14 @@
 from jace import util
 
 
-@dataclass(init=True, repr=True, eq=False, frozen=False, kw_only=True, slots=True)
+@dataclass(slots=True)
 class TranslatedJaxprSDFG:
     """Encapsulates the result of a translation run of the `JaxprTranslationDriver` object.
 
-    It defines the following members:
+    This class is also used to represent the internal state of the `JaxprTranslationDriver` during the translation.
+    For that reason the object defines some fields that only have a meaning during the actually translation.
+
+    The fields used to store the result are:
     - `sdfg` the SDFG object that was created.
     - `jax_name_map` a `dict` that maps every Jax variable to its corresponding SDFG variable _name_.
     - `start_state` the first state in the SDFG state machine.
@@ -29,32 +31,71 @@ class TranslatedJaxprSDFG:
     - `inp_names` a `list` of the SDFG variables that are used as input, in the same order as `Jaxpr.invars`.
     - `out_names` a `list` of the SDFG variables that are used as output, in the same order as `Jaxpr.outvars`.
 
-    The SDFG is in a so called canonical form, that is not directly usable, see `JaxprTranslationDriver` for more.
+    Please consider the following important points:
+    - The SDFG is in canonical form, which means that it is not directly usable, see `JaxprTranslationDriver` for more.
+    - It might be that a name appears in both the `inp_names` and `out_names` list.
+        This happens if the corresponding variable is used as both input and output.
+        In Jax this is called argument donation.
+
+    During the translation the following members are also allocated:
+    - `rev_idx` the revision index, used for name mangling.
 
-    It might be that a name appears in both the `inp_names` and `out_names` list.
-    This happens if the corresponding variable is used as both input and output.
-    In Jax this is called argument donation.
+    While they remain allocated, accessing them is considered an error.
     """
 
     sdfg: dace.SDFG
-    jax_name_map: Mapping[jax_core.Var | util.JaCeVar, str]
-    start_state: dace.SDFGState | None = None
-    terminal_state: dace.SDFGState | None = None
-    inp_names: Sequence[str] | None = None
-    out_names: Sequence[str] | None = None
+    jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str]
+    start_state: dace.SDFGState
+    terminal_state: dace.SDFGState
+    inp_names: tuple[str, ...]
+    out_names: tuple[str, ...]
+    rev_idx: int
+
+    def __init__(
+        self,
+        rev_idx: int,
+        name: str | None = None,
+    ) -> None:
+        """Initializes the context.
+
+        The function allocates the SDFG and initializes the members properly.
+
+        Args:
+            rev_idx:    The revision index of the context.
+            name:       Name of the SDFG object.
+        """
+        if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
+            raise ValueError(f"'{name}' is not a valid SDFG name.")
+
+        self.sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
+        self.start_state: dace.SDFGState = self.sdfg.add_state(
+            label="initial_state", is_start_block=True
+        )
+        self.terminal_state: dace.SDFGState = self.start_state
+        self.jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str] = {}
+        self.inp_names: tuple[str, ...] = ()
+        self.out_names: tuple[str, ...] = ()
+        self.rev_idx: int = rev_idx
 
     def validate(self) -> bool:
         """Validate the underlying SDFG."""
 
         # To prevent the 'non initialized' data warnings we have to temporary
         #  promote input and output arguments to globals
-        promote_to_glob: set[str] = set()
         org_trans_state: dict[str, bool] = {}
-        if self.inp_names:
-            promote_to_glob.update(self.inp_names)
-        if self.out_names:
-            promote_to_glob.update(self.out_names)
-        for var in promote_to_glob:
+        if not self.inp_names:
+            raise dace.sdfg.InvalidSDFGError(
+                "There are no input arguments.",
+                self.sdfg,
+                self.sdfg.node_id(self.start_state),
+            )
+        if not self.out_names:
+            raise dace.sdfg.InvalidSDFGError(
+                "There are no output arguments.",
+                self.sdfg,
+                self.sdfg.node_id(self.start_state),
+            )
+        for var in set(self.inp_names + self.out_names):  # set is needed for donated args.
             org_trans_state[var] = self.sdfg.arrays[var].transient
             self.sdfg.arrays[var].transient = False
 
@@ -64,11 +105,3 @@ def validate(self) -> bool:
             for var, orgValue in org_trans_state.items():
                 self.sdfg.arrays[var].transient = orgValue
         return True
-
-    def __getitem__(self, idx: str) -> Any:
-        """Allows member access using brackets."""
-        if not isinstance(idx, str):
-            raise TypeError(f"Expected 'idx' as 'str' but got '{type(str)}'")
-        if not hasattr(self, idx):
-            raise KeyError(f"The key '{idx}' is not known.")
-        return getattr(self, idx)

From fa089d9672de986c6b75415d97fe6b70be45aa0f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 13:40:02 +0200
Subject: [PATCH 140/458] Updated some package importing stuff.

---
 src/jace/translator/__init__.py                          | 2 ++
 src/jace/translator/jaxpr_translator_driver.py           | 1 -
 ...a_primitive_translator.py => primitive_translator.py} | 0
 src/jace/translator/sub_translators/__init__.py          | 9 +++++----
 src/jace/translator/sub_translators/alu_translator.py    | 3 +--
 5 files changed, 8 insertions(+), 7 deletions(-)
 rename src/jace/translator/{sub_translators/a_primitive_translator.py => primitive_translator.py} (100%)

diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index d6bb0c7..042f82a 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -10,10 +10,12 @@
 from __future__ import annotations
 
 from .jaxpr_translator_driver import JaxprTranslationDriver
+from .primitive_translator import PrimitiveTranslator
 from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
 
 __all__ = [
     "JaxprTranslationDriver",
+    "PrimitiveTranslator",
     "TranslatedJaxprSDFG",
 ]
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index e319389..6ce6e4c 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -17,7 +17,6 @@
 from jax import core as jax_core
 
 from jace import translator, util
-from jace.translator import sub_translators
 
 
 class JaxprTranslationDriver:
diff --git a/src/jace/translator/sub_translators/a_primitive_translator.py b/src/jace/translator/primitive_translator.py
similarity index 100%
rename from src/jace/translator/sub_translators/a_primitive_translator.py
rename to src/jace/translator/primitive_translator.py
diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
index 88c239c..7e52b28 100644
--- a/src/jace/translator/sub_translators/__init__.py
+++ b/src/jace/translator/sub_translators/__init__.py
@@ -10,18 +10,19 @@
 
 from collections.abc import Sequence
 
-from .a_primitive_translator import PrimitiveTranslator  # has to be the first import.
+from jace import translator
+
 from .alu_translator import ALUTranslator
 
 
 # List of all subtranslators that ships with JaCe.
-_KNOWN_SUBTRANSLATORS: list[type[PrimitiveTranslator]] = [
+_KNOWN_SUBTRANSLATORS: list[type[translator.PrimitiveTranslator]] = [
     ALUTranslator,
 ]
 
 
 def add_subtranslator(
-    subtrans: type[PrimitiveTranslator],
+    subtrans: type[translator.PrimitiveTranslator],
 ) -> bool:
     """Add `subtrans` to the externally defined subtranslators.
 
@@ -36,7 +37,7 @@ def add_subtranslator(
     return True
 
 
-def _get_subtranslators_cls() -> Sequence[type[PrimitiveTranslator]]:
+def _get_subtranslators_cls() -> Sequence[type[translator.PrimitiveTranslator]]:
     """Returns the list of all subtranslator known to JaCe.
 
     The translators are returned in FIFO order.
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/sub_translators/alu_translator.py
index 8cc2466..23f0cb3 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/sub_translators/alu_translator.py
@@ -18,10 +18,9 @@
 from typing_extensions import override
 
 from jace import translator
-from jace.translator import sub_translators
 
 
-class ALUTranslator(sub_translators.PrimitiveTranslator):
+class ALUTranslator(translator.PrimitiveTranslator):
     """This translator handles all arithmetic and logical operations."""
 
     __slots__ = ()

From 75d0823bcad89b4ebc0dbdf7e427427e264e9b7f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 15:00:35 +0200
Subject: [PATCH 141/458] Driver now always deallocate.

---
 src/jace/translator/jaxpr_translator_driver.py | 8 +-------
 1 file changed, 1 insertion(+), 7 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 6ce6e4c..2fac9c4 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -104,7 +104,6 @@ def translate_jaxpr(
         name: str | None = None,
         reserved_names: str | Collection[str] | None = None,
         allow_empty_jaxpr: bool = False,
-        **kwargs: Any,
     ) -> translator.TranslatedJaxprSDFG:
         """Perform the translation of a Jaxpr into a SDFG.
 
@@ -136,10 +135,6 @@ def translate_jaxpr(
         if not jax.config.read("jax_enable_x64"):
             raise NotImplementedError("The translation only works if 'jax_enable_x64' is enabled.")
 
-        # The point of this flag is, that one can have the translator, but still have access
-        #  the the function of self, such as `add_array()` (is needed in later stages).
-        _clear_translation_ctx: bool = kwargs.pop("_clear_translation_ctx", True)
-
         # NOTE: If `self` is already allocated, i.e. has an ongoing translation process,
         #       the `_allocate_translation_ctx()` function will start a new context.
         #       Thus the driver will start to translate a second (nested) SDFG.
@@ -158,8 +153,7 @@ def translate_jaxpr(
         )
         # Note that `self` and `jsdfg` still share the same underlying memory, i.e. context.
         jsdfg: translator.TranslatedJaxprSDFG = self._translate_jaxpr_internal(jaxpr)
-        if _clear_translation_ctx:
-            self._clear_translation_ctx()
+        self._clear_translation_ctx()
 
         return jsdfg
 

From d39ba9b6506847056cc319713a36ea9a1cb9145f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 15:06:15 +0200
Subject: [PATCH 142/458] Small updates.

---
 src/jace/util/debug.py      | 7 +++++--
 src/jace/util/jax_helper.py | 4 ----
 2 files changed, 5 insertions(+), 6 deletions(-)

diff --git a/src/jace/util/debug.py b/src/jace/util/debug.py
index 27c57aa..23aee23 100644
--- a/src/jace/util/debug.py
+++ b/src/jace/util/debug.py
@@ -63,7 +63,7 @@ def run_jax_sdfg(
 
     # Canonical SDFGs do not have global memory, so we must transform it.
     #  We will afterwards undo it.
-    for glob_name in jsdfg.inp_names + jsdfg.out_names:  # type: ignore[operator]  # concatenation
+    for glob_name in jsdfg.inp_names + jsdfg.out_names:
         jsdfg.sdfg.arrays[glob_name].transient = False
 
     try:
@@ -80,7 +80,7 @@ def run_jax_sdfg(
         return ret_val
 
     finally:
-        for name in jsdfg.inp_names + jsdfg.out_names:  # type: ignore[operator]  # concatenation
+        for name in jsdfg.inp_names + jsdfg.out_names:
             jsdfg.sdfg.arrays[name].transient = True
 
 
@@ -94,6 +94,9 @@ def _jace_run(
     Args:
         *args:      Forwarded to the tracing and final execution of the SDFG.
         **kwargs:   Used to construct the driver.
+
+    Notes:
+        This function will be removed soon.
     """
     jaxpr = jax.make_jaxpr(fun)(*args)
     driver = translator.JaxprTranslationDriver(**kwargs)
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index fb4619a..0ea37a1 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -53,10 +53,6 @@ def __eq__(self, other: Any) -> bool:
             return NotImplemented
         return id(self) == id(other)
 
-    def __post_init__(self) -> None:
-        if not isinstance(self.shape, tuple):
-            raise ValueError("The 'shape' member of a 'JaCeVar' must be a tuple.")
-
 
 def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar | str) -> str:
     """Returns the name of the Jax variable as a string.

From 8dcfbb0a260b0e12bba335a8870ff017b7189015 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 15:18:39 +0200
Subject: [PATCH 143/458] Made some small modifications, such that pre-commit
 is happy.

---
 pyproject.toml                 |  2 +-
 src/jace/jax/stages/a_stage.py |  2 +-
 src/jace/util/jax_helper.py    |  2 +-
 tests/test_jax_api.py          | 11 +++++++----
 4 files changed, 10 insertions(+), 7 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index f05b72a..f9894fb 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -151,5 +151,5 @@ section-order = [
 "tests/**" = [
   "T10",
   "T20",  # Ignore `flake8-debugger` and `flake8-print`
-  "F841",  # Ignore assigned but not used; inside `with` to test if throw.
+  "F841"  # Ignore assigned but not used; inside `with` to test if throw.
 ]
diff --git a/src/jace/jax/stages/a_stage.py b/src/jace/jax/stages/a_stage.py
index 80c3c9f..945ba69 100644
--- a/src/jace/jax/stages/a_stage.py
+++ b/src/jace/jax/stages/a_stage.py
@@ -7,7 +7,7 @@
 """Interface of the Stages.
 
 In `jace.jax.stages.__init__.py` this file must be imported first.
-However, isort/ruff fail to do that and can not be convinced otherwise. 
+However, isort/ruff fail to do that and can not be convinced otherwise.
 For that reason this file was renamed to ensure that it comes at first.
 """
 
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 72ff85d..a5bd891 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -62,7 +62,7 @@ def Create(
         name: str,
         shape: Sequence[int | dace.symbol | str] | int | dace.symbol | str,
         dtype: Any,
-    ) -> None:
+    ) -> JaCeVar:
         """Creates a `JaCeVar` object.
 
         Performs some sanity checks on the input.
diff --git a/tests/test_jax_api.py b/tests/test_jax_api.py
index 1e7b911..6e1a2da 100644
--- a/tests/test_jax_api.py
+++ b/tests/test_jax_api.py
@@ -18,7 +18,7 @@
 from jace import util as jutil
 
 
-np.random.seed(42)
+np.random.seed(42)  # noqa: NPY002  # random generator
 
 
 def test_jit():
@@ -103,7 +103,7 @@ def f3_(A, B, C, D):
     f3_jax = jax.jit(f3_)
     f3_jace = jace.jit(f3_)
 
-    A, B, C, D = (np.random.random((10, 3, 50)) for _ in range(4))
+    A, B, C, D = (np.random.random((10, 3, 50)) for _ in range(4))  # noqa: NPY002  # random generator
 
     ref = ((A + B) - C) * D
 
@@ -137,5 +137,8 @@ def f(x):
     x2 = 4.0
     df_x2 = -4.0
 
-    assert (res := df(x1)) == df_x1, f"Failed lower branch, expected '{df_x1}', got '{res}'."
-    assert (res := df(x2)) == df_x2, f"Failed upper branch, expected '{df_x2}', got '{res}'."
+    res_1 = df(x1)
+    res_2 = df(x2)
+
+    assert df(x1) == df_x1, f"Failed lower branch, expected '{df_x1}', got '{res_1}'."
+    assert df(x2) == df_x2, f"Failed upper branch, expected '{df_x2}', got '{res_2}'."

From 447afdbfcc2daf3f9cd27673bfeaaa26fb8be976 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 15:42:57 +0200
Subject: [PATCH 144/458] Removed the `_jace_run()` function that was only a
 temporary solution.

Also renamed the `jace.util.debug` module to `jace.util.compiling` which is much better.
---
 src/jace/util/__init__.py                |  6 +++--
 src/jace/util/{debug.py => compiling.py} | 32 ++++++------------------
 tests/test_sub_translators_alu.py        |  8 +++---
 3 files changed, 15 insertions(+), 31 deletions(-)
 rename src/jace/util/{debug.py => compiling.py} (88%)

diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 11469fc..795b1bf 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -9,7 +9,10 @@
 
 from __future__ import annotations
 
-from .debug import _jace_run, compile_jax_sdfg, run_jax_sdfg
+from .compiling import (
+    compile_jax_sdfg,
+    run_jax_sdfg,
+)
 from .jax_helper import (
     JaCeVar,
     _propose_jax_name,
@@ -56,7 +59,6 @@
     "get_jax_var_dtype",
     "translate_dtype",
     "run_jax_sdfg",
-    "_jace_run",
     "_propose_jax_name",
     "VALID_JAX_VAR_NAME",
     "VALID_SDFG_OBJ_NAME",
diff --git a/src/jace/util/debug.py b/src/jace/util/compiling.py
similarity index 88%
rename from src/jace/util/debug.py
rename to src/jace/util/compiling.py
index 799f882..395a7a5 100644
--- a/src/jace/util/debug.py
+++ b/src/jace/util/compiling.py
@@ -12,12 +12,11 @@
 
 from __future__ import annotations
 
-from collections.abc import Callable, Sequence
+from collections.abc import Sequence
 from functools import singledispatch
 from typing import Any
 
 import dace
-import jax
 
 from jace import translator
 from jace.util import dace_helper as jdace
@@ -78,10 +77,11 @@ def run_jax_sdfg(
     *args: Any,
     **kwargs: Any,
 ) -> tuple[Any, ...] | Any:
-    """Run the `TranslatedJaxprSDFG` object.
+    """Execute a `TranslatedJaxprSDFG` object directly.
 
     Notes:
-        The function either returns a value or a tuple of values, i.e. no tree.
+        This function is used for debugging purposes and you should use the `jace.jit` annotation instead.
+        The function either returns a value or a tuple of values, i.e. no pytree.
         There is an overload of this function that accepts an already compiled SDFG and runs it.
     """
     if jsdfg.inp_names is None:
@@ -110,7 +110,9 @@ def _(
 ) -> tuple[Any, ...] | Any:
     """Call the compiled SDFG.
 
-    The function assumes that the SDFG was compiled in accordance with `compile_jax_sdfg()`
+    Notes:
+        This function is used for debugging purposes and you should use the `jace.jit` annotation instead.
+        The function assumes that the SDFG was compiled in accordance with `compile_jax_sdfg()`
     """
     from dace.data import Array, Data, Scalar, make_array_from_descriptor
 
@@ -162,23 +164,3 @@ def _(
     if len(out_names) == 1:
         return ret_val[0]
     return ret_val
-
-
-def _jace_run(
-    fun: Callable,
-    *args: Any,
-    **kwargs: Any,
-) -> Any:
-    """Traces and run function `fun` using `Jax | DaCe`.
-
-    Args:
-        *args:      Forwarded to the tracing and final execution of the SDFG.
-        **kwargs:   Used to construct the driver.
-
-    Notes:
-        This function will be removed soon.
-    """
-    jaxpr = jax.make_jaxpr(fun)(*args)
-    driver = translator.JaxprTranslationDriver(**kwargs)
-    jsdfg = driver.translate_jaxpr(jaxpr)
-    return run_jax_sdfg(jsdfg, *args)
diff --git a/tests/test_sub_translators_alu.py b/tests/test_sub_translators_alu.py
index 50128e8..1853f92 100644
--- a/tests/test_sub_translators_alu.py
+++ b/tests/test_sub_translators_alu.py
@@ -12,7 +12,7 @@
 import jax
 import numpy as np
 
-from jace import util as jutil
+import jace
 
 
 def test_add():
@@ -26,7 +26,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     B = np.full((4, 3), 10, dtype=np.float64)
 
     ref = testee(A, B)
-    res = jutil._jace_run(testee, A, B)
+    res = jace.jit(testee)(A, B)
 
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
 
@@ -46,7 +46,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     B = np.full((4, 3), 10, dtype=np.float64)
 
     ref = testee(A, B)
-    res = jutil._jace_run(testee, A, B)
+    res = jace.jit(testee)(A, B)
 
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
 
@@ -61,6 +61,6 @@ def testee(A: np.ndarray) -> np.ndarray:
     A = np.ones((3, 3), dtype=np.float64)
 
     ref = testee(A)
-    res = jutil._jace_run(testee, A)
+    res = jace.jit(testee)(A)
 
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."

From 75c8dc5f96a3327cebf28016ed1ae66c220648d3 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 15:47:47 +0200
Subject: [PATCH 145/458] Small changes.

---
 src/jace/translator/jaxpr_translator_driver.py | 4 ++--
 src/jace/util/__init__.py                      | 4 ++--
 src/jace/util/jax_helper.py                    | 2 +-
 3 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 2fac9c4..f9ff13c 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -445,7 +445,7 @@ def add_array(
             if find_new_name:
                 raise ValueError("Specified `force_jax_name` but also wanted a new name.")
             find_new_name = False
-            alt_name = util._propose_jax_name(arg, self._ctx.jax_name_map)
+            alt_name = util.propose_jax_name(arg, self._ctx.jax_name_map)
         if alt_name is not None:
             assert isinstance(alt_name, str)
             find_new_name = False  # If a name was given, then use it no matter what.
@@ -485,7 +485,7 @@ def add_array(
         if alt_name is not None:
             prop_name = alt_name  # Just for completion: will be ignored later
         elif isinstance(arg, (jax_core.Var, util.JaCeVar)):
-            prop_name = util._propose_jax_name(arg, self._ctx.jax_name_map)
+            prop_name = util.propose_jax_name(arg, self._ctx.jax_name_map)
             assert not prop_name.startswith("__")
             if name_prefix is not None:
                 prop_name = name_prefix + prop_name
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 795b1bf..eb8e624 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -15,11 +15,11 @@
 )
 from .jax_helper import (
     JaCeVar,
-    _propose_jax_name,
     get_jax_var_dtype,
     get_jax_var_name,
     get_jax_var_shape,
     is_tracing_ongoing,
+    propose_jax_name,
     translate_dtype,
 )
 from .traits import (
@@ -59,7 +59,7 @@
     "get_jax_var_dtype",
     "translate_dtype",
     "run_jax_sdfg",
-    "_propose_jax_name",
+    "propose_jax_name",
     "VALID_JAX_VAR_NAME",
     "VALID_SDFG_OBJ_NAME",
     "VALID_SDFG_VAR_NAME",
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index a5bd891..38c3f0d 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -212,7 +212,7 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
     raise ValueError(f"Unable to translate '{dtype}' ino a DaCe dtype.")
 
 
-def _propose_jax_name(
+def propose_jax_name(
     jax_var: jax_core.Atom | JaCeVar,
     jax_name_map: Mapping[jax_core.Var | JaCeVar, Any] | None = None,
 ) -> str:

From 18eadc195209115b9b42f550d21d9f42ee3b63fa Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 13 May 2024 16:18:05 +0200
Subject: [PATCH 146/458] Made a first check for caching, however, I am not
 fully sure how I should implement the optimization.

I am pretty sure that the `optimize()` thing should be removed.
However, I think that in any case optimization _must_ occure in a copy, otherwhise it does not make any sense, because we have to pretend that the SDFG is immutable since it is cached.
---
 src/jace/jax/stages/jace_lowered.py | 11 +++++-
 src/jace/util/compiling.py          |  6 ++++
 tests/test_decorator.py             | 52 +++++++++++++++++++++++++++++
 3 files changed, 68 insertions(+), 1 deletion(-)

diff --git a/src/jace/jax/stages/jace_lowered.py b/src/jace/jax/stages/jace_lowered.py
index 581cefe..3c7e29d 100644
--- a/src/jace/jax/stages/jace_lowered.py
+++ b/src/jace/jax/stages/jace_lowered.py
@@ -49,6 +49,15 @@ def optimize(
         Notes:
             Currently no optimization is performed.
         """
+        # TODO(phimuell): Think really hard what we should do here, to avoid strange behaviour.
+        #                   I am not fully sure if we should include the SDFG value in the caching.
+
+        # TODO(phimuell):
+        #   - remove the inplace modification.
+        #   - Somehow integrate it into the caching strategy.
+        #
+        #  If we would not integrate it into the caching strategy, then calling `lower()` on
+        #  the wrapped object would return the original object, but with a modified, already optimized SDFG.
         return self
 
     @tcache.cached_translation
@@ -58,7 +67,7 @@ def compile(
     ) -> stages.JaceCompiled:
         """Compile the SDFG.
 
-        Returns an Object that encapsulates a
+        Returns an Object that encapsulates a compiled SDFG object.
         """
         csdfg: jdace.CompiledSDFG = util.compile_jax_sdfg(self._translated_sdfg)
         return stages.JaceCompiled(
diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index 395a7a5..95b05c0 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -33,6 +33,7 @@ def compile_jax_sdfg(
         Currently the SDFG must not have any undefined symbols, i.e. no undefined sizes.
     """
     from copy import deepcopy
+    from time import time
 
     if not jsdfg.inp_names:
         raise ValueError("The passed SDFG did not had any input arguments.")
@@ -54,6 +55,11 @@ def compile_jax_sdfg(
     #  i.e. in the allocation of the return values as well as `arg_names`.
     sdfg: dace.SDFG = deepcopy(jsdfg.sdfg)
 
+    # We need to give the SDFG another name, this is needed to prevent a DaCe error/warning.
+    #  This happens if we compile the same lowered SDFG multiple times with different options.
+    #  We allow this because Jax allows this too, this is also a reason why we copy the SDFG.
+    sdfg.name = f"{sdfg.name}__comp_{int(time() * 1000)}"
+
     # Canonical SDFGs do not have global memory, so we must transform it
     sdfg_arg_names: list[str] = []
     for glob_name in jsdfg.inp_names + jsdfg.out_names:
diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index 940e1f6..8b9bc38 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -63,3 +63,55 @@ def testee_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     res = testee(A, B)
 
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
+
+
+def test_decorator_caching():
+    """This tests the caching ability"""
+    jax.config.update("jax_enable_x64", True)
+
+    def testee1_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A * B
+
+    def testee2_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A + B
+
+    testee1 = jace.jit(testee1_)
+    testee2 = jace.jit(testee2_)
+
+    assert testee1.__wrapped__ == testee1_
+    assert testee2.__wrapped__ == testee2_
+
+    # This is the first size
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    # This is the second sizes
+    C = np.arange(16, dtype=np.float64).reshape((4, 4))
+    D = np.full((4, 4), 10, dtype=np.float64)
+
+    # Lower the two functions for the first size.
+    lowered1_size1 = testee1.lower(A, B)
+    lowered2_size1 = testee2.lower(A, B)
+
+    # If we now lower them again, we should get the same objects
+    assert lowered1_size1 is testee1.lower(A, B)
+    assert lowered2_size1 is testee2.lower(A, B)
+
+    # Now we lower them for the second sizes.
+    lowered1_size2 = testee1.lower(C, D)
+    lowered2_size2 = testee2.lower(C, D)
+
+    # Again if we now lower them again, we should get the same objects.
+    assert lowered1_size1 is testee1.lower(A, B)
+    assert lowered2_size1 is testee2.lower(A, B)
+    assert lowered1_size2 is testee1.lower(C, D)
+    assert lowered2_size2 is testee2.lower(C, D)
+
+    # Now use the compilation; since all is the same code path we only use one size.
+    compiled1 = lowered1_size1.compile()
+    compiled2 = lowered1_size1.compile({"dummy_option": True})
+
+    assert compiled1 is lowered1_size1.compile()
+    assert compiled2 is lowered1_size1.compile({"dummy_option": True})
+    assert compiled2 is not lowered1_size1.compile({"dummy_option": False})
+    assert compiled2 is lowered1_size1.compile({"dummy_option": True})

From e31539e2f8fc6ad832bbb81721f19b01c7593887 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 14 May 2024 08:51:56 +0200
Subject: [PATCH 147/458] Reworked the cache.

It is now better documented and there are also some edge cases that are now handled.
The most important thing is that the cache shjould also be resistant to inplace modifications, at least it should be that way.
Furthermore the names are now a bit better.
---
 src/jace/jax/stages/jace_lowered.py |   7 +-
 src/jace/util/translation_cache.py  | 186 ++++++++++++++++++++--------
 2 files changed, 137 insertions(+), 56 deletions(-)

diff --git a/src/jace/jax/stages/jace_lowered.py b/src/jace/jax/stages/jace_lowered.py
index 3c7e29d..ca2f6f8 100644
--- a/src/jace/jax/stages/jace_lowered.py
+++ b/src/jace/jax/stages/jace_lowered.py
@@ -10,7 +10,7 @@
 from __future__ import annotations
 
 import json
-from typing import Any
+from typing import Any, Final
 
 from jace import translator, util
 from jace.jax import stages
@@ -28,6 +28,11 @@ class JaceLowered(stages.Stage):
     _translated_sdfg: translator.TranslatedJaxprSDFG
     _cache: tcache.TranslationCache
 
+    DEF_COMPILER_OPTIONS: Final[dict[str, Any]] = {
+        "auto_opt": True,
+        "simplify": True,
+    }
+
     def __init__(
         self,
         translated_sdfg: translator.TranslatedJaxprSDFG,
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 2ca78dc..e70c235 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -17,10 +17,11 @@
 from __future__ import annotations
 
 import functools as ft
+from abc import abstractmethod
 from collections import OrderedDict
 from collections.abc import Callable
 from dataclasses import dataclass
-from typing import Any
+from typing import Any, Protocol, runtime_checkable
 
 import dace
 from jax import core as jax_core
@@ -63,7 +64,7 @@ def _action_wrapper(
     ) -> stages.Stage:
         assert hasattr(self, "_cache"), f"Type '{type(self).__name__}' does not have `_cache`."
         cache: TranslationCache = self._cache
-        key: _CacheKey = cache.make_key(self, *args, **kwargs)
+        key: _CachedCall = cache.make_key(self, *args, **kwargs)
         if cache.has(key):
             return cache.get(key)
         next_stage: stages.Stage = action(self, *args, **kwargs)
@@ -75,7 +76,12 @@ def _action_wrapper(
 
 @dataclass(init=True, eq=True, frozen=True)
 class _AbstarctCallArgument:
-    """Class to represent the call arguments used in the cache."""
+    """Class to represent one argument to the call in an abstract way.
+
+    It is used as part of the key in the cache.
+    It represents the structure of the argument, i.e. its shape, type and so on, but nots its value.
+    To construct it you should use the `from_value()` class function which interfere the characteristics from a value.
+    """
 
     shape: tuple[int, ...] | tuple[()]
     dtype: dace.typeclass
@@ -98,14 +104,13 @@ def from_value(
         if isinstance(val, jax_core.Literal):
             raise TypeError("Jax Literals are not supported as cache keys.")
 
-        # TODO(phimuell): is `CPU_Heap` okay?
-
         if util.is_array(val):
             if util.is_jax_array(val):
                 val = val.__array__(copy=False)
             shape = val.shape
             dtype = util.translate_dtype(val.dtype)
             strides = getattr(val, "strides", None)
+            # TODO(phimuell): is `CPU_Heap` always okay? There would also be `CPU_Pinned`.
             storage = (
                 dace.StorageType.GPU_Global if util.is_on_device(val) else dace.StorageType.CPU_Heap
             )
@@ -132,15 +137,52 @@ def from_value(
         return cls.from_value(jax_core.get_aval(val))
 
 
-@dataclass(init=True, eq=True, frozen=True, unsafe_hash=True)
-class _CacheKey:
-    """Wrapper around the arguments"""
+@runtime_checkable
+class _ConcreteCallArgument(Protocol):
+    """Type for encoding a concrete arguments in the cache."""
+
+    @abstractmethod
+    def __hash__(self) -> int:
+        pass
+
+    @abstractmethod
+    def __eq__(self, other: Any) -> bool:
+        pass
+
+
+@dataclass(init=True, eq=True, frozen=True)
+class _CachedCall:
+    """Represents the structure of the entire call in the cache.
+
+    This class represents both the `JaceWrapped.lower()` and `JaceLowered.compile()` call.
+    The key combines the "origin of the call", i.e. `self` and the call arguments.
+
+    Arguments are represented in two ways:
+    - `_AbstarctCallArgument`: Which encode only the structure of the arguments.
+        These are essentially the tracer used by Jax.
+    - `_ConcreteCallArgument`: Which represents actual values of the call.
+        These are either the static arguments or compile options.
+
+    Depending of the origin the call, the key used for caching is different.
+    For `JaceWrapped` only the wrapped callable is included in the cache.
+
+    For the `JaceLowered` the SDFG is used as key, however, in a very special way.
+    `dace.SDFG` does not define `__hash__()` or `__eq__()` thus these operations fall back to `object`.
+    However, an SDFG defines the `hash_sdfg()` function, which generates a hash based on the structure of the SDFG.
+    We use the SDFG because we want to cache on it, but since it is not immutable, we have to account for that, by including this structural hash.
+    This is not ideal but it should work in the beginning.
+    """
 
-    # Note that either `_fun` or `_sdfg_hash` are not `None`.
-    # TODO(phimuell): Static arguments.
     fun: Callable | None
+    sdfg: dace.SDFG | None
     sdfg_hash: int | None
-    fargs: tuple[_AbstarctCallArgument, ...] | tuple[tuple[str, Any], ...]
+    fargs: tuple[
+        _AbstarctCallArgument
+        | _ConcreteCallArgument
+        | tuple[str, _AbstarctCallArgument]
+        | tuple[str, _ConcreteCallArgument],
+        ...,
+    ]
 
     @classmethod
     def make_key(
@@ -148,34 +190,53 @@ def make_key(
         stage: stages.Stage,
         *args: Any,
         **kwargs: Any,
-    ) -> _CacheKey:
-        """Creates a cache key for the stage object `stage` that was called to advance."""
-        if len(kwargs) != 0:
-            raise NotImplementedError("kwargs are not implemented.")
+    ) -> _CachedCall:
+        """Creates a cache key for the stage object `stage` that was called to advance to the next stage."""
 
         if isinstance(stage, stages.JaceWrapped):
+            # JaceWrapped.lower() to JaceLowered
+            #   Currently we only allow positional arguments and no static arguments.
+            #   Thus the function argument part of the key only consists of abstract arguments.
+            if len(kwargs) != 0:
+                raise NotImplementedError("'kwargs' are not implemented in 'JaceWrapped.lower()'.")
             fun = stage.__wrapped__
+            sdfg = None
             sdfg_hash = None
-            fargs: Any = tuple(  # Any is here to prevent typeconfusion in mypy.
+            fargs: tuple[_AbstarctCallArgument, ...] = tuple(
                 _AbstarctCallArgument.from_value(x) for x in args
             )
 
         elif isinstance(stage, stages.JaceLowered):
+            # JaceLowered.compile() to JaceCompiled
+            #   We only accepts compiler options, which the Jax interface mandates
+            #   are inside a `dict` thus we will get at most one argument.
             fun = None
-            sdfg_hash = int(stage.compiler_ir().sdfg.hash_sdfg(), 16)
+            sdfg = stage.compiler_ir().sdfg
+            sdfg_hash = int(sdfg.hash_sdfg(), 16)
 
-            # In this mode the inputs are compiler options, which are encapsulated in
-            #  `CompilerOptions` (aka. `dict`), or it is None.
-            assert len(args) <= 1
-            comp_ops: stages.CompilerOptions = (
-                stages.CompilerOptions() if len(args) == 0 else args[0]
-            )
+            if len(kwargs) != 0:
+                raise ValueError(
+                    "All arguments to 'JaceLowered.compile()' must be inside a 'dict'."
+                )
+            if len(args) >= 2:
+                raise ValueError("Only a 'dict' is allowed as argument to 'JaceLowered.compile()'.")
+            if (len(args) == 0) or (args[0] is None):
+                # No compiler options where specified, so we use the default ones.
+                comp_ops: stages.CompilerOptions = stages.JaceLowered.DEF_COMPILER_OPTIONS
+            else:
+                # Compiler options where given.
+                comp_ops = args[0]
             assert isinstance(comp_ops, dict)
+            assert all(
+                isinstance(k, str) and isinstance(v, _ConcreteCallArgument)
+                for k, v in comp_ops.items()
+            )
 
-            # Make `(argname, value)` pairs and sort them to get a concrete key
-            fargs = tuple(
+            # We will now make `(argname, argvalue)` pairs and sort them according to `argname`.
+            #  This guarantees a stable order.
+            fargs: tuple[tuple[str, _ConcreteCallArgument], ...] = tuple(  # type: ignore[no-redef]  # Type confusion.
                 sorted(
-                    ((k, v) for k, v in comp_ops.items()),
+                    ((argname, argvalue) for argname, argvalue in comp_ops.items()),
                     key=lambda X: X[0],
                 )
             )
@@ -183,21 +244,23 @@ def make_key(
         else:
             raise TypeError(f"Can not make key from '{type(stage).__name__}'.")
 
-        return cls(fun=fun, sdfg_hash=sdfg_hash, fargs=fargs)
+        return cls(fun=fun, sdfg=sdfg, sdfg_hash=sdfg_hash, fargs=fargs)
 
 
 class TranslationCache:
     """The _internal_ cache object.
 
-    It implements a simple LRU cache.
+    It implements a simple LRU cache, for storing the results of the `JaceWrapped.lower()` and `JaceLowered.compile()` calls.
+    You should not use this cache directly but instead use the `cached_translation` decorator.
 
-    Todo:
-        Also handle abstract values.
+    Notes:
+        The most recently used entry is at the end of the `OrderedDict`.
+            The reason for this is, because there the new entries are added.
     """
 
     __slots__ = ["_memory", "_size"]
 
-    _memory: OrderedDict[_CacheKey, stages.Stage]
+    _memory: OrderedDict[_CachedCall, stages.Stage]
     _size: int
 
     def __init__(
@@ -207,7 +270,7 @@ def __init__(
         """Creates a cache instance of size `size`."""
         if size <= 0:
             raise ValueError(f"Invalid cache size of '{size}'")
-        self._memory: OrderedDict[_CacheKey, stages.Stage] = OrderedDict()
+        self._memory: OrderedDict[_CachedCall, stages.Stage] = OrderedDict()
         self._size = size
 
     @staticmethod
@@ -215,63 +278,76 @@ def make_key(
         stage: stages.Stage,
         *args: Any,
         **kwargs: Any,
-    ) -> _CacheKey:
+    ) -> _CachedCall:
         """Create a key object for `stage`."""
-        if len(kwargs) != 0:
-            raise NotImplementedError
-        return _CacheKey.make_key(stage, *args, **kwargs)
+        return _CachedCall.make_key(stage, *args, **kwargs)
 
     def has(
         self,
-        key: _CacheKey,
+        key: _CachedCall,
     ) -> bool:
         """Check if `self` have a record of `key`.
 
-        To generate `key` use the `make_key` function.
+        Notes:
+            For generating `key` use the `make_key()` function.
+            This function will not modify the order of the cached entries.
         """
         return key in self._memory
 
     def get(
         self,
-        key: _CacheKey,
+        key: _CachedCall,
     ) -> stages.Stage:
         """Get the next stage associated with `key`.
 
-        It is an error if `key` does not exists.
-        This function will move `key` to front of `self`.
+        Notes:
+            It is an error if `key` does not exist.
+            This function will mark `key` as most recently used.
         """
         if not self.has(key):
             raise KeyError(f"Key '{key}' is unknown.")
-        self._memory.move_to_end(key, last=False)
+        self._memory.move_to_end(key, last=True)
         return self._memory.get(key)  # type: ignore[return-value]  # type confusion
 
     def add(
         self,
-        key: _CacheKey,
+        key: _CachedCall,
         res: stages.Stage,
     ) -> TranslationCache:
         """Adds `res` under `key` to `self`.
 
-        In case `key` is already known, it will first be eviceted and then reinserted.
-        If `self` is larger than specified the oldest one will be evicted.
+        Notes:
+            It is not an error if if `key` is already present.
         """
-        self._evict(key)
-        while len(self._memory) >= self._size:
-            self._memory.popitem(last=True)
-        self._memory[key] = res
-        self._memory.move_to_end(key, last=False)
+        if self.has(key):
+            # `key` is known, so move it to the end and update the mapped value.
+            self._memory.move_to_end(key, last=True)
+            self._memory[key] = res
+
+        else:
+            # `key` is not known so we have to add it
+            while len(self._memory) >= self._size:
+                self._evict(None)
+            self._memory[key] = res
         return self
 
     def _evict(
         self,
-        key: _CacheKey,
+        key: _CachedCall | None,
     ) -> bool:
-        """Evict `key` from `self`.
+        """Evict `key` from `self` and return `True`.
 
-        Returns if it was evicted or not.
+        In case `key` is not known the function returns `False`.
+        If `key` is `None` then evict the oldest one unconditionally.
         """
+        if key is None:
+            if len(self._memory) == 0:
+                return False
+            self._memory.popitem(last=False)
+            return True
+
         if not self.has(key):
             return False
-        self._memory.move_to_end(key, last=True)
-        self._memory.popitem(last=True)
+        self._memory.move_to_end(key, last=False)
+        self._memory.popitem(last=False)
         return True

From 41cec81f9270bff30d2c11bbc45e18365f50a614 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 14 May 2024 09:10:31 +0200
Subject: [PATCH 148/458] Relocated the cache implementation.

It is now like anything else in `jace.stages`.
---
 src/jace/jax/stages/jace_lowered.py           | 10 +--
 src/jace/jax/stages/jace_wrapped.py           |  9 +--
 .../{util => jax/stages}/translation_cache.py | 64 ++++++++++++-------
 3 files changed, 43 insertions(+), 40 deletions(-)
 rename src/jace/{util => jax/stages}/translation_cache.py (93%)

diff --git a/src/jace/jax/stages/jace_lowered.py b/src/jace/jax/stages/jace_lowered.py
index ca2f6f8..44e4d0a 100644
--- a/src/jace/jax/stages/jace_lowered.py
+++ b/src/jace/jax/stages/jace_lowered.py
@@ -14,19 +14,14 @@
 
 from jace import translator, util
 from jace.jax import stages
-from jace.util import dace_helper as jdace, translation_cache as tcache
+from jace.jax.stages import translation_cache as tcache
+from jace.util import dace_helper as jdace
 
 
 class JaceLowered(stages.Stage):
     """Represents the original computation that was lowered to SDFG."""
 
-    __slots__ = (
-        "_translated_sdfg",
-        "_cache",
-    )
-
     _translated_sdfg: translator.TranslatedJaxprSDFG
-    _cache: tcache.TranslationCache
 
     DEF_COMPILER_OPTIONS: Final[dict[str, Any]] = {
         "auto_opt": True,
@@ -43,7 +38,6 @@ def __init__(
         if translated_sdfg.out_names is None:
             raise ValueError("Output names must be defined.")
         self._translated_sdfg = translated_sdfg
-        self._cache: tcache.TranslationCache = tcache.get_cache(self)
 
     def optimize(
         self,
diff --git a/src/jace/jax/stages/jace_wrapped.py b/src/jace/jax/stages/jace_wrapped.py
index 526b165..b017b8d 100644
--- a/src/jace/jax/stages/jace_wrapped.py
+++ b/src/jace/jax/stages/jace_wrapped.py
@@ -16,7 +16,7 @@
 
 from jace import translator, util
 from jace.jax import stages
-from jace.util import translation_cache as tcache
+from jace.jax.stages import translation_cache as tcache
 
 
 class JaceWrapped(stages.Stage):
@@ -36,13 +36,7 @@ class JaceWrapped(stages.Stage):
         Copy the `jax._src.pjit.make_jit()` functionality to remove `jax.make_jaxpr()`.
     """
 
-    __slots__ = (
-        "fun_",
-        "_cache",
-    )
-
     _fun: Callable
-    _cache: tcache.TranslationCache
 
     def __init__(
         self,
@@ -51,7 +45,6 @@ def __init__(
         """Creates a wrapped jace jitable object of `jax_prim`."""
         assert fun is not None
         self._fun: Callable = fun
-        self._cache: tcache.TranslationCache = tcache.get_cache(self)
 
     def __call__(
         self,
diff --git a/src/jace/util/translation_cache.py b/src/jace/jax/stages/translation_cache.py
similarity index 93%
rename from src/jace/util/translation_cache.py
rename to src/jace/jax/stages/translation_cache.py
index e70c235..11e4e13 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/jax/stages/translation_cache.py
@@ -30,31 +30,14 @@
 from jace.jax import stages
 
 
-def get_cache(
-    self: stages.Stage,
-    size: int = 128,
-) -> TranslationCache:
-    """Returns the cache associated to `name`.
-
-    If called for the first time, the cache sizes will be set to `size`.
-    In all later calls this value is ignored.
-    """
-    # Get the caches and if not present, create them.
-    if not hasattr(get_cache, "_caches"):
-        _caches: dict[type[stages.Stage], TranslationCache] = {}
-        get_cache._caches = _caches  # type: ignore[attr-defined]  # ruff removes the `getattr()` calls
-    _caches = get_cache._caches  # type: ignore[attr-defined]
-
-    if type(self) not in _caches:
-        _caches[type(self)] = TranslationCache(size=size)
-
-    return _caches[type(self)]
-
-
 def cached_translation(
     action: Callable,
 ) -> Callable:
-    """Decorator for making the function cacheable."""
+    """Decorator for making the transfer method, i.e. `JaceWrapped.lower()` and `JaceLowered.compile()` cacheable.
+
+    The cache is global and the function will add the respecifve cache object to the object upon its first call.
+    To clear the caches use the `clear_translation_cache()` function.
+    """
 
     @ft.wraps(action)
     def _action_wrapper(
@@ -62,8 +45,11 @@ def _action_wrapper(
         *args: Any,
         **kwargs: Any,
     ) -> stages.Stage:
-        assert hasattr(self, "_cache"), f"Type '{type(self).__name__}' does not have `_cache`."
-        cache: TranslationCache = self._cache
+        if hasattr(self, "_cache"):
+            cache: TranslationCache = self._cache
+        else:
+            cache = _get_cache(self)
+            self._cache = cache
         key: _CachedCall = cache.make_key(self, *args, **kwargs)
         if cache.has(key):
             return cache.get(key)
@@ -74,6 +60,36 @@ def _action_wrapper(
     return _action_wrapper
 
 
+def clear_translation_cache() -> None:
+    """Clear all caches associated to translation."""
+
+    if not hasattr(_get_cache, "_caches"):
+        return
+    _get_cache._caches.clear()
+    return
+
+
+def _get_cache(
+    self: stages.Stage,
+    size: int = 128,
+) -> TranslationCache:
+    """Returns the cache associated to `name`.
+
+    If called for the first time, the cache sizes will be set to `size`.
+    In all later calls this value is ignored.
+    """
+    # Get the caches and if not present, create them.
+    if not hasattr(_get_cache, "_caches"):
+        _caches: dict[type[stages.Stage], TranslationCache] = {}
+        _get_cache._caches = _caches  # type: ignore[attr-defined]  # ruff removes the `getattr()` calls
+    _caches = _get_cache._caches  # type: ignore[attr-defined]
+
+    if type(self) not in _caches:
+        _caches[type(self)] = TranslationCache(size=size)
+
+    return _caches[type(self)]
+
+
 @dataclass(init=True, eq=True, frozen=True)
 class _AbstarctCallArgument:
     """Class to represent one argument to the call in an abstract way.

From 2e1ebcd41b259f719342950f74f347e0e3e4a89c Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Philip=20M=C3=BCller?=
 <147368808+philip-paul-mueller@users.noreply.github.com>
Date: Tue, 14 May 2024 11:26:16 +0200
Subject: [PATCH 149/458] Apply suggestions from code review
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The other batch is done locally.

Co-authored-by: Enrique González Paredes <enriqueg@cscs.ch>
---
 pyproject.toml                                 | 6 +++---
 src/jace/translator/jaxpr_translator_driver.py | 2 +-
 tests/test_jaxpr_translator_driver.py          | 2 +-
 3 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index f05b72a..fa01acb 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -149,7 +149,7 @@ section-order = [
 "!tests/**.py" = ["PT"]  # Ignore `flake8-pytest-style` everywhere except in `tests/`
 "noxfile.py" = ["T20"]  # Ignore `flake8-print`
 "tests/**" = [
-  "T10",
-  "T20",  # Ignore `flake8-debugger` and `flake8-print`
-  "F841",  # Ignore assigned but not used; inside `with` to test if throw.
+  "T10", # Ignore `flake8-debugger`
+  "T20",  # Ignore `flake8-print`
+  "F841",  # Ignore `unused-variable` (inside `with` to test if throws)
 ]
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 2fac9c4..bf6eb23 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -241,7 +241,7 @@ def map_jax_var_to_sdfg(
     def map_jax_var_to_sdfg(
         self,
         jax_var: str | jax_core.Atom | util.JaCeVar,
-        allow_fail: bool,
+        allow_fail: Literal[True],
     ) -> str | None: ...
 
     def map_jax_var_to_sdfg(
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 1570471..975fcbb 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -20,7 +20,7 @@
 
 
 @pytest.fixture(scope="module")
-def alloc_driver():
+def translation_driver():
     """Returns an allocated driver instance."""
     name = "fixture_driver"
     driver = jtrans.JaxprTranslationDriver()

From 62f9fae8c0f6b6b947c49f95a5c872632dd0558d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 14 May 2024 13:02:37 +0200
Subject: [PATCH 150/458] Commited Second round of Enrique's changes.

The biggest change is how the primitive translators are recorded.
They now use this annotation method that was suggested by Enrique.
But this needed some changes and also some hacks, I have to find a better way of doing it.
---
 src/jace/translator/__init__.py               |  3 +
 .../translator/jaxpr_translator_driver.py     | 40 ++++-----
 src/jace/translator/managing.py               | 82 +++++++++++++++++++
 src/jace/translator/primitive_translator.py   |  6 +-
 .../primitive_translators/__init__.py         | 16 ++++
 .../alu_translator.py                         |  7 +-
 .../translator/sub_translators/__init__.py    | 52 ------------
 src/jace/translator/translated_jaxpr_sdfg.py  | 21 ++---
 src/jace/util/debug.py                        | 11 +--
 src/jace/util/jax_helper.py                   | 10 +--
 tests/test_jaxpr_translator_driver.py         | 21 ++---
 tests/test_subtranslator_helper.py            | 60 +++++++++++---
 12 files changed, 202 insertions(+), 127 deletions(-)
 create mode 100644 src/jace/translator/managing.py
 create mode 100644 src/jace/translator/primitive_translators/__init__.py
 rename src/jace/translator/{sub_translators => primitive_translators}/alu_translator.py (98%)
 delete mode 100644 src/jace/translator/sub_translators/__init__.py

diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 042f82a..22f3182 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -10,6 +10,7 @@
 from __future__ import annotations
 
 from .jaxpr_translator_driver import JaxprTranslationDriver
+from .managing import add_subtranslator, get_subtranslators_cls
 from .primitive_translator import PrimitiveTranslator
 from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
@@ -18,4 +19,6 @@
     "JaxprTranslationDriver",
     "PrimitiveTranslator",
     "TranslatedJaxprSDFG",
+    "add_subtranslator",
+    "get_subtranslators_cls",
 ]
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index bf6eb23..e319bb8 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -8,8 +8,8 @@
 from __future__ import annotations
 
 import itertools
-from collections.abc import Collection, Iterable, Mapping, MutableSequence, Sequence
-from typing import Any, Final, cast, overload
+from collections.abc import Iterable, Mapping, MutableSequence, Sequence
+from typing import Any, Final, cast, overload, Literal
 
 import dace
 import jax
@@ -102,7 +102,7 @@ def translate_jaxpr(
         *,
         inp_scalar_as_array: bool = False,
         name: str | None = None,
-        reserved_names: str | Collection[str] | None = None,
+        reserved_names: str | Iterable[str] = (),
         allow_empty_jaxpr: bool = False,
     ) -> translator.TranslatedJaxprSDFG:
         """Perform the translation of a Jaxpr into a SDFG.
@@ -203,11 +203,12 @@ def append_new_state(
             self._ctx.terminal_state = new_state
         return new_state
 
-    def get_arrays(self) -> Mapping[str, ddata.Data]:
+    @property
+    def arrays(self) -> Mapping[str, ddata.Data]:
         """Get all `Data` descriptors that are currently known to the SDFG.
 
         Notes:
-            Essentially a shorthand and preferred way for `self.get_sdfg().arrays`.
+            Essentially a shorthand and preferred way for `self.sdfg.arrays`.
             For getting a specific data descriptor use `self.get_array()`.
         """
         return cast(Mapping[str, ddata.Data], self._ctx.sdfg.arrays)
@@ -270,14 +271,16 @@ def map_jax_var_to_sdfg(
             )
         return sdfg_name
 
-    def get_sdfg(self) -> dace.SDFG:
+    @property
+    def sdfg(self) -> dace.SDFG:
         """Returns the SDFG that is currently constructed.
 
-        If you want access to the arrays of the SDFG use `self.get_arrays()`/`self.get_array()`.
+        If you want access to the arrays of the SDFG use `self.arrays()`/`self.get_array()`.
         """
         return self._ctx.sdfg
 
-    def get_terminal_sdfg_state(self) -> dace.SDFGState:
+    @property
+    def terminal_sdfg_state(self) -> dace.SDFGState:
         """Returns the current terminal state of the SDFG under construction.
 
         The SDFGs that are constructed by the driver are essentially a list of states.
@@ -303,11 +306,11 @@ def is_root_translator(self) -> bool:
         if not self.is_allocated():
             raise RuntimeError("Driver is not allocated.")
         if self._ctx.rev_idx == 0:
-            assert len(self._ctx_stack) == 1
             return True
         return False
 
-    def get_rev_idx(self) -> int:
+    @property
+    def rev_idx(self) -> int:
         """Returns the revision index of `self`."""
         if not self.is_allocated():
             raise RuntimeError("Driver is not allocated.")
@@ -338,7 +341,7 @@ def add_jax_name_mapping(
                 f"Tried to create the mapping '{jax_var} -> {sdfg_name}', but '{jax_var}'"
                 f" already points to '{self.map_jax_var_to_sdfg(jax_var)}'."
             )
-        if sdfg_name not in self.get_arrays():
+        if sdfg_name not in self._ctx.sdfg.arrays:
             raise KeyError(f"Mapping '{jax_var} -> {sdfg_name}': SDFG target unknown.")
         if sdfg_name in self._forbidden_names:
             raise NameError(f"Mapping '{jax_var} -> {sdfg_name}': Forbidden name.")
@@ -348,15 +351,15 @@ def add_jax_name_mapping(
 
     def add_reserved_names(
         self,
-        reserved_names: None | str | Collection[str],
+        reserved_names: str | Iterable[str],
     ) -> JaxprTranslationDriver:
         """Adds the names listed in `reserved_names` to the internal list."""
 
-        if reserved_names is None:
+        if not reserved_names:
             return self
         if isinstance(reserved_names, str):
             reserved_names = [reserved_names]
-        elif isinstance(reserved_names, Collection):
+        elif isinstance(reserved_names, Iterable):
             pass
         else:
             raise TypeError(f"Does not know how to handle the type '{type(reserved_names)}'.")
@@ -723,7 +726,7 @@ def _create_constants(
     def _allocate_translation_ctx(
         self,
         name: str | None = None,
-        reserved_names: str | Collection[str] | None = None,
+        reserved_names: str | Iterable[str] = (),
     ) -> JaxprTranslationDriver:
         """This function allocates and initialize the members of the translation context of `self`.
 
@@ -772,12 +775,11 @@ def _init_sub_translators(
         The function forwards `kwargs` to the constructor of the subtranslators.
         However, it will remove all arguments starting with an underscore.
         """
-        from jace.translator import sub_translators  # Cyclic import
 
         subtrans_args = {k: v for k, v in subtrans_args.items() if not k.startswith("_")}
         prim_translators: dict[str, translator.PrimitiveTranslator] = {}
-        for prim_translator_cls in sub_translators._get_subtranslators_cls():
-            prim_translator: translator.PrimitiveTranslator = prim_translator_cls.CREATE(
+        for prim_translator_cls in translator.get_subtranslators_cls():
+            prim_translator: translator.PrimitiveTranslator = prim_translator_cls.build_translator(
                 **subtrans_args
             )
             handled_primitives: Iterable[str] = util.as_sequence(prim_translator.primitive)
@@ -864,7 +866,7 @@ def _translate_single_eqn(
         subtranslator: translator.PrimitiveTranslator = self._find_sub_translator_for(eqn)
 
         # Create the state into which the equation should be translated
-        last_term_state: dace.SDFGState = self.get_terminal_sdfg_state()  # noqa: F841 # Will be used later
+        last_term_state: dace.SDFGState = self.terminal_sdfg_state  # noqa: F841 # Will be used later
         eqn_state = self.append_new_state(
             label=f"{eqn.primitive.name}_{out_var_names[0]}",
             prev_state=None,  # forces terminal state to use
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
new file mode 100644
index 0000000..589b446
--- /dev/null
+++ b/src/jace/translator/managing.py
@@ -0,0 +1,82 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+"""Module for managing the individual sutranslators."""
+
+from __future__ import annotations
+
+from collections.abc import Callable, Sequence
+from typing import Literal, overload
+
+from jace import translator
+
+
+# List of all primitive translators that are known to Jace.
+#  They are filled through the `add_subtranslator()` decorator.
+#  See also the note in `get_subtranslators_cls()`
+_KNOWN_SUBTRANSLATORS: list[type[translator.PrimitiveTranslator]] = []
+
+
+@overload
+def add_subtranslator(
+    subtrans: Literal[None], /, overwrite: bool = False
+) -> Callable[[type[translator.PrimitiveTranslator]], type[translator.PrimitiveTranslator]]: ...
+
+
+@overload
+def add_subtranslator(
+    subtrans: type[translator.PrimitiveTranslator], /, overwrite: bool = False
+) -> type[translator.PrimitiveTranslator]: ...
+
+
+def add_subtranslator(
+    subtrans: type[translator.PrimitiveTranslator] | None = None,
+    /,
+    overwrite: bool = False,
+) -> (
+    type[translator.PrimitiveTranslator]
+    | Callable[[type[translator.PrimitiveTranslator]], type[translator.PrimitiveTranslator]]
+):
+    """Decorator to add `subtrans` to the list of known subtranslators.
+
+    If a class is tried to be registered twice an error will be generated unless, `overwrite` is set.
+    """
+    if subtrans is None:
+
+        def wrapper(
+            real_subtrans: type[translator.PrimitiveTranslator],
+        ) -> type[translator.PrimitiveTranslator]:
+            return add_subtranslator(real_subtrans, overwrite=overwrite)
+
+        return wrapper
+
+    if subtrans in _KNOWN_SUBTRANSLATORS:
+        if overwrite:
+            _KNOWN_SUBTRANSLATORS.remove(subtrans)
+        else:
+            raise ValueError(
+                f"Tried to add '{type(subtrans).__name__}' twice to the list of known primitive translators."
+            )
+
+    _KNOWN_SUBTRANSLATORS.append(subtrans)
+    return subtrans
+
+
+def get_subtranslators_cls() -> Sequence[type[translator.PrimitiveTranslator]]:
+    """Returns the list of all subtranslator known to JaCe.
+
+    The subtranslators are returned in FIFO order.
+    """
+    # There is a chicken-egg problem, i.e. circular import, if we use the decorator to add the build in classes.
+    #  The problem is, that they are only run, i.e. added to the list, upon importing.
+    #  Thus we have to explicitly import the subtranslator, but this would then lead to a circular import.
+    #  For that reason we import the subpackage here explicitly.
+    #  However, this requires that all are imported by the `__init__.py` file.
+    #  I do not know a way to do this better.
+    #  Actually I want to do it somehow upon the importation of `jace` itself.
+    from jace.translator import primitive_translators  # noqa: F401  # Unused import
+
+    return list(reversed(_KNOWN_SUBTRANSLATORS))
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index a1f34e6..fa717aa 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -32,7 +32,7 @@ class PrimitiveTranslator(Protocol):
     A translator for a primitive translates a single equation of a Jaxpr into its SDFG equivalent.
     A type that implements this interface must fulfil the following properties:
     - It must be immutable after construction.
-    - All subclass must implement the class method `CREATE()` to construct an instance.
+    - All subclass must implement the class method `build_translator()` to construct an instance.
 
     Subtranslators are simple, but highly specialized objects that are only able to perform the translation of a single primitive.
     The overall translation process itself is managed by a driver object, which also owns and manage the subtranslators.
@@ -49,7 +49,7 @@ class PrimitiveTranslator(Protocol):
 
     @classmethod
     @abstractmethod
-    def CREATE(
+    def build_translator(
         cls,
         *args: Any,
         **kwargs: Any,
@@ -90,7 +90,7 @@ def translate_jaxeqn(
             They are passed as `out_var_names`, same order as in the equation.
         - The driver will create a new terminal state and pass it as
             `eqn_state` argument. This state is guaranteed to be empty and
-            `translator.get_terminal_sdfg_state() is eqn_state` holds.
+            `translator.terminal_sdfg_state is eqn_state` holds.
 
         Then the subtranslator is called.
         Usually a subtranslator should construct the dataflow graph inside `eqn_state`.
diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
new file mode 100644
index 0000000..08bff9d
--- /dev/null
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -0,0 +1,16 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+"""Module collecting all built-in subtranslators."""
+
+from __future__ import annotations
+
+from .alu_translator import ALUTranslator
+
+
+__all__ = [
+    "ALUTranslator",
+]
diff --git a/src/jace/translator/sub_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
similarity index 98%
rename from src/jace/translator/sub_translators/alu_translator.py
rename to src/jace/translator/primitive_translators/alu_translator.py
index 23f0cb3..9f7aa44 100644
--- a/src/jace/translator/sub_translators/alu_translator.py
+++ b/src/jace/translator/primitive_translators/alu_translator.py
@@ -20,6 +20,7 @@
 from jace import translator
 
 
+@translator.add_subtranslator
 class ALUTranslator(translator.PrimitiveTranslator):
     """This translator handles all arithmetic and logical operations."""
 
@@ -70,7 +71,7 @@ class ALUTranslator(translator.PrimitiveTranslator):
     }
 
     @classmethod
-    def CREATE(
+    def build_translator(
         cls,
         *args: Any,
         **kwargs: Any,
@@ -168,7 +169,7 @@ def translate_jaxeqn(
                     raise ValueError(f"Invalid shapes in dimension {dim} for broadcasting.")
 
         # Now we create the Tasklet in which the calculation is performed.
-        tskl_code: str = self._writeTaskletCode(in_var_names, eqn)
+        tskl_code: str = self._write_tasklet_code(in_var_names, eqn)
         tskl_name: str = eqn.primitive.name
         tskl_map_ranges: list[tuple[str, str]] = [
             (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
@@ -240,7 +241,7 @@ def translate_jaxeqn(
 
         return eqn_state
 
-    def _writeTaskletCode(
+    def _write_tasklet_code(
         self,
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
diff --git a/src/jace/translator/sub_translators/__init__.py b/src/jace/translator/sub_translators/__init__.py
deleted file mode 100644
index 7e52b28..0000000
--- a/src/jace/translator/sub_translators/__init__.py
+++ /dev/null
@@ -1,52 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-"""Module collecting all built-in subtranslators."""
-
-from __future__ import annotations
-
-from collections.abc import Sequence
-
-from jace import translator
-
-from .alu_translator import ALUTranslator
-
-
-# List of all subtranslators that ships with JaCe.
-_KNOWN_SUBTRANSLATORS: list[type[translator.PrimitiveTranslator]] = [
-    ALUTranslator,
-]
-
-
-def add_subtranslator(
-    subtrans: type[translator.PrimitiveTranslator],
-) -> bool:
-    """Add `subtrans` to the externally defined subtranslators.
-
-    The function returns `True` if it was added and `False` is not.
-    """
-    # NOTE: Because `PrimitiveTranslator` has a property, it is not possible to use
-    #         `issubclass()` here, to check if the interface is ready implemented.
-    if subtrans in _KNOWN_SUBTRANSLATORS:
-        # TODO: Consider moving `subtrans` to the front (last element).
-        return False
-    _KNOWN_SUBTRANSLATORS.append(subtrans)
-    return True
-
-
-def _get_subtranslators_cls() -> Sequence[type[translator.PrimitiveTranslator]]:
-    """Returns the list of all subtranslator known to JaCe.
-
-    The translators are returned in FIFO order.
-    """
-    return list(reversed(_KNOWN_SUBTRANSLATORS))
-
-
-__all__ = [
-    "ALUTranslator",
-    "add_subtranslator",
-    "PrimitiveTranslator",
-]
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 369572c..17457b8 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -7,7 +7,6 @@
 
 from __future__ import annotations
 
-from collections.abc import MutableMapping
 from dataclasses import dataclass
 
 import dace
@@ -16,7 +15,7 @@
 from jace import util
 
 
-@dataclass(slots=True)
+@dataclass
 class TranslatedJaxprSDFG:
     """Encapsulates the result of a translation run of the `JaxprTranslationDriver` object.
 
@@ -44,7 +43,7 @@ class TranslatedJaxprSDFG:
     """
 
     sdfg: dace.SDFG
-    jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str]
+    jax_name_map: dict[jax_core.Var | util.JaCeVar, str]
     start_state: dace.SDFGState
     terminal_state: dace.SDFGState
     inp_names: tuple[str, ...]
@@ -67,15 +66,13 @@ def __init__(
         if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
-        self.sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
-        self.start_state: dace.SDFGState = self.sdfg.add_state(
-            label="initial_state", is_start_block=True
-        )
-        self.terminal_state: dace.SDFGState = self.start_state
-        self.jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str] = {}
-        self.inp_names: tuple[str, ...] = ()
-        self.out_names: tuple[str, ...] = ()
-        self.rev_idx: int = rev_idx
+        self.sdfg = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
+        self.start_state = self.sdfg.add_state(label="initial_state", is_start_block=True)
+        self.terminal_state = self.start_state
+        self.jax_name_map = {}
+        self.inp_names = ()
+        self.out_names = ()
+        self.rev_idx = rev_idx
 
     def validate(self) -> bool:
         """Validate the underlying SDFG."""
diff --git a/src/jace/util/debug.py b/src/jace/util/debug.py
index 23aee23..d4ae754 100644
--- a/src/jace/util/debug.py
+++ b/src/jace/util/debug.py
@@ -21,10 +21,7 @@
 from jace import translator
 
 
-def run_jax_sdfg(
-    jsdfg: translator.TranslatedJaxprSDFG,
-    *args: Any,
-) -> tuple[Any, ...] | Any:
+def run_jax_sdfg(jsdfg: translator.TranslatedJaxprSDFG, *args: Any) -> tuple[Any, ...] | Any:
     """Calls the SDFG that is encapsulated with the supplied arguments.
 
     Notes:
@@ -84,11 +81,7 @@ def run_jax_sdfg(
             jsdfg.sdfg.arrays[name].transient = True
 
 
-def _jace_run(
-    fun: Callable,
-    *args: Any,
-    **kwargs: Any,
-) -> Any:
+def _jace_run(fun: Callable, *args: Any, **kwargs: Any) -> Any:
     """Traces and run function `fun` using `Jax | DaCe`.
 
     Args:
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 0ea37a1..0de9934 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -42,7 +42,7 @@ class JaCeVar:
     """
 
     name: str
-    shape: tuple[int | dace.symbol | str, ...] | tuple[()]
+    shape: tuple[int | dace.symbol | str, ...]
     dtype: dace.typeclass
 
     def __hash__(self) -> int:
@@ -93,16 +93,14 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar | str) -> str:
 
 
 @overload
-def get_jax_var_shape(jax_var: JaCeVar) -> tuple[int | dace.symbol | str, ...] | tuple[()]: ...
+def get_jax_var_shape(jax_var: JaCeVar) -> tuple[int | dace.symbol | str, ...]: ...  # type: ignore[overload-overlap]
 
 
 @overload
-def get_jax_var_shape(jax_var: jax_core.Atom) -> tuple[int, ...] | tuple[()]: ...
+def get_jax_var_shape(jax_var: jax_core.Atom) -> tuple[int, ...]: ...
 
 
-def get_jax_var_shape(
-    jax_var: jax_core.Atom | JaCeVar,
-) -> tuple[int | dace.symbol | str, ...] | tuple[()]:
+def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symbol | str, ...]:
     """Returns the shape of a Jax variable.
 
     Args:
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 975fcbb..16cdfe3 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -38,14 +38,14 @@ def test_driver_alloc() -> None:
     sdfg_name = "qwertzuiopasdfghjkl"
     driver._allocate_translation_ctx(name=sdfg_name)
 
-    sdfg: dace.SDFG = driver.get_sdfg()
+    sdfg: dace.SDFG = driver.sdfg
 
     assert driver._ctx.sdfg is sdfg
-    assert driver.get_sdfg().name == sdfg_name
+    assert driver.sdfg.name == sdfg_name
     assert sdfg.number_of_nodes() == 1
     assert sdfg.number_of_edges() == 0
     assert sdfg.start_block is driver._ctx.start_state
-    assert driver.get_terminal_sdfg_state() is driver._ctx.start_state
+    assert driver.terminal_sdfg_state is driver._ctx.start_state
 
 
 def test_driver_nested() -> None:
@@ -78,11 +78,6 @@ def test_driver_nested() -> None:
     assert driver._ctx is driver._ctx_stack[-1]
     assert driver._ctx is not driver._ctx_stack[0]
 
-    for member_name in driver._ctx.__slots__:
-        org = getattr(org_ctx, member_name)
-        nest = getattr(driver._ctx, member_name)
-        assert org is not nest, f"Detected sharing for '{member_name}'"
-
     assert org_ctx.rev_idx < driver._ctx.rev_idx
 
     # Now we go back one state, i.e. pretend that we are done with translating the nested jaxpr.
@@ -99,13 +94,13 @@ def test_driver_nested() -> None:
 
 def test_driver_append_state(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
     """Tests the functionality of appending states."""
-    sdfg: dace.SDFG = alloc_driver.get_sdfg()
+    sdfg: dace.SDFG = alloc_driver.sdfg
 
     terminal_state_1: dace.SDFGState = alloc_driver.append_new_state("terminal_state_1")
     assert sdfg.number_of_nodes() == 2
     assert sdfg.number_of_edges() == 1
-    assert terminal_state_1 is alloc_driver.get_terminal_sdfg_state()
-    assert alloc_driver.get_terminal_sdfg_state() is alloc_driver._ctx.terminal_state
+    assert terminal_state_1 is alloc_driver.terminal_sdfg_state
+    assert alloc_driver.terminal_sdfg_state is alloc_driver._ctx.terminal_state
     assert alloc_driver._ctx.start_state is sdfg.start_block
     assert alloc_driver._ctx.start_state is not terminal_state_1
     assert next(iter(sdfg.edges())).src is sdfg.start_block
@@ -117,7 +112,7 @@ def test_driver_append_state(alloc_driver: jtrans.JaxprTranslationDriver) -> Non
     )
     assert sdfg.number_of_nodes() == 3
     assert sdfg.number_of_edges() == 2
-    assert terminal_state_2 is alloc_driver.get_terminal_sdfg_state()
+    assert terminal_state_2 is alloc_driver.terminal_sdfg_state
     assert sdfg.out_degree(terminal_state_1) == 1
     assert sdfg.out_degree(terminal_state_2) == 0
     assert sdfg.in_degree(terminal_state_2) == 1
@@ -127,7 +122,7 @@ def test_driver_append_state(alloc_driver: jtrans.JaxprTranslationDriver) -> Non
     non_terminal_state: dace.SDFGState = alloc_driver.append_new_state(
         "non_terminal_state", prev_state=terminal_state_1
     )
-    assert alloc_driver.get_terminal_sdfg_state() is not non_terminal_state
+    assert alloc_driver.terminal_sdfg_state is not non_terminal_state
     assert sdfg.in_degree(non_terminal_state) == 1
     assert sdfg.out_degree(non_terminal_state) == 0
     assert next(iter(sdfg.in_edges(non_terminal_state))).src is terminal_state_1
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 4c7ddd8..e50f9a5 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -9,23 +9,27 @@
 
 from __future__ import annotations
 
+import re
+
+import pytest
+
 from jace import translator as jtrans
 
 
 def test_subtranslatior_managing():
     """Ensures the functionality of the subtranslator managing."""
-    from jace.translator.sub_translators import (
-        _get_subtranslators_cls,
+    from jace.translator import (
         add_subtranslator,
+        get_subtranslators_cls,
     )
 
     # These are all initial subtranslators
-    builtin_subtrans_cls = _get_subtranslators_cls()
+    builtin_subtrans_cls = get_subtranslators_cls()
 
     # Definitions of some classes to help.
     class SubTrans1(jtrans.PrimitiveTranslator):
         @classmethod
-        def CREATE(cls) -> SubTrans1:
+        def build_translator(cls) -> SubTrans1:
             return SubTrans1()
 
         @property
@@ -37,7 +41,7 @@ def translate_jaxeqn(self) -> None:  # type: ignore[override]  # Arguments
 
     class SubTrans2(jtrans.PrimitiveTranslator):
         @classmethod
-        def CREATE(cls) -> SubTrans2:
+        def build_translator(cls) -> SubTrans2:
             return SubTrans2()
 
         @property
@@ -47,21 +51,57 @@ def primitive(self):
         def translate_jaxeqn(self) -> None:  # type: ignore[override]  # Arguments
             return None
 
+    assert SubTrans1 != SubTrans2
+
     # Adding the first subtranslator to the list.
-    assert add_subtranslator(SubTrans1)
+    add_subtranslator(SubTrans1)
 
-    curr_subtrans_cls = _get_subtranslators_cls()
+    curr_subtrans_cls = get_subtranslators_cls()
     assert len(curr_subtrans_cls) == len(builtin_subtrans_cls) + 1
-    assert [SubTrans1, *builtin_subtrans_cls] == curr_subtrans_cls
+    assert all(
+        type(exp) == type(got)
+        for exp, got in zip([SubTrans1, *builtin_subtrans_cls], curr_subtrans_cls)
+    )
 
     # Now adding the second subtranslator
-    assert add_subtranslator(SubTrans2)
+    add_subtranslator(SubTrans2)
 
-    curr_subtrans_cls2 = _get_subtranslators_cls()
+    curr_subtrans_cls2 = get_subtranslators_cls()
     assert len(curr_subtrans_cls2) == len(builtin_subtrans_cls) + 2
     assert [SubTrans2, SubTrans1, *builtin_subtrans_cls] == curr_subtrans_cls2
     assert curr_subtrans_cls2 is not curr_subtrans_cls
 
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=re.escape(
+            f"Tried to add '{type(SubTrans1).__name__}' twice to the list of known primitive translators."
+        ),
+    ):
+        add_subtranslator(SubTrans2)
+
+    @add_subtranslator
+    class SubTrans3(jtrans.PrimitiveTranslator):
+        @classmethod
+        def build_translator(cls) -> SubTrans2:
+            return SubTrans2()
+
+        @property
+        def primitive(self):
+            return "non_existing_primitive2"
+
+        def translate_jaxeqn(self) -> None:  # type: ignore[override]  # Arguments
+            return None
+
+    curr_subtrans_cls3 = get_subtranslators_cls()
+    assert len(curr_subtrans_cls3) == len(builtin_subtrans_cls) + 3
+    assert [SubTrans3, SubTrans2, SubTrans1, *builtin_subtrans_cls] == curr_subtrans_cls3
+
+    # Adding version 1 again, but this time using overwrite
+    add_subtranslator(SubTrans1, overwrite=True)
+    curr_subtrans_cls4 = get_subtranslators_cls()
+    assert len(curr_subtrans_cls3) == len(curr_subtrans_cls4)
+    assert [SubTrans1, SubTrans3, SubTrans2, *builtin_subtrans_cls] == curr_subtrans_cls4
+
 
 if __name__ == "__main__":
     test_subtranslatior_managing()

From c00a9421d7bdcaf244a9f3f1330ce720ba629193 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 14 May 2024 15:58:19 +0200
Subject: [PATCH 151/458] Started with implementing a better stage process.

The main point, which might not be liked, is that there is now a `FinalizedJaxprSDFG` object, which is essentially a compressed verison of a `TranslatedJaxprSDFG`.
---
 src/jace/jax/stages/jace_lowered.py           |  60 ++++----
 src/jace/jax/stages/jace_wrapped.py           |  22 +--
 src/jace/optimization/__init__.py             |  39 +++++
 .../translator/jaxpr_translator_driver.py     |   3 +-
 src/jace/translator/post_translation.py       | 138 ++++++++++++++++++
 src/jace/util/compiling.py                    | 124 ++++++++--------
 tests/test_decorator.py                       |   3 +-
 7 files changed, 286 insertions(+), 103 deletions(-)
 create mode 100644 src/jace/optimization/__init__.py
 create mode 100644 src/jace/translator/post_translation.py

diff --git a/src/jace/jax/stages/jace_lowered.py b/src/jace/jax/stages/jace_lowered.py
index 44e4d0a..2dae9a2 100644
--- a/src/jace/jax/stages/jace_lowered.py
+++ b/src/jace/jax/stages/jace_lowered.py
@@ -12,16 +12,17 @@
 import json
 from typing import Any, Final
 
-from jace import translator, util
+from jace import optimization, util
 from jace.jax import stages
 from jace.jax.stages import translation_cache as tcache
+from jace.translator import post_translation as ptrans
 from jace.util import dace_helper as jdace
 
 
 class JaceLowered(stages.Stage):
     """Represents the original computation that was lowered to SDFG."""
 
-    _translated_sdfg: translator.TranslatedJaxprSDFG
+    _trans_sdfg: ptrans.FinalizedJaxprSDFG
 
     DEF_COMPILER_OPTIONS: Final[dict[str, Any]] = {
         "auto_opt": True,
@@ -30,54 +31,49 @@ class JaceLowered(stages.Stage):
 
     def __init__(
         self,
-        translated_sdfg: translator.TranslatedJaxprSDFG,
+        trans_sdfg: ptrans.FinalizedJaxprSDFG,
     ) -> None:
         """Constructs the wrapper."""
-        if translated_sdfg.inp_names is None:
+        if trans_sdfg.inp_names is None:
             raise ValueError("Input names must be defined.")
-        if translated_sdfg.out_names is None:
+        if trans_sdfg.out_names is None:
             raise ValueError("Output names must be defined.")
-        self._translated_sdfg = translated_sdfg
-
-    def optimize(
-        self,
-        **kwargs: Any,  # noqa: ARG002  # Unused argument
-    ) -> JaceLowered:
-        """Perform optimization _inplace_ and return `self`.
-
-        Notes:
-            Currently no optimization is performed.
-        """
-        # TODO(phimuell): Think really hard what we should do here, to avoid strange behaviour.
-        #                   I am not fully sure if we should include the SDFG value in the caching.
-
-        # TODO(phimuell):
-        #   - remove the inplace modification.
-        #   - Somehow integrate it into the caching strategy.
-        #
-        #  If we would not integrate it into the caching strategy, then calling `lower()` on
-        #  the wrapped object would return the original object, but with a modified, already optimized SDFG.
-        return self
+        if trans_sdfg.csdfg is not None:
+            raise ValueError("SDFG is already compiled.")
+        self._trans_sdfg = trans_sdfg
 
     @tcache.cached_translation
     def compile(
         self,
-        compiler_options: stages.CompilerOptions | None = None,  # noqa: ARG002  # Unused arguments
+        compiler_options: stages.CompilerOptions | None = None,  # Unused arguments
     ) -> stages.JaceCompiled:
         """Compile the SDFG.
 
         Returns an Object that encapsulates a compiled SDFG object.
         """
-        csdfg: jdace.CompiledSDFG = util.compile_jax_sdfg(self._translated_sdfg)
+        from copy import deepcopy
+
+        # The reason why we have to deepcopy the SDFG
+        #  All optimization DaCe functions works in place, if we would not copy the SDFG first, then we would have a problem.
+        #  Because, these optimization would then have a feedback of the SDFG object which is stored inside `self`.
+        #  Thus if we would run this code `(jaceLoweredObject := jaceWrappedObject.lower()).compile({opti=True})` would return an optimized object.
+        #  However, if we would now call `jaceWrappedObject.lower()` (with the same arguments as before, we would get `jaceLoweredObject`,
+        #  but it would actually contain an already optimized SDFG, which is not what we want.
+        fsdfg: ptrans.FinalizedJaxprSDFG = deepcopy(self._trans_sdfg)
+        optimization.jace_auto_optimize(
+            fsdfg, **({} if compiler_options is None else compiler_options)
+        )
+        csdfg: jdace.CompiledSDFG = util.compile_jax_sdfg(fsdfg, cache=False)
+
         return stages.JaceCompiled(
             csdfg=csdfg,
-            inp_names=self._translated_sdfg.inp_names,
-            out_names=self._translated_sdfg.out_names,
+            inp_names=fsdfg.inp_names,
+            out_names=fsdfg.out_names,
         )
 
-    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
+    def compiler_ir(self, dialect: str | None = None) -> ptrans.FinalizedJaxprSDFG:
         if (dialect is None) or (dialect.upper() == "SDFG"):
-            return self._translated_sdfg
+            return self._trans_sdfg
         raise ValueError(f"Unknown dialect '{dialect}'.")
 
     def as_html(self, filename: str | None = None) -> None:
diff --git a/src/jace/jax/stages/jace_wrapped.py b/src/jace/jax/stages/jace_wrapped.py
index b017b8d..439512b 100644
--- a/src/jace/jax/stages/jace_wrapped.py
+++ b/src/jace/jax/stages/jace_wrapped.py
@@ -10,6 +10,7 @@
 from __future__ import annotations
 
 from collections.abc import Callable
+from functools import update_wrapper
 from typing import Any
 
 import jax as jax_jax
@@ -17,6 +18,7 @@
 from jace import translator, util
 from jace.jax import stages
 from jace.jax.stages import translation_cache as tcache
+from jace.translator import post_translation as ptrans
 
 
 class JaceWrapped(stages.Stage):
@@ -46,6 +48,11 @@ def __init__(
         assert fun is not None
         self._fun: Callable = fun
 
+        # Makes that `self` is a true stand-in for `fun`
+        #  This will also add a `__wrapped__` property to `self` which is not part of the interface.
+        # TODO(phimuell): modify text to make it clear that it is wrapped, Jax does the same.
+        update_wrapper(self, self._fun)
+
     def __call__(
         self,
         *args: Any,
@@ -62,7 +69,7 @@ def __call__(
 
         # TODO(phimuell): Handle static arguments correctly
         #                   https://jax.readthedocs.io/en/latest/aot.html#lowering-with-static-arguments
-        return self.lower(*args, **kwargs).optimize().compile()(*args, **kwargs)
+        return self.lower(*args, **kwargs).compile()(*args, **kwargs)
 
     @tcache.cached_translation
     def lower(
@@ -84,13 +91,10 @@ def lower(
 
         jaxpr = jax_jax.make_jaxpr(self._fun)(*real_args)
         driver = translator.JaxprTranslationDriver()
-        translated_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
-        return stages.JaceLowered(translated_sdfg)
+        trans_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
 
-    @property
-    def __wrapped__(self) -> Callable:
-        """Returns the wrapped function.
+        fin_sdfg: ptrans.FinalizedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
+            tsdfg=trans_sdfg, fun=self.__wrapped__
+        )
 
-        This is a Jace extension.
-        """
-        return self._fun
+        return stages.JaceLowered(fin_sdfg)
diff --git a/src/jace/optimization/__init__.py b/src/jace/optimization/__init__.py
new file mode 100644
index 0000000..511d446
--- /dev/null
+++ b/src/jace/optimization/__init__.py
@@ -0,0 +1,39 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Module that will host all optimization functions specific to Jace.
+
+Currently it is just a dummy that exports some functions that do nothing.
+"""
+
+from __future__ import annotations
+
+import dace
+
+from jace.translator import post_translation as ptrans
+
+
+def jace_auto_optimize(
+    fsdfg: ptrans.FinalizedJaxprSDFG,
+    simplify: bool = True,
+    **kwargs: str | bool,  # noqa: ARG001  # Unused argument, for now
+) -> dace.SDFG:
+    """Performs optimization of the `fsdfg` _inplace_ and returns it.
+
+    Currently this function only supports simplification.
+    Its main job is to exists that we have something that we can call in the tool chain.
+    """
+    if simplify:
+        fsdfg.sdfg.simplify()
+
+    fsdfg.validate()
+    return fsdfg
+
+
+__all__ = [
+    "jace_auto_optimize",
+]
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index f9ff13c..8a0c9e2 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -31,7 +31,8 @@ class JaxprTranslationDriver:
     - the `arg_names` parameter is not set.
 
     For these reasons the SDFG is not directly usable, and further manipulations have to be performed.
-    TBA where to look for them.
+    Especially, DaCe's validation function will fail and it is unable to be perocessed by the optimization pipeline.
+    For more information also see `jace.translator.post_translation` module for more information.
 
     The idea of the translator is extremely simple. Since Jaxpr is a list
     consisting of more or less simple instructions/equations, they get processed
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
new file mode 100644
index 0000000..c0b3ab8
--- /dev/null
+++ b/src/jace/translator/post_translation.py
@@ -0,0 +1,138 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""This module contains all functions that are related to post processing the SDFG.
+
+Most of them operate on `TranslatedJaxprSDFG` objects.
+"""
+
+from __future__ import annotations
+
+from collections.abc import Callable
+from dataclasses import dataclass
+
+import dace
+
+from jace import translator
+from jace.util import dace_helper as jdace
+
+
+def postprocess_jaxpr_sdfg(
+    tsdfg: translator.TranslatedJaxprSDFG,
+    fun: Callable,  # noqa: ARG001  # Currently unused
+) -> FinalizedJaxprSDFG:
+    """Perform the final postprocessing step on the SDFG and returns a finalized version.
+
+    The function will not modify the passed `tsdfg` object (`TranslatedJaxprSDFG`).
+    The returned object is of type `FinalizedJaxprSDFG` and is decoupled from the input,
+    such that there is no feedback.
+
+    Args:
+        tsdfg:  The translated SDFG object.
+        fun:    The original function that we translated.
+    """
+    # Currently we do nothing except finalizing.
+    return finalize_jaxpr_sdfg(tsdfg)
+
+
+def finalize_jaxpr_sdfg(
+    trans_sdfg: translator.TranslatedJaxprSDFG,
+) -> FinalizedJaxprSDFG:
+    """Finalizes the supplied `trans_sdfg` object.
+
+    The returned object is guaranteed to be decoupled from the supplied `TranslatedJaxprSDFG`.
+    You should use this function after you have performed all necessary postprocessing for which you need the meta data of the translation.
+    The returned object is meant as input for jace's optimization pipeline.
+
+    Note:
+        For several reasons this function performs a deep copy of the associated SDFG.
+            The enter toolchain assumes and relies on this fact.
+    """
+    # Check if the outputs are defined.
+    if trans_sdfg.inp_names is None:
+        raise ValueError("Input names are not specified.")
+    if trans_sdfg.out_names is None:
+        raise ValueError("Output names are not specified.")
+
+    # We do not support the return value mechanism that dace provides us.
+    #  The reasons for that are that the return values are always shared and the working with pytrees is not yet understood.
+    #  Thus we make the safe choice by passing all as arguments.
+    assert not any(
+        arrname.startswith("__return")
+        for arrname in trans_sdfg.sdfg.arrays.keys()  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
+    ), "Only support SDFGs without '__return' members."
+
+    # We perform a deepcopy by serializing it, as deepcopy is known for having some issues.
+    sdfg = dace.SDFG.from_json(trans_sdfg.sdfg.to_json())
+    inp_names = trans_sdfg.inp_names
+    out_names = trans_sdfg.out_names
+
+    # Canonical SDFGs do not have global memory, so we must transform it
+    sdfg_arg_names: list[str] = []
+    for glob_name in inp_names + out_names:
+        if glob_name in sdfg_arg_names:  # Donated arguments
+            continue
+        sdfg.arrays[glob_name].transient = False
+        sdfg_arg_names.append(glob_name)
+
+    # This forces the signature of the SDFG to include all arguments in order they appear.
+    #  If an argument is reused (donated) then it is only listed once, the first time it appears
+    sdfg.arg_names = sdfg_arg_names
+
+    return FinalizedJaxprSDFG(sdfg=sdfg, inp_names=inp_names, out_names=out_names)
+
+
+@dataclass(init=True, eq=False, frozen=False)
+class FinalizedJaxprSDFG:
+    """This is the final stage of the post processing of the translation.
+
+    Instances of these class only contains enough information to run, but all other meta data associated to tarnslation are lost.
+    The idea of this class is that they can be feed to the optimization pipeline of Jace.
+    The SDFG that is inside `self` my not be optimized, but input and outputs are marked as global and they have a valid `arg_names` property.
+
+    SDFG encapsulated in `TranslatedJaxprSDFG` is in canonical form, which is not usable, finalized SDFGs are always valid.
+    They have:
+    - All input an output arrays are marked as global.
+    - It does not have `__return` values, i.e. all arguments are passed as arguments.
+    - Its `arg_names` are set with set `inp_names + out_names`, however,
+        arguments that are input and outputs are only listed as inputs.
+
+    Notes:
+        The main reason this class exists is, because optimizations are done in the `JaceLowered.compile()` function.
+            All DaCe functions in that regards are in place, if we would not copy the SDFG first, then we would have a problem.
+            Because these optimization would then have a feedback of the SDFG object which is stored in one way or the other
+            inside the `JaceLowered` object, which is wrong because `jaceLoweredObject.compile(no_opti=False)` and
+            `jaceLoweredObject.compile(no_opti=True)` will result in different objects but the SDFG is the same one, i.e. the optimized one.
+            It also makes sense, to remove all the unnecessary stuff that is part of the `TranslatedJaxprSDFG` but does not serve any purpose
+            inside the optimization pipeline.
+    """
+
+    sdfg: dace.SDFG
+    inp_names: tuple[str, ...]
+    out_names: tuple[str, ...]
+    csdfg: jdace.CompiledSDFG | None = None
+
+    def __post_init__(self) -> None:
+        self.validate()
+
+    def validate(self) -> bool:
+        """Checks if the embedded SDFG is valid."""
+        if any(arrname.startswith("__return") for arrname in self.sdfg.arrays.keys()):  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
+            raise dace.sdfg.InvalidSDFGError(
+                "There are no output arguments.",
+                self.sdfg,
+                self.sdfg.node_id(self.sdfg.start_state),
+            )
+        for glob_name in self.inp_names + self.out_names:
+            if self.sdfg.arrays[glob_name].transient:
+                raise dace.sdfg.InvalidSDFGError(
+                    f"Argument '{glob_name}' is a transient.",
+                    self.sdfg,
+                    self.sdfg.node_id(self.sdfg.start_state),
+                )
+        self.sdfg.validate()
+        return True
diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index 95b05c0..8cfcdef 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -18,21 +18,22 @@
 
 import dace
 
-from jace import translator
+from jace.translator import post_translation as ptrans
 from jace.util import dace_helper as jdace
 
 
 def compile_jax_sdfg(
-    jsdfg: translator.TranslatedJaxprSDFG,
+    jsdfg: ptrans.FinalizedJaxprSDFG,
+    cache: bool = True,
 ) -> jdace.CompiledSDFG:
-    """This function compiles the embedded SDFG and return it.
+    """This function compiles the sdfg embedded in the `FinalizedJaxpr` object and returns it.
 
-    The SDFG is compiled in a very special way, i.e. all arguments and return values have to be passed as arguments.
+    By default the function will store the resulting `CompiledSDFG` object inside `jsdfg` (`FinalizedJaxprSDFG`).
+    However, by setting `cache` to `False` the respective field will not be modified.
 
     Notes:
         Currently the SDFG must not have any undefined symbols, i.e. no undefined sizes.
     """
-    from copy import deepcopy
     from time import time
 
     if not jsdfg.inp_names:
@@ -49,64 +50,39 @@ def compile_jax_sdfg(
             f"No externally defined symbols are allowed, found: {jsdfg.sdfg.free_symbols}"
         )
 
-    # We will now deepcopy the SDFG.
-    #  We do this because the SDFG is also a member of the `CompiledSDFG` object.
-    #  And currently we rely on the integrity of this object in the run function,
-    #  i.e. in the allocation of the return values as well as `arg_names`.
-    sdfg: dace.SDFG = deepcopy(jsdfg.sdfg)
-
-    # We need to give the SDFG another name, this is needed to prevent a DaCe error/warning.
-    #  This happens if we compile the same lowered SDFG multiple times with different options.
-    #  We allow this because Jax allows this too, this is also a reason why we copy the SDFG.
-    sdfg.name = f"{sdfg.name}__comp_{int(time() * 1000)}"
-
-    # Canonical SDFGs do not have global memory, so we must transform it
-    sdfg_arg_names: list[str] = []
-    for glob_name in jsdfg.inp_names + jsdfg.out_names:
-        if glob_name in sdfg_arg_names:  # Donated arguments
-            continue
-        sdfg.arrays[glob_name].transient = False
-        sdfg_arg_names.append(glob_name)
-
-    # This forces the signature of the SDFG to include all arguments in order they appear.
-    sdfg.arg_names = sdfg_arg_names
+    # To ensure that the SDFG is compiled and to get rid of a warning we must modify
+    #  some settings of the SDFG. To fake an immutable SDFG, we will restore them later.
+    sdfg: dace.SDFG = jsdfg.sdfg
+    org_sdfg_name: str = sdfg.name
+    org_recompile: bool = sdfg._recompile
+    org_regenerate_code: bool = sdfg._regenerate_code
+
+    try:
+        # We need to give the SDFG another name, this is needed to prevent a DaCe error/warning.
+        #  This happens if we compile the same lowered SDFG multiple times with different options.
+        sdfg.name = f"{sdfg.name}__comp_{int(time() * 1000)}"
+
+        # Actual compiling the stuff; forcing that a recompilation happens
+        with dace.config.temporary_config():
+            sdfg._recompile = True
+            sdfg._regenerate_code = True
+            dace.Config.set("compiler", "use_cache", value=False)
+            csdfg: jdace.CompiledSDFG = sdfg.compile()
+
+    finally:
+        sdfg.name = org_sdfg_name
+        sdfg._recompile = org_recompile
+        sdfg._regenerate_code = org_regenerate_code
+
+    # Storing the compiled SDFG for later use.
+    if cache:
+        jsdfg.csdfg = csdfg
 
-    # Actual compiling the stuff
-    csdfg: jdace.CompiledSDFG = sdfg.compile()
     return csdfg
 
 
 @singledispatch
 def run_jax_sdfg(
-    jsdfg: translator.TranslatedJaxprSDFG,
-    /,
-    *args: Any,
-    **kwargs: Any,
-) -> tuple[Any, ...] | Any:
-    """Execute a `TranslatedJaxprSDFG` object directly.
-
-    Notes:
-        This function is used for debugging purposes and you should use the `jace.jit` annotation instead.
-        The function either returns a value or a tuple of values, i.e. no pytree.
-        There is an overload of this function that accepts an already compiled SDFG and runs it.
-    """
-    if jsdfg.inp_names is None:
-        raise ValueError("Input names are not specified.")
-    if jsdfg.out_names is None:
-        raise ValueError("Output names are not specified.")
-    csdfg: jdace.CompiledSDFG = compile_jax_sdfg(jsdfg)
-
-    return run_jax_sdfg(
-        csdfg,
-        jsdfg.inp_names,
-        jsdfg.out_names,
-        *args,
-        **kwargs,
-    )
-
-
-@run_jax_sdfg.register(jdace.CompiledSDFG)
-def _(
     csdfg: jdace.CompiledSDFG,
     inp_names: Sequence[str],
     out_names: Sequence[str],
@@ -114,7 +90,10 @@ def _(
     *args: Any,
     **kwargs: Any,
 ) -> tuple[Any, ...] | Any:
-    """Call the compiled SDFG.
+    """Run the compiled SDFG.
+
+    The function assumes that the `(csdfg, inp_names, out_names)` together form a `FinalizedJaxprSDFG` object.
+    Further, it assumes that it was compiled according to this rule.
 
     Notes:
         This function is used for debugging purposes and you should use the `jace.jit` annotation instead.
@@ -129,7 +108,8 @@ def _(
 
     # We need the SDFG to construct/allocate the memory for the return values.
     #  Actually, we would only need the descriptors, but this is currently the only way to get them.
-    #  Note that this is safe to do, because in the compile function we decoupled the SDFG from all.
+    # Note that this is save to do, under the assumption that the SDFG, which is inside the CompiledSDFG is still accurate.
+    #  But since it is by assumption finalized we should be fine.
     sdfg: dace.SDFG = csdfg.sdfg
 
     # Build the argument list that we will pass to the compiled object.
@@ -170,3 +150,29 @@ def _(
     if len(out_names) == 1:
         return ret_val[0]
     return ret_val
+
+
+@run_jax_sdfg.register(ptrans.FinalizedJaxprSDFG)
+def _(
+    jsdfg: ptrans.FinalizedJaxprSDFG,
+    /,
+    *args: Any,
+    **kwargs: Any,
+) -> tuple[Any, ...] | Any:
+    """Execute the `FinalizedJaxprSDFG` object.
+
+    If `jsdfg` does not have an embedded `CompiledSDFG` already the function will compile it first.
+    However, it will not modify the field.
+    """
+
+    if jsdfg.csdfg is None:
+        csdfg: jdace.CompiledSDFG = compile_jax_sdfg(jsdfg, cache=False)
+    else:
+        csdfg = jsdfg.csdfg
+    return run_jax_sdfg(
+        csdfg=csdfg,
+        inp_names=jsdfg.inp_names,
+        out_names=jsdfg.out_names,
+        *args,  # noqa: B026  # star expansion.
+        **kwargs,
+    )
diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index 8b9bc38..cfaef2d 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -38,8 +38,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     B = np.full((4, 3), 10, dtype=np.float64)
 
     lowered = testee.lower(A, B)
-    optimized = lowered.optimize()
-    compiled = optimized.compile()
+    compiled = lowered.compile()
 
     ref = testee_(A, B)
     res = compiled(A, B)

From 62a324d5db7bb33e19e99324e47f8156c7b5116a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 15 May 2024 07:40:08 +0200
Subject: [PATCH 152/458] Started with a rework of yesterdays work.

But I realized that I first have to merge yesterday's modification from the PR.
---
 src/jace/translator/translated_jaxpr_sdfg.py | 80 ++++++++++----------
 1 file changed, 40 insertions(+), 40 deletions(-)

diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 369572c..e4c3ec0 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -16,7 +16,6 @@
 from jace import util
 
 
-@dataclass(slots=True)
 class TranslatedJaxprSDFG:
     """Encapsulates the result of a translation run of the `JaxprTranslationDriver` object.
 
@@ -30,26 +29,31 @@ class TranslatedJaxprSDFG:
     - `terminal_state` the last state in the state machine.
     - `inp_names` a `list` of the SDFG variables that are used as input, in the same order as `Jaxpr.invars`.
     - `out_names` a `list` of the SDFG variables that are used as output, in the same order as `Jaxpr.outvars`.
-
-    Please consider the following important points:
-    - The SDFG is in canonical form, which means that it is not directly usable, see `JaxprTranslationDriver` for more.
-    - It might be that a name appears in both the `inp_names` and `out_names` list.
-        This happens if the corresponding variable is used as both input and output.
-        In Jax this is called argument donation.
-
-    During the translation the following members are also allocated:
-    - `rev_idx` the revision index, used for name mangling.
-
-    While they remain allocated, accessing them is considered an error.
+    - `is_finalized` a bool that indicates if `self` represents a finalized or canonical SDFG, see bellow.
+    - `rev_idx` the revision index, used for name mangling, however, outside of a translation process,
+        the value carries no meaning.
+
+    Note, that it might happen that a name appears in both the `inp_names` and `out_names` lists.
+    This happens if an argument is used both as input and output, and it is not an error.
+    In Jax this is called argument donation.
+
+    If the flag `is_finalized` is `True` `self` carries a so called finalized SDFG.
+    In this case only the `sdfg`, `inp_names`, `out_names` and `is_finalized` fields remain allocated, all others are set to `None`.
+    Furthermore the SDFG is in the so called finalized form which is:
+    - All input an output arrays are marked as global.
+    - However, there are no `__return` arrays, i.e. all arguments are passed as arguments.
+    - Its `arg_names` are set with set `inp_names + out_names`, however,
+        arguments that are input and outputs are only listed as inputs.
     """
 
     sdfg: dace.SDFG
-    jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str]
-    start_state: dace.SDFGState
-    terminal_state: dace.SDFGState
     inp_names: tuple[str, ...]
     out_names: tuple[str, ...]
-    rev_idx: int
+    jax_name_map: dict[jax_core.Var | util.JaCeVar, str] | None
+    start_state: dace.SDFGState | None
+    terminal_state: dace.SDFGState | None
+    rev_idx: int | None
+    is_finalized: bool
 
     def __init__(
         self,
@@ -67,41 +71,37 @@ def __init__(
         if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
-        self.sdfg: dace.SDFG = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
-        self.start_state: dace.SDFGState = self.sdfg.add_state(
-            label="initial_state", is_start_block=True
-        )
-        self.terminal_state: dace.SDFGState = self.start_state
-        self.jax_name_map: MutableMapping[jax_core.Var | util.JaCeVar, str] = {}
-        self.inp_names: tuple[str, ...] = ()
-        self.out_names: tuple[str, ...] = ()
-        self.rev_idx: int = rev_idx
+        self.sdfg = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
+        self.start_state = self.sdfg.add_state(label="initial_state", is_start_block=True)
+        self.terminal_state = self.start_state
+        self.jax_name_map = {}
+        self.inp_names = ()
+        self.out_names = ()
+        self.rev_idx = rev_idx
+        self.is_finalized = False
 
     def validate(self) -> bool:
-        """Validate the underlying SDFG."""
+        """Validate the underlying SDFG.
 
-        # To prevent the 'non initialized' data warnings we have to temporary
-        #  promote input and output arguments to globals
-        org_trans_state: dict[str, bool] = {}
-        if not self.inp_names:
+        Only a finalized SDFG can be validated.
+        """
+        if self.is_finalized:
+            raise dace.sdfg.InvalidSDFGError(
+                "SDFG is not finalized.",
+                self.sdfg,
+                self.sdfg.node_id(self.start_state),
+            )
+        if len(self.inp_names) == 0:
             raise dace.sdfg.InvalidSDFGError(
                 "There are no input arguments.",
                 self.sdfg,
                 self.sdfg.node_id(self.start_state),
             )
-        if not self.out_names:
+        if len(self.out_names) == 0:
             raise dace.sdfg.InvalidSDFGError(
                 "There are no output arguments.",
                 self.sdfg,
                 self.sdfg.node_id(self.start_state),
             )
-        for var in set(self.inp_names + self.out_names):  # set is needed for donated args.
-            org_trans_state[var] = self.sdfg.arrays[var].transient
-            self.sdfg.arrays[var].transient = False
-
-        try:
-            self.sdfg.validate()
-        finally:
-            for var, orgValue in org_trans_state.items():
-                self.sdfg.arrays[var].transient = orgValue
+        self.sdfg.validate()
         return True

From da054b0494c9bc32b52ef313f197ab2ba504860d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 15 May 2024 11:10:26 +0200
Subject: [PATCH 153/458] Made the caching infrastructure and the whole thing a
 bit prettier.

Still not optimal, maybe a further separation, but lets see.
---
 src/jace/jax/stages/jace_compiled.py          |  11 +-
 src/jace/jax/stages/jace_lowered.py           |  55 ++++---
 src/jace/jax/stages/jace_wrapped.py           |  20 ++-
 src/jace/jax/stages/translation_cache.py      | 149 +++++++++++-------
 src/jace/optimization/__init__.py             |  34 ++--
 .../translator/jaxpr_translator_driver.py     |  38 +++--
 src/jace/translator/post_translation.py       | 119 ++++----------
 src/jace/translator/translated_jaxpr_sdfg.py  |  11 +-
 src/jace/util/compiling.py                    |  96 +++++------
 src/jace/util/jax_helper.py                   |   4 -
 tests/test_decorator.py                       |  30 ++++
 tests/test_jaxpr_translator_driver.py         |  86 +++++-----
 12 files changed, 335 insertions(+), 318 deletions(-)

diff --git a/src/jace/jax/stages/jace_compiled.py b/src/jace/jax/stages/jace_compiled.py
index 7b7e089..3f33859 100644
--- a/src/jace/jax/stages/jace_compiled.py
+++ b/src/jace/jax/stages/jace_compiled.py
@@ -26,16 +26,9 @@ class JaceCompiled(stages.Stage):
         Handle pytrees.
     """
 
-    __slots__ = (
-        "_csdfg",
-        "_inp_names",
-        "_out_names",
-    )
-
     _csdfg: jdace.CompiledSDFG  # The compiled SDFG object.
     _inp_names: tuple[str, ...]  # Name of all input arguments.
     _out_names: tuple[str, ...]  # Name of all output arguments.
-    # TODO(phimuell): Also store description of output, such that we do not have to rely on internal sdfg.
 
     def __init__(
         self,
@@ -59,6 +52,6 @@ def __call__(
             self._csdfg,
             self._inp_names,
             self._out_names,
-            *args,
-            **kwargs,
+            args,
+            kwargs,
         )
diff --git a/src/jace/jax/stages/jace_lowered.py b/src/jace/jax/stages/jace_lowered.py
index 2dae9a2..70e111e 100644
--- a/src/jace/jax/stages/jace_lowered.py
+++ b/src/jace/jax/stages/jace_lowered.py
@@ -9,37 +9,41 @@
 
 from __future__ import annotations
 
+import copy
 import json
 from typing import Any, Final
 
-from jace import optimization, util
+from jace import optimization, translator, util
 from jace.jax import stages
 from jace.jax.stages import translation_cache as tcache
-from jace.translator import post_translation as ptrans
 from jace.util import dace_helper as jdace
 
 
 class JaceLowered(stages.Stage):
     """Represents the original computation that was lowered to SDFG."""
 
-    _trans_sdfg: ptrans.FinalizedJaxprSDFG
+    # `self` assumes complete ownership of the
+    _trans_sdfg: translator.TranslatedJaxprSDFG
+
+    # Cache for the compilation. Managed by the caching infrastructure.
+    _cache: tcache.TranslationCache | None = None
 
     DEF_COMPILER_OPTIONS: Final[dict[str, Any]] = {
-        "auto_opt": True,
+        "auto_optimize": True,
         "simplify": True,
     }
 
     def __init__(
         self,
-        trans_sdfg: ptrans.FinalizedJaxprSDFG,
+        trans_sdfg: translator.TranslatedJaxprSDFG,
     ) -> None:
-        """Constructs the wrapper."""
+        """Constructs the lowered object."""
+        if not trans_sdfg.is_finalized:
+            raise ValueError("The translated SDFG must be finalized.")
         if trans_sdfg.inp_names is None:
             raise ValueError("Input names must be defined.")
         if trans_sdfg.out_names is None:
             raise ValueError("Output names must be defined.")
-        if trans_sdfg.csdfg is not None:
-            raise ValueError("SDFG is already compiled.")
         self._trans_sdfg = trans_sdfg
 
     @tcache.cached_translation
@@ -50,20 +54,28 @@ def compile(
         """Compile the SDFG.
 
         Returns an Object that encapsulates a compiled SDFG object.
-        """
-        from copy import deepcopy
+        You can pass a `dict` as argument which are passed to the `jace_optimize()` routine.
+        If you pass `None` then the default options are used.
+        To disable all optimization, pass an empty `dict`.
 
-        # The reason why we have to deepcopy the SDFG
+        Notes:
+            I am pretty sure that `None` in Jax means "use the default option".
+                See also `CachedCallDescription.make_call_description()`.
+        """
+        # We **must** deepcopy before we do any optimization.
+        #  There are many reasons for this but here are the most important ones:
         #  All optimization DaCe functions works in place, if we would not copy the SDFG first, then we would have a problem.
         #  Because, these optimization would then have a feedback of the SDFG object which is stored inside `self`.
-        #  Thus if we would run this code `(jaceLoweredObject := jaceWrappedObject.lower()).compile({opti=True})` would return an optimized object.
-        #  However, if we would now call `jaceWrappedObject.lower()` (with the same arguments as before, we would get `jaceLoweredObject`,
-        #  but it would actually contain an already optimized SDFG, which is not what we want.
-        fsdfg: ptrans.FinalizedJaxprSDFG = deepcopy(self._trans_sdfg)
-        optimization.jace_auto_optimize(
-            fsdfg, **({} if compiler_options is None else compiler_options)
+        #  Thus, if we would run this code `(jaceLoweredObject := jaceWrappedObject.lower()).compile({opti=True})` would return
+        #  an optimized object, which is what we intent to do.
+        #  However, if we would now call `jaceWrappedObject.lower()` (with the same arguments as before), we should get `jaceLoweredObject`,
+        #  since it was cached, but it would actually contain an already optimized SDFG, which is not what we want.
+        #  If you think you can remove this line then do it and run `tests/test_decorator.py::test_decorator_sharing`.
+        fsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._trans_sdfg)
+        optimization.jace_optimize(
+            fsdfg, **(self.DEF_COMPILER_OPTIONS if compiler_options is None else compiler_options)
         )
-        csdfg: jdace.CompiledSDFG = util.compile_jax_sdfg(fsdfg, cache=False)
+        csdfg: jdace.CompiledSDFG = util.compile_jax_sdfg(fsdfg)
 
         return stages.JaceCompiled(
             csdfg=csdfg,
@@ -71,7 +83,12 @@ def compile(
             out_names=fsdfg.out_names,
         )
 
-    def compiler_ir(self, dialect: str | None = None) -> ptrans.FinalizedJaxprSDFG:
+    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
+        """Returns the internal SDFG.
+
+        The function returns a `TranslatedJaxprSDFG` object.
+        It is important that modifying this object in any ways is considered an error.
+        """
         if (dialect is None) or (dialect.upper() == "SDFG"):
             return self._trans_sdfg
         raise ValueError(f"Unknown dialect '{dialect}'.")
diff --git a/src/jace/jax/stages/jace_wrapped.py b/src/jace/jax/stages/jace_wrapped.py
index 439512b..bc29f8d 100644
--- a/src/jace/jax/stages/jace_wrapped.py
+++ b/src/jace/jax/stages/jace_wrapped.py
@@ -9,8 +9,8 @@
 
 from __future__ import annotations
 
+import functools as ft
 from collections.abc import Callable
-from functools import update_wrapper
 from typing import Any
 
 import jax as jax_jax
@@ -40,6 +40,13 @@ class JaceWrapped(stages.Stage):
 
     _fun: Callable
 
+    # Managed by the caching infrastructure and only defined during `lower()`.
+    #  If defined it contains an abstract description of the function arguments.
+    _call_description: tcache.CallArgsDescription | None = None
+
+    # Cache for the lowering. Managed by the caching infrastructure.
+    _cache: tcache.TranslationCache | None = None
+
     def __init__(
         self,
         fun: Callable,
@@ -51,7 +58,7 @@ def __init__(
         # Makes that `self` is a true stand-in for `fun`
         #  This will also add a `__wrapped__` property to `self` which is not part of the interface.
         # TODO(phimuell): modify text to make it clear that it is wrapped, Jax does the same.
-        update_wrapper(self, self._fun)
+        ft.update_wrapper(self, self._fun)
 
     def __call__(
         self,
@@ -92,9 +99,6 @@ def lower(
         jaxpr = jax_jax.make_jaxpr(self._fun)(*real_args)
         driver = translator.JaxprTranslationDriver()
         trans_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
-
-        fin_sdfg: ptrans.FinalizedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
-            tsdfg=trans_sdfg, fun=self.__wrapped__
-        )
-
-        return stages.JaceLowered(fin_sdfg)
+        ptrans.postprocess_jaxpr_sdfg(tsdfg=trans_sdfg, fun=self.__wrapped__)
+        # The `JaceLowered` assumes complete ownership of `trans_sdfg`!
+        return stages.JaceLowered(trans_sdfg)
diff --git a/src/jace/jax/stages/translation_cache.py b/src/jace/jax/stages/translation_cache.py
index 11e4e13..08a4a57 100644
--- a/src/jace/jax/stages/translation_cache.py
+++ b/src/jace/jax/stages/translation_cache.py
@@ -21,7 +21,7 @@
 from collections import OrderedDict
 from collections.abc import Callable
 from dataclasses import dataclass
-from typing import Any, Protocol, runtime_checkable
+from typing import Any, Protocol, TypeAlias, runtime_checkable
 
 import dace
 from jax import core as jax_core
@@ -35,8 +35,19 @@ def cached_translation(
 ) -> Callable:
     """Decorator for making the transfer method, i.e. `JaceWrapped.lower()` and `JaceLowered.compile()` cacheable.
 
-    The cache is global and the function will add the respecifve cache object to the object upon its first call.
-    To clear the caches use the `clear_translation_cache()` function.
+    The main issue is that we can not simply cache on the actual arguments we pass to them, but on an abstract
+    (or concrete; static arguments + compiling) description on them, and this is what this decorator is for.
+    Based on its argument it will generate a key of the call, see `TranslationCache.make_key()` for more.
+    Then it will check if the result is known and if needed it will perform the actual call.
+
+    Beside this the function will two two things.
+    The first is, that it will set the `_cache` member of `self` to the associated cache.
+    Thus an annotated object need to define such a member.
+
+    The second thing it will do is optional, if the call is not cached inside the cache the wrapped function has to be run.
+    In that case the wrapper will first check if the object defines the `_call_description` member.
+    If this is the case the wrapper will set this object to an abstract description of the call, which is also used as key in the cache.
+    After the function return this member is set to `None`.
     """
 
     @ft.wraps(action)
@@ -45,16 +56,30 @@ def _action_wrapper(
         *args: Any,
         **kwargs: Any,
     ) -> stages.Stage:
-        if hasattr(self, "_cache"):
-            cache: TranslationCache = self._cache
-        else:
-            cache = _get_cache(self)
-            self._cache = cache
-        key: _CachedCall = cache.make_key(self, *args, **kwargs)
-        if cache.has(key):
-            return cache.get(key)
-        next_stage: stages.Stage = action(self, *args, **kwargs)
-        cache.add(key, next_stage)
+        # If not initialized initialize the cache.
+        if self._cache is None:
+            self._cache = _get_cache(self)
+
+        # Get the key (abstract description of the call).
+        key: CachedCallDescription = self._cache.make_key(self, *args, **kwargs)
+        if self._cache.has(key):
+            return self._cache.get(key)
+
+        # We must actually perform the call
+        wants_description: bool = hasattr(self, "_call_description")
+        try:
+            if wants_description:
+                assert (
+                    self._call_description is None
+                ), f"call description already set for `{self}` (probably another call going on?)."
+                self._call_description = key.fargs
+            next_stage: stages.Stage = action(self, *args, **kwargs)
+        finally:
+            if wants_description:
+                self._call_description = None
+
+        # Store the result.
+        self._cache.add(key, next_stage)
         return next_stage
 
     return _action_wrapper
@@ -81,7 +106,7 @@ def _get_cache(
     # Get the caches and if not present, create them.
     if not hasattr(_get_cache, "_caches"):
         _caches: dict[type[stages.Stage], TranslationCache] = {}
-        _get_cache._caches = _caches  # type: ignore[attr-defined]  # ruff removes the `getattr()` calls
+        _get_cache._caches = _caches  # type: ignore[attr-defined]
     _caches = _get_cache._caches  # type: ignore[attr-defined]
 
     if type(self) not in _caches:
@@ -99,9 +124,9 @@ class _AbstarctCallArgument:
     To construct it you should use the `from_value()` class function which interfere the characteristics from a value.
     """
 
-    shape: tuple[int, ...] | tuple[()]
+    shape: tuple[int, ...]
     dtype: dace.typeclass
-    strides: tuple[int, ...] | tuple[()] | None
+    strides: tuple[int, ...] | None
     storage: dace.StorageType
 
     @classmethod
@@ -166,70 +191,79 @@ def __eq__(self, other: Any) -> bool:
         pass
 
 
+"""This type is the abstract description of a function call.
+It is part of the key used in the cache.
+"""
+CallArgsDescription: TypeAlias = tuple[
+    _AbstarctCallArgument
+    | _ConcreteCallArgument
+    | tuple[str, _AbstarctCallArgument]
+    | tuple[str, _ConcreteCallArgument],
+    ...,
+]
+
+
 @dataclass(init=True, eq=True, frozen=True)
-class _CachedCall:
-    """Represents the structure of the entire call in the cache.
+class CachedCallDescription:
+    """Represents the structure of the entire call in the cache and used as key in the cache.
+
+    This class represents both the `JaceWrapped.lower()` and `JaceLowered.compile()` calls.
 
-    This class represents both the `JaceWrapped.lower()` and `JaceLowered.compile()` call.
-    The key combines the "origin of the call", i.e. `self` and the call arguments.
+    The actual key is composed of two parts, first the "origin of the call".
+    For the `JaceWrapped` this includes the wrapped callable, while for `JaceLowered` the lowered SDFG is used.
+    In both cases we rely on their `__hash__()` and `__eq__()` implementation, which should only involve the address.
+    Since we do not allow in place modification, this is not a problem, especially for the lowering.
 
-    Arguments are represented in two ways:
+    The second part is of the key are a description of the actual arguments, see `CallArgsDescription` type alias.
+    There are two ways for describing the arguments:
     - `_AbstarctCallArgument`: Which encode only the structure of the arguments.
         These are essentially the tracer used by Jax.
     - `_ConcreteCallArgument`: Which represents actual values of the call.
         These are either the static arguments or compile options.
 
-    Depending of the origin the call, the key used for caching is different.
-    For `JaceWrapped` only the wrapped callable is included in the cache.
+    While `JaceWrapped.lower()` uses both, `JaceLowered.compile()` will only use concrete arguments.
+    In addition an argument can be positional or a named argument,
+    in which case it consists of a `tuple[str, _AbstarctCallArgument  | _ConcreteCallArgument]`.
 
-    For the `JaceLowered` the SDFG is used as key, however, in a very special way.
-    `dace.SDFG` does not define `__hash__()` or `__eq__()` thus these operations fall back to `object`.
-    However, an SDFG defines the `hash_sdfg()` function, which generates a hash based on the structure of the SDFG.
-    We use the SDFG because we want to cache on it, but since it is not immutable, we have to account for that, by including this structural hash.
-    This is not ideal but it should work in the beginning.
+    Todo:
+        - pytrees.
     """
 
     fun: Callable | None
     sdfg: dace.SDFG | None
-    sdfg_hash: int | None
-    fargs: tuple[
-        _AbstarctCallArgument
-        | _ConcreteCallArgument
-        | tuple[str, _AbstarctCallArgument]
-        | tuple[str, _ConcreteCallArgument],
-        ...,
-    ]
+    fargs: CallArgsDescription
 
     @classmethod
-    def make_key(
+    def make_call_description(
         cls,
         stage: stages.Stage,
         *args: Any,
         **kwargs: Any,
-    ) -> _CachedCall:
-        """Creates a cache key for the stage object `stage` that was called to advance to the next stage."""
+    ) -> CachedCallDescription:
+        """Creates an abstract description of the call."""
 
         if isinstance(stage, stages.JaceWrapped):
             # JaceWrapped.lower() to JaceLowered
-            #   Currently we only allow positional arguments and no static arguments.
-            #   Thus the function argument part of the key only consists of abstract arguments.
-            if len(kwargs) != 0:
-                raise NotImplementedError("'kwargs' are not implemented in 'JaceWrapped.lower()'.")
             fun = stage.__wrapped__
             sdfg = None
-            sdfg_hash = None
+
+            if len(kwargs) != 0:
+                raise NotImplementedError("'kwargs' are not implemented in 'JaceWrapped.lower()'.")
+
+            # Currently we only allow positional arguments and no static arguments.
+            #   Thus the function argument part of the key only consists of abstract arguments.
             fargs: tuple[_AbstarctCallArgument, ...] = tuple(
                 _AbstarctCallArgument.from_value(x) for x in args
             )
 
         elif isinstance(stage, stages.JaceLowered):
             # JaceLowered.compile() to JaceCompiled
-            #   We only accepts compiler options, which the Jax interface mandates
-            #   are inside a `dict` thus we will get at most one argument.
+            #  We do not have to deepcopy the sdfg, since we assume immutability.
             fun = None
             sdfg = stage.compiler_ir().sdfg
-            sdfg_hash = int(sdfg.hash_sdfg(), 16)
 
+            #   We only accepts compiler options, which the Jax interface mandates
+            #   are inside a `dict` thus we will get at most one argument.
             if len(kwargs) != 0:
                 raise ValueError(
                     "All arguments to 'JaceLowered.compile()' must be inside a 'dict'."
@@ -237,7 +271,8 @@ def make_key(
             if len(args) >= 2:
                 raise ValueError("Only a 'dict' is allowed as argument to 'JaceLowered.compile()'.")
             if (len(args) == 0) or (args[0] is None):
-                # No compiler options where specified, so we use the default ones.
+                # Currently we consider no argument and `None` as "use the default argument".
+                #  This should be in accordance with Jax. See also `JaceLowered.compile()`.
                 comp_ops: stages.CompilerOptions = stages.JaceLowered.DEF_COMPILER_OPTIONS
             else:
                 # Compiler options where given.
@@ -260,7 +295,7 @@ def make_key(
         else:
             raise TypeError(f"Can not make key from '{type(stage).__name__}'.")
 
-        return cls(fun=fun, sdfg=sdfg, sdfg_hash=sdfg_hash, fargs=fargs)
+        return cls(fun=fun, sdfg=sdfg, fargs=fargs)
 
 
 class TranslationCache:
@@ -276,7 +311,7 @@ class TranslationCache:
 
     __slots__ = ["_memory", "_size"]
 
-    _memory: OrderedDict[_CachedCall, stages.Stage]
+    _memory: OrderedDict[CachedCallDescription, stages.Stage]
     _size: int
 
     def __init__(
@@ -286,7 +321,7 @@ def __init__(
         """Creates a cache instance of size `size`."""
         if size <= 0:
             raise ValueError(f"Invalid cache size of '{size}'")
-        self._memory: OrderedDict[_CachedCall, stages.Stage] = OrderedDict()
+        self._memory: OrderedDict[CachedCallDescription, stages.Stage] = OrderedDict()
         self._size = size
 
     @staticmethod
@@ -294,13 +329,13 @@ def make_key(
         stage: stages.Stage,
         *args: Any,
         **kwargs: Any,
-    ) -> _CachedCall:
+    ) -> CachedCallDescription:
         """Create a key object for `stage`."""
-        return _CachedCall.make_key(stage, *args, **kwargs)
+        return CachedCallDescription.make_call_description(stage, *args, **kwargs)
 
     def has(
         self,
-        key: _CachedCall,
+        key: CachedCallDescription,
     ) -> bool:
         """Check if `self` have a record of `key`.
 
@@ -312,7 +347,7 @@ def has(
 
     def get(
         self,
-        key: _CachedCall,
+        key: CachedCallDescription,
     ) -> stages.Stage:
         """Get the next stage associated with `key`.
 
@@ -327,7 +362,7 @@ def get(
 
     def add(
         self,
-        key: _CachedCall,
+        key: CachedCallDescription,
         res: stages.Stage,
     ) -> TranslationCache:
         """Adds `res` under `key` to `self`.
@@ -349,7 +384,7 @@ def add(
 
     def _evict(
         self,
-        key: _CachedCall | None,
+        key: CachedCallDescription | None,
     ) -> bool:
         """Evict `key` from `self` and return `True`.
 
diff --git a/src/jace/optimization/__init__.py b/src/jace/optimization/__init__.py
index 511d446..f841b62 100644
--- a/src/jace/optimization/__init__.py
+++ b/src/jace/optimization/__init__.py
@@ -12,26 +12,38 @@
 
 from __future__ import annotations
 
-import dace
+from jace import translator
 
-from jace.translator import post_translation as ptrans
 
-
-def jace_auto_optimize(
-    fsdfg: ptrans.FinalizedJaxprSDFG,
-    simplify: bool = True,
+def jace_optimize(
+    tsdfg: translator.TranslatedJaxprSDFG,
+    simplify: bool = False,
+    auto_optimize: bool = False,
     **kwargs: str | bool,  # noqa: ARG001  # Unused argument, for now
-) -> dace.SDFG:
-    """Performs optimization of the `fsdfg` _inplace_ and returns it.
+) -> None:
+    """Performs optimization of the `fsdfg` _inplace_.
 
     Currently this function only supports simplification.
     Its main job is to exists that we have something that we can call in the tool chain.
+
+    Args:
+        simplify:       Run the simplification pilepline.
+        auto_optimize:  Run the auto optimization pipeline (currently does nothing)
+
+    Notes:
+        All optimization flags must be disabled by default!
+            The reason for this is that `jaceLowered.compile({})` will disable all optimizations.
     """
+    if not tsdfg.is_finalized:
+        raise ValueError("Can only optimize finalized SDFGs.")
+
     if simplify:
-        fsdfg.sdfg.simplify()
+        tsdfg.sdfg.simplify()
+
+    if auto_optimize:
+        pass
 
-    fsdfg.validate()
-    return fsdfg
+    tsdfg.validate()
 
 
 __all__ = [
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 1a821f1..92fda72 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -9,7 +9,7 @@
 
 import itertools
 from collections.abc import Iterable, Mapping, MutableSequence, Sequence
-from typing import Any, Final, cast, overload, Literal
+from typing import Any, Final, Literal, cast, overload
 
 import dace
 import jax
@@ -259,8 +259,8 @@ def map_jax_var_to_sdfg(
         """
         if isinstance(jax_var, jax_core.Literal):
             raise RuntimeError("There is no SDFG variable for literal '{jax_var}'.")
-        if jax_var in self._ctx.jax_name_map:
-            sdfg_name = self._ctx.jax_name_map[jax_var]
+        if jax_var in self._jax_name_map:
+            sdfg_name = self._jax_name_map[jax_var]
         elif allow_fail:
             return None
         else:
@@ -288,7 +288,7 @@ def terminal_sdfg_state(self) -> dace.SDFGState:
         New states are appended at the current terminal/end state and becoming the new terminal state.
         This function returns the current terminal state.
         """
-        return self._ctx.terminal_state
+        return cast(dace.SDFGState, self._ctx.terminal_state)
 
     def is_allocated(self) -> bool:
         """Tests if `self` has an allocated context.
@@ -315,7 +315,7 @@ def rev_idx(self) -> int:
         """Returns the revision index of `self`."""
         if not self.is_allocated():
             raise RuntimeError("Driver is not allocated.")
-        return self._ctx.rev_idx
+        return cast(int, self._ctx.rev_idx)
 
     def add_jax_name_mapping(
         self,
@@ -335,8 +335,8 @@ def add_jax_name_mapping(
         """
         assert isinstance(sdfg_name, str) and (len(sdfg_name) > 0)  # noqa: PT018  # Should be one assertion.
 
-        if jax_var in self._ctx.jax_name_map:
-            if self._ctx.jax_name_map[jax_var] == sdfg_name:  # noops.
+        if jax_var in self._jax_name_map:
+            if self._jax_name_map[jax_var] == sdfg_name:  # noops.
                 return self
             raise ValueError(
                 f"Tried to create the mapping '{jax_var} -> {sdfg_name}', but '{jax_var}'"
@@ -347,7 +347,7 @@ def add_jax_name_mapping(
         if sdfg_name in self._forbidden_names:
             raise NameError(f"Mapping '{jax_var} -> {sdfg_name}': Forbidden name.")
 
-        self._ctx.jax_name_map[jax_var] = sdfg_name
+        self._jax_name_map[jax_var] = sdfg_name
         return self
 
     def add_reserved_names(
@@ -449,7 +449,7 @@ def add_array(
             if find_new_name:
                 raise ValueError("Specified `force_jax_name` but also wanted a new name.")
             find_new_name = False
-            alt_name = util.propose_jax_name(arg, self._ctx.jax_name_map)
+            alt_name = util.propose_jax_name(arg, self._jax_name_map)
         if alt_name is not None:
             assert isinstance(alt_name, str)
             find_new_name = False  # If a name was given, then use it no matter what.
@@ -459,7 +459,7 @@ def add_array(
                 raise ValueError("'alt_name' is a forbidden name.")
             if not util.VALID_SDFG_VAR_NAME.fullmatch(alt_name):
                 raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
-            if update_var_mapping and arg in self._ctx.jax_name_map:
+            if update_var_mapping and arg in self._jax_name_map:
                 raise ValueError(f"Variable '{alt_name}' already registered.")
             if alt_name in self._ctx.sdfg.arrays:
                 raise ValueError(f"Variable '{alt_name}' already exists.")
@@ -489,7 +489,7 @@ def add_array(
         if alt_name is not None:
             prop_name = alt_name  # Just for completion: will be ignored later
         elif isinstance(arg, (jax_core.Var, util.JaCeVar)):
-            prop_name = util.propose_jax_name(arg, self._ctx.jax_name_map)
+            prop_name = util.propose_jax_name(arg, self._jax_name_map)
             assert not prop_name.startswith("__")
             if name_prefix is not None:
                 prop_name = name_prefix + prop_name
@@ -1006,9 +1006,9 @@ def _handle_null_jaxpr(
             out_var_names.append(sdfg_out_name)
 
             # Now we perform the copy from the input variable in the newly created output variable.
-            inp_acc = self._ctx.start_state.add_read(sdfg_in_name)
-            out_acc = self._ctx.start_state.add_write(sdfg_out_name)
-            self._ctx.start_state.add_nedge(
+            inp_acc = self._start_state.add_read(sdfg_in_name)
+            out_acc = self._start_state.add_write(sdfg_out_name)
+            self._start_state.add_nedge(
                 src=inp_acc,
                 dst=out_acc,
                 data=dace.Memlet.from_array(
@@ -1021,10 +1021,18 @@ def _handle_null_jaxpr(
             #  But we can not add this to the mapping, because of this situation we will now remove
             #  the variable from the mapping. I am open for different approaches.
             #  Note that input variables that are not used, will remain in the mapping.
-            self._ctx.jax_name_map.pop(jax_out_var)
+            self._jax_name_map.pop(jax_out_var)
 
         return tuple(out_var_names)
 
+    @property
+    def _jax_name_map(self) -> dict[jax_core.Var | util.JaCeVar, str]:
+        return cast(dict[jax_core.Var | util.JaCeVar, str], self._ctx.jax_name_map)
+
+    @property
+    def _start_state(self) -> dace.SDFGState:
+        return cast(dace.SDFGState, self._ctx.start_state)
+
     # fmt: off
     _forbidden_names: Final[set[str]] = {
         # These should be most of the C++ keywords, it is more important to have the short ones.
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index c0b3ab8..a32c05f 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -13,126 +13,65 @@
 from __future__ import annotations
 
 from collections.abc import Callable
-from dataclasses import dataclass
-
-import dace
 
 from jace import translator
-from jace.util import dace_helper as jdace
 
 
 def postprocess_jaxpr_sdfg(
     tsdfg: translator.TranslatedJaxprSDFG,
     fun: Callable,  # noqa: ARG001  # Currently unused
-) -> FinalizedJaxprSDFG:
-    """Perform the final postprocessing step on the SDFG and returns a finalized version.
+) -> None:
+    """Perform the final post processing steps on the SDFG in place.
+
+    Afterwards `tsdfg` will be finalized.
 
-    The function will not modify the passed `tsdfg` object (`TranslatedJaxprSDFG`).
-    The returned object is of type `FinalizedJaxprSDFG` and is decoupled from the input,
-    such that there is no feedback.
+    TBA, summary:
+    - Setting correct inputs (names + strides)
+    - Setting outputs (in case of donation).
 
     Args:
         tsdfg:  The translated SDFG object.
         fun:    The original function that we translated.
     """
     # Currently we do nothing except finalizing.
-    return finalize_jaxpr_sdfg(tsdfg)
+    finalize_jaxpr_sdfg(tsdfg)
 
 
 def finalize_jaxpr_sdfg(
-    trans_sdfg: translator.TranslatedJaxprSDFG,
-) -> FinalizedJaxprSDFG:
-    """Finalizes the supplied `trans_sdfg` object.
-
-    The returned object is guaranteed to be decoupled from the supplied `TranslatedJaxprSDFG`.
-    You should use this function after you have performed all necessary postprocessing for which you need the meta data of the translation.
-    The returned object is meant as input for jace's optimization pipeline.
-
-    Note:
-        For several reasons this function performs a deep copy of the associated SDFG.
-            The enter toolchain assumes and relies on this fact.
-    """
-    # Check if the outputs are defined.
-    if trans_sdfg.inp_names is None:
+    tsdfg: translator.TranslatedJaxprSDFG,
+) -> None:
+    """Finalizes the supplied `tsdfg` object in place."""
+    if tsdfg.is_finalized:
+        raise ValueError("The supplied SDFG is already finalized.")
+    if not tsdfg.inp_names:
         raise ValueError("Input names are not specified.")
-    if trans_sdfg.out_names is None:
+    if not tsdfg.out_names:
         raise ValueError("Output names are not specified.")
 
     # We do not support the return value mechanism that dace provides us.
     #  The reasons for that are that the return values are always shared and the working with pytrees is not yet understood.
     #  Thus we make the safe choice by passing all as arguments.
-    assert not any(
+    if any(
         arrname.startswith("__return")
-        for arrname in trans_sdfg.sdfg.arrays.keys()  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
-    ), "Only support SDFGs without '__return' members."
-
-    # We perform a deepcopy by serializing it, as deepcopy is known for having some issues.
-    sdfg = dace.SDFG.from_json(trans_sdfg.sdfg.to_json())
-    inp_names = trans_sdfg.inp_names
-    out_names = trans_sdfg.out_names
+        for arrname in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
+    ):
+        raise ValueError("Only support SDFGs without '__return' members.")
 
     # Canonical SDFGs do not have global memory, so we must transform it
     sdfg_arg_names: list[str] = []
-    for glob_name in inp_names + out_names:
+    for glob_name in tsdfg.inp_names + tsdfg.out_names:
         if glob_name in sdfg_arg_names:  # Donated arguments
             continue
-        sdfg.arrays[glob_name].transient = False
+        tsdfg.sdfg.arrays[glob_name].transient = False
         sdfg_arg_names.append(glob_name)
 
     # This forces the signature of the SDFG to include all arguments in order they appear.
     #  If an argument is reused (donated) then it is only listed once, the first time it appears
-    sdfg.arg_names = sdfg_arg_names
-
-    return FinalizedJaxprSDFG(sdfg=sdfg, inp_names=inp_names, out_names=out_names)
-
-
-@dataclass(init=True, eq=False, frozen=False)
-class FinalizedJaxprSDFG:
-    """This is the final stage of the post processing of the translation.
-
-    Instances of these class only contains enough information to run, but all other meta data associated to tarnslation are lost.
-    The idea of this class is that they can be feed to the optimization pipeline of Jace.
-    The SDFG that is inside `self` my not be optimized, but input and outputs are marked as global and they have a valid `arg_names` property.
-
-    SDFG encapsulated in `TranslatedJaxprSDFG` is in canonical form, which is not usable, finalized SDFGs are always valid.
-    They have:
-    - All input an output arrays are marked as global.
-    - It does not have `__return` values, i.e. all arguments are passed as arguments.
-    - Its `arg_names` are set with set `inp_names + out_names`, however,
-        arguments that are input and outputs are only listed as inputs.
-
-    Notes:
-        The main reason this class exists is, because optimizations are done in the `JaceLowered.compile()` function.
-            All DaCe functions in that regards are in place, if we would not copy the SDFG first, then we would have a problem.
-            Because these optimization would then have a feedback of the SDFG object which is stored in one way or the other
-            inside the `JaceLowered` object, which is wrong because `jaceLoweredObject.compile(no_opti=False)` and
-            `jaceLoweredObject.compile(no_opti=True)` will result in different objects but the SDFG is the same one, i.e. the optimized one.
-            It also makes sense, to remove all the unnecessary stuff that is part of the `TranslatedJaxprSDFG` but does not serve any purpose
-            inside the optimization pipeline.
-    """
-
-    sdfg: dace.SDFG
-    inp_names: tuple[str, ...]
-    out_names: tuple[str, ...]
-    csdfg: jdace.CompiledSDFG | None = None
-
-    def __post_init__(self) -> None:
-        self.validate()
-
-    def validate(self) -> bool:
-        """Checks if the embedded SDFG is valid."""
-        if any(arrname.startswith("__return") for arrname in self.sdfg.arrays.keys()):  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
-            raise dace.sdfg.InvalidSDFGError(
-                "There are no output arguments.",
-                self.sdfg,
-                self.sdfg.node_id(self.sdfg.start_state),
-            )
-        for glob_name in self.inp_names + self.out_names:
-            if self.sdfg.arrays[glob_name].transient:
-                raise dace.sdfg.InvalidSDFGError(
-                    f"Argument '{glob_name}' is a transient.",
-                    self.sdfg,
-                    self.sdfg.node_id(self.sdfg.start_state),
-                )
-        self.sdfg.validate()
-        return True
+    tsdfg.sdfg.arg_names = sdfg_arg_names
+
+    # Now we will deallocate the fields and mark `self` as finalized.
+    tsdfg.jax_name_map = None
+    tsdfg.start_state = None
+    tsdfg.terminal_state = None
+    tsdfg.rev_idx = None
+    tsdfg.is_finalized = True
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index e4c3ec0..770ee0d 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -7,9 +7,6 @@
 
 from __future__ import annotations
 
-from collections.abc import MutableMapping
-from dataclasses import dataclass
-
 import dace
 from jax import core as jax_core
 
@@ -29,7 +26,7 @@ class TranslatedJaxprSDFG:
     - `terminal_state` the last state in the state machine.
     - `inp_names` a `list` of the SDFG variables that are used as input, in the same order as `Jaxpr.invars`.
     - `out_names` a `list` of the SDFG variables that are used as output, in the same order as `Jaxpr.outvars`.
-    - `is_finalized` a bool that indicates if `self` represents a finalized or canonical SDFG, see bellow.
+    - `is_finalized` a bool that indicates if `self` represents a finalized or canonical SDFG, see below.
     - `rev_idx` the revision index, used for name mangling, however, outside of a translation process,
         the value carries no meaning.
 
@@ -85,17 +82,17 @@ def validate(self) -> bool:
 
         Only a finalized SDFG can be validated.
         """
-        if self.is_finalized:
+        if not self.is_finalized:
             raise dace.sdfg.InvalidSDFGError(
                 "SDFG is not finalized.",
                 self.sdfg,
-                self.sdfg.node_id(self.start_state),
+                self.sdfg.node_id(self.sdfg.start_state),
             )
         if len(self.inp_names) == 0:
             raise dace.sdfg.InvalidSDFGError(
                 "There are no input arguments.",
                 self.sdfg,
-                self.sdfg.node_id(self.start_state),
+                self.sdfg.node_id(self.sdfg.start_state),
             )
         if len(self.out_names) == 0:
             raise dace.sdfg.InvalidSDFGError(
diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index 8cfcdef..f5daa71 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -12,47 +12,42 @@
 
 from __future__ import annotations
 
-from collections.abc import Sequence
-from functools import singledispatch
+import functools as ft
+import time
+from collections.abc import Mapping, Sequence
 from typing import Any
 
 import dace
 
-from jace.translator import post_translation as ptrans
+from jace import translator
 from jace.util import dace_helper as jdace
 
 
 def compile_jax_sdfg(
-    jsdfg: ptrans.FinalizedJaxprSDFG,
-    cache: bool = True,
+    tsdfg: translator.TranslatedJaxprSDFG,
 ) -> jdace.CompiledSDFG:
-    """This function compiles the sdfg embedded in the `FinalizedJaxpr` object and returns it.
-
-    By default the function will store the resulting `CompiledSDFG` object inside `jsdfg` (`FinalizedJaxprSDFG`).
-    However, by setting `cache` to `False` the respective field will not be modified.
+    """This function compiles the SDFG embedded in the embedded `tsdfg` (`TranslatedJaxprSDFG`).
 
     Notes:
         Currently the SDFG must not have any undefined symbols, i.e. no undefined sizes.
     """
-    from time import time
-
-    if not jsdfg.inp_names:
+    if not tsdfg.is_finalized:
+        raise ValueError("Can only compile a finalized SDFG.")
+    if not tsdfg.inp_names:
         raise ValueError("The passed SDFG did not had any input arguments.")
-    if not jsdfg.out_names:
+    if not tsdfg.out_names:
         raise ValueError("The passed SDFG did not had any output arguments.")
-    if any(out_name.startswith("__return") for out_name in jsdfg.out_names):
-        raise NotImplementedError("No return statement is supported yet.")
 
     # This is a simplification that makes our life simply.
     #  However, we should consider lifting it at some point.
-    if len(jsdfg.sdfg.free_symbols) != 0:
+    if len(tsdfg.sdfg.free_symbols) != 0:
         raise ValueError(
-            f"No externally defined symbols are allowed, found: {jsdfg.sdfg.free_symbols}"
+            f"No externally defined symbols are allowed, found: {tsdfg.sdfg.free_symbols}"
         )
 
     # To ensure that the SDFG is compiled and to get rid of a warning we must modify
     #  some settings of the SDFG. To fake an immutable SDFG, we will restore them later.
-    sdfg: dace.SDFG = jsdfg.sdfg
+    sdfg: dace.SDFG = tsdfg.sdfg
     org_sdfg_name: str = sdfg.name
     org_recompile: bool = sdfg._recompile
     org_regenerate_code: bool = sdfg._regenerate_code
@@ -60,7 +55,7 @@ def compile_jax_sdfg(
     try:
         # We need to give the SDFG another name, this is needed to prevent a DaCe error/warning.
         #  This happens if we compile the same lowered SDFG multiple times with different options.
-        sdfg.name = f"{sdfg.name}__comp_{int(time() * 1000)}"
+        sdfg.name = f"{sdfg.name}__comp_{int(time.time() * 1000)}"
 
         # Actual compiling the stuff; forcing that a recompilation happens
         with dace.config.temporary_config():
@@ -74,47 +69,48 @@ def compile_jax_sdfg(
         sdfg._recompile = org_recompile
         sdfg._regenerate_code = org_regenerate_code
 
-    # Storing the compiled SDFG for later use.
-    if cache:
-        jsdfg.csdfg = csdfg
-
     return csdfg
 
 
-@singledispatch
+@ft.singledispatch
 def run_jax_sdfg(
     csdfg: jdace.CompiledSDFG,
     inp_names: Sequence[str],
     out_names: Sequence[str],
-    /,
-    *args: Any,
-    **kwargs: Any,
+    cargs: Sequence[Any],
+    ckwargs: Mapping[str, Any],
 ) -> tuple[Any, ...] | Any:
     """Run the compiled SDFG.
 
-    The function assumes that the `(csdfg, inp_names, out_names)` together form a `FinalizedJaxprSDFG` object.
-    Further, it assumes that it was compiled according to this rule.
+    The function assumes that the SDFG was finalized and then compiled by `compile_jax_sdfg()`.
+
+    Args:
+        csdfg:      The `CompiledSDFG` object.
+        inp_names:  List of names of the input arguments.
+        out_names:  List of names of the output arguments.
+        cargs:      All positional arguments of the call.
+        ckwargs:    All keyword arguments of the call.
 
     Notes:
-        This function is used for debugging purposes and you should use the `jace.jit` annotation instead.
-        The function assumes that the SDFG was compiled in accordance with `compile_jax_sdfg()`
+        There is no pytree mechanism jet, thus the return values are returned inside a `tuple`
+            or in case of one value, directly, in the order determined by Jax.
     """
     from dace.data import Array, Data, Scalar, make_array_from_descriptor
 
-    if len(inp_names) != len(args):
+    if len(inp_names) != len(cargs):
         raise RuntimeError("Wrong number of arguments.")
-    if len(kwargs) != 0:
+    if len(ckwargs) != 0:
         raise NotImplementedError("No kwargs are supported yet.")
 
     # We need the SDFG to construct/allocate the memory for the return values.
     #  Actually, we would only need the descriptors, but this is currently the only way to get them.
-    # Note that this is save to do, under the assumption that the SDFG, which is inside the CompiledSDFG is still accurate.
-    #  But since it is by assumption finalized we should be fine.
+    #  As far as I know the dace performs a deepcopy before compilation, thus it should be safe.
+    #  However, regardless of this this also works if we are inside the stages, which have exclusive ownership.
     sdfg: dace.SDFG = csdfg.sdfg
 
     # Build the argument list that we will pass to the compiled object.
     call_args: dict[str, Any] = {}
-    for in_name, in_val in zip(inp_names, args, strict=True):
+    for in_name, in_val in zip(inp_names, cargs, strict=True):
         call_args[in_name] = in_val
     for out_name in out_names:
         assert not ((out_name == "__return") or (out_name.startswith("__return_")))  # noqa: PT018 # Assert split
@@ -152,27 +148,21 @@ def run_jax_sdfg(
     return ret_val
 
 
-@run_jax_sdfg.register(ptrans.FinalizedJaxprSDFG)
+@run_jax_sdfg.register(translator.TranslatedJaxprSDFG)
 def _(
-    jsdfg: ptrans.FinalizedJaxprSDFG,
-    /,
-    *args: Any,
-    **kwargs: Any,
+    tsdfg: translator.TranslatedJaxprSDFG,
+    cargs: Sequence[Any],
+    ckwargs: Mapping[str, Any],
 ) -> tuple[Any, ...] | Any:
-    """Execute the `FinalizedJaxprSDFG` object.
+    """Execute the `TranslatedJaxprSDFG` object directly.
 
-    If `jsdfg` does not have an embedded `CompiledSDFG` already the function will compile it first.
-    However, it will not modify the field.
+    This function is a convenience function provided for debugging.
     """
-
-    if jsdfg.csdfg is None:
-        csdfg: jdace.CompiledSDFG = compile_jax_sdfg(jsdfg, cache=False)
-    else:
-        csdfg = jsdfg.csdfg
+    csdfg: jdace.CompiledSDFG = compile_jax_sdfg(tsdfg)
     return run_jax_sdfg(
         csdfg=csdfg,
-        inp_names=jsdfg.inp_names,
-        out_names=jsdfg.out_names,
-        *args,  # noqa: B026  # star expansion.
-        **kwargs,
+        inp_names=tsdfg.inp_names,
+        out_names=tsdfg.out_names,
+        cargs=cargs,
+        ckwargs=ckwargs,
     )
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index e586526..37f06ad 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -126,11 +126,7 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar | str) -> str:
 
 
 @overload
-<<<<<<< HEAD
-def get_jax_var_shape(jax_var: JaCeVar) -> tuple[int | dace.symbol | str, ...] | tuple[()]: ...  # type: ignore[overload-overlap]
-=======
 def get_jax_var_shape(jax_var: JaCeVar) -> tuple[int | dace.symbol | str, ...]: ...  # type: ignore[overload-overlap]
->>>>>>> initial_implementation
 
 
 @overload
diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index cfaef2d..00b494b 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -114,3 +114,33 @@ def testee2_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     assert compiled2 is lowered1_size1.compile({"dummy_option": True})
     assert compiled2 is not lowered1_size1.compile({"dummy_option": False})
     assert compiled2 is lowered1_size1.compile({"dummy_option": True})
+
+
+def test_decorator_sharing():
+    """Tests if there is no false sharing in the cache."""
+    jax.config.update("jax_enable_x64", True)
+
+    @jace.jit
+    def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        C = A * B
+        D = C + A
+        E = D + B  # Just enough state.
+        return A + B + C + D + E
+
+    # These are the argument
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    # Now we lower it.
+    jaceLowered = jaceWrapped.lower(A, B)
+
+    # Now we compile it with enabled optimization.
+    optiCompiled = jaceLowered.compile({"auto_optimize": True, "simplify": True})
+
+    # Now we compile it without any optimization.
+    unoptiCompiled = jaceLowered.compile({})
+
+    # Because of the way how things work the optimized must have more than the unoptimized.
+    #  If there is sharing, then this would not be the case.
+    assert optiCompiled._csdfg.sdfg.number_of_nodes() == 1
+    assert optiCompiled._csdfg.sdfg.number_of_nodes() < unoptiCompiled._csdfg.sdfg.number_of_nodes()
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 16cdfe3..e52873e 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -78,7 +78,7 @@ def test_driver_nested() -> None:
     assert driver._ctx is driver._ctx_stack[-1]
     assert driver._ctx is not driver._ctx_stack[0]
 
-    assert org_ctx.rev_idx < driver._ctx.rev_idx
+    assert org_ctx.rev_idx < driver.rev_idx  # type: ignore[operator]  # Type confusion
 
     # Now we go back one state, i.e. pretend that we are done with translating the nested jaxpr.
     driver._clear_translation_ctx()
@@ -92,43 +92,43 @@ def test_driver_nested() -> None:
     assert driver._reserved_names is None
 
 
-def test_driver_append_state(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
+def test_driver_append_state(translation_driver: jtrans.JaxprTranslationDriver) -> None:
     """Tests the functionality of appending states."""
-    sdfg: dace.SDFG = alloc_driver.sdfg
+    sdfg: dace.SDFG = translation_driver.sdfg
 
-    terminal_state_1: dace.SDFGState = alloc_driver.append_new_state("terminal_state_1")
+    terminal_state_1: dace.SDFGState = translation_driver.append_new_state("terminal_state_1")
     assert sdfg.number_of_nodes() == 2
     assert sdfg.number_of_edges() == 1
-    assert terminal_state_1 is alloc_driver.terminal_sdfg_state
-    assert alloc_driver.terminal_sdfg_state is alloc_driver._ctx.terminal_state
-    assert alloc_driver._ctx.start_state is sdfg.start_block
-    assert alloc_driver._ctx.start_state is not terminal_state_1
+    assert terminal_state_1 is translation_driver.terminal_sdfg_state
+    assert translation_driver.terminal_sdfg_state is translation_driver._ctx.terminal_state
+    assert translation_driver._ctx.start_state is sdfg.start_block
+    assert translation_driver._ctx.start_state is not terminal_state_1
     assert next(iter(sdfg.edges())).src is sdfg.start_block
     assert next(iter(sdfg.edges())).dst is terminal_state_1
 
     # Specifying an explicit append state that is the terminal should also update the terminal state of the driver.
-    terminal_state_2: dace.SDFGState = alloc_driver.append_new_state(
+    terminal_state_2: dace.SDFGState = translation_driver.append_new_state(
         "terminal_state_2", prev_state=terminal_state_1
     )
     assert sdfg.number_of_nodes() == 3
     assert sdfg.number_of_edges() == 2
-    assert terminal_state_2 is alloc_driver.terminal_sdfg_state
+    assert terminal_state_2 is translation_driver.terminal_sdfg_state
     assert sdfg.out_degree(terminal_state_1) == 1
     assert sdfg.out_degree(terminal_state_2) == 0
     assert sdfg.in_degree(terminal_state_2) == 1
     assert next(iter(sdfg.in_edges(terminal_state_2))).src is terminal_state_1
 
     # Specifying a previous node that is not the terminal state should not do anything.
-    non_terminal_state: dace.SDFGState = alloc_driver.append_new_state(
+    non_terminal_state: dace.SDFGState = translation_driver.append_new_state(
         "non_terminal_state", prev_state=terminal_state_1
     )
-    assert alloc_driver.terminal_sdfg_state is not non_terminal_state
+    assert translation_driver.terminal_sdfg_state is not non_terminal_state
     assert sdfg.in_degree(non_terminal_state) == 1
     assert sdfg.out_degree(non_terminal_state) == 0
     assert next(iter(sdfg.in_edges(non_terminal_state))).src is terminal_state_1
 
 
-def test_driver_scalar(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
+def test_driver_scalar(translation_driver: jtrans.JaxprTranslationDriver) -> None:
     """This function tests the array creation routines, especially the scalar part.
 
     However, it does so without using Jax variables.
@@ -137,24 +137,24 @@ def test_driver_scalar(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
 
     # Creating a scalar.
     scal1_j = JaCeVar("scal1", (), dace.float64)
-    scal1_: str = alloc_driver.add_array(
+    scal1_: str = translation_driver.add_array(
         arg=scal1_j,
         update_var_mapping=True,
     )
-    scal1: Data = alloc_driver.get_array(scal1_)
-    assert scal1 is alloc_driver.get_array(scal1_j)
-    assert scal1_ == alloc_driver.map_jax_var_to_sdfg(scal1_j)
+    scal1: Data = translation_driver.get_array(scal1_)
+    assert scal1 is translation_driver.get_array(scal1_j)
+    assert scal1_ == translation_driver.map_jax_var_to_sdfg(scal1_j)
     assert isinstance(scal1, Scalar)
     assert scal1_ == scal1_j.name
     assert scal1.dtype == scal1_j.dtype
 
     # Create a scalar and force it as an array
     scal2_j = JaCeVar("scal2", (), dace.int64)
-    scal2_: str = alloc_driver.add_array(
+    scal2_: str = translation_driver.add_array(
         arg=scal2_j,
         force_array=True,
     )
-    scal2: Data = alloc_driver.get_array(scal2_)
+    scal2: Data = translation_driver.get_array(scal2_)
     assert isinstance(scal2, Array)
     assert scal2_ == scal2_j.name
     assert scal2.shape == (1,)
@@ -164,13 +164,13 @@ def test_driver_scalar(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
     # Using a special name for the variable
     scal3_j = JaCeVar("scal3", (), dace.int64)
     scal3_n = "scal3_special_name"
-    scal3_: str = alloc_driver.add_array(
+    scal3_: str = translation_driver.add_array(
         arg=scal3_j,
         alt_name=scal3_n,
         update_var_mapping=True,
     )
     assert scal3_ == scal3_n
-    assert scal3_ == alloc_driver.map_jax_var_to_sdfg(scal3_j)
+    assert scal3_ == translation_driver.map_jax_var_to_sdfg(scal3_j)
 
     # Test the prefix functionality
     scal4_j = JaCeVar("scal4", (), dace.float64)
@@ -182,13 +182,13 @@ def test_driver_scalar(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
             f"Specified 'name_prefix' ('{scal4_p}') but passed '{scal4_n}' as 'alt_name'."
         ),
     ):
-        scal4_: str = alloc_driver.add_array(
+        scal4_: str = translation_driver.add_array(
             arg=scal4_j,
             alt_name=scal4_n,
             name_prefix=scal4_p,
         )
     # Now create it correctly
-    scal4_ = alloc_driver.add_array(
+    scal4_ = translation_driver.add_array(
         arg=scal4_j,
         name_prefix=scal4_p,
     )
@@ -201,7 +201,7 @@ def test_driver_scalar(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
         expected_exception=ValueError,
         match="Specified a stride for a scalar.",
     ):
-        scal5_: str = alloc_driver.add_array(arg=scal5_j, strides=(3,))
+        scal5_: str = translation_driver.add_array(arg=scal5_j, strides=(3,))
 
     # test the force jax name feature
     scal6_j = JaCeVar("scal6", (), dace.float64)
@@ -211,7 +211,7 @@ def test_driver_scalar(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
         expected_exception=ValueError,
         match=f"Specified 'force_jax_name', but passed '{scal6_n}' as 'alt_name'.",
     ):
-        scal6_: str = alloc_driver.add_array(
+        scal6_: str = translation_driver.add_array(
             arg=scal6_j,
             alt_name=scal6_n,
             force_jax_name=True,
@@ -220,7 +220,7 @@ def test_driver_scalar(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
         expected_exception=ValueError,
         match=f"Specified 'force_jax_name', but passed '{scal6_np}' as 'name_prefix'.",
     ):
-        scal6_ = alloc_driver.add_array(
+        scal6_ = translation_driver.add_array(
             arg=scal6_j,
             name_prefix=scal6_np,
             force_jax_name=True,
@@ -229,29 +229,29 @@ def test_driver_scalar(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
         expected_exception=ValueError,
         match="Specified `force_jax_name` but also wanted a new name.",
     ):
-        scal6_ = alloc_driver.add_array(
+        scal6_ = translation_driver.add_array(
             arg=scal6_j,
             force_jax_name=True,
             find_new_name=True,
         )
-    scal6_ = alloc_driver.add_array(
+    scal6_ = translation_driver.add_array(
         arg=scal6_j,
         force_jax_name=True,
     )
     assert scal6_ == scal6_j.name
 
 
-def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
+def test_driver_array(translation_driver: jtrans.JaxprTranslationDriver) -> None:
     """This function tests the array creation routines.
 
     However, it does so without using Jax variables.
     """
     # Allocating an array
     arr1_j = JaCeVar("arr1", (5, 3), dace.float32)
-    arr1_: str = alloc_driver.add_array(
+    arr1_: str = translation_driver.add_array(
         arg=arr1_j,
     )
-    arr1: Data = alloc_driver.get_array(arr1_)
+    arr1: Data = translation_driver.get_array(arr1_)
     assert isinstance(arr1, Array)
     assert arr1_ == arr1_j.name
     assert arr1.shape == arr1_j.shape
@@ -264,12 +264,12 @@ def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
         expected_exception=ValueError,
         match=f"Can't create variable '{arr2_j.name}', variable is already created.",
     ):
-        arr2_: str = alloc_driver.add_array(arg=arr2_j)
+        arr2_: str = translation_driver.add_array(arg=arr2_j)
     with pytest.raises(expected_exception=ValueError, match=f"Variable '{arr1_}' already exists."):
         # `alt_name` will not work because name still exists.
-        arr2_ = alloc_driver.add_array(arg=arr2_j, alt_name=arr2_j.name)
+        arr2_ = translation_driver.add_array(arg=arr2_j, alt_name=arr2_j.name)
     # However, specifying `find_new_name` will solve this issue
-    arr2_ = alloc_driver.add_array(
+    arr2_ = translation_driver.add_array(
         arg=arr2_j,
         find_new_name=True,
     )
@@ -278,11 +278,11 @@ def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
     # Create a variable that has a custom stride
     arr3_j = JaCeVar("arr3", (5, 1, 3), dace.float64)
     arr3_st = (5, 3, 2)
-    arr3_: str = alloc_driver.add_array(
+    arr3_: str = translation_driver.add_array(
         arg=arr3_j,
         strides=arr3_st,
     )
-    arr3: Data = alloc_driver.get_array(arr3_)
+    arr3: Data = translation_driver.get_array(arr3_)
     assert isinstance(arr3, Array)
     assert arr3.shape == arr3_j.shape
     assert arr3.strides == arr3_st
@@ -317,7 +317,7 @@ def test_driver_array2() -> None:
         only_creation=True,
     )
     assert res_names == exp_names, f"Expected names '{exp_names}' but got '{res_names}'."
-    assert len(driver._ctx.jax_name_map) == 2
+    assert len(driver._jax_name_map) == 2
 
     # Try to create variable `c` and `a`, however, since variable `a` already exists it will fail.
     #  However, currently the variable `c` will be created, this might change in the future.
@@ -330,15 +330,15 @@ def test_driver_array2() -> None:
             [var_c, var_a],
             only_creation=True,
         )
-    assert len(driver._ctx.jax_name_map) == 3, f"{driver._ctx.jax_name_map}"
-    assert driver._ctx.jax_name_map[var_c] == "c"
+    assert len(driver._jax_name_map) == 3, f"{driver._jax_name_map}"
+    assert driver._jax_name_map[var_c] == "c"
 
     # Now we test the only collection mode
     res_names = driver.create_jax_var_list(
         [var_c, var_a],
         prevent_creation=True,
     )
-    assert len(driver._ctx.jax_name_map) == 3, f"{driver._ctx.jax_name_map}"
+    assert len(driver._jax_name_map) == 3, f"{driver._jax_name_map}"
     assert res_names == ["c", "a"]
 
     # Now also the mixed mode, i.e. between collecting and creating.
@@ -347,9 +347,5 @@ def test_driver_array2() -> None:
     res_names = driver.create_jax_var_list(
         [var_c, var_d, var_a],
     )
-    assert len(driver._ctx.jax_name_map) == 4
+    assert len(driver._jax_name_map) == 4
     assert exp_names == res_names
-
-
-if __name__ == "__main__":
-    test_driver_alloc()

From b4ab93b85b6471d389a8ef6ac75c832e4c64f99c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 16 May 2024 13:33:36 +0200
Subject: [PATCH 154/458] This commit partially add support for a global list
 of primitive translators.

This was Enrique's idea and it is really good, but it adds a lot of complexity.
For several reasons (mainly open PR) the commit is split into two parts one that can is merged into the PR (this one) and once that contains the parts that are development only.
Essentially we want allow code such as:
```python
       @jit
       def foo(...):
              ...
       foo1 = foo.lower(...args1)
       # Modify the list of internal translators, i.e. call `add_subtranslator()`
       foo2 = foo.lower(...args2)
```
because the list of translators is an implicit argument to the `jit` decorator, we expect that `foo2` is generated with the same translators as was `foo1`, see the next commit for a full description.
This commit essentially adds two things:
- the global list that stores the translator instances
- makes all necessary changes such that stuff works.

The managing of the global list is implemented such that it results in an immutable object.
Thus every time it is mutated a new list is created.
It might be a bit strange to do that, but the list is not changed that frequently (except upon loading) and it is only a shallow copy, since the translators are immutable themselves.
This approach allows some nice optimization further down.

For more information on the code see `jace.translator.managing.add_subtranslators`.
---
 pyproject.toml                                |   5 +-
 src/jace/__init__.py                          |  15 ++
 src/jace/translator/__init__.py               |   6 +-
 .../translator/jaxpr_translator_driver.py     |  92 ++-----
 src/jace/translator/managing.py               | 214 +++++++++++++----
 src/jace/translator/primitive_translator.py   |  31 +--
 .../primitive_translators/alu_translator.py   | 155 ++++++------
 tests/test_jaxpr_translator_driver.py         |  16 +-
 tests/test_subtranslator_helper.py            | 224 +++++++++++++-----
 9 files changed, 463 insertions(+), 295 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index fa01acb..737d9e1 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -65,7 +65,7 @@ warn_unused_ignores = true
 disallow_incomplete_defs = false
 disallow_untyped_defs = false
 ignore_missing_imports = true
-module = "tests.*"
+module = ["tests.*"]
 
 # -- pytest  --
 [tool.pytest]
@@ -149,7 +149,8 @@ section-order = [
 "!tests/**.py" = ["PT"]  # Ignore `flake8-pytest-style` everywhere except in `tests/`
 "noxfile.py" = ["T20"]  # Ignore `flake8-print`
 "tests/**" = [
-  "T10", # Ignore `flake8-debugger`
+  "T10",  # Ignore `flake8-debugger`
   "T20",  # Ignore `flake8-print`
   "F841",  # Ignore `unused-variable` (inside `with` to test if throws)
+  "ARG001"  # Ignore `unused function argument` (to create simple fake stand ins)
 ]
diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 42641a0..930074e 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -13,6 +13,21 @@
 from .jax import grad, jacfwd, jacrev, jit
 
 
+def _ensure_build_in_translators_are_loaded() -> None:
+    # There is a chicken-egg problem, i.e. circular import, if we use the decorator to add the build in classes.
+    #  In order for the decorator to add the translators to the internal list, they have to be run, i.e. imported.
+    #  However, since they have to import the decorator, this would lead to a circular import.
+    #  To ensure that the built in translators are imported at the beginning, i.e. once Jace is loaded.
+    #  We define this function and call it and its only job is to load the subtranslaotrs.
+    #  However, this requires that all are imported by the `__init__.py` file.
+    # Too see that it is needed, remove this function and run `pytest tests/test_subtranslator_helper.py::test_are_subtranslators_imported`
+    from jace.translator import primitive_translators  # noqa: F401  # Unused import
+
+
+_ensure_build_in_translators_are_loaded()
+del _ensure_build_in_translators_are_loaded
+
+
 __all__ = [
     "__author__",
     "__copyright__",
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 22f3182..69600ae 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -10,7 +10,7 @@
 from __future__ import annotations
 
 from .jaxpr_translator_driver import JaxprTranslationDriver
-from .managing import add_subtranslator, get_subtranslators_cls
+from .managing import add_fsubtranslator, add_subtranslator, add_subtranslators, get_subtranslators
 from .primitive_translator import PrimitiveTranslator
 from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
@@ -20,5 +20,7 @@
     "PrimitiveTranslator",
     "TranslatedJaxprSDFG",
     "add_subtranslator",
-    "get_subtranslators_cls",
+    "add_subtranslators",
+    "add_fsubtranslator",
+    "get_subtranslators",
 ]
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 92fda72..17fd2b9 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -44,12 +44,16 @@ class JaxprTranslationDriver:
     Instead the request is forwarded to a `PrimitiveTranslator` object, also known as subtranslator.
     This is a highly specialized object that is able to handle one kind of primitive.
     For more information on the subtranslators see the documentation of `PrimitiveTranslator`.
+    The actual translators are supplied from the outside at construction time.
 
     To start a translation the `translate_jaxpr()` function should be called,
     if this happens it is said that the driver has an ongoing translation.
     If `translate_jaxpr()` is called on driver that has an ongoing translation, a new translation context will be set up.
     Thus the driver will then translate the supplied (nested) Jaxpr and return the result.
     However, this will have no influence on the translation process that is already going.
+
+    Notes:
+        The translator is able to handle multiple consecutive translations.
     """
 
     __slots__ = (
@@ -61,26 +65,24 @@ class JaxprTranslationDriver:
 
     def __init__(
         self,
-        **kwargs: Any,
+        sub_translators: Mapping[str, translator.PrimitiveTranslator],
     ) -> None:
-        """Creates the base translator.
+        """Creates the driver.
 
-        All arguments that does not start with an underscore are used as
-        arguments to construct the subtranslators.
+        Args:
+            sub_translators:    Use these subtranslators to perform the translation.
 
         Notes:
-            This function will not allocate the translation context of `self`
-                but will only allocate the shared members.
-            By setting `_no_shared_alloc` to `True` the function will not allocate
-                the shared part. This flag is provided only for implementing
-                `self.fork()` using it is an error and undefined behaviour.
+            `sub_translators` is not copied, thus the user has to guarantee,
+                that it will not change during translation.
+                It is highly advised but not requiered to use the output of
+                `get_subtranslators()` or pass a copy as argument.
         """
-        # Contains all the subtranslators that we need.
-        #  They are partitioned by the names of the primitive they have registered for.
-        #  This member is allocated by '_init_sub_translators()' and remains allocated
-        #  during the lifetime of the object.
-        self._sub_translators: dict[str, translator.PrimitiveTranslator] = None  # type: ignore[assignment]
-        self._init_sub_translators(kwargs)
+
+        # Shared with the outside, while key and mapped values are immutable,
+        #  the mapping itself is not, but it should be fine.
+        #  Allocated through the lifetime of `self`.
+        self._sub_translators: Mapping[str, translator.PrimitiveTranslator] = sub_translators
 
         # These names can not be used for the automatic naming of Jax variables.
         #  They differ from the forbidden names, that they denote valid SDFG names.
@@ -767,32 +769,6 @@ def _ctx(self) -> translator.TranslatedJaxprSDFG:
         assert len(self._ctx_stack) != 0, "No context is active."
         return self._ctx_stack[-1]
 
-    def _init_sub_translators(
-        self,
-        subtrans_args: Mapping[str, Any],
-    ) -> JaxprTranslationDriver:
-        """This function initializes the subtranslator.
-
-        The function forwards `kwargs` to the constructor of the subtranslators.
-        However, it will remove all arguments starting with an underscore.
-        """
-
-        subtrans_args = {k: v for k, v in subtrans_args.items() if not k.startswith("_")}
-        prim_translators: dict[str, translator.PrimitiveTranslator] = {}
-        for prim_translator_cls in translator.get_subtranslators_cls():
-            prim_translator: translator.PrimitiveTranslator = prim_translator_cls.build_translator(
-                **subtrans_args
-            )
-            handled_primitives: Iterable[str] = util.as_sequence(prim_translator.primitive)
-
-            for handled_primitive in handled_primitives:
-                if handled_primitive in prim_translators:
-                    raise RuntimeError(f"Multiple translators for '{handled_primitive}' found.")
-                prim_translators[handled_primitive] = prim_translator
-        self._sub_translators = prim_translators
-
-        return self
-
     def _clear_translation_ctx(self) -> JaxprTranslationDriver:
         """This function deallocate the translation context of `self`.
 
@@ -815,17 +791,6 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
             self._ctx_stack.pop()
         return self
 
-    def _find_sub_translator_for(
-        self,
-        eqn: jax_core.JaxprEqn,
-    ) -> translator.PrimitiveTranslator:
-        """Returns the appropriate subtranslator for equation `eqn`."""
-        prim_name: str = eqn.primitive.name
-        if prim_name not in self._sub_translators:
-            raise NotImplementedError(f"No subtranslators known to handle '{prim_name}'.")
-
-        return self._sub_translators[prim_name]
-
     def _translate_single_eqn(
         self,
         eqn: jax_core.JaxprEqn,
@@ -864,17 +829,22 @@ def _translate_single_eqn(
         )
 
         # Find the subtranslator
-        subtranslator: translator.PrimitiveTranslator = self._find_sub_translator_for(eqn)
+        prim_name: str = eqn.primitive.name
+        if prim_name not in self._sub_translators:
+            raise NotImplementedError(
+                f"No subtranslators known to handle '{prim_name}' || {type(self._sub_translators)}."
+            )
+        subtranslator = self._sub_translators[prim_name]
 
         # Create the state into which the equation should be translated
         last_term_state: dace.SDFGState = self.terminal_sdfg_state  # noqa: F841 # Will be used later
         eqn_state = self.append_new_state(
-            label=f"{eqn.primitive.name}_{out_var_names[0]}",
+            label=f"{eqn.primitive.name}_{'_'.join(out_var_names)}",
             prev_state=None,  # forces terminal state to use
         )
 
         # Now perform the actual translation of the equation.
-        new_sdfg_term_state = subtranslator.translate_jaxeqn(
+        new_sdfg_term_state = subtranslator(
             driver=self,
             in_var_names=in_var_names,
             out_var_names=out_var_names,  # Might be modified by the subtranslator!
@@ -946,18 +916,6 @@ def _translate_jaxpr_internal(
         # Set the output names inside the context.
         self._ctx.out_names = tuple(out_var_names)
 
-        return self._export_context()
-
-    def _export_context(self) -> translator.TranslatedJaxprSDFG:
-        """Encapsulate the translation context of `self` into a `TranslatedJaxprSDFG` object..
-
-        This function will not deallocate the internal context of `self`.
-        Thus `self` and the return value will share the same context in memory.
-        To free the context of `self` use `self._clear_translation_ctx()`.
-        """
-        assert self.is_allocated()
-        assert all((isinstance(x, str) and (len(x) > 0)) for x in self._ctx.inp_names)
-        assert all((isinstance(x, str) and (len(x) > 0)) for x in self._ctx.out_names)
         return self._ctx
 
     def _handle_null_jaxpr(
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index 589b446..e3afc99 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -4,79 +4,195 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
-"""Module for managing the individual sutranslators."""
+"""Module for managing the individual sutranslators.
+
+The high level idea is that there is a "list" of instances of `PrimitiveTranslator`,
+which is known as `_CURRENT_SUBTRANSLATORS`.
+If not specified the content of this list is used to perform the translation.
+"""
 
 from __future__ import annotations
 
-from collections.abc import Callable, Sequence
-from typing import Literal, overload
+import inspect
+import types
+from collections.abc import Callable, Mapping, MutableMapping
+from typing import TYPE_CHECKING, Literal, TypeAlias, cast, overload
 
-from jace import translator
 
+if TYPE_CHECKING:
+    from jace import translator
 
-# List of all primitive translators that are known to Jace.
-#  They are filled through the `add_subtranslator()` decorator.
-#  See also the note in `get_subtranslators_cls()`
-_KNOWN_SUBTRANSLATORS: list[type[translator.PrimitiveTranslator]] = []
+    # Type alias for distinguish between instances and classes.
+    PrimitiveTranslator: TypeAlias = (
+        type[translator.PrimitiveTranslator] | translator.PrimitiveTranslator | Callable
+    )
 
 
-@overload
-def add_subtranslator(
-    subtrans: Literal[None], /, overwrite: bool = False
-) -> Callable[[type[translator.PrimitiveTranslator]], type[translator.PrimitiveTranslator]]: ...
+# These are all currently used subtranslators that we are used.
+_CURRENT_SUBTRANSLATORS: dict[str, translator.PrimitiveTranslator] = {}
+_CURRENT_SUBTRANSLATORS_VIEW: types.MappingProxyType[str, translator.PrimitiveTranslator] = (
+    types.MappingProxyType(_CURRENT_SUBTRANSLATORS)
+)
 
 
-@overload
-def add_subtranslator(
-    subtrans: type[translator.PrimitiveTranslator], /, overwrite: bool = False
-) -> type[translator.PrimitiveTranslator]: ...
+def add_subtranslators(
+    *subtrans: PrimitiveTranslator | None,
+    overwrite: bool = False,
+) -> None:
+    """Adds many subtranslators in one step to Jace's internal list.
+
+    This function is more efficient if many translators should be added in one go.
+    Please refer to `add_subtranslator()` for more information.
+
+    Notes:
+        If an error during insertion happens the operation is considered a no ops.
+    """
+    from jace import translator  # Circular import
+
+    global _CURRENT_SUBTRANSLATORS
+    global _CURRENT_SUBTRANSLATORS_VIEW
+
+    if len(subtrans) == 0:
+        raise ValueError("Not passed any subtranslators.")
+
+    # Why do we do this kind of versioning here or versioning at all?
+    #  The cache has to include the set of used subtranslators somehow.
+    #  However, as explained in `JaceWrapped.__init__()` the function must make a copy of it.
+    #  One way would be to hash the content, i.e. `[(prim_name, id(prim_translator)), ...]`.
+    #  But a much simpler idea is to just consider its address, since in 99% of the cases,
+    #  the global list is used and not some user supplied list is used we do this versioning.
+    #  This allows `JaceWrapped.__init__()` to identify if the current global list of installed
+    #  translated is passed to it and it can then prevent the copying.
+    #  In the end a code like:
+    #       def foo(...): ...
+    #       foo1 = jace.jit(foo).lower()   # noqa: ERA001 commented out code
+    #       foo2 = jace.jit(foo).lower()   # noqa: ERA001
+    #  Should only lower once as it is seen in Jax.
+    new_CURRENT_SUBTRANSLATORS = _CURRENT_SUBTRANSLATORS.copy()
+
+    for prim_trans in subtrans:
+        # If it is a class instantiate it.
+        if inspect.isclass(prim_trans):
+            prim_trans = prim_trans()
+        prim_trans = cast(translator.PrimitiveTranslator, prim_trans)
+
+        # Test if we know the primitive already
+        prim_name: str = prim_trans.primitive
+        if (prim_name in _CURRENT_SUBTRANSLATORS) and (not overwrite):
+            raise ValueError(f"Tried to add a second translator for primitive '{prim_name}'.")
+
+        # Commit the change to a "staging"
+        new_CURRENT_SUBTRANSLATORS[prim_name] = prim_trans
+
+    # Now update the global variables.
+    #  Doing it after the loop gives us exception guarantee
+    _CURRENT_SUBTRANSLATORS = new_CURRENT_SUBTRANSLATORS
+    _CURRENT_SUBTRANSLATORS_VIEW = types.MappingProxyType(_CURRENT_SUBTRANSLATORS)
 
 
 def add_subtranslator(
-    subtrans: type[translator.PrimitiveTranslator] | None = None,
+    subtrans: PrimitiveTranslator | None = None,
     /,
     overwrite: bool = False,
-) -> (
-    type[translator.PrimitiveTranslator]
-    | Callable[[type[translator.PrimitiveTranslator]], type[translator.PrimitiveTranslator]]
-):
-    """Decorator to add `subtrans` to the list of known subtranslators.
-
-    If a class is tried to be registered twice an error will be generated unless, `overwrite` is set.
+) -> PrimitiveTranslator | Callable[[PrimitiveTranslator], PrimitiveTranslator]:
+    """Adds the subtranslator `subtrans` to Jace's internal list of translators.
+
+    If the primitive is already known an error is generated, however, if `overwrite` is given,
+    then `subtrans` will replace the current one.
+    In case `subtrans` is a class, the function will instantiate it first.
+    Thus, a class must be constructable without arguments.
+
+    Notes:
+        Calls to this function will never modify subtranslator lists previously obtained by `get_subtranslators()`!
+        Since `subtrans` is returned unmodified, this function can be used to annotate classes.
+        For annotating functions use `add_fsubtranslator()`.
+
+    Todo:
+        Accept many inputs for bulk update.
+        Add functions to clear them or restore the default ones.
     """
-    if subtrans is None:
 
+    if subtrans is None:
+        # It was used as decorator with some argument (currently `overwrite`).
         def wrapper(
-            real_subtrans: type[translator.PrimitiveTranslator],
-        ) -> type[translator.PrimitiveTranslator]:
+            real_subtrans: PrimitiveTranslator,
+        ) -> PrimitiveTranslator:
             return add_subtranslator(real_subtrans, overwrite=overwrite)
 
         return wrapper
 
-    if subtrans in _KNOWN_SUBTRANSLATORS:
-        if overwrite:
-            _KNOWN_SUBTRANSLATORS.remove(subtrans)
-        else:
-            raise ValueError(
-                f"Tried to add '{type(subtrans).__name__}' twice to the list of known primitive translators."
-            )
-
-    _KNOWN_SUBTRANSLATORS.append(subtrans)
+    # Forward the call to the bulk insertion.
+    #  And always return the original argument.
+    add_subtranslators(subtrans, overwrite=overwrite)
     return subtrans
 
 
-def get_subtranslators_cls() -> Sequence[type[translator.PrimitiveTranslator]]:
-    """Returns the list of all subtranslator known to JaCe.
+def add_fsubtranslator(
+    prim_name: str,
+    fun: Callable | None = None,
+    /,
+    overwrite: bool = False,
+) -> PrimitiveTranslator | Callable[[Callable], PrimitiveTranslator]:
+    """Convenience function to annotate function and turn them into a translator.
+
+    Adds the `primitive` property to `fun` and register it then as translator.
+
+    Notes:
+        Without this function you would had to define the translator function,
+            add the `primitive` property to it and then pass it to `add_subtranslator()`.
+            This function allows it to do in one step.
+    """
+
+    if fun is None:
+        # Annotated mode.
+        def wrapper(real_fun: Callable) -> PrimitiveTranslator:
+            return add_fsubtranslator(prim_name, real_fun, overwrite=overwrite)
+
+        return wrapper
+
+    assert inspect.isfunction(fun)
+    if getattr(fun, "primitive", prim_name) != prim_name:
+        raise ValueError(f"Passed 'fun' already '{fun.primitive}' as 'primitive' property.")  # type: ignore[attr-defined]
+
+    fun.primitive = prim_name  # type: ignore[attr-defined]
+    return add_subtranslator(fun, overwrite=overwrite)
+
+
+@overload
+def get_subtranslators(  # type: ignore[overload-overlap]
+    as_mutable: Literal[False] = False,
+) -> Mapping[str, translator.PrimitiveTranslator]: ...
+
+
+@overload
+def get_subtranslators(
+    as_mutable: Literal[True] = True,
+) -> MutableMapping[str, translator.PrimitiveTranslator]: ...
+
+
+def get_subtranslators(
+    as_mutable: bool = False,
+) -> (
+    Mapping[str, translator.PrimitiveTranslator]
+    | MutableMapping[str, translator.PrimitiveTranslator]
+):
+    """Returns a view of all _currently_ installed primitive translators in Jace.
+
+    By setting `as_mutable` to `True` the function will return a mutable mapping object.
+    However, in any case the returned mapping will not be affected by calls that modify
+    the internal list of registered primitive translators, i.e. `add_subtranslator()`.
 
-    The subtranslators are returned in FIFO order.
+    Notes:
+        If `as_mutable` is `False` the function will return an immutable view of the
+            registered primitive translator list, thus only a view is created.
+            However, if `as_mutable` is `True` a copy is returned.
     """
-    # There is a chicken-egg problem, i.e. circular import, if we use the decorator to add the build in classes.
-    #  The problem is, that they are only run, i.e. added to the list, upon importing.
-    #  Thus we have to explicitly import the subtranslator, but this would then lead to a circular import.
-    #  For that reason we import the subpackage here explicitly.
-    #  However, this requires that all are imported by the `__init__.py` file.
-    #  I do not know a way to do this better.
-    #  Actually I want to do it somehow upon the importation of `jace` itself.
-    from jace.translator import primitive_translators  # noqa: F401  # Unused import
-
-    return list(reversed(_KNOWN_SUBTRANSLATORS))
+    if as_mutable:
+        # The use case for this is, that a user wants to populate its own list and do some funky stuff.
+        #  Without this option, he would first have to make a mutable copy of the map manually,
+        #  every fucking time he wants it, so making an option is simpler.
+        return _CURRENT_SUBTRANSLATORS.copy()
+
+    # Since we do a versioning in `add_subtranslator()` we do not have to create a new view.
+    #  We can just return the global view, this is needed to fix some problems in the caching.
+    return _CURRENT_SUBTRANSLATORS_VIEW
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index fa717aa..2e00ed6 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -17,7 +17,7 @@
 
 from abc import abstractmethod
 from collections.abc import MutableSequence, Sequence
-from typing import Any, Protocol, runtime_checkable
+from typing import Protocol, runtime_checkable
 
 import dace
 from jax import core as jax_core
@@ -30,44 +30,25 @@ class PrimitiveTranslator(Protocol):
     """Interface for all Jax primitive translators, also known as subtranslator.
 
     A translator for a primitive translates a single equation of a Jaxpr into its SDFG equivalent.
-    A type that implements this interface must fulfil the following properties:
-    - It must be immutable after construction.
-    - All subclass must implement the class method `build_translator()` to construct an instance.
+    For satisfying this interface a concrete implementation must be immutable after construction.
 
     Subtranslators are simple, but highly specialized objects that are only able to perform the translation of a single primitive.
     The overall translation process itself is managed by a driver object, which also owns and manage the subtranslators.
     In the end this implements the delegation pattern.
 
-    After instantiation a driver calls the subtranslator's `get_handled_primitive()` method.
-    This function returns the name of the Jax primitive the subtranslator is able to handle.
-    In case a subtranslator is able to handle multiple primitives, it should return a list with their names.
-    While there is no limit to the numbers of primitive a subtranslator can register itself for,
-    only one subtranslator can be register for any primitive.
+    You can use `jace.translator.add_subtranslator()` to register your translator to Jace.
     """
 
     __slots__ = ()
 
-    @classmethod
-    @abstractmethod
-    def build_translator(
-        cls,
-        *args: Any,
-        **kwargs: Any,
-    ) -> PrimitiveTranslator:
-        """Creates an instance of a subtranslator."""
-        ...
-
     @property
     @abstractmethod
-    def primitive(self) -> str | Sequence[str]:
-        """Returns the names of the Jax primitive that `self` is able to handle.
-
-        In case `self` can handle multiple primitives, it should return a list with these names.
-        """
+    def primitive(self) -> str:
+        """Returns the name of the Jax primitive that `self` is able to handle."""
         ...
 
     @abstractmethod
-    def translate_jaxeqn(
+    def __call__(
         self,
         driver: translator.JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
diff --git a/src/jace/translator/primitive_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
index 9f7aa44..05ce3fe 100644
--- a/src/jace/translator/primitive_translators/alu_translator.py
+++ b/src/jace/translator/primitive_translators/alu_translator.py
@@ -20,77 +20,30 @@
 from jace import translator
 
 
-@translator.add_subtranslator
 class ALUTranslator(translator.PrimitiveTranslator):
-    """This translator handles all arithmetic and logical operations."""
-
-    __slots__ = ()
-
-    # Contains all translation templates for unary operations.
-    _unary_ops: Final[dict[str, str]] = {
-        "pos": "__out0 = +(__in0)",
-        "neg": "__out0 = -(__in0)",
-        "not": "__out0 = not (__in0)",
-        "floor": "__out0 = floor(__in0)",
-        "ceil": "__out0 = ceil(__in0)",
-        "round": "__out0 = round(__in0)",
-        "abs": "__out0 = abs(__in0)",
-        "sign": "__out0 = sign(__in0)",
-        "sqrt": "__out0 = sqrt(__in0)",
-        "log": "__out0 = log(__in0)",
-        "exp": "__out0 = exp(__in0)",
-        "integer_pow": "__out0 = (__in0)**({y})",  # 'y' is a parameter of the primitive
-        "sin": "__out0 = sin(__in0)",
-        "asin": "__out0 = asin(__in0)",
-        "cos": "__out0 = cos(__in0)",
-        "acos": "__out0 = acos(__in0)",
-        "tan": "__out0 = tan(__in0)",
-        "atan": "__out0 = atan(__in0)",
-        "tanh": "__out0 = tanh(__in0)",
-    }
-    # Transformation for all binary operations
-    _binary_ops: Final[dict[str, str]] = {
-        "add": "__out0 = (__in0)+(__in1)",
-        "add_any": "__out0 = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
-        "sub": "__out0 = (__in0)-(__in1)",
-        "mul": "__out0 = (__in0)*(__in1)",
-        "div": "__out0 = (__in0)/(__in1)",
-        "rem": "__out0 = (__in0)%(__in1)",
-        "and": "__out0 = (__in0) and (__in1)",
-        "or": "__out0 = (__in0) or  (__in1)",
-        "pow": "__out0 = (__in0)**(__in1)",
-        "ipow": "__out0 = (__in0)**(int(__in1))",
-        "min": "__out0 = min(__in0, __in1)",
-        "max": "__out0 = max(__in0, __in1)",
-        "eq": "__out0 = __in0 == __in1",
-        "ne": "__out0 = __in0 != __in1",
-        "ge": "__out0 = __in0 >= __in1",
-        "gt": "__out0 = __in0 > __in1",
-        "le": "__out0 = __in0 <= __in1",
-        "lt": "__out0 = __in0 < __in1",
-    }
-
-    @classmethod
-    def build_translator(
-        cls,
-        *args: Any,
-        **kwargs: Any,
-    ) -> ALUTranslator:
-        """Creates an `ALUTranslator` instance."""
-        return cls(*args, **kwargs)
-
-    def __init__(self, **kwargs: Any) -> None:
+    """This translator handles all arithmetic and logical operations.
+
+    This translator will be reworked soon, it just exists that the initial PR can do anything at all!!
+    """
+
+    __slots__ = ("_prim_name", "_prim_tmpl")
+
+    def __init__(
+        self,
+        prim_name: str,
+        prim_tmpl: str,
+    ) -> None:
         """Initialize the `ALUTranslator`."""
-        super().__init__(**kwargs)
+        self._prim_name = prim_name
+        self._prim_tmpl = prim_tmpl
 
     @property
     @override
-    def primitive(self) -> Sequence[str]:
-        """Returns the list of all known primitives."""
-        return list(self._unary_ops.keys()) + list(self._binary_ops.keys())
+    def primitive(self) -> str:
+        return self._prim_name
 
     @override
-    def translate_jaxeqn(
+    def __call__(
         self,
         driver: translator.JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
@@ -111,6 +64,7 @@ def translate_jaxeqn(
             eqn:            The Jax equation that is translated.
             eqn_state:      State into which the primitive's SDFG representation is constructed.
         """
+        assert self._prim_name == eqn.primitive.name
 
         # Determine what kind of input we got and how we should proceed.
         is_scalar = len(eqn.outvars[0].aval.shape) == 0
@@ -253,31 +207,8 @@ def _write_tasklet_code(
         Args:
             in_var_names:   The list of SDFG variables used as input.
         """
-        t_name = eqn.primitive.name
-        if t_name == "integer_pow":
-            # INTEGER POWER
-            exponent = int(eqn.params["y"])
-            if exponent == 0:
-                t_code = f"__out0 = dace.{eqn.outvars[0].aval.dtype!s}(1)"
-            elif exponent == 1:
-                t_code = "__out0 = __in0"
-            elif exponent == 2:
-                t_code = "__out0 = __in0 * __in0"
-            elif exponent == 3:
-                t_code = "__out0 = (__in0 * __in0) * __in0"
-            elif exponent == 4:
-                t_code = "__tmp0 = __in0 * __in0\n__out0 = __tmp0 * __tmp0"
-            elif exponent == 5:
-                t_code = "__tmp0 = __in0 * __in0\n__tmp1 = __tmp0 * __tmp0\n__out0 = __tmp1 * __in0"
-            else:
-                t_code = self._unary_ops[t_name]
 
-        else:
-            # GENERAL CASE
-            if t_name in self._unary_ops:
-                t_code = self._unary_ops[t_name]
-            elif t_name in self._binary_ops:
-                t_code = self._binary_ops[t_name]
+        t_code = self._prim_tmpl
 
         # Now we handle Literal substitution
         for i, in_var_name in enumerate(in_var_names):
@@ -308,3 +239,51 @@ def _list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
     The function will only include pairs whose key, i.e. first element is not `None`.
     """
     return {k: v for k, v in inp if k is not None}
+
+
+# Contains all the templates for ALU operations.
+_ALU_OPS_TMPL: Final[dict[str, str]] = {
+    # Unary operations
+    "pos": "__out0 = +(__in0)",
+    "neg": "__out0 = -(__in0)",
+    "not": "__out0 = not (__in0)",
+    "floor": "__out0 = floor(__in0)",
+    "ceil": "__out0 = ceil(__in0)",
+    "round": "__out0 = round(__in0)",
+    "abs": "__out0 = abs(__in0)",
+    "sign": "__out0 = sign(__in0)",
+    "sqrt": "__out0 = sqrt(__in0)",
+    "log": "__out0 = log(__in0)",
+    "exp": "__out0 = exp(__in0)",
+    "integer_pow": "__out0 = (__in0)**({y})",  # 'y' is a parameter of the primitive
+    "sin": "__out0 = sin(__in0)",
+    "asin": "__out0 = asin(__in0)",
+    "cos": "__out0 = cos(__in0)",
+    "acos": "__out0 = acos(__in0)",
+    "tan": "__out0 = tan(__in0)",
+    "atan": "__out0 = atan(__in0)",
+    "tanh": "__out0 = tanh(__in0)",
+    # Binary operations
+    "add": "__out0 = (__in0)+(__in1)",
+    "add_any": "__out0 = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
+    "sub": "__out0 = (__in0)-(__in1)",
+    "mul": "__out0 = (__in0)*(__in1)",
+    "div": "__out0 = (__in0)/(__in1)",
+    "rem": "__out0 = (__in0)%(__in1)",
+    "and": "__out0 = (__in0) and (__in1)",
+    "or": "__out0 = (__in0) or  (__in1)",
+    "pow": "__out0 = (__in0)**(__in1)",
+    "ipow": "__out0 = (__in0)**(int(__in1))",
+    "min": "__out0 = min(__in0, __in1)",
+    "max": "__out0 = max(__in0, __in1)",
+    "eq": "__out0 = __in0 == __in1",
+    "ne": "__out0 = __in0 != __in1",
+    "ge": "__out0 = __in0 >= __in1",
+    "gt": "__out0 = __in0 > __in1",
+    "le": "__out0 = __in0 <= __in1",
+    "lt": "__out0 = __in0 < __in1",
+}
+
+translator.add_subtranslators(
+    *[ALUTranslator(prim_name, prim_tmpl) for prim_name, prim_tmpl in _ALU_OPS_TMPL.items()]
+)
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index e52873e..12eb48c 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -15,7 +15,7 @@
 import pytest
 from dace.data import Array, Data, Scalar
 
-from jace import translator as jtrans
+from jace import translator
 from jace.util import JaCeVar
 
 
@@ -23,14 +23,14 @@
 def translation_driver():
     """Returns an allocated driver instance."""
     name = "fixture_driver"
-    driver = jtrans.JaxprTranslationDriver()
+    driver = translator.JaxprTranslationDriver(sub_translators=translator.get_subtranslators())
     driver._allocate_translation_ctx(name=name)
     return driver
 
 
 def test_driver_alloc() -> None:
     """Tests the state right after allocation."""
-    driver = jtrans.JaxprTranslationDriver()
+    driver = translator.JaxprTranslationDriver(sub_translators=translator.get_subtranslators())
     assert not driver.is_allocated(), "Driver was created allocated."
     assert len(driver._ctx_stack) == 0
 
@@ -55,7 +55,7 @@ def test_driver_nested() -> None:
     """
 
     # This is the parent driver.
-    driver = jtrans.JaxprTranslationDriver()
+    driver = translator.JaxprTranslationDriver(sub_translators=translator.get_subtranslators())
     assert not driver.is_allocated(), "Driver should not be allocated."
 
     # We allocate the driver directly, because we need to set some internals.
@@ -92,7 +92,7 @@ def test_driver_nested() -> None:
     assert driver._reserved_names is None
 
 
-def test_driver_append_state(translation_driver: jtrans.JaxprTranslationDriver) -> None:
+def test_driver_append_state(translation_driver: translator.JaxprTranslationDriver) -> None:
     """Tests the functionality of appending states."""
     sdfg: dace.SDFG = translation_driver.sdfg
 
@@ -128,7 +128,7 @@ def test_driver_append_state(translation_driver: jtrans.JaxprTranslationDriver)
     assert next(iter(sdfg.in_edges(non_terminal_state))).src is terminal_state_1
 
 
-def test_driver_scalar(translation_driver: jtrans.JaxprTranslationDriver) -> None:
+def test_driver_scalar(translation_driver: translator.JaxprTranslationDriver) -> None:
     """This function tests the array creation routines, especially the scalar part.
 
     However, it does so without using Jax variables.
@@ -241,7 +241,7 @@ def test_driver_scalar(translation_driver: jtrans.JaxprTranslationDriver) -> Non
     assert scal6_ == scal6_j.name
 
 
-def test_driver_array(translation_driver: jtrans.JaxprTranslationDriver) -> None:
+def test_driver_array(translation_driver: translator.JaxprTranslationDriver) -> None:
     """This function tests the array creation routines.
 
     However, it does so without using Jax variables.
@@ -295,7 +295,7 @@ def test_driver_array2() -> None:
         - Literals.
     """
     # This is the parent driver.
-    driver = jtrans.JaxprTranslationDriver()
+    driver = translator.JaxprTranslationDriver(sub_translators=translator.get_subtranslators())
     assert not driver.is_allocated(), "Driver should not be allocated."
 
     # Creating JaCe Variables with empty names, forces the driver to use the
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index e50f9a5..d5885a3 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -10,97 +10,213 @@
 from __future__ import annotations
 
 import re
+from collections.abc import Mapping, MutableSequence, Sequence
+from inspect import isclass, isfunction
+from typing import Any
 
+import dace
+import jax
+import numpy as np
 import pytest
+from jax import core as jax_core
 
+import jace
 from jace import translator as jtrans
+from jace.translator import (
+    add_fsubtranslator,
+    add_subtranslator,
+    get_subtranslators,
+)
+
+
+@pytest.fixture(autouse=True)
+def _conserve_builtin_translators():
+    """Decorator that preserves the initial list of built in translators.
+
+    Todo:
+        Come up with something better/nicer.
+    """
+    initial_translators = get_subtranslators()
+    yield
+    jtrans.add_subtranslators(*initial_translators.values(), overwrite=True)
+
+
+def _dict_struct(dict_: Mapping[str, Any]) -> Sequence[tuple[str, int]]:
+    return tuple(sorted(((k, id(v)) for k, v in dict_.items()), key=lambda X: X[0]))
+
+
+def test_are_subtranslators_imported():
+    """Tests if something is inside the list of subtranslators."""
+    assert len(get_subtranslators()) > 1
 
 
 def test_subtranslatior_managing():
     """Ensures the functionality of the subtranslator managing."""
-    from jace.translator import (
-        add_subtranslator,
-        get_subtranslators_cls,
-    )
 
-    # These are all initial subtranslators
-    builtin_subtrans_cls = get_subtranslators_cls()
+    # TODO(phimuell): Make this more friendly; See blow
+    builtin_subtrans = get_subtranslators()
+    builin_struct = _dict_struct(builtin_subtrans)
 
-    # Definitions of some classes to help.
     class SubTrans1(jtrans.PrimitiveTranslator):
-        @classmethod
-        def build_translator(cls) -> SubTrans1:
-            return SubTrans1()
-
         @property
         def primitive(self):
             return "non_existing_primitive1"
 
-        def translate_jaxeqn(self) -> None:  # type: ignore[override]  # Arguments
-            return None
+        def __call__(self) -> None:  # type: ignore[override]  # Arguments
+            raise NotImplementedError
 
-    class SubTrans2(jtrans.PrimitiveTranslator):
-        @classmethod
-        def build_translator(cls) -> SubTrans2:
-            return SubTrans2()
+    # Ensures that we really return the object unmodified.
+    SubTrans1_ = add_subtranslator(SubTrans1)
+    assert isclass(SubTrans1_)
+    assert SubTrans1_ is SubTrans1
 
+    @add_subtranslator(overwrite=True)
+    class SubTrans2(jtrans.PrimitiveTranslator):
         @property
         def primitive(self):
             return "non_existing_primitive2"
 
-        def translate_jaxeqn(self) -> None:  # type: ignore[override]  # Arguments
-            return None
-
-    assert SubTrans1 != SubTrans2
-
-    # Adding the first subtranslator to the list.
-    add_subtranslator(SubTrans1)
+        def __call__(self) -> None:  # type: ignore[override]  # Arguments
+            raise NotImplementedError
+
+    assert isclass(SubTrans2)
+
+    @add_fsubtranslator("non_existing_primitive3")
+    def non_existing_primitive_translator_3(
+        driver: jtrans.JaxprTranslationDriver,
+        in_var_names: Sequence[str | None],
+        out_var_names: MutableSequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> dace.SDFGState | None:
+        raise NotImplementedError
+
+    assert isfunction(non_existing_primitive_translator_3)
+    assert non_existing_primitive_translator_3.primitive == "non_existing_primitive3"
+
+    curr1_subtrans = get_subtranslators()
+    curr1_subtrans_mod = get_subtranslators(as_mutable=True)
+    assert curr1_subtrans is not builtin_subtrans
+    assert curr1_subtrans is not curr1_subtrans_mod
+    assert _dict_struct(curr1_subtrans) != builin_struct
+    assert _dict_struct(curr1_subtrans) == _dict_struct(curr1_subtrans_mod)
+
+    for i in [1, 2, 3]:
+        pname = f"non_existing_primitive{i}"
+        assert pname in curr1_subtrans, f"Expected to find '{pname}'."
+        curr1_subtrans_mod.pop(pname)
+    assert builin_struct == _dict_struct(curr1_subtrans_mod)
+    assert curr1_subtrans is get_subtranslators()
+
+    # Try adding instance and if we can overwrite.
+    sub_trans1_instance = SubTrans1()
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=re.escape(
+            "Tried to add a second translator for primitive 'non_existing_primitive1'."
+        ),
+    ):
+        add_subtranslator(sub_trans1_instance, overwrite=False)
 
-    curr_subtrans_cls = get_subtranslators_cls()
-    assert len(curr_subtrans_cls) == len(builtin_subtrans_cls) + 1
-    assert all(
-        type(exp) == type(got)
-        for exp, got in zip([SubTrans1, *builtin_subtrans_cls], curr_subtrans_cls)
-    )
+    # Now adding it forcefully, this should also change a lot.
+    add_subtranslator(sub_trans1_instance, overwrite=True)
 
-    # Now adding the second subtranslator
-    add_subtranslator(SubTrans2)
+    curr2_subtrans = get_subtranslators()
+    assert curr2_subtrans is not builtin_subtrans
+    assert curr2_subtrans is not curr1_subtrans
+    assert _dict_struct(curr2_subtrans) != builin_struct
+    assert _dict_struct(curr2_subtrans) != _dict_struct(curr1_subtrans)
+    assert curr2_subtrans["non_existing_primitive1"] is sub_trans1_instance
 
-    curr_subtrans_cls2 = get_subtranslators_cls()
-    assert len(curr_subtrans_cls2) == len(builtin_subtrans_cls) + 2
-    assert [SubTrans2, SubTrans1, *builtin_subtrans_cls] == curr_subtrans_cls2
-    assert curr_subtrans_cls2 is not curr_subtrans_cls
+    # Try to answer a function as translator, that already has a primitive property.
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=re.escape("Passed 'fun' already 'non_existing_primitive3' as 'primitive' property."),
+    ):
+        add_fsubtranslator(
+            "non_existing_primitive1", non_existing_primitive_translator_3, overwrite=False
+        )
 
+    # This would work because it has the same primitive name, but it fails because overwrite is False
     with pytest.raises(
         expected_exception=ValueError,
         match=re.escape(
-            f"Tried to add '{type(SubTrans1).__name__}' twice to the list of known primitive translators."
+            "Tried to add a second translator for primitive 'non_existing_primitive3'."
         ),
     ):
-        add_subtranslator(SubTrans2)
+        add_fsubtranslator(
+            "non_existing_primitive3", non_existing_primitive_translator_3, overwrite=False
+        )
 
-    @add_subtranslator
-    class SubTrans3(jtrans.PrimitiveTranslator):
-        @classmethod
-        def build_translator(cls) -> SubTrans2:
-            return SubTrans2()
+    add_fsubtranslator(
+        "non_existing_primitive3", non_existing_primitive_translator_3, overwrite=True
+    )
+
+
+def test_subtranslatior_managing_2():
+    """Shows that we are really able to overwrite stuff"""
+    jax.config.update("jax_enable_x64", True)
 
+    @add_subtranslator(overwrite=True)
+    class NonAddTranslator(jtrans.PrimitiveTranslator):
         @property
         def primitive(self):
-            return "non_existing_primitive2"
+            return "add"
+
+        def __call__(self, *args, **kwargs) -> None:
+            raise NotImplementedError("The 'NonAddTranslator' can not translate anything.")
+
+    @jace.jit
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A + B
+
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    with pytest.raises(
+        expected_exception=NotImplementedError,
+        match=re.escape("The 'NonAddTranslator' can not translate anything."),
+    ):
+        _ = testee.lower(A, B)
+
 
-        def translate_jaxeqn(self) -> None:  # type: ignore[override]  # Arguments
-            return None
+def test_subtranslatior_managing_3():
+    """Shows proper decoupling."""
+    jax.config.update("jax_enable_x64", True)
 
-    curr_subtrans_cls3 = get_subtranslators_cls()
-    assert len(curr_subtrans_cls3) == len(builtin_subtrans_cls) + 3
-    assert [SubTrans3, SubTrans2, SubTrans1, *builtin_subtrans_cls] == curr_subtrans_cls3
+    class NonAddTranslator(jtrans.PrimitiveTranslator):
+        @property
+        def primitive(self):
+            return "add"
+
+        def __call__(self, *args, **kwargs) -> None:
+            raise NotImplementedError("The 'NonAddTranslator' can not translate anything at all.")
+
+    used_sub_trans = get_subtranslators(as_mutable=True)
+    used_sub_trans["add"] = NonAddTranslator()
+
+    @jace.jit(sub_translators=used_sub_trans)
+    def not_working_test(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A + B
+
+    # Now we again remove the add from the list, but this will not have an impact on the `not_working_test()`.
+    used_sub_trans.pop("add")
+
+    @jace.jit
+    def working_test(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A + B
+
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    with pytest.raises(
+        expected_exception=NotImplementedError,
+        match=re.escape("The 'NonAddTranslator' can not translate anything at all."),
+    ):
+        _ = not_working_test.lower(A, B)
 
-    # Adding version 1 again, but this time using overwrite
-    add_subtranslator(SubTrans1, overwrite=True)
-    curr_subtrans_cls4 = get_subtranslators_cls()
-    assert len(curr_subtrans_cls3) == len(curr_subtrans_cls4)
-    assert [SubTrans1, SubTrans3, SubTrans2, *builtin_subtrans_cls] == curr_subtrans_cls4
+    # This works because the
+    working_test.lower(A, B)
 
 
 if __name__ == "__main__":

From bdceaf0e3aa376576a3533ea55c13f95213e2d6e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 16 May 2024 14:48:45 +0200
Subject: [PATCH 155/458] This commit is the second part of the effort to make
 the list of currently active translators global.

The previous commit changed the driver to use them and adds the necessary infrastructure of managing them.
As before we want that in code such as:
```python
       @jit
       def foo(...):
              ...
       foo1 = foo.lower(...args1)
       # Modify the list of internal translators, i.e. call `add_subtranslator()`
       foo2 = foo.lower(...args2)
```
the second call to `lower()` uses the same translators as the first one.
What sounds simple is in fact relatively hard.
And we want that, in codes as
```
```python
       def foo(...):
              ...
       foo1 = jace.jit(foo)
       # Modify the list of internal translators, i.e. call `add_subtranslator()`
       foo2 = jace.jit(foo)
```
`foo1` and `foo2` use different translators as they where constructed differently.
As it is outlined inside in `JaceWrapped.__init__()`  the feature of "being able to manipulate the set of active translators from the outside of a `JaceWrapped` object" is not really useful and we thus forbid it.
As it is further outlined we _must_ make a copy (shallow copy is enough because the translators themselves are immutable) of the list of primitive translators that should be used, somewhere during the construction of a `JaceWrapped` object.
Which we do, for many reasons inside `JaceWrapped.__init__()`.

To include the set of used translators in the caching we use the address of the internal set of translators of the `JaceWrapped` object.
We can do this because we have by construction an immutable set, since we copied it at construction.
As an optimization, before we copy the set in `JaceWrapped.__init__()` we check if the set is the same as the global one (that is immutable).
This means that in situations such as:
```python
       def foo(A):
              ...
       foo1 = jace.jit(foo)(A)
       A[1, 2] = 0
       foo2 = jace.jit(foo)(A)
```
the code is only lowered once (this was not an intended design but a by product).
This captures the main use case in which the translators are set at the beginning and then never again.

We also included the Jax options to `jit`.
Currently we only really handle the case of no options, which is probably okay.
---
 src/jace/jax/api.py                      | 74 ++++++++++++------------
 src/jace/jax/stages/jace_wrapped.py      | 73 +++++++++++++++++++----
 src/jace/jax/stages/translation_cache.py | 49 ++++++++++++++--
 src/jace/translator/managing.py          |  2 +
 tests/test_decorator.py                  | 59 +++++++++++++++++++
 5 files changed, 201 insertions(+), 56 deletions(-)

diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
index dd3973e..6919f3b 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/jax/api.py
@@ -9,12 +9,12 @@
 
 from __future__ import annotations
 
-from collections.abc import Callable
+from collections.abc import Callable, Mapping
 from typing import Any
 
 import jax as _jax_jax
 
-from jace import jax as jjax, util
+from jace import jax as jjax, translator
 from jace.jax import api_helper
 
 
@@ -22,51 +22,51 @@
 def jit(
     fun: Callable | None = None,
     /,
+    sub_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
 ) -> jjax.JaceWrapped:
-    """Jace wrapper for `jax.jit`.
+    """Jace's replacement for `jax.jit` (just-in-time) wrapper.
 
-    Wraps the computation `fun` into a wrapped instance, that can either be traced or compiled.
-    For more information see `jace.jax.stages`.
+    It works the same way as `jax.jit` does, but instead of using XLA the computation is lowered to DaCe.
+    It supports the same arguments as `jax.jit` (although currently not) does.
+    In addition it accepts some Jace specific arguments.
+
+    Args:
+        sub_translators:    Use these subtranslators for the lowering to DaCe.
 
     Notes:
-        The function can either be used as decorator or as a command.
+        If no subtranslators are specified then the ones that are currently active,
+            i.e. the output of `get_subtranslators()`, are used.
+            After construction the set of subtranslators that are used by the wrapped object can not be changed.
     """
-    import jax
-    from jax._src import sharding_impls
-
-    if any(kwargs.get(arg, None) is not None for arg in ["static_argnums", "static_argnames"]):
-        raise NotImplementedError("Static arguments are not yet supported.")
     if any(kwargs.get(arg, None) is not None for arg in ["donate_argnums", "donate_argnames"]):
-        # Donated arguments are not yet (fully) supported, since they are more like a "hint"
-        #  to jax we will silently ignore them.
-        kwargs["donate_argnums"] = None
-        kwargs["donate_argnames"] = None
-    if any(
-        kwargs.get(x, sharding_impls.UNSPECIFIED) is not sharding_impls.UNSPECIFIED
-        for x in ["in_shardings", "out_shardings"]
-    ):
-        raise NotImplementedError("Sharding is not yet supported.")
-    if kwargs.get("device", None) is not None:
-        raise NotImplementedError("Selecting of device is not yet supported.")
-    if kwargs.get("backend", None) is not None:
-        raise NotImplementedError("Selecting of backend is not yet supported.")
+        # Donated arguments are not yet fully supported, the prototype supported something similar.
+        #  However, the documentation mentioned that they are only a hint, thus we ignore them.
+        kwargs.pop("donate_argnums", None)
+        kwargs.pop("donate_argnames", None)
+
+    if len(kwargs) != 0:
+        raise NotImplementedError(
+            f"The following arguments of 'jax.jit' are not yet supported by jace: {', '.join(kwargs.keys())}."
+        )
 
     # fmt: off
     if fun is None:
-        assert len(kwargs) > 0
+        # TODO: Is there an obscure case where it makes sense to copy `sub_translators`?
         def wrapper(f: Callable) -> jjax.JaceWrapped:
-            return jit(f, **kwargs)
+            return jit(f, sub_translators=sub_translators, **kwargs)
         return wrapper  # type: ignore[return-value]
     # fmt: on
 
-    if util.is_jaceified(fun):
-        return jit(fun.__wrapped__, **kwargs)
-    if len(kwargs) == 0:
-        # Prevents the creation of a level of unnecessary jit.
-        #  TODO(philmuell): Find a better way, probably better hijacking or `inline`.
-        return jjax.JaceWrapped(fun)
-    return jjax.JaceWrapped(jax.jit(fun, **kwargs))
+    # If no subtranslators were specified then use the ones that are currently installed.
+    if sub_translators is None:
+        sub_translators = translator.get_subtranslators()
+
+    return jjax.JaceWrapped(
+        fun=fun,
+        sub_translators=sub_translators,
+        jit_ops=kwargs,
+    )
 
 
 @api_helper.jax_wrapper(_jax_jax.pmap)
@@ -100,11 +100,9 @@ def vmap(
         "You are using the highly untested 'vamp' interface.",
         stacklevel=2,
     )
-    return jit(
-        _jax_jax.vmap(
-            fun,
-            **kwargs,
-        ),
+    return _jax_jax.vmap(
+        fun,
+        **kwargs,
     )
 
 
diff --git a/src/jace/jax/stages/jace_wrapped.py b/src/jace/jax/stages/jace_wrapped.py
index bc29f8d..2228e5c 100644
--- a/src/jace/jax/stages/jace_wrapped.py
+++ b/src/jace/jax/stages/jace_wrapped.py
@@ -10,7 +10,7 @@
 from __future__ import annotations
 
 import functools as ft
-from collections.abc import Callable
+from collections.abc import Callable, Mapping
 from typing import Any
 
 import jax as jax_jax
@@ -18,7 +18,7 @@
 from jace import translator, util
 from jace.jax import stages
 from jace.jax.stages import translation_cache as tcache
-from jace.translator import post_translation as ptrans
+from jace.translator import managing, post_translation as ptrans
 
 
 class JaceWrapped(stages.Stage):
@@ -28,17 +28,19 @@ class JaceWrapped(stages.Stage):
     Calling it results in jit (just-in-time) lowering, compilation, and execution.
     It can also be explicitly lowered prior to compilation, and the result compiled prior to execution.
 
+    You should not create `JaceWrapped` instances directly, instead you should use `jace.jit`.
+
     Notes:
-        Reimplementation of `jax.stages.Wrapped` protocol.
-        Function wrapped by this class are again tracable by Jax.
+        The wrapped function is accessible through the `__wrapped__` property.
 
     Todo:
         Handles pytrees.
-        Configuration of the driver?
         Copy the `jax._src.pjit.make_jit()` functionality to remove `jax.make_jaxpr()`.
     """
 
     _fun: Callable
+    _sub_translators: Mapping[str, translator.PrimitiveTranslator]
+    _jit_ops: Mapping[str, Any]
 
     # Managed by the caching infrastructure and only defined during `lower()`.
     #  If defined it contains an abstract description of the function arguments.
@@ -50,15 +52,58 @@ class JaceWrapped(stages.Stage):
     def __init__(
         self,
         fun: Callable,
+        sub_translators: Mapping[str, translator.PrimitiveTranslator],
+        jit_ops: Mapping[str, Any],
     ) -> None:
-        """Creates a wrapped jace jitable object of `jax_prim`."""
-        assert fun is not None
-        self._fun: Callable = fun
+        """Creates a wrapped jace jitable object of `jax_prim`.
+
+        You should not create `JaceWrapped` instances directly, instead you should use `jace.jit`.
+
+        Args:
+            fun:                The function that is wrapped.
+            sub_translators:    The list of subtranslators that that should be used.
+            jit_ops:            All options that we forward to `jax.jit`.
+
+        Notes:
+            Both the `sub_translators` and `jit_ops` are shallow copied.
+        """
 
         # Makes that `self` is a true stand-in for `fun`
-        #  This will also add a `__wrapped__` property to `self` which is not part of the interface.
-        # TODO(phimuell): modify text to make it clear that it is wrapped, Jax does the same.
-        ft.update_wrapper(self, self._fun)
+        self._fun: Callable = fun
+        ft.update_wrapper(self, self._fun)  # TODO(phimuell): modify text; Jax does the same.
+
+        # Why do we have to make a copy (shallow copy is enough as the translators themselves are immutable)?
+        #  The question is a little bit tricky so let's consider the following situation:
+        #  The user has created a Jace annotated function, and calls it, which leads to lowering and translation.
+        #  Then he goes on and in the process modifies the internal list of translators.
+        #  Then he calls the same annotated function again, then in case the arguments happens to be structurally the same,
+        #  lowering and translation will be skipped if the call is still inside the cache, this is what Jax does.
+        #  However, if they are different (or a cache eviction has happened), then tracing and translation will happen again.
+        #  Thus depending on the situation the user might get different behaviour.
+        #  In my expectation, Jace should always do the same thing, i.e. being deterministic, but what?
+        #  In my view, the simplest one and the one that is most functional is, to always use the translators,
+        #  that were _passed_ (although implicitly) at construction, making it independent on the global state.
+        #  One could argue, that the "dynamical modification of the translator list from the outside" is an actual legitimate use case, however, it is not.
+        #  Since `JaceWrapped.lower()` is cached, we would have to modify the caching to include the dynamic state of the set.
+        #  Furthermore, we would have to implement to make a distinction between this and the normal use case.
+        #  Thus we simply forbid it! If this is desired use `jace.jit()` as function to create an object dynamically.
+        # We could either here or in `jace.jit` perform the copy, but since `jace.jit` is at the end
+        #  just a glorified constructor and "allowing dynamic translator list" is not a use case, see above, we do it here.
+        #
+        # Because we know that the global state is immutable, we must not copy in this case.
+        #  See also `make_call_description()` in the cache implementation.
+        if sub_translators is managing._CURRENT_SUBTRANSLATORS_VIEW:
+            self._sub_translators = sub_translators
+        else:
+            # Note this is the canonical way to shallow copy a mapping since `Mapping` does not has `.copy()`
+            # and `copy.copy()` can not handle `MappingProxyType`.
+            self._sub_translators = dict(sub_translators)
+
+        # Following the same logic as above we should also copy `jit_ops`.
+        #  However, do we have to make a shallow copy or a deepcopy?
+        #  I looked at the Jax code and it seems that there is nothing that copies it,
+        #  so for now we will just go ahead and shallow copy it.
+        self._jit_ops = dict(jit_ops)
 
     def __call__(
         self,
@@ -73,6 +118,7 @@ def __call__(
         # TODO(phimuell): Handle the case of gradients:
         #                   It seems that this one uses special tracers, since they can handle comparisons.
         #                   https://jax.readthedocs.io/en/latest/notebooks/Common_Gotchas_in_JAX.html#python-control-flow-autodiff
+        # TODO(phimuell): Handle the `disable_jit` context manager of Jax.
 
         # TODO(phimuell): Handle static arguments correctly
         #                   https://jax.readthedocs.io/en/latest/aot.html#lowering-with-static-arguments
@@ -89,6 +135,9 @@ def lower(
         Performs the first two steps of the AOT steps described above,
         i.e. transformation into Jaxpr and then to SDFG.
         The result is encapsulated into a `Lowered` object.
+
+        Todo:
+            Add a context manager to disable caching.
         """
         if len(kwargs) != 0:
             raise NotImplementedError("Currently only positional arguments are supported.")
@@ -97,7 +146,7 @@ def lower(
         real_args: tuple[Any, ...] = args
 
         jaxpr = jax_jax.make_jaxpr(self._fun)(*real_args)
-        driver = translator.JaxprTranslationDriver()
+        driver = translator.JaxprTranslationDriver(sub_translators=self._sub_translators)
         trans_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
         ptrans.postprocess_jaxpr_sdfg(tsdfg=trans_sdfg, fun=self.__wrapped__)
         # The `JaceLowered` assumes complete ownership of `trans_sdfg`!
diff --git a/src/jace/jax/stages/translation_cache.py b/src/jace/jax/stages/translation_cache.py
index 08a4a57..d27dd72 100644
--- a/src/jace/jax/stages/translation_cache.py
+++ b/src/jace/jax/stages/translation_cache.py
@@ -210,9 +210,11 @@ class CachedCallDescription:
     This class represents both the `JaceWrapped.lower()` and `JaceLowered.compile()` calls.
 
     The actual key is composed of two parts, first the "origin of the call".
-    For the `JaceWrapped` this includes the wrapped callable, while for `JaceLowered` the lowered SDFG is used.
-    In both cases we rely on their `__hash__()` and `__eq__()` implementation, which should only involve the address.
-    Since we do not allow in place modification, this is not a problem, especially for the lowering.
+    For `JaceLowered` the lowered SDFG is used, because we assume immutability across the whole translation chain,
+    we relay on its built-in  `__hash__()` and `__eq__`, which fall back to their address.
+
+    For `JaceWrapped` objects the first part includes the wrapped function.
+    Then it also includes the addresses of the jit options and the set of used subtranslators.
 
     The second part is of the key are a description of the actual arguments, see `CallArgsDescription` type alias.
     There are two ways for describing the arguments:
@@ -227,10 +229,19 @@ class CachedCallDescription:
 
     Todo:
         - pytrees.
+        - Turn the references into week references, Jax does this and I am sure there is a reason for it.
+        - Turn this into a strategy.
     """
 
+    # Origin Part for `JaceWrapped`:
     fun: Callable | None
+    sub_trans_id: int | None
+    jit_ops_id: int | None
+
+    # Origin Part for `JaceLowered`:
     sdfg: dace.SDFG | None
+
+    # Argument Part of the key
     fargs: CallArgsDescription
 
     @classmethod
@@ -244,12 +255,30 @@ def make_call_description(
 
         if isinstance(stage, stages.JaceWrapped):
             # JaceWrapped.lower() to JaceLowered
-            fun = stage.__wrapped__
-            sdfg = None
 
             if len(kwargs) != 0:
                 raise NotImplementedError("'kwargs' are not implemented in 'JaceWrapped.lower()'.")
 
+            fun = stage.__wrapped__
+            sdfg = None
+
+            # We have to guard ourselves from the case of annotating the same function, but using different translators.
+            #  Thus we have to include the translators somehow in the cache description.
+            #  As outlined in `JaceWrapped.__init__()`, the list of subtranslators is copied by the constructor,
+            #  thus it is unique, and its address serves as a key.
+            #  The special design of the copying in `JaceWrapped.__init__()`, will not make a copy if the set is the current global set.
+            #  This design will cache most aggressively, if the subtranslator are set up at the beginning and then never again.
+            #  Which should also be the main use case.
+            # The best we could probably do is some kind of content hash, i.e. creating a sorted list of `(prim_name, id(prim_trans))` tuples.
+            #  However, this is relatively expensive and probably an overkill.
+            sub_trans_id = id(stage._sub_translators)
+
+            # From the discussion above it becomes clear that we also have to include the Jax options in the hash.
+            #  Currently `JaceWrapper.__init__()` shallow copies it, in the assumption that this is enough.
+            #  We could also do some kind of semantic hash, but currently we just cache on its address,
+            #  with the optimization that "supplying no options" is handled explicitly.
+            jit_ops_id = id(stage._jit_ops) if len(stage._jit_ops) != 0 else None
+
             # Currently we only allow positional arguments and no static arguments.
             #   Thus the function argument part of the key only consists of abstract arguments.
             fargs: tuple[_AbstarctCallArgument, ...] = tuple(
@@ -260,6 +289,8 @@ def make_call_description(
             # JaceLowered.compile() to JaceCompiled
             #  We do not have to deepcopy the sdfg, since we assume immutability.
             fun = None
+            sub_trans_id = None
+            jit_ops_id = None
             sdfg = stage.compiler_ir().sdfg
 
             #   We only accepts compiler options, which the Jax interface mandates
@@ -295,7 +326,9 @@ def make_call_description(
         else:
             raise TypeError(f"Can not make key from '{type(stage).__name__}'.")
 
-        return cls(fun=fun, sdfg=sdfg, fargs=fargs)
+        return cls(
+            fun=fun, sdfg=sdfg, sub_trans_id=sub_trans_id, jit_ops_id=jit_ops_id, fargs=fargs
+        )
 
 
 class TranslationCache:
@@ -402,3 +435,7 @@ def _evict(
         self._memory.move_to_end(key, last=False)
         self._memory.popitem(last=False)
         return True
+
+    def __repr__(self) -> str:
+        """Textual representation for debugging."""
+        return f"TranslationCache({len(self._memory)} / {self._size} || {', '.join( '[' + repr(k) + ']' for k in self._memory)})"
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index e3afc99..22250be 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -86,6 +86,8 @@ def add_subtranslators(
 
     # Now update the global variables.
     #  Doing it after the loop gives us exception guarantee
+    # TODO: We should consider creating some list of "subtranslators sets that are known to be stable"
+    #           i.e. where generated by this function, this would allow better caching in some situation.
     _CURRENT_SUBTRANSLATORS = new_CURRENT_SUBTRANSLATORS
     _CURRENT_SUBTRANSLATORS_VIEW = types.MappingProxyType(_CURRENT_SUBTRANSLATORS)
 
diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index 00b494b..2382f91 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -12,10 +12,15 @@
 
 from __future__ import annotations
 
+from collections.abc import MutableSequence, Sequence
+
+import dace
 import jax
 import numpy as np
+from jax import core as jax_core
 
 import jace
+from jace import translator
 
 
 def test_decorator_annotation():
@@ -116,6 +121,60 @@ def testee2_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     assert compiled2 is lowered1_size1.compile({"dummy_option": True})
 
 
+def test_decorator_double_annot():
+    """Tests the behaviour for double annotations."""
+    jax.config.update("jax_enable_x64", True)
+
+    lower_cnt = [0, 0]
+
+    def testee1(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        lower_cnt[0] += 1
+        return A * B
+
+    def testee2(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        lower_cnt[1] += 1
+        return A * B
+
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    jaceWrapped1_1 = jace.jit(testee1)
+    jaceWrapped1_2 = jace.jit(testee1)
+    assert jaceWrapped1_1 is not jaceWrapped1_2
+
+    # Lower them right after the other.
+    lower1_1 = jaceWrapped1_1.lower(A, B)
+    lower1_2 = jaceWrapped1_2.lower(A, B)
+    assert lower1_1 is lower1_2
+    assert (
+        lower_cnt[0] == 1
+    ), f"Annotated right after each other, but lowered {lower_cnt[0]} times instead of once."
+
+    # Now modify the state in between.
+    jaceWrapped2_1 = jace.jit(testee2)
+    lower2_1 = jaceWrapped2_1.lower(A, B)
+
+    @jace.translator.add_fsubtranslator("non_existing_primitive")
+    def non_existing_primitive_translator(
+        driver: translator.JaxprTranslationDriver,
+        in_var_names: Sequence[str | None],
+        out_var_names: MutableSequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> dace.SDFGState | None:
+        raise NotImplementedError
+
+    jaceWrapped2_2 = jace.jit(testee2)
+    lower2_2 = jaceWrapped2_2.lower(A, B)
+    assert lower2_1 is not lower2_2
+    assert lower_cnt[1] == 2
+
+    # Now lower 2_1 again, to see if there is really no influence.
+    lower2_1_ = jaceWrapped2_1.lower(A, B)
+    assert lower2_1_ is lower2_1
+    assert lower_cnt[1] == 2
+
+
 def test_decorator_sharing():
     """Tests if there is no false sharing in the cache."""
     jax.config.update("jax_enable_x64", True)

From 3c4fad35304d564f5bd5034737cbfc9f40b10a8d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 16 May 2024 15:25:43 +0200
Subject: [PATCH 156/458] Some cleanup.

---
 src/jace/util/compiling.py | 14 +++---
 src/jace/util/debug.py     | 97 --------------------------------------
 2 files changed, 7 insertions(+), 104 deletions(-)
 delete mode 100644 src/jace/util/debug.py

diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index f5daa71..85107fa 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -41,16 +41,16 @@ def compile_jax_sdfg(
     # This is a simplification that makes our life simply.
     #  However, we should consider lifting it at some point.
     if len(tsdfg.sdfg.free_symbols) != 0:
-        raise ValueError(
+        raise NotImplementedError(
             f"No externally defined symbols are allowed, found: {tsdfg.sdfg.free_symbols}"
         )
 
     # To ensure that the SDFG is compiled and to get rid of a warning we must modify
     #  some settings of the SDFG. To fake an immutable SDFG, we will restore them later.
-    sdfg: dace.SDFG = tsdfg.sdfg
-    org_sdfg_name: str = sdfg.name
-    org_recompile: bool = sdfg._recompile
-    org_regenerate_code: bool = sdfg._regenerate_code
+    sdfg = tsdfg.sdfg
+    org_sdfg_name = sdfg.name
+    org_recompile = sdfg._recompile
+    org_regenerate_code = sdfg._regenerate_code
 
     try:
         # We need to give the SDFG another name, this is needed to prevent a DaCe error/warning.
@@ -97,10 +97,10 @@ def run_jax_sdfg(
     """
     from dace.data import Array, Data, Scalar, make_array_from_descriptor
 
-    if len(inp_names) != len(cargs):
-        raise RuntimeError("Wrong number of arguments.")
     if len(ckwargs) != 0:
         raise NotImplementedError("No kwargs are supported yet.")
+    if len(inp_names) != len(cargs):
+        raise RuntimeError("Wrong number of arguments.")
 
     # We need the SDFG to construct/allocate the memory for the return values.
     #  Actually, we would only need the descriptors, but this is currently the only way to get them.
diff --git a/src/jace/util/debug.py b/src/jace/util/debug.py
deleted file mode 100644
index d4ae754..0000000
--- a/src/jace/util/debug.py
+++ /dev/null
@@ -1,97 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""This module contains functions for debugging the translator.
-
-Everything in this module is experimental and might vanish anytime.
-"""
-
-from __future__ import annotations
-
-from collections.abc import Callable
-from typing import Any
-
-import dace
-import jax
-
-from jace import translator
-
-
-def run_jax_sdfg(jsdfg: translator.TranslatedJaxprSDFG, *args: Any) -> tuple[Any, ...] | Any:
-    """Calls the SDFG that is encapsulated with the supplied arguments.
-
-    Notes:
-        Currently the SDFG must not have any undefined symbols, i.e. no undefined sizes.
-        Currently denoted arguments are not fully respected.
-        The function either returns a value or a tuple of values, i.e. no tree.
-    """
-    from dace.data import Array, Data, Scalar, make_array_from_descriptor
-
-    # This is a simplification that makes our life simply
-    if len(jsdfg.sdfg.free_symbols) != 0:
-        raise ValueError(
-            f"No externally defined symbols are allowed, found: {jsdfg.sdfg.free_symbols}"
-        )
-    if len(jsdfg.inp_names) != len(args):
-        raise ValueError(
-            f"Wrong numbers of arguments expected {len(jsdfg.inp_names)} got {len(args)}."
-        )
-
-    # We use a return by reference approach, for calling the SDFG
-    call_args: dict[str, Any] = {}
-    for in_name, in_val in zip(jsdfg.inp_names, args):
-        call_args[in_name] = in_val
-    for out_name in jsdfg.out_names:
-        sarray: Data = jsdfg.sdfg.arrays[out_name]
-        assert out_name not in call_args
-
-        if (out_name == "__return") or (out_name.startswith("__return_")):
-            continue
-        if isinstance(sarray, Scalar):
-            raise NotImplementedError("Scalars as return values are not supported.")
-        if isinstance(sarray, Array):
-            call_args[out_name] = make_array_from_descriptor(sarray)
-        else:
-            raise NotImplementedError(f"Can not handle '{type(sarray).__name__}' as output.")
-
-    # Canonical SDFGs do not have global memory, so we must transform it.
-    #  We will afterwards undo it.
-    for glob_name in jsdfg.inp_names + jsdfg.out_names:
-        jsdfg.sdfg.arrays[glob_name].transient = False
-
-    try:
-        csdfg: dace.CompiledSDFG = jsdfg.sdfg.compile()
-        with dace.config.temporary_config():
-            dace.Config.set("compiler", "allow_view_arguments", value=True)
-            csdfg(**call_args)
-
-        if len(jsdfg.out_names) == 0:
-            return None
-        ret_val: tuple[Any] = tuple(call_args[out_name] for out_name in jsdfg.out_names)
-        if len(jsdfg.out_names) == 1:
-            return ret_val[0]
-        return ret_val
-
-    finally:
-        for name in jsdfg.inp_names + jsdfg.out_names:
-            jsdfg.sdfg.arrays[name].transient = True
-
-
-def _jace_run(fun: Callable, *args: Any, **kwargs: Any) -> Any:
-    """Traces and run function `fun` using `Jax | DaCe`.
-
-    Args:
-        *args:      Forwarded to the tracing and final execution of the SDFG.
-        **kwargs:   Used to construct the driver.
-
-    Notes:
-        This function will be removed soon.
-    """
-    jaxpr = jax.make_jaxpr(fun)(*args)
-    driver = translator.JaxprTranslationDriver(**kwargs)
-    jsdfg = driver.translate_jaxpr(jaxpr)
-    return run_jax_sdfg(jsdfg, *args)

From 5923c003587a9f794fdce1965dd5049ab803d25e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 16 May 2024 15:29:23 +0200
Subject: [PATCH 157/458] More cleaning up, but that belongs to the PR.

---
 .../translator/jaxpr_translator_driver.py     | 58 +++++--------------
 src/jace/translator/managing.py               |  1 -
 src/jace/util/jax_helper.py                   | 42 ++------------
 src/jace/util/traits.py                       |  4 +-
 4 files changed, 19 insertions(+), 86 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 17fd2b9..85cea34 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -75,7 +75,7 @@ def __init__(
         Notes:
             `sub_translators` is not copied, thus the user has to guarantee,
                 that it will not change during translation.
-                It is highly advised but not requiered to use the output of
+                It is highly advised but not required to use the output of
                 `get_subtranslators()` or pass a copy as argument.
         """
 
@@ -106,7 +106,6 @@ def translate_jaxpr(
         inp_scalar_as_array: bool = False,
         name: str | None = None,
         reserved_names: str | Iterable[str] = (),
-        allow_empty_jaxpr: bool = False,
     ) -> translator.TranslatedJaxprSDFG:
         """Perform the translation of a Jaxpr into a SDFG.
 
@@ -122,19 +121,9 @@ def translate_jaxpr(
             inp_scalar_as_array:    Translate scalar _input_ arguments to arrays of length 1.
             name:                   Use this name for the SDFG instead some generated one.
             reserved_names:         Prevent the generation of variables with these names, see `self.add_array()` for more.
-            allow_empty_jaxpr:      Allows empty Jaxpr.
-
-        Notes:
-            Every time this function is called a new revision index is generated.
         """
-        if (len(jaxpr.eqns) == 0) and (not allow_empty_jaxpr):
-            raise ValueError("Passed an empty Jaxpr, but did not allow for empty Jaxpr.")
-        if not isinstance(jaxpr, jax_core.ClosedJaxpr):
-            raise TypeError(f"Expected a 'jax.core.ClosedJaxp' instance but got '{type(jaxpr)}'")
         if len(jaxpr.effects) != 0:
             raise NotImplementedError("'Jaxpr' with side effects are not supported.")
-        if len(jaxpr.out_avals) == 0:
-            raise ValueError("Jaxpr has zero output variables.")
         if not jax.config.read("jax_enable_x64"):
             raise NotImplementedError("The translation only works if 'jax_enable_x64' is enabled.")
 
@@ -165,7 +154,6 @@ def append_new_state(
         label: str | None = None,
         condition: dprop.CodeBlock | None = None,
         assignments: Mapping[str, Any] | None = None,
-        *,
         prev_state: dace.SDFGState | None = None,
     ) -> dace.SDFGState:
         """Creates a new `SDFGState` and adds it to the SDFG.
@@ -335,7 +323,7 @@ def add_jax_name_mapping(
             jax_var:     The Jax variable.
             sdfg_name:   The name of the corresponding SDFG variable.
         """
-        assert isinstance(sdfg_name, str) and (len(sdfg_name) > 0)  # noqa: PT018  # Should be one assertion.
+        assert len(sdfg_name) > 0
 
         if jax_var in self._jax_name_map:
             if self._jax_name_map[jax_var] == sdfg_name:  # noops.
@@ -362,10 +350,6 @@ def add_reserved_names(
             return self
         if isinstance(reserved_names, str):
             reserved_names = [reserved_names]
-        elif isinstance(reserved_names, Iterable):
-            pass
-        else:
-            raise TypeError(f"Does not know how to handle the type '{type(reserved_names)}'.")
         self._reserved_names.update(reserved_names)
         return self
 
@@ -424,9 +408,7 @@ def add_array(
             If you need to create a special array, you can use `jace.util.JaCeVar`
                 to create a pseudo Jax variable.
         """
-        assert self.is_allocated()
-
-        shape: Sequence[int] = util.get_jax_var_shape(arg)
+        shape: tuple[int] = util.get_jax_var_shape(arg)
         dtype = util.get_jax_var_dtype(arg)
         offset = None  # i.e. no offset
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
@@ -453,7 +435,6 @@ def add_array(
             find_new_name = False
             alt_name = util.propose_jax_name(arg, self._jax_name_map)
         if alt_name is not None:
-            assert isinstance(alt_name, str)
             find_new_name = False  # If a name was given, then use it no matter what.
             if len(alt_name) == 0:
                 raise ValueError("Passed an empty 'alt_name'.")
@@ -469,10 +450,8 @@ def add_array(
                 raise ValueError(
                     f"Specified 'name_prefix' ('{name_prefix}') but passed '{alt_name}' as 'alt_name'."
                 )
-        if name_prefix is not None:
-            assert isinstance(name_prefix, str)
-            if len(name_prefix) == 0:
-                raise ValueError("Specified an empty 'name_prefix'.")
+        if (name_prefix is not None) and (len(name_prefix) == 0):
+            raise ValueError("Specified an empty 'name_prefix'.")
 
         # Checking the strides.
         if strides is not None:
@@ -480,7 +459,8 @@ def add_array(
                 raise ValueError("Specified a stride for a scalar.")
             if isinstance(strides, (str, dace.symbol, int)):
                 strides = (strides,)
-            assert isinstance(strides, tuple)
+            elif not isinstance(strides, tuple):
+                strides = tuple(strides)
             if len(strides) != len(shape):
                 raise ValueError(
                     f"'strides' has length {len(strides)}, but array rank is {len(shape)}."
@@ -500,8 +480,6 @@ def add_array(
                 raise NotImplementedError("Jax Literals are not supported.")
             if alt_name is None:
                 raise ValueError(f"Passed literal '{arg}', but not specified a name to use.")
-        else:
-            raise TypeError(f"Does not know how to handle '{type(arg).__name__}'.")
 
         if alt_name is None:
             # If we are the root translator, then we will use `prop_name` directly;
@@ -624,7 +602,9 @@ def create_jax_var_list(  # type: ignore[misc]
         """
         if only_creation and prevent_creation:
             raise ValueError("Specified both 'only_creation' and 'prevent_creation'.")
-        assert "update_var_mapping" not in kwargs
+        assert (
+            "update_var_mapping" not in kwargs
+        ), "You can not pass 'update_var_mapping' as argument to 'create_jax_var_list()'."
 
         ret_list: list[None | str] = []
         for jax_var in jax_var_list:
@@ -632,7 +612,7 @@ def create_jax_var_list(  # type: ignore[misc]
                 if not handle_literals:
                     raise ValueError("Encountered a literal but `handle_literals` was `False`.")
                 sdfg_name = None
-            elif isinstance(jax_var, (jax_core.Var, util.JaCeVar)):
+            else:
                 mapped_sdfg_name: str | None = self.map_jax_var_to_sdfg(jax_var, allow_fail=True)
                 if (mapped_sdfg_name is None) and prevent_creation:
                     raise ValueError(f"'prevent_creation' given but have to create '{jax_var}'.")
@@ -644,8 +624,6 @@ def create_jax_var_list(  # type: ignore[misc]
                     sdfg_name = mapped_sdfg_name
                 # Calling `add_jax_name_mapping` is save, because if the mapping does already exists it is a no ops.
                 self.add_jax_name_mapping(jax_var, sdfg_name)
-            else:
-                raise TypeError(f"Does not know how to handle '{type(jax_var).__name__}'")
 
             ret_list.append(sdfg_name)
 
@@ -672,7 +650,6 @@ def _create_initial_input(
             raise RuntimeError("Driver is not allocated, can not create constants.")
         if len(self._ctx.inp_names) != 0:
             raise RuntimeError("Called '_create_initial_input()' twice?")
-        assert len(self._ctx.out_names) == 0
 
         # Handle the initial input arguments
         sdfg: dace.SDFG = self._ctx.sdfg
@@ -710,7 +687,7 @@ def _create_constants(
         if not self.is_allocated():
             raise RuntimeError("Driver is not allocated, can not create constants.")
         if len(jaxpr.consts) == 0:
-            return []
+            return ()
 
         sdfg_const_names: Sequence[str] = self.create_jax_var_list(
             jax_var_list=jaxpr.jaxpr.constvars,
@@ -831,9 +808,7 @@ def _translate_single_eqn(
         # Find the subtranslator
         prim_name: str = eqn.primitive.name
         if prim_name not in self._sub_translators:
-            raise NotImplementedError(
-                f"No subtranslators known to handle '{prim_name}' || {type(self._sub_translators)}."
-            )
+            raise NotImplementedError(f"No subtranslators known to handle '{prim_name}'.")
         subtranslator = self._sub_translators[prim_name]
 
         # Create the state into which the equation should be translated
@@ -857,11 +832,6 @@ def _translate_single_eqn(
             if eqn_state is not self._ctx.terminal_state:
                 raise RuntimeError("Inconsistent terminal state was detected.")
             new_sdfg_term_state = eqn_state
-        elif isinstance(new_sdfg_term_state, dace.SDFGState):
-            # TODO(phimuell): use `last_term_state` to test if `new_sdfg_term_state` is reachable.
-            pass
-        else:
-            raise TypeError(f"Encountered illegal types '{type(new_sdfg_term_state)}'")
 
         # In case a subtranslator decided to not use the variables we created for it, which is allowed
         #  but he must update the `out_var_names` list correctly, we will now verify this.
@@ -899,7 +869,7 @@ def _translate_jaxpr_internal(
                 Such variables are included by some transformations such as `grad()`.
         """
         nb_translated_eqn: int = 0
-        out_var_names: Sequence[str] = []
+        out_var_names: Sequence[str] = ()
 
         # Translate the equations one by one.
         for eqn in jaxpr.jaxpr.eqns:
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index 22250be..71167a3 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -152,7 +152,6 @@ def wrapper(real_fun: Callable) -> PrimitiveTranslator:
 
         return wrapper
 
-    assert inspect.isfunction(fun)
     if getattr(fun, "primitive", prim_name) != prim_name:
         raise ValueError(f"Passed 'fun' already '{fun.primitive}' as 'primitive' property.")  # type: ignore[attr-defined]
 
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 37f06ad..457c43d 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -16,7 +16,7 @@
 from __future__ import annotations
 
 import itertools
-from collections.abc import Mapping, Sequence
+from collections.abc import Mapping
 from dataclasses import dataclass
 from typing import Any, overload
 
@@ -56,36 +56,6 @@ def __eq__(self, other: Any) -> bool:
             return NotImplemented
         return id(self) == id(other)
 
-    @classmethod
-    def Create(
-        cls,
-        name: str,
-        shape: Sequence[int | dace.symbol | str] | int | dace.symbol | str,
-        dtype: Any,
-    ) -> JaCeVar:
-        """Creates a `JaCeVar` object.
-
-        Performs some sanity checks on the input.
-        It is also possible that `shape` can be an integer or symbol, that is then translated into an tuple.
-
-        Args:
-            name:       Name of the variable, might be empty.
-            shape:      The shape of the array.
-            dtype:      The datatype, will be transformed into a dace datatype.
-        """
-        if name == "":
-            pass  # Explicit allowed in the interface, but a bit strange.
-        elif (name != "_") and (not util.VALID_SDFG_VAR_NAME.fullmatch(name)):
-            raise ValueError(f"Passed an invalid name '{name}'.")
-        if isinstance(shape, (int, dace.symbol, str)):
-            shape = (shape,)
-        elif not isinstance(shape, tuple):
-            shape = tuple(shape)
-        if not isinstance(dtype, dace.typeclass):
-            dtype = translate_dtype(dtype)
-        assert all(isinstance(x, (int, dace.symbol, str)) for x in shape)
-        return cls(name=name, shape=shape, dtype=dtype)
-
 
 def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar | str) -> str:
     """Returns the name of the Jax variable as a string.
@@ -241,16 +211,12 @@ def propose_jax_name(
         raise RuntimeError(
             f"Can not propose a second name for '{jax_var}', it already known as '{jax_name_map[jax_var]}'."
         )
-    if isinstance(jax_var, jax_core.Var):
-        pass
-    elif isinstance(jax_var, JaCeVar):
+    if isinstance(jax_var, JaCeVar) and (jax_var.name != ""):
         # If the name of the JaCe variable is empty, then use the name proposing
         #  technique used for Jax variables; Mostly used for debugging.
-        if jax_var.name != "":
-            return jax_var.name
-    else:
-        raise TypeError(f"Can not propose a name for '{jax_var}'")
+        return jax_var.name
 
+    # This code is taken from the Jax source.
     c = len(jax_name_map)
     jax_name = ""
     while len(jax_name) == 0 or c != 0:
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 779a8dd..cc53328 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -86,9 +86,7 @@ def is_array(
     obj: Any,
 ) -> bool:
     """Identifies arrays, this also includes Jax arrays."""
-    if is_jax_array(obj):
-        return True
-    return dace.is_array(obj)
+    return is_jax_array(obj) or dace.is_array(obj)
 
 
 def is_on_device(

From 56a309e122a0045a0d501a1c13fea57f4458e8c7 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 16 May 2024 15:35:34 +0200
Subject: [PATCH 158/458] This commit partially add support for a global list
 of primitive translators.

This was Enrique's idea and it is really good, but it adds a lot of complexity.
For several reasons (mainly open PR) the commit is split into two parts one that can is merged into the PR (this one) and once that contains the parts that are development only.
Essentially we want allow code such as:
```python
       @jit
       def foo(...):
              ...
       foo1 = foo.lower(...args1)
       # Modify the list of internal translators, i.e. call `add_subtranslator()`
       foo2 = foo.lower(...args2)
```
because the list of translators is an implicit argument to the `jit` decorator, we expect that `foo2` is generated with the same translators as was `foo1`, see the next commit for a full description.
This commit essentially adds two things:
- the global list that stores the translator instances
- makes all necessary changes such that stuff works.

The managing of the global list is implemented such that it results in an immutable object.
Thus every time it is mutated a new list is created.
It might be a bit strange to do that, but the list is not changed that frequently (except upon loading) and it is only a shallow copy, since the translators are immutable themselves.
This approach allows some nice optimization further down.

For more information on the code see `jace.translator.managing.add_subtranslators`.
---
 pyproject.toml                                |   5 +-
 src/jace/__init__.py                          |  15 ++
 src/jace/translator/__init__.py               |   6 +-
 .../translator/jaxpr_translator_driver.py     |  92 ++-----
 src/jace/translator/managing.py               | 214 +++++++++++++----
 src/jace/translator/primitive_translator.py   |  31 +--
 .../primitive_translators/alu_translator.py   | 155 ++++++------
 tests/test_jaxpr_translator_driver.py         |  16 +-
 tests/test_subtranslator_helper.py            | 224 +++++++++++++-----
 9 files changed, 463 insertions(+), 295 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index fa01acb..737d9e1 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -65,7 +65,7 @@ warn_unused_ignores = true
 disallow_incomplete_defs = false
 disallow_untyped_defs = false
 ignore_missing_imports = true
-module = "tests.*"
+module = ["tests.*"]
 
 # -- pytest  --
 [tool.pytest]
@@ -149,7 +149,8 @@ section-order = [
 "!tests/**.py" = ["PT"]  # Ignore `flake8-pytest-style` everywhere except in `tests/`
 "noxfile.py" = ["T20"]  # Ignore `flake8-print`
 "tests/**" = [
-  "T10", # Ignore `flake8-debugger`
+  "T10",  # Ignore `flake8-debugger`
   "T20",  # Ignore `flake8-print`
   "F841",  # Ignore `unused-variable` (inside `with` to test if throws)
+  "ARG001"  # Ignore `unused function argument` (to create simple fake stand ins)
 ]
diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 9b44225..c28ce55 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -12,6 +12,21 @@
 from .__about__ import __author__, __copyright__, __license__, __version__, __version_info__
 
 
+def _ensure_build_in_translators_are_loaded() -> None:
+    # There is a chicken-egg problem, i.e. circular import, if we use the decorator to add the build in classes.
+    #  In order for the decorator to add the translators to the internal list, they have to be run, i.e. imported.
+    #  However, since they have to import the decorator, this would lead to a circular import.
+    #  To ensure that the built in translators are imported at the beginning, i.e. once Jace is loaded.
+    #  We define this function and call it and its only job is to load the subtranslaotrs.
+    #  However, this requires that all are imported by the `__init__.py` file.
+    # Too see that it is needed, remove this function and run `pytest tests/test_subtranslator_helper.py::test_are_subtranslators_imported`
+    from jace.translator import primitive_translators  # noqa: F401  # Unused import
+
+
+_ensure_build_in_translators_are_loaded()
+del _ensure_build_in_translators_are_loaded
+
+
 __all__ = [
     "__author__",
     "__copyright__",
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 22f3182..69600ae 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -10,7 +10,7 @@
 from __future__ import annotations
 
 from .jaxpr_translator_driver import JaxprTranslationDriver
-from .managing import add_subtranslator, get_subtranslators_cls
+from .managing import add_fsubtranslator, add_subtranslator, add_subtranslators, get_subtranslators
 from .primitive_translator import PrimitiveTranslator
 from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
@@ -20,5 +20,7 @@
     "PrimitiveTranslator",
     "TranslatedJaxprSDFG",
     "add_subtranslator",
-    "get_subtranslators_cls",
+    "add_subtranslators",
+    "add_fsubtranslator",
+    "get_subtranslators",
 ]
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index e319bb8..262b1c8 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -43,12 +43,16 @@ class JaxprTranslationDriver:
     Instead the request is forwarded to a `PrimitiveTranslator` object, also known as subtranslator.
     This is a highly specialized object that is able to handle one kind of primitive.
     For more information on the subtranslators see the documentation of `PrimitiveTranslator`.
+    The actual translators are supplied from the outside at construction time.
 
     To start a translation the `translate_jaxpr()` function should be called,
     if this happens it is said that the driver has an ongoing translation.
     If `translate_jaxpr()` is called on driver that has an ongoing translation, a new translation context will be set up.
     Thus the driver will then translate the supplied (nested) Jaxpr and return the result.
     However, this will have no influence on the translation process that is already going.
+
+    Notes:
+        The translator is able to handle multiple consecutive translations.
     """
 
     __slots__ = (
@@ -60,26 +64,24 @@ class JaxprTranslationDriver:
 
     def __init__(
         self,
-        **kwargs: Any,
+        sub_translators: Mapping[str, translator.PrimitiveTranslator],
     ) -> None:
-        """Creates the base translator.
+        """Creates the driver.
 
-        All arguments that does not start with an underscore are used as
-        arguments to construct the subtranslators.
+        Args:
+            sub_translators:    Use these subtranslators to perform the translation.
 
         Notes:
-            This function will not allocate the translation context of `self`
-                but will only allocate the shared members.
-            By setting `_no_shared_alloc` to `True` the function will not allocate
-                the shared part. This flag is provided only for implementing
-                `self.fork()` using it is an error and undefined behaviour.
+            `sub_translators` is not copied, thus the user has to guarantee,
+                that it will not change during translation.
+                It is highly advised but not requiered to use the output of
+                `get_subtranslators()` or pass a copy as argument.
         """
-        # Contains all the subtranslators that we need.
-        #  They are partitioned by the names of the primitive they have registered for.
-        #  This member is allocated by '_init_sub_translators()' and remains allocated
-        #  during the lifetime of the object.
-        self._sub_translators: dict[str, translator.PrimitiveTranslator] = None  # type: ignore[assignment]
-        self._init_sub_translators(kwargs)
+
+        # Shared with the outside, while key and mapped values are immutable,
+        #  the mapping itself is not, but it should be fine.
+        #  Allocated through the lifetime of `self`.
+        self._sub_translators: Mapping[str, translator.PrimitiveTranslator] = sub_translators
 
         # These names can not be used for the automatic naming of Jax variables.
         #  They differ from the forbidden names, that they denote valid SDFG names.
@@ -766,32 +768,6 @@ def _ctx(self) -> translator.TranslatedJaxprSDFG:
         assert len(self._ctx_stack) != 0, "No context is active."
         return self._ctx_stack[-1]
 
-    def _init_sub_translators(
-        self,
-        subtrans_args: Mapping[str, Any],
-    ) -> JaxprTranslationDriver:
-        """This function initializes the subtranslator.
-
-        The function forwards `kwargs` to the constructor of the subtranslators.
-        However, it will remove all arguments starting with an underscore.
-        """
-
-        subtrans_args = {k: v for k, v in subtrans_args.items() if not k.startswith("_")}
-        prim_translators: dict[str, translator.PrimitiveTranslator] = {}
-        for prim_translator_cls in translator.get_subtranslators_cls():
-            prim_translator: translator.PrimitiveTranslator = prim_translator_cls.build_translator(
-                **subtrans_args
-            )
-            handled_primitives: Iterable[str] = util.as_sequence(prim_translator.primitive)
-
-            for handled_primitive in handled_primitives:
-                if handled_primitive in prim_translators:
-                    raise RuntimeError(f"Multiple translators for '{handled_primitive}' found.")
-                prim_translators[handled_primitive] = prim_translator
-        self._sub_translators = prim_translators
-
-        return self
-
     def _clear_translation_ctx(self) -> JaxprTranslationDriver:
         """This function deallocate the translation context of `self`.
 
@@ -814,17 +790,6 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
             self._ctx_stack.pop()
         return self
 
-    def _find_sub_translator_for(
-        self,
-        eqn: jax_core.JaxprEqn,
-    ) -> translator.PrimitiveTranslator:
-        """Returns the appropriate subtranslator for equation `eqn`."""
-        prim_name: str = eqn.primitive.name
-        if prim_name not in self._sub_translators:
-            raise NotImplementedError(f"No subtranslators known to handle '{prim_name}'.")
-
-        return self._sub_translators[prim_name]
-
     def _translate_single_eqn(
         self,
         eqn: jax_core.JaxprEqn,
@@ -863,17 +828,22 @@ def _translate_single_eqn(
         )
 
         # Find the subtranslator
-        subtranslator: translator.PrimitiveTranslator = self._find_sub_translator_for(eqn)
+        prim_name: str = eqn.primitive.name
+        if prim_name not in self._sub_translators:
+            raise NotImplementedError(
+                f"No subtranslators known to handle '{prim_name}' || {type(self._sub_translators)}."
+            )
+        subtranslator = self._sub_translators[prim_name]
 
         # Create the state into which the equation should be translated
         last_term_state: dace.SDFGState = self.terminal_sdfg_state  # noqa: F841 # Will be used later
         eqn_state = self.append_new_state(
-            label=f"{eqn.primitive.name}_{out_var_names[0]}",
+            label=f"{eqn.primitive.name}_{'_'.join(out_var_names)}",
             prev_state=None,  # forces terminal state to use
         )
 
         # Now perform the actual translation of the equation.
-        new_sdfg_term_state = subtranslator.translate_jaxeqn(
+        new_sdfg_term_state = subtranslator(
             driver=self,
             in_var_names=in_var_names,
             out_var_names=out_var_names,  # Might be modified by the subtranslator!
@@ -945,18 +915,6 @@ def _translate_jaxpr_internal(
         # Set the output names inside the context.
         self._ctx.out_names = tuple(out_var_names)
 
-        return self._export_context()
-
-    def _export_context(self) -> translator.TranslatedJaxprSDFG:
-        """Encapsulate the translation context of `self` into a `TranslatedJaxprSDFG` object..
-
-        This function will not deallocate the internal context of `self`.
-        Thus `self` and the return value will share the same context in memory.
-        To free the context of `self` use `self._clear_translation_ctx()`.
-        """
-        assert self.is_allocated()
-        assert all((isinstance(x, str) and (len(x) > 0)) for x in self._ctx.inp_names)
-        assert all((isinstance(x, str) and (len(x) > 0)) for x in self._ctx.out_names)
         return self._ctx
 
     def _handle_null_jaxpr(
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index 589b446..e3afc99 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -4,79 +4,195 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
-"""Module for managing the individual sutranslators."""
+"""Module for managing the individual sutranslators.
+
+The high level idea is that there is a "list" of instances of `PrimitiveTranslator`,
+which is known as `_CURRENT_SUBTRANSLATORS`.
+If not specified the content of this list is used to perform the translation.
+"""
 
 from __future__ import annotations
 
-from collections.abc import Callable, Sequence
-from typing import Literal, overload
+import inspect
+import types
+from collections.abc import Callable, Mapping, MutableMapping
+from typing import TYPE_CHECKING, Literal, TypeAlias, cast, overload
 
-from jace import translator
 
+if TYPE_CHECKING:
+    from jace import translator
 
-# List of all primitive translators that are known to Jace.
-#  They are filled through the `add_subtranslator()` decorator.
-#  See also the note in `get_subtranslators_cls()`
-_KNOWN_SUBTRANSLATORS: list[type[translator.PrimitiveTranslator]] = []
+    # Type alias for distinguish between instances and classes.
+    PrimitiveTranslator: TypeAlias = (
+        type[translator.PrimitiveTranslator] | translator.PrimitiveTranslator | Callable
+    )
 
 
-@overload
-def add_subtranslator(
-    subtrans: Literal[None], /, overwrite: bool = False
-) -> Callable[[type[translator.PrimitiveTranslator]], type[translator.PrimitiveTranslator]]: ...
+# These are all currently used subtranslators that we are used.
+_CURRENT_SUBTRANSLATORS: dict[str, translator.PrimitiveTranslator] = {}
+_CURRENT_SUBTRANSLATORS_VIEW: types.MappingProxyType[str, translator.PrimitiveTranslator] = (
+    types.MappingProxyType(_CURRENT_SUBTRANSLATORS)
+)
 
 
-@overload
-def add_subtranslator(
-    subtrans: type[translator.PrimitiveTranslator], /, overwrite: bool = False
-) -> type[translator.PrimitiveTranslator]: ...
+def add_subtranslators(
+    *subtrans: PrimitiveTranslator | None,
+    overwrite: bool = False,
+) -> None:
+    """Adds many subtranslators in one step to Jace's internal list.
+
+    This function is more efficient if many translators should be added in one go.
+    Please refer to `add_subtranslator()` for more information.
+
+    Notes:
+        If an error during insertion happens the operation is considered a no ops.
+    """
+    from jace import translator  # Circular import
+
+    global _CURRENT_SUBTRANSLATORS
+    global _CURRENT_SUBTRANSLATORS_VIEW
+
+    if len(subtrans) == 0:
+        raise ValueError("Not passed any subtranslators.")
+
+    # Why do we do this kind of versioning here or versioning at all?
+    #  The cache has to include the set of used subtranslators somehow.
+    #  However, as explained in `JaceWrapped.__init__()` the function must make a copy of it.
+    #  One way would be to hash the content, i.e. `[(prim_name, id(prim_translator)), ...]`.
+    #  But a much simpler idea is to just consider its address, since in 99% of the cases,
+    #  the global list is used and not some user supplied list is used we do this versioning.
+    #  This allows `JaceWrapped.__init__()` to identify if the current global list of installed
+    #  translated is passed to it and it can then prevent the copying.
+    #  In the end a code like:
+    #       def foo(...): ...
+    #       foo1 = jace.jit(foo).lower()   # noqa: ERA001 commented out code
+    #       foo2 = jace.jit(foo).lower()   # noqa: ERA001
+    #  Should only lower once as it is seen in Jax.
+    new_CURRENT_SUBTRANSLATORS = _CURRENT_SUBTRANSLATORS.copy()
+
+    for prim_trans in subtrans:
+        # If it is a class instantiate it.
+        if inspect.isclass(prim_trans):
+            prim_trans = prim_trans()
+        prim_trans = cast(translator.PrimitiveTranslator, prim_trans)
+
+        # Test if we know the primitive already
+        prim_name: str = prim_trans.primitive
+        if (prim_name in _CURRENT_SUBTRANSLATORS) and (not overwrite):
+            raise ValueError(f"Tried to add a second translator for primitive '{prim_name}'.")
+
+        # Commit the change to a "staging"
+        new_CURRENT_SUBTRANSLATORS[prim_name] = prim_trans
+
+    # Now update the global variables.
+    #  Doing it after the loop gives us exception guarantee
+    _CURRENT_SUBTRANSLATORS = new_CURRENT_SUBTRANSLATORS
+    _CURRENT_SUBTRANSLATORS_VIEW = types.MappingProxyType(_CURRENT_SUBTRANSLATORS)
 
 
 def add_subtranslator(
-    subtrans: type[translator.PrimitiveTranslator] | None = None,
+    subtrans: PrimitiveTranslator | None = None,
     /,
     overwrite: bool = False,
-) -> (
-    type[translator.PrimitiveTranslator]
-    | Callable[[type[translator.PrimitiveTranslator]], type[translator.PrimitiveTranslator]]
-):
-    """Decorator to add `subtrans` to the list of known subtranslators.
-
-    If a class is tried to be registered twice an error will be generated unless, `overwrite` is set.
+) -> PrimitiveTranslator | Callable[[PrimitiveTranslator], PrimitiveTranslator]:
+    """Adds the subtranslator `subtrans` to Jace's internal list of translators.
+
+    If the primitive is already known an error is generated, however, if `overwrite` is given,
+    then `subtrans` will replace the current one.
+    In case `subtrans` is a class, the function will instantiate it first.
+    Thus, a class must be constructable without arguments.
+
+    Notes:
+        Calls to this function will never modify subtranslator lists previously obtained by `get_subtranslators()`!
+        Since `subtrans` is returned unmodified, this function can be used to annotate classes.
+        For annotating functions use `add_fsubtranslator()`.
+
+    Todo:
+        Accept many inputs for bulk update.
+        Add functions to clear them or restore the default ones.
     """
-    if subtrans is None:
 
+    if subtrans is None:
+        # It was used as decorator with some argument (currently `overwrite`).
         def wrapper(
-            real_subtrans: type[translator.PrimitiveTranslator],
-        ) -> type[translator.PrimitiveTranslator]:
+            real_subtrans: PrimitiveTranslator,
+        ) -> PrimitiveTranslator:
             return add_subtranslator(real_subtrans, overwrite=overwrite)
 
         return wrapper
 
-    if subtrans in _KNOWN_SUBTRANSLATORS:
-        if overwrite:
-            _KNOWN_SUBTRANSLATORS.remove(subtrans)
-        else:
-            raise ValueError(
-                f"Tried to add '{type(subtrans).__name__}' twice to the list of known primitive translators."
-            )
-
-    _KNOWN_SUBTRANSLATORS.append(subtrans)
+    # Forward the call to the bulk insertion.
+    #  And always return the original argument.
+    add_subtranslators(subtrans, overwrite=overwrite)
     return subtrans
 
 
-def get_subtranslators_cls() -> Sequence[type[translator.PrimitiveTranslator]]:
-    """Returns the list of all subtranslator known to JaCe.
+def add_fsubtranslator(
+    prim_name: str,
+    fun: Callable | None = None,
+    /,
+    overwrite: bool = False,
+) -> PrimitiveTranslator | Callable[[Callable], PrimitiveTranslator]:
+    """Convenience function to annotate function and turn them into a translator.
+
+    Adds the `primitive` property to `fun` and register it then as translator.
+
+    Notes:
+        Without this function you would had to define the translator function,
+            add the `primitive` property to it and then pass it to `add_subtranslator()`.
+            This function allows it to do in one step.
+    """
+
+    if fun is None:
+        # Annotated mode.
+        def wrapper(real_fun: Callable) -> PrimitiveTranslator:
+            return add_fsubtranslator(prim_name, real_fun, overwrite=overwrite)
+
+        return wrapper
+
+    assert inspect.isfunction(fun)
+    if getattr(fun, "primitive", prim_name) != prim_name:
+        raise ValueError(f"Passed 'fun' already '{fun.primitive}' as 'primitive' property.")  # type: ignore[attr-defined]
+
+    fun.primitive = prim_name  # type: ignore[attr-defined]
+    return add_subtranslator(fun, overwrite=overwrite)
+
+
+@overload
+def get_subtranslators(  # type: ignore[overload-overlap]
+    as_mutable: Literal[False] = False,
+) -> Mapping[str, translator.PrimitiveTranslator]: ...
+
+
+@overload
+def get_subtranslators(
+    as_mutable: Literal[True] = True,
+) -> MutableMapping[str, translator.PrimitiveTranslator]: ...
+
+
+def get_subtranslators(
+    as_mutable: bool = False,
+) -> (
+    Mapping[str, translator.PrimitiveTranslator]
+    | MutableMapping[str, translator.PrimitiveTranslator]
+):
+    """Returns a view of all _currently_ installed primitive translators in Jace.
+
+    By setting `as_mutable` to `True` the function will return a mutable mapping object.
+    However, in any case the returned mapping will not be affected by calls that modify
+    the internal list of registered primitive translators, i.e. `add_subtranslator()`.
 
-    The subtranslators are returned in FIFO order.
+    Notes:
+        If `as_mutable` is `False` the function will return an immutable view of the
+            registered primitive translator list, thus only a view is created.
+            However, if `as_mutable` is `True` a copy is returned.
     """
-    # There is a chicken-egg problem, i.e. circular import, if we use the decorator to add the build in classes.
-    #  The problem is, that they are only run, i.e. added to the list, upon importing.
-    #  Thus we have to explicitly import the subtranslator, but this would then lead to a circular import.
-    #  For that reason we import the subpackage here explicitly.
-    #  However, this requires that all are imported by the `__init__.py` file.
-    #  I do not know a way to do this better.
-    #  Actually I want to do it somehow upon the importation of `jace` itself.
-    from jace.translator import primitive_translators  # noqa: F401  # Unused import
-
-    return list(reversed(_KNOWN_SUBTRANSLATORS))
+    if as_mutable:
+        # The use case for this is, that a user wants to populate its own list and do some funky stuff.
+        #  Without this option, he would first have to make a mutable copy of the map manually,
+        #  every fucking time he wants it, so making an option is simpler.
+        return _CURRENT_SUBTRANSLATORS.copy()
+
+    # Since we do a versioning in `add_subtranslator()` we do not have to create a new view.
+    #  We can just return the global view, this is needed to fix some problems in the caching.
+    return _CURRENT_SUBTRANSLATORS_VIEW
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index fa717aa..2e00ed6 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -17,7 +17,7 @@
 
 from abc import abstractmethod
 from collections.abc import MutableSequence, Sequence
-from typing import Any, Protocol, runtime_checkable
+from typing import Protocol, runtime_checkable
 
 import dace
 from jax import core as jax_core
@@ -30,44 +30,25 @@ class PrimitiveTranslator(Protocol):
     """Interface for all Jax primitive translators, also known as subtranslator.
 
     A translator for a primitive translates a single equation of a Jaxpr into its SDFG equivalent.
-    A type that implements this interface must fulfil the following properties:
-    - It must be immutable after construction.
-    - All subclass must implement the class method `build_translator()` to construct an instance.
+    For satisfying this interface a concrete implementation must be immutable after construction.
 
     Subtranslators are simple, but highly specialized objects that are only able to perform the translation of a single primitive.
     The overall translation process itself is managed by a driver object, which also owns and manage the subtranslators.
     In the end this implements the delegation pattern.
 
-    After instantiation a driver calls the subtranslator's `get_handled_primitive()` method.
-    This function returns the name of the Jax primitive the subtranslator is able to handle.
-    In case a subtranslator is able to handle multiple primitives, it should return a list with their names.
-    While there is no limit to the numbers of primitive a subtranslator can register itself for,
-    only one subtranslator can be register for any primitive.
+    You can use `jace.translator.add_subtranslator()` to register your translator to Jace.
     """
 
     __slots__ = ()
 
-    @classmethod
-    @abstractmethod
-    def build_translator(
-        cls,
-        *args: Any,
-        **kwargs: Any,
-    ) -> PrimitiveTranslator:
-        """Creates an instance of a subtranslator."""
-        ...
-
     @property
     @abstractmethod
-    def primitive(self) -> str | Sequence[str]:
-        """Returns the names of the Jax primitive that `self` is able to handle.
-
-        In case `self` can handle multiple primitives, it should return a list with these names.
-        """
+    def primitive(self) -> str:
+        """Returns the name of the Jax primitive that `self` is able to handle."""
         ...
 
     @abstractmethod
-    def translate_jaxeqn(
+    def __call__(
         self,
         driver: translator.JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
diff --git a/src/jace/translator/primitive_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
index 9f7aa44..05ce3fe 100644
--- a/src/jace/translator/primitive_translators/alu_translator.py
+++ b/src/jace/translator/primitive_translators/alu_translator.py
@@ -20,77 +20,30 @@
 from jace import translator
 
 
-@translator.add_subtranslator
 class ALUTranslator(translator.PrimitiveTranslator):
-    """This translator handles all arithmetic and logical operations."""
-
-    __slots__ = ()
-
-    # Contains all translation templates for unary operations.
-    _unary_ops: Final[dict[str, str]] = {
-        "pos": "__out0 = +(__in0)",
-        "neg": "__out0 = -(__in0)",
-        "not": "__out0 = not (__in0)",
-        "floor": "__out0 = floor(__in0)",
-        "ceil": "__out0 = ceil(__in0)",
-        "round": "__out0 = round(__in0)",
-        "abs": "__out0 = abs(__in0)",
-        "sign": "__out0 = sign(__in0)",
-        "sqrt": "__out0 = sqrt(__in0)",
-        "log": "__out0 = log(__in0)",
-        "exp": "__out0 = exp(__in0)",
-        "integer_pow": "__out0 = (__in0)**({y})",  # 'y' is a parameter of the primitive
-        "sin": "__out0 = sin(__in0)",
-        "asin": "__out0 = asin(__in0)",
-        "cos": "__out0 = cos(__in0)",
-        "acos": "__out0 = acos(__in0)",
-        "tan": "__out0 = tan(__in0)",
-        "atan": "__out0 = atan(__in0)",
-        "tanh": "__out0 = tanh(__in0)",
-    }
-    # Transformation for all binary operations
-    _binary_ops: Final[dict[str, str]] = {
-        "add": "__out0 = (__in0)+(__in1)",
-        "add_any": "__out0 = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
-        "sub": "__out0 = (__in0)-(__in1)",
-        "mul": "__out0 = (__in0)*(__in1)",
-        "div": "__out0 = (__in0)/(__in1)",
-        "rem": "__out0 = (__in0)%(__in1)",
-        "and": "__out0 = (__in0) and (__in1)",
-        "or": "__out0 = (__in0) or  (__in1)",
-        "pow": "__out0 = (__in0)**(__in1)",
-        "ipow": "__out0 = (__in0)**(int(__in1))",
-        "min": "__out0 = min(__in0, __in1)",
-        "max": "__out0 = max(__in0, __in1)",
-        "eq": "__out0 = __in0 == __in1",
-        "ne": "__out0 = __in0 != __in1",
-        "ge": "__out0 = __in0 >= __in1",
-        "gt": "__out0 = __in0 > __in1",
-        "le": "__out0 = __in0 <= __in1",
-        "lt": "__out0 = __in0 < __in1",
-    }
-
-    @classmethod
-    def build_translator(
-        cls,
-        *args: Any,
-        **kwargs: Any,
-    ) -> ALUTranslator:
-        """Creates an `ALUTranslator` instance."""
-        return cls(*args, **kwargs)
-
-    def __init__(self, **kwargs: Any) -> None:
+    """This translator handles all arithmetic and logical operations.
+
+    This translator will be reworked soon, it just exists that the initial PR can do anything at all!!
+    """
+
+    __slots__ = ("_prim_name", "_prim_tmpl")
+
+    def __init__(
+        self,
+        prim_name: str,
+        prim_tmpl: str,
+    ) -> None:
         """Initialize the `ALUTranslator`."""
-        super().__init__(**kwargs)
+        self._prim_name = prim_name
+        self._prim_tmpl = prim_tmpl
 
     @property
     @override
-    def primitive(self) -> Sequence[str]:
-        """Returns the list of all known primitives."""
-        return list(self._unary_ops.keys()) + list(self._binary_ops.keys())
+    def primitive(self) -> str:
+        return self._prim_name
 
     @override
-    def translate_jaxeqn(
+    def __call__(
         self,
         driver: translator.JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
@@ -111,6 +64,7 @@ def translate_jaxeqn(
             eqn:            The Jax equation that is translated.
             eqn_state:      State into which the primitive's SDFG representation is constructed.
         """
+        assert self._prim_name == eqn.primitive.name
 
         # Determine what kind of input we got and how we should proceed.
         is_scalar = len(eqn.outvars[0].aval.shape) == 0
@@ -253,31 +207,8 @@ def _write_tasklet_code(
         Args:
             in_var_names:   The list of SDFG variables used as input.
         """
-        t_name = eqn.primitive.name
-        if t_name == "integer_pow":
-            # INTEGER POWER
-            exponent = int(eqn.params["y"])
-            if exponent == 0:
-                t_code = f"__out0 = dace.{eqn.outvars[0].aval.dtype!s}(1)"
-            elif exponent == 1:
-                t_code = "__out0 = __in0"
-            elif exponent == 2:
-                t_code = "__out0 = __in0 * __in0"
-            elif exponent == 3:
-                t_code = "__out0 = (__in0 * __in0) * __in0"
-            elif exponent == 4:
-                t_code = "__tmp0 = __in0 * __in0\n__out0 = __tmp0 * __tmp0"
-            elif exponent == 5:
-                t_code = "__tmp0 = __in0 * __in0\n__tmp1 = __tmp0 * __tmp0\n__out0 = __tmp1 * __in0"
-            else:
-                t_code = self._unary_ops[t_name]
 
-        else:
-            # GENERAL CASE
-            if t_name in self._unary_ops:
-                t_code = self._unary_ops[t_name]
-            elif t_name in self._binary_ops:
-                t_code = self._binary_ops[t_name]
+        t_code = self._prim_tmpl
 
         # Now we handle Literal substitution
         for i, in_var_name in enumerate(in_var_names):
@@ -308,3 +239,51 @@ def _list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
     The function will only include pairs whose key, i.e. first element is not `None`.
     """
     return {k: v for k, v in inp if k is not None}
+
+
+# Contains all the templates for ALU operations.
+_ALU_OPS_TMPL: Final[dict[str, str]] = {
+    # Unary operations
+    "pos": "__out0 = +(__in0)",
+    "neg": "__out0 = -(__in0)",
+    "not": "__out0 = not (__in0)",
+    "floor": "__out0 = floor(__in0)",
+    "ceil": "__out0 = ceil(__in0)",
+    "round": "__out0 = round(__in0)",
+    "abs": "__out0 = abs(__in0)",
+    "sign": "__out0 = sign(__in0)",
+    "sqrt": "__out0 = sqrt(__in0)",
+    "log": "__out0 = log(__in0)",
+    "exp": "__out0 = exp(__in0)",
+    "integer_pow": "__out0 = (__in0)**({y})",  # 'y' is a parameter of the primitive
+    "sin": "__out0 = sin(__in0)",
+    "asin": "__out0 = asin(__in0)",
+    "cos": "__out0 = cos(__in0)",
+    "acos": "__out0 = acos(__in0)",
+    "tan": "__out0 = tan(__in0)",
+    "atan": "__out0 = atan(__in0)",
+    "tanh": "__out0 = tanh(__in0)",
+    # Binary operations
+    "add": "__out0 = (__in0)+(__in1)",
+    "add_any": "__out0 = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
+    "sub": "__out0 = (__in0)-(__in1)",
+    "mul": "__out0 = (__in0)*(__in1)",
+    "div": "__out0 = (__in0)/(__in1)",
+    "rem": "__out0 = (__in0)%(__in1)",
+    "and": "__out0 = (__in0) and (__in1)",
+    "or": "__out0 = (__in0) or  (__in1)",
+    "pow": "__out0 = (__in0)**(__in1)",
+    "ipow": "__out0 = (__in0)**(int(__in1))",
+    "min": "__out0 = min(__in0, __in1)",
+    "max": "__out0 = max(__in0, __in1)",
+    "eq": "__out0 = __in0 == __in1",
+    "ne": "__out0 = __in0 != __in1",
+    "ge": "__out0 = __in0 >= __in1",
+    "gt": "__out0 = __in0 > __in1",
+    "le": "__out0 = __in0 <= __in1",
+    "lt": "__out0 = __in0 < __in1",
+}
+
+translator.add_subtranslators(
+    *[ALUTranslator(prim_name, prim_tmpl) for prim_name, prim_tmpl in _ALU_OPS_TMPL.items()]
+)
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 16cdfe3..7339525 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -15,7 +15,7 @@
 import pytest
 from dace.data import Array, Data, Scalar
 
-from jace import translator as jtrans
+from jace import translator
 from jace.util import JaCeVar
 
 
@@ -23,14 +23,14 @@
 def translation_driver():
     """Returns an allocated driver instance."""
     name = "fixture_driver"
-    driver = jtrans.JaxprTranslationDriver()
+    driver = translator.JaxprTranslationDriver(sub_translators=translator.get_subtranslators())
     driver._allocate_translation_ctx(name=name)
     return driver
 
 
 def test_driver_alloc() -> None:
     """Tests the state right after allocation."""
-    driver = jtrans.JaxprTranslationDriver()
+    driver = translator.JaxprTranslationDriver(sub_translators=translator.get_subtranslators())
     assert not driver.is_allocated(), "Driver was created allocated."
     assert len(driver._ctx_stack) == 0
 
@@ -55,7 +55,7 @@ def test_driver_nested() -> None:
     """
 
     # This is the parent driver.
-    driver = jtrans.JaxprTranslationDriver()
+    driver = translator.JaxprTranslationDriver(sub_translators=translator.get_subtranslators())
     assert not driver.is_allocated(), "Driver should not be allocated."
 
     # We allocate the driver directly, because we need to set some internals.
@@ -92,7 +92,7 @@ def test_driver_nested() -> None:
     assert driver._reserved_names is None
 
 
-def test_driver_append_state(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
+def test_driver_append_state(translation_driver: translator.JaxprTranslationDriver) -> None:
     """Tests the functionality of appending states."""
     sdfg: dace.SDFG = alloc_driver.sdfg
 
@@ -128,7 +128,7 @@ def test_driver_append_state(alloc_driver: jtrans.JaxprTranslationDriver) -> Non
     assert next(iter(sdfg.in_edges(non_terminal_state))).src is terminal_state_1
 
 
-def test_driver_scalar(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
+def test_driver_scalar(translation_driver: translator.JaxprTranslationDriver) -> None:
     """This function tests the array creation routines, especially the scalar part.
 
     However, it does so without using Jax variables.
@@ -241,7 +241,7 @@ def test_driver_scalar(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
     assert scal6_ == scal6_j.name
 
 
-def test_driver_array(alloc_driver: jtrans.JaxprTranslationDriver) -> None:
+def test_driver_array(translation_driver: translator.JaxprTranslationDriver) -> None:
     """This function tests the array creation routines.
 
     However, it does so without using Jax variables.
@@ -295,7 +295,7 @@ def test_driver_array2() -> None:
         - Literals.
     """
     # This is the parent driver.
-    driver = jtrans.JaxprTranslationDriver()
+    driver = translator.JaxprTranslationDriver(sub_translators=translator.get_subtranslators())
     assert not driver.is_allocated(), "Driver should not be allocated."
 
     # Creating JaCe Variables with empty names, forces the driver to use the
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index e50f9a5..d5885a3 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -10,97 +10,213 @@
 from __future__ import annotations
 
 import re
+from collections.abc import Mapping, MutableSequence, Sequence
+from inspect import isclass, isfunction
+from typing import Any
 
+import dace
+import jax
+import numpy as np
 import pytest
+from jax import core as jax_core
 
+import jace
 from jace import translator as jtrans
+from jace.translator import (
+    add_fsubtranslator,
+    add_subtranslator,
+    get_subtranslators,
+)
+
+
+@pytest.fixture(autouse=True)
+def _conserve_builtin_translators():
+    """Decorator that preserves the initial list of built in translators.
+
+    Todo:
+        Come up with something better/nicer.
+    """
+    initial_translators = get_subtranslators()
+    yield
+    jtrans.add_subtranslators(*initial_translators.values(), overwrite=True)
+
+
+def _dict_struct(dict_: Mapping[str, Any]) -> Sequence[tuple[str, int]]:
+    return tuple(sorted(((k, id(v)) for k, v in dict_.items()), key=lambda X: X[0]))
+
+
+def test_are_subtranslators_imported():
+    """Tests if something is inside the list of subtranslators."""
+    assert len(get_subtranslators()) > 1
 
 
 def test_subtranslatior_managing():
     """Ensures the functionality of the subtranslator managing."""
-    from jace.translator import (
-        add_subtranslator,
-        get_subtranslators_cls,
-    )
 
-    # These are all initial subtranslators
-    builtin_subtrans_cls = get_subtranslators_cls()
+    # TODO(phimuell): Make this more friendly; See blow
+    builtin_subtrans = get_subtranslators()
+    builin_struct = _dict_struct(builtin_subtrans)
 
-    # Definitions of some classes to help.
     class SubTrans1(jtrans.PrimitiveTranslator):
-        @classmethod
-        def build_translator(cls) -> SubTrans1:
-            return SubTrans1()
-
         @property
         def primitive(self):
             return "non_existing_primitive1"
 
-        def translate_jaxeqn(self) -> None:  # type: ignore[override]  # Arguments
-            return None
+        def __call__(self) -> None:  # type: ignore[override]  # Arguments
+            raise NotImplementedError
 
-    class SubTrans2(jtrans.PrimitiveTranslator):
-        @classmethod
-        def build_translator(cls) -> SubTrans2:
-            return SubTrans2()
+    # Ensures that we really return the object unmodified.
+    SubTrans1_ = add_subtranslator(SubTrans1)
+    assert isclass(SubTrans1_)
+    assert SubTrans1_ is SubTrans1
 
+    @add_subtranslator(overwrite=True)
+    class SubTrans2(jtrans.PrimitiveTranslator):
         @property
         def primitive(self):
             return "non_existing_primitive2"
 
-        def translate_jaxeqn(self) -> None:  # type: ignore[override]  # Arguments
-            return None
-
-    assert SubTrans1 != SubTrans2
-
-    # Adding the first subtranslator to the list.
-    add_subtranslator(SubTrans1)
+        def __call__(self) -> None:  # type: ignore[override]  # Arguments
+            raise NotImplementedError
+
+    assert isclass(SubTrans2)
+
+    @add_fsubtranslator("non_existing_primitive3")
+    def non_existing_primitive_translator_3(
+        driver: jtrans.JaxprTranslationDriver,
+        in_var_names: Sequence[str | None],
+        out_var_names: MutableSequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> dace.SDFGState | None:
+        raise NotImplementedError
+
+    assert isfunction(non_existing_primitive_translator_3)
+    assert non_existing_primitive_translator_3.primitive == "non_existing_primitive3"
+
+    curr1_subtrans = get_subtranslators()
+    curr1_subtrans_mod = get_subtranslators(as_mutable=True)
+    assert curr1_subtrans is not builtin_subtrans
+    assert curr1_subtrans is not curr1_subtrans_mod
+    assert _dict_struct(curr1_subtrans) != builin_struct
+    assert _dict_struct(curr1_subtrans) == _dict_struct(curr1_subtrans_mod)
+
+    for i in [1, 2, 3]:
+        pname = f"non_existing_primitive{i}"
+        assert pname in curr1_subtrans, f"Expected to find '{pname}'."
+        curr1_subtrans_mod.pop(pname)
+    assert builin_struct == _dict_struct(curr1_subtrans_mod)
+    assert curr1_subtrans is get_subtranslators()
+
+    # Try adding instance and if we can overwrite.
+    sub_trans1_instance = SubTrans1()
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=re.escape(
+            "Tried to add a second translator for primitive 'non_existing_primitive1'."
+        ),
+    ):
+        add_subtranslator(sub_trans1_instance, overwrite=False)
 
-    curr_subtrans_cls = get_subtranslators_cls()
-    assert len(curr_subtrans_cls) == len(builtin_subtrans_cls) + 1
-    assert all(
-        type(exp) == type(got)
-        for exp, got in zip([SubTrans1, *builtin_subtrans_cls], curr_subtrans_cls)
-    )
+    # Now adding it forcefully, this should also change a lot.
+    add_subtranslator(sub_trans1_instance, overwrite=True)
 
-    # Now adding the second subtranslator
-    add_subtranslator(SubTrans2)
+    curr2_subtrans = get_subtranslators()
+    assert curr2_subtrans is not builtin_subtrans
+    assert curr2_subtrans is not curr1_subtrans
+    assert _dict_struct(curr2_subtrans) != builin_struct
+    assert _dict_struct(curr2_subtrans) != _dict_struct(curr1_subtrans)
+    assert curr2_subtrans["non_existing_primitive1"] is sub_trans1_instance
 
-    curr_subtrans_cls2 = get_subtranslators_cls()
-    assert len(curr_subtrans_cls2) == len(builtin_subtrans_cls) + 2
-    assert [SubTrans2, SubTrans1, *builtin_subtrans_cls] == curr_subtrans_cls2
-    assert curr_subtrans_cls2 is not curr_subtrans_cls
+    # Try to answer a function as translator, that already has a primitive property.
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=re.escape("Passed 'fun' already 'non_existing_primitive3' as 'primitive' property."),
+    ):
+        add_fsubtranslator(
+            "non_existing_primitive1", non_existing_primitive_translator_3, overwrite=False
+        )
 
+    # This would work because it has the same primitive name, but it fails because overwrite is False
     with pytest.raises(
         expected_exception=ValueError,
         match=re.escape(
-            f"Tried to add '{type(SubTrans1).__name__}' twice to the list of known primitive translators."
+            "Tried to add a second translator for primitive 'non_existing_primitive3'."
         ),
     ):
-        add_subtranslator(SubTrans2)
+        add_fsubtranslator(
+            "non_existing_primitive3", non_existing_primitive_translator_3, overwrite=False
+        )
 
-    @add_subtranslator
-    class SubTrans3(jtrans.PrimitiveTranslator):
-        @classmethod
-        def build_translator(cls) -> SubTrans2:
-            return SubTrans2()
+    add_fsubtranslator(
+        "non_existing_primitive3", non_existing_primitive_translator_3, overwrite=True
+    )
+
+
+def test_subtranslatior_managing_2():
+    """Shows that we are really able to overwrite stuff"""
+    jax.config.update("jax_enable_x64", True)
 
+    @add_subtranslator(overwrite=True)
+    class NonAddTranslator(jtrans.PrimitiveTranslator):
         @property
         def primitive(self):
-            return "non_existing_primitive2"
+            return "add"
+
+        def __call__(self, *args, **kwargs) -> None:
+            raise NotImplementedError("The 'NonAddTranslator' can not translate anything.")
+
+    @jace.jit
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A + B
+
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    with pytest.raises(
+        expected_exception=NotImplementedError,
+        match=re.escape("The 'NonAddTranslator' can not translate anything."),
+    ):
+        _ = testee.lower(A, B)
+
 
-        def translate_jaxeqn(self) -> None:  # type: ignore[override]  # Arguments
-            return None
+def test_subtranslatior_managing_3():
+    """Shows proper decoupling."""
+    jax.config.update("jax_enable_x64", True)
 
-    curr_subtrans_cls3 = get_subtranslators_cls()
-    assert len(curr_subtrans_cls3) == len(builtin_subtrans_cls) + 3
-    assert [SubTrans3, SubTrans2, SubTrans1, *builtin_subtrans_cls] == curr_subtrans_cls3
+    class NonAddTranslator(jtrans.PrimitiveTranslator):
+        @property
+        def primitive(self):
+            return "add"
+
+        def __call__(self, *args, **kwargs) -> None:
+            raise NotImplementedError("The 'NonAddTranslator' can not translate anything at all.")
+
+    used_sub_trans = get_subtranslators(as_mutable=True)
+    used_sub_trans["add"] = NonAddTranslator()
+
+    @jace.jit(sub_translators=used_sub_trans)
+    def not_working_test(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A + B
+
+    # Now we again remove the add from the list, but this will not have an impact on the `not_working_test()`.
+    used_sub_trans.pop("add")
+
+    @jace.jit
+    def working_test(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A + B
+
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    with pytest.raises(
+        expected_exception=NotImplementedError,
+        match=re.escape("The 'NonAddTranslator' can not translate anything at all."),
+    ):
+        _ = not_working_test.lower(A, B)
 
-    # Adding version 1 again, but this time using overwrite
-    add_subtranslator(SubTrans1, overwrite=True)
-    curr_subtrans_cls4 = get_subtranslators_cls()
-    assert len(curr_subtrans_cls3) == len(curr_subtrans_cls4)
-    assert [SubTrans1, SubTrans3, SubTrans2, *builtin_subtrans_cls] == curr_subtrans_cls4
+    # This works because the
+    working_test.lower(A, B)
 
 
 if __name__ == "__main__":

From e0d5a527e845217beaa0efe905fff5844a4163d2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 16 May 2024 15:38:22 +0200
Subject: [PATCH 159/458] More cleaning up, but that belongs to the PR.

---
 .../translator/jaxpr_translator_driver.py     | 60 +++++--------------
 src/jace/translator/managing.py               |  1 -
 src/jace/util/jax_helper.py                   | 10 +---
 3 files changed, 18 insertions(+), 53 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 262b1c8..4e036c8 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -9,7 +9,7 @@
 
 import itertools
 from collections.abc import Iterable, Mapping, MutableSequence, Sequence
-from typing import Any, Final, cast, overload, Literal
+from typing import Any, Final, Literal, cast, overload
 
 import dace
 import jax
@@ -74,7 +74,7 @@ def __init__(
         Notes:
             `sub_translators` is not copied, thus the user has to guarantee,
                 that it will not change during translation.
-                It is highly advised but not requiered to use the output of
+                It is highly advised but not required to use the output of
                 `get_subtranslators()` or pass a copy as argument.
         """
 
@@ -105,7 +105,6 @@ def translate_jaxpr(
         inp_scalar_as_array: bool = False,
         name: str | None = None,
         reserved_names: str | Iterable[str] = (),
-        allow_empty_jaxpr: bool = False,
     ) -> translator.TranslatedJaxprSDFG:
         """Perform the translation of a Jaxpr into a SDFG.
 
@@ -121,19 +120,9 @@ def translate_jaxpr(
             inp_scalar_as_array:    Translate scalar _input_ arguments to arrays of length 1.
             name:                   Use this name for the SDFG instead some generated one.
             reserved_names:         Prevent the generation of variables with these names, see `self.add_array()` for more.
-            allow_empty_jaxpr:      Allows empty Jaxpr.
-
-        Notes:
-            Every time this function is called a new revision index is generated.
         """
-        if (len(jaxpr.eqns) == 0) and (not allow_empty_jaxpr):
-            raise ValueError("Passed an empty Jaxpr, but did not allow for empty Jaxpr.")
-        if not isinstance(jaxpr, jax_core.ClosedJaxpr):
-            raise TypeError(f"Expected a 'jax.core.ClosedJaxp' instance but got '{type(jaxpr)}'")
         if len(jaxpr.effects) != 0:
             raise NotImplementedError("'Jaxpr' with side effects are not supported.")
-        if len(jaxpr.out_avals) == 0:
-            raise ValueError("Jaxpr has zero output variables.")
         if not jax.config.read("jax_enable_x64"):
             raise NotImplementedError("The translation only works if 'jax_enable_x64' is enabled.")
 
@@ -164,7 +153,6 @@ def append_new_state(
         label: str | None = None,
         condition: dprop.CodeBlock | None = None,
         assignments: Mapping[str, Any] | None = None,
-        *,
         prev_state: dace.SDFGState | None = None,
     ) -> dace.SDFGState:
         """Creates a new `SDFGState` and adds it to the SDFG.
@@ -334,7 +322,7 @@ def add_jax_name_mapping(
             jax_var:     The Jax variable.
             sdfg_name:   The name of the corresponding SDFG variable.
         """
-        assert isinstance(sdfg_name, str) and (len(sdfg_name) > 0)  # noqa: PT018  # Should be one assertion.
+        assert len(sdfg_name) > 0
 
         if jax_var in self._ctx.jax_name_map:
             if self._ctx.jax_name_map[jax_var] == sdfg_name:  # noops.
@@ -361,10 +349,6 @@ def add_reserved_names(
             return self
         if isinstance(reserved_names, str):
             reserved_names = [reserved_names]
-        elif isinstance(reserved_names, Iterable):
-            pass
-        else:
-            raise TypeError(f"Does not know how to handle the type '{type(reserved_names)}'.")
         self._reserved_names.update(reserved_names)
         return self
 
@@ -423,9 +407,7 @@ def add_array(
             If you need to create a special array, you can use `jace.util.JaCeVar`
                 to create a pseudo Jax variable.
         """
-        assert self.is_allocated()
-
-        shape: Sequence[int] = util.get_jax_var_shape(arg)
+        shape: tuple[int] = util.get_jax_var_shape(arg)
         dtype = util.get_jax_var_dtype(arg)
         offset = None  # i.e. no offset
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
@@ -452,7 +434,6 @@ def add_array(
             find_new_name = False
             alt_name = util._propose_jax_name(arg, self._ctx.jax_name_map)
         if alt_name is not None:
-            assert isinstance(alt_name, str)
             find_new_name = False  # If a name was given, then use it no matter what.
             if len(alt_name) == 0:
                 raise ValueError("Passed an empty 'alt_name'.")
@@ -468,10 +449,8 @@ def add_array(
                 raise ValueError(
                     f"Specified 'name_prefix' ('{name_prefix}') but passed '{alt_name}' as 'alt_name'."
                 )
-        if name_prefix is not None:
-            assert isinstance(name_prefix, str)
-            if len(name_prefix) == 0:
-                raise ValueError("Specified an empty 'name_prefix'.")
+        if (name_prefix is not None) and (len(name_prefix) == 0):
+            raise ValueError("Specified an empty 'name_prefix'.")
 
         # Checking the strides.
         if strides is not None:
@@ -479,7 +458,8 @@ def add_array(
                 raise ValueError("Specified a stride for a scalar.")
             if isinstance(strides, (str, dace.symbol, int)):
                 strides = (strides,)
-            assert isinstance(strides, tuple)
+            elif not isinstance(strides, tuple):
+                strides = tuple(strides)
             if len(strides) != len(shape):
                 raise ValueError(
                     f"'strides' has length {len(strides)}, but array rank is {len(shape)}."
@@ -499,8 +479,6 @@ def add_array(
                 raise NotImplementedError("Jax Literals are not supported.")
             if alt_name is None:
                 raise ValueError(f"Passed literal '{arg}', but not specified a name to use.")
-        else:
-            raise TypeError(f"Does not know how to handle '{type(arg).__name__}'.")
 
         if alt_name is None:
             # If we are the root translator, then we will use `prop_name` directly;
@@ -623,7 +601,9 @@ def create_jax_var_list(  # type: ignore[misc]
         """
         if only_creation and prevent_creation:
             raise ValueError("Specified both 'only_creation' and 'prevent_creation'.")
-        assert "update_var_mapping" not in kwargs
+        assert (
+            "update_var_mapping" not in kwargs
+        ), "You can not pass 'update_var_mapping' as argument to 'create_jax_var_list()'."
 
         ret_list: list[None | str] = []
         for jax_var in jax_var_list:
@@ -631,7 +611,7 @@ def create_jax_var_list(  # type: ignore[misc]
                 if not handle_literals:
                     raise ValueError("Encountered a literal but `handle_literals` was `False`.")
                 sdfg_name = None
-            elif isinstance(jax_var, (jax_core.Var, util.JaCeVar)):
+            else:
                 mapped_sdfg_name: str | None = self.map_jax_var_to_sdfg(jax_var, allow_fail=True)
                 if (mapped_sdfg_name is None) and prevent_creation:
                     raise ValueError(f"'prevent_creation' given but have to create '{jax_var}'.")
@@ -643,8 +623,6 @@ def create_jax_var_list(  # type: ignore[misc]
                     sdfg_name = mapped_sdfg_name
                 # Calling `add_jax_name_mapping` is save, because if the mapping does already exists it is a no ops.
                 self.add_jax_name_mapping(jax_var, sdfg_name)
-            else:
-                raise TypeError(f"Does not know how to handle '{type(jax_var).__name__}'")
 
             ret_list.append(sdfg_name)
 
@@ -671,7 +649,6 @@ def _create_initial_input(
             raise RuntimeError("Driver is not allocated, can not create constants.")
         if len(self._ctx.inp_names) != 0:
             raise RuntimeError("Called '_create_initial_input()' twice?")
-        assert len(self._ctx.out_names) == 0
 
         # Handle the initial input arguments
         sdfg: dace.SDFG = self._ctx.sdfg
@@ -709,7 +686,7 @@ def _create_constants(
         if not self.is_allocated():
             raise RuntimeError("Driver is not allocated, can not create constants.")
         if len(jaxpr.consts) == 0:
-            return []
+            return ()
 
         sdfg_const_names: Sequence[str] = self.create_jax_var_list(
             jax_var_list=jaxpr.jaxpr.constvars,
@@ -830,9 +807,7 @@ def _translate_single_eqn(
         # Find the subtranslator
         prim_name: str = eqn.primitive.name
         if prim_name not in self._sub_translators:
-            raise NotImplementedError(
-                f"No subtranslators known to handle '{prim_name}' || {type(self._sub_translators)}."
-            )
+            raise NotImplementedError(f"No subtranslators known to handle '{prim_name}'.")
         subtranslator = self._sub_translators[prim_name]
 
         # Create the state into which the equation should be translated
@@ -856,11 +831,6 @@ def _translate_single_eqn(
             if eqn_state is not self._ctx.terminal_state:
                 raise RuntimeError("Inconsistent terminal state was detected.")
             new_sdfg_term_state = eqn_state
-        elif isinstance(new_sdfg_term_state, dace.SDFGState):
-            # TODO(phimuell): use `last_term_state` to test if `new_sdfg_term_state` is reachable.
-            pass
-        else:
-            raise TypeError(f"Encountered illegal types '{type(new_sdfg_term_state)}'")
 
         # In case a subtranslator decided to not use the variables we created for it, which is allowed
         #  but he must update the `out_var_names` list correctly, we will now verify this.
@@ -898,7 +868,7 @@ def _translate_jaxpr_internal(
                 Such variables are included by some transformations such as `grad()`.
         """
         nb_translated_eqn: int = 0
-        out_var_names: Sequence[str] = []
+        out_var_names: Sequence[str] = ()
 
         # Translate the equations one by one.
         for eqn in jaxpr.jaxpr.eqns:
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index e3afc99..e15769b 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -150,7 +150,6 @@ def wrapper(real_fun: Callable) -> PrimitiveTranslator:
 
         return wrapper
 
-    assert inspect.isfunction(fun)
     if getattr(fun, "primitive", prim_name) != prim_name:
         raise ValueError(f"Passed 'fun' already '{fun.primitive}' as 'primitive' property.")  # type: ignore[attr-defined]
 
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 0de9934..cd027d6 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -181,16 +181,12 @@ def _propose_jax_name(
         raise RuntimeError(
             f"Can not propose a second name for '{jax_var}', it already known as '{jax_name_map[jax_var]}'."
         )
-    if isinstance(jax_var, jax_core.Var):
-        pass
-    elif isinstance(jax_var, JaCeVar):
+    if isinstance(jax_var, JaCeVar) and (jax_var.name != ""):
         # If the name of the JaCe variable is empty, then use the name proposing
         #  technique used for Jax variables; Mostly used for debugging.
-        if jax_var.name != "":
-            return jax_var.name
-    else:
-        raise TypeError(f"Can not propose a name for '{jax_var}'")
+        return jax_var.name
 
+    # This code is taken from the Jax source.
     c = len(jax_name_map)
     jax_name = ""
     while len(jax_name) == 0 or c != 0:

From a95a843a7c59355f070d021351cb31da153f4dba Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 16 May 2024 15:42:35 +0200
Subject: [PATCH 160/458] Fixed the tests.

---
 src/jace/util/debug.py                |  5 +-
 tests/test_jaxpr_translator_driver.py | 64 ++++++++++++-------------
 tests/test_subtranslator_helper.py    | 69 ---------------------------
 3 files changed, 34 insertions(+), 104 deletions(-)

diff --git a/src/jace/util/debug.py b/src/jace/util/debug.py
index d4ae754..023b3a5 100644
--- a/src/jace/util/debug.py
+++ b/src/jace/util/debug.py
@@ -81,17 +81,16 @@ def run_jax_sdfg(jsdfg: translator.TranslatedJaxprSDFG, *args: Any) -> tuple[Any
             jsdfg.sdfg.arrays[name].transient = True
 
 
-def _jace_run(fun: Callable, *args: Any, **kwargs: Any) -> Any:
+def _jace_run(fun: Callable, *args: Any) -> Any:
     """Traces and run function `fun` using `Jax | DaCe`.
 
     Args:
         *args:      Forwarded to the tracing and final execution of the SDFG.
-        **kwargs:   Used to construct the driver.
 
     Notes:
         This function will be removed soon.
     """
     jaxpr = jax.make_jaxpr(fun)(*args)
-    driver = translator.JaxprTranslationDriver(**kwargs)
+    driver = translator.JaxprTranslationDriver(translator.get_subtranslators())
     jsdfg = driver.translate_jaxpr(jaxpr)
     return run_jax_sdfg(jsdfg, *args)
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 7339525..b00ee72 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -94,35 +94,35 @@ def test_driver_nested() -> None:
 
 def test_driver_append_state(translation_driver: translator.JaxprTranslationDriver) -> None:
     """Tests the functionality of appending states."""
-    sdfg: dace.SDFG = alloc_driver.sdfg
+    sdfg: dace.SDFG = translation_driver.sdfg
 
-    terminal_state_1: dace.SDFGState = alloc_driver.append_new_state("terminal_state_1")
+    terminal_state_1: dace.SDFGState = translation_driver.append_new_state("terminal_state_1")
     assert sdfg.number_of_nodes() == 2
     assert sdfg.number_of_edges() == 1
-    assert terminal_state_1 is alloc_driver.terminal_sdfg_state
-    assert alloc_driver.terminal_sdfg_state is alloc_driver._ctx.terminal_state
-    assert alloc_driver._ctx.start_state is sdfg.start_block
-    assert alloc_driver._ctx.start_state is not terminal_state_1
+    assert terminal_state_1 is translation_driver.terminal_sdfg_state
+    assert translation_driver.terminal_sdfg_state is translation_driver._ctx.terminal_state
+    assert translation_driver._ctx.start_state is sdfg.start_block
+    assert translation_driver._ctx.start_state is not terminal_state_1
     assert next(iter(sdfg.edges())).src is sdfg.start_block
     assert next(iter(sdfg.edges())).dst is terminal_state_1
 
     # Specifying an explicit append state that is the terminal should also update the terminal state of the driver.
-    terminal_state_2: dace.SDFGState = alloc_driver.append_new_state(
+    terminal_state_2: dace.SDFGState = translation_driver.append_new_state(
         "terminal_state_2", prev_state=terminal_state_1
     )
     assert sdfg.number_of_nodes() == 3
     assert sdfg.number_of_edges() == 2
-    assert terminal_state_2 is alloc_driver.terminal_sdfg_state
+    assert terminal_state_2 is translation_driver.terminal_sdfg_state
     assert sdfg.out_degree(terminal_state_1) == 1
     assert sdfg.out_degree(terminal_state_2) == 0
     assert sdfg.in_degree(terminal_state_2) == 1
     assert next(iter(sdfg.in_edges(terminal_state_2))).src is terminal_state_1
 
     # Specifying a previous node that is not the terminal state should not do anything.
-    non_terminal_state: dace.SDFGState = alloc_driver.append_new_state(
+    non_terminal_state: dace.SDFGState = translation_driver.append_new_state(
         "non_terminal_state", prev_state=terminal_state_1
     )
-    assert alloc_driver.terminal_sdfg_state is not non_terminal_state
+    assert translation_driver.terminal_sdfg_state is not non_terminal_state
     assert sdfg.in_degree(non_terminal_state) == 1
     assert sdfg.out_degree(non_terminal_state) == 0
     assert next(iter(sdfg.in_edges(non_terminal_state))).src is terminal_state_1
@@ -137,24 +137,24 @@ def test_driver_scalar(translation_driver: translator.JaxprTranslationDriver) ->
 
     # Creating a scalar.
     scal1_j = JaCeVar("scal1", (), dace.float64)
-    scal1_: str = alloc_driver.add_array(
+    scal1_: str = translation_driver.add_array(
         arg=scal1_j,
         update_var_mapping=True,
     )
-    scal1: Data = alloc_driver.get_array(scal1_)
-    assert scal1 is alloc_driver.get_array(scal1_j)
-    assert scal1_ == alloc_driver.map_jax_var_to_sdfg(scal1_j)
+    scal1: Data = translation_driver.get_array(scal1_)
+    assert scal1 is translation_driver.get_array(scal1_j)
+    assert scal1_ == translation_driver.map_jax_var_to_sdfg(scal1_j)
     assert isinstance(scal1, Scalar)
     assert scal1_ == scal1_j.name
     assert scal1.dtype == scal1_j.dtype
 
     # Create a scalar and force it as an array
     scal2_j = JaCeVar("scal2", (), dace.int64)
-    scal2_: str = alloc_driver.add_array(
+    scal2_: str = translation_driver.add_array(
         arg=scal2_j,
         force_array=True,
     )
-    scal2: Data = alloc_driver.get_array(scal2_)
+    scal2: Data = translation_driver.get_array(scal2_)
     assert isinstance(scal2, Array)
     assert scal2_ == scal2_j.name
     assert scal2.shape == (1,)
@@ -164,13 +164,13 @@ def test_driver_scalar(translation_driver: translator.JaxprTranslationDriver) ->
     # Using a special name for the variable
     scal3_j = JaCeVar("scal3", (), dace.int64)
     scal3_n = "scal3_special_name"
-    scal3_: str = alloc_driver.add_array(
+    scal3_: str = translation_driver.add_array(
         arg=scal3_j,
         alt_name=scal3_n,
         update_var_mapping=True,
     )
     assert scal3_ == scal3_n
-    assert scal3_ == alloc_driver.map_jax_var_to_sdfg(scal3_j)
+    assert scal3_ == translation_driver.map_jax_var_to_sdfg(scal3_j)
 
     # Test the prefix functionality
     scal4_j = JaCeVar("scal4", (), dace.float64)
@@ -182,13 +182,13 @@ def test_driver_scalar(translation_driver: translator.JaxprTranslationDriver) ->
             f"Specified 'name_prefix' ('{scal4_p}') but passed '{scal4_n}' as 'alt_name'."
         ),
     ):
-        scal4_: str = alloc_driver.add_array(
+        scal4_: str = translation_driver.add_array(
             arg=scal4_j,
             alt_name=scal4_n,
             name_prefix=scal4_p,
         )
     # Now create it correctly
-    scal4_ = alloc_driver.add_array(
+    scal4_ = translation_driver.add_array(
         arg=scal4_j,
         name_prefix=scal4_p,
     )
@@ -201,7 +201,7 @@ def test_driver_scalar(translation_driver: translator.JaxprTranslationDriver) ->
         expected_exception=ValueError,
         match="Specified a stride for a scalar.",
     ):
-        scal5_: str = alloc_driver.add_array(arg=scal5_j, strides=(3,))
+        scal5_: str = translation_driver.add_array(arg=scal5_j, strides=(3,))
 
     # test the force jax name feature
     scal6_j = JaCeVar("scal6", (), dace.float64)
@@ -211,7 +211,7 @@ def test_driver_scalar(translation_driver: translator.JaxprTranslationDriver) ->
         expected_exception=ValueError,
         match=f"Specified 'force_jax_name', but passed '{scal6_n}' as 'alt_name'.",
     ):
-        scal6_: str = alloc_driver.add_array(
+        scal6_: str = translation_driver.add_array(
             arg=scal6_j,
             alt_name=scal6_n,
             force_jax_name=True,
@@ -220,7 +220,7 @@ def test_driver_scalar(translation_driver: translator.JaxprTranslationDriver) ->
         expected_exception=ValueError,
         match=f"Specified 'force_jax_name', but passed '{scal6_np}' as 'name_prefix'.",
     ):
-        scal6_ = alloc_driver.add_array(
+        scal6_ = translation_driver.add_array(
             arg=scal6_j,
             name_prefix=scal6_np,
             force_jax_name=True,
@@ -229,12 +229,12 @@ def test_driver_scalar(translation_driver: translator.JaxprTranslationDriver) ->
         expected_exception=ValueError,
         match="Specified `force_jax_name` but also wanted a new name.",
     ):
-        scal6_ = alloc_driver.add_array(
+        scal6_ = translation_driver.add_array(
             arg=scal6_j,
             force_jax_name=True,
             find_new_name=True,
         )
-    scal6_ = alloc_driver.add_array(
+    scal6_ = translation_driver.add_array(
         arg=scal6_j,
         force_jax_name=True,
     )
@@ -248,10 +248,10 @@ def test_driver_array(translation_driver: translator.JaxprTranslationDriver) ->
     """
     # Allocating an array
     arr1_j = JaCeVar("arr1", (5, 3), dace.float32)
-    arr1_: str = alloc_driver.add_array(
+    arr1_: str = translation_driver.add_array(
         arg=arr1_j,
     )
-    arr1: Data = alloc_driver.get_array(arr1_)
+    arr1: Data = translation_driver.get_array(arr1_)
     assert isinstance(arr1, Array)
     assert arr1_ == arr1_j.name
     assert arr1.shape == arr1_j.shape
@@ -264,12 +264,12 @@ def test_driver_array(translation_driver: translator.JaxprTranslationDriver) ->
         expected_exception=ValueError,
         match=f"Can't create variable '{arr2_j.name}', variable is already created.",
     ):
-        arr2_: str = alloc_driver.add_array(arg=arr2_j)
+        arr2_: str = translation_driver.add_array(arg=arr2_j)
     with pytest.raises(expected_exception=ValueError, match=f"Variable '{arr1_}' already exists."):
         # `alt_name` will not work because name still exists.
-        arr2_ = alloc_driver.add_array(arg=arr2_j, alt_name=arr2_j.name)
+        arr2_ = translation_driver.add_array(arg=arr2_j, alt_name=arr2_j.name)
     # However, specifying `find_new_name` will solve this issue
-    arr2_ = alloc_driver.add_array(
+    arr2_ = translation_driver.add_array(
         arg=arr2_j,
         find_new_name=True,
     )
@@ -278,11 +278,11 @@ def test_driver_array(translation_driver: translator.JaxprTranslationDriver) ->
     # Create a variable that has a custom stride
     arr3_j = JaCeVar("arr3", (5, 1, 3), dace.float64)
     arr3_st = (5, 3, 2)
-    arr3_: str = alloc_driver.add_array(
+    arr3_: str = translation_driver.add_array(
         arg=arr3_j,
         strides=arr3_st,
     )
-    arr3: Data = alloc_driver.get_array(arr3_)
+    arr3: Data = translation_driver.get_array(arr3_)
     assert isinstance(arr3, Array)
     assert arr3.shape == arr3_j.shape
     assert arr3.strides == arr3_st
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index d5885a3..27baf97 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -15,12 +15,9 @@
 from typing import Any
 
 import dace
-import jax
-import numpy as np
 import pytest
 from jax import core as jax_core
 
-import jace
 from jace import translator as jtrans
 from jace.translator import (
     add_fsubtranslator,
@@ -153,71 +150,5 @@ def non_existing_primitive_translator_3(
     )
 
 
-def test_subtranslatior_managing_2():
-    """Shows that we are really able to overwrite stuff"""
-    jax.config.update("jax_enable_x64", True)
-
-    @add_subtranslator(overwrite=True)
-    class NonAddTranslator(jtrans.PrimitiveTranslator):
-        @property
-        def primitive(self):
-            return "add"
-
-        def __call__(self, *args, **kwargs) -> None:
-            raise NotImplementedError("The 'NonAddTranslator' can not translate anything.")
-
-    @jace.jit
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A + B
-
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
-
-    with pytest.raises(
-        expected_exception=NotImplementedError,
-        match=re.escape("The 'NonAddTranslator' can not translate anything."),
-    ):
-        _ = testee.lower(A, B)
-
-
-def test_subtranslatior_managing_3():
-    """Shows proper decoupling."""
-    jax.config.update("jax_enable_x64", True)
-
-    class NonAddTranslator(jtrans.PrimitiveTranslator):
-        @property
-        def primitive(self):
-            return "add"
-
-        def __call__(self, *args, **kwargs) -> None:
-            raise NotImplementedError("The 'NonAddTranslator' can not translate anything at all.")
-
-    used_sub_trans = get_subtranslators(as_mutable=True)
-    used_sub_trans["add"] = NonAddTranslator()
-
-    @jace.jit(sub_translators=used_sub_trans)
-    def not_working_test(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A + B
-
-    # Now we again remove the add from the list, but this will not have an impact on the `not_working_test()`.
-    used_sub_trans.pop("add")
-
-    @jace.jit
-    def working_test(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A + B
-
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
-
-    with pytest.raises(
-        expected_exception=NotImplementedError,
-        match=re.escape("The 'NonAddTranslator' can not translate anything at all."),
-    ):
-        _ = not_working_test.lower(A, B)
-
-    # This works because the
-    working_test.lower(A, B)
-
-
 if __name__ == "__main__":
     test_subtranslatior_managing()

From bdaf93727048a3ff2e5f503f67dc8ae384cfba95 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 07:38:22 +0200
Subject: [PATCH 161/458] Fixed the `__wrapper__` inconsistency.

The solution, I only partially like, is to create a new property in the `JaceWrapped` object.
Furthermore the object is no longer annotated inside the constructor, but inside `jit`.
This makes more sense since `jit` is a wrapper while `JaceWrapped` is essentially a carrier.
---
 src/jace/jax/api.py                      |  4 +++-
 src/jace/jax/stages/jace_wrapped.py      | 29 ++++++++++++------------
 src/jace/jax/stages/translation_cache.py |  2 +-
 3 files changed, 19 insertions(+), 16 deletions(-)

diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
index 6919f3b..79a067a 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/jax/api.py
@@ -11,6 +11,7 @@
 
 from collections.abc import Callable, Mapping
 from typing import Any
+import functools as ft
 
 import jax as _jax_jax
 
@@ -62,11 +63,12 @@ def wrapper(f: Callable) -> jjax.JaceWrapped:
     if sub_translators is None:
         sub_translators = translator.get_subtranslators()
 
-    return jjax.JaceWrapped(
+    wrapper = jjax.JaceWrapped(
         fun=fun,
         sub_translators=sub_translators,
         jit_ops=kwargs,
     )
+    return ft.wraps(fun)(wrapper)
 
 
 @api_helper.jax_wrapper(_jax_jax.pmap)
diff --git a/src/jace/jax/stages/jace_wrapped.py b/src/jace/jax/stages/jace_wrapped.py
index 2228e5c..433bc8a 100644
--- a/src/jace/jax/stages/jace_wrapped.py
+++ b/src/jace/jax/stages/jace_wrapped.py
@@ -9,7 +9,6 @@
 
 from __future__ import annotations
 
-import functools as ft
 from collections.abc import Callable, Mapping
 from typing import Any
 
@@ -30,9 +29,6 @@ class JaceWrapped(stages.Stage):
 
     You should not create `JaceWrapped` instances directly, instead you should use `jace.jit`.
 
-    Notes:
-        The wrapped function is accessible through the `__wrapped__` property.
-
     Todo:
         Handles pytrees.
         Copy the `jax._src.pjit.make_jit()` functionality to remove `jax.make_jaxpr()`.
@@ -67,10 +63,7 @@ def __init__(
         Notes:
             Both the `sub_translators` and `jit_ops` are shallow copied.
         """
-
-        # Makes that `self` is a true stand-in for `fun`
         self._fun: Callable = fun
-        ft.update_wrapper(self, self._fun)  # TODO(phimuell): modify text; Jax does the same.
 
         # Why do we have to make a copy (shallow copy is enough as the translators themselves are immutable)?
         #  The question is a little bit tricky so let's consider the following situation:
@@ -112,17 +105,20 @@ def __call__(
     ) -> Any:
         """Executes the wrapped function, lowering and compiling as needed in one step."""
 
+        # TODO(phimuell): Handle the `disable_jit` context manager of Jax.
+
         # This allows us to be composable with Jax transformations.
         if util.is_tracing_ongoing(*args, **kwargs):
-            return self.__wrapped__(*args, **kwargs)
-        # TODO(phimuell): Handle the case of gradients:
-        #                   It seems that this one uses special tracers, since they can handle comparisons.
-        #                   https://jax.readthedocs.io/en/latest/notebooks/Common_Gotchas_in_JAX.html#python-control-flow-autodiff
-        # TODO(phimuell): Handle the `disable_jit` context manager of Jax.
+            # TODO(phimuell): Handle the case of gradients:
+            #                   It seems that this one uses special tracers, since they can handle comparisons.
+            #                   https://jax.readthedocs.io/en/latest/notebooks/Common_Gotchas_in_JAX.html#python-control-flow-autodiff
+            return self._fun(*args, **kwargs)
 
         # TODO(phimuell): Handle static arguments correctly
         #                   https://jax.readthedocs.io/en/latest/aot.html#lowering-with-static-arguments
-        return self.lower(*args, **kwargs).compile()(*args, **kwargs)
+        lowered = self.lower(*args, **kwargs)
+        compiled = lowered.compile()
+        return compiled(*args, **kwargs)
 
     @tcache.cached_translation
     def lower(
@@ -148,6 +144,11 @@ def lower(
         jaxpr = jax_jax.make_jaxpr(self._fun)(*real_args)
         driver = translator.JaxprTranslationDriver(sub_translators=self._sub_translators)
         trans_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
-        ptrans.postprocess_jaxpr_sdfg(tsdfg=trans_sdfg, fun=self.__wrapped__)
+        ptrans.postprocess_jaxpr_sdfg(tsdfg=trans_sdfg, fun=self.wrapped_fun)
         # The `JaceLowered` assumes complete ownership of `trans_sdfg`!
         return stages.JaceLowered(trans_sdfg)
+
+    @property
+    def wrapped_fun(self) -> Callable:
+        """Returns the wrapped function."""
+        return self._fun
diff --git a/src/jace/jax/stages/translation_cache.py b/src/jace/jax/stages/translation_cache.py
index d27dd72..184dfe8 100644
--- a/src/jace/jax/stages/translation_cache.py
+++ b/src/jace/jax/stages/translation_cache.py
@@ -259,7 +259,7 @@ def make_call_description(
             if len(kwargs) != 0:
                 raise NotImplementedError("'kwargs' are not implemented in 'JaceWrapped.lower()'.")
 
-            fun = stage.__wrapped__
+            fun = stage.wrapped_fun
             sdfg = None
 
             # We have to guard ourselves from the case of annotating the same function, but using different translators.

From 927c375e3990d9636e88a745a985cc8eddb18f2b Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 07:42:33 +0200
Subject: [PATCH 162/458] Updated the wrapper function.

---
 src/jace/jax/api.py        |  4 ++--
 src/jace/jax/api_helper.py | 32 +++++++++++++++++++++++++-------
 tests/test_decorator.py    |  5 -----
 3 files changed, 27 insertions(+), 14 deletions(-)

diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
index 79a067a..394ac93 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/jax/api.py
@@ -9,9 +9,9 @@
 
 from __future__ import annotations
 
+import functools as ft
 from collections.abc import Callable, Mapping
 from typing import Any
-import functools as ft
 
 import jax as _jax_jax
 
@@ -19,7 +19,7 @@
 from jace.jax import api_helper
 
 
-@api_helper.jax_wrapper(_jax_jax.jit)
+@api_helper.jax_wrapper(_jax_jax.jit, rewriting=False)
 def jit(
     fun: Callable | None = None,
     /,
diff --git a/src/jace/jax/api_helper.py b/src/jace/jax/api_helper.py
index fbc441f..bc7162e 100644
--- a/src/jace/jax/api_helper.py
+++ b/src/jace/jax/api_helper.py
@@ -16,22 +16,40 @@
 
 def jax_wrapper(
     jax_fun: Callable,
-    fun: Callable | None = None,
+    jace_fun: Callable | None = None,
     /,
+    rewriting: bool = True,
     **kwargs: Any,
 ) -> Callable:
-    """Creates a wrapper function for"""
+    """Creates a wrapper to encapsulate Jax in Jace functions.
+
+    A replacement for `functools.wraps` but for the special
+    case that a Jace function should replace a Jax function.
+
+    Args:
+        rewriting:      Replace 'JAX' with 'JaCe' in the doc string.
+
+    Todo:
+        Improve.
+    """
 
     # fmt: off
-    if fun is None:
-        def _inner_jax_wrapper(fun: Callable) -> Callable:
-            return jax_wrapper(jax_fun, fun, **kwargs)
+    if jace_fun is None:
+        def _inner_jax_wrapper(jace_fun_: Callable) -> Callable:
+            return jax_wrapper(jax_fun, jace_fun_, **kwargs)
         return _inner_jax_wrapper
     # fmt: on
 
+    # This function creates the `__wrapped__` property, that I do not want
+    #  So we have to replace it, I think we should consider using the one of Jax.
     ft.update_wrapper(
-        wrapper=fun,
+        wrapper=jace_fun,
         wrapped=jax_fun,
         **kwargs,
     )
-    return fun
+
+    if rewriting:
+        # TODO(phimuell): Handle web addresses, code example and more.
+        jace_fun.__doc__ = jace_fun.__doc__.replace("JAX", "JaCe")
+
+    return jace_fun
diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index 2382f91..a1cba33 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -23,11 +23,6 @@
 from jace import translator
 
 
-def test_decorator_annotation():
-    """Tests the annotation, essential `jace.jax.api_helper.jax_wrapper`."""
-    assert jax.jit.__doc__ == jace.jit.__doc__
-
-
 def test_decorator_individually():
     """Tests the compilation steps individually."""
     jax.config.update("jax_enable_x64", True)

From d91acd06a9e3085382f25bc52254cede88c26753 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 09:23:26 +0200
Subject: [PATCH 163/458] Added a function to identify scalars.

---
 src/jace/util/__init__.py |  2 ++
 src/jace/util/traits.py   | 33 +++++++++++++++++++++++++++++++++
 2 files changed, 35 insertions(+)

diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index eb8e624..aaff453 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -31,6 +31,7 @@
     is_jaxified,
     is_non_string_iterable,
     is_on_device,
+    is_scalar,
 )
 from .util import (
     VALID_JAX_VAR_NAME,
@@ -54,6 +55,7 @@
     "is_fully_addressable",
     "is_non_string_iterable",
     "is_on_device",
+    "is_scalar",
     "get_jax_var_name",
     "get_jax_var_shape",
     "get_jax_var_dtype",
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index cc53328..b0a3805 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -13,6 +13,7 @@
 from typing import Any, TypeGuard
 
 import dace
+import numpy as np
 from jax import _src as jax_src, core as jax_core
 from jaxlib import xla_extension as jax_xe
 
@@ -89,6 +90,38 @@ def is_array(
     return is_jax_array(obj) or dace.is_array(obj)
 
 
+def is_scalar(
+    obj: Any,
+) -> bool:
+    """Tests if `obj` is a scalar."""
+    # These are the type known to DaCe; Taken from `dace.dtypes`.
+    known_types = {
+        bool,
+        int,
+        float,
+        complex,
+        np.intc,
+        np.uintc,
+        np.bool_,
+        np.int8,
+        np.int16,
+        np.int32,
+        np.int64,
+        np.uint8,
+        np.uint16,
+        np.uint32,
+        np.uint64,
+        np.float16,
+        np.float32,
+        np.float64,
+        np.complex64,
+        np.complex128,
+        np.longlong,
+        np.ulonglong,
+    }
+    return type(obj) in known_types
+
+
 def is_on_device(
     obj: Any,
 ) -> bool:

From e55a33f1cedf5e3902dd5887543059405092b66f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 09:25:35 +0200
Subject: [PATCH 164/458] Updated the function to abstractify arguments.

The function is now also able to handle scalars and concrete arguments.
---
 src/jace/jax/stages/translation_cache.py | 14 +++++++++++++-
 1 file changed, 13 insertions(+), 1 deletion(-)

diff --git a/src/jace/jax/stages/translation_cache.py b/src/jace/jax/stages/translation_cache.py
index 184dfe8..322df55 100644
--- a/src/jace/jax/stages/translation_cache.py
+++ b/src/jace/jax/stages/translation_cache.py
@@ -158,7 +158,19 @@ def from_value(
 
             return cls(shape=shape, dtype=dtype, strides=strides, storage=storage)
 
-        if isinstance(val, jax_core.ShpedArray):
+        if util.is_scalar(val):
+            shape = ()
+            dtype = util.translate_dtype(type(val))
+            strides = None
+            # Lets pretend that scalars are always on the CPU, which is a fair assumption.
+            storage = dace.StorageType.CPU_Heap
+
+            return cls(shape=shape, dtype=dtype, strides=strides, storage=storage)
+
+        if isinstance(val, jax_core.ConcreteArray):
+            return cls.from_value(val.val)
+
+        if isinstance(val, jax_core.ShapedArray):
             shape = val.aval.shape
             dtype = val.aval.dtype
             strides = None

From f3ef81c788400502c13a81e75ee3957fb2173667 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 09:27:11 +0200
Subject: [PATCH 165/458] Fixed some issues that are related to empty jaxprs.

This changes a bit how `propose_jax_name()` works, if the variable is known, it now just outputs the already known name.
In previous versions an error was generated.

Also added some tetsts.
---
 .../translator/jaxpr_translator_driver.py     | 37 +++++--------
 src/jace/util/jax_helper.py                   |  6 +-
 tests/test_empty_jaxpr.py                     | 55 +++++++++++++++++++
 3 files changed, 71 insertions(+), 27 deletions(-)
 create mode 100644 tests/test_empty_jaxpr.py

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 85cea34..c847f6d 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -414,13 +414,6 @@ def add_array(
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
         is_scalar: bool = shape == ()
 
-        if (alt_name is None) and (self.map_jax_var_to_sdfg(arg, allow_fail=True) is not None):
-            # Maybe the test could be more robust, but it will check if we try to create
-            #  a variable for a second time. It is, however, okay to use one as template,
-            #  if another name is specified from the beginning.
-            raise ValueError(
-                f"Tried to create variable '{arg}' again, without specifying an alternative name."
-            )
         if force_jax_name:
             if alt_name is not None:
                 raise ValueError(
@@ -453,19 +446,6 @@ def add_array(
         if (name_prefix is not None) and (len(name_prefix) == 0):
             raise ValueError("Specified an empty 'name_prefix'.")
 
-        # Checking the strides.
-        if strides is not None:
-            if is_scalar:
-                raise ValueError("Specified a stride for a scalar.")
-            if isinstance(strides, (str, dace.symbol, int)):
-                strides = (strides,)
-            elif not isinstance(strides, tuple):
-                strides = tuple(strides)
-            if len(strides) != len(shape):
-                raise ValueError(
-                    f"'strides' has length {len(strides)}, but array rank is {len(shape)}."
-                )
-
         # Now we determine the proposed name of the variable.
         #  Depending on the situation, we will further manipulate it.
         if alt_name is not None:
@@ -491,6 +471,19 @@ def add_array(
             # Use the supplied name directly.
             arg_name = str(alt_name)
 
+        # Checking the strides.
+        if strides is not None:
+            if is_scalar:
+                raise ValueError("Specified a stride for a scalar.")
+            if isinstance(strides, (str, dace.symbol, int)):
+                strides = (strides,)
+            elif not isinstance(strides, tuple):
+                strides = tuple(strides)
+            if len(strides) != len(shape):
+                raise ValueError(
+                    f"'strides' has length {len(strides)}, but array rank is {len(shape)}."
+                )
+
         # Determine if we should look for a new name or not, if nothing was specified
         if find_new_name is None:
             if arg_name in self._reserved_names:
@@ -939,9 +932,7 @@ def _handle_null_jaxpr(
             self._start_state.add_nedge(
                 src=inp_acc,
                 dst=out_acc,
-                data=dace.Memlet.from_array(
-                    sdfg_in_name, self.get_array(self.map_jax_var_to_sdfg(sdfg_in_name))
-                ),
+                data=dace.Memlet.from_array(sdfg_in_name, self.get_array(sdfg_in_name)),
             )
 
             # A Jax variable now has two SDFG equivalent, the input, that was previously created by
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 457c43d..2917b50 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -199,6 +199,7 @@ def propose_jax_name(
         The second mode is activated by passing `jax_name_map` as argument.
         The naming of variables are only consistent with the inner most Jaxpr a variable is defined in.
         Dropped variables will always be named `'_'`.
+        If `jax_var` is already inside `jax_name_map` that name will be returned.
     """
     if util.traits.is_drop_var(jax_var):
         return "_"
@@ -207,10 +208,7 @@ def propose_jax_name(
     if jax_name_map is None:
         return get_jax_var_name(jax_var)
     if jax_var in jax_name_map:
-        # Should be turned into a lookup?
-        raise RuntimeError(
-            f"Can not propose a second name for '{jax_var}', it already known as '{jax_name_map[jax_var]}'."
-        )
+        return jax_name_map[jax_var]
     if isinstance(jax_var, JaCeVar) and (jax_var.name != ""):
         # If the name of the JaCe variable is empty, then use the name proposing
         #  technique used for Jax variables; Mostly used for debugging.
diff --git a/tests/test_empty_jaxpr.py b/tests/test_empty_jaxpr.py
new file mode 100644
index 0000000..e2c63a1
--- /dev/null
+++ b/tests/test_empty_jaxpr.py
@@ -0,0 +1,55 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements tests for empty jaxprs.
+."""
+
+from __future__ import annotations
+
+import jax
+import numpy as np
+import pytest
+
+import jace
+
+
+def test_empty_array():
+    jax.config.update("jax_enable_x64", True)
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A
+
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+
+    assert np.all(testee(A) == A)
+
+
+@pytest.mark.skip(reason="Scalar return values are not handled.")
+def test_empty_scalar():
+    jax.config.update("jax_enable_x64", True)
+
+    @jace.jit
+    def testee(A: float) -> float:
+        return A
+
+    A = np.pi
+
+    assert np.all(testee(A) == A)
+
+
+@pytest.mark.skip(reason="Nested Jaxpr are not handled.")
+def test_empty_nested():
+    jax.config.update("jax_enable_x64", True)
+
+    @jace.jit
+    def testee3(A: float) -> float:
+        return jax.jit(lambda A: A)(A)
+
+    A = np.pi
+
+    assert np.all(testee3(A) == A)

From 21a284f4223737145804e982e5ed14cc0b549428 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 09:57:16 +0200
Subject: [PATCH 166/458] The `Stage` class of Jace is no longer a subclass of
 Jax.

---
 src/jace/jax/stages/a_stage.py | 5 +----
 1 file changed, 1 insertion(+), 4 deletions(-)

diff --git a/src/jace/jax/stages/a_stage.py b/src/jace/jax/stages/a_stage.py
index 945ba69..1b099cc 100644
--- a/src/jace/jax/stages/a_stage.py
+++ b/src/jace/jax/stages/a_stage.py
@@ -13,13 +13,10 @@
 
 from __future__ import annotations
 
-from jax._src import stages as jax_stages
 
-
-class Stage(jax_stages.Stage):
+class Stage:
     """A distinct step in the compilation chain, see module description for more.
 
-    This class inherent from its Jax counterpart.
     The concrete steps are implemented in:
     - JaceWrapped
     - JaceLowered

From 7c4680cf0de5d95573f72313bc78c0e3b97382ad Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 10:51:11 +0200
Subject: [PATCH 167/458] Started to remove some sources of cyclic imports.

According to [SE](https://stackoverflow.com/a/746067) the bst way to avoid that is using the `import ...` instaxt instead of the `from ... import` syntax.
Since the util module is accessed by almost everyone, it makes sense to use that stile inside it.
However, the translator package would also make much sense.

I am aware that this violates the codeing guide but in this case i do not care.
---
 src/jace/util/compiling.py  | 30 +++++-------------------------
 src/jace/util/jax_helper.py |  5 +++--
 src/jace/util/traits.py     |  3 ++-
 src/jace/util/util.py       |  2 +-
 4 files changed, 11 insertions(+), 29 deletions(-)

diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index 85107fa..286b988 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -12,15 +12,16 @@
 
 from __future__ import annotations
 
-import functools as ft
 import time
 from collections.abc import Mapping, Sequence
-from typing import Any
+from typing import TYPE_CHECKING, Any
 
 import dace
 
-from jace import translator
-from jace.util import dace_helper as jdace
+
+if TYPE_CHECKING:
+    from jace import translator
+    from jace.util import dace_helper as jdace
 
 
 def compile_jax_sdfg(
@@ -72,7 +73,6 @@ def compile_jax_sdfg(
     return csdfg
 
 
-@ft.singledispatch
 def run_jax_sdfg(
     csdfg: jdace.CompiledSDFG,
     inp_names: Sequence[str],
@@ -146,23 +146,3 @@ def run_jax_sdfg(
     if len(out_names) == 1:
         return ret_val[0]
     return ret_val
-
-
-@run_jax_sdfg.register(translator.TranslatedJaxprSDFG)
-def _(
-    tsdfg: translator.TranslatedJaxprSDFG,
-    cargs: Sequence[Any],
-    ckwargs: Mapping[str, Any],
-) -> tuple[Any, ...] | Any:
-    """Execute the `TranslatedJaxprSDFG` object directly.
-
-    This function is a convenience function provided for debugging.
-    """
-    csdfg: jdace.CompiledSDFG = compile_jax_sdfg(tsdfg)
-    return run_jax_sdfg(
-        csdfg=csdfg,
-        inp_names=tsdfg.inp_names,
-        out_names=tsdfg.out_names,
-        cargs=cargs,
-        ckwargs=ckwargs,
-    )
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 2917b50..98d65d7 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -25,7 +25,7 @@
 import jax.dtypes as jax_dtypes
 import numpy as np
 
-from jace import util
+import jace.util as util
 
 
 @dataclass(init=True, repr=True, frozen=True, eq=False)
@@ -67,6 +67,7 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar | str) -> str:
         Due to some modification in Jax itself, this function is unable to return "proper" variable names.
         This function is subject for removal.
     """
+
     match jax_var:
         case jax_core.DropVar():
             return "_"
@@ -201,7 +202,7 @@ def propose_jax_name(
         Dropped variables will always be named `'_'`.
         If `jax_var` is already inside `jax_name_map` that name will be returned.
     """
-    if util.traits.is_drop_var(jax_var):
+    if util.is_drop_var(jax_var):
         return "_"
     if isinstance(jax_var, jax_core.Literal):
         raise TypeError(f"Can not propose a name for literal '{jax_var}'.")
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index b0a3805..fd61a6d 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -17,7 +17,8 @@
 from jax import _src as jax_src, core as jax_core
 from jaxlib import xla_extension as jax_xe
 
-from jace import jax as jjax, util
+import jace.jax as jjax
+import jace.util as util
 
 
 class NonStringIterable(Iterable): ...
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index 4e97e8c..b0f5640 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -11,7 +11,7 @@
 from collections.abc import Iterable
 from typing import TypeVar, cast, overload
 
-from jace.util import traits
+import jace.util.traits as traits
 
 
 _T = TypeVar("_T")

From 0dafb8d0dfb85dd7e72c9d126ebcb288ac9c9c1e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 11:13:46 +0200
Subject: [PATCH 168/458] Hardnened the `jace.translator` subpackage against
 cyclic import.

---
 src/jace/translator/jaxpr_translator_driver.py | 10 ++++++++--
 src/jace/translator/post_translation.py        |  5 ++++-
 src/jace/translator/primitive_translator.py    |  6 ++++--
 3 files changed, 16 insertions(+), 5 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index c847f6d..aaa43f6 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -9,14 +9,18 @@
 
 import itertools
 from collections.abc import Iterable, Mapping, MutableSequence, Sequence
-from typing import Any, Final, Literal, cast, overload
+from typing import TYPE_CHECKING, Any, Final, Literal, cast, overload
 
 import dace
 import jax
 from dace import data as ddata, properties as dprop
 from jax import core as jax_core
 
-from jace import translator, util
+
+if TYPE_CHECKING:
+    from jace import translator
+
+from jace import util
 
 
 class JaxprTranslationDriver:
@@ -711,6 +715,8 @@ def _allocate_translation_ctx(
             name:               The name of the SDFG.
             reserved_names:     Add these name to the set of resered names of `self`.
         """
+        from jace import translator  # Cyclic import
+
         # Create a new translation context and put it on the stack.
         self._ctx_stack.append(
             translator.TranslatedJaxprSDFG(
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index a32c05f..fbe16b7 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -13,8 +13,11 @@
 from __future__ import annotations
 
 from collections.abc import Callable
+from typing import TYPE_CHECKING
 
-from jace import translator
+
+if TYPE_CHECKING:
+    from jace import translator
 
 
 def postprocess_jaxpr_sdfg(
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index 2e00ed6..29964a1 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -17,12 +17,14 @@
 
 from abc import abstractmethod
 from collections.abc import MutableSequence, Sequence
-from typing import Protocol, runtime_checkable
+from typing import TYPE_CHECKING, Protocol, runtime_checkable
 
 import dace
 from jax import core as jax_core
 
-from jace import translator
+
+if TYPE_CHECKING:
+    from jace import translator
 
 
 @runtime_checkable

From 5651483b4635469154eefe9639e68bbc4fe6a981 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 11:46:42 +0200
Subject: [PATCH 169/458] Moved all stages into a single file.

---
 src/jace/jax/stages.py                        | 339 ++++++++++++++++++
 src/jace/jax/stages/__init__.py               |  41 ---
 src/jace/jax/stages/a_stage.py                |  24 --
 src/jace/jax/stages/jace_compiled.py          |  57 ---
 src/jace/jax/stages/jace_lowered.py           | 124 -------
 src/jace/jax/stages/jace_wrapped.py           | 154 --------
 .../jax/{stages => }/translation_cache.py     |  16 +-
 7 files changed, 350 insertions(+), 405 deletions(-)
 create mode 100644 src/jace/jax/stages.py
 delete mode 100644 src/jace/jax/stages/__init__.py
 delete mode 100644 src/jace/jax/stages/a_stage.py
 delete mode 100644 src/jace/jax/stages/jace_compiled.py
 delete mode 100644 src/jace/jax/stages/jace_lowered.py
 delete mode 100644 src/jace/jax/stages/jace_wrapped.py
 rename src/jace/jax/{stages => }/translation_cache.py (97%)

diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
new file mode 100644
index 0000000..df537c7
--- /dev/null
+++ b/src/jace/jax/stages.py
@@ -0,0 +1,339 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+"""Reimplementation of the `jax.stages` module.
+
+This module reimplements the public classes of that Jax module.
+However, they are a big different, because Jace uses DaCe as backend.
+
+As in Jax Jace has different stages, the terminology is taken from [Jax' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
+- Stage out:
+    In this phase we translate an executable python function into Jaxpr.
+- Lower:
+    This will transform the Jaxpr into an SDFG equivalent.
+    As a implementation note, currently this and the previous step are handled as a single step.
+- Compile:
+    This will turn the SDFG into an executable object, see `dace.codegen.CompiledSDFG`.
+- Execution:
+    This is the actual running of the computation.
+"""
+
+from __future__ import annotations
+
+import copy
+import json
+from collections.abc import Callable, Mapping, Sequence
+from typing import TYPE_CHECKING, Any, Final
+
+import jax as jax_jax
+from jax.stages import CompilerOptions
+
+from jace import optimization, translator, util
+from jace.jax import translation_cache as tcache
+from jace.translator import managing, post_translation as ptrans
+from jace.util import dace_helper as jdace
+
+
+if TYPE_CHECKING:
+    pass
+
+
+class Stage:
+    """A distinct step in the compilation chain, see module description for more.
+
+    The concrete steps are implemented in:
+    - JaceWrapped
+    - JaceLowered
+    - JaceCompiled
+    """
+
+
+class JaceWrapped(Stage):
+    """A function ready to be specialized, lowered, and compiled.
+
+    This class represents the output of functions such as `jace.jit()`.
+    Calling it results in jit (just-in-time) lowering, compilation, and execution.
+    It can also be explicitly lowered prior to compilation, and the result compiled prior to execution.
+
+    You should not create `JaceWrapped` instances directly, instead you should use `jace.jit`.
+
+    Todo:
+        Handles pytrees.
+        Copy the `jax._src.pjit.make_jit()` functionality to remove `jax.make_jaxpr()`.
+    """
+
+    _fun: Callable
+    _sub_translators: Mapping[str, translator.PrimitiveTranslator]
+    _jit_ops: Mapping[str, Any]
+
+    # Managed by the caching infrastructure and only defined during `lower()`.
+    #  If defined it contains an abstract description of the function arguments.
+    _call_description: tcache.CallArgsDescription | None = None
+
+    # Cache for the lowering. Managed by the caching infrastructure.
+    _cache: tcache.TranslationCache | None = None
+
+    def __init__(
+        self,
+        fun: Callable,
+        sub_translators: Mapping[str, translator.PrimitiveTranslator],
+        jit_ops: Mapping[str, Any],
+    ) -> None:
+        """Creates a wrapped jace jitable object of `jax_prim`.
+
+        You should not create `JaceWrapped` instances directly, instead you should use `jace.jit`.
+
+        Args:
+            fun:                The function that is wrapped.
+            sub_translators:    The list of subtranslators that that should be used.
+            jit_ops:            All options that we forward to `jax.jit`.
+
+        Notes:
+            Both the `sub_translators` and `jit_ops` are shallow copied.
+        """
+        self._fun: Callable = fun
+
+        # Why do we have to make a copy (shallow copy is enough as the translators themselves are immutable)?
+        #  The question is a little bit tricky so let's consider the following situation:
+        #  The user has created a Jace annotated function, and calls it, which leads to lowering and translation.
+        #  Then he goes on and in the process modifies the internal list of translators.
+        #  Then he calls the same annotated function again, then in case the arguments happens to be structurally the same,
+        #  lowering and translation will be skipped if the call is still inside the cache, this is what Jax does.
+        #  However, if they are different (or a cache eviction has happened), then tracing and translation will happen again.
+        #  Thus depending on the situation the user might get different behaviour.
+        #  In my expectation, Jace should always do the same thing, i.e. being deterministic, but what?
+        #  In my view, the simplest one and the one that is most functional is, to always use the translators,
+        #  that were _passed_ (although implicitly) at construction, making it independent on the global state.
+        #  One could argue, that the "dynamical modification of the translator list from the outside" is an actual legitimate use case, however, it is not.
+        #  Since `JaceWrapped.lower()` is cached, we would have to modify the caching to include the dynamic state of the set.
+        #  Furthermore, we would have to implement to make a distinction between this and the normal use case.
+        #  Thus we simply forbid it! If this is desired use `jace.jit()` as function to create an object dynamically.
+        # We could either here or in `jace.jit` perform the copy, but since `jace.jit` is at the end
+        #  just a glorified constructor and "allowing dynamic translator list" is not a use case, see above, we do it here.
+        #
+        # Because we know that the global state is immutable, we must not copy in this case.
+        #  See also `make_call_description()` in the cache implementation.
+        if sub_translators is managing._CURRENT_SUBTRANSLATORS_VIEW:
+            self._sub_translators = sub_translators
+        else:
+            # Note this is the canonical way to shallow copy a mapping since `Mapping` does not has `.copy()`
+            # and `copy.copy()` can not handle `MappingProxyType`.
+            self._sub_translators = dict(sub_translators)
+
+        # Following the same logic as above we should also copy `jit_ops`.
+        #  However, do we have to make a shallow copy or a deepcopy?
+        #  I looked at the Jax code and it seems that there is nothing that copies it,
+        #  so for now we will just go ahead and shallow copy it.
+        self._jit_ops = dict(jit_ops)
+
+    def __call__(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> Any:
+        """Executes the wrapped function, lowering and compiling as needed in one step."""
+
+        # TODO(phimuell): Handle the `disable_jit` context manager of Jax.
+
+        # This allows us to be composable with Jax transformations.
+        if util.is_tracing_ongoing(*args, **kwargs):
+            # TODO(phimuell): Handle the case of gradients:
+            #                   It seems that this one uses special tracers, since they can handle comparisons.
+            #                   https://jax.readthedocs.io/en/latest/notebooks/Common_Gotchas_in_JAX.html#python-control-flow-autodiff
+            return self._fun(*args, **kwargs)
+
+        # TODO(phimuell): Handle static arguments correctly
+        #                   https://jax.readthedocs.io/en/latest/aot.html#lowering-with-static-arguments
+        lowered = self.lower(*args, **kwargs)
+        compiled = lowered.compile()
+        return compiled(*args, **kwargs)
+
+    @tcache.cached_translation
+    def lower(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> JaceLowered:
+        """Lower this function explicitly for the given arguments.
+
+        Performs the first two steps of the AOT steps described above,
+        i.e. transformation into Jaxpr and then to SDFG.
+        The result is encapsulated into a `Lowered` object.
+
+        Todo:
+            Add a context manager to disable caching.
+        """
+        if len(kwargs) != 0:
+            raise NotImplementedError("Currently only positional arguments are supported.")
+
+        # TODO(phimuell): Handle pytrees.
+        real_args: tuple[Any, ...] = args
+
+        jaxpr = jax_jax.make_jaxpr(self._fun)(*real_args)
+        driver = translator.JaxprTranslationDriver(sub_translators=self._sub_translators)
+        trans_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
+        ptrans.postprocess_jaxpr_sdfg(tsdfg=trans_sdfg, fun=self.wrapped_fun)
+        # The `JaceLowered` assumes complete ownership of `trans_sdfg`!
+        return JaceLowered(trans_sdfg)
+
+    @property
+    def wrapped_fun(self) -> Callable:
+        """Returns the wrapped function."""
+        return self._fun
+
+
+class JaceLowered(Stage):
+    """Represents the original computation that was lowered to SDFG."""
+
+    # `self` assumes complete ownership of the
+    _trans_sdfg: translator.TranslatedJaxprSDFG
+
+    # Cache for the compilation. Managed by the caching infrastructure.
+    _cache: tcache.TranslationCache | None = None
+
+    DEF_COMPILER_OPTIONS: Final[dict[str, Any]] = {
+        "auto_optimize": True,
+        "simplify": True,
+    }
+
+    def __init__(
+        self,
+        trans_sdfg: translator.TranslatedJaxprSDFG,
+    ) -> None:
+        """Constructs the lowered object."""
+        if not trans_sdfg.is_finalized:
+            raise ValueError("The translated SDFG must be finalized.")
+        if trans_sdfg.inp_names is None:
+            raise ValueError("Input names must be defined.")
+        if trans_sdfg.out_names is None:
+            raise ValueError("Output names must be defined.")
+        self._trans_sdfg = trans_sdfg
+
+    @tcache.cached_translation
+    def compile(
+        self,
+        compiler_options: CompilerOptions | None = None,  # Unused arguments
+    ) -> JaceCompiled:
+        """Compile the SDFG.
+
+        Returns an Object that encapsulates a compiled SDFG object.
+        You can pass a `dict` as argument which are passed to the `jace_optimize()` routine.
+        If you pass `None` then the default options are used.
+        To disable all optimization, pass an empty `dict`.
+
+        Notes:
+            I am pretty sure that `None` in Jax means "use the default option".
+                See also `CachedCallDescription.make_call_description()`.
+        """
+        # We **must** deepcopy before we do any optimization.
+        #  There are many reasons for this but here are the most important ones:
+        #  All optimization DaCe functions works in place, if we would not copy the SDFG first, then we would have a problem.
+        #  Because, these optimization would then have a feedback of the SDFG object which is stored inside `self`.
+        #  Thus, if we would run this code `(jaceLoweredObject := jaceWrappedObject.lower()).compile({opti=True})` would return
+        #  an optimized object, which is what we intent to do.
+        #  However, if we would now call `jaceWrappedObject.lower()` (with the same arguments as before), we should get `jaceLoweredObject`,
+        #  since it was cached, but it would actually contain an already optimized SDFG, which is not what we want.
+        #  If you think you can remove this line then do it and run `tests/test_decorator.py::test_decorator_sharing`.
+        fsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._trans_sdfg)
+        optimization.jace_optimize(
+            fsdfg, **(self.DEF_COMPILER_OPTIONS if compiler_options is None else compiler_options)
+        )
+        csdfg: jdace.CompiledSDFG = util.compile_jax_sdfg(fsdfg)
+
+        return JaceCompiled(
+            csdfg=csdfg,
+            inp_names=fsdfg.inp_names,
+            out_names=fsdfg.out_names,
+        )
+
+    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
+        """Returns the internal SDFG.
+
+        The function returns a `TranslatedJaxprSDFG` object.
+        It is important that modifying this object in any ways is considered an error.
+        """
+        if (dialect is None) or (dialect.upper() == "SDFG"):
+            return self._trans_sdfg
+        raise ValueError(f"Unknown dialect '{dialect}'.")
+
+    def as_html(self, filename: str | None = None) -> None:
+        """Runs the `view()` method of the underlying SDFG.
+
+        This is a Jace extension.
+        """
+        self.compiler_ir().sdfg.view(filename=filename, verbose=False)
+
+    def as_text(self, dialect: str | None = None) -> str:
+        """Textual representation of the SDFG.
+
+        By default, the function will return the Json representation of the SDFG.
+        However, by specifying `'html'` as `dialect` the function will call `view()` on the underlying SDFG.
+
+        Notes:
+            You should prefer `self.as_html()` instead of this function.
+        """
+        if (dialect is None) or (dialect.upper() == "JSON"):
+            return json.dumps(self.compiler_ir().sdfg.to_json())
+        if dialect.upper() == "HTML":
+            self.as_html()
+            return ""  # For the interface
+        raise ValueError(f"Unknown dialect '{dialect}'.")
+
+    def cost_analysis(self) -> Any | None:
+        """A summary of execution cost estimates.
+
+        Not implemented use the DaCe [instrumentation API](https://spcldace.readthedocs.io/en/latest/optimization/profiling.html) directly.
+        """
+        raise NotImplementedError()
+
+
+class JaceCompiled(Stage):
+    """Compiled version of the SDFG.
+
+    Contains all the information to run the associated computation.
+
+    Todo:
+        Handle pytrees.
+    """
+
+    _csdfg: jdace.CompiledSDFG  # The compiled SDFG object.
+    _inp_names: tuple[str, ...]  # Name of all input arguments.
+    _out_names: tuple[str, ...]  # Name of all output arguments.
+
+    def __init__(
+        self,
+        csdfg: jdace.CompiledSDFG,
+        inp_names: Sequence[str],
+        out_names: Sequence[str],
+    ) -> None:
+        if (not inp_names) or (not out_names):
+            raise ValueError("Input and output can not be empty.")
+        self._csdfg = csdfg
+        self._inp_names = tuple(inp_names)
+        self._out_names = tuple(out_names)
+
+    def __call__(
+        self,
+        *args: Any,
+        **kwargs: Any,
+    ) -> Any:
+        """Calls the embedded computation."""
+        return util.run_jax_sdfg(
+            self._csdfg,
+            self._inp_names,
+            self._out_names,
+            args,
+            kwargs,
+        )
+
+
+__all__ = [
+    "Stage",
+    "CompilerOptions",
+    "JaceWrapped",
+    "JaceLowered",
+    "JaceCompiled",
+]
diff --git a/src/jace/jax/stages/__init__.py b/src/jace/jax/stages/__init__.py
deleted file mode 100644
index 49f13bd..0000000
--- a/src/jace/jax/stages/__init__.py
+++ /dev/null
@@ -1,41 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Reimplementation of the `jax.stages` module.
-
-The module either imports or reimplements Jax classes.
-In case classes/functions are reimplemented they might be slightly different to fit their usage within Jace.
-
-As in Jax Jace has different stages, the terminology is taken from [Jax' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
-- Stage out:
-    In this phase we translate an executable python function into Jaxpr.
-- Lower:
-    This will transform the Jaxpr into an SDFG equivalent.
-    As a implementation note, currently this and the previous step are handled as a single step.
-- Compile:
-    This will turn the SDFG into an executable object, see `dace.codegen.CompiledSDFG`.
-- Execution:
-    This is the actual running of the computation.
-"""
-
-from __future__ import annotations
-
-from jax.stages import CompilerOptions
-
-from .a_stage import Stage
-from .jace_compiled import JaceCompiled
-from .jace_lowered import JaceLowered
-from .jace_wrapped import JaceWrapped
-
-
-__all__ = [
-    "Stage",
-    "CompilerOptions",
-    "JaceWrapped",
-    "JaceLowered",
-    "JaceCompiled",
-]
diff --git a/src/jace/jax/stages/a_stage.py b/src/jace/jax/stages/a_stage.py
deleted file mode 100644
index 1b099cc..0000000
--- a/src/jace/jax/stages/a_stage.py
+++ /dev/null
@@ -1,24 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-"""Interface of the Stages.
-
-In `jace.jax.stages.__init__.py` this file must be imported first.
-However, isort/ruff fail to do that and can not be convinced otherwise.
-For that reason this file was renamed to ensure that it comes at first.
-"""
-
-from __future__ import annotations
-
-
-class Stage:
-    """A distinct step in the compilation chain, see module description for more.
-
-    The concrete steps are implemented in:
-    - JaceWrapped
-    - JaceLowered
-    - JaceCompiled
-    """
diff --git a/src/jace/jax/stages/jace_compiled.py b/src/jace/jax/stages/jace_compiled.py
deleted file mode 100644
index 3f33859..0000000
--- a/src/jace/jax/stages/jace_compiled.py
+++ /dev/null
@@ -1,57 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Implementation of the `jace.jax.stages.Compiled` stage for Jace."""
-
-from __future__ import annotations
-
-from collections.abc import Sequence
-from typing import Any
-
-from jace import util
-from jace.jax import stages
-from jace.util import dace_helper as jdace
-
-
-class JaceCompiled(stages.Stage):
-    """Compiled version of the SDFG.
-
-    Contains all the information to run the associated computation.
-
-    Todo:
-        Handle pytrees.
-    """
-
-    _csdfg: jdace.CompiledSDFG  # The compiled SDFG object.
-    _inp_names: tuple[str, ...]  # Name of all input arguments.
-    _out_names: tuple[str, ...]  # Name of all output arguments.
-
-    def __init__(
-        self,
-        csdfg: jdace.CompiledSDFG,
-        inp_names: Sequence[str],
-        out_names: Sequence[str],
-    ) -> None:
-        if (not inp_names) or (not out_names):
-            raise ValueError("Input and output can not be empty.")
-        self._csdfg = csdfg
-        self._inp_names = tuple(inp_names)
-        self._out_names = tuple(out_names)
-
-    def __call__(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> Any:
-        """Calls the embedded computation."""
-        return util.run_jax_sdfg(
-            self._csdfg,
-            self._inp_names,
-            self._out_names,
-            args,
-            kwargs,
-        )
diff --git a/src/jace/jax/stages/jace_lowered.py b/src/jace/jax/stages/jace_lowered.py
deleted file mode 100644
index 70e111e..0000000
--- a/src/jace/jax/stages/jace_lowered.py
+++ /dev/null
@@ -1,124 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Implementation of the `jace.jax.stages.Lowered` stage for Jace."""
-
-from __future__ import annotations
-
-import copy
-import json
-from typing import Any, Final
-
-from jace import optimization, translator, util
-from jace.jax import stages
-from jace.jax.stages import translation_cache as tcache
-from jace.util import dace_helper as jdace
-
-
-class JaceLowered(stages.Stage):
-    """Represents the original computation that was lowered to SDFG."""
-
-    # `self` assumes complete ownership of the
-    _trans_sdfg: translator.TranslatedJaxprSDFG
-
-    # Cache for the compilation. Managed by the caching infrastructure.
-    _cache: tcache.TranslationCache | None = None
-
-    DEF_COMPILER_OPTIONS: Final[dict[str, Any]] = {
-        "auto_optimize": True,
-        "simplify": True,
-    }
-
-    def __init__(
-        self,
-        trans_sdfg: translator.TranslatedJaxprSDFG,
-    ) -> None:
-        """Constructs the lowered object."""
-        if not trans_sdfg.is_finalized:
-            raise ValueError("The translated SDFG must be finalized.")
-        if trans_sdfg.inp_names is None:
-            raise ValueError("Input names must be defined.")
-        if trans_sdfg.out_names is None:
-            raise ValueError("Output names must be defined.")
-        self._trans_sdfg = trans_sdfg
-
-    @tcache.cached_translation
-    def compile(
-        self,
-        compiler_options: stages.CompilerOptions | None = None,  # Unused arguments
-    ) -> stages.JaceCompiled:
-        """Compile the SDFG.
-
-        Returns an Object that encapsulates a compiled SDFG object.
-        You can pass a `dict` as argument which are passed to the `jace_optimize()` routine.
-        If you pass `None` then the default options are used.
-        To disable all optimization, pass an empty `dict`.
-
-        Notes:
-            I am pretty sure that `None` in Jax means "use the default option".
-                See also `CachedCallDescription.make_call_description()`.
-        """
-        # We **must** deepcopy before we do any optimization.
-        #  There are many reasons for this but here are the most important ones:
-        #  All optimization DaCe functions works in place, if we would not copy the SDFG first, then we would have a problem.
-        #  Because, these optimization would then have a feedback of the SDFG object which is stored inside `self`.
-        #  Thus, if we would run this code `(jaceLoweredObject := jaceWrappedObject.lower()).compile({opti=True})` would return
-        #  an optimized object, which is what we intent to do.
-        #  However, if we would now call `jaceWrappedObject.lower()` (with the same arguments as before), we should get `jaceLoweredObject`,
-        #  since it was cached, but it would actually contain an already optimized SDFG, which is not what we want.
-        #  If you think you can remove this line then do it and run `tests/test_decorator.py::test_decorator_sharing`.
-        fsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._trans_sdfg)
-        optimization.jace_optimize(
-            fsdfg, **(self.DEF_COMPILER_OPTIONS if compiler_options is None else compiler_options)
-        )
-        csdfg: jdace.CompiledSDFG = util.compile_jax_sdfg(fsdfg)
-
-        return stages.JaceCompiled(
-            csdfg=csdfg,
-            inp_names=fsdfg.inp_names,
-            out_names=fsdfg.out_names,
-        )
-
-    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
-        """Returns the internal SDFG.
-
-        The function returns a `TranslatedJaxprSDFG` object.
-        It is important that modifying this object in any ways is considered an error.
-        """
-        if (dialect is None) or (dialect.upper() == "SDFG"):
-            return self._trans_sdfg
-        raise ValueError(f"Unknown dialect '{dialect}'.")
-
-    def as_html(self, filename: str | None = None) -> None:
-        """Runs the `view()` method of the underlying SDFG.
-
-        This is a Jace extension.
-        """
-        self.compiler_ir().sdfg.view(filename=filename, verbose=False)
-
-    def as_text(self, dialect: str | None = None) -> str:
-        """Textual representation of the SDFG.
-
-        By default, the function will return the Json representation of the SDFG.
-        However, by specifying `'html'` as `dialect` the function will call `view()` on the underlying SDFG.
-
-        Notes:
-            You should prefer `self.as_html()` instead of this function.
-        """
-        if (dialect is None) or (dialect.upper() == "JSON"):
-            return json.dumps(self.compiler_ir().sdfg.to_json())
-        if dialect.upper() == "HTML":
-            self.as_html()
-            return ""  # For the interface
-        raise ValueError(f"Unknown dialect '{dialect}'.")
-
-    def cost_analysis(self) -> Any | None:
-        """A summary of execution cost estimates.
-
-        Not implemented use the DaCe [instrumentation API](https://spcldace.readthedocs.io/en/latest/optimization/profiling.html) directly.
-        """
-        raise NotImplementedError()
diff --git a/src/jace/jax/stages/jace_wrapped.py b/src/jace/jax/stages/jace_wrapped.py
deleted file mode 100644
index 433bc8a..0000000
--- a/src/jace/jax/stages/jace_wrapped.py
+++ /dev/null
@@ -1,154 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Implementation of the `jace.jax.stages.Wrapped` protocol."""
-
-from __future__ import annotations
-
-from collections.abc import Callable, Mapping
-from typing import Any
-
-import jax as jax_jax
-
-from jace import translator, util
-from jace.jax import stages
-from jace.jax.stages import translation_cache as tcache
-from jace.translator import managing, post_translation as ptrans
-
-
-class JaceWrapped(stages.Stage):
-    """A function ready to be specialized, lowered, and compiled.
-
-    This class represents the output of functions such as `jace.jit()`.
-    Calling it results in jit (just-in-time) lowering, compilation, and execution.
-    It can also be explicitly lowered prior to compilation, and the result compiled prior to execution.
-
-    You should not create `JaceWrapped` instances directly, instead you should use `jace.jit`.
-
-    Todo:
-        Handles pytrees.
-        Copy the `jax._src.pjit.make_jit()` functionality to remove `jax.make_jaxpr()`.
-    """
-
-    _fun: Callable
-    _sub_translators: Mapping[str, translator.PrimitiveTranslator]
-    _jit_ops: Mapping[str, Any]
-
-    # Managed by the caching infrastructure and only defined during `lower()`.
-    #  If defined it contains an abstract description of the function arguments.
-    _call_description: tcache.CallArgsDescription | None = None
-
-    # Cache for the lowering. Managed by the caching infrastructure.
-    _cache: tcache.TranslationCache | None = None
-
-    def __init__(
-        self,
-        fun: Callable,
-        sub_translators: Mapping[str, translator.PrimitiveTranslator],
-        jit_ops: Mapping[str, Any],
-    ) -> None:
-        """Creates a wrapped jace jitable object of `jax_prim`.
-
-        You should not create `JaceWrapped` instances directly, instead you should use `jace.jit`.
-
-        Args:
-            fun:                The function that is wrapped.
-            sub_translators:    The list of subtranslators that that should be used.
-            jit_ops:            All options that we forward to `jax.jit`.
-
-        Notes:
-            Both the `sub_translators` and `jit_ops` are shallow copied.
-        """
-        self._fun: Callable = fun
-
-        # Why do we have to make a copy (shallow copy is enough as the translators themselves are immutable)?
-        #  The question is a little bit tricky so let's consider the following situation:
-        #  The user has created a Jace annotated function, and calls it, which leads to lowering and translation.
-        #  Then he goes on and in the process modifies the internal list of translators.
-        #  Then he calls the same annotated function again, then in case the arguments happens to be structurally the same,
-        #  lowering and translation will be skipped if the call is still inside the cache, this is what Jax does.
-        #  However, if they are different (or a cache eviction has happened), then tracing and translation will happen again.
-        #  Thus depending on the situation the user might get different behaviour.
-        #  In my expectation, Jace should always do the same thing, i.e. being deterministic, but what?
-        #  In my view, the simplest one and the one that is most functional is, to always use the translators,
-        #  that were _passed_ (although implicitly) at construction, making it independent on the global state.
-        #  One could argue, that the "dynamical modification of the translator list from the outside" is an actual legitimate use case, however, it is not.
-        #  Since `JaceWrapped.lower()` is cached, we would have to modify the caching to include the dynamic state of the set.
-        #  Furthermore, we would have to implement to make a distinction between this and the normal use case.
-        #  Thus we simply forbid it! If this is desired use `jace.jit()` as function to create an object dynamically.
-        # We could either here or in `jace.jit` perform the copy, but since `jace.jit` is at the end
-        #  just a glorified constructor and "allowing dynamic translator list" is not a use case, see above, we do it here.
-        #
-        # Because we know that the global state is immutable, we must not copy in this case.
-        #  See also `make_call_description()` in the cache implementation.
-        if sub_translators is managing._CURRENT_SUBTRANSLATORS_VIEW:
-            self._sub_translators = sub_translators
-        else:
-            # Note this is the canonical way to shallow copy a mapping since `Mapping` does not has `.copy()`
-            # and `copy.copy()` can not handle `MappingProxyType`.
-            self._sub_translators = dict(sub_translators)
-
-        # Following the same logic as above we should also copy `jit_ops`.
-        #  However, do we have to make a shallow copy or a deepcopy?
-        #  I looked at the Jax code and it seems that there is nothing that copies it,
-        #  so for now we will just go ahead and shallow copy it.
-        self._jit_ops = dict(jit_ops)
-
-    def __call__(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> Any:
-        """Executes the wrapped function, lowering and compiling as needed in one step."""
-
-        # TODO(phimuell): Handle the `disable_jit` context manager of Jax.
-
-        # This allows us to be composable with Jax transformations.
-        if util.is_tracing_ongoing(*args, **kwargs):
-            # TODO(phimuell): Handle the case of gradients:
-            #                   It seems that this one uses special tracers, since they can handle comparisons.
-            #                   https://jax.readthedocs.io/en/latest/notebooks/Common_Gotchas_in_JAX.html#python-control-flow-autodiff
-            return self._fun(*args, **kwargs)
-
-        # TODO(phimuell): Handle static arguments correctly
-        #                   https://jax.readthedocs.io/en/latest/aot.html#lowering-with-static-arguments
-        lowered = self.lower(*args, **kwargs)
-        compiled = lowered.compile()
-        return compiled(*args, **kwargs)
-
-    @tcache.cached_translation
-    def lower(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> stages.JaceLowered:
-        """Lower this function explicitly for the given arguments.
-
-        Performs the first two steps of the AOT steps described above,
-        i.e. transformation into Jaxpr and then to SDFG.
-        The result is encapsulated into a `Lowered` object.
-
-        Todo:
-            Add a context manager to disable caching.
-        """
-        if len(kwargs) != 0:
-            raise NotImplementedError("Currently only positional arguments are supported.")
-
-        # TODO(phimuell): Handle pytrees.
-        real_args: tuple[Any, ...] = args
-
-        jaxpr = jax_jax.make_jaxpr(self._fun)(*real_args)
-        driver = translator.JaxprTranslationDriver(sub_translators=self._sub_translators)
-        trans_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
-        ptrans.postprocess_jaxpr_sdfg(tsdfg=trans_sdfg, fun=self.wrapped_fun)
-        # The `JaceLowered` assumes complete ownership of `trans_sdfg`!
-        return stages.JaceLowered(trans_sdfg)
-
-    @property
-    def wrapped_fun(self) -> Callable:
-        """Returns the wrapped function."""
-        return self._fun
diff --git a/src/jace/jax/stages/translation_cache.py b/src/jace/jax/translation_cache.py
similarity index 97%
rename from src/jace/jax/stages/translation_cache.py
rename to src/jace/jax/translation_cache.py
index 322df55..d67b1e9 100644
--- a/src/jace/jax/stages/translation_cache.py
+++ b/src/jace/jax/translation_cache.py
@@ -21,13 +21,16 @@
 from collections import OrderedDict
 from collections.abc import Callable
 from dataclasses import dataclass
-from typing import Any, Protocol, TypeAlias, runtime_checkable
+from typing import TYPE_CHECKING, Any, Protocol, TypeAlias, runtime_checkable
 
 import dace
 from jax import core as jax_core
 
 from jace import util
-from jace.jax import stages
+
+
+if TYPE_CHECKING:
+    from jace.jax import stages
 
 
 def cached_translation(
@@ -57,6 +60,7 @@ def _action_wrapper(
         **kwargs: Any,
     ) -> stages.Stage:
         # If not initialized initialize the cache.
+        assert hasattr(self, "_cache")  # Needed to make mypy silent
         if self._cache is None:
             self._cache = _get_cache(self)
 
@@ -66,16 +70,17 @@ def _action_wrapper(
             return self._cache.get(key)
 
         # We must actually perform the call
-        wants_description: bool = hasattr(self, "_call_description")
         try:
-            if wants_description:
+            if hasattr(self, "_call_description"):
                 assert (
                     self._call_description is None
                 ), f"call description already set for `{self}` (probably another call going on?)."
                 self._call_description = key.fargs
             next_stage: stages.Stage = action(self, *args, **kwargs)
         finally:
-            if wants_description:
+            # If I would cache the result from above and store and then use here,
+            #  mypy would complain, thus we have to do it twice.
+            if hasattr(self, "_call_description"):
                 self._call_description = None
 
         # Store the result.
@@ -264,6 +269,7 @@ def make_call_description(
         **kwargs: Any,
     ) -> CachedCallDescription:
         """Creates an abstract description of the call."""
+        from jace.jax import stages  # Cyclic import
 
         if isinstance(stage, stages.JaceWrapped):
             # JaceWrapped.lower() to JaceLowered

From 334823ddb7ebdda92af38e543606bd1e66370c6b Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 13:09:32 +0200
Subject: [PATCH 170/458] Changed the names of the global list of
 subtranslators.

---
 src/jace/jax/stages.py          |  2 +-
 src/jace/translator/managing.py | 26 +++++++++++++-------------
 2 files changed, 14 insertions(+), 14 deletions(-)

diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
index df537c7..f7e3127 100644
--- a/src/jace/jax/stages.py
+++ b/src/jace/jax/stages.py
@@ -116,7 +116,7 @@ def __init__(
         #
         # Because we know that the global state is immutable, we must not copy in this case.
         #  See also `make_call_description()` in the cache implementation.
-        if sub_translators is managing._CURRENT_SUBTRANSLATORS_VIEW:
+        if sub_translators is managing._PRIMITIVE_TRANSLATORS_VIEW:
             self._sub_translators = sub_translators
         else:
             # Note this is the canonical way to shallow copy a mapping since `Mapping` does not has `.copy()`
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index 71167a3..f42eed8 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -7,7 +7,7 @@
 """Module for managing the individual sutranslators.
 
 The high level idea is that there is a "list" of instances of `PrimitiveTranslator`,
-which is known as `_CURRENT_SUBTRANSLATORS`.
+which is known as `_PRIMITIVE_TRANSLATORS_DICT`.
 If not specified the content of this list is used to perform the translation.
 """
 
@@ -29,9 +29,9 @@
 
 
 # These are all currently used subtranslators that we are used.
-_CURRENT_SUBTRANSLATORS: dict[str, translator.PrimitiveTranslator] = {}
-_CURRENT_SUBTRANSLATORS_VIEW: types.MappingProxyType[str, translator.PrimitiveTranslator] = (
-    types.MappingProxyType(_CURRENT_SUBTRANSLATORS)
+_PRIMITIVE_TRANSLATORS_DICT: dict[str, translator.PrimitiveTranslator] = {}
+_PRIMITIVE_TRANSLATORS_VIEW: types.MappingProxyType[str, translator.PrimitiveTranslator] = (
+    types.MappingProxyType(_PRIMITIVE_TRANSLATORS_DICT)
 )
 
 
@@ -49,8 +49,8 @@ def add_subtranslators(
     """
     from jace import translator  # Circular import
 
-    global _CURRENT_SUBTRANSLATORS
-    global _CURRENT_SUBTRANSLATORS_VIEW
+    global _PRIMITIVE_TRANSLATORS_DICT
+    global _PRIMITIVE_TRANSLATORS_VIEW
 
     if len(subtrans) == 0:
         raise ValueError("Not passed any subtranslators.")
@@ -68,7 +68,7 @@ def add_subtranslators(
     #       foo1 = jace.jit(foo).lower()   # noqa: ERA001 commented out code
     #       foo2 = jace.jit(foo).lower()   # noqa: ERA001
     #  Should only lower once as it is seen in Jax.
-    new_CURRENT_SUBTRANSLATORS = _CURRENT_SUBTRANSLATORS.copy()
+    new_PRIMITIVE_TRANSLATORS_DICT = _PRIMITIVE_TRANSLATORS_DICT.copy()
 
     for prim_trans in subtrans:
         # If it is a class instantiate it.
@@ -78,18 +78,18 @@ def add_subtranslators(
 
         # Test if we know the primitive already
         prim_name: str = prim_trans.primitive
-        if (prim_name in _CURRENT_SUBTRANSLATORS) and (not overwrite):
+        if (prim_name in _PRIMITIVE_TRANSLATORS_DICT) and (not overwrite):
             raise ValueError(f"Tried to add a second translator for primitive '{prim_name}'.")
 
         # Commit the change to a "staging"
-        new_CURRENT_SUBTRANSLATORS[prim_name] = prim_trans
+        new_PRIMITIVE_TRANSLATORS_DICT[prim_name] = prim_trans
 
     # Now update the global variables.
     #  Doing it after the loop gives us exception guarantee
     # TODO: We should consider creating some list of "subtranslators sets that are known to be stable"
     #           i.e. where generated by this function, this would allow better caching in some situation.
-    _CURRENT_SUBTRANSLATORS = new_CURRENT_SUBTRANSLATORS
-    _CURRENT_SUBTRANSLATORS_VIEW = types.MappingProxyType(_CURRENT_SUBTRANSLATORS)
+    _PRIMITIVE_TRANSLATORS_DICT = new_PRIMITIVE_TRANSLATORS_DICT
+    _PRIMITIVE_TRANSLATORS_VIEW = types.MappingProxyType(_PRIMITIVE_TRANSLATORS_DICT)
 
 
 def add_subtranslator(
@@ -192,8 +192,8 @@ def get_subtranslators(
         # The use case for this is, that a user wants to populate its own list and do some funky stuff.
         #  Without this option, he would first have to make a mutable copy of the map manually,
         #  every fucking time he wants it, so making an option is simpler.
-        return _CURRENT_SUBTRANSLATORS.copy()
+        return _PRIMITIVE_TRANSLATORS_DICT.copy()
 
     # Since we do a versioning in `add_subtranslator()` we do not have to create a new view.
     #  We can just return the global view, this is needed to fix some problems in the caching.
-    return _CURRENT_SUBTRANSLATORS_VIEW
+    return _PRIMITIVE_TRANSLATORS_VIEW

From de6eb3a7f2d9e907df925092368f1978659cb79d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 13:11:47 +0200
Subject: [PATCH 171/458] Updated a test.

But I think I have to rewrite them soon anyway.
---
 tests/test_decorator.py | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index a1cba33..7ddcacd 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -144,10 +144,12 @@ def testee2(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     assert (
         lower_cnt[0] == 1
     ), f"Annotated right after each other, but lowered {lower_cnt[0]} times instead of once."
+    assert lower_cnt[1] == 0
 
     # Now modify the state in between.
     jaceWrapped2_1 = jace.jit(testee2)
     lower2_1 = jaceWrapped2_1.lower(A, B)
+    assert lower_cnt[1] == 1
 
     @jace.translator.add_fsubtranslator("non_existing_primitive")
     def non_existing_primitive_translator(
@@ -159,6 +161,12 @@ def non_existing_primitive_translator(
     ) -> dace.SDFGState | None:
         raise NotImplementedError
 
+    # Now lets lower the version 1 again to see if something has changed.
+    assert lower1_1 is jaceWrapped1_1.lower(A, B)
+    assert lower1_2 is jaceWrapped1_2.lower(A, B)
+    assert lower_cnt[0] == 1
+
+    # Now lets nower the second version 2 test.
     jaceWrapped2_2 = jace.jit(testee2)
     lower2_2 = jaceWrapped2_2.lower(A, B)
     assert lower2_1 is not lower2_2

From f38ade0d6bb75643cb3c098aaaa704d6e57e905a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 15:40:52 +0200
Subject: [PATCH 172/458] Implemented Enrique's changes regarding the
 registering of stuff.

---
 src/jace/jax/__init__.py                      |   2 -
 src/jace/jax/api.py                           |  61 ++---
 src/jace/jax/api_helper.py                    |  55 -----
 src/jace/jax/stages.py                        |  50 +---
 src/jace/translator/__init__.py               |  11 +-
 .../translator/jaxpr_translator_driver.py     |   8 +-
 src/jace/translator/managing.py               | 223 ++++++------------
 src/jace/translator/primitive_translator.py   |  39 ++-
 .../primitive_translators/alu_translator.py   |   7 +-
 tests/test_decorator.py                       |  50 +---
 tests/test_jaxpr_translator_driver.py         |  16 +-
 tests/test_subtranslator_helper.py            |  99 ++++----
 12 files changed, 212 insertions(+), 409 deletions(-)
 delete mode 100644 src/jace/jax/api_helper.py

diff --git a/src/jace/jax/__init__.py b/src/jace/jax/__init__.py
index bb826a1..47bb219 100644
--- a/src/jace/jax/__init__.py
+++ b/src/jace/jax/__init__.py
@@ -9,7 +9,6 @@
 
 from __future__ import annotations
 
-from . import api_helper, stages
 from .api import grad, jacfwd, jacrev, jit
 from .stages import (
     CompilerOptions,
@@ -20,7 +19,6 @@
 
 
 __all__ = [
-    "stages",
     "Compiled",
     "CompilerOptions",
     "JaceWrapped",
diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
index 394ac93..806a9d2 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/jax/api.py
@@ -16,16 +16,14 @@
 import jax as _jax_jax
 
 from jace import jax as jjax, translator
-from jace.jax import api_helper
 
 
-@api_helper.jax_wrapper(_jax_jax.jit, rewriting=False)
 def jit(
     fun: Callable | None = None,
     /,
     sub_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> jjax.JaceWrapped:
+) -> jjax.JaceWrapped | Callable:
     """Jace's replacement for `jax.jit` (just-in-time) wrapper.
 
     It works the same way as `jax.jit` does, but instead of using XLA the computation is lowered to DaCe.
@@ -37,55 +35,29 @@ def jit(
 
     Notes:
         If no subtranslators are specified then the ones that are currently active,
-            i.e. the output of `get_subtranslators()`, are used.
-            After construction the set of subtranslators that are used by the wrapped object can not be changed.
+            i.e. the output of `get_regsitered_primitive_translators()`, are used.
+            After construction changes to the passed `sub_translators` have no effect on the returned object.
     """
-    if any(kwargs.get(arg, None) is not None for arg in ["donate_argnums", "donate_argnames"]):
-        # Donated arguments are not yet fully supported, the prototype supported something similar.
-        #  However, the documentation mentioned that they are only a hint, thus we ignore them.
-        kwargs.pop("donate_argnums", None)
-        kwargs.pop("donate_argnames", None)
-
     if len(kwargs) != 0:
         raise NotImplementedError(
             f"The following arguments of 'jax.jit' are not yet supported by jace: {', '.join(kwargs.keys())}."
         )
 
-    # fmt: off
-    if fun is None:
-        # TODO: Is there an obscure case where it makes sense to copy `sub_translators`?
-        def wrapper(f: Callable) -> jjax.JaceWrapped:
-            return jit(f, sub_translators=sub_translators, **kwargs)
-        return wrapper  # type: ignore[return-value]
-    # fmt: on
-
-    # If no subtranslators were specified then use the ones that are currently installed.
-    if sub_translators is None:
-        sub_translators = translator.get_subtranslators()
-
-    wrapper = jjax.JaceWrapped(
-        fun=fun,
-        sub_translators=sub_translators,
-        jit_ops=kwargs,
-    )
-    return ft.wraps(fun)(wrapper)
-
-
-@api_helper.jax_wrapper(_jax_jax.pmap)
-def pmap(
-    fun: Callable | None = None,  # noqa: ARG001  # Unused argument
-    /,
-    **kwargs: Any,  # noqa: ARG001 # Unused argument.
-) -> jjax.JaceWrapped:
-    """Jace wrapper around `jax.pmap`.
+    def wrapper(f: Callable) -> jjax.JaceWrapped:
+        jace_wrapper = jjax.JaceWrapped(
+            fun=f,
+            sub_translators=(
+                translator.managing._PRIMITIVE_TRANSLATORS_DICT
+                if sub_translators is None
+                else sub_translators
+            ),
+            jit_ops=kwargs,
+        )
+        return ft.wraps(f)(jace_wrapper)
 
-    Notes:
-        Will be supported in a very late state.
-    """
-    raise NotImplementedError("Currently Jace is not able to run in multi resource mode.")
+    return wrapper if fun is None else wrapper(fun)
 
 
-@api_helper.jax_wrapper(_jax_jax.vmap)
 def vmap(
     fun: Callable,
     /,
@@ -108,7 +80,6 @@ def vmap(
     )
 
 
-@api_helper.jax_wrapper(_jax_jax.grad)
 def grad(
     fun: Callable | None = None,
     /,
@@ -124,7 +95,6 @@ def grad(
     return _jax_jax.grad(fun, **kwargs)
 
 
-@api_helper.jax_wrapper(_jax_jax.jacfwd)
 def jacfwd(
     fun: Callable | None = None,
     /,
@@ -134,7 +104,6 @@ def jacfwd(
     return _jax_jax.jacfwd(fun, **kwargs)
 
 
-@api_helper.jax_wrapper(_jax_jax.jacrev)
 def jacrev(
     fun: Callable | None = None,
     /,
diff --git a/src/jace/jax/api_helper.py b/src/jace/jax/api_helper.py
deleted file mode 100644
index bc7162e..0000000
--- a/src/jace/jax/api_helper.py
+++ /dev/null
@@ -1,55 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Helper function for the api."""
-
-from __future__ import annotations
-
-import functools as ft
-from collections.abc import Callable
-from typing import Any
-
-
-def jax_wrapper(
-    jax_fun: Callable,
-    jace_fun: Callable | None = None,
-    /,
-    rewriting: bool = True,
-    **kwargs: Any,
-) -> Callable:
-    """Creates a wrapper to encapsulate Jax in Jace functions.
-
-    A replacement for `functools.wraps` but for the special
-    case that a Jace function should replace a Jax function.
-
-    Args:
-        rewriting:      Replace 'JAX' with 'JaCe' in the doc string.
-
-    Todo:
-        Improve.
-    """
-
-    # fmt: off
-    if jace_fun is None:
-        def _inner_jax_wrapper(jace_fun_: Callable) -> Callable:
-            return jax_wrapper(jax_fun, jace_fun_, **kwargs)
-        return _inner_jax_wrapper
-    # fmt: on
-
-    # This function creates the `__wrapped__` property, that I do not want
-    #  So we have to replace it, I think we should consider using the one of Jax.
-    ft.update_wrapper(
-        wrapper=jace_fun,
-        wrapped=jax_fun,
-        **kwargs,
-    )
-
-    if rewriting:
-        # TODO(phimuell): Handle web addresses, code example and more.
-        jace_fun.__doc__ = jace_fun.__doc__.replace("JAX", "JaCe")
-
-    return jace_fun
diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
index f7e3127..43fe7a5 100644
--- a/src/jace/jax/stages.py
+++ b/src/jace/jax/stages.py
@@ -33,7 +33,7 @@
 
 from jace import optimization, translator, util
 from jace.jax import translation_cache as tcache
-from jace.translator import managing, post_translation as ptrans
+from jace.translator import post_translation as ptrans
 from jace.util import dace_helper as jdace
 
 
@@ -94,40 +94,12 @@ def __init__(
         Notes:
             Both the `sub_translators` and `jit_ops` are shallow copied.
         """
-        self._fun: Callable = fun
-
-        # Why do we have to make a copy (shallow copy is enough as the translators themselves are immutable)?
-        #  The question is a little bit tricky so let's consider the following situation:
-        #  The user has created a Jace annotated function, and calls it, which leads to lowering and translation.
-        #  Then he goes on and in the process modifies the internal list of translators.
-        #  Then he calls the same annotated function again, then in case the arguments happens to be structurally the same,
-        #  lowering and translation will be skipped if the call is still inside the cache, this is what Jax does.
-        #  However, if they are different (or a cache eviction has happened), then tracing and translation will happen again.
-        #  Thus depending on the situation the user might get different behaviour.
-        #  In my expectation, Jace should always do the same thing, i.e. being deterministic, but what?
-        #  In my view, the simplest one and the one that is most functional is, to always use the translators,
-        #  that were _passed_ (although implicitly) at construction, making it independent on the global state.
-        #  One could argue, that the "dynamical modification of the translator list from the outside" is an actual legitimate use case, however, it is not.
-        #  Since `JaceWrapped.lower()` is cached, we would have to modify the caching to include the dynamic state of the set.
-        #  Furthermore, we would have to implement to make a distinction between this and the normal use case.
-        #  Thus we simply forbid it! If this is desired use `jace.jit()` as function to create an object dynamically.
-        # We could either here or in `jace.jit` perform the copy, but since `jace.jit` is at the end
-        #  just a glorified constructor and "allowing dynamic translator list" is not a use case, see above, we do it here.
-        #
-        # Because we know that the global state is immutable, we must not copy in this case.
-        #  See also `make_call_description()` in the cache implementation.
-        if sub_translators is managing._PRIMITIVE_TRANSLATORS_VIEW:
-            self._sub_translators = sub_translators
-        else:
-            # Note this is the canonical way to shallow copy a mapping since `Mapping` does not has `.copy()`
-            # and `copy.copy()` can not handle `MappingProxyType`.
-            self._sub_translators = dict(sub_translators)
-
-        # Following the same logic as above we should also copy `jit_ops`.
-        #  However, do we have to make a shallow copy or a deepcopy?
-        #  I looked at the Jax code and it seems that there is nothing that copies it,
-        #  so for now we will just go ahead and shallow copy it.
+        # We have to shallow copy both the translator and the jit options.
+        #  This prevents that any modifications affect `self`.
+        #  Shallow is enough since the translators themselves are immutable.
+        self._sub_translators = dict(sub_translators)
         self._jit_ops = dict(jit_ops)
+        self._fun = fun
 
     def __call__(
         self,
@@ -162,17 +134,13 @@ def lower(
         Performs the first two steps of the AOT steps described above,
         i.e. transformation into Jaxpr and then to SDFG.
         The result is encapsulated into a `Lowered` object.
-
-        Todo:
-            Add a context manager to disable caching.
         """
+        # TODO(phimuell): Handle pytrees
+
         if len(kwargs) != 0:
             raise NotImplementedError("Currently only positional arguments are supported.")
 
-        # TODO(phimuell): Handle pytrees.
-        real_args: tuple[Any, ...] = args
-
-        jaxpr = jax_jax.make_jaxpr(self._fun)(*real_args)
+        jaxpr = jax_jax.make_jaxpr(self._fun)(*args)
         driver = translator.JaxprTranslationDriver(sub_translators=self._sub_translators)
         trans_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
         ptrans.postprocess_jaxpr_sdfg(tsdfg=trans_sdfg, fun=self.wrapped_fun)
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 69600ae..7d4426e 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -10,17 +10,16 @@
 from __future__ import annotations
 
 from .jaxpr_translator_driver import JaxprTranslationDriver
-from .managing import add_fsubtranslator, add_subtranslator, add_subtranslators, get_subtranslators
-from .primitive_translator import PrimitiveTranslator
+from .managing import get_regsitered_primitive_translators, register_primitive_translator
+from .primitive_translator import PrimitiveTranslator, PrimitiveTranslatorCallable
 from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
 
 __all__ = [
     "JaxprTranslationDriver",
     "PrimitiveTranslator",
+    "PrimitiveTranslatorCallable",
     "TranslatedJaxprSDFG",
-    "add_subtranslator",
-    "add_subtranslators",
-    "add_fsubtranslator",
-    "get_subtranslators",
+    "register_primitive_translator",
+    "get_regsitered_primitive_translators",
 ]
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index aaa43f6..f95c207 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -69,7 +69,7 @@ class JaxprTranslationDriver:
 
     def __init__(
         self,
-        sub_translators: Mapping[str, translator.PrimitiveTranslator],
+        sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable],
     ) -> None:
         """Creates the driver.
 
@@ -80,13 +80,15 @@ def __init__(
             `sub_translators` is not copied, thus the user has to guarantee,
                 that it will not change during translation.
                 It is highly advised but not required to use the output of
-                `get_subtranslators()` or pass a copy as argument.
+                `get_regsitered_primitive_translators()` or pass a copy as argument.
         """
 
         # Shared with the outside, while key and mapped values are immutable,
         #  the mapping itself is not, but it should be fine.
         #  Allocated through the lifetime of `self`.
-        self._sub_translators: Mapping[str, translator.PrimitiveTranslator] = sub_translators
+        self._sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable] = (
+            sub_translators
+        )
 
         # These names can not be used for the automatic naming of Jax variables.
         #  They differ from the forbidden names, that they denote valid SDFG names.
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index f42eed8..1651000 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -13,187 +13,96 @@
 
 from __future__ import annotations
 
-import inspect
-import types
-from collections.abc import Callable, Mapping, MutableMapping
-from typing import TYPE_CHECKING, Literal, TypeAlias, cast, overload
+from collections.abc import Callable, MutableMapping
+from typing import TYPE_CHECKING, Literal, cast, overload
 
 
 if TYPE_CHECKING:
     from jace import translator
 
-    # Type alias for distinguish between instances and classes.
-    PrimitiveTranslator: TypeAlias = (
-        type[translator.PrimitiveTranslator] | translator.PrimitiveTranslator | Callable
-    )
+# These are the currently active primitive translators of JaCe.
+_PRIMITIVE_TRANSLATORS_DICT: dict[str, translator.PrimitiveTranslatorCallable] = {}
 
 
-# These are all currently used subtranslators that we are used.
-_PRIMITIVE_TRANSLATORS_DICT: dict[str, translator.PrimitiveTranslator] = {}
-_PRIMITIVE_TRANSLATORS_VIEW: types.MappingProxyType[str, translator.PrimitiveTranslator] = (
-    types.MappingProxyType(_PRIMITIVE_TRANSLATORS_DICT)
-)
-
-
-def add_subtranslators(
-    *subtrans: PrimitiveTranslator | None,
-    overwrite: bool = False,
-) -> None:
-    """Adds many subtranslators in one step to Jace's internal list.
-
-    This function is more efficient if many translators should be added in one go.
-    Please refer to `add_subtranslator()` for more information.
-
-    Notes:
-        If an error during insertion happens the operation is considered a no ops.
-    """
-    from jace import translator  # Circular import
-
-    global _PRIMITIVE_TRANSLATORS_DICT
-    global _PRIMITIVE_TRANSLATORS_VIEW
-
-    if len(subtrans) == 0:
-        raise ValueError("Not passed any subtranslators.")
-
-    # Why do we do this kind of versioning here or versioning at all?
-    #  The cache has to include the set of used subtranslators somehow.
-    #  However, as explained in `JaceWrapped.__init__()` the function must make a copy of it.
-    #  One way would be to hash the content, i.e. `[(prim_name, id(prim_translator)), ...]`.
-    #  But a much simpler idea is to just consider its address, since in 99% of the cases,
-    #  the global list is used and not some user supplied list is used we do this versioning.
-    #  This allows `JaceWrapped.__init__()` to identify if the current global list of installed
-    #  translated is passed to it and it can then prevent the copying.
-    #  In the end a code like:
-    #       def foo(...): ...
-    #       foo1 = jace.jit(foo).lower()   # noqa: ERA001 commented out code
-    #       foo2 = jace.jit(foo).lower()   # noqa: ERA001
-    #  Should only lower once as it is seen in Jax.
-    new_PRIMITIVE_TRANSLATORS_DICT = _PRIMITIVE_TRANSLATORS_DICT.copy()
-
-    for prim_trans in subtrans:
-        # If it is a class instantiate it.
-        if inspect.isclass(prim_trans):
-            prim_trans = prim_trans()
-        prim_trans = cast(translator.PrimitiveTranslator, prim_trans)
-
-        # Test if we know the primitive already
-        prim_name: str = prim_trans.primitive
-        if (prim_name in _PRIMITIVE_TRANSLATORS_DICT) and (not overwrite):
-            raise ValueError(f"Tried to add a second translator for primitive '{prim_name}'.")
-
-        # Commit the change to a "staging"
-        new_PRIMITIVE_TRANSLATORS_DICT[prim_name] = prim_trans
-
-    # Now update the global variables.
-    #  Doing it after the loop gives us exception guarantee
-    # TODO: We should consider creating some list of "subtranslators sets that are known to be stable"
-    #           i.e. where generated by this function, this would allow better caching in some situation.
-    _PRIMITIVE_TRANSLATORS_DICT = new_PRIMITIVE_TRANSLATORS_DICT
-    _PRIMITIVE_TRANSLATORS_VIEW = types.MappingProxyType(_PRIMITIVE_TRANSLATORS_DICT)
-
-
-def add_subtranslator(
-    subtrans: PrimitiveTranslator | None = None,
+@overload
+def register_primitive_translator(
+    prim_translator: Literal[None] = None,
     /,
+    primitive: str | None = None,
     overwrite: bool = False,
-) -> PrimitiveTranslator | Callable[[PrimitiveTranslator], PrimitiveTranslator]:
-    """Adds the subtranslator `subtrans` to Jace's internal list of translators.
+) -> Callable[
+    [translator.PrimitiveTranslator | translator.PrimitiveTranslatorCallable],
+    translator.PrimitiveTranslator,
+]: ...
 
-    If the primitive is already known an error is generated, however, if `overwrite` is given,
-    then `subtrans` will replace the current one.
-    In case `subtrans` is a class, the function will instantiate it first.
-    Thus, a class must be constructable without arguments.
 
-    Notes:
-        Calls to this function will never modify subtranslator lists previously obtained by `get_subtranslators()`!
-        Since `subtrans` is returned unmodified, this function can be used to annotate classes.
-        For annotating functions use `add_fsubtranslator()`.
-
-    Todo:
-        Accept many inputs for bulk update.
-        Add functions to clear them or restore the default ones.
-    """
-
-    if subtrans is None:
-        # It was used as decorator with some argument (currently `overwrite`).
-        def wrapper(
-            real_subtrans: PrimitiveTranslator,
-        ) -> PrimitiveTranslator:
-            return add_subtranslator(real_subtrans, overwrite=overwrite)
-
-        return wrapper
-
-    # Forward the call to the bulk insertion.
-    #  And always return the original argument.
-    add_subtranslators(subtrans, overwrite=overwrite)
-    return subtrans
+@overload
+def register_primitive_translator(
+    prim_translator: translator.PrimitiveTranslator | translator.PrimitiveTranslatorCallable,
+    *,
+    primitive: str | None = None,
+    overwrite: bool = False,
+) -> translator.PrimitiveTranslator: ...
 
 
-def add_fsubtranslator(
-    prim_name: str,
-    fun: Callable | None = None,
-    /,
+def register_primitive_translator(
+    prim_translator: translator.PrimitiveTranslator
+    | translator.PrimitiveTranslatorCallable
+    | None = None,
+    *,
+    primitive: str | None = None,
     overwrite: bool = False,
-) -> PrimitiveTranslator | Callable[[Callable], PrimitiveTranslator]:
-    """Convenience function to annotate function and turn them into a translator.
+) -> (
+    translator.PrimitiveTranslator
+    | Callable[
+        [translator.PrimitiveTranslator | translator.PrimitiveTranslatorCallable],
+        translator.PrimitiveTranslator,
+    ]
+):
+    """Adds the primitive translator `prim_translator` to Jace's internal list of translators.
 
-    Adds the `primitive` property to `fun` and register it then as translator.
+    If the primitive is already known an error is generated, if `overwrite` is set, it will be replaced.
+
+    Args:
+        prim_translator:    The primitive translator to annotate.
+        primitive:          Name of the primitive `prim_translator` is handled.
+                                If not given will use `prim_translator.primitive`.
+        overwrite:          Replace the current primitive translator with `prim_translator`.
 
     Notes:
-        Without this function you would had to define the translator function,
-            add the `primitive` property to it and then pass it to `add_subtranslator()`.
-            This function allows it to do in one step.
+        Can only be used to register instances.
     """
 
-    if fun is None:
-        # Annotated mode.
-        def wrapper(real_fun: Callable) -> PrimitiveTranslator:
-            return add_fsubtranslator(prim_name, real_fun, overwrite=overwrite)
-
-        return wrapper
-
-    if getattr(fun, "primitive", prim_name) != prim_name:
-        raise ValueError(f"Passed 'fun' already '{fun.primitive}' as 'primitive' property.")  # type: ignore[attr-defined]
+    def wrapper(
+        prim_translator: translator.PrimitiveTranslator | translator.PrimitiveTranslatorCallable,
+    ) -> translator.PrimitiveTranslator:
+        if not hasattr(prim_translator, "primitive"):
+            if not primitive:
+                raise ValueError(f"Missing primitive name for '{prim_translator}'")
+            prim_translator.primitive = primitive  # type: ignore[attr-defined]
+        elif prim_translator.primitive != (primitive or prim_translator.primitive):
+            raise TypeError(
+                f"Translator's primitive '{prim_translator.primitive}' doesn't match the supplied '{primitive}'."
+            )
 
-    fun.primitive = prim_name  # type: ignore[attr-defined]
-    return add_subtranslator(fun, overwrite=overwrite)
+        if prim_translator.primitive in _PRIMITIVE_TRANSLATORS_DICT and not overwrite:
+            raise ValueError(
+                f"Explicit override=True needed for primitive '{prim_translator.primitive}' to overwrite existing one."
+            )
+        _PRIMITIVE_TRANSLATORS_DICT[prim_translator.primitive] = prim_translator
 
+        # We add a `.primitive` property, thus it is for sure now no longer just a `PrimitiveTranslatorCallable`.
+        return cast(translator.PrimitiveTranslator, prim_translator)
 
-@overload
-def get_subtranslators(  # type: ignore[overload-overlap]
-    as_mutable: Literal[False] = False,
-) -> Mapping[str, translator.PrimitiveTranslator]: ...
-
-
-@overload
-def get_subtranslators(
-    as_mutable: Literal[True] = True,
-) -> MutableMapping[str, translator.PrimitiveTranslator]: ...
+    return wrapper if prim_translator is None else wrapper(prim_translator)
 
 
-def get_subtranslators(
-    as_mutable: bool = False,
-) -> (
-    Mapping[str, translator.PrimitiveTranslator]
-    | MutableMapping[str, translator.PrimitiveTranslator]
+def get_regsitered_primitive_translators() -> (
+    MutableMapping[str, translator.PrimitiveTranslatorCallable]
 ):
-    """Returns a view of all _currently_ installed primitive translators in Jace.
-
-    By setting `as_mutable` to `True` the function will return a mutable mapping object.
-    However, in any case the returned mapping will not be affected by calls that modify
-    the internal list of registered primitive translators, i.e. `add_subtranslator()`.
+    """Returns the currently active view of all _currently_ installed primitive translators in Jace.
 
-    Notes:
-        If `as_mutable` is `False` the function will return an immutable view of the
-            registered primitive translator list, thus only a view is created.
-            However, if `as_mutable` is `True` a copy is returned.
+    The returned mapping represents the active primitive translators at the time of calling.
+    This means that calls to `register_primitive_translator()` does not modify the returned object.
     """
-    if as_mutable:
-        # The use case for this is, that a user wants to populate its own list and do some funky stuff.
-        #  Without this option, he would first have to make a mutable copy of the map manually,
-        #  every fucking time he wants it, so making an option is simpler.
-        return _PRIMITIVE_TRANSLATORS_DICT.copy()
-
-    # Since we do a versioning in `add_subtranslator()` we do not have to create a new view.
-    #  We can just return the global view, this is needed to fix some problems in the caching.
-    return _PRIMITIVE_TRANSLATORS_VIEW
+    return _PRIMITIVE_TRANSLATORS_DICT.copy()
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index 29964a1..6c350f0 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -27,8 +27,7 @@
     from jace import translator
 
 
-@runtime_checkable
-class PrimitiveTranslator(Protocol):
+class PrimitiveTranslatorCallable(Protocol):
     """Interface for all Jax primitive translators, also known as subtranslator.
 
     A translator for a primitive translates a single equation of a Jaxpr into its SDFG equivalent.
@@ -39,16 +38,13 @@ class PrimitiveTranslator(Protocol):
     In the end this implements the delegation pattern.
 
     You can use `jace.translator.add_subtranslator()` to register your translator to Jace.
+
+    Notes:
+        Primitive translators that are implemented as a class, should be derived from `PrimitiveTranslator`.
     """
 
     __slots__ = ()
 
-    @property
-    @abstractmethod
-    def primitive(self) -> str:
-        """Returns the name of the Jax primitive that `self` is able to handle."""
-        ...
-
     @abstractmethod
     def __call__(
         self,
@@ -101,3 +97,30 @@ def __call__(
                                 should be constructed.
         """
         ...
+
+
+@runtime_checkable
+class PrimitiveTranslator(PrimitiveTranslatorCallable, Protocol):
+    """Interface for all Jax primitive translators, also known as subtranslator, that are implemented as class.
+
+    A translator for a primitive translates a single equation of a Jaxpr into its SDFG equivalent.
+    For satisfying this interface a concrete implementation must be immutable after construction.
+
+    Subtranslators are simple, but highly specialized objects that are only able to perform the translation of a single primitive.
+    The overall translation process itself is managed by a driver object, which also owns and manage the subtranslators.
+    In the end this implements the delegation pattern.
+
+    You can use `jace.translator.add_subtranslator()` to register your translator to Jace.
+
+    Notes:
+        The main difference to to `PrimitiveTranslatorCallable` is that this interface specifies the `primitive` property.
+            Thus, it must not be specified during registration.
+    """
+
+    __slots__ = ()
+
+    @property
+    @abstractmethod
+    def primitive(self) -> str:
+        """Returns the name of the Jax primitive that `self` is able to handle."""
+        ...
diff --git a/src/jace/translator/primitive_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
index 05ce3fe..0d19973 100644
--- a/src/jace/translator/primitive_translators/alu_translator.py
+++ b/src/jace/translator/primitive_translators/alu_translator.py
@@ -284,6 +284,7 @@ def _list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
     "lt": "__out0 = __in0 < __in1",
 }
 
-translator.add_subtranslators(
-    *[ALUTranslator(prim_name, prim_tmpl) for prim_name, prim_tmpl in _ALU_OPS_TMPL.items()]
-)
+_ = [
+    translator.register_primitive_translator(ALUTranslator(prim_name, prim_tmpl))
+    for prim_name, prim_tmpl in _ALU_OPS_TMPL.items()
+]
diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index 7ddcacd..24ce507 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -12,15 +12,10 @@
 
 from __future__ import annotations
 
-from collections.abc import MutableSequence, Sequence
-
-import dace
 import jax
 import numpy as np
-from jax import core as jax_core
 
 import jace
-from jace import translator
 
 
 def test_decorator_individually():
@@ -120,16 +115,12 @@ def test_decorator_double_annot():
     """Tests the behaviour for double annotations."""
     jax.config.update("jax_enable_x64", True)
 
-    lower_cnt = [0, 0]
+    lower_cnt = [0]
 
     def testee1(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         lower_cnt[0] += 1
         return A * B
 
-    def testee2(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        lower_cnt[1] += 1
-        return A * B
-
     A = np.arange(12, dtype=np.float64).reshape((4, 3))
     B = np.full((4, 3), 10, dtype=np.float64)
 
@@ -140,42 +131,13 @@ def testee2(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     # Lower them right after the other.
     lower1_1 = jaceWrapped1_1.lower(A, B)
     lower1_2 = jaceWrapped1_2.lower(A, B)
-    assert lower1_1 is lower1_2
-    assert (
-        lower_cnt[0] == 1
-    ), f"Annotated right after each other, but lowered {lower_cnt[0]} times instead of once."
-    assert lower_cnt[1] == 0
-
-    # Now modify the state in between.
-    jaceWrapped2_1 = jace.jit(testee2)
-    lower2_1 = jaceWrapped2_1.lower(A, B)
-    assert lower_cnt[1] == 1
-
-    @jace.translator.add_fsubtranslator("non_existing_primitive")
-    def non_existing_primitive_translator(
-        driver: translator.JaxprTranslationDriver,
-        in_var_names: Sequence[str | None],
-        out_var_names: MutableSequence[str],
-        eqn: jax_core.JaxprEqn,
-        eqn_state: dace.SDFGState,
-    ) -> dace.SDFGState | None:
-        raise NotImplementedError
-
-    # Now lets lower the version 1 again to see if something has changed.
+    assert lower1_1 is not lower1_2
+    assert lower_cnt[0] == 2
+
+    # Lower them right after the other.
     assert lower1_1 is jaceWrapped1_1.lower(A, B)
     assert lower1_2 is jaceWrapped1_2.lower(A, B)
-    assert lower_cnt[0] == 1
-
-    # Now lets nower the second version 2 test.
-    jaceWrapped2_2 = jace.jit(testee2)
-    lower2_2 = jaceWrapped2_2.lower(A, B)
-    assert lower2_1 is not lower2_2
-    assert lower_cnt[1] == 2
-
-    # Now lower 2_1 again, to see if there is really no influence.
-    lower2_1_ = jaceWrapped2_1.lower(A, B)
-    assert lower2_1_ is lower2_1
-    assert lower_cnt[1] == 2
+    assert lower_cnt[0] == 2
 
 
 def test_decorator_sharing():
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 12eb48c..f123c4f 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -23,14 +23,18 @@
 def translation_driver():
     """Returns an allocated driver instance."""
     name = "fixture_driver"
-    driver = translator.JaxprTranslationDriver(sub_translators=translator.get_subtranslators())
+    driver = translator.JaxprTranslationDriver(
+        sub_translators=translator.get_regsitered_primitive_translators()
+    )
     driver._allocate_translation_ctx(name=name)
     return driver
 
 
 def test_driver_alloc() -> None:
     """Tests the state right after allocation."""
-    driver = translator.JaxprTranslationDriver(sub_translators=translator.get_subtranslators())
+    driver = translator.JaxprTranslationDriver(
+        sub_translators=translator.get_regsitered_primitive_translators()
+    )
     assert not driver.is_allocated(), "Driver was created allocated."
     assert len(driver._ctx_stack) == 0
 
@@ -55,7 +59,9 @@ def test_driver_nested() -> None:
     """
 
     # This is the parent driver.
-    driver = translator.JaxprTranslationDriver(sub_translators=translator.get_subtranslators())
+    driver = translator.JaxprTranslationDriver(
+        sub_translators=translator.get_regsitered_primitive_translators()
+    )
     assert not driver.is_allocated(), "Driver should not be allocated."
 
     # We allocate the driver directly, because we need to set some internals.
@@ -295,7 +301,9 @@ def test_driver_array2() -> None:
         - Literals.
     """
     # This is the parent driver.
-    driver = translator.JaxprTranslationDriver(sub_translators=translator.get_subtranslators())
+    driver = translator.JaxprTranslationDriver(
+        sub_translators=translator.get_regsitered_primitive_translators()
+    )
     assert not driver.is_allocated(), "Driver should not be allocated."
 
     # Creating JaCe Variables with empty names, forces the driver to use the
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index d5885a3..871e679 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -11,7 +11,6 @@
 
 import re
 from collections.abc import Mapping, MutableSequence, Sequence
-from inspect import isclass, isfunction
 from typing import Any
 
 import dace
@@ -21,11 +20,10 @@
 from jax import core as jax_core
 
 import jace
-from jace import translator as jtrans
+from jace import translator
 from jace.translator import (
-    add_fsubtranslator,
-    add_subtranslator,
-    get_subtranslators,
+    get_regsitered_primitive_translators,
+    register_primitive_translator,
 )
 
 
@@ -36,9 +34,10 @@ def _conserve_builtin_translators():
     Todo:
         Come up with something better/nicer.
     """
-    initial_translators = get_subtranslators()
+    initial_translators = get_regsitered_primitive_translators()
     yield
-    jtrans.add_subtranslators(*initial_translators.values(), overwrite=True)
+    translator.managing._PRIMITIVE_TRANSLATORS_DICT.clear()
+    translator.managing._PRIMITIVE_TRANSLATORS_DICT.update(initial_translators)
 
 
 def _dict_struct(dict_: Mapping[str, Any]) -> Sequence[tuple[str, int]]:
@@ -47,17 +46,17 @@ def _dict_struct(dict_: Mapping[str, Any]) -> Sequence[tuple[str, int]]:
 
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
-    assert len(get_subtranslators()) > 1
+    assert len(get_regsitered_primitive_translators()) > 1
 
 
 def test_subtranslatior_managing():
     """Ensures the functionality of the subtranslator managing."""
 
     # TODO(phimuell): Make this more friendly; See blow
-    builtin_subtrans = get_subtranslators()
+    builtin_subtrans = get_regsitered_primitive_translators()
     builin_struct = _dict_struct(builtin_subtrans)
 
-    class SubTrans1(jtrans.PrimitiveTranslator):
+    class SubTrans1(translator.PrimitiveTranslator):
         @property
         def primitive(self):
             return "non_existing_primitive1"
@@ -66,12 +65,10 @@ def __call__(self) -> None:  # type: ignore[override]  # Arguments
             raise NotImplementedError
 
     # Ensures that we really return the object unmodified.
-    SubTrans1_ = add_subtranslator(SubTrans1)
-    assert isclass(SubTrans1_)
-    assert SubTrans1_ is SubTrans1
+    sub_trans1 = register_primitive_translator(SubTrans1())
+    assert sub_trans1 is get_regsitered_primitive_translators()["non_existing_primitive1"]
 
-    @add_subtranslator(overwrite=True)
-    class SubTrans2(jtrans.PrimitiveTranslator):
+    class SubTrans2(translator.PrimitiveTranslator):
         @property
         def primitive(self):
             return "non_existing_primitive2"
@@ -79,11 +76,28 @@ def primitive(self):
         def __call__(self) -> None:  # type: ignore[override]  # Arguments
             raise NotImplementedError
 
-    assert isclass(SubTrans2)
+    # Wrong name
+    sub_trans2_instance = SubTrans2()
+    with pytest.raises(
+        expected_exception=TypeError,
+        match=re.escape(
+            f"Translator's primitive '{sub_trans2_instance.primitive}' doesn't match the supplied 'not_non_existing_primitive2'."
+        ),
+    ):
+        register_primitive_translator(
+            sub_trans2_instance,
+            primitive="not_non_existing_primitive2",
+        )
 
-    @add_fsubtranslator("non_existing_primitive3")
+    # But if the correct name is specified it works.
+    register_primitive_translator(
+        sub_trans2_instance,
+        primitive="non_existing_primitive2",
+    )
+
+    @register_primitive_translator(primitive="non_existing_primitive3")
     def non_existing_primitive_translator_3(
-        driver: jtrans.JaxprTranslationDriver,
+        driver: translator.JaxprTranslationDriver,
         in_var_names: Sequence[str | None],
         out_var_names: MutableSequence[str],
         eqn: jax_core.JaxprEqn,
@@ -91,11 +105,10 @@ def non_existing_primitive_translator_3(
     ) -> dace.SDFGState | None:
         raise NotImplementedError
 
-    assert isfunction(non_existing_primitive_translator_3)
     assert non_existing_primitive_translator_3.primitive == "non_existing_primitive3"
 
-    curr1_subtrans = get_subtranslators()
-    curr1_subtrans_mod = get_subtranslators(as_mutable=True)
+    curr1_subtrans = get_regsitered_primitive_translators()
+    curr1_subtrans_mod = get_regsitered_primitive_translators()
     assert curr1_subtrans is not builtin_subtrans
     assert curr1_subtrans is not curr1_subtrans_mod
     assert _dict_struct(curr1_subtrans) != builin_struct
@@ -106,50 +119,55 @@ def non_existing_primitive_translator_3(
         assert pname in curr1_subtrans, f"Expected to find '{pname}'."
         curr1_subtrans_mod.pop(pname)
     assert builin_struct == _dict_struct(curr1_subtrans_mod)
-    assert curr1_subtrans is get_subtranslators()
 
     # Try adding instance and if we can overwrite.
     sub_trans1_instance = SubTrans1()
     with pytest.raises(
         expected_exception=ValueError,
         match=re.escape(
-            "Tried to add a second translator for primitive 'non_existing_primitive1'."
+            "Explicit override=True needed for primitive 'non_existing_primitive1' to overwrite existing one."
         ),
     ):
-        add_subtranslator(sub_trans1_instance, overwrite=False)
+        register_primitive_translator(sub_trans1_instance, overwrite=False)
 
     # Now adding it forcefully, this should also change a lot.
-    add_subtranslator(sub_trans1_instance, overwrite=True)
+    register_primitive_translator(sub_trans1_instance, overwrite=True)
 
-    curr2_subtrans = get_subtranslators()
+    curr2_subtrans = get_regsitered_primitive_translators()
     assert curr2_subtrans is not builtin_subtrans
     assert curr2_subtrans is not curr1_subtrans
     assert _dict_struct(curr2_subtrans) != builin_struct
     assert _dict_struct(curr2_subtrans) != _dict_struct(curr1_subtrans)
     assert curr2_subtrans["non_existing_primitive1"] is sub_trans1_instance
 
-    # Try to answer a function as translator, that already has a primitive property.
+    # Try to register a function as translator, that already has a primitive property.
     with pytest.raises(
-        expected_exception=ValueError,
-        match=re.escape("Passed 'fun' already 'non_existing_primitive3' as 'primitive' property."),
+        expected_exception=TypeError,
+        match=re.escape(
+            f"Translator's primitive '{non_existing_primitive_translator_3.primitive}' doesn't match the supplied 'non_existing_primitive1'."
+        ),
     ):
-        add_fsubtranslator(
-            "non_existing_primitive1", non_existing_primitive_translator_3, overwrite=False
+        register_primitive_translator(
+            non_existing_primitive_translator_3,
+            primitive="non_existing_primitive1",
+            overwrite=False,
         )
 
     # This would work because it has the same primitive name, but it fails because overwrite is False
     with pytest.raises(
         expected_exception=ValueError,
         match=re.escape(
-            "Tried to add a second translator for primitive 'non_existing_primitive3'."
+            "Explicit override=True needed for primitive 'non_existing_primitive3' to overwrite existing one."
         ),
     ):
-        add_fsubtranslator(
-            "non_existing_primitive3", non_existing_primitive_translator_3, overwrite=False
+        register_primitive_translator(
+            non_existing_primitive_translator_3,
+            primitive="non_existing_primitive3",
+            overwrite=False,
         )
 
-    add_fsubtranslator(
-        "non_existing_primitive3", non_existing_primitive_translator_3, overwrite=True
+    register_primitive_translator(
+        non_existing_primitive_translator_3, primitive="non_existing_primitive3", overwrite=True
     )
 
 
@@ -157,8 +175,7 @@ def test_subtranslatior_managing_2():
     """Shows that we are really able to overwrite stuff"""
     jax.config.update("jax_enable_x64", True)
 
-    @add_subtranslator(overwrite=True)
-    class NonAddTranslator(jtrans.PrimitiveTranslator):
+    class NonAddTranslator(translator.PrimitiveTranslator):
         @property
         def primitive(self):
             return "add"
@@ -166,6 +183,8 @@ def primitive(self):
         def __call__(self, *args, **kwargs) -> None:
             raise NotImplementedError("The 'NonAddTranslator' can not translate anything.")
 
+    register_primitive_translator(NonAddTranslator(), overwrite=True)
+
     @jace.jit
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
@@ -184,7 +203,7 @@ def test_subtranslatior_managing_3():
     """Shows proper decoupling."""
     jax.config.update("jax_enable_x64", True)
 
-    class NonAddTranslator(jtrans.PrimitiveTranslator):
+    class NonAddTranslator(translator.PrimitiveTranslator):
         @property
         def primitive(self):
             return "add"
@@ -192,7 +211,7 @@ def primitive(self):
         def __call__(self, *args, **kwargs) -> None:
             raise NotImplementedError("The 'NonAddTranslator' can not translate anything at all.")
 
-    used_sub_trans = get_subtranslators(as_mutable=True)
+    used_sub_trans = get_regsitered_primitive_translators()
     used_sub_trans["add"] = NonAddTranslator()
 
     @jace.jit(sub_translators=used_sub_trans)

From c53ed96d7e4925ef6302d97e8b9a4df555e0afb4 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 15:48:44 +0200
Subject: [PATCH 173/458] Fixed the population bug according to Enrique's
 suggestions.

---
 src/jace/__init__.py            | 17 ++---------------
 src/jace/translator/managing.py |  1 +
 2 files changed, 3 insertions(+), 15 deletions(-)

diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 930074e..294d357 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -9,25 +9,12 @@
 
 from __future__ import annotations
 
+import jace.translator.primitive_translators  # noqa: F401  # needed to poulate the internal list of translators.
+
 from .__about__ import __author__, __copyright__, __license__, __version__, __version_info__
 from .jax import grad, jacfwd, jacrev, jit
 
 
-def _ensure_build_in_translators_are_loaded() -> None:
-    # There is a chicken-egg problem, i.e. circular import, if we use the decorator to add the build in classes.
-    #  In order for the decorator to add the translators to the internal list, they have to be run, i.e. imported.
-    #  However, since they have to import the decorator, this would lead to a circular import.
-    #  To ensure that the built in translators are imported at the beginning, i.e. once Jace is loaded.
-    #  We define this function and call it and its only job is to load the subtranslaotrs.
-    #  However, this requires that all are imported by the `__init__.py` file.
-    # Too see that it is needed, remove this function and run `pytest tests/test_subtranslator_helper.py::test_are_subtranslators_imported`
-    from jace.translator import primitive_translators  # noqa: F401  # Unused import
-
-
-_ensure_build_in_translators_are_loaded()
-del _ensure_build_in_translators_are_loaded
-
-
 __all__ = [
     "__author__",
     "__copyright__",
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index 1651000..1e091e8 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -72,6 +72,7 @@ def register_primitive_translator(
     Notes:
         Can only be used to register instances.
     """
+    from jace import translator
 
     def wrapper(
         prim_translator: translator.PrimitiveTranslator | translator.PrimitiveTranslatorCallable,

From 7d0b6b962a27e7d44926fa291017c63b781be035 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 16:06:02 +0200
Subject: [PATCH 174/458] Fixed some potential of cyclic import in the API.

---
 src/jace/jax/api.py | 12 +++++++++---
 1 file changed, 9 insertions(+), 3 deletions(-)

diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
index 806a9d2..e47a8d7 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/jax/api.py
@@ -11,17 +11,21 @@
 
 import functools as ft
 from collections.abc import Callable, Mapping
-from typing import Any
+from typing import TYPE_CHECKING, Any
 
 import jax as _jax_jax
 
-from jace import jax as jjax, translator
+from jace import translator
+
+
+if TYPE_CHECKING:
+    from jace import jax as jjax
 
 
 def jit(
     fun: Callable | None = None,
     /,
-    sub_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
+    sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable] | None = None,
     **kwargs: Any,
 ) -> jjax.JaceWrapped | Callable:
     """Jace's replacement for `jax.jit` (just-in-time) wrapper.
@@ -44,6 +48,8 @@ def jit(
         )
 
     def wrapper(f: Callable) -> jjax.JaceWrapped:
+        from jace import jax as jjax  # Cyclic import
+
         jace_wrapper = jjax.JaceWrapped(
             fun=f,
             sub_translators=(

From ff9af79fec4a22692608838b97292c4c77cc78fb Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 17 May 2024 16:06:33 +0200
Subject: [PATCH 175/458] Updated the translation cache.

---
 src/jace/jax/translation_cache.py | 57 +++++--------------------------
 1 file changed, 8 insertions(+), 49 deletions(-)

diff --git a/src/jace/jax/translation_cache.py b/src/jace/jax/translation_cache.py
index d67b1e9..bed803a 100644
--- a/src/jace/jax/translation_cache.py
+++ b/src/jace/jax/translation_cache.py
@@ -227,11 +227,8 @@ class CachedCallDescription:
     This class represents both the `JaceWrapped.lower()` and `JaceLowered.compile()` calls.
 
     The actual key is composed of two parts, first the "origin of the call".
-    For `JaceLowered` the lowered SDFG is used, because we assume immutability across the whole translation chain,
-    we relay on its built-in  `__hash__()` and `__eq__`, which fall back to their address.
-
-    For `JaceWrapped` objects the first part includes the wrapped function.
-    Then it also includes the addresses of the jit options and the set of used subtranslators.
+    For this we just use the address of the stage object we are caching and hope that the
+    address is not reused for another stag anytime soon.
 
     The second part is of the key are a description of the actual arguments, see `CallArgsDescription` type alias.
     There are two ways for describing the arguments:
@@ -244,21 +241,16 @@ class CachedCallDescription:
     In addition an argument can be positional or a named argument,
     in which case it consists of a `tuple[str, _AbstarctCallArgument  | _ConcreteCallArgument]`.
 
+    Notes:
+        The base assumption is that the stages are immutable.
+
     Todo:
         - pytrees.
         - Turn the references into week references, Jax does this and I am sure there is a reason for it.
         - Turn this into a strategy.
     """
 
-    # Origin Part for `JaceWrapped`:
-    fun: Callable | None
-    sub_trans_id: int | None
-    jit_ops_id: int | None
-
-    # Origin Part for `JaceLowered`:
-    sdfg: dace.SDFG | None
-
-    # Argument Part of the key
+    stage_id: int
     fargs: CallArgsDescription
 
     @classmethod
@@ -277,26 +269,6 @@ def make_call_description(
             if len(kwargs) != 0:
                 raise NotImplementedError("'kwargs' are not implemented in 'JaceWrapped.lower()'.")
 
-            fun = stage.wrapped_fun
-            sdfg = None
-
-            # We have to guard ourselves from the case of annotating the same function, but using different translators.
-            #  Thus we have to include the translators somehow in the cache description.
-            #  As outlined in `JaceWrapped.__init__()`, the list of subtranslators is copied by the constructor,
-            #  thus it is unique, and its address serves as a key.
-            #  The special design of the copying in `JaceWrapped.__init__()`, will not make a copy if the set is the current global set.
-            #  This design will cache most aggressively, if the subtranslator are set up at the beginning and then never again.
-            #  Which should also be the main use case.
-            # The best we could probably do is some kind of content hash, i.e. creating a sorted list of `(prim_name, id(prim_trans))` tuples.
-            #  However, this is relatively expensive and probably an overkill.
-            sub_trans_id = id(stage._sub_translators)
-
-            # From the discussion above it becomes clear that we also have to include the Jax options in the hash.
-            #  Currently `JaceWrapper.__init__()` shallow copies it, in the assumption that this is enough.
-            #  We could also do some kind of semantic hash, but currently we just cache on its address,
-            #  with the optimization that "supplying no options" is handled explicitly.
-            jit_ops_id = id(stage._jit_ops) if len(stage._jit_ops) != 0 else None
-
             # Currently we only allow positional arguments and no static arguments.
             #   Thus the function argument part of the key only consists of abstract arguments.
             fargs: tuple[_AbstarctCallArgument, ...] = tuple(
@@ -305,11 +277,6 @@ def make_call_description(
 
         elif isinstance(stage, stages.JaceLowered):
             # JaceLowered.compile() to JaceCompiled
-            #  We do not have to deepcopy the sdfg, since we assume immutability.
-            fun = None
-            sub_trans_id = None
-            jit_ops_id = None
-            sdfg = stage.compiler_ir().sdfg
 
             #   We only accepts compiler options, which the Jax interface mandates
             #   are inside a `dict` thus we will get at most one argument.
@@ -321,16 +288,10 @@ def make_call_description(
                 raise ValueError("Only a 'dict' is allowed as argument to 'JaceLowered.compile()'.")
             if (len(args) == 0) or (args[0] is None):
                 # Currently we consider no argument and `None` as "use the default argument".
-                #  This should be in accordance with Jax. See also `JaceLowered.compile()`.
+                #  Which is what Jax does.
                 comp_ops: stages.CompilerOptions = stages.JaceLowered.DEF_COMPILER_OPTIONS
             else:
-                # Compiler options where given.
                 comp_ops = args[0]
-            assert isinstance(comp_ops, dict)
-            assert all(
-                isinstance(k, str) and isinstance(v, _ConcreteCallArgument)
-                for k, v in comp_ops.items()
-            )
 
             # We will now make `(argname, argvalue)` pairs and sort them according to `argname`.
             #  This guarantees a stable order.
@@ -344,9 +305,7 @@ def make_call_description(
         else:
             raise TypeError(f"Can not make key from '{type(stage).__name__}'.")
 
-        return cls(
-            fun=fun, sdfg=sdfg, sub_trans_id=sub_trans_id, jit_ops_id=jit_ops_id, fargs=fargs
-        )
+        return cls(stage_id=id(stage), fargs=fargs)
 
 
 class TranslationCache:

From 1feff89560847c152c9aa6d32b901326cf42d0c1 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 19 May 2024 14:15:31 +0200
Subject: [PATCH 176/458] First rework.

Not all is working yet but the majority is again.
---
 .../translator/jaxpr_translator_driver.py     | 441 +++++-------------
 src/jace/translator/translated_jaxpr_sdfg.py  |  63 +--
 src/jace/util/__init__.py                     |   8 +-
 src/jace/util/jax_helper.py                   | 110 +++--
 src/jace/util/traits.py                       |  26 +-
 src/jace/util/util.py                         |  23 +-
 6 files changed, 243 insertions(+), 428 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index f95c207..294d0a1 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -7,9 +7,8 @@
 
 from __future__ import annotations
 
-import itertools
-from collections.abc import Iterable, Mapping, MutableSequence, Sequence
-from typing import TYPE_CHECKING, Any, Final, Literal, cast, overload
+from collections.abc import Mapping, MutableSequence, Sequence
+from typing import TYPE_CHECKING, Any, Literal, cast, overload
 
 import dace
 import jax
@@ -35,36 +34,32 @@ class JaxprTranslationDriver:
     - the `arg_names` parameter is not set.
 
     For these reasons the SDFG is not directly usable, and further manipulations have to be performed.
-    Especially, DaCe's validation function will fail and it is unable to be perocessed by the optimization pipeline.
-    For more information also see `jace.translator.post_translation` module for more information.
+    Especially, DaCe's validation function will fail and it is unable to be processed by the optimization pipeline.
+    For more information also see `jace.translator.post_translation` module.
 
-    The idea of the translator is extremely simple. Since Jaxpr is a list
-    consisting of more or less simple instructions/equations, they get processed
-    one after the other. Each equation is translated into its own state that
-    is appended to the SDFG, thus the SDFG is a long list of states. In certain
-    cases it might be that an equation needs more states, but this is an exception.
+    The idea of the translator is extremely simple.
+    Since Jaxpr is a list consisting of more or less simple instructions/equations, they get processed one after the other.
+    Each equation is translated into its own state that is appended to the SDFG, thus the SDFG is a long list of states.
+    In certain cases it might be that an equation needs more states, but this is an exception.
 
     The actual translation of the equation is not handled by the driver.
     Instead the request is forwarded to a `PrimitiveTranslator` object, also known as subtranslator.
     This is a highly specialized object that is able to handle one kind of primitive.
     For more information on the subtranslators see the documentation of `PrimitiveTranslator`.
-    The actual translators are supplied from the outside at construction time.
 
-    To start a translation the `translate_jaxpr()` function should be called,
-    if this happens it is said that the driver has an ongoing translation.
-    If `translate_jaxpr()` is called on driver that has an ongoing translation, a new translation context will be set up.
+    To start a translation the `translate_jaxpr()` function should be called, if this happens it is said that the driver has an ongoing translation.
+    If `translate_jaxpr()` is called on a driver that has an ongoing translation, a new translation context will be set up.
     Thus the driver will then translate the supplied (nested) Jaxpr and return the result.
     However, this will have no influence on the translation process that is already going.
 
     Notes:
-        The translator is able to handle multiple consecutive translations.
+        After the main translation has been performed the translator object can be used again.
     """
 
     __slots__ = (
         "_ctx_stack",  # Stack of all contexts
-        "_reserved_names",  # Part of the context, but is copied.
         "_sub_translators",
-        "_rev_manager",
+        "_jax_name_map",
     )
 
     def __init__(
@@ -83,35 +78,28 @@ def __init__(
                 `get_regsitered_primitive_translators()` or pass a copy as argument.
         """
 
-        # Shared with the outside, while key and mapped values are immutable,
-        #  the mapping itself is not, but it should be fine.
-        #  Allocated through the lifetime of `self`.
+        # Maps the name of a Jax primitive to the primitive translator that should be used.
+        #  Note that the subtranslator is only required to be a callable, and immutable.
+        #  Allocated through the lifetime of `self`, and shared with the outside.
         self._sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable] = (
             sub_translators
         )
 
-        # These names can not be used for the automatic naming of Jax variables.
-        #  They differ from the forbidden names, that they denote valid SDFG names.
-        #  An example would be names of the function arguments.
-        #  Only allocated during an ongoing translation.
-        self._reserved_names: set[str] = None  # type: ignore[assignment]
-
-        # Shared revision counter manager.
-        #  Generates the revision numbers we need.
-        #  Is reset after every translation.
-        self._rev_manager: itertools.count[int] = itertools.count(0, 1)
+        # Maps Jax variables to the name of its SDFG equivalent.
+        #  Note that it is shared among all translation contexts.
+        #  This is done to create consistency between SDFG variables
+        #  and the names used pretty printed Jaxprs.
+        self._jax_name_map: dict[jax_core.Var | util.JaCeVar, str] = {}
 
         # Context stack and current context.
-        #  Only allocated during an ongoing translation
+        #  If it is empty, then no translation process is in process.
         self._ctx_stack: list[translator.TranslatedJaxprSDFG] = []
 
     def translate_jaxpr(
         self,
         jaxpr: jax_core.ClosedJaxpr,
         *,
-        inp_scalar_as_array: bool = False,
         name: str | None = None,
-        reserved_names: str | Iterable[str] = (),
     ) -> translator.TranslatedJaxprSDFG:
         """Perform the translation of a Jaxpr into a SDFG.
 
@@ -120,13 +108,10 @@ def translate_jaxpr(
 
         Returns:
             The function will translate the passed Jaxpr object into an SDFG in canonical form.
-            This SDFG together with additional meta data, that is needed for further processing
-            is encapsulated inside a `TranslatedJaxprSDFG` object.
+            This SDFG together with additional meta data, that is needed for further processing is encapsulated inside a `TranslatedJaxprSDFG` object.
 
         Args:
-            inp_scalar_as_array:    Translate scalar _input_ arguments to arrays of length 1.
             name:                   Use this name for the SDFG instead some generated one.
-            reserved_names:         Prevent the generation of variables with these names, see `self.add_array()` for more.
         """
         if len(jaxpr.effects) != 0:
             raise NotImplementedError("'Jaxpr' with side effects are not supported.")
@@ -140,15 +125,11 @@ def translate_jaxpr(
         #       this must be done manually.
         self._allocate_translation_ctx(
             name=name,
-            reserved_names=reserved_names,
         )
         self._create_constants(
             jaxpr=jaxpr,
         )
-        self._create_initial_input(
-            jaxpr=jaxpr,
-            inp_scalar_as_array=inp_scalar_as_array,
-        )
+        self._create_initial_input(jaxpr=jaxpr)
         # Note that `self` and `jsdfg` still share the same underlying memory, i.e. context.
         jsdfg: translator.TranslatedJaxprSDFG = self._translate_jaxpr_internal(jaxpr)
         self._clear_translation_ctx()
@@ -164,19 +145,17 @@ def append_new_state(
     ) -> dace.SDFGState:
         """Creates a new `SDFGState` and adds it to the SDFG.
 
-        By default the new state is appended to the current terminal state.
-        This will also update the terminal SDFG state of `self`.
+        By default the new state is appended to the current terminal state,
+        which will also update the terminal state of recorded inside `self`.
 
-        However, if `prev_state` is specified the state new state will be
-        appended to `prev_state` instead. This will not modify the terminal
-        state unless `prev_state` is the current terminal state.
+        However, if `prev_state` is specified the state new state will be appended to `prev_state` instead.
+        The terminal state of `self` will only be modified if `prev_state` is the current terminal state.
 
         Args:
             label:          The name that should be given to the new `SDFGState`.
             condition:      The condition of the state transitions used on the `InterstateEdge`.
             assignments:    Symbol assignments that should be done during the transition.
             prev_state:     Alternative `SDFGState` at which we should append the new state.
-
         """
         if isinstance(label, str) and (not util.VALID_SDFG_OBJ_NAME.fullmatch(label)):
             raise ValueError(f"Can not create state with label '{label}' since it is invalid.")
@@ -202,7 +181,7 @@ def append_new_state(
 
     @property
     def arrays(self) -> Mapping[str, ddata.Data]:
-        """Get all `Data` descriptors that are currently known to the SDFG.
+        """Get all data descriptors that are currently known to the SDFG.
 
         Notes:
             Essentially a shorthand and preferred way for `self.sdfg.arrays`.
@@ -217,16 +196,16 @@ def get_array(
         """Returns the SDFG `Data` object `name` referees to.
 
         If `name` is a string it is directly interpreted as the name of an SDFG variable.
-        In case it is a `jax.core.Atom` it is first translated, see `self.map_jax_var_to_sdfg()`.
+        In other cases it is first translated using `self.map_jax_var_to_sdfg()`.
         """
-        if isinstance(name, str):
-            sdfg_name: str = name
-        elif isinstance(name, (jax_core.Var, util.JaCeVar)):
-            sdfg_name = self.map_jax_var_to_sdfg(name)
+        if isinstance(name, (jax_core.Var, util.JaCeVar)):
+            sdfg_name: str = self.map_jax_var_to_sdfg(name)
+        elif isinstance(name, str):
+            sdfg_name = name
         else:
-            raise TypeError(f"Does not know how to handle '{type(name).__name__}'.")
+            raise TypeError(f"The literal '{name}' does not have an SDFG equivalent.")
         if sdfg_name not in self._ctx.sdfg.arrays:
-            raise KeyError(f"Requested SDFG array '{name}' but it is not known.")
+            raise KeyError(f"Requested SDFG object '{name}' is not known.")
         return self._ctx.sdfg.arrays[sdfg_name]
 
     @overload
@@ -251,7 +230,7 @@ def map_jax_var_to_sdfg(
 
         Args:
             jax_var:        The Jax variable to look up.
-            allow_fail:     If mapping is not known return `None` instead of raise `KeyError`.
+            allow_fail:     If mapping is not known return `None` instead of raising `KeyError`.
         """
         if isinstance(jax_var, jax_core.Literal):
             raise RuntimeError("There is no SDFG variable for literal '{jax_var}'.")
@@ -276,16 +255,6 @@ def sdfg(self) -> dace.SDFG:
         """
         return self._ctx.sdfg
 
-    @property
-    def terminal_sdfg_state(self) -> dace.SDFGState:
-        """Returns the current terminal state of the SDFG under construction.
-
-        The SDFGs that are constructed by the driver are essentially a list of states.
-        New states are appended at the current terminal/end state and becoming the new terminal state.
-        This function returns the current terminal state.
-        """
-        return cast(dace.SDFGState, self._ctx.terminal_state)
-
     def is_allocated(self) -> bool:
         """Tests if `self` has an allocated context.
 
@@ -302,17 +271,10 @@ def is_root_translator(self) -> bool:
         """
         if not self.is_allocated():
             raise RuntimeError("Driver is not allocated.")
-        if self._ctx.rev_idx == 0:
+        if len(self._ctx_stack) == 1:
             return True
         return False
 
-    @property
-    def rev_idx(self) -> int:
-        """Returns the revision index of `self`."""
-        if not self.is_allocated():
-            raise RuntimeError("Driver is not allocated.")
-        return cast(int, self._ctx.rev_idx)
-
     def add_jax_name_mapping(
         self,
         jax_var: jax_core.Var | util.JaCeVar,
@@ -320,10 +282,8 @@ def add_jax_name_mapping(
     ) -> JaxprTranslationDriver:
         """Creates a mapping between `jax_var` to `sdfg_name`.
 
-        This function updates the internal map of `self` and after the call
-        `self.map_jax_var_to_sdfg()` will identify `jax_var` with `sdfg_name`.
-        This function is not able to delete a variable mapping that was
-        established before, for this use TBA.
+        This function updates the internal map of `self` and after the call `self.map_jax_var_to_sdfg()` will identify `jax_var` with `sdfg_name`.
+        This function is not able to delete a variable mapping that was established before, for this use TBA.
 
         Args:
             jax_var:     The Jax variable.
@@ -340,197 +300,62 @@ def add_jax_name_mapping(
             )
         if sdfg_name not in self._ctx.sdfg.arrays:
             raise KeyError(f"Mapping '{jax_var} -> {sdfg_name}': SDFG target unknown.")
-        if sdfg_name in self._forbidden_names:
+        if sdfg_name in util.FORBIDDEN_SDFG_VAR_NAMES:
             raise NameError(f"Mapping '{jax_var} -> {sdfg_name}': Forbidden name.")
 
         self._jax_name_map[jax_var] = sdfg_name
         return self
 
-    def add_reserved_names(
-        self,
-        reserved_names: str | Iterable[str],
-    ) -> JaxprTranslationDriver:
-        """Adds the names listed in `reserved_names` to the internal list."""
-
-        if not reserved_names:
-            return self
-        if isinstance(reserved_names, str):
-            reserved_names = [reserved_names]
-        self._reserved_names.update(reserved_names)
-        return self
-
     def add_array(
         self,
         arg: jax_core.Atom | util.JaCeVar,
         *,
-        as_transient: bool = True,
-        alt_name: str | None = None,
         name_prefix: str | None = None,
-        find_new_name: bool | None = None,
-        force_array: bool = False,
-        strides: Sequence[int | dace.symbol | str] | None = None,
-        allow_literals: bool = False,
-        force_jax_name: bool = False,
         update_var_mapping: bool = False,
     ) -> str:
         """Creates an SDFG variable for the Jax variable `arg` and returns its SDFG name.
 
-        By default the function will create a transient, use `as_transient=True` to change that.
-        By default the function will honor if the Jax variable is a scalar or an array.
-        However, by setting `force_array` the function will always generate an array.
+        By default this function will _not_ update the internal variable list mapping.
+        If you wish to do that, which is recommended you should set `update_var_mapping` to `True`.
 
-        By default the name for the SDFG variable is derived from the Jax variable.
-        It is guaranteed that this name is unique in the SDFG, even in the presence of nested SDFGs.
-        By specifying `alt_name` it is possible to force a certain name on a variable.
-        It is important that if `alt_name` is specified the function will either generate the variable or fail.
-
-        The  driver distinguishes between two kinds of "bad (SDFG) variable names".
-        The first category are the forbidden names, which the function refuses to generate.
-        The second type are the so called reserved names, which were set at the beginning, or by `self.add_reserved_names()`.
-        These names can be used if the name is specified through `alt_name` but are not used in automatic naming.
-
-        If nothing is specified, the strides of the data are determined by DaCe, which is continuous C order.
-        It is possible to set a certain values by setting `strides` appropriate.
-
-        By default this function does not update the internal variable map.
-        However, by setting `update_var_mapping` to `True` the function will
-        update the mapping.
+        The function will create either scalar or Array transients.
+        By default the function will extract all necessary information using the `jace.util.get_jax_var_*` functions.
+        For the naming the function will use the `jace.util.propose_jax_name()` function and pass the internal variable mapping.
+        If you need to create a rather special variable, it is advised to pass a `JaCeVar` instance.
 
         Args:
             arg:                The Jax object for which a SDFG equivalent should be created.
-            as_transient:       If set, the SDFG variable is a transient, `True` by default.
-            alt_name:           Try to create the variable with this name; either succeed or fail.
-            name_prefix:        If given and in automatic naming mode, add this prefix to the name.
-            find_new_name:      The translator will try to find a new name if the designated is already occupied.
-            force_array:        Instead of a `dace.Scalar` create a `dace.Array` with one element.
-            strides:            Instead of the default strides use these values.
-            allow_literals:     If `True` then also allows JaxLiterals as `arg`.
-            force_jax_name:     If `True` then, the verbatim Jax name will be used.
+            name_prefix:        If given it will be used as prefix for the name.
             update_var_mapping: Update the internal variable mapping; by default `False`.
-
-        Notes:
-            If this function is used directly a user is advised to always set
-                `update_var_mapping` to `True`.
-            If you need to create a special array, you can use `jace.util.JaCeVar`
-                to create a pseudo Jax variable.
         """
-        shape: tuple[int] = util.get_jax_var_shape(arg)
-        dtype = util.get_jax_var_dtype(arg)
-        offset = None  # i.e. no offset
+        shape: tuple[int | dace.symbol | str, ...] = util.get_jax_var_shape(arg)
+        dtype: dace.typeclass = util.get_jax_var_dtype(arg)
+        strides: tuple[int | dace.symbol | str, ...] | None = util.get_jax_var_strides(arg)
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
+        offset = None  # i.e. no offset
         is_scalar: bool = shape == ()
+        as_transient: bool = True
 
-        if force_jax_name:
-            if alt_name is not None:
-                raise ValueError(
-                    f"Specified 'force_jax_name', but passed '{alt_name}' as 'alt_name'."
-                )
-            if name_prefix is not None:
-                raise ValueError(
-                    f"Specified 'force_jax_name', but passed '{name_prefix}' as 'name_prefix'."
-                )
-            if find_new_name:
-                raise ValueError("Specified `force_jax_name` but also wanted a new name.")
-            find_new_name = False
-            alt_name = util.propose_jax_name(arg, self._jax_name_map)
-        if alt_name is not None:
-            find_new_name = False  # If a name was given, then use it no matter what.
-            if len(alt_name) == 0:
-                raise ValueError("Passed an empty 'alt_name'.")
-            if alt_name in self._forbidden_names:
-                raise ValueError("'alt_name' is a forbidden name.")
-            if not util.VALID_SDFG_VAR_NAME.fullmatch(alt_name):
-                raise ValueError(f"The passed name 'alt_name' '{alt_name}' is invalid.")
-            if update_var_mapping and arg in self._jax_name_map:
-                raise ValueError(f"Variable '{alt_name}' already registered.")
-            if alt_name in self._ctx.sdfg.arrays:
-                raise ValueError(f"Variable '{alt_name}' already exists.")
-            if name_prefix is not None:
-                raise ValueError(
-                    f"Specified 'name_prefix' ('{name_prefix}') but passed '{alt_name}' as 'alt_name'."
-                )
-        if (name_prefix is not None) and (len(name_prefix) == 0):
-            raise ValueError("Specified an empty 'name_prefix'.")
-
-        # Now we determine the proposed name of the variable.
-        #  Depending on the situation, we will further manipulate it.
-        if alt_name is not None:
-            prop_name = alt_name  # Just for completion: will be ignored later
-        elif isinstance(arg, (jax_core.Var, util.JaCeVar)):
-            prop_name = util.propose_jax_name(arg, self._jax_name_map)
-            assert not prop_name.startswith("__")
-            if name_prefix is not None:
-                prop_name = name_prefix + prop_name
-        elif isinstance(arg, jax_core.Literal):  # type: ignore[unreachable]
-            if not allow_literals:  # Allows to use a literal as template.
-                raise NotImplementedError("Jax Literals are not supported.")
-            if alt_name is None:
-                raise ValueError(f"Passed literal '{arg}', but not specified a name to use.")
-
-        if alt_name is None:
-            # If we are the root translator, then we will use `prop_name` directly;
-            #  otherwise we will append the revision of `self` to the name.
-            arg_name = prop_name + (
-                "" if self.is_root_translator() else f"_rev_idx{self._ctx.rev_idx}"
-            )
-        else:
-            # Use the supplied name directly.
-            arg_name = str(alt_name)
-
-        # Checking the strides.
-        if strides is not None:
-            if is_scalar:
-                raise ValueError("Specified a stride for a scalar.")
-            if isinstance(strides, (str, dace.symbol, int)):
-                strides = (strides,)
-            elif not isinstance(strides, tuple):
-                strides = tuple(strides)
-            if len(strides) != len(shape):
-                raise ValueError(
-                    f"'strides' has length {len(strides)}, but array rank is {len(shape)}."
-                )
-
-        # Determine if we should look for a new name or not, if nothing was specified
-        if find_new_name is None:
-            if arg_name in self._reserved_names:
-                find_new_name = True
-            if arg_name in self._forbidden_names:
-                # This is not an error, but happens if we handle Jax variable `if`.
-                find_new_name = True
-
-        if find_new_name:
-            name_tmpl = "_jax_variable__" + arg_name + "__{}"
-            for iCounter in range(1000):
-                _arg_name = name_tmpl.format(iCounter)
-                if (
-                    (_arg_name in self._forbidden_names)
-                    or (_arg_name in self._reserved_names)
-                    or (_arg_name in self._ctx.sdfg.arrays)
-                ):
-                    continue  # The proposed variable is known, so try next value.
-                arg_name = _arg_name  # We found a name that we can use.
-                break
-            else:
-                raise ValueError(f"Failed to find a replacement name for '{arg_name}'")
-            del iCounter, _arg_name
+        # Propose a name and if needed extend it.
+        arg_name = util.propose_jax_name(arg, self._jax_name_map)
+        assert not arg_name.startswith("__")
+        if name_prefix is not None:
+            arg_name = name_prefix + arg_name
 
-        # Final name check
-        if arg_name in self._forbidden_names:
-            raise ValueError(f"Can't create variable '{arg_name}', name is forbidden.")
-        if arg_name in self._ctx.sdfg.arrays:
-            raise ValueError(f"Can't create variable '{arg_name}', variable is already created.")
+        # final checks
+        if arg_name in util.FORBIDDEN_SDFG_VAR_NAMES:
+            raise ValueError(f"add_array({arg}): The proposed name '{arg_name}' is forbidden.")
         if not util.VALID_SDFG_VAR_NAME.fullmatch(arg_name):
-            raise ValueError(f"The requested variable name '{arg_name}' is invalid.")
-
-        # Promotion of scalar to array.
-        if is_scalar and force_array:
-            shape = (1,)
-            strides = None
-            is_scalar = False
+            raise ValueError(f"add_array({arg}): The proposed name '{arg_name} is invalid.")
+        if arg_name in self._ctx.sdfg.arrays:
+            raise ValueError(f"add_array({arg}): The proposed name '{arg_name}', is used.")
 
         if is_scalar:
             self._ctx.sdfg.add_scalar(
-                name=arg_name, storage=storage, dtype=dtype, transient=as_transient
+                name=arg_name,
+                storage=storage,
+                dtype=dtype,
+                transient=as_transient,
             )
         else:
             self._ctx.sdfg.add_array(
@@ -579,12 +404,10 @@ def create_jax_var_list(  # type: ignore[misc]
         """Creates SDFG variables for the listed Jax variables and returns their SDFG names.
 
         If a Jax variable already has a SDFG equivalent then the function will use this variable.
-        If no SDFG variable is known the function will create one using `add_array()`, with `update_var_mapping` set to `True`.
+        If no corresponding SDFG variable is known the function will create one using `add_array()`, with `update_var_mapping` set to `True`.
 
-        By setting `prevent_creation` the function will not create any new SDFG variables.
-        This mode is used to indicate that all variables have to exists already.
-        By setting `only_creation` the function will only create new SDFG variables.
-        If a Jax variable already has a known SDFG equivalent an error is generated.
+        By setting `prevent_creation` the function will not create any new SDFG variables, if no already existing variable is found an error is generated.
+        By setting `only_creation` the function will only create new SDFG variables, if a variable was already processed an error will be created.
 
         By default literals cause an error.
         However, by setting `handle_literals` to `True` literals will will be included in the output with the value `None`.
@@ -613,7 +436,7 @@ def create_jax_var_list(  # type: ignore[misc]
                 sdfg_name = None
             else:
                 mapped_sdfg_name: str | None = self.map_jax_var_to_sdfg(jax_var, allow_fail=True)
-                if (mapped_sdfg_name is None) and prevent_creation:
+                if prevent_creation and (mapped_sdfg_name is None):
                     raise ValueError(f"'prevent_creation' given but have to create '{jax_var}'.")
                 if mapped_sdfg_name is None:
                     sdfg_name = self.add_array(arg=jax_var, update_var_mapping=True, **kwargs)
@@ -621,9 +444,6 @@ def create_jax_var_list(  # type: ignore[misc]
                     raise ValueError(f"'only_creation' given '{jax_var}' already exists.")
                 else:
                     sdfg_name = mapped_sdfg_name
-                # Calling `add_jax_name_mapping` is save, because if the mapping does already exists it is a no ops.
-                self.add_jax_name_mapping(jax_var, sdfg_name)
-
             ret_list.append(sdfg_name)
 
         return ret_list
@@ -631,38 +451,30 @@ def create_jax_var_list(  # type: ignore[misc]
     def _create_initial_input(
         self,
         jaxpr: jax_core.ClosedJaxpr,
-        inp_scalar_as_array: bool,
     ) -> Sequence[str]:
         """This function will create the internal input variables that are used for the SDFG.
 
         Args:
             jaxpr:                  The Jaxpr that we want to translate.
-            inp_scalar_as_array:    Promote scalars to arrays of size one.
 
         Returns:
             The list of SDFG variables used as input arguments of `jaxpr` in the same order.
 
         Notes:
-            This function will fill the internal list of inputs.
+            The function will populate the `inp_names` member of the current context.
         """
         if not self.is_allocated():
             raise RuntimeError("Driver is not allocated, can not create constants.")
-        if len(self._ctx.inp_names) != 0:
-            raise RuntimeError("Called '_create_initial_input()' twice?")
+        assert len(self._ctx.inp_names) == 0
 
         # Handle the initial input arguments
-        sdfg: dace.SDFG = self._ctx.sdfg
         init_in_var_names: Sequence[str] = self.create_jax_var_list(
             jax_var_list=jaxpr.jaxpr.invars,
-            only_creation=True,
-            as_transient=True,  # Explicit transient; no error!
+            only_creation=True,  # Nothing exists yet.
             handle_literals=False,  # Initial arguments are never literals
-            force_array=inp_scalar_as_array,
-            force_jax_name=self.is_root_translator(),  # Ensure root get pure Jax names.
         )
-        # This forces the code to only accept kwargs
-        #  Is also part of "what a canonical sdfg" is.
-        sdfg.arg_names = []
+        # This forces the code to only accept kwargs; it is also part of "what a canonical sdfg" is.
+        self.sdfg.arg_names = []
 
         # The output list is populated by `self._translate_jaxpr_internal()`
         self._ctx.inp_names = tuple(init_in_var_names)
@@ -690,13 +502,11 @@ def _create_constants(
 
         sdfg_const_names: Sequence[str] = self.create_jax_var_list(
             jax_var_list=jaxpr.jaxpr.constvars,
-            only_creation=True,
-            strides=None,
+            only_creation=True,  # Nothing exists yet.
+            handle_literals=False,  # It seems that constants are never literals.
             name_prefix="__const_",
         )
-
         for sdfg_name, const_value in zip(sdfg_const_names, jaxpr.consts, strict=True):
-            # We have to pass the data descriptor to `add_constant()`, otherwise a new one would be created.
             self._ctx.sdfg.add_constant(
                 sdfg_name, deepcopy(const_value), self._ctx.sdfg.arrays[sdfg_name]
             )
@@ -705,7 +515,6 @@ def _create_constants(
     def _allocate_translation_ctx(
         self,
         name: str | None = None,
-        reserved_names: str | Iterable[str] = (),
     ) -> JaxprTranslationDriver:
         """This function allocates and initialize the members of the translation context of `self`.
 
@@ -715,29 +524,19 @@ def _allocate_translation_ctx(
 
         Args:
             name:               The name of the SDFG.
-            reserved_names:     Add these name to the set of resered names of `self`.
         """
         from jace import translator  # Cyclic import
 
         # Create a new translation context and put it on the stack.
         self._ctx_stack.append(
             translator.TranslatedJaxprSDFG(
-                rev_idx=next(self._rev_manager),
                 name=name,
             )
         )
 
         if self.is_root_translator():
-            # The root translation, i.e. the very first context allocation
-            #  Thus we also have to allocate the additional members
-            #  which are shared among all contexts.
-            self._reserved_names = set()
-            self.add_reserved_names(reserved_names)
-
-        else:
-            # We are in a nested context.
-            #  We might have to update the reserved names.
-            self.add_reserved_names(reserved_names)
+            # In the future we will populate the generate state here, i.e. if we are on GPU or not and so on.
+            assert len(self._jax_name_map) == 0
 
         return self
 
@@ -748,25 +547,23 @@ def _ctx(self) -> translator.TranslatedJaxprSDFG:
         return self._ctx_stack[-1]
 
     def _clear_translation_ctx(self) -> JaxprTranslationDriver:
-        """This function deallocate the translation context of `self`.
+        """This function deallocate the currently active translation context of `self`.
 
         Notes:
-            While it is allowed for outside code to call this function explicit
-                it is is most likely an error.
+            While it is allowed for outside code to call this function explicit it is is most likely an error.
             If `self` is not allocated this function acts as a noops.
-            The reserved names are only deallocated if `self` is a root translator.
+            If `self` is a root translator, then the function will also deallocate the shared state of `self`.
         """
         if not self.is_allocated():
             return self
 
         if self.is_root_translator():
-            self._rev_manager = itertools.count(0, 1)
-            self._reserved_names = None  # type: ignore[assignment]
-            self._ctx_stack.pop()
+            # The translation as a whole has finished, so restore the driver,
+            #  i.e. delete all the shared state.
+            self._jax_name_map = {}
 
-        else:
-            # Restore the previous state
-            self._ctx_stack.pop()
+        # Remove the current head stack.
+        _ = self._ctx_stack.pop()
         return self
 
     def _translate_single_eqn(
@@ -798,7 +595,7 @@ def _translate_single_eqn(
             self.create_jax_var_list(
                 eqn.invars,
                 prevent_creation=True,  # Inputs must already exists.
-                handle_literals=True,  #  but they can be literals.
+                handle_literals=True,  #   but they can be literals.
             )
         )
         out_var_names: MutableSequence[str] = self.create_jax_var_list(
@@ -813,7 +610,7 @@ def _translate_single_eqn(
         subtranslator = self._sub_translators[prim_name]
 
         # Create the state into which the equation should be translated
-        last_term_state: dace.SDFGState = self.terminal_sdfg_state  # noqa: F841 # Will be used later
+        last_term_state: dace.SDFGState = self._terminal_sdfg_state  # noqa: F841 # Will be used later
         eqn_state = self.append_new_state(
             label=f"{eqn.primitive.name}_{'_'.join(out_var_names)}",
             prev_state=None,  # forces terminal state to use
@@ -835,7 +632,7 @@ def _translate_single_eqn(
             new_sdfg_term_state = eqn_state
 
         # In case a subtranslator decided to not use the variables we created for it, which is allowed
-        #  but he must update the `out_var_names` list correctly, we will now verify this.
+        #  but it must update the `out_var_names` list correctly, we will now verify this.
         for expectedSDFGName, jax_var in zip(out_var_names, eqn.outvars, strict=True):
             mapped_sdfg_name = self.map_jax_var_to_sdfg(jax_var)
             if mapped_sdfg_name != expectedSDFGName:
@@ -856,8 +653,8 @@ def _translate_jaxpr_internal(
     ) -> translator.TranslatedJaxprSDFG:
         """Performs the actual translation of the Jaxpr into an SDFG.
 
-        The function assumes that the context is allocated as well as initial variables.
-        The function will return the internal state of `self` as a `TranslatedJaxprSDFG` object.
+        The function assumes that the context is allocated as well as the initial variables.
+        The function will return the internal state of `self` encapsulated inside a `TranslatedJaxprSDFG` object.
         However, it will not deallocate the translation context, thus `self` and the return value share the same memory.
 
         Args:
@@ -865,9 +662,8 @@ def _translate_jaxpr_internal(
 
         Notes:
             The function will unconditionally handle empty Jaxpr.
-            Jax uses a variable with name `_` to indicate that this value is never read,
-                this is used by Jax to indicate that they are never read.
-                Such variables are included by some transformations such as `grad()`.
+            Equations that store into drop variables, i.e. with name `_`, will be skipped.
+                Jax used such variables to indicate that it is not needed, transformations such as `grad` include them.
         """
         nb_translated_eqn: int = 0
         out_var_names: Sequence[str] = ()
@@ -903,32 +699,30 @@ def _handle_null_jaxpr(
             The function returns a list denoting the SDFG variables that refers to the output.
             The order of the list is the same as in `jaxpr.jaxpr.outvars`.
         """
-        if len(jaxpr.eqns) != 0:
-            raise NotImplementedError("'_handle_null_jaxpr()' was called for a non empty Jaxpr.")
-        if len(jaxpr.out_avals) == 0:
-            # There is not output so we do not have to copy anything around.
-            return ()
         assert self._ctx.terminal_state is self._ctx.start_state
         assert len(self._ctx.inp_names) > 0
         assert len(self._ctx.out_names) == 0
 
+        # There is not output so we do not have to copy anything around.
+        if len(jaxpr.out_avals) == 0:
+            return ()
+
         # List of the output variables.
         out_var_names: list[str] = []
 
-        # If we are here then we are dealing with a nested SDFG/Jaxpr.
+        # If we are here then we are dealing with a nested SDFG/Jaxpr, that has output.
         #  Because an input also serves as output, the nested SDFG will have a connector for the
         #  input and one for the output, but both with the same name.
         #  This will make node validation fail.
-        #  We have to work around by introducing some fake copies, which will be removed by DaCe later.
+        #  We have to work around this by introducing some fake copies, which will be removed by DaCe later.
         for jax_out_var in jaxpr.jaxpr.outvars:
-            # Since the output is also used as an input the variable mapping must be known.
+            # Since the output is also used as an input the variable mapping must be already known.
             sdfg_in_name: str = self.map_jax_var_to_sdfg(jax_out_var)
 
             # Now we create a variable that serves as true output, however, since the Jax variable
             #  is already known we can not update the variable mapping.
             sdfg_out_name = self.add_array(
                 jax_out_var,
-                as_transient=True,
                 name_prefix="_zero_equation_output_for_",
                 update_var_mapping=False,
             )
@@ -943,35 +737,20 @@ def _handle_null_jaxpr(
                 data=dace.Memlet.from_array(sdfg_in_name, self.get_array(sdfg_in_name)),
             )
 
-            # A Jax variable now has two SDFG equivalent, the input, that was previously created by
+            # A Jax variable now has, in some sense, two SDFG equivalent, the input, that was previously created by
             #  `self._create_initial_input()` and the `sdfg_out_name` we just created.
-            #  But we can not add this to the mapping, because of this situation we will now remove
-            #  the variable from the mapping. I am open for different approaches.
-            #  Note that input variables that are not used, will remain in the mapping.
+            #  But we can not add this to the mapping, because of this situation we will now remove the variable from the mapping all together.
+            #  I am open for different approaches.
+            #  Note that input variables that are not used as outputs, will remain in the mapping.
             self._jax_name_map.pop(jax_out_var)
 
         return tuple(out_var_names)
 
-    @property
-    def _jax_name_map(self) -> dict[jax_core.Var | util.JaCeVar, str]:
-        return cast(dict[jax_core.Var | util.JaCeVar, str], self._ctx.jax_name_map)
-
     @property
     def _start_state(self) -> dace.SDFGState:
         return cast(dace.SDFGState, self._ctx.start_state)
 
-    # fmt: off
-    _forbidden_names: Final[set[str]] = {
-        # These should be most of the C++ keywords, it is more important to have the short ones.
-        #  Taken from 'https://learn.microsoft.com/en-us/cpp/cpp/keywords-cpp?view=msvc-170'
-        'alignas', 'alignof', 'and', 'asm', 'auto', 'bitand', 'bitor', 'bool', 'break', 'case',
-        'catch', 'char', 'class', 'compl', 'concept', 'const', 'consteval', 'constexpr',
-        'constinit', 'continue', 'decltype', 'default', 'delete', 'directive', 'do', 'double',
-        'else', 'enum', 'explicit', 'export', 'extern', 'false', 'float', 'for', 'friend',
-        'goto', 'if', 'inline', 'int', 'long', 'mutable', 'namespace', 'new', 'noexcept', 'not',
-        'nullptr', 'operator', 'or', 'private', 'protected', 'public', 'register', 'requires',
-        'return', 'short', 'signed', 'sizeof', 'static', 'struct', 'switch', 'template', 'this',
-        'throw', 'true', 'try', 'typedef', 'typeid', 'typename', 'union', 'unsigned', 'using',
-        'virtual', 'void', 'volatile', 'while', 'xor', 'std',
-    }
-    # fmt: on
+    @property
+    def _terminal_sdfg_state(self) -> dace.SDFGState:
+        """Returns the current terminal state of the SDFG under construction."""
+        return cast(dace.SDFGState, self._ctx.terminal_state)
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 770ee0d..eae6292 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -8,7 +8,6 @@
 from __future__ import annotations
 
 import dace
-from jax import core as jax_core
 
 from jace import util
 
@@ -16,45 +15,37 @@
 class TranslatedJaxprSDFG:
     """Encapsulates the result of a translation run of the `JaxprTranslationDriver` object.
 
-    This class is also used to represent the internal state of the `JaxprTranslationDriver` during the translation.
-    For that reason the object defines some fields that only have a meaning during the actually translation.
-
     The fields used to store the result are:
     - `sdfg` the SDFG object that was created.
-    - `jax_name_map` a `dict` that maps every Jax variable to its corresponding SDFG variable _name_.
+    - `inp_names` a list of the SDFG variables that are used as input, in the same order as `Jaxpr.invars`.
+    - `out_names` a list of the SDFG variables that are used as output, in the same order as `Jaxpr.outvars`.
     - `start_state` the first state in the SDFG state machine.
     - `terminal_state` the last state in the state machine.
-    - `inp_names` a `list` of the SDFG variables that are used as input, in the same order as `Jaxpr.invars`.
-    - `out_names` a `list` of the SDFG variables that are used as output, in the same order as `Jaxpr.outvars`.
     - `is_finalized` a bool that indicates if `self` represents a finalized or canonical SDFG, see below.
-    - `rev_idx` the revision index, used for name mangling, however, outside of a translation process,
-        the value carries no meaning.
 
     Note, that it might happen that a name appears in both the `inp_names` and `out_names` lists.
     This happens if an argument is used both as input and output, and it is not an error.
     In Jax this is called argument donation.
 
-    If the flag `is_finalized` is `True` `self` carries a so called finalized SDFG.
-    In this case only the `sdfg`, `inp_names`, `out_names` and `is_finalized` fields remain allocated, all others are set to `None`.
-    Furthermore the SDFG is in the so called finalized form which is:
-    - All input an output arrays are marked as global.
-    - However, there are no `__return` arrays, i.e. all arguments are passed as arguments.
-    - Its `arg_names` are set with set `inp_names + out_names`, however,
+    By default `self` encapsulates a canonical SDFG, see `JaxprTranslationDriver` for more information on this.
+    However, if `is_finalized` is set, then `self` contains a finalized SDFG, i.e.
+    - all input an output arrays are marked as global,
+    - however, there are no `__return` arrays, i.e. all arguments are passed as arguments,
+    - its `arg_names` are set with set `inp_names + out_names`, however,
         arguments that are input and outputs are only listed as inputs.
+
+    Furthermore, only `sdfg`, `inp_names` and `out_names` are guaranteed to be allocated, all other fields might be `None`.
     """
 
     sdfg: dace.SDFG
     inp_names: tuple[str, ...]
     out_names: tuple[str, ...]
-    jax_name_map: dict[jax_core.Var | util.JaCeVar, str] | None
+    is_finalized: bool
     start_state: dace.SDFGState | None
     terminal_state: dace.SDFGState | None
-    rev_idx: int | None
-    is_finalized: bool
 
     def __init__(
         self,
-        rev_idx: int,
         name: str | None = None,
     ) -> None:
         """Initializes the context.
@@ -62,32 +53,26 @@ def __init__(
         The function allocates the SDFG and initializes the members properly.
 
         Args:
-            rev_idx:    The revision index of the context.
             name:       Name of the SDFG object.
+
+        Notes:
+            A user should never need to call this function.
         """
         if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
         self.sdfg = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
-        self.start_state = self.sdfg.add_state(label="initial_state", is_start_block=True)
-        self.terminal_state = self.start_state
-        self.jax_name_map = {}
         self.inp_names = ()
         self.out_names = ()
-        self.rev_idx = rev_idx
         self.is_finalized = False
+        self.start_state = self.sdfg.add_state(label="initial_state", is_start_block=True)
+        self.terminal_state = self.start_state
 
     def validate(self) -> bool:
         """Validate the underlying SDFG.
 
-        Only a finalized SDFG can be validated.
+        The actual SDFG is only validated for finalized SDFGs.
         """
-        if not self.is_finalized:
-            raise dace.sdfg.InvalidSDFGError(
-                "SDFG is not finalized.",
-                self.sdfg,
-                self.sdfg.node_id(self.sdfg.start_state),
-            )
         if len(self.inp_names) == 0:
             raise dace.sdfg.InvalidSDFGError(
                 "There are no input arguments.",
@@ -100,5 +85,21 @@ def validate(self) -> bool:
                 self.sdfg,
                 self.sdfg.node_id(self.start_state),
             )
+        if self.start_state and (self.start_state is not self.sdfg.start_block):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Expected to find '{self.start_state}' ({self.sdfg.node_id(self.start_state)}),"
+                f" instead found '{self.sdfg.start_block} ({self.sdfg.node_id(self.sdfg.start_block)}).",
+                self.sdfg,
+                self.sdfg.node_id(self.start_state),
+            )
+        if self.start_state and ({self.terminal_state} != set(self.sdfg.sink_nodes())):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Expected to find '{self.terminal_state}' ({self.sdfg.node_id(self.terminal_state)}),"
+                f" instead found '{self.sdfg.sink_nodes()}.",
+                self.sdfg,
+                self.sdfg.node_id(self.terminal_state),
+            )
+        if not self.is_finalized:
+            return True  # More we can not do for an unfinalized SDFG.
         self.sdfg.validate()
         return True
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index aaff453..7ee52c8 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -18,6 +18,7 @@
     get_jax_var_dtype,
     get_jax_var_name,
     get_jax_var_shape,
+    get_jax_var_strides,
     is_tracing_ongoing,
     propose_jax_name,
     translate_dtype,
@@ -34,7 +35,7 @@
     is_scalar,
 )
 from .util import (
-    VALID_JAX_VAR_NAME,
+    FORBIDDEN_SDFG_VAR_NAMES,
     VALID_SDFG_OBJ_NAME,
     VALID_SDFG_VAR_NAME,
     as_sequence,
@@ -56,13 +57,14 @@
     "is_non_string_iterable",
     "is_on_device",
     "is_scalar",
+    "get_jax_var_dtype",
     "get_jax_var_name",
     "get_jax_var_shape",
-    "get_jax_var_dtype",
+    "get_jax_var_strides",
     "translate_dtype",
     "run_jax_sdfg",
     "propose_jax_name",
-    "VALID_JAX_VAR_NAME",
     "VALID_SDFG_OBJ_NAME",
     "VALID_SDFG_VAR_NAME",
+    "FORBIDDEN_SDFG_VAR_NAMES",
 ]
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 98d65d7..e0b6f3a 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -18,7 +18,7 @@
 import itertools
 from collections.abc import Mapping
 from dataclasses import dataclass
-from typing import Any, overload
+from typing import Any
 
 import dace
 import jax.core as jax_core
@@ -28,25 +28,38 @@
 import jace.util as util
 
 
-@dataclass(init=True, repr=True, frozen=True, eq=False)
+@dataclass(repr=True, frozen=True, eq=False)
 class JaCeVar:
-    """Substitute class for Jax' `Var` instance.
+    """Replacement for the `jax.Var` class.
 
     This class can be seen as some kind of substitute `jax.core.Var`.
     The main intention of this class is as an internal representation of values,
     as they are used in Jax, but without the Jax machinery.
-    The main differences to Jax variable is that this class has a name.
+    The main difference is, that this class also carries a `strides` and a `name` member,
+    this can be used to influence how `JaxprTranslationDriver::add_array()` works.
 
     Notes:
         Main intention is to test functionality.
         If the name of a `JaCeVar` is '_' it is considered a drop variable.
         If the name of a `JaCeVar` is empty, the automatic naming will consider it as a Jax variable.
-        The definition of `__hash__` and `__eq__` is in accordance how Jax variable works.
+        The definitions of `__hash__` and `__eq__` are in accordance how Jax variable works.
     """
 
-    name: str
     shape: tuple[int | dace.symbol | str, ...]
     dtype: dace.typeclass
+    strides: tuple[int | dace.symbol | str, ...] | None = None
+    name: str | None = None
+
+    def __post_init__(self) -> None:
+        """Sanity checks."""
+        if not ((self.name is None) or util.VALID_SDFG_VAR_NAME.fullmatch(self.name)):
+            raise ValueError(f"Supplied the invalid name '{self.name}'.")
+        if (self.strides is not None) and (len(self.strides) != len(self.shape)):
+            raise ValueError(
+                f"Passed strides of rank {len(self.strides)}, but shape had rank {len(self.shape)}."
+            )
+        if not isinstance(self.dtype, dace.typeclass):  # To typechecking yet.
+            raise TypeError(f"'dtype' is not a 'dace.typeclass' but '{type(self.dtype).__name__}'.")
 
     def __hash__(self) -> int:
         return id(self)
@@ -57,51 +70,32 @@ def __eq__(self, other: Any) -> bool:
         return id(self) == id(other)
 
 
-def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar | str) -> str:
+def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
     """Returns the name of the Jax variable as a string.
 
     Args:
         jax_var:     The variable to stringify.
 
     Notes:
-        Due to some modification in Jax itself, this function is unable to return "proper" variable names.
-        This function is subject for removal.
+        If `jax_var` is a `JaCeVar` the function will return, if defined, its `.name` property.
+            Otherwise it will compose a name similar to Jax `Var` objects.
+        The returned names are stable, i.e. it will output the same value for the same variable.
+        The returned name passes the `util.VALID_SDFG_VAR_NAME` pattern.
     """
-
     match jax_var:
         case jax_core.DropVar():
             return "_"
         case JaCeVar():
-            # In case of an empty name consider the jace variable as a Jax variable.
-            #  This is mostly for testing.
-            jax_name = f"jax{id(jax_var)}" if jax_var.name == "" else jax_var.name
+            return jax_var.name if jax_var.name else f"jax{id(jax_var)}"
         case jax_core.Var():
-            # This stopped working after version 0.20.4, because of some changes in Jax
-            #  See `https://github.com/google/jax/pull/10573` for more information.
-            #  The following implementation will generate stable names, however, they will be decoupled
-            #  from output of the pretty printed Jaxpr
-            jax_name = f"jax{jax_var.count}{jax_var.suffix}"
+            # This is not how the pretty printer works nor Jax.Var.__repr__, but leads to stable names that can be used.
+            return f"jax{jax_var.count}{jax_var.suffix}"
         case jax_core.Literal():
             raise TypeError("Can not derive a name from a Jax Literal.")
-        case str():
-            jax_name = jax_var
         case _:
             raise TypeError(
                 f"Does not know how to transform '{jax_var}' (type: '{type(jax_var).__name__}') into a string."
             )
-    assert isinstance(jax_name, str)
-
-    if not util.VALID_JAX_VAR_NAME.fullmatch(jax_name):
-        raise ValueError(f"Deduced Jax name '{jax_name}' is invalid.")
-    return jax_name
-
-
-@overload
-def get_jax_var_shape(jax_var: JaCeVar) -> tuple[int | dace.symbol | str, ...]: ...  # type: ignore[overload-overlap]
-
-
-@overload
-def get_jax_var_shape(jax_var: jax_core.Atom) -> tuple[int, ...]: ...
 
 
 def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symbol | str, ...]:
@@ -119,6 +113,22 @@ def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symb
             raise TypeError(f"'get_jax_var_shape()` is not implemented for '{type(jax_var)}'.")
 
 
+def get_jax_var_strides(
+    jax_var: jax_core.Atom | JaCeVar,
+) -> tuple[int | dace.symbol | str, ...] | None:
+    """Returns the stride of `jax_var`.
+
+    If there is no stride specified return `None`.
+    """
+    match jax_var:
+        case jax_core.Var() | jax_core.Literal():
+            return getattr(jax_var.aval, "strides", None)
+        case JaCeVar():
+            return jax_var.strides
+        case _:
+            raise TypeError(f"'get_jax_var_strides()` is not implemented for '{type(jax_var)}'.")
+
+
 def get_jax_var_dtype(jax_var: jax_core.Atom | JaCeVar) -> dace.typeclass:
     """Returns the DaCe equivalent of `jax_var`s datatype."""
     match jax_var:
@@ -183,42 +193,44 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
 
 def propose_jax_name(
     jax_var: jax_core.Atom | JaCeVar,
-    jax_name_map: Mapping[jax_core.Var | JaCeVar, Any] | None = None,
+    jax_name_map: Mapping[jax_core.Var | JaCeVar, str] | None = None,
 ) -> str:
     """Proposes a variable name for `jax_var`.
 
-    There are two modes for proposing new names.
-    In the first mode, `get_jax_var_name()` is used to derive a name.
-    The second mode, proposes a name based on all names that are already known,
-    this leads to names similar to the ones used by Jax.
+    If `jax_name_map` is `None` then the function will fallback to `get_jax_var_name()`.
+    If `jax_name_map` is supplied the function will:
+    - if `jax_var` is stored inside the mapping that value will be returned.
+    - if `jax_var` is a `JaCeVar` with a set `.name` property it will be returned.
+    - otherwise the function will generate a new name similar to how the pretty printer of Jaxpr works.
 
     Args:
         jax_var:        The variable for which a name to propose.
         jax_name_map:   A mapping of all Jax variables that were already named.
 
     Notes:
-        The second mode is activated by passing `jax_name_map` as argument.
-        The naming of variables are only consistent with the inner most Jaxpr a variable is defined in.
+        The function guarantees that the returned name passes `VALID_SDFG_VAR_NAME` test
+            and that the name is not part of `util.FORBIDDEN_SDFG_VAR_NAMES`.
         Dropped variables will always be named `'_'`.
-        If `jax_var` is already inside `jax_name_map` that name will be returned.
     """
-    if util.is_drop_var(jax_var):
-        return "_"
     if isinstance(jax_var, jax_core.Literal):
         raise TypeError(f"Can not propose a name for literal '{jax_var}'.")
-    if jax_name_map is None:
+    if util.is_drop_var(jax_var) or (jax_name_map is None):
         return get_jax_var_name(jax_var)
     if jax_var in jax_name_map:
         return jax_name_map[jax_var]
-    if isinstance(jax_var, JaCeVar) and (jax_var.name != ""):
-        # If the name of the JaCe variable is empty, then use the name proposing
-        #  technique used for Jax variables; Mostly used for debugging.
+    if isinstance(jax_var, JaCeVar) and (jax_var.name is not None):
         return jax_var.name
 
-    # This code is taken from the Jax source.
+    # We have the set of all previous names, so we generate names
+    #  in the same way as Jax does:
     c = len(jax_name_map)
     jax_name = ""
     while len(jax_name) == 0 or c != 0:
         c, i = c // 26, c % 26
         jax_name = chr(97 + i % 26) + jax_name
-    return jax_name + getattr(jax_var, "suffix", "")
+    jax_name = jax_name + getattr(jax_var, "suffix", "")
+
+    if jax_name is util.FORBIDDEN_SDFG_VAR_NAMES:
+        jax_name = f"__jace_forbidden_{jax_name}"
+        assert jax_name not in util.FORBIDDEN_SDFG_VAR_NAMES
+    return jax_name
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index fd61a6d..6bd3a81 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -13,6 +13,7 @@
 from typing import Any, TypeGuard
 
 import dace
+import jax
 import numpy as np
 from jax import _src as jax_src, core as jax_core
 from jaxlib import xla_extension as jax_xe
@@ -74,21 +75,20 @@ def is_jaxified(
 
 def is_jax_array(
     obj: Any,
-) -> bool:
+) -> TypeGuard[jax.Array]:
     """Tests if `obj` is a jax array.
 
-    Todo:
-        Find the Jax type for `TypeGuard`.
+    Notes jax array are special, you can not write to them directly.
+    Furthermore, they always allocate also on GPU, beside the CPU allocation.
     """
-    # Currently this seams to be the besst way to identify Jax arrays.
-    return all(hasattr(obj, x) for x in ["sharding", "is_fully_addressable"])
+    return isinstance(obj, jax.Array)
 
 
 def is_array(
     obj: Any,
 ) -> bool:
     """Identifies arrays, this also includes Jax arrays."""
-    return is_jax_array(obj) or dace.is_array(obj)
+    return dace.is_array(obj) or is_jax_array(obj)
 
 
 def is_scalar(
@@ -126,11 +126,17 @@ def is_scalar(
 def is_on_device(
     obj: Any,
 ) -> bool:
-    """Tests if `obj` is on a device."""
-    # The problem is, that we can not test if `__cuda_array_interface__` exists.
-    #  because Jax array have that even on CPU, thus it is a bit mnore complex.
+    """Tests if `obj` is on a device.
+
+    Jax arrays are always on the CPU and GPU (if there is one).
+    Thus for Jax arrays this function is more of a test, if there is a GPU or not.
+    """
     if is_jax_array(obj):
-        obj = obj.__array__(copy=False)
+        try:
+            _ = obj.__cuda_array_interface__
+            return True
+        except AttributeError:
+            return False
     return dace.is_gpu_array(obj)
 
 
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index b0f5640..c1463d9 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -9,7 +9,7 @@
 
 import re
 from collections.abc import Iterable
-from typing import TypeVar, cast, overload
+from typing import Final, TypeVar, cast, overload
 
 import jace.util.traits as traits
 
@@ -35,11 +35,26 @@ def as_sequence(value: _T | Iterable[_T]) -> Iterable[_T]:
     return cast(Iterable[_T], [value])
 
 
-# Valid name for a jax variable.
-VALID_JAX_VAR_NAME: re.Pattern = re.compile("(jax[0-9]+_?)|([a-z]+_?)")
-
 # Valid name for an SDFG variable.
 VALID_SDFG_VAR_NAME: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")
 
 # Valid name for an SDFG itself, includes `SDFGState` objects.
 VALID_SDFG_OBJ_NAME: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")
+
+
+# fmt: off
+# This is a set of all names that are invalid SDFG names.
+FORBIDDEN_SDFG_VAR_NAMES: Final[set[str]] = {
+    # These should be most of the C++ keywords, it is more important to have the short ones.
+    #  Taken from 'https://learn.microsoft.com/en-us/cpp/cpp/keywords-cpp?view=msvc-170'
+    'alignas', 'alignof', 'and', 'asm', 'auto', 'bitand', 'bitor', 'bool', 'break', 'case',
+    'catch', 'char', 'class', 'compl', 'concept', 'const', 'consteval', 'constexpr',
+    'constinit', 'continue', 'decltype', 'default', 'delete', 'directive', 'do', 'double',
+    'else', 'enum', 'explicit', 'export', 'extern', 'false', 'float', 'for', 'friend',
+    'goto', 'if', 'inline', 'int', 'long', 'mutable', 'namespace', 'new', 'noexcept', 'not',
+    'nullptr', 'operator', 'or', 'private', 'protected', 'public', 'register', 'requires',
+    'return', 'short', 'signed', 'sizeof', 'static', 'struct', 'switch', 'template', 'this',
+    'throw', 'true', 'try', 'typedef', 'typeid', 'typename', 'union', 'unsigned', 'using',
+    'virtual', 'void', 'volatile', 'while', 'xor', 'std',
+}
+# fmt: on

From de9f09a2931311013afcf325e2489804d3e30d91 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 07:36:05 +0200
Subject: [PATCH 177/458] Removed the `.strides` property from the `JaCeVar`
 object.

---
 .../translator/jaxpr_translator_driver.py     |  1 -
 src/jace/util/__init__.py                     |  8 ++--
 src/jace/util/jax_helper.py                   | 38 ++++++-------------
 3 files changed, 14 insertions(+), 33 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 294d0a1..d470ce8 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -330,7 +330,6 @@ def add_array(
         """
         shape: tuple[int | dace.symbol | str, ...] = util.get_jax_var_shape(arg)
         dtype: dace.typeclass = util.get_jax_var_dtype(arg)
-        strides: tuple[int | dace.symbol | str, ...] | None = util.get_jax_var_strides(arg)
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
         offset = None  # i.e. no offset
         is_scalar: bool = shape == ()
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 7ee52c8..925b58e 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -18,7 +18,6 @@
     get_jax_var_dtype,
     get_jax_var_name,
     get_jax_var_shape,
-    get_jax_var_strides,
     is_tracing_ongoing,
     propose_jax_name,
     translate_dtype,
@@ -43,6 +42,9 @@
 
 
 __all__ = [
+    "VALID_SDFG_OBJ_NAME",
+    "VALID_SDFG_VAR_NAME",
+    "FORBIDDEN_SDFG_VAR_NAMES",
     "JaCeVar",
     "as_sequence",
     "compile_jax_sdfg",
@@ -60,11 +62,7 @@
     "get_jax_var_dtype",
     "get_jax_var_name",
     "get_jax_var_shape",
-    "get_jax_var_strides",
     "translate_dtype",
     "run_jax_sdfg",
     "propose_jax_name",
-    "VALID_SDFG_OBJ_NAME",
-    "VALID_SDFG_VAR_NAME",
-    "FORBIDDEN_SDFG_VAR_NAMES",
 ]
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index e0b6f3a..d86e5d6 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -35,30 +35,30 @@ class JaCeVar:
     This class can be seen as some kind of substitute `jax.core.Var`.
     The main intention of this class is as an internal representation of values,
     as they are used in Jax, but without the Jax machinery.
-    The main difference is, that this class also carries a `strides` and a `name` member,
-    this can be used to influence how `JaxprTranslationDriver::add_array()` works.
+    As abstract values in Jax this class has a datatype, which is a `dace.typeclass` instance and a shape.
+    In addition it has an optional name, which allows to create variables with a certain name using `JaxprTranslationDriver::add_array()`.
 
     Notes:
         Main intention is to test functionality.
         If the name of a `JaCeVar` is '_' it is considered a drop variable.
-        If the name of a `JaCeVar` is empty, the automatic naming will consider it as a Jax variable.
         The definitions of `__hash__` and `__eq__` are in accordance how Jax variable works.
+
+    Todo:
+        Add support for strides.
     """
 
     shape: tuple[int | dace.symbol | str, ...]
     dtype: dace.typeclass
-    strides: tuple[int | dace.symbol | str, ...] | None = None
     name: str | None = None
 
     def __post_init__(self) -> None:
         """Sanity checks."""
-        if not ((self.name is None) or util.VALID_SDFG_VAR_NAME.fullmatch(self.name)):
+        if self.name is not None and (
+            (not util.VALID_SDFG_VAR_NAME.fullmatch(self.name))
+            or self.name in util.FORBIDDEN_SDFG_VAR_NAMES
+        ):
             raise ValueError(f"Supplied the invalid name '{self.name}'.")
-        if (self.strides is not None) and (len(self.strides) != len(self.shape)):
-            raise ValueError(
-                f"Passed strides of rank {len(self.strides)}, but shape had rank {len(self.shape)}."
-            )
-        if not isinstance(self.dtype, dace.typeclass):  # To typechecking yet.
+        if not isinstance(self.dtype, dace.typeclass):  # No typechecking yet.
             raise TypeError(f"'dtype' is not a 'dace.typeclass' but '{type(self.dtype).__name__}'.")
 
     def __hash__(self) -> int:
@@ -113,22 +113,6 @@ def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symb
             raise TypeError(f"'get_jax_var_shape()` is not implemented for '{type(jax_var)}'.")
 
 
-def get_jax_var_strides(
-    jax_var: jax_core.Atom | JaCeVar,
-) -> tuple[int | dace.symbol | str, ...] | None:
-    """Returns the stride of `jax_var`.
-
-    If there is no stride specified return `None`.
-    """
-    match jax_var:
-        case jax_core.Var() | jax_core.Literal():
-            return getattr(jax_var.aval, "strides", None)
-        case JaCeVar():
-            return jax_var.strides
-        case _:
-            raise TypeError(f"'get_jax_var_strides()` is not implemented for '{type(jax_var)}'.")
-
-
 def get_jax_var_dtype(jax_var: jax_core.Atom | JaCeVar) -> dace.typeclass:
     """Returns the DaCe equivalent of `jax_var`s datatype."""
     match jax_var:
@@ -199,7 +183,7 @@ def propose_jax_name(
 
     If `jax_name_map` is `None` then the function will fallback to `get_jax_var_name()`.
     If `jax_name_map` is supplied the function will:
-    - if `jax_var` is stored inside the mapping that value will be returned.
+    - if `jax_var` is stored inside `jax_name_map` this value will be returned.
     - if `jax_var` is a `JaCeVar` with a set `.name` property it will be returned.
     - otherwise the function will generate a new name similar to how the pretty printer of Jaxpr works.
 

From 9a744007f9f52629317078575eb67e1d2aa79c25 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 07:36:44 +0200
Subject: [PATCH 178/458] Updated the fromating of the forbidden names and
 added the empty string.

---
 src/jace/util/util.py | 18 +++++++++---------
 1 file changed, 9 insertions(+), 9 deletions(-)

diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index c1463d9..342295f 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -47,14 +47,14 @@ def as_sequence(value: _T | Iterable[_T]) -> Iterable[_T]:
 FORBIDDEN_SDFG_VAR_NAMES: Final[set[str]] = {
     # These should be most of the C++ keywords, it is more important to have the short ones.
     #  Taken from 'https://learn.microsoft.com/en-us/cpp/cpp/keywords-cpp?view=msvc-170'
-    'alignas', 'alignof', 'and', 'asm', 'auto', 'bitand', 'bitor', 'bool', 'break', 'case',
-    'catch', 'char', 'class', 'compl', 'concept', 'const', 'consteval', 'constexpr',
-    'constinit', 'continue', 'decltype', 'default', 'delete', 'directive', 'do', 'double',
-    'else', 'enum', 'explicit', 'export', 'extern', 'false', 'float', 'for', 'friend',
-    'goto', 'if', 'inline', 'int', 'long', 'mutable', 'namespace', 'new', 'noexcept', 'not',
-    'nullptr', 'operator', 'or', 'private', 'protected', 'public', 'register', 'requires',
-    'return', 'short', 'signed', 'sizeof', 'static', 'struct', 'switch', 'template', 'this',
-    'throw', 'true', 'try', 'typedef', 'typeid', 'typename', 'union', 'unsigned', 'using',
-    'virtual', 'void', 'volatile', 'while', 'xor', 'std',
+    "alignas", "alignof", "and", "asm", "auto", "bitand", "bitor", "bool", "break", "case",
+    "catch", "char", "class", "compl", "concept", "const", "consteval", "constexpr",
+    "constinit", "continue", "decltype", "default", "delete", "directive", "do", "double",
+    "else", "enum", "explicit", "export", "extern", "false", "float", "for", "friend",
+    "goto", "if", "inline", "int", "long", "mutable", "namespace", "new", "noexcept", "not",
+    "nullptr", "operator", "or", "private", "protected", "public", "register", "requires",
+    "return", "short", "signed", "sizeof", "static", "struct", "switch", "template", "this",
+    "throw", "true", "try", "typedef", "typeid", "typename", "union", "unsigned", "using",
+    "virtual", "void", "volatile", "while", "xor", "std",  "",
 }
 # fmt: on

From cd2467470a2d5490ea0b68c2d380770c869c97ea Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 07:41:14 +0200
Subject: [PATCH 179/458] The driver now only generates scalars if requested.

It is not that nice, but should solve some proplems further down, actually not, but lets life with them for the time being.
---
 .../translator/jaxpr_translator_driver.py     | 51 +++++++++----------
 1 file changed, 24 insertions(+), 27 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index d470ce8..abf4478 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -31,6 +31,7 @@ class JaxprTranslationDriver:
     - all variable names are derived from Jax names,
     - there are only transient variables inside the SDFG,
     - It lacks the special `__return` variable,
+    - all variables that Jax considers a scalar are in fact arrays with shape `(1,)`.
     - the `arg_names` parameter is not set.
 
     For these reasons the SDFG is not directly usable, and further manipulations have to be performed.
@@ -315,13 +316,15 @@ def add_array(
     ) -> str:
         """Creates an SDFG variable for the Jax variable `arg` and returns its SDFG name.
 
-        By default this function will _not_ update the internal variable list mapping.
-        If you wish to do that, which is recommended you should set `update_var_mapping` to `True`.
+        Regardless, if `arg` refers to an array or a scalar, the function will generate an array.
+        Furthermore, the created variables are always transients.
 
-        The function will create either scalar or Array transients.
-        By default the function will extract all necessary information using the `jace.util.get_jax_var_*` functions.
-        For the naming the function will use the `jace.util.propose_jax_name()` function and pass the internal variable mapping.
-        If you need to create a rather special variable, it is advised to pass a `JaCeVar` instance.
+        By default this function will _not_ update the internal variable mapping.
+        However, by setting `update_var_mapping` to `True` the mapping will be created.
+
+        By default the function will use `jace.util.propose_jax_name()` to derive the name that should be used.
+        However, by passing a `JaCeVar` with a name it is possible to suggest a specific name.
+        In addition it is possible to specify `name_prefix` to prefix name that would be used.
 
         Args:
             arg:                The Jax object for which a SDFG equivalent should be created.
@@ -331,13 +334,15 @@ def add_array(
         shape: tuple[int | dace.symbol | str, ...] = util.get_jax_var_shape(arg)
         dtype: dace.typeclass = util.get_jax_var_dtype(arg)
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
-        offset = None  # i.e. no offset
-        is_scalar: bool = shape == ()
-        as_transient: bool = True
+        offset = None
+        as_transient = True
+        strides = None
+
+        if shape == ():  # Shape of a DaCe scalar.
+            shape = (1,)
 
         # Propose a name and if needed extend it.
         arg_name = util.propose_jax_name(arg, self._jax_name_map)
-        assert not arg_name.startswith("__")
         if name_prefix is not None:
             arg_name = name_prefix + arg_name
 
@@ -349,23 +354,15 @@ def add_array(
         if arg_name in self._ctx.sdfg.arrays:
             raise ValueError(f"add_array({arg}): The proposed name '{arg_name}', is used.")
 
-        if is_scalar:
-            self._ctx.sdfg.add_scalar(
-                name=arg_name,
-                storage=storage,
-                dtype=dtype,
-                transient=as_transient,
-            )
-        else:
-            self._ctx.sdfg.add_array(
-                name=arg_name,
-                shape=shape,
-                strides=strides,
-                offset=offset,
-                storage=storage,
-                dtype=dtype,
-                transient=as_transient,
-            )
+        self._ctx.sdfg.add_array(
+            name=arg_name,
+            shape=shape,
+            strides=strides,
+            offset=offset,
+            storage=storage,
+            dtype=dtype,
+            transient=as_transient,
+        )
 
         if update_var_mapping:
             self.add_jax_name_mapping(jax_var=arg, sdfg_name=arg_name)

From 5e84dd7de9a5c8c5913aa85ed973865f1651812b Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 07:52:56 +0200
Subject: [PATCH 180/458] Made a line shorter.

---
 src/jace/translator/managing.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index 1e091e8..563992d 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -13,7 +13,7 @@
 
 from __future__ import annotations
 
-from collections.abc import Callable, MutableMapping
+from collections.abc import Callable, MutableMapping, Mapping
 from typing import TYPE_CHECKING, Literal, cast, overload
 
 
@@ -81,7 +81,7 @@ def wrapper(
             if not primitive:
                 raise ValueError(f"Missing primitive name for '{prim_translator}'")
             prim_translator.primitive = primitive  # type: ignore[attr-defined]
-        elif prim_translator.primitive != (primitive or prim_translator.primitive):
+        elif (primitive is not None) and (prim_translator.primitive != primitive):
             raise TypeError(
                 f"Translator's primitive '{prim_translator.primitive}' doesn't match the supplied '{primitive}'."
             )

From f34759aa182b1b9497b637b27708884cde5fa0e4 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 07:55:03 +0200
Subject: [PATCH 181/458] Added a function to proper restore the state of
 subtranslators.

As I wrote it is mostly for restoring stuff.
---
 src/jace/translator/__init__.py    |  7 +++++-
 src/jace/translator/managing.py    | 38 ++++++++++++------------------
 tests/test_subtranslator_helper.py | 11 +++------
 3 files changed, 24 insertions(+), 32 deletions(-)

diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 7d4426e..341c713 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -10,7 +10,11 @@
 from __future__ import annotations
 
 from .jaxpr_translator_driver import JaxprTranslationDriver
-from .managing import get_regsitered_primitive_translators, register_primitive_translator
+from .managing import (
+    get_regsitered_primitive_translators,
+    register_primitive_translator,
+    set_active_primitive_translators_to,
+)
 from .primitive_translator import PrimitiveTranslator, PrimitiveTranslatorCallable
 from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
@@ -22,4 +26,5 @@
     "TranslatedJaxprSDFG",
     "register_primitive_translator",
     "get_regsitered_primitive_translators",
+    "set_active_primitive_translators_to",
 ]
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index 563992d..cc79319 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -13,8 +13,8 @@
 
 from __future__ import annotations
 
-from collections.abc import Callable, MutableMapping, Mapping
-from typing import TYPE_CHECKING, Literal, cast, overload
+from collections.abc import Callable, Mapping, MutableMapping
+from typing import TYPE_CHECKING, cast
 
 
 if TYPE_CHECKING:
@@ -24,27 +24,6 @@
 _PRIMITIVE_TRANSLATORS_DICT: dict[str, translator.PrimitiveTranslatorCallable] = {}
 
 
-@overload
-def register_primitive_translator(
-    prim_translator: Literal[None] = None,
-    /,
-    primitive: str | None = None,
-    overwrite: bool = False,
-) -> Callable[
-    [translator.PrimitiveTranslator | translator.PrimitiveTranslatorCallable],
-    translator.PrimitiveTranslator,
-]: ...
-
-
-@overload
-def register_primitive_translator(
-    prim_translator: translator.PrimitiveTranslator | translator.PrimitiveTranslatorCallable,
-    *,
-    primitive: str | None = None,
-    overwrite: bool = False,
-) -> translator.PrimitiveTranslator: ...
-
-
 def register_primitive_translator(
     prim_translator: translator.PrimitiveTranslator
     | translator.PrimitiveTranslatorCallable
@@ -107,3 +86,16 @@ def get_regsitered_primitive_translators() -> (
     This means that calls to `register_primitive_translator()` does not modify the returned object.
     """
     return _PRIMITIVE_TRANSLATORS_DICT.copy()
+
+
+def set_active_primitive_translators_to(
+    new_translators: Mapping[str, translator.PrimitiveTranslatorCallable],
+) -> None:
+    """Exchange the currently active subtranslators in Jace with the one inside `new_translators`.
+
+    This function allows you to restore a specific state that was obtained by a previous call to `get_regsitered_primitive_translators()`.
+    The function is mainly intended for debugging.
+    """
+    assert all(getattr(trans, "primitive", prim) for prim, trans in new_translators.items())
+    global _PRIMITIVE_TRANSLATORS_DICT
+    _PRIMITIVE_TRANSLATORS_DICT = dict(new_translators)
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 871e679..05dead7 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -29,15 +29,10 @@
 
 @pytest.fixture(autouse=True)
 def _conserve_builtin_translators():
-    """Decorator that preserves the initial list of built in translators.
-
-    Todo:
-        Come up with something better/nicer.
-    """
-    initial_translators = get_regsitered_primitive_translators()
+    """Decorator that restores the previous state of the build ins."""
+    initial_translators = translator.get_regsitered_primitive_translators()
     yield
-    translator.managing._PRIMITIVE_TRANSLATORS_DICT.clear()
-    translator.managing._PRIMITIVE_TRANSLATORS_DICT.update(initial_translators)
+    translator.set_active_primitive_translators_to(initial_translators)
 
 
 def _dict_struct(dict_: Mapping[str, Any]) -> Sequence[tuple[str, int]]:

From 203e68f2a6eb3ab1ba5d5637d9d5abc46a3fa6a6 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 09:05:25 +0200
Subject: [PATCH 182/458] Fixed some errors in the post processing.

I should have never backed down on `__slots__`.
---
 src/jace/translator/post_translation.py | 10 ++++------
 1 file changed, 4 insertions(+), 6 deletions(-)

diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index fbe16b7..4334e23 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -28,13 +28,13 @@ def postprocess_jaxpr_sdfg(
 
     Afterwards `tsdfg` will be finalized.
 
-    TBA, summary:
-    - Setting correct inputs (names + strides)
-    - Setting outputs (in case of donation).
-
     Args:
         tsdfg:  The translated SDFG object.
         fun:    The original function that we translated.
+
+    Todo:
+        - Setting correct input names (layer that does not depend on JAX).
+        - Setting the correct strides & Storage properties.
     """
     # Currently we do nothing except finalizing.
     finalize_jaxpr_sdfg(tsdfg)
@@ -73,8 +73,6 @@ def finalize_jaxpr_sdfg(
     tsdfg.sdfg.arg_names = sdfg_arg_names
 
     # Now we will deallocate the fields and mark `self` as finalized.
-    tsdfg.jax_name_map = None
     tsdfg.start_state = None
     tsdfg.terminal_state = None
-    tsdfg.rev_idx = None
     tsdfg.is_finalized = True

From 085c53ddef5cb365abf2dd854fb1a51a9da8a5b7 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 09:06:02 +0200
Subject: [PATCH 183/458] Updated the translation cache.

Mostly data was moved arround but it might be a bit better.
---
 src/jace/jax/stages.py            |  82 +++++++------
 src/jace/jax/translation_cache.py | 195 ++++++------------------------
 2 files changed, 82 insertions(+), 195 deletions(-)

diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
index 43fe7a5..32f020c 100644
--- a/src/jace/jax/stages.py
+++ b/src/jace/jax/stages.py
@@ -24,10 +24,10 @@
 from __future__ import annotations
 
 import copy
-import json
 from collections.abc import Callable, Mapping, Sequence
-from typing import TYPE_CHECKING, Any, Final
+from typing import Any, Final
 
+import dace
 import jax as jax_jax
 from jax.stages import CompilerOptions
 
@@ -37,10 +37,6 @@
 from jace.util import dace_helper as jdace
 
 
-if TYPE_CHECKING:
-    pass
-
-
 class Stage:
     """A distinct step in the compilation chain, see module description for more.
 
@@ -68,13 +64,7 @@ class JaceWrapped(Stage):
     _fun: Callable
     _sub_translators: Mapping[str, translator.PrimitiveTranslator]
     _jit_ops: Mapping[str, Any]
-
-    # Managed by the caching infrastructure and only defined during `lower()`.
-    #  If defined it contains an abstract description of the function arguments.
-    _call_description: tcache.CallArgsDescription | None = None
-
-    # Cache for the lowering. Managed by the caching infrastructure.
-    _cache: tcache.TranslationCache | None = None
+    _cache: tcache.TranslationCache
 
     def __init__(
         self,
@@ -100,6 +90,7 @@ def __init__(
         self._sub_translators = dict(sub_translators)
         self._jit_ops = dict(jit_ops)
         self._fun = fun
+        self._cache = tcache.get_cache(self)
 
     def __call__(
         self,
@@ -152,21 +143,32 @@ def wrapped_fun(self) -> Callable:
         """Returns the wrapped function."""
         return self._fun
 
+    def _make_call_decscription(
+        self,
+        *args: Any,
+    ) -> tcache.CachedCallDescription:
+        """This function computes the key for the `JaceWrapped.lower()` call.
 
-class JaceLowered(Stage):
-    """Represents the original computation that was lowered to SDFG."""
+        Currently it is only able to handle positional argument and does not support static arguments.
+        The function will fully abstractify its input arguments.
+        This function is used by the cache to generate the key.
+        """
+        fargs = tuple(tcache._AbstarctCallArgument.from_value(x) for x in args)
+        return tcache.CachedCallDescription(stage_id=id(self), fargs=fargs)
 
-    # `self` assumes complete ownership of the
-    _trans_sdfg: translator.TranslatedJaxprSDFG
 
-    # Cache for the compilation. Managed by the caching infrastructure.
-    _cache: tcache.TranslationCache | None = None
+class JaceLowered(Stage):
+    """Represents the original computation that was lowered to SDFG."""
 
     DEF_COMPILER_OPTIONS: Final[dict[str, Any]] = {
         "auto_optimize": True,
         "simplify": True,
     }
 
+    # `self` assumes complete ownership of the
+    _trans_sdfg: translator.TranslatedJaxprSDFG
+    _cache: tcache.TranslationCache
+
     def __init__(
         self,
         trans_sdfg: translator.TranslatedJaxprSDFG,
@@ -179,11 +181,12 @@ def __init__(
         if trans_sdfg.out_names is None:
             raise ValueError("Output names must be defined.")
         self._trans_sdfg = trans_sdfg
+        self._cache = tcache.get_cache(self)
 
     @tcache.cached_translation
     def compile(
         self,
-        compiler_options: CompilerOptions | None = None,  # Unused arguments
+        compiler_options: CompilerOptions | None = None,
     ) -> JaceCompiled:
         """Compile the SDFG.
 
@@ -234,28 +237,33 @@ def as_html(self, filename: str | None = None) -> None:
         """
         self.compiler_ir().sdfg.view(filename=filename, verbose=False)
 
-    def as_text(self, dialect: str | None = None) -> str:
-        """Textual representation of the SDFG.
+    def as_sdfg(self) -> dace.SDFG:
+        """Returns the encapsulated SDFG.
 
-        By default, the function will return the Json representation of the SDFG.
-        However, by specifying `'html'` as `dialect` the function will call `view()` on the underlying SDFG.
-
-        Notes:
-            You should prefer `self.as_html()` instead of this function.
+        It is an error to modify the returned object.
         """
-        if (dialect is None) or (dialect.upper() == "JSON"):
-            return json.dumps(self.compiler_ir().sdfg.to_json())
-        if dialect.upper() == "HTML":
-            self.as_html()
-            return ""  # For the interface
-        raise ValueError(f"Unknown dialect '{dialect}'.")
+        return self.compiler_ir().sdfg
 
-    def cost_analysis(self) -> Any | None:
-        """A summary of execution cost estimates.
+    def _make_call_decscription(
+        self,
+        compiler_options: CompilerOptions | None = None,
+    ) -> tcache.CachedCallDescription:
+        """This function computes the key for the `self.compile()` call.
 
-        Not implemented use the DaCe [instrumentation API](https://spcldace.readthedocs.io/en/latest/optimization/profiling.html) directly.
+        The function only get one argument that is either a `dict` or a `None`, where `None` means `use default argument.
+        The function will construct a concrete description of the call using `(name, value)` pairs.
+        This function is used by the cache.
         """
-        raise NotImplementedError()
+        if compiler_options is None:  # Must be the same as in `compile()`!
+            compiler_options = self.DEF_COMPILER_OPTIONS
+        assert isinstance(compiler_options, dict)
+        fargs: tuple[tuple[str, tcache._ConcreteCallArgument], ...] = tuple(
+            sorted(
+                ((argname, argvalue) for argname, argvalue in compiler_options.items()),
+                key=lambda X: X[0],
+            )
+        )
+        return tcache.CachedCallDescription(stage_id=id(self), fargs=fargs)
 
 
 class JaceCompiled(Stage):
diff --git a/src/jace/jax/translation_cache.py b/src/jace/jax/translation_cache.py
index bed803a..267b7f9 100644
--- a/src/jace/jax/translation_cache.py
+++ b/src/jace/jax/translation_cache.py
@@ -21,7 +21,7 @@
 from collections import OrderedDict
 from collections.abc import Callable
 from dataclasses import dataclass
-from typing import TYPE_CHECKING, Any, Protocol, TypeAlias, runtime_checkable
+from typing import TYPE_CHECKING, Any, Final, Protocol, TypeAlias, runtime_checkable
 
 import dace
 from jax import core as jax_core
@@ -32,6 +32,12 @@
 if TYPE_CHECKING:
     from jace.jax import stages
 
+# This is the default cache size we are using
+_DEF_CACHE_SIZE: Final[int] = 256
+
+# This are the caches that we are using.
+_TRANSLATION_CACHES: dict[type[stages.Stage], TranslationCache] = {}
+
 
 def cached_translation(
     action: Callable,
@@ -55,35 +61,17 @@ def cached_translation(
 
     @ft.wraps(action)
     def _action_wrapper(
-        self: stages.Stage,
+        self: stages.JaceWrapped | stages.JaceLowered,
         *args: Any,
         **kwargs: Any,
     ) -> stages.Stage:
-        # If not initialized initialize the cache.
-        assert hasattr(self, "_cache")  # Needed to make mypy silent
-        if self._cache is None:
-            self._cache = _get_cache(self)
-
-        # Get the key (abstract description of the call).
-        key: CachedCallDescription = self._cache.make_key(self, *args, **kwargs)
+        # Get the abstract description of the call, that is used as key.
+        key: CachedCallDescription = self._make_call_decscription(*args, **kwargs)
         if self._cache.has(key):
             return self._cache.get(key)
 
         # We must actually perform the call
-        try:
-            if hasattr(self, "_call_description"):
-                assert (
-                    self._call_description is None
-                ), f"call description already set for `{self}` (probably another call going on?)."
-                self._call_description = key.fargs
-            next_stage: stages.Stage = action(self, *args, **kwargs)
-        finally:
-            # If I would cache the result from above and store and then use here,
-            #  mypy would complain, thus we have to do it twice.
-            if hasattr(self, "_call_description"):
-                self._call_description = None
-
-        # Store the result.
+        next_stage: stages.Stage = action(self, *args, **kwargs)
         self._cache.add(key, next_stage)
         return next_stage
 
@@ -92,32 +80,18 @@ def _action_wrapper(
 
 def clear_translation_cache() -> None:
     """Clear all caches associated to translation."""
+    _TRANSLATION_CACHES.clear()
 
-    if not hasattr(_get_cache, "_caches"):
-        return
-    _get_cache._caches.clear()
-    return
 
-
-def _get_cache(
-    self: stages.Stage,
-    size: int = 128,
+def get_cache(
+    stage: stages.Stage,
 ) -> TranslationCache:
-    """Returns the cache associated to `name`.
-
-    If called for the first time, the cache sizes will be set to `size`.
-    In all later calls this value is ignored.
-    """
-    # Get the caches and if not present, create them.
-    if not hasattr(_get_cache, "_caches"):
-        _caches: dict[type[stages.Stage], TranslationCache] = {}
-        _get_cache._caches = _caches  # type: ignore[attr-defined]
-    _caches = _get_cache._caches  # type: ignore[attr-defined]
-
-    if type(self) not in _caches:
-        _caches[type(self)] = TranslationCache(size=size)
-
-    return _caches[type(self)]
+    """Returns the cache that is used for `stage`."""
+    # The caches are per stage and not per instance basis
+    tstage = type(stage)
+    if tstage not in _TRANSLATION_CACHES:
+        _TRANSLATION_CACHES[tstage] = TranslationCache(size=_DEF_CACHE_SIZE)
+    return _TRANSLATION_CACHES[tstage]
 
 
 @dataclass(init=True, eq=True, frozen=True)
@@ -172,27 +146,7 @@ def from_value(
 
             return cls(shape=shape, dtype=dtype, strides=strides, storage=storage)
 
-        if isinstance(val, jax_core.ConcreteArray):
-            return cls.from_value(val.val)
-
-        if isinstance(val, jax_core.ShapedArray):
-            shape = val.aval.shape
-            dtype = val.aval.dtype
-            strides = None
-            storage = (
-                dace.StorageType.GPU_Global
-                if util.is_on_device(val.val)
-                else dace.StorageType.CPU_Heap
-            )
-
-            return cls(shape=shape, dtype=dtype, strides=strides, storage=storage)
-
-        if isinstance(val, jax_core.AbstractValue):
-            raise TypeError(f"Can not make 'JaCeVar' from '{type(val).__name__}', too abstract.")
-
-        # If we are here, then we where not able, thus we will will now try Jax
-        #  This is inefficient and we should make it better.
-        return cls.from_value(jax_core.get_aval(val))
+        raise TypeError(f"Can not make 'an abstract description from '{type(val).__name__}'.")
 
 
 @runtime_checkable
@@ -247,66 +201,11 @@ class CachedCallDescription:
     Todo:
         - pytrees.
         - Turn the references into week references, Jax does this and I am sure there is a reason for it.
-        - Turn this into a strategy.
     """
 
     stage_id: int
     fargs: CallArgsDescription
 
-    @classmethod
-    def make_call_description(
-        cls,
-        stage: stages.Stage,
-        *args: Any,
-        **kwargs: Any,
-    ) -> CachedCallDescription:
-        """Creates an abstract description of the call."""
-        from jace.jax import stages  # Cyclic import
-
-        if isinstance(stage, stages.JaceWrapped):
-            # JaceWrapped.lower() to JaceLowered
-
-            if len(kwargs) != 0:
-                raise NotImplementedError("'kwargs' are not implemented in 'JaceWrapped.lower()'.")
-
-            # Currently we only allow positional arguments and no static arguments.
-            #   Thus the function argument part of the key only consists of abstract arguments.
-            fargs: tuple[_AbstarctCallArgument, ...] = tuple(
-                _AbstarctCallArgument.from_value(x) for x in args
-            )
-
-        elif isinstance(stage, stages.JaceLowered):
-            # JaceLowered.compile() to JaceCompiled
-
-            #   We only accepts compiler options, which the Jax interface mandates
-            #   are inside a `dict` thus we will get at most one argument.
-            if len(kwargs) != 0:
-                raise ValueError(
-                    "All arguments to 'JaceLowered.compile()' must be inside a 'dict'."
-                )
-            if len(args) >= 2:
-                raise ValueError("Only a 'dict' is allowed as argument to 'JaceLowered.compile()'.")
-            if (len(args) == 0) or (args[0] is None):
-                # Currently we consider no argument and `None` as "use the default argument".
-                #  Which is what Jax does.
-                comp_ops: stages.CompilerOptions = stages.JaceLowered.DEF_COMPILER_OPTIONS
-            else:
-                comp_ops = args[0]
-
-            # We will now make `(argname, argvalue)` pairs and sort them according to `argname`.
-            #  This guarantees a stable order.
-            fargs: tuple[tuple[str, _ConcreteCallArgument], ...] = tuple(  # type: ignore[no-redef]  # Type confusion.
-                sorted(
-                    ((argname, argvalue) for argname, argvalue in comp_ops.items()),
-                    key=lambda X: X[0],
-                )
-            )
-
-        else:
-            raise TypeError(f"Can not make key from '{type(stage).__name__}'.")
-
-        return cls(stage_id=id(stage), fargs=fargs)
-
 
 class TranslationCache:
     """The _internal_ cache object.
@@ -326,33 +225,22 @@ class TranslationCache:
 
     def __init__(
         self,
-        size: int = 128,
+        size: int,
     ) -> None:
-        """Creates a cache instance of size `size`."""
+        """Creates a cache instance of size.
+
+        The cache will have size `size` and use `key` as key function.
+        """
         if size <= 0:
             raise ValueError(f"Invalid cache size of '{size}'")
         self._memory: OrderedDict[CachedCallDescription, stages.Stage] = OrderedDict()
         self._size = size
 
-    @staticmethod
-    def make_key(
-        stage: stages.Stage,
-        *args: Any,
-        **kwargs: Any,
-    ) -> CachedCallDescription:
-        """Create a key object for `stage`."""
-        return CachedCallDescription.make_call_description(stage, *args, **kwargs)
-
     def has(
         self,
         key: CachedCallDescription,
     ) -> bool:
-        """Check if `self` have a record of `key`.
-
-        Notes:
-            For generating `key` use the `make_key()` function.
-            This function will not modify the order of the cached entries.
-        """
+        """Check if `self` have a record of `key`."""
         return key in self._memory
 
     def get(
@@ -368,18 +256,14 @@ def get(
         if not self.has(key):
             raise KeyError(f"Key '{key}' is unknown.")
         self._memory.move_to_end(key, last=True)
-        return self._memory.get(key)  # type: ignore[return-value]  # type confusion
+        return self._memory[key]
 
     def add(
         self,
         key: CachedCallDescription,
         res: stages.Stage,
     ) -> TranslationCache:
-        """Adds `res` under `key` to `self`.
-
-        Notes:
-            It is not an error if if `key` is already present.
-        """
+        """Adds `res` under `key` to `self`."""
         if self.has(key):
             # `key` is known, so move it to the end and update the mapped value.
             self._memory.move_to_end(key, last=True)
@@ -395,23 +279,18 @@ def add(
     def _evict(
         self,
         key: CachedCallDescription | None,
-    ) -> bool:
-        """Evict `key` from `self` and return `True`.
+    ) -> None:
+        """Evict `key` from `self`.
 
-        In case `key` is not known the function returns `False`.
-        If `key` is `None` then evict the oldest one unconditionally.
+        If `key` is `None` the oldest entry is evicted.
         """
+        if len(self._memory) == 0:
+            return
         if key is None:
-            if len(self._memory) == 0:
-                return False
             self._memory.popitem(last=False)
-            return True
-
-        if not self.has(key):
-            return False
-        self._memory.move_to_end(key, last=False)
-        self._memory.popitem(last=False)
-        return True
+        elif self.has(key):
+            self._memory.move_to_end(key, last=False)
+            self._memory.popitem(last=False)
 
     def __repr__(self) -> str:
         """Textual representation for debugging."""

From 3a33d32d4ece315090089859aa2c4580418b43e8 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 10:16:18 +0200
Subject: [PATCH 184/458] Made some reminders about stride and input.

---
 src/jace/util/compiling.py | 9 +++++++++
 1 file changed, 9 insertions(+)

diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index 286b988..cf44f13 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -94,9 +94,12 @@ def run_jax_sdfg(
     Notes:
         There is no pytree mechanism jet, thus the return values are returned inside a `tuple`
             or in case of one value, directly, in the order determined by Jax.
+        Currently, this function does not consider strides in the input.
     """
     from dace.data import Array, Data, Scalar, make_array_from_descriptor
 
+    from jace import util
+
     if len(ckwargs) != 0:
         raise NotImplementedError("No kwargs are supported yet.")
     if len(inp_names) != len(cargs):
@@ -111,12 +114,18 @@ def run_jax_sdfg(
     # Build the argument list that we will pass to the compiled object.
     call_args: dict[str, Any] = {}
     for in_name, in_val in zip(inp_names, cargs, strict=True):
+        assert (  # noqa: PT018  # Assertion must be one line
+            util.is_array(in_val) and in_val.flags["C_CONTIGUOUS"]
+        )  # Currently the only stride we support.
         call_args[in_name] = in_val
     for out_name in out_names:
         assert not ((out_name == "__return") or (out_name.startswith("__return_")))  # noqa: PT018 # Assert split
 
         if out_name in call_args:  # Donated arguments
             assert out_name in inp_names
+            assert not util.is_jax_array(
+                call_args[out_name]
+            )  # This violates one of Jax internal assumptions.
             continue
 
         sarray: Data = sdfg.arrays[out_name]

From bc5f2b663ff29c9af753b5752e66f3cb1ab0bd82 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 10:19:17 +0200
Subject: [PATCH 185/458] Updated the decorator tests.

I splited it up and the tests about the cache are now in a separate module.
---
 tests/test_decorator.py | 142 ++++++++++------------------------------
 1 file changed, 35 insertions(+), 107 deletions(-)

diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index 24ce507..b83320a 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -14,10 +14,27 @@
 
 import jax
 import numpy as np
+import pytest
 
 import jace
 
 
+@pytest.fixture(autouse=True)
+def _clear_translation_cache():
+    """Decorator that clears the translation cache.
+
+    Ensures that a function finds an empty cache and clears up afterwards.
+
+    Todo:
+        Should be used _everywhere_.
+    """
+    from jace.jax import translation_cache as tcache
+
+    tcache.clear_translation_cache()
+    yield
+    tcache.clear_translation_cache()
+
+
 def test_decorator_individually():
     """Tests the compilation steps individually."""
     jax.config.update("jax_enable_x64", True)
@@ -25,8 +42,11 @@ def test_decorator_individually():
     def testee_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
+    lowering_cnt = [0]
+
     @jace.jit
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+    def testee(A, B):
+        lowering_cnt[0] += 1
         return testee_(A, B)
 
     A = np.arange(12, dtype=np.float64).reshape((4, 3))
@@ -39,6 +59,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     res = compiled(A, B)
 
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
+    assert lowering_cnt[0] == 1
 
 
 def test_decorator_one_go():
@@ -48,7 +69,12 @@ def test_decorator_one_go():
     def testee_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
-    testee = jace.jit(testee_)
+    lowering_cnt = [0]
+
+    @jace.jit
+    def testee(A, B):
+        lowering_cnt[0] += 1
+        return testee_(A, B)
 
     A = np.arange(12, dtype=np.float64).reshape((4, 3))
     B = np.full((4, 3), 10, dtype=np.float64)
@@ -57,114 +83,16 @@ def testee_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     res = testee(A, B)
 
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
+    assert lowering_cnt[0] == 1
 
 
-def test_decorator_caching():
-    """This tests the caching ability"""
-    jax.config.update("jax_enable_x64", True)
-
-    def testee1_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A * B
-
-    def testee2_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A + B
-
-    testee1 = jace.jit(testee1_)
-    testee2 = jace.jit(testee2_)
-
-    assert testee1.__wrapped__ == testee1_
-    assert testee2.__wrapped__ == testee2_
-
-    # This is the first size
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
-
-    # This is the second sizes
-    C = np.arange(16, dtype=np.float64).reshape((4, 4))
-    D = np.full((4, 4), 10, dtype=np.float64)
-
-    # Lower the two functions for the first size.
-    lowered1_size1 = testee1.lower(A, B)
-    lowered2_size1 = testee2.lower(A, B)
-
-    # If we now lower them again, we should get the same objects
-    assert lowered1_size1 is testee1.lower(A, B)
-    assert lowered2_size1 is testee2.lower(A, B)
-
-    # Now we lower them for the second sizes.
-    lowered1_size2 = testee1.lower(C, D)
-    lowered2_size2 = testee2.lower(C, D)
+def test_decorator_wrapped():
+    """Tests if some properties are set correctly."""
 
-    # Again if we now lower them again, we should get the same objects.
-    assert lowered1_size1 is testee1.lower(A, B)
-    assert lowered2_size1 is testee2.lower(A, B)
-    assert lowered1_size2 is testee1.lower(C, D)
-    assert lowered2_size2 is testee2.lower(C, D)
-
-    # Now use the compilation; since all is the same code path we only use one size.
-    compiled1 = lowered1_size1.compile()
-    compiled2 = lowered1_size1.compile({"dummy_option": True})
-
-    assert compiled1 is lowered1_size1.compile()
-    assert compiled2 is lowered1_size1.compile({"dummy_option": True})
-    assert compiled2 is not lowered1_size1.compile({"dummy_option": False})
-    assert compiled2 is lowered1_size1.compile({"dummy_option": True})
-
-
-def test_decorator_double_annot():
-    """Tests the behaviour for double annotations."""
-    jax.config.update("jax_enable_x64", True)
-
-    lower_cnt = [0]
-
-    def testee1(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        lower_cnt[0] += 1
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A * B
 
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
-
-    jaceWrapped1_1 = jace.jit(testee1)
-    jaceWrapped1_2 = jace.jit(testee1)
-    assert jaceWrapped1_1 is not jaceWrapped1_2
-
-    # Lower them right after the other.
-    lower1_1 = jaceWrapped1_1.lower(A, B)
-    lower1_2 = jaceWrapped1_2.lower(A, B)
-    assert lower1_1 is not lower1_2
-    assert lower_cnt[0] == 2
-
-    # Lower them right after the other.
-    assert lower1_1 is jaceWrapped1_1.lower(A, B)
-    assert lower1_2 is jaceWrapped1_2.lower(A, B)
-    assert lower_cnt[0] == 2
-
-
-def test_decorator_sharing():
-    """Tests if there is no false sharing in the cache."""
-    jax.config.update("jax_enable_x64", True)
-
-    @jace.jit
-    def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        C = A * B
-        D = C + A
-        E = D + B  # Just enough state.
-        return A + B + C + D + E
-
-    # These are the argument
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
-
-    # Now we lower it.
-    jaceLowered = jaceWrapped.lower(A, B)
-
-    # Now we compile it with enabled optimization.
-    optiCompiled = jaceLowered.compile({"auto_optimize": True, "simplify": True})
-
-    # Now we compile it without any optimization.
-    unoptiCompiled = jaceLowered.compile({})
+    wrapped = jace.jit(testee)
 
-    # Because of the way how things work the optimized must have more than the unoptimized.
-    #  If there is sharing, then this would not be the case.
-    assert optiCompiled._csdfg.sdfg.number_of_nodes() == 1
-    assert optiCompiled._csdfg.sdfg.number_of_nodes() < unoptiCompiled._csdfg.sdfg.number_of_nodes()
+    assert wrapped.wrapped_fun is testee
+    assert wrapped.__wrapped__ is testee

From d2da4f31aea40951f0989671e60da196187da616 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 10:24:20 +0200
Subject: [PATCH 186/458] Added the tests about the caching.

---
 tests/test_caching.py | 189 ++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 189 insertions(+)
 create mode 100644 tests/test_caching.py

diff --git a/tests/test_caching.py b/tests/test_caching.py
new file mode 100644
index 0000000..0703f3e
--- /dev/null
+++ b/tests/test_caching.py
@@ -0,0 +1,189 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Tests for the caching infrastructure.
+."""
+
+from __future__ import annotations
+
+import itertools as it
+
+import jax
+import numpy as np
+import pytest
+
+import jace
+from jace.jax import stages
+
+
+@pytest.fixture(autouse=True)
+def _clear_translation_cache():
+    """Decorator that clears the translation cache.
+
+    Ensures that a function finds an empty cache and clears up afterwards.
+
+    Todo:
+        Ask Enrique how I can make that fixture apply everywhere not just in the file but the whole test suite.
+    """
+    from jace.jax import translation_cache as tcache
+
+    tcache.clear_translation_cache()
+    yield
+    tcache.clear_translation_cache()
+
+
+def test_caching_same_sizes():
+    """The behaviour of the cache if same sizes are used."""
+    jax.config.update("jax_enable_x64", True)
+
+    # Counter for how many time it was lowered.
+    lowering_cnt = [0]
+
+    # This is the pure Python function.
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A * B
+
+    # this is the wrapped function.
+    @jace.jit
+    def wrapped(A, B):
+        lowering_cnt[0] += 1
+        return testee(A, B)
+
+    # First batch of arguments.
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    # The second batch of argument, it is the same size (structurally) but different values.
+    AA = A + 1.0362
+    BB = B + 0.638956
+
+    # Now let's lower it once directly and call it.
+    lowered: stages.JaceLowered = wrapped.lower(A, B)
+    compiled: stages.JaceCompiled = lowered.compile()
+    assert lowering_cnt[0] == 1
+    assert np.allclose(testee(A, B), compiled(A, B))
+
+    # Now lets call the wrapped object directly, since we already did the lowering
+    #  no longering (and compiling) is needed.
+    assert np.allclose(testee(A, B), wrapped(A, B))
+    assert lowering_cnt[0] == 1
+
+    # Now lets call it with different objects, that have the same structure.
+    #  Again no lowering should happen.
+    assert np.allclose(testee(AA, BB), wrapped(AA, BB))
+    assert wrapped.lower(AA, BB) is lowered
+    assert wrapped.lower(A, B) is lowered
+    assert lowering_cnt[0] == 1
+
+
+def test_caching_different_sizes():
+    """The behaviour of the cache if different sizes where used."""
+    jax.config.update("jax_enable_x64", True)
+
+    # Counter for how many time it was lowered.
+    lowering_cnt = [0]
+
+    # This is the wrapped function.
+    @jace.jit
+    def wrapped(A, B):
+        lowering_cnt[0] += 1
+        return A * B
+
+    # First size of arguments
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    # Second size of arguments
+    C = np.arange(16, dtype=np.float64).reshape((4, 4))
+    D = np.full((4, 4), 10, dtype=np.float64)
+
+    # Now lower the function once for each.
+    lowered1 = wrapped.lower(A, B)
+    lowered2 = wrapped.lower(C, D)
+    assert lowering_cnt[0] == 2
+    assert lowered1 is not lowered2
+
+    # Now also check if the compilation works as intended
+    compiled1 = lowered1.compile()
+    compiled2 = lowered2.compile()
+    assert lowering_cnt[0] == 2
+    assert compiled1 is not compiled2
+
+
+@pytest.mark.skip(reason="Missing primitive translators")
+def test_caching_different_structure():
+    """Now tests if we can handle multiple arguments with different structures.
+
+    Todo:
+        - Extend with strides once they are part of the cache.
+    """
+    jax.config.update("jax_enable_x64", True)
+
+    # This is the wrapped function.
+    lowering_cnt = [0]
+
+    @jace.jit
+    def wrapped(A, B):
+        lowering_cnt[0] += 1
+        return A * 4.0, B + 2.0
+
+    A = np.full((4, 30), 10, dtype=np.float64)
+    B = np.full((4, 3), 10, dtype=np.float64)
+    C = np.full((5, 3), 14, dtype=np.float64)
+    D = np.full((6, 3), 14, dtype=np.int64)
+
+    # These are the arrays.
+    args: dict[int, np.ndarray] = {id(x): x for x in [A, B, C, D]}
+    # These are the known lowerings.
+    lowerings: dict[tuple[int, int], stages.JaceLowered] = {}
+    lowering_ids: set[int] = set()
+
+    # Generating the lowerings
+    for arg1, arg2 in it.permutations([A, B, C, D], 2):
+        lower = wrapped.lower(arg1, arg2)
+        assert id(lower) not in lowering_ids
+        lowerings[id(arg1), id(arg2)] = lower
+        lowering_ids.add(id(lower))
+
+    # Now check if they are still cached.
+    for arg1, arg2 in it.permutations([A, B, C, D], 2):
+        lower = wrapped.lower(arg1, arg2)
+        clower = lowerings[id(arg1), id(arg2)]
+        assert clower is lower
+
+
+def test_caching_compilation():
+    """Tests the compilation cache, this is just very simple, since it uses the same code paths as lowering."""
+    jax.config.update("jax_enable_x64", True)
+
+    @jace.jit
+    def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        C = A * B
+        D = C + A
+        E = D + B  # Just enough state.
+        return A + B + C + D + E
+
+    # These are the argument
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.full((4, 3), 10, dtype=np.float64)
+
+    # Now we lower it.
+    jaceLowered = jaceWrapped.lower(A, B)
+
+    # Now we compile it with enabled optimization.
+    optiCompiled = jaceLowered.compile(stages.JaceLowered.DEF_COMPILER_OPTIONS)
+
+    # Passing `None` also means 'default' which is a bit strange, but it is what Jax does.
+    assert optiCompiled is jaceLowered.compile(None)
+
+    # Now we compile it without any optimization.
+    unoptiCompiled = jaceLowered.compile({})
+
+    # Because of the way how things work the optimized must have more than the unoptimized.
+    #  If there is sharing, then this would not be the case.
+    assert optiCompiled._csdfg.sdfg.number_of_nodes() == 1
+    assert optiCompiled._csdfg.sdfg.number_of_nodes() < unoptiCompiled._csdfg.sdfg.number_of_nodes()

From 271567039ff3929871d0017b3daf82d773056da1 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 11:00:30 +0200
Subject: [PATCH 187/458] Updated the api tests.

---
 tests/test_jax_api.py | 130 +++++++++++++++++++++++++++++-------------
 1 file changed, 90 insertions(+), 40 deletions(-)

diff --git a/tests/test_jax_api.py b/tests/test_jax_api.py
index 6e1a2da..d1f5c6d 100644
--- a/tests/test_jax_api.py
+++ b/tests/test_jax_api.py
@@ -46,78 +46,129 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 
 
 @pytest.mark.skip(reason="Scalar return values are not handled.")
-def test_composition1():
+def test_composition_itself():
+    """Tests if Jace is composable with itself."""
     jax.config.update("jax_enable_x64", True)
 
-    def f_(x):
+    # Pure Python functions
+    def f_ref(x):
         return jnp.sin(x)
 
-    def df_(x):
+    def df_ref(x):
         return jnp.cos(x)
 
-    def ddf_(x):
+    def ddf_ref(x):
         return -jnp.sin(x)
 
+    # Annotated functions.
+
+    @jace.jit
+    def f(x):
+        return f_ref(x)
+
+    @jace.jit
+    def df(x):
+        return jace.grad(f)(x)
+
+    @jace.jit
+    @jace.grad
+    def ddf(x):
+        return df(x)
+
+    assert all(jutil.is_jaceified(x) for x in [f, df, ddf])
+
     x = 1.0
+    for fun, fref in zip([f, df, ddf], [f_ref, df_ref, ddf_ref]):
+        ref = fref(x)
+        res = fun(x)
+        assert np.allclose(ref, res), f"f: Expected '{ref}', got '{res}'."
 
-    # Jacify it.
-    f = jace.jit(f_)
-    assert jutil.is_jaceified(f)
-    assert not jutil.is_jaxified(f)
 
-    ref = f_(x)
-    res = f(x)
-    assert np.allclose(ref, res), f"f: Expected '{ref}', got '{res}'."
+@pytest.mark.skip(reason="Nested Jaxpr are not handled.")
+def test_composition_with_jax():
+    """Tests if Jace can interact with Jax and vice versa."""
+    jax.config.update("jax_enable_x64", True)
 
-    # Now apply a Jax transformation to the jaceified function.
-    df = jax.grad(f)
+    def base_fun(A, B, C):
+        return A + B * jnp.sin(C) - A * B
 
-    ref = df_(x)
-    res = df(x)
-    assert np.allclose(ref, res), f"df: Expected '{ref}', got '{res}'."
+    @jace.jit
+    def jace_fun(A, B, C):
+        return jax.jit(base_fun)(A, B, C)
 
-    # Now apply a jace transformation around a jaxified transformation.
-    ddf = jace.grad(df)
+    def jax_fun(A, B, C):
+        return jace.jit(base_fun)(A, B, C)
 
-    ref = ddf_(x)
-    res = ddf(x)
-    assert np.allclose(ref, res), f"ddf: Expected '{ref}', got '{res}'."
+    A, B, C = (np.random.random((10, 3, 50)) for _ in range(3))  # noqa: NPY002  # random generator
 
+    assert np.allclose(jace_fun(A, B, C), jax_fun(A, B, C))
 
-def test_composition2():
-    jax.config.update("jax_enable_x64", True)
 
-    def f1_(A, B):
+@pytest.mark.skip(reason="Nested Jaxpr are not handled.")
+def test_composition_with_jax_2():
+    """Second test if Jace can interact with Jax and vice versa."""
+
+    @jax.jit
+    def f1_jax(A, B):
         return A + B
 
-    f1 = jax.jit(f1_)
+    assert jutil.is_jaxified(f1_jax)
+
+    @jace.jit
+    def f2_jace(A, B, C):
+        return f1_jax(A, B) - C
+
+    assert jutil.is_jaceified(f2_jace)
 
-    def f2_(A, B, C):
-        return f1(A, B) - C
+    @jax.jit
+    def f3_jax(A, B, C, D):
+        return f2_jace(A, B, C) * D
 
-    f2 = jace.jit(f2_)
+    assert jutil.is_jaxified(f3_jax)
 
-    def f3_(A, B, C, D):
-        return f2(A, B, C) * D
+    @jace.jit
+    def f3_jace(A, B, C, D):
+        return f3_jax(A, B, C, D)
 
-    f3_jax = jax.jit(f3_)
-    f3_jace = jace.jit(f3_)
+    assert jutil.is_jaceified(f3_jace)
 
     A, B, C, D = (np.random.random((10, 3, 50)) for _ in range(4))  # noqa: NPY002  # random generator
 
     ref = ((A + B) - C) * D
 
-    # We have to disable it, because currently there is no `pjit` instruction
-    #  that can handle the nesting.
-    with jax.disable_jit():
-        res_jax = f3_jax(A, B, C, D)
-        res_jace = f3_jace(A, B, C, D)
+    res_jax = f3_jax(A, B, C, D)
+    res_jace = f3_jace(A, B, C, D)
 
     assert np.allclose(ref, res_jax), "Jax failed."
     assert np.allclose(ref, res_jace), "JaCe Failed."
 
 
 @pytest.mark.skip(reason="Scalar return values are not handled.")
+def test_grad_annotation_direct():
+    """Test if `jace.grad` works directly."""
+    jax.config.update("jax_enable_x64", True)
+
+    def f(x):
+        return jnp.sin(jnp.exp(jnp.cos(x**2)))
+
+    @jax.grad
+    def jax_df(x):
+        return f(x)
+
+    @jax.jit
+    def jace_df(x):
+        return jace.grad(f)(x)
+
+    # These are the random numbers where we test
+    Xs = (np.random.random(10) - 0.5) * 10  # noqa: NPY002  # Random number generator
+
+    for i in range(Xs.shape[0]):
+        x = Xs[i]
+        res = jace_df(x)
+        ref = jax_df(x)
+        assert np.allclose(res, ref)
+
+
 def test_grad_control_flow():
     """Tests if `grad` and controlflow works.
 
@@ -125,13 +176,12 @@ def test_grad_control_flow():
     """
     jax.config.update("jax_enable_x64", True)
 
-    def f(x):
+    @jace.grad
+    def df(x):
         if x < 3:
             return 3.0 * x**2
         return -4 * x
 
-    df = jace.grad(f)
-
     x1 = 2.0
     df_x1 = 6 * x1
     x2 = 4.0

From 80bfa8fdf53dad1ed922ed095024b8d9fc2a5040 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 11:58:23 +0200
Subject: [PATCH 188/458] Made a first version of the driver tests.

Currently they only test positive stuff, and not negative stuff, i.e. tests if something fails.
---
 tests/test_jaxpr_translator_driver.py | 470 +++++++++++---------------
 1 file changed, 199 insertions(+), 271 deletions(-)

diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index f123c4f..8ad340f 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -13,13 +13,29 @@
 
 import dace
 import pytest
-from dace.data import Array, Data, Scalar
+from dace.data import Array
 
-from jace import translator
+from jace import translator, util
 from jace.util import JaCeVar
 
 
-@pytest.fixture(scope="module")
+# These are some Jace variables that we use inside the tests
+#  Unnamed arrays
+array1 = JaCeVar((10, 12), dace.float64)
+array2 = JaCeVar((10, 13), dace.float32)
+array3 = JaCeVar((11, 16), dace.int64)
+
+#  Unnamed scalars
+scal1 = JaCeVar((), dace.float16)
+scal2 = JaCeVar((), dace.float32)
+scal3 = JaCeVar((), dace.int64)
+
+# Named variables
+narray = JaCeVar((10,), dace.float16, "narr")
+nscal = JaCeVar((), dace.int32, "nscal")
+
+
+@pytest.fixture()
 def translation_driver():
     """Returns an allocated driver instance."""
     name = "fixture_driver"
@@ -31,7 +47,10 @@ def translation_driver():
 
 
 def test_driver_alloc() -> None:
-    """Tests the state right after allocation."""
+    """Tests the state right after allocation.
+
+    Does not use the fixture because it does it on its own.
+    """
     driver = translator.JaxprTranslationDriver(
         sub_translators=translator.get_regsitered_primitive_translators()
     )
@@ -41,6 +60,8 @@ def test_driver_alloc() -> None:
     # The reserved names will be tested in `test_driver_fork()`.
     sdfg_name = "qwertzuiopasdfghjkl"
     driver._allocate_translation_ctx(name=sdfg_name)
+    assert len(driver._ctx_stack) == 1
+    assert driver.is_root_translator()
 
     sdfg: dace.SDFG = driver.sdfg
 
@@ -49,53 +70,182 @@ def test_driver_alloc() -> None:
     assert sdfg.number_of_nodes() == 1
     assert sdfg.number_of_edges() == 0
     assert sdfg.start_block is driver._ctx.start_state
-    assert driver.terminal_sdfg_state is driver._ctx.start_state
+    assert driver._terminal_sdfg_state is driver._ctx.start_state
+
+
+def test_driver_variable_alloc_auto_naming(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Tests simple variable allocation."""
+    for i, var in enumerate([array1, array2, scal1, array3, scal2, scal3]):
+        sdfg_name = translation_driver.add_array(var, update_var_mapping=True)
+        sdfg_var = translation_driver.get_array(sdfg_name)
+        assert sdfg_name == chr(97 + i)
+        assert isinstance(sdfg_var, Array)  # Everything is now an array
+        assert sdfg_var.shape == ((1,) if var.shape == () else var.shape)
+        assert sdfg_var.dtype == var.dtype
 
 
-def test_driver_nested() -> None:
-    """Tests the ability of the nesting of the driver.
+def test_driver_variable_alloc_mixed_naming(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Tests the naming in a mixed setting.
 
-    Note this test does the creation of subcontext manually, which is not recommended.
+    If `update_var_mapping=True` is given, then the naming will skip variables, see also `test_driver_variable_alloc_mixed_naming2()`.
     """
+    #                        *       b       c       d      *      f      g
+    for i, var in enumerate([narray, array1, array2, scal1, nscal, scal2, scal3]):
+        sdfg_name = translation_driver.add_array(var, update_var_mapping=True)
+        sdfg_var = translation_driver.get_array(sdfg_name)
+        if var.name is None:
+            assert sdfg_name == chr(97 + i)
+        else:
+            assert sdfg_name == var.name
+        assert isinstance(sdfg_var, Array)  # Everything is now an array
+        assert sdfg_var.shape == ((1,) if var.shape == () else var.shape)
+        assert sdfg_var.dtype == var.dtype
+
+
+def test_driver_variable_alloc_mixed_naming2(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Tests the naming in a mixed setting.
+
+    This time we do not use `update_var_mapping=True`, instead it now depends on the name.
+    This means that automatic naming will now again include all, letters, but not in a linear order.
+    """
+    letoff = 0
+    #             *      a        b       c      *      d     e
+    for var in [narray, array1, array2, scal1, nscal, scal2, scal3]:
+        sdfg_name = translation_driver.add_array(var, update_var_mapping=var.name is None)
+        sdfg_var = translation_driver.get_array(sdfg_name)
+        if var.name is None:
+            assert sdfg_name == chr(97 + letoff)
+            letoff += 1
+        else:
+            assert sdfg_name == var.name
+        assert isinstance(sdfg_var, Array)  # Everything is now an array
+        assert sdfg_var.shape == ((1,) if var.shape == () else var.shape)
+        assert sdfg_var.dtype == var.dtype
+
+
+def test_driver_variable_alloc_prefix_naming(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Using the prefix to name variables."""
+    prefix_1 = "__my_special_prefix"
+    exp_name_1 = prefix_1 + "a"
+    sdfg_name_1 = translation_driver.add_array(
+        array1, name_prefix=prefix_1, update_var_mapping=False
+    )
+    assert exp_name_1 == sdfg_name_1
 
-    # This is the parent driver.
-    driver = translator.JaxprTranslationDriver(
-        sub_translators=translator.get_regsitered_primitive_translators()
+    # Because `update_var_mapping` is `False` above, 'a' will be reused.
+    prefix_2 = "__my_special_prefix_second_"
+    exp_name_2 = prefix_2 + "a"
+    sdfg_name_2 = translation_driver.add_array(
+        array1, name_prefix=prefix_2, update_var_mapping=False
     )
-    assert not driver.is_allocated(), "Driver should not be allocated."
-
-    # We allocate the driver directly, because we need to set some internals.
-    #  This is also the reason why we do not use the fixture.
-    org_res_names = {"a", "b"}
-    driver._allocate_translation_ctx("driver", reserved_names=org_res_names)
-    driver._ctx.inp_names = ("a", "b")
-    driver._ctx.out_names = ("c", "d")
-    assert driver.is_allocated()
-    assert len(driver._ctx_stack) == 1
-    assert driver._reserved_names == org_res_names
-
-    # Now we increase the stack by one.
-    org_ctx = driver._ctx
-    driver._allocate_translation_ctx("driver2")
-    driver._ctx.inp_names = ("e", "f")
-    driver._ctx.out_names = ("g", "h")
-    assert driver.is_allocated()
-    assert len(driver._ctx_stack) == 2
-    assert driver._ctx is driver._ctx_stack[-1]
-    assert driver._ctx is not driver._ctx_stack[0]
-
-    assert org_ctx.rev_idx < driver.rev_idx  # type: ignore[operator]  # Type confusion
-
-    # Now we go back one state, i.e. pretend that we are done with translating the nested jaxpr.
-    driver._clear_translation_ctx()
-    assert driver._ctx is org_ctx
-    assert len(driver._ctx_stack) == 1
-    assert driver._reserved_names == org_res_names
+    assert exp_name_2 == sdfg_name_2
+
+
+def test_driver_variable_alloc_auto_naming_wrapped(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Tests the variable naming if we have more than 26 variables."""
+    single_letters = [chr(x) for x in range(97, 123)]
+    i = 0
+    for let1 in ["", *single_letters[1:]]:  # Note `z` is followed by `ba` and not by `aa`.
+        for let2 in single_letters:
+            i += 1
+            # Create a variable and enter it into the variable naming.
+            var = JaCeVar(shape=(19, 19), dtype=dace.float64)
+            sdfg_name = translation_driver.add_array(arg=var, update_var_mapping=True)
+            mapped_name = translation_driver.map_jax_var_to_sdfg(var)
+            assert (
+                sdfg_name == mapped_name
+            ), f"Mapping for '{var}' failed, expected '{sdfg_name}' got '{mapped_name}'."
+
+            # Get the name that we really expect, we must also handle some situations.
+            exp_name = let1 + let2
+            if exp_name in util.FORBIDDEN_SDFG_VAR_NAMES:
+                exp_name = "__jace_forbidden_" + exp_name
+            assert (
+                exp_name == sdfg_name
+            ), f"Automated naming failed, expected '{exp_name}' but got '{sdfg_name}'."
+
+
+def test_driver_nested(translation_driver: translator.JaxprTranslationDriver) -> None:
+    """Tests the ability of the nesting of the driver."""
+
+    # Now add a variable to the current subtext.
+    name_1 = translation_driver.add_array(array1, update_var_mapping=True)
+    assert name_1 == "a"
+    assert translation_driver.map_jax_var_to_sdfg(array1) == name_1
+
+    # For the sake of doing it add a new state to the SDFG.
+    translation_driver.append_new_state("sake_state")
+    assert translation_driver.sdfg.number_of_nodes() == 2
+    assert translation_driver.sdfg.number_of_edges() == 1
+
+    # Now we go one subcontext deeper; note we do this manually which should not be done.
+    translation_driver._allocate_translation_ctx("driver")
+    assert len(translation_driver._ctx_stack) == 2
+    assert translation_driver.sdfg.name == "driver"
+    assert translation_driver.sdfg.number_of_nodes() == 1
+    assert translation_driver.sdfg.number_of_edges() == 0
+    assert not translation_driver.is_root_translator()
+
+    # Because we have a new SDFG the mapping to previous SDFG does not work,
+    #  regardless the fact that it still exists.
+    with pytest.raises(
+        expected_exception=KeyError,
+        match=re.escape(
+            f"Jax variable '{array1}' was supposed to map to '{name_1}', but no such SDFG variable is known."
+        ),
+    ):
+        _ = translation_driver.map_jax_var_to_sdfg(array1)
 
-    # Now if we fully deallocate then we expect that it is fully deallocated.
-    driver._clear_translation_ctx()
-    assert len(driver._ctx_stack) == 0
-    assert driver._reserved_names is None
+    # Because the SDFGs are distinct it is possible to add `array1` to the nested one.
+    #  However, it is not able to update the mapping.
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=re.escape(
+            f"Tried to create the mapping '{array1} -> {name_1}', but the variable is already mapped."
+        ),
+    ):
+        _ = translation_driver.add_array(array1, update_var_mapping=True)
+    assert name_1 not in translation_driver.sdfg.arrays
+
+    # Without updating the mapping it is possible create the variable.
+    assert name_1 == translation_driver.add_array(array1, update_var_mapping=False)
+
+    # Now add a new variable, the map is shared, so a new name will be generated.
+    name_2 = translation_driver.add_array(array2, update_var_mapping=True)
+    assert name_2 == "b"
+    assert name_2 == translation_driver.map_jax_var_to_sdfg(array2)
+
+    # Now we go one stack level back.
+    translation_driver._clear_translation_ctx()
+    assert len(translation_driver._ctx_stack) == 1
+    assert translation_driver.sdfg.number_of_nodes() == 2
+    assert translation_driver.sdfg.number_of_edges() == 1
+
+    # Again the variable that was declared in the last stack is now no longer present.
+    #  Note if the nested SDFG was integrated into the parent SDFG it would be accessible
+    with pytest.raises(
+        expected_exception=KeyError,
+        match=re.escape(
+            f"Jax variable '{array2}' was supposed to map to '{name_2}', but no such SDFG variable is known."
+        ),
+    ):
+        _ = translation_driver.map_jax_var_to_sdfg(array2)
+    assert name_2 == translation_driver._jax_name_map[array2]
+
+    # Now add a new variable, since the map is shared, we will now get the next name.
+    name_3 = translation_driver.add_array(array3, update_var_mapping=True)
+    assert name_3 == "c"
+    assert name_3 == translation_driver.map_jax_var_to_sdfg(array3)
 
 
 def test_driver_append_state(translation_driver: translator.JaxprTranslationDriver) -> None:
@@ -105,8 +255,8 @@ def test_driver_append_state(translation_driver: translator.JaxprTranslationDriv
     terminal_state_1: dace.SDFGState = translation_driver.append_new_state("terminal_state_1")
     assert sdfg.number_of_nodes() == 2
     assert sdfg.number_of_edges() == 1
-    assert terminal_state_1 is translation_driver.terminal_sdfg_state
-    assert translation_driver.terminal_sdfg_state is translation_driver._ctx.terminal_state
+    assert terminal_state_1 is translation_driver._terminal_sdfg_state
+    assert translation_driver._terminal_sdfg_state is translation_driver._ctx.terminal_state
     assert translation_driver._ctx.start_state is sdfg.start_block
     assert translation_driver._ctx.start_state is not terminal_state_1
     assert next(iter(sdfg.edges())).src is sdfg.start_block
@@ -118,7 +268,7 @@ def test_driver_append_state(translation_driver: translator.JaxprTranslationDriv
     )
     assert sdfg.number_of_nodes() == 3
     assert sdfg.number_of_edges() == 2
-    assert terminal_state_2 is translation_driver.terminal_sdfg_state
+    assert terminal_state_2 is translation_driver._terminal_sdfg_state
     assert sdfg.out_degree(terminal_state_1) == 1
     assert sdfg.out_degree(terminal_state_2) == 0
     assert sdfg.in_degree(terminal_state_2) == 1
@@ -128,232 +278,10 @@ def test_driver_append_state(translation_driver: translator.JaxprTranslationDriv
     non_terminal_state: dace.SDFGState = translation_driver.append_new_state(
         "non_terminal_state", prev_state=terminal_state_1
     )
-    assert translation_driver.terminal_sdfg_state is not non_terminal_state
+    assert translation_driver._terminal_sdfg_state is not non_terminal_state
     assert sdfg.in_degree(non_terminal_state) == 1
     assert sdfg.out_degree(non_terminal_state) == 0
     assert next(iter(sdfg.in_edges(non_terminal_state))).src is terminal_state_1
 
 
-def test_driver_scalar(translation_driver: translator.JaxprTranslationDriver) -> None:
-    """This function tests the array creation routines, especially the scalar part.
-
-    However, it does so without using Jax variables.
-    """
-    # Since we do not have Jax variables, we are using JaCe substitute for it.
-
-    # Creating a scalar.
-    scal1_j = JaCeVar("scal1", (), dace.float64)
-    scal1_: str = translation_driver.add_array(
-        arg=scal1_j,
-        update_var_mapping=True,
-    )
-    scal1: Data = translation_driver.get_array(scal1_)
-    assert scal1 is translation_driver.get_array(scal1_j)
-    assert scal1_ == translation_driver.map_jax_var_to_sdfg(scal1_j)
-    assert isinstance(scal1, Scalar)
-    assert scal1_ == scal1_j.name
-    assert scal1.dtype == scal1_j.dtype
-
-    # Create a scalar and force it as an array
-    scal2_j = JaCeVar("scal2", (), dace.int64)
-    scal2_: str = translation_driver.add_array(
-        arg=scal2_j,
-        force_array=True,
-    )
-    scal2: Data = translation_driver.get_array(scal2_)
-    assert isinstance(scal2, Array)
-    assert scal2_ == scal2_j.name
-    assert scal2.shape == (1,)
-    assert scal2.strides == (1,)
-    assert scal2.dtype == scal2_j.dtype
-
-    # Using a special name for the variable
-    scal3_j = JaCeVar("scal3", (), dace.int64)
-    scal3_n = "scal3_special_name"
-    scal3_: str = translation_driver.add_array(
-        arg=scal3_j,
-        alt_name=scal3_n,
-        update_var_mapping=True,
-    )
-    assert scal3_ == scal3_n
-    assert scal3_ == translation_driver.map_jax_var_to_sdfg(scal3_j)
-
-    # Test the prefix functionality
-    scal4_j = JaCeVar("scal4", (), dace.float64)
-    scal4_p = "my_prefix"
-    scal4_n = "scal4_unused_name"
-    with pytest.raises(
-        expected_exception=ValueError,
-        match=re.escape(
-            f"Specified 'name_prefix' ('{scal4_p}') but passed '{scal4_n}' as 'alt_name'."
-        ),
-    ):
-        scal4_: str = translation_driver.add_array(
-            arg=scal4_j,
-            alt_name=scal4_n,
-            name_prefix=scal4_p,
-        )
-    # Now create it correctly
-    scal4_ = translation_driver.add_array(
-        arg=scal4_j,
-        name_prefix=scal4_p,
-    )
-    assert scal4_.startswith(scal4_p)
-    assert scal4_j.name in scal4_
-
-    # Test the strides, or the inability to use it.
-    scal5_j = JaCeVar("scal5", (), dace.float64)
-    with pytest.raises(
-        expected_exception=ValueError,
-        match="Specified a stride for a scalar.",
-    ):
-        scal5_: str = translation_driver.add_array(arg=scal5_j, strides=(3,))
-
-    # test the force jax name feature
-    scal6_j = JaCeVar("scal6", (), dace.float64)
-    scal6_n: str = "scal6_name"
-    scal6_np: str = "scal6_name_prefix"
-    with pytest.raises(
-        expected_exception=ValueError,
-        match=f"Specified 'force_jax_name', but passed '{scal6_n}' as 'alt_name'.",
-    ):
-        scal6_: str = translation_driver.add_array(
-            arg=scal6_j,
-            alt_name=scal6_n,
-            force_jax_name=True,
-        )
-    with pytest.raises(
-        expected_exception=ValueError,
-        match=f"Specified 'force_jax_name', but passed '{scal6_np}' as 'name_prefix'.",
-    ):
-        scal6_ = translation_driver.add_array(
-            arg=scal6_j,
-            name_prefix=scal6_np,
-            force_jax_name=True,
-        )
-    with pytest.raises(
-        expected_exception=ValueError,
-        match="Specified `force_jax_name` but also wanted a new name.",
-    ):
-        scal6_ = translation_driver.add_array(
-            arg=scal6_j,
-            force_jax_name=True,
-            find_new_name=True,
-        )
-    scal6_ = translation_driver.add_array(
-        arg=scal6_j,
-        force_jax_name=True,
-    )
-    assert scal6_ == scal6_j.name
-
-
-def test_driver_array(translation_driver: translator.JaxprTranslationDriver) -> None:
-    """This function tests the array creation routines.
-
-    However, it does so without using Jax variables.
-    """
-    # Allocating an array
-    arr1_j = JaCeVar("arr1", (5, 3), dace.float32)
-    arr1_: str = translation_driver.add_array(
-        arg=arr1_j,
-    )
-    arr1: Data = translation_driver.get_array(arr1_)
-    assert isinstance(arr1, Array)
-    assert arr1_ == arr1_j.name
-    assert arr1.shape == arr1_j.shape
-    assert arr1.strides == (3, 1)
-    assert arr1.dtype == arr1_j.dtype
-
-    # Create a variable that has a sdfg name that is already known.
-    arr2_j = JaCeVar(arr1_, (10,), dace.float64)
-    with pytest.raises(
-        expected_exception=ValueError,
-        match=f"Can't create variable '{arr2_j.name}', variable is already created.",
-    ):
-        arr2_: str = translation_driver.add_array(arg=arr2_j)
-    with pytest.raises(expected_exception=ValueError, match=f"Variable '{arr1_}' already exists."):
-        # `alt_name` will not work because name still exists.
-        arr2_ = translation_driver.add_array(arg=arr2_j, alt_name=arr2_j.name)
-    # However, specifying `find_new_name` will solve this issue
-    arr2_ = translation_driver.add_array(
-        arg=arr2_j,
-        find_new_name=True,
-    )
-    assert arr2_.startswith("_jax_variable__" + arr2_j.name)
-
-    # Create a variable that has a custom stride
-    arr3_j = JaCeVar("arr3", (5, 1, 3), dace.float64)
-    arr3_st = (5, 3, 2)
-    arr3_: str = translation_driver.add_array(
-        arg=arr3_j,
-        strides=arr3_st,
-    )
-    arr3: Data = translation_driver.get_array(arr3_)
-    assert isinstance(arr3, Array)
-    assert arr3.shape == arr3_j.shape
-    assert arr3.strides == arr3_st
-
-
-def test_driver_array2() -> None:
-    """This function tests the array creation routine with respect to the automatic naming.
-
-    Todo:
-        - Literals.
-    """
-    # This is the parent driver.
-    driver = translator.JaxprTranslationDriver(
-        sub_translators=translator.get_regsitered_primitive_translators()
-    )
-    assert not driver.is_allocated(), "Driver should not be allocated."
-
-    # Creating JaCe Variables with empty names, forces the driver to use the
-    #  Jax naming algorithm.
-    var_a = JaCeVar("", (10, 19), dace.int64)
-    var_b = JaCeVar("", (10, 909), dace.float16)
-
-    # These are the reserved names, so `a` should be named as is, but `b` should have another name.
-    org_res_names = {"b"}
-    driver._allocate_translation_ctx("driver", reserved_names=org_res_names)
-
-    # These are the expected names
-    exp_names = [
-        "a",
-        "_jax_variable__b__0",
-    ]
-    res_names = driver.create_jax_var_list(
-        [var_a, var_b],
-        only_creation=True,
-    )
-    assert res_names == exp_names, f"Expected names '{exp_names}' but got '{res_names}'."
-    assert len(driver._jax_name_map) == 2
-
-    # Try to create variable `c` and `a`, however, since variable `a` already exists it will fail.
-    #  However, currently the variable `c` will be created, this might change in the future.
-    var_c = JaCeVar("", (10, 19), dace.int64)
-    with pytest.raises(
-        expected_exception=ValueError,
-        match=re.escape(f"'only_creation' given '{var_a}' already exists."),
-    ):
-        res_names = driver.create_jax_var_list(
-            [var_c, var_a],
-            only_creation=True,
-        )
-    assert len(driver._jax_name_map) == 3, f"{driver._jax_name_map}"
-    assert driver._jax_name_map[var_c] == "c"
-
-    # Now we test the only collection mode
-    res_names = driver.create_jax_var_list(
-        [var_c, var_a],
-        prevent_creation=True,
-    )
-    assert len(driver._jax_name_map) == 3, f"{driver._jax_name_map}"
-    assert res_names == ["c", "a"]
-
-    # Now also the mixed mode, i.e. between collecting and creating.
-    var_d = JaCeVar("", (10, 19), dace.int64)
-    exp_names = ["c", "d", "a"]
-    res_names = driver.create_jax_var_list(
-        [var_c, var_d, var_a],
-    )
-    assert len(driver._jax_name_map) == 4
-    assert exp_names == res_names
+# TODO: Failing tests

From 4ec34be2201029418a28a53da00217fe058d8003 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 13:10:57 +0200
Subject: [PATCH 189/458] Fixed a small issue in the `propose_jax_name()`
 function.

---
 src/jace/util/jax_helper.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index d86e5d6..ba0127d 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -211,10 +211,10 @@ def propose_jax_name(
     jax_name = ""
     while len(jax_name) == 0 or c != 0:
         c, i = c // 26, c % 26
-        jax_name = chr(97 + i % 26) + jax_name
+        jax_name = chr(97 + i) + jax_name
     jax_name = jax_name + getattr(jax_var, "suffix", "")
 
-    if jax_name is util.FORBIDDEN_SDFG_VAR_NAMES:
+    if jax_name in util.FORBIDDEN_SDFG_VAR_NAMES:
         jax_name = f"__jace_forbidden_{jax_name}"
         assert jax_name not in util.FORBIDDEN_SDFG_VAR_NAMES
     return jax_name

From db3890ca2f0f5724b0a39a00813dc00d15e1f131 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 13:12:07 +0200
Subject: [PATCH 190/458] Updated the
 `JaxprTranslatorDriver::add_jax_name_mapping()` function.

Before, the behaviour was that if the mapping was already known but formally did not change no error was generated.
However, this has some issues when looking at nested stuff, so I promoted it to an error.

It would be possible to generate a more specific error but currently not.
---
 src/jace/translator/jaxpr_translator_driver.py | 9 +++------
 1 file changed, 3 insertions(+), 6 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index abf4478..80cebb2 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -281,9 +281,9 @@ def add_jax_name_mapping(
         jax_var: jax_core.Var | util.JaCeVar,
         sdfg_name: str,
     ) -> JaxprTranslationDriver:
-        """Creates a mapping between `jax_var` to `sdfg_name`.
+        """Creates a new mapping between `jax_var` to `sdfg_name`.
 
-        This function updates the internal map of `self` and after the call `self.map_jax_var_to_sdfg()` will identify `jax_var` with `sdfg_name`.
+        If the mapping already exists an error will be generated.
         This function is not able to delete a variable mapping that was established before, for this use TBA.
 
         Args:
@@ -293,11 +293,8 @@ def add_jax_name_mapping(
         assert len(sdfg_name) > 0
 
         if jax_var in self._jax_name_map:
-            if self._jax_name_map[jax_var] == sdfg_name:  # noops.
-                return self
             raise ValueError(
-                f"Tried to create the mapping '{jax_var} -> {sdfg_name}', but '{jax_var}'"
-                f" already points to '{self.map_jax_var_to_sdfg(jax_var)}'."
+                f"Tried to create the mapping '{jax_var} -> {sdfg_name}', but the variable is already mapped."
             )
         if sdfg_name not in self._ctx.sdfg.arrays:
             raise KeyError(f"Mapping '{jax_var} -> {sdfg_name}': SDFG target unknown.")

From ee1d5ad6a8de990c79783c34d052b08f3c5651b6 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 13:14:34 +0200
Subject: [PATCH 191/458] Updated how `JaxprTranslatorDriver::add_array()`
 works.

If teh function fails to establish a mapping then the SDFG variable is removed.
---
 src/jace/translator/jaxpr_translator_driver.py | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 80cebb2..043cf58 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -362,7 +362,12 @@ def add_array(
         )
 
         if update_var_mapping:
-            self.add_jax_name_mapping(jax_var=arg, sdfg_name=arg_name)
+            try:
+                # If the mapping fails, remove the variable from the SDFG.
+                self.add_jax_name_mapping(jax_var=arg, sdfg_name=arg_name)
+            except:
+                del self._ctx.sdfg.arrays[arg_name]
+                raise
 
         return arg_name
 

From 009f59818325a0004b8f87035494d9684ce17923 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 13:44:08 +0200
Subject: [PATCH 192/458] Since the `propose_jax_name()` function was made more
 inteligent, I was able to remove some tests.

---
 src/jace/translator/jaxpr_translator_driver.py | 8 +++-----
 src/jace/util/jax_helper.py                    | 1 -
 2 files changed, 3 insertions(+), 6 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 043cf58..6a85ea1 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -341,13 +341,11 @@ def add_array(
         # Propose a name and if needed extend it.
         arg_name = util.propose_jax_name(arg, self._jax_name_map)
         if name_prefix is not None:
-            arg_name = name_prefix + arg_name
+            if not util.VALID_SDFG_VAR_NAME.fullmatch(name_prefix):
+                raise ValueError(f"add_array({arg}): Supplied invalid prefix '{name_prefix}'.")
+            arg_name = f"{name_prefix}{arg_name}"
 
         # final checks
-        if arg_name in util.FORBIDDEN_SDFG_VAR_NAMES:
-            raise ValueError(f"add_array({arg}): The proposed name '{arg_name}' is forbidden.")
-        if not util.VALID_SDFG_VAR_NAME.fullmatch(arg_name):
-            raise ValueError(f"add_array({arg}): The proposed name '{arg_name} is invalid.")
         if arg_name in self._ctx.sdfg.arrays:
             raise ValueError(f"add_array({arg}): The proposed name '{arg_name}', is used.")
 
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index ba0127d..01eaa8f 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -216,5 +216,4 @@ def propose_jax_name(
 
     if jax_name in util.FORBIDDEN_SDFG_VAR_NAMES:
         jax_name = f"__jace_forbidden_{jax_name}"
-        assert jax_name not in util.FORBIDDEN_SDFG_VAR_NAMES
     return jax_name

From 0d92f5b188a3cdfaec1badfa8f6f792d476ec337 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 13:45:55 +0200
Subject: [PATCH 193/458] Updated the tests for the driver.

They are now a bit cleanerer and shorter.
---
 tests/test_jaxpr_translator_driver.py | 57 ++++++++++++++++++++++++++-
 1 file changed, 56 insertions(+), 1 deletion(-)

diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 8ad340f..1789dcd 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -148,6 +148,14 @@ def test_driver_variable_alloc_prefix_naming(
     )
     assert exp_name_2 == sdfg_name_2
 
+    # Now we use a named variables, which are also affected.
+    prefix_3 = "__my_special_prefix_third_named_"
+    exp_name_3 = prefix_3 + nscal.name  # type: ignore[operator]  # `.name` is not `None`.
+    sdfg_name_3 = translation_driver.add_array(
+        nscal, name_prefix=prefix_3, update_var_mapping=False
+    )
+    assert exp_name_3 == sdfg_name_3
+
 
 def test_driver_variable_alloc_auto_naming_wrapped(
     translation_driver: translator.JaxprTranslationDriver,
@@ -284,4 +292,51 @@ def test_driver_append_state(translation_driver: translator.JaxprTranslationDriv
     assert next(iter(sdfg.in_edges(non_terminal_state))).src is terminal_state_1
 
 
-# TODO: Failing tests
+def test_driver_variable_multiple_variables(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """A simple test in which we try to add a variable that are known, but with a different name."""
+    # Now we will add `array1` and then different ways of updating it.
+    narray1: str = translation_driver.add_array(array1, update_var_mapping=True)
+
+    # It will fail if we use the prefix, because we also want to update.
+    prefix = "__jace_prefix"
+    prefix_expected_name = prefix + narray1
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=re.escape(
+            f"Tried to create the mapping '{array1} -> {prefix_expected_name}', but the variable is already mapped."
+        ),
+    ):
+        _ = translation_driver.add_array(array1, update_var_mapping=True, name_prefix=prefix)
+    assert prefix_expected_name not in translation_driver.sdfg.arrays
+
+    # But if we do not want to update it then it works.
+    prefix_sdfg_name = translation_driver.add_array(
+        array1, update_var_mapping=False, name_prefix=prefix
+    )
+    assert prefix_expected_name in translation_driver.sdfg.arrays
+    assert narray1 == translation_driver.map_jax_var_to_sdfg(array1)
+
+
+def test_driver_variable_invalid_prefix(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Use invalid prefix."""
+    # It will fail if we use the prefix, because we also want to update.
+    for iprefix in ["0_", "_ja ", "_!"]:
+        with pytest.raises(
+            expected_exception=ValueError,
+            match=re.escape(f"add_array({array1}): Supplied invalid prefix '{iprefix}'."),
+        ):
+            _ = translation_driver.add_array(array1, update_var_mapping=False, name_prefix=iprefix)
+        assert len(translation_driver.sdfg.arrays) == 0
+
+
+def test_driver_jace_var() -> None:
+    """Simple tests about the `JaCeVar` objects."""
+    for iname in ["do", "", "_ _", "9al", "_!"]:
+        with pytest.raises(
+            expected_exception=ValueError, match=re.escape(f"Supplied the invalid name '{iname}'.")
+        ):
+            _ = JaCeVar((), dace.int8, name=iname)

From fec6f509d84a783b99808a9abe2733f1d04655b6 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 14:42:10 +0200
Subject: [PATCH 194/458] Updated the tests to manage the translators.

---
 tests/test_subtranslator_helper.py | 273 +++++++++++++----------------
 1 file changed, 124 insertions(+), 149 deletions(-)

diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 05dead7..3c0897a 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -10,14 +10,11 @@
 from __future__ import annotations
 
 import re
-from collections.abc import Mapping, MutableSequence, Sequence
 from typing import Any
 
-import dace
 import jax
 import numpy as np
 import pytest
-from jax import core as jax_core
 
 import jace
 from jace import translator
@@ -29,209 +26,187 @@
 
 @pytest.fixture(autouse=True)
 def _conserve_builtin_translators():
-    """Decorator that restores the previous state of the build ins."""
+    """Restores the set of registered subtranslators after a test."""
     initial_translators = translator.get_regsitered_primitive_translators()
     yield
     translator.set_active_primitive_translators_to(initial_translators)
 
 
-def _dict_struct(dict_: Mapping[str, Any]) -> Sequence[tuple[str, int]]:
-    return tuple(sorted(((k, id(v)) for k, v in dict_.items()), key=lambda X: X[0]))
+@pytest.fixture()
+def no_builtin_translators() -> str:
+    """This fixture can be used if the test does not want any builtin translators."""
+    initial_translators = translator.get_regsitered_primitive_translators()
+    translator.set_active_primitive_translators_to({})
+    yield "DUMMY_VALUE"
+    translator.set_active_primitive_translators_to(initial_translators)
 
 
-def test_are_subtranslators_imported():
-    """Tests if something is inside the list of subtranslators."""
-    assert len(get_regsitered_primitive_translators()) > 1
+# These are definitions of some Subtranslators that can be used to test things.
+class SubTrans1(translator.PrimitiveTranslator):
+    @property
+    def primitive(self):
+        return "non_existing_primitive1"
 
+    def __call__(self) -> None:  # type: ignore[override]  # Arguments
+        raise NotImplementedError
 
-def test_subtranslatior_managing():
-    """Ensures the functionality of the subtranslator managing."""
 
-    # TODO(phimuell): Make this more friendly; See blow
-    builtin_subtrans = get_regsitered_primitive_translators()
-    builin_struct = _dict_struct(builtin_subtrans)
+class SubTrans2(translator.PrimitiveTranslator):
+    @property
+    def primitive(self):
+        return "non_existing_primitive2"
 
-    class SubTrans1(translator.PrimitiveTranslator):
-        @property
-        def primitive(self):
-            return "non_existing_primitive1"
+    def __call__(self) -> None:  # type: ignore[override]  # Arguments
+        raise NotImplementedError
 
-        def __call__(self) -> None:  # type: ignore[override]  # Arguments
-            raise NotImplementedError
 
-    # Ensures that we really return the object unmodified.
-    sub_trans1 = register_primitive_translator(SubTrans1())
-    assert sub_trans1 is get_regsitered_primitive_translators()["non_existing_primitive1"]
+# fmt: off
+def SubTrans3_Callable(*args: Any, **kwargs: Any) -> None:
+    raise NotImplementedError
+SubTrans3_Callable.primitive = "non_existing_primitive3" # type: ignore[attr-defined]
+# fmt: on
 
-    class SubTrans2(translator.PrimitiveTranslator):
-        @property
-        def primitive(self):
-            return "non_existing_primitive2"
 
-        def __call__(self) -> None:  # type: ignore[override]  # Arguments
-            raise NotImplementedError
+def test_are_subtranslators_imported():
+    """Tests if something is inside the list of subtranslators."""
+    # Must be adapted if new primitives are implemented.
+    assert len(get_regsitered_primitive_translators()) == 37
 
-    # Wrong name
-    sub_trans2_instance = SubTrans2()
-    with pytest.raises(
-        expected_exception=TypeError,
-        match=re.escape(
-            f"Translator's primitive '{sub_trans2_instance.primitive}' doesn't match the supplied 'not_non_existing_primitive2'."
-        ),
-    ):
-        register_primitive_translator(
-            sub_trans2_instance,
-            primitive="not_non_existing_primitive2",
-        )
-
-    # But if the correct name is specified it works.
-    register_primitive_translator(
-        sub_trans2_instance,
-        primitive="non_existing_primitive2",
-    )
 
-    @register_primitive_translator(primitive="non_existing_primitive3")
-    def non_existing_primitive_translator_3(
-        driver: translator.JaxprTranslationDriver,
-        in_var_names: Sequence[str | None],
-        out_var_names: MutableSequence[str],
-        eqn: jax_core.JaxprEqn,
-        eqn_state: dace.SDFGState,
-    ) -> dace.SDFGState | None:
-        raise NotImplementedError
+def test_subtranslatior_managing(no_builtin_translators):
+    """Basic functionality of the subtranslators."""
+    original_active_subtrans = get_regsitered_primitive_translators()
+    assert len(original_active_subtrans) == 0
 
-    assert non_existing_primitive_translator_3.primitive == "non_existing_primitive3"
+    # Create the classes.
+    sub1 = SubTrans1()
+    sub2 = SubTrans2()
 
-    curr1_subtrans = get_regsitered_primitive_translators()
-    curr1_subtrans_mod = get_regsitered_primitive_translators()
-    assert curr1_subtrans is not builtin_subtrans
-    assert curr1_subtrans is not curr1_subtrans_mod
-    assert _dict_struct(curr1_subtrans) != builin_struct
-    assert _dict_struct(curr1_subtrans) == _dict_struct(curr1_subtrans_mod)
+    # These are all primitive translators
+    prim_translators = [sub1, sub2, SubTrans3_Callable]
 
-    for i in [1, 2, 3]:
-        pname = f"non_existing_primitive{i}"
-        assert pname in curr1_subtrans, f"Expected to find '{pname}'."
-        curr1_subtrans_mod.pop(pname)
-    assert builin_struct == _dict_struct(curr1_subtrans_mod)
+    # Add the instances.
+    for sub in prim_translators:
+        assert register_primitive_translator(sub) is sub
+
+    # Tests if they were correctly registered
+    active_subtrans = get_regsitered_primitive_translators()
+    for expected in prim_translators:
+        assert active_subtrans[expected.primitive] is expected
+    assert len(active_subtrans) == 3
+
+
+def test_subtranslatior_managing_callable(no_builtin_translators):
+    """If we add a callable, and have no `.primitive` property defined."""
+
+    def noname_translator_callable(*args: Any, **kwargs: Any) -> None:
+        raise NotImplementedError
 
-    # Try adding instance and if we can overwrite.
-    sub_trans1_instance = SubTrans1()
+    # This will not work because `noname_translator_callable()` does not have a `.primitive` attribute.
     with pytest.raises(
         expected_exception=ValueError,
-        match=re.escape(
-            "Explicit override=True needed for primitive 'non_existing_primitive1' to overwrite existing one."
-        ),
+        match=re.escape(f"Missing primitive name for '{noname_translator_callable}'"),
     ):
-        register_primitive_translator(sub_trans1_instance, overwrite=False)
+        register_primitive_translator(noname_translator_callable)
+    assert len(get_regsitered_primitive_translators()) == 0
+
+    # This works because there is a primitive specified, it will also update the object.
+    prim_name = "noname_translator_callable_prim"
+    assert register_primitive_translator(noname_translator_callable, primitive=prim_name)
+    assert noname_translator_callable.primitive == prim_name
 
-    # Now adding it forcefully, this should also change a lot.
-    register_primitive_translator(sub_trans1_instance, overwrite=True)
 
-    curr2_subtrans = get_regsitered_primitive_translators()
-    assert curr2_subtrans is not builtin_subtrans
-    assert curr2_subtrans is not curr1_subtrans
-    assert _dict_struct(curr2_subtrans) != builin_struct
-    assert _dict_struct(curr2_subtrans) != _dict_struct(curr1_subtrans)
-    assert curr2_subtrans["non_existing_primitive1"] is sub_trans1_instance
+def test_subtranslatior_managing_failing_wrong_name(no_builtin_translators):
+    """Tests if how it works with wrong name."""
+    sub1 = SubTrans1()
+    sub2 = SubTrans2()
 
-    # Try to register a function as translator, that already has a primitive property.
     with pytest.raises(
         expected_exception=TypeError,
         match=re.escape(
-            f"Translator's primitive '{non_existing_primitive_translator_3.primitive}' doesn't match the supplied 'non_existing_primitive1'."
+            f"Translator's primitive '{sub1.primitive}' doesn't match the supplied '{sub2.primitive}'."
         ),
     ):
-        register_primitive_translator(
-            non_existing_primitive_translator_3,
-            primitive="non_existing_primitive1",
-            overwrite=False,
-        )
+        register_primitive_translator(sub1, primitive=sub2.primitive)
+
+
+def test_subtranslatior_managing_overwriting():
+    """Tests if we are able to overwrite something."""
+    current_add_translator = get_regsitered_primitive_translators()["add"]
 
-    # This would work because it has the same primitive name, but it fails because overwrite is False
+    def useless_add_translator(*args: Any, **kwargs: Any) -> None:
+        raise NotImplementedError
+
+    useless_add_translator.primitive = "add"
+
+    # This will not work because it is not overwritten.
     with pytest.raises(
         expected_exception=ValueError,
         match=re.escape(
-            "Explicit override=True needed for primitive 'non_existing_primitive3' to overwrite existing one."
+            "Explicit override=True needed for primitive 'add' to overwrite existing one."
         ),
     ):
-        register_primitive_translator(
-            non_existing_primitive_translator_3,
-            primitive="non_existing_primitive3",
-            overwrite=False,
-        )
-
-    register_primitive_translator(
-        non_existing_primitive_translator_3, primitive="non_existing_primitive3", overwrite=True
+        register_primitive_translator(useless_add_translator)
+    assert current_add_translator is get_regsitered_primitive_translators()["add"]
+
+    # Now we use overwrite, thus it will now work.
+    assert useless_add_translator is register_primitive_translator(
+        useless_add_translator, overwrite=True
     )
 
 
-def test_subtranslatior_managing_2():
-    """Shows that we are really able to overwrite stuff"""
+def test_subtranslatior_managing_overwriting_2(no_builtin_translators):
+    """Again an overwriting test, but this time a bit more complicated."""
     jax.config.update("jax_enable_x64", True)
 
-    class NonAddTranslator(translator.PrimitiveTranslator):
-        @property
-        def primitive(self):
-            return "add"
-
-        def __call__(self, *args, **kwargs) -> None:
-            raise NotImplementedError("The 'NonAddTranslator' can not translate anything.")
+    trans_cnt = [0]
 
-    register_primitive_translator(NonAddTranslator(), overwrite=True)
+    @register_primitive_translator(primitive="add")
+    def still_but_less_useless_add_translator(*args: Any, **kwargs: Any) -> None:
+        trans_cnt[0] += 1
+        return
 
     @jace.jit
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A + B
+    def foo(A):
+        B = A + 1
+        C = B + 1
+        D = C + 1
+        return D + 1
 
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
+    _ = foo.lower(1)
+    assert trans_cnt[0] == 4
 
-    with pytest.raises(
-        expected_exception=NotImplementedError,
-        match=re.escape("The 'NonAddTranslator' can not translate anything."),
-    ):
-        _ = testee.lower(A, B)
 
+def test_subtranslatior_managing_decoupling():
+    """Shows that we have proper decoupling.
 
-def test_subtranslatior_managing_3():
-    """Shows proper decoupling."""
+    I.e. changes to the global state, does not affect already annotated functions.
+    """
     jax.config.update("jax_enable_x64", True)
 
-    class NonAddTranslator(translator.PrimitiveTranslator):
-        @property
-        def primitive(self):
-            return "add"
-
-        def __call__(self, *args, **kwargs) -> None:
-            raise NotImplementedError("The 'NonAddTranslator' can not translate anything at all.")
-
-    used_sub_trans = get_regsitered_primitive_translators()
-    used_sub_trans["add"] = NonAddTranslator()
+    @jace.jit
+    def foo(A):
+        B = A + 1
+        C = B + 1
+        D = C + 1
+        return D + 1
 
-    @jace.jit(sub_translators=used_sub_trans)
-    def not_working_test(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A + B
+    @register_primitive_translator(primitive="add", overwrite=True)
+    def useless_add_translator(*args: Any, **kwargs: Any) -> None:
+        raise NotImplementedError("The 'useless_add_translator' was called as expected.")
 
-    # Now we again remove the add from the list, but this will not have an impact on the `not_working_test()`.
-    used_sub_trans.pop("add")
+    # Since `foo` was already constructed, a new registering can not change anything.
+    A = np.zeros((10, 10))
+    assert np.all(foo(A) == 4)
 
+    # But if we now annotate a new function, then we will get the uselss translator
     @jace.jit
-    def working_test(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A + B
-
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
+    def foo_fail(A):
+        B = A + 1
+        return B + 1
 
     with pytest.raises(
         expected_exception=NotImplementedError,
-        match=re.escape("The 'NonAddTranslator' can not translate anything at all."),
+        match=re.escape("The 'useless_add_translator' was called as expected."),
     ):
-        _ = not_working_test.lower(A, B)
-
-    # This works because the
-    working_test.lower(A, B)
-
-
-if __name__ == "__main__":
-    test_subtranslatior_managing()
+        _ = foo_fail.lower(A)

From af2d6c7bc21e4d28ff0a705e7fc01c49fd4509be Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 20 May 2024 15:13:57 +0200
Subject: [PATCH 195/458] Removed some unused stuff.

---
 src/jace/util/__init__.py | 2 --
 src/jace/util/traits.py   | 8 --------
 2 files changed, 10 deletions(-)

diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 925b58e..6bff211 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -29,7 +29,6 @@
     is_jaceified,
     is_jax_array,
     is_jaxified,
-    is_non_string_iterable,
     is_on_device,
     is_scalar,
 )
@@ -56,7 +55,6 @@
     "is_jaxified",
     "is_jax_array",
     "is_fully_addressable",
-    "is_non_string_iterable",
     "is_on_device",
     "is_scalar",
     "get_jax_var_dtype",
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 6bd3a81..6336f6d 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -9,7 +9,6 @@
 
 from __future__ import annotations
 
-from collections.abc import Iterable
 from typing import Any, TypeGuard
 
 import dace
@@ -22,13 +21,6 @@
 import jace.util as util
 
 
-class NonStringIterable(Iterable): ...
-
-
-def is_non_string_iterable(val: Any) -> TypeGuard[NonStringIterable]:
-    return isinstance(val, Iterable) and not isinstance(val, str)
-
-
 def is_jaceified(obj: Any) -> TypeGuard[jjax.JaceWrapped]:
     """Tests if `obj` is decorated by JaCe.
 

From fc1ccbcb5a7ff9e359a8595be7d92e2177fc2ffc Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 21 May 2024 06:57:04 +0200
Subject: [PATCH 196/458] Updated the managing functionality.

Before the `set_active_primitive_translators_to()` did not return anything.
Now it returns the previous state, which is, most of the times much more usefull.
---
 src/jace/translator/managing.py    | 18 +++++++++---------
 tests/test_subtranslator_helper.py |  3 +--
 2 files changed, 10 insertions(+), 11 deletions(-)

diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index cc79319..1f16641 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -13,7 +13,7 @@
 
 from __future__ import annotations
 
-from collections.abc import Callable, Mapping, MutableMapping
+from collections.abc import Callable, Mapping
 from typing import TYPE_CHECKING, cast
 
 
@@ -77,25 +77,25 @@ def wrapper(
     return wrapper if prim_translator is None else wrapper(prim_translator)
 
 
-def get_regsitered_primitive_translators() -> (
-    MutableMapping[str, translator.PrimitiveTranslatorCallable]
-):
-    """Returns the currently active view of all _currently_ installed primitive translators in Jace.
+def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTranslatorCallable]:
+    """Returns a view of the _currently_ active set of installed primitive translators in Jace.
 
     The returned mapping represents the active primitive translators at the time of calling.
-    This means that calls to `register_primitive_translator()` does not modify the returned object.
+    This means that calls to `register_primitive_translator()` or any other mutating call will not affect the returned object.
     """
     return _PRIMITIVE_TRANSLATORS_DICT.copy()
 
 
 def set_active_primitive_translators_to(
     new_translators: Mapping[str, translator.PrimitiveTranslatorCallable],
-) -> None:
-    """Exchange the currently active subtranslators in Jace with the one inside `new_translators`.
+) -> Mapping[str, translator.PrimitiveTranslatorCallable]:
+    """Exchange the currently active subtranslators in Jace with `new_translators` and returns the previous ones.
 
     This function allows you to restore a specific state that was obtained by a previous call to `get_regsitered_primitive_translators()`.
     The function is mainly intended for debugging.
     """
-    assert all(getattr(trans, "primitive", prim) for prim, trans in new_translators.items())
     global _PRIMITIVE_TRANSLATORS_DICT
+    assert all(getattr(trans, "primitive", prim) for prim, trans in new_translators.items())
+    previous_translators = _PRIMITIVE_TRANSLATORS_DICT
     _PRIMITIVE_TRANSLATORS_DICT = dict(new_translators)
+    return previous_translators
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 3c0897a..316d342 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -35,8 +35,7 @@ def _conserve_builtin_translators():
 @pytest.fixture()
 def no_builtin_translators() -> str:
     """This fixture can be used if the test does not want any builtin translators."""
-    initial_translators = translator.get_regsitered_primitive_translators()
-    translator.set_active_primitive_translators_to({})
+    initial_translators = translator.set_active_primitive_translators_to({})
     yield "DUMMY_VALUE"
     translator.set_active_primitive_translators_to(initial_translators)
 

From 1ce995135fdf15d8ca08a157de9ccdf14071c596 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 21 May 2024 07:48:32 +0200
Subject: [PATCH 197/458] Updated the `create_jax_var_list()` function.

---
 .../translator/jaxpr_translator_driver.py     | 24 ++++++++++---------
 1 file changed, 13 insertions(+), 11 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 6a85ea1..df0932a 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -316,13 +316,13 @@ def add_array(
         Regardless, if `arg` refers to an array or a scalar, the function will generate an array.
         Furthermore, the created variables are always transients.
 
-        By default this function will _not_ update the internal variable mapping.
-        However, by setting `update_var_mapping` to `True` the mapping will be created.
-
         By default the function will use `jace.util.propose_jax_name()` to derive the name that should be used.
         However, by passing a `JaCeVar` with a name it is possible to suggest a specific name.
         In addition it is possible to specify `name_prefix` to prefix name that would be used.
 
+        The function will not update the internal variable mapping.
+        If this is desired one can set `update_var_mapping`, for forcing this.
+
         Args:
             arg:                The Jax object for which a SDFG equivalent should be created.
             name_prefix:        If given it will be used as prefix for the name.
@@ -400,10 +400,12 @@ def create_jax_var_list(  # type: ignore[misc]
         """Creates SDFG variables for the listed Jax variables and returns their SDFG names.
 
         If a Jax variable already has a SDFG equivalent then the function will use this variable.
-        If no corresponding SDFG variable is known the function will create one using `add_array()`, with `update_var_mapping` set to `True`.
+        If no corresponding SDFG variable is known the function will create one using `add_array()`.
 
-        By setting `prevent_creation` the function will not create any new SDFG variables, if no already existing variable is found an error is generated.
-        By setting `only_creation` the function will only create new SDFG variables, if a variable was already processed an error will be created.
+        By setting `prevent_creation` the function will not create any new SDFG variables,
+        if no corresponding SDFG variable exists an error is generated.
+        By setting `only_creation` the function will only create new SDFG variables,
+        if a variable already have a corresponding SDFG variable an error will be created.
 
         By default literals cause an error.
         However, by setting `handle_literals` to `True` literals will will be included in the output with the value `None`.
@@ -413,16 +415,13 @@ def create_jax_var_list(  # type: ignore[misc]
             prevent_creation:   Never create a variable, all must already be known.
             only_creation:      Always create a variable, it is an error if one already exist.
             handle_literals:    Allow the processing of literals.
-            kwargs:             Will be forwarded to `self.add_array()` if a variable as to be created,
+            kwargs:             Will be forwarded to `self.add_array()` in case a variable is created.
 
         Todo:
             Rollback if the creation fails.
         """
         if only_creation and prevent_creation:
             raise ValueError("Specified both 'only_creation' and 'prevent_creation'.")
-        assert (
-            "update_var_mapping" not in kwargs
-        ), "You can not pass 'update_var_mapping' as argument to 'create_jax_var_list()'."
 
         ret_list: list[None | str] = []
         for jax_var in jax_var_list:
@@ -435,7 +434,7 @@ def create_jax_var_list(  # type: ignore[misc]
                 if prevent_creation and (mapped_sdfg_name is None):
                     raise ValueError(f"'prevent_creation' given but have to create '{jax_var}'.")
                 if mapped_sdfg_name is None:
-                    sdfg_name = self.add_array(arg=jax_var, update_var_mapping=True, **kwargs)
+                    sdfg_name = self.add_array(arg=jax_var, **kwargs)
                 elif only_creation:
                     raise ValueError(f"'only_creation' given '{jax_var}' already exists.")
                 else:
@@ -468,6 +467,7 @@ def _create_initial_input(
             jax_var_list=jaxpr.jaxpr.invars,
             only_creation=True,  # Nothing exists yet.
             handle_literals=False,  # Initial arguments are never literals
+            update_var_mapping=True,
         )
         # This forces the code to only accept kwargs; it is also part of "what a canonical sdfg" is.
         self.sdfg.arg_names = []
@@ -501,6 +501,7 @@ def _create_constants(
             only_creation=True,  # Nothing exists yet.
             handle_literals=False,  # It seems that constants are never literals.
             name_prefix="__const_",
+            update_var_mapping=True,
         )
         for sdfg_name, const_value in zip(sdfg_const_names, jaxpr.consts, strict=True):
             self._ctx.sdfg.add_constant(
@@ -597,6 +598,7 @@ def _translate_single_eqn(
         out_var_names: MutableSequence[str] = self.create_jax_var_list(
             eqn.outvars,
             only_creation=True,  # Output must not exist yet.
+            update_var_mapping=True,
         )
 
         # Find the subtranslator

From 75ee7412c32d3e432aa7d3457fa7bf2af75d3ee4 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 21 May 2024 07:53:37 +0200
Subject: [PATCH 198/458] Added more tests.

---
 tests/test_jaxpr_translator_driver.py | 167 +++++++++++++++++++++++++-
 1 file changed, 166 insertions(+), 1 deletion(-)

diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 1789dcd..9fe4a4f 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -12,6 +12,7 @@
 import re
 
 import dace
+import numpy as np
 import pytest
 from dace.data import Array
 
@@ -333,10 +334,174 @@ def test_driver_variable_invalid_prefix(
         assert len(translation_driver.sdfg.arrays) == 0
 
 
+def test_driver_variable_alloc_list(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Tests part of the `JaxprTranslationDriver::create_jax_var_list()` api."""
+    var_list_1 = [array1, nscal, scal2]
+    exp_names_1 = ["a", nscal.name, "c"]
+
+    res_names_1 = translation_driver.create_jax_var_list(
+        var_list_1,
+        update_var_mapping=True,
+    )
+    assert len(translation_driver.arrays) == 3
+    assert res_names_1 == exp_names_1
+
+    # Now a mixture of the collection and creation.
+    var_list_2 = [array2, nscal, scal1]
+    exp_names_2 = ["d", nscal.name, "e"]
+
+    res_names_2 = translation_driver.create_jax_var_list(
+        var_list_2,
+        update_var_mapping=True,
+    )
+    assert res_names_2 == exp_names_2
+    assert len(translation_driver.arrays) == 5
+
+
+@pytest.mark.skip(reason="'create_jax_var_list()' does not clean up in case of an error.")
+def test_driver_variable_alloc_list_cleaning(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Tests part of the `JaxprTranslationDriver::create_jax_var_list()` api.
+
+    It will fail because `update_var_mapping=False` thus the third variable will
+    cause an error because it is proposed to `a`, which is already used.
+    """
+    var_list = [array1, nscal, scal2]
+    exp_names = ["a", nscal.name, "c"]
+
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=re.escape(f"add_array({scal2}): The proposed name 'a', is used."),
+    ):
+        res_names = translation_driver.create_jax_var_list(var_list)
+
+    # This currently fails, because the `create_jax_var_list()` function does not clean up.
+    assert len(translation_driver.arrays) == 0
+
+
+def test_driver_variable_alloc_list_prevent_creation(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Tests part of the `JaxprTranslationDriver::create_jax_var_list()` api.
+
+    It will test the `prevent_creation` flag.
+    """
+    # First create a variable.
+    translation_driver.add_array(array1, update_var_mapping=True)
+    assert len(translation_driver.arrays) == 1
+
+    # Now create the variables
+    var_list = [array1, array2]
+
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=re.escape(f"'prevent_creation' given but have to create '{array2}'."),
+    ):
+        translation_driver.create_jax_var_list(
+            var_list,
+            prevent_creation=True,
+        )
+    assert len(translation_driver.arrays) == 1
+    assert translation_driver.map_jax_var_to_sdfg(array1) == "a"
+
+
+@pytest.mark.skip(reason="'create_jax_var_list()' does not clean up in case of an error.")
+def test_driver_variable_alloc_list_only_creation(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Tests part of the `JaxprTranslationDriver::create_jax_var_list()` api.
+
+    It will test the `only_creation` flag.
+    """
+    # First create a variable.
+    translation_driver.add_array(array1, update_var_mapping=True)
+    assert len(translation_driver.arrays) == 1
+
+    # Now create the variables
+    var_list = [array2, array1]
+
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=re.escape(f"'only_creation' given '{array1}' already exists."),
+    ):
+        translation_driver.create_jax_var_list(
+            var_list,
+            only_creation=True,
+        )
+    assert len(translation_driver.arrays) == 1
+    assert translation_driver.map_jax_var_to_sdfg(array1) == "a"
+
+
+def test_driver_variable_alloc_list_handle_literal(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Tests part of the `JaxprTranslationDriver::create_jax_var_list()` api.
+
+    It will test the `handle_literals` flag.
+    """
+    # First we have to build a jax literal.
+    import numpy as np
+    from jax import core as jcore
+
+    val = np.array(1)
+    aval = jcore.get_aval(val)
+    lit = jcore.Literal(val, aval)
+    var_list = [lit]
+
+    with pytest.raises(
+        expected_exception=ValueError,
+        match=re.escape("Encountered a literal but `handle_literals` was `False`."),
+    ):
+        translation_driver.create_jax_var_list(
+            var_list,
+            handle_literals=False,
+        )
+    assert len(translation_driver.arrays) == 0
+
+    name_list = translation_driver.create_jax_var_list(
+        var_list,
+        handle_literals=True,
+    )
+    assert len(translation_driver.arrays) == 0
+    assert name_list == [None]
+
+
+def test_driver_constants(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Tests part of the `JaxprTranslationDriver::_create_constants()` api.
+
+    See also the `test_subtranslators_alu.py::test_add3` test.
+    """
+    import jax
+
+    # Create the Jaxpr that we need.
+    constant = [[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]]
+    jaxpr = jax.make_jaxpr(lambda A: A + jax.numpy.array(constant))(1.0)
+
+    # We have to manually allocate the driver context.
+    #  You should not do that.
+    translation_driver._allocate_translation_ctx(name="Manual_test")
+
+    # No create the constants.
+    translation_driver._create_constants(jaxpr)
+
+    # Test if it was created with the correct value.
+    assert len(translation_driver.arrays) == 1
+    assert len(translation_driver._jax_name_map) == 1
+    assert next(iter(translation_driver._jax_name_map.values())) == "__const_a"
+    assert len(translation_driver.sdfg.constants) == 1
+    assert np.all(translation_driver.sdfg.constants["__const_a"] == constant)
+
+
 def test_driver_jace_var() -> None:
     """Simple tests about the `JaCeVar` objects."""
     for iname in ["do", "", "_ _", "9al", "_!"]:
         with pytest.raises(
-            expected_exception=ValueError, match=re.escape(f"Supplied the invalid name '{iname}'.")
+            expected_exception=ValueError,
+            match=re.escape(f"Supplied the invalid name '{iname}'."),
         ):
             _ = JaCeVar((), dace.int8, name=iname)

From 067f55fa0bc7ee1c600fdcc4e8b4d7106722cf0c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 21 May 2024 07:59:51 +0200
Subject: [PATCH 199/458] Made it clear that the "all Array" SDFG is only a
 temporary solution.

---
 src/jace/translator/jaxpr_translator_driver.py | 14 +++++++++++---
 1 file changed, 11 insertions(+), 3 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index df0932a..211a19a 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -31,7 +31,6 @@ class JaxprTranslationDriver:
     - all variable names are derived from Jax names,
     - there are only transient variables inside the SDFG,
     - It lacks the special `__return` variable,
-    - all variables that Jax considers a scalar are in fact arrays with shape `(1,)`.
     - the `arg_names` parameter is not set.
 
     For these reasons the SDFG is not directly usable, and further manipulations have to be performed.
@@ -55,6 +54,8 @@ class JaxprTranslationDriver:
 
     Notes:
         After the main translation has been performed the translator object can be used again.
+        Currently the driver will generate only Array as SDFG variables, however, this is a temporary solution.
+            For more on that see `add_array()`.
     """
 
     __slots__ = (
@@ -313,8 +314,7 @@ def add_array(
     ) -> str:
         """Creates an SDFG variable for the Jax variable `arg` and returns its SDFG name.
 
-        Regardless, if `arg` refers to an array or a scalar, the function will generate an array.
-        Furthermore, the created variables are always transients.
+        The SDFG object is always created as a transient.
 
         By default the function will use `jace.util.propose_jax_name()` to derive the name that should be used.
         However, by passing a `JaCeVar` with a name it is possible to suggest a specific name.
@@ -327,6 +327,14 @@ def add_array(
             arg:                The Jax object for which a SDFG equivalent should be created.
             name_prefix:        If given it will be used as prefix for the name.
             update_var_mapping: Update the internal variable mapping; by default `False`.
+
+        Notes:
+            Currently the function will always create an Array, even if the Jax variable refers to a scalar.
+                This is done to work around some difficulties with scalar return values and so on.
+                This issue should actually handled in the post processing stage, but currently it is not.
+                However, from a point of building an SDFG manually, there is no difference between a Scalar and an Array.
+                According to the dace developer, the majority of the backend, i.e. optimization pipeline, should be handle to handle it.
+                But there are some special parts that might explicitly want a scalar, it also might block certain compiler optimization.
         """
         shape: tuple[int | dace.symbol | str, ...] = util.get_jax_var_shape(arg)
         dtype: dace.typeclass = util.get_jax_var_dtype(arg)

From d178b864c64d093288ec04daf77ba3842a88de2e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 21 May 2024 09:08:15 +0200
Subject: [PATCH 200/458] Made it possible that "scalars" can be returned, in
 fact the code just returns array with shape `(1,)`.

---
 src/jace/util/compiling.py            | 24 ++++++++++++------------
 tests/test_empty_jaxpr.py             |  1 -
 tests/test_jax_api.py                 | 14 ++++++--------
 tests/test_jaxpr_translator_driver.py | 26 ++++++++++++++++++++++++++
 4 files changed, 44 insertions(+), 21 deletions(-)

diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index cf44f13..a2d9f61 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -17,6 +17,7 @@
 from typing import TYPE_CHECKING, Any
 
 import dace
+import numpy as np
 
 
 if TYPE_CHECKING:
@@ -104,29 +105,28 @@ def run_jax_sdfg(
         raise NotImplementedError("No kwargs are supported yet.")
     if len(inp_names) != len(cargs):
         raise RuntimeError("Wrong number of arguments.")
+    if len(set(inp_names).intersection(out_names)) != 0:
+        raise NotImplementedError("Using an input also for output is not yet supported.")
 
     # We need the SDFG to construct/allocate the memory for the return values.
-    #  Actually, we would only need the descriptors, but this is currently the only way to get them.
-    #  As far as I know the dace performs a deepcopy before compilation, thus it should be safe.
-    #  However, regardless of this this also works if we are inside the stages, which have exclusive ownership.
     sdfg: dace.SDFG = csdfg.sdfg
 
     # Build the argument list that we will pass to the compiled object.
     call_args: dict[str, Any] = {}
     for in_name, in_val in zip(inp_names, cargs, strict=True):
-        assert (  # noqa: PT018  # Assertion must be one line
-            util.is_array(in_val) and in_val.flags["C_CONTIGUOUS"]
-        )  # Currently the only stride we support.
+        assert (not util.is_array(in_val)) or in_val.flags["C_CONTIGUOUS"]
+        if util.is_scalar(in_val):
+            # Currently the translator makes scalar into arrays, this has to be reflected here
+            in_val = np.array([in_val])
         call_args[in_name] = in_val
+
     for out_name in out_names:
         assert not ((out_name == "__return") or (out_name.startswith("__return_")))  # noqa: PT018 # Assert split
 
-        if out_name in call_args:  # Donated arguments
-            assert out_name in inp_names
-            assert not util.is_jax_array(
-                call_args[out_name]
-            )  # This violates one of Jax internal assumptions.
-            continue
+        if out_name in call_args:
+            # This is just a reminder, to not mess with Jax internals!
+            assert not util.is_jax_array(call_args[out_name])
+            raise NotImplementedError
 
         sarray: Data = sdfg.arrays[out_name]
         if isinstance(sarray, Scalar):
diff --git a/tests/test_empty_jaxpr.py b/tests/test_empty_jaxpr.py
index e2c63a1..cf5820a 100644
--- a/tests/test_empty_jaxpr.py
+++ b/tests/test_empty_jaxpr.py
@@ -29,7 +29,6 @@ def testee(A: np.ndarray) -> np.ndarray:
     assert np.all(testee(A) == A)
 
 
-@pytest.mark.skip(reason="Scalar return values are not handled.")
 def test_empty_scalar():
     jax.config.update("jax_enable_x64", True)
 
diff --git a/tests/test_jax_api.py b/tests/test_jax_api.py
index d1f5c6d..ad88af1 100644
--- a/tests/test_jax_api.py
+++ b/tests/test_jax_api.py
@@ -45,7 +45,6 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
 
 
-@pytest.mark.skip(reason="Scalar return values are not handled.")
 def test_composition_itself():
     """Tests if Jace is composable with itself."""
     jax.config.update("jax_enable_x64", True)
@@ -143,7 +142,6 @@ def f3_jace(A, B, C, D):
     assert np.allclose(ref, res_jace), "JaCe Failed."
 
 
-@pytest.mark.skip(reason="Scalar return values are not handled.")
 def test_grad_annotation_direct():
     """Test if `jace.grad` works directly."""
     jax.config.update("jax_enable_x64", True)
@@ -152,20 +150,20 @@ def f(x):
         return jnp.sin(jnp.exp(jnp.cos(x**2)))
 
     @jax.grad
-    def jax_df(x):
-        return f(x)
+    def jax_ddf(x):
+        return jax.grad(f)(x)
 
     @jax.jit
-    def jace_df(x):
-        return jace.grad(f)(x)
+    def jace_ddf(x):
+        return jace.grad(jace.grad(f))(x)
 
     # These are the random numbers where we test
     Xs = (np.random.random(10) - 0.5) * 10  # noqa: NPY002  # Random number generator
 
     for i in range(Xs.shape[0]):
         x = Xs[i]
-        res = jace_df(x)
-        ref = jax_df(x)
+        res = jace_ddf(x)
+        ref = jax_ddf(x)
         assert np.allclose(res, ref)
 
 
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 9fe4a4f..59adf82 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -12,10 +12,12 @@
 import re
 
 import dace
+import jax
 import numpy as np
 import pytest
 from dace.data import Array
 
+import jace
 from jace import translator, util
 from jace.util import JaCeVar
 
@@ -497,6 +499,30 @@ def test_driver_constants(
     assert np.all(translation_driver.sdfg.constants["__const_a"] == constant)
 
 
+def test_driver_scalar_return_value(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Tests if scalars can be returned directly"""
+    jax.config.update("jax_enable_x64", True)
+
+    def scalar_ops(A: float) -> float:
+        return A + A - A * A
+
+    lower_cnt = [0]
+
+    @jace.jit
+    def wrapped(A: float) -> float:
+        lower_cnt[0] += 1
+        return scalar_ops(A)
+
+    vals = np.random.random(100)  # noqa: NPY002
+    for i in range(vals.size):
+        res = wrapped(vals[i])
+        ref = scalar_ops(vals[i])
+        assert np.allclose(res, ref)
+    assert lower_cnt[0] == 1
+
+
 def test_driver_jace_var() -> None:
     """Simple tests about the `JaCeVar` objects."""
     for iname in ["do", "", "_ _", "9al", "_!"]:

From 897a361ce3b00f979fc4b9d9c62fd48af639b700 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 21 May 2024 10:38:31 +0200
Subject: [PATCH 201/458] Fixed some typing errors in the jax API.

---
 src/jace/jax/api.py    | 32 +++++++++++++++++++++++++-------
 src/jace/jax/stages.py | 22 ++++++++++++++++------
 2 files changed, 41 insertions(+), 13 deletions(-)

diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
index e47a8d7..7dc27f5 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/jax/api.py
@@ -11,7 +11,7 @@
 
 import functools as ft
 from collections.abc import Callable, Mapping
-from typing import TYPE_CHECKING, Any
+from typing import TYPE_CHECKING, Any, Literal, overload
 
 import jax as _jax_jax
 
@@ -19,7 +19,25 @@
 
 
 if TYPE_CHECKING:
-    from jace import jax as jjax
+    from jace.jax import stages
+
+
+@overload
+def jit(
+    fun: Literal[None] = None,
+    /,
+    sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable] | None = None,
+    **kwargs: Any,
+) -> Callable[..., stages.JaceWrapped]: ...
+
+
+@overload
+def jit(
+    fun: Callable,
+    /,
+    sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable] | None = None,
+    **kwargs: Any,
+) -> stages.JaceWrapped: ...
 
 
 def jit(
@@ -27,7 +45,7 @@ def jit(
     /,
     sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable] | None = None,
     **kwargs: Any,
-) -> jjax.JaceWrapped | Callable:
+) -> stages.JaceWrapped | Callable[..., stages.JaceWrapped]:
     """Jace's replacement for `jax.jit` (just-in-time) wrapper.
 
     It works the same way as `jax.jit` does, but instead of using XLA the computation is lowered to DaCe.
@@ -47,10 +65,10 @@ def jit(
             f"The following arguments of 'jax.jit' are not yet supported by jace: {', '.join(kwargs.keys())}."
         )
 
-    def wrapper(f: Callable) -> jjax.JaceWrapped:
-        from jace import jax as jjax  # Cyclic import
+    def wrapper(f: Callable) -> stages.JaceWrapped:
+        from jace import jax as stages  # Cyclic import
 
-        jace_wrapper = jjax.JaceWrapped(
+        jace_wrapper = stages.JaceWrapped(
             fun=f,
             sub_translators=(
                 translator.managing._PRIMITIVE_TRANSLATORS_DICT
@@ -68,7 +86,7 @@ def vmap(
     fun: Callable,
     /,
     **kwargs: Any,
-) -> jjax.JaceWrapped:
+) -> stages.JaceWrapped:
     """Jace wrapper around `jax.vmap`.
 
     Notes:
diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
index 32f020c..ce0ef48 100644
--- a/src/jace/jax/stages.py
+++ b/src/jace/jax/stages.py
@@ -25,11 +25,10 @@
 
 import copy
 from collections.abc import Callable, Mapping, Sequence
-from typing import Any, Final
+from typing import Any, Final, TypeAlias
 
 import dace
 import jax as jax_jax
-from jax.stages import CompilerOptions
 
 from jace import optimization, translator, util
 from jace.jax import translation_cache as tcache
@@ -47,6 +46,11 @@ class Stage:
     """
 
 
+"""Map type to pass compiler options to `JaceLowered.compile()`.
+"""
+CompilerOptions: TypeAlias = dict[str, tuple[bool, str]]
+
+
 class JaceWrapped(Stage):
     """A function ready to be specialized, lowered, and compiled.
 
@@ -62,14 +66,14 @@ class JaceWrapped(Stage):
     """
 
     _fun: Callable
-    _sub_translators: Mapping[str, translator.PrimitiveTranslator]
+    _sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable]
     _jit_ops: Mapping[str, Any]
     _cache: tcache.TranslationCache
 
     def __init__(
         self,
         fun: Callable,
-        sub_translators: Mapping[str, translator.PrimitiveTranslator],
+        sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable],
         jit_ops: Mapping[str, Any],
     ) -> None:
         """Creates a wrapped jace jitable object of `jax_prim`.
@@ -125,12 +129,18 @@ def lower(
         Performs the first two steps of the AOT steps described above,
         i.e. transformation into Jaxpr and then to SDFG.
         The result is encapsulated into a `Lowered` object.
-        """
-        # TODO(phimuell): Handle pytrees
 
+        Todo:
+            - Handle pytrees.
+        """
         if len(kwargs) != 0:
             raise NotImplementedError("Currently only positional arguments are supported.")
 
+        # Currently we do not allow memory order beside `C_CONTIGUOUS`.
+        #  This is the best place to check for it.
+        if not all((not util.is_array(arg)) or arg.flags["C_CONTIGUOUS"] for arg in args):
+            raise NotImplementedError("Currently can not handle strides beside 'C_CONTIGUOUS'.")
+
         jaxpr = jax_jax.make_jaxpr(self._fun)(*args)
         driver = translator.JaxprTranslationDriver(sub_translators=self._sub_translators)
         trans_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)

From eb15d49d251824ee2d149a87be061251b598e0e4 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 21 May 2024 10:42:48 +0200
Subject: [PATCH 202/458] Moved some code around and also forbid that non C
 strides can be used.

---
 src/jace/translator/post_translation.py | 18 +++----
 src/jace/util/compiling.py              | 68 ++++++++++---------------
 tests/test_caching.py                   | 38 ++++++++++++++
 tests/test_jaxpr_translator_driver.py   | 23 +++++++++
 4 files changed, 95 insertions(+), 52 deletions(-)

diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index 4334e23..fc28160 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -43,7 +43,14 @@ def postprocess_jaxpr_sdfg(
 def finalize_jaxpr_sdfg(
     tsdfg: translator.TranslatedJaxprSDFG,
 ) -> None:
-    """Finalizes the supplied `tsdfg` object in place."""
+    """Finalizes the supplied `tsdfg` object in place.
+
+    This function will turn a non finalized, i.e. canonical, SDFG into a finalized one,
+    i.e. after this function `tsdfg.is_finalized` is `True`.
+    Thus the function will:
+    - Mark all input and output variables, i.e. listed in `tsdfg.{inp, out}_names`, as globals.
+    - Deallocate all members of `tsdfg` that are no longer needed.
+    """
     if tsdfg.is_finalized:
         raise ValueError("The supplied SDFG is already finalized.")
     if not tsdfg.inp_names:
@@ -51,15 +58,6 @@ def finalize_jaxpr_sdfg(
     if not tsdfg.out_names:
         raise ValueError("Output names are not specified.")
 
-    # We do not support the return value mechanism that dace provides us.
-    #  The reasons for that are that the return values are always shared and the working with pytrees is not yet understood.
-    #  Thus we make the safe choice by passing all as arguments.
-    if any(
-        arrname.startswith("__return")
-        for arrname in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
-    ):
-        raise ValueError("Only support SDFGs without '__return' members.")
-
     # Canonical SDFGs do not have global memory, so we must transform it
     sdfg_arg_names: list[str] = []
     for glob_name in tsdfg.inp_names + tsdfg.out_names:
diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index a2d9f61..31afd59 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -18,6 +18,7 @@
 
 import dace
 import numpy as np
+from dace import data as ddata
 
 
 if TYPE_CHECKING:
@@ -30,22 +31,15 @@ def compile_jax_sdfg(
 ) -> jdace.CompiledSDFG:
     """This function compiles the SDFG embedded in the embedded `tsdfg` (`TranslatedJaxprSDFG`).
 
-    Notes:
-        Currently the SDFG must not have any undefined symbols, i.e. no undefined sizes.
+    For executing the SDFG, the `run_jax_sdfg()` function, together with the `tsdfg.{inp, out}_names` can be used.
     """
     if not tsdfg.is_finalized:
         raise ValueError("Can only compile a finalized SDFG.")
-    if not tsdfg.inp_names:
-        raise ValueError("The passed SDFG did not had any input arguments.")
-    if not tsdfg.out_names:
-        raise ValueError("The passed SDFG did not had any output arguments.")
-
-    # This is a simplification that makes our life simply.
-    #  However, we should consider lifting it at some point.
-    if len(tsdfg.sdfg.free_symbols) != 0:
-        raise NotImplementedError(
-            f"No externally defined symbols are allowed, found: {tsdfg.sdfg.free_symbols}"
-        )
+    if any(  # We do not support the DaCe return mechanism
+        arrname.startswith("__return")
+        for arrname in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
+    ):
+        raise ValueError("Only support SDFGs without '__return' members.")
 
     # To ensure that the SDFG is compiled and to get rid of a warning we must modify
     #  some settings of the SDFG. To fake an immutable SDFG, we will restore them later.
@@ -95,53 +89,43 @@ def run_jax_sdfg(
     Notes:
         There is no pytree mechanism jet, thus the return values are returned inside a `tuple`
             or in case of one value, directly, in the order determined by Jax.
-        Currently, this function does not consider strides in the input.
+        Currently, this function does not consider strides in the input,
+            all input must be `C_CONTIGUOUS`.
+        Currently the SDFG must not have any undefined symbols, i.e. no undefined sizes.
     """
-    from dace.data import Array, Data, Scalar, make_array_from_descriptor
-
     from jace import util
 
+    sdfg: dace.SDFG = csdfg.sdfg
+
     if len(ckwargs) != 0:
         raise NotImplementedError("No kwargs are supported yet.")
     if len(inp_names) != len(cargs):
         raise RuntimeError("Wrong number of arguments.")
     if len(set(inp_names).intersection(out_names)) != 0:
         raise NotImplementedError("Using an input also for output is not yet supported.")
-
-    # We need the SDFG to construct/allocate the memory for the return values.
-    sdfg: dace.SDFG = csdfg.sdfg
+    if len(sdfg.free_symbols) != 0:  # This is a simplification that makes our life simple.
+        raise NotImplementedError(
+            f"No externally defined symbols are allowed, found: {sdfg.free_symbols}"
+        )
 
     # Build the argument list that we will pass to the compiled object.
     call_args: dict[str, Any] = {}
     for in_name, in_val in zip(inp_names, cargs, strict=True):
-        assert (not util.is_array(in_val)) or in_val.flags["C_CONTIGUOUS"]
         if util.is_scalar(in_val):
             # Currently the translator makes scalar into arrays, this has to be reflected here
             in_val = np.array([in_val])
         call_args[in_name] = in_val
 
-    for out_name in out_names:
-        assert not ((out_name == "__return") or (out_name.startswith("__return_")))  # noqa: PT018 # Assert split
-
-        if out_name in call_args:
-            # This is just a reminder, to not mess with Jax internals!
-            assert not util.is_jax_array(call_args[out_name])
-            raise NotImplementedError
-
-        sarray: Data = sdfg.arrays[out_name]
-        if isinstance(sarray, Scalar):
-            raise NotImplementedError("Scalars as return values are not supported.")
-        if isinstance(sarray, Array):
-            call_args[out_name] = make_array_from_descriptor(sarray)
-        else:
-            raise NotImplementedError(f"Can not handle '{type(sarray).__name__}' as output.")
-
-    if len(call_args) != len(csdfg.argnames):
-        raise ValueError(
-            "Failed to construct the call arguments,"
-            f" expected {len(csdfg.argnames)} but got {len(call_args)}."
-            f"\nExpected: {csdfg.argnames}\nGot: {list(call_args.keys())}"
-        )
+    for out_name, sarray in ((name, sdfg.arrays[name]) for name in out_names):
+        assert not (out_name in call_args and util.is_jax_array(call_args[out_name]))
+        assert isinstance(sarray, ddata.Array)
+        call_args[out_name] = ddata.make_array_from_descriptor(sarray)
+
+    assert len(call_args) == len(csdfg.argnames), (
+        "Failed to construct the call arguments,"
+        f" expected {len(csdfg.argnames)} but got {len(call_args)}."
+        f"\nExpected: {csdfg.argnames}\nGot: {list(call_args.keys())}"
+    )
 
     # Calling the SDFG
     with dace.config.temporary_config():
diff --git a/tests/test_caching.py b/tests/test_caching.py
index 0703f3e..6e1b304 100644
--- a/tests/test_caching.py
+++ b/tests/test_caching.py
@@ -11,6 +11,7 @@
 from __future__ import annotations
 
 import itertools as it
+import re
 
 import jax
 import numpy as np
@@ -187,3 +188,40 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     #  If there is sharing, then this would not be the case.
     assert optiCompiled._csdfg.sdfg.number_of_nodes() == 1
     assert optiCompiled._csdfg.sdfg.number_of_nodes() < unoptiCompiled._csdfg.sdfg.number_of_nodes()
+
+
+def test_caching_strides() -> None:
+    """Test if the cache detects a change in strides."""
+    jax.config.update("jax_enable_x64", True)
+
+    @jace.jit
+    def wrapped(A: np.ndarray) -> np.ndarray:
+        return A + 10.0
+
+    shape = (10, 100, 1000)
+    C = np.array(
+        (np.random.random(shape) - 0.5) * 10,  # noqa: NPY002
+        order="C",
+        dtype=np.float64,
+    )
+    F = np.array(C, copy=True, order="F")
+
+    # First we compile run it with C strides.
+    C_lower = wrapped.lower(C)
+    C_res = wrapped(C)
+
+    # Now we run it with FORTRAN strides.
+    #  However, this does not work because we do not support strides at all.
+    #  But the cache is aware of this, which helps catch some nasty bugs.
+    F_lower = None  # Remove later
+    F_res = C_res.copy()  # Remove later
+    with pytest.raises(  # noqa: PT012 # Multiple calls
+        expected_exception=NotImplementedError,
+        match=re.escape("Currently can not handle strides beside 'C_CONTIGUOUS'."),
+    ):
+        F_lower = wrapped.lower(F)
+        F_res = wrapped(F)
+    assert F_lower is None  # Remove later.
+    assert C_res is not F_res  # Remove later
+    assert np.allclose(F_res, C_res)
+    assert F_lower is not C_lower
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 59adf82..c51e01f 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -531,3 +531,26 @@ def test_driver_jace_var() -> None:
             match=re.escape(f"Supplied the invalid name '{iname}'."),
         ):
             _ = JaCeVar((), dace.int8, name=iname)
+
+
+def test_driver_F_strides(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Tests if we can lower without a standard stride.
+
+    Notes:
+        This tests if the restriction is currently in place.
+        See also `tests/test_caching.py::test_caching_strides`.
+    """
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A + 10.0
+
+    F = np.full((4, 3), 10, dtype=np.float64, order="F")
+
+    with pytest.raises(
+        expected_exception=NotImplementedError,
+        match=re.escape("Currently can not handle strides beside 'C_CONTIGUOUS'."),
+    ):
+        _ = testee(F)

From c05bbc6ecc04394127b2cf7feb0dbdae474d8083 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 21 May 2024 11:24:35 +0200
Subject: [PATCH 203/458] Made some changes regarding the `x64` feature of Jax.

The solution is not great.
It is now globally at import time enabled.
The driver still generates an error if it encounters that.
I also added a test for explicitly checking that it does not work.

I also updated all the tests.
---
 src/jace/__init__.py                          | 11 ++++++
 .../translator/jaxpr_translator_driver.py     | 10 ++++--
 tests/test_caching.py                         |  6 ----
 tests/test_decorator.py                       |  3 --
 tests/test_empty_jaxpr.py                     |  6 ----
 tests/test_jax_api.py                         | 34 ++++++++++++++++---
 tests/test_jaxpr_translator_driver.py         |  2 --
 tests/test_sub_translators_alu.py             |  3 --
 tests/test_subtranslator_helper.py            |  3 --
 9 files changed, 47 insertions(+), 31 deletions(-)

diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 294d357..47f74ed 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -9,12 +9,21 @@
 
 from __future__ import annotations
 
+import jax as _jax
+
 import jace.translator.primitive_translators  # noqa: F401  # needed to poulate the internal list of translators.
 
 from .__about__ import __author__, __copyright__, __license__, __version__, __version_info__
 from .jax import grad, jacfwd, jacrev, jit
 
 
+# In Jax `float32` is the main datatype, and they go to great lengths to avoid
+#  some aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
+#  However, in this case we will have problems when we call the SDFG, for some reasons
+#  `CompiledSDFG` does not work in that case correctly, thus we enable it now globally.
+_jax.config.update("jax_enable_x64", True)
+
+
 __all__ = [
     "__author__",
     "__copyright__",
@@ -26,3 +35,5 @@
     "__version__",
     "__version_info__",
 ]
+
+del _jax
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 211a19a..ab7d905 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -11,7 +11,6 @@
 from typing import TYPE_CHECKING, Any, Literal, cast, overload
 
 import dace
-import jax
 from dace import data as ddata, properties as dprop
 from jax import core as jax_core
 
@@ -115,10 +114,15 @@ def translate_jaxpr(
         Args:
             name:                   Use this name for the SDFG instead some generated one.
         """
+        import jax as _jax
+
         if len(jaxpr.effects) != 0:
             raise NotImplementedError("'Jaxpr' with side effects are not supported.")
-        if not jax.config.read("jax_enable_x64"):
-            raise NotImplementedError("The translation only works if 'jax_enable_x64' is enabled.")
+        if not _jax.config.read("jax_enable_x64"):
+            raise NotImplementedError(
+                "You have disabled 'x64' support in Jax, which interferes with the calling of the SDFG. "
+                "SDFG generated in this way will fail to call."
+            )
 
         # NOTE: If `self` is already allocated, i.e. has an ongoing translation process,
         #       the `_allocate_translation_ctx()` function will start a new context.
diff --git a/tests/test_caching.py b/tests/test_caching.py
index 6e1b304..ea31153 100644
--- a/tests/test_caching.py
+++ b/tests/test_caching.py
@@ -13,7 +13,6 @@
 import itertools as it
 import re
 
-import jax
 import numpy as np
 import pytest
 
@@ -39,7 +38,6 @@ def _clear_translation_cache():
 
 def test_caching_same_sizes():
     """The behaviour of the cache if same sizes are used."""
-    jax.config.update("jax_enable_x64", True)
 
     # Counter for how many time it was lowered.
     lowering_cnt = [0]
@@ -83,7 +81,6 @@ def wrapped(A, B):
 
 def test_caching_different_sizes():
     """The behaviour of the cache if different sizes where used."""
-    jax.config.update("jax_enable_x64", True)
 
     # Counter for how many time it was lowered.
     lowering_cnt = [0]
@@ -122,7 +119,6 @@ def test_caching_different_structure():
     Todo:
         - Extend with strides once they are part of the cache.
     """
-    jax.config.update("jax_enable_x64", True)
 
     # This is the wrapped function.
     lowering_cnt = [0]
@@ -159,7 +155,6 @@ def wrapped(A, B):
 
 def test_caching_compilation():
     """Tests the compilation cache, this is just very simple, since it uses the same code paths as lowering."""
-    jax.config.update("jax_enable_x64", True)
 
     @jace.jit
     def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
@@ -192,7 +187,6 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 
 def test_caching_strides() -> None:
     """Test if the cache detects a change in strides."""
-    jax.config.update("jax_enable_x64", True)
 
     @jace.jit
     def wrapped(A: np.ndarray) -> np.ndarray:
diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index b83320a..cf1ffaf 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -12,7 +12,6 @@
 
 from __future__ import annotations
 
-import jax
 import numpy as np
 import pytest
 
@@ -37,7 +36,6 @@ def _clear_translation_cache():
 
 def test_decorator_individually():
     """Tests the compilation steps individually."""
-    jax.config.update("jax_enable_x64", True)
 
     def testee_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
@@ -64,7 +62,6 @@ def testee(A, B):
 
 def test_decorator_one_go():
     """Tests the compilation steps in one go."""
-    jax.config.update("jax_enable_x64", True)
 
     def testee_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
diff --git a/tests/test_empty_jaxpr.py b/tests/test_empty_jaxpr.py
index cf5820a..36e8247 100644
--- a/tests/test_empty_jaxpr.py
+++ b/tests/test_empty_jaxpr.py
@@ -18,8 +18,6 @@
 
 
 def test_empty_array():
-    jax.config.update("jax_enable_x64", True)
-
     @jace.jit
     def testee(A: np.ndarray) -> np.ndarray:
         return A
@@ -30,8 +28,6 @@ def testee(A: np.ndarray) -> np.ndarray:
 
 
 def test_empty_scalar():
-    jax.config.update("jax_enable_x64", True)
-
     @jace.jit
     def testee(A: float) -> float:
         return A
@@ -43,8 +39,6 @@ def testee(A: float) -> float:
 
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_empty_nested():
-    jax.config.update("jax_enable_x64", True)
-
     @jace.jit
     def testee3(A: float) -> float:
         return jax.jit(lambda A: A)(A)
diff --git a/tests/test_jax_api.py b/tests/test_jax_api.py
index ad88af1..221733a 100644
--- a/tests/test_jax_api.py
+++ b/tests/test_jax_api.py
@@ -23,7 +23,6 @@
 
 def test_jit():
     """Simple add function."""
-    jax.config.update("jax_enable_x64", True)
 
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
@@ -47,7 +46,6 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 
 def test_composition_itself():
     """Tests if Jace is composable with itself."""
-    jax.config.update("jax_enable_x64", True)
 
     # Pure Python functions
     def f_ref(x):
@@ -86,7 +84,6 @@ def ddf(x):
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_composition_with_jax():
     """Tests if Jace can interact with Jax and vice versa."""
-    jax.config.update("jax_enable_x64", True)
 
     def base_fun(A, B, C):
         return A + B * jnp.sin(C) - A * B
@@ -144,7 +141,6 @@ def f3_jace(A, B, C, D):
 
 def test_grad_annotation_direct():
     """Test if `jace.grad` works directly."""
-    jax.config.update("jax_enable_x64", True)
 
     def f(x):
         return jnp.sin(jnp.exp(jnp.cos(x**2)))
@@ -172,7 +168,6 @@ def test_grad_control_flow():
 
     This requirement is mentioned in `https://jax.readthedocs.io/en/latest/notebooks/Common_Gotchas_in_JAX.html#python-control-flow-autodiff`.
     """
-    jax.config.update("jax_enable_x64", True)
 
     @jace.grad
     def df(x):
@@ -190,3 +185,32 @@ def df(x):
 
     assert df(x1) == df_x1, f"Failed lower branch, expected '{df_x1}', got '{res_1}'."
     assert df(x2) == df_x2, f"Failed upper branch, expected '{df_x2}', got '{res_2}'."
+
+
+@pytest.mark.skip(reason="Running Jace with disabled 'x64' support does not work.")
+def test_disabled_x64():
+    """Tests the behaviour of the tool chain if we explicitly disable x64 support in Jax.
+
+    If you want to test, if this restriction still applies, you can enable the test.
+    """
+    from jax.experimental import disable_x64
+
+    def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
+        return A + B
+
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.float64(10.0)
+
+    # Run them with disabled x64 support
+    with disable_x64():
+        # Jace
+        jace_testee = jace.jit(testee)
+        jace_lowered = jace_testee.lower(A, B)
+        jace_comp = jace_lowered.compile()
+        res = jace_comp(A, B)
+
+        # Jax
+        jax_testee = jax.jit(testee)
+        ref = jax_testee(A, B)
+
+    assert np.allclose(ref, res), "Expected that: {ref.tolist()}, but got {res.tolist()}."
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index c51e01f..5a0aaee 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -12,7 +12,6 @@
 import re
 
 import dace
-import jax
 import numpy as np
 import pytest
 from dace.data import Array
@@ -503,7 +502,6 @@ def test_driver_scalar_return_value(
     translation_driver: translator.JaxprTranslationDriver,
 ) -> None:
     """Tests if scalars can be returned directly"""
-    jax.config.update("jax_enable_x64", True)
 
     def scalar_ops(A: float) -> float:
         return A + A - A * A
diff --git a/tests/test_sub_translators_alu.py b/tests/test_sub_translators_alu.py
index 1853f92..45a5548 100644
--- a/tests/test_sub_translators_alu.py
+++ b/tests/test_sub_translators_alu.py
@@ -17,7 +17,6 @@
 
 def test_add():
     """Simple add function."""
-    jax.config.update("jax_enable_x64", True)
 
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
@@ -33,7 +32,6 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 
 def test_add2():
     """Simple add function, with literal."""
-    jax.config.update("jax_enable_x64", True)
 
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         c = A + 0.01
@@ -53,7 +51,6 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 
 def test_add3():
     """Simple add function, with constant."""
-    jax.config.update("jax_enable_x64", True)
 
     def testee(A: np.ndarray) -> np.ndarray:
         return A + jax.numpy.array([[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]])
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 316d342..8046e88 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -12,7 +12,6 @@
 import re
 from typing import Any
 
-import jax
 import numpy as np
 import pytest
 
@@ -156,7 +155,6 @@ def useless_add_translator(*args: Any, **kwargs: Any) -> None:
 
 def test_subtranslatior_managing_overwriting_2(no_builtin_translators):
     """Again an overwriting test, but this time a bit more complicated."""
-    jax.config.update("jax_enable_x64", True)
 
     trans_cnt = [0]
 
@@ -181,7 +179,6 @@ def test_subtranslatior_managing_decoupling():
 
     I.e. changes to the global state, does not affect already annotated functions.
     """
-    jax.config.update("jax_enable_x64", True)
 
     @jace.jit
     def foo(A):

From 74bdcafc79f33ae1cc6d2eb8eba5b6b45eecc38c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 21 May 2024 12:31:40 +0200
Subject: [PATCH 204/458] Renamed the `post_translation` to the
 `pre_post_translation`, since it is still so small.

---
 src/jace/jax/stages.py                                        | 4 ++--
 src/jace/translator/jaxpr_translator_driver.py                | 2 +-
 .../{post_translation.py => pre_post_translation.py}          | 0
 3 files changed, 3 insertions(+), 3 deletions(-)
 rename src/jace/translator/{post_translation.py => pre_post_translation.py} (100%)

diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
index ce0ef48..cb27165 100644
--- a/src/jace/jax/stages.py
+++ b/src/jace/jax/stages.py
@@ -32,7 +32,7 @@
 
 from jace import optimization, translator, util
 from jace.jax import translation_cache as tcache
-from jace.translator import post_translation as ptrans
+from jace.translator import pre_post_translation as pptrans
 from jace.util import dace_helper as jdace
 
 
@@ -144,7 +144,7 @@ def lower(
         jaxpr = jax_jax.make_jaxpr(self._fun)(*args)
         driver = translator.JaxprTranslationDriver(sub_translators=self._sub_translators)
         trans_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
-        ptrans.postprocess_jaxpr_sdfg(tsdfg=trans_sdfg, fun=self.wrapped_fun)
+        pptrans.postprocess_jaxpr_sdfg(tsdfg=trans_sdfg, fun=self.wrapped_fun)
         # The `JaceLowered` assumes complete ownership of `trans_sdfg`!
         return JaceLowered(trans_sdfg)
 
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index ab7d905..a70598b 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -34,7 +34,7 @@ class JaxprTranslationDriver:
 
     For these reasons the SDFG is not directly usable, and further manipulations have to be performed.
     Especially, DaCe's validation function will fail and it is unable to be processed by the optimization pipeline.
-    For more information also see `jace.translator.post_translation` module.
+    For more information also see `jace.translator.pre_post_translation` module.
 
     The idea of the translator is extremely simple.
     Since Jaxpr is a list consisting of more or less simple instructions/equations, they get processed one after the other.
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/pre_post_translation.py
similarity index 100%
rename from src/jace/translator/post_translation.py
rename to src/jace/translator/pre_post_translation.py

From 2810e93b61a247b1375d133820f7e102cccd084e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 21 May 2024 12:46:00 +0200
Subject: [PATCH 205/458] Integrated the `finalize_jaxpr_sdfg()` into the
 `postprocess_jaxpr_sdfg()` function since _currently_ only that happens.

However, as we will advance more, the finalize function will reappear as `postprocess_jaxpr_sdfg()` will start to do more.
---
 src/jace/translator/pre_post_translation.py | 15 ---------------
 1 file changed, 15 deletions(-)

diff --git a/src/jace/translator/pre_post_translation.py b/src/jace/translator/pre_post_translation.py
index fc28160..c177ebd 100644
--- a/src/jace/translator/pre_post_translation.py
+++ b/src/jace/translator/pre_post_translation.py
@@ -36,21 +36,6 @@ def postprocess_jaxpr_sdfg(
         - Setting correct input names (layer that does not depend on JAX).
         - Setting the correct strides & Storage properties.
     """
-    # Currently we do nothing except finalizing.
-    finalize_jaxpr_sdfg(tsdfg)
-
-
-def finalize_jaxpr_sdfg(
-    tsdfg: translator.TranslatedJaxprSDFG,
-) -> None:
-    """Finalizes the supplied `tsdfg` object in place.
-
-    This function will turn a non finalized, i.e. canonical, SDFG into a finalized one,
-    i.e. after this function `tsdfg.is_finalized` is `True`.
-    Thus the function will:
-    - Mark all input and output variables, i.e. listed in `tsdfg.{inp, out}_names`, as globals.
-    - Deallocate all members of `tsdfg` that are no longer needed.
-    """
     if tsdfg.is_finalized:
         raise ValueError("The supplied SDFG is already finalized.")
     if not tsdfg.inp_names:

From 1144d68ec36a09b107910853d29603ebbb7e7458 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 21 May 2024 14:54:03 +0200
Subject: [PATCH 206/458] Rewrite the ALU translators.

They are now nicer, and I have split them into a binary and unary version.
It makes just sense to do that.

I also added more tests, I think that almost all code paths are now tested.
---
 .../primitive_translators/__init__.py         |   6 +-
 .../primitive_translators/alu_translator.py   | 290 ---------------
 .../primitive_translators/alu_translators.py  | 340 ++++++++++++++++++
 tests/test_sub_translators_alu.py             | 158 ++++++--
 4 files changed, 476 insertions(+), 318 deletions(-)
 delete mode 100644 src/jace/translator/primitive_translators/alu_translator.py
 create mode 100644 src/jace/translator/primitive_translators/alu_translators.py

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 08bff9d..c01f657 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -8,9 +8,11 @@
 
 from __future__ import annotations
 
-from .alu_translator import ALUTranslator
+from .alu_translators import ALUBaseTranslator, BinaryALUTranslator, UnaryALUTranslator
 
 
 __all__ = [
-    "ALUTranslator",
+    "ALUBaseTranslator",
+    "BinaryALUTranslator",
+    "UnaryALUTranslator",
 ]
diff --git a/src/jace/translator/primitive_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
deleted file mode 100644
index 0d19973..0000000
--- a/src/jace/translator/primitive_translators/alu_translator.py
+++ /dev/null
@@ -1,290 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""This module contains the `ALUTranslator` which translates all arithmetic and logic primitives."""
-
-from __future__ import annotations
-
-from collections.abc import MutableSequence, Sequence
-from typing import Any, Final, cast
-
-import dace
-import numpy as np
-from jax import core as jax_core
-from typing_extensions import override
-
-from jace import translator
-
-
-class ALUTranslator(translator.PrimitiveTranslator):
-    """This translator handles all arithmetic and logical operations.
-
-    This translator will be reworked soon, it just exists that the initial PR can do anything at all!!
-    """
-
-    __slots__ = ("_prim_name", "_prim_tmpl")
-
-    def __init__(
-        self,
-        prim_name: str,
-        prim_tmpl: str,
-    ) -> None:
-        """Initialize the `ALUTranslator`."""
-        self._prim_name = prim_name
-        self._prim_tmpl = prim_tmpl
-
-    @property
-    @override
-    def primitive(self) -> str:
-        return self._prim_name
-
-    @override
-    def __call__(
-        self,
-        driver: translator.JaxprTranslationDriver,
-        in_var_names: Sequence[str | None],
-        out_var_names: MutableSequence[str],
-        eqn: jax_core.JaxprEqn,
-        eqn_state: dace.SDFGState,
-    ) -> None:
-        """Perform the translation.
-
-        Deepening on the shapes of the input the function will either create a Tasklet or a mapped Tasklet.
-        The translator is able to handle broadcasting with NumPy rules.
-        The function will always perform the translation inside the provided state.
-
-        Args:
-            driver:         The driver object of the translation.
-            in_var_names:   List of the names of the arrays created inside the SDFG for the inpts or 'None' in case of a literal.
-            out_var_names:  List of the names of the arrays created inside the SDFG for the outputs.
-            eqn:            The Jax equation that is translated.
-            eqn_state:      State into which the primitive's SDFG representation is constructed.
-        """
-        assert self._prim_name == eqn.primitive.name
-
-        # Determine what kind of input we got and how we should proceed.
-        is_scalar = len(eqn.outvars[0].aval.shape) == 0
-        inp_scalars = [len(Inp.aval.shape) == 0 for i, Inp in enumerate(eqn.invars)]
-        has_scalars_as_inputs = any(inp_scalars)
-        has_some_literals = any(x is None for x in in_var_names)
-        inps_same_shape = all(
-            eqn.invars[0].aval.shape == eqn.invars[i].aval.shape for i in range(1, len(eqn.invars))
-        )
-
-        # We will now look which dimensions have to be broadcasted on which operator.
-        #  I.e. in the dimensions in the lists below there will be no map iteration index.
-        dims_to_bcastl: list[int] = []
-        dims_to_bcastr: list[int] = []
-
-        # Determine if and how we have to broadcast.
-        if inps_same_shape or is_scalar:
-            pass
-
-        elif has_some_literals or has_scalars_as_inputs:
-            # This is essentially an array plus a scalar, that is eitehr a literal or a variable.
-            assert (not has_some_literals) or all(
-                invar.aval.shape == eqn.outvars[0].aval.shape
-                for (invar, x) in zip(eqn.invars, in_var_names, strict=False)
-                if x is not None
-            )
-            assert (not has_scalars_as_inputs) or all(
-                invar.aval.shape in {eqn.outvars[0].aval.shape, ()}
-                for (invar, x) in zip(eqn.invars, in_var_names, strict=False)
-                if x is not None
-            )
-
-        else:
-            # This is the general broadcasting case
-            #  We assume that both inputs and the output have the same rank but different sizes in each dimension.
-            #  It seems that Jax ensures this.
-            #  We further assume that if the size in a dimension differs then one must have size 1.
-            #  This is the size we broadcast over, i.e. conceptually replicated.
-            out_shps = tuple(eqn.outvars[0].aval.shape)  # Shape of the output
-            inp_shpl = tuple(eqn.invars[0].aval.shape)  # Shape of the left/first input
-            inp_shpr = tuple(eqn.invars[1].aval.shape)  # Shape of the right/second input
-
-            if not ((len(inp_shpl) == len(inp_shpr)) and (len(out_shps) == len(inp_shpr))):
-                raise NotImplementedError("Can not broadcast over different ranks.")
-
-            for dim, (shp_lft, shp_rgt, out_shp) in enumerate(zip(inp_shpl, inp_shpr, out_shps)):
-                if shp_lft == shp_rgt:
-                    assert out_shp == shp_lft
-                elif shp_lft == 1:
-                    assert shp_rgt == out_shp
-                    dims_to_bcastl.append(dim)
-                elif shp_rgt == 1:
-                    assert shp_lft == out_shp
-                    dims_to_bcastr.append(dim)
-                else:
-                    raise ValueError(f"Invalid shapes in dimension {dim} for broadcasting.")
-
-        # Now we create the Tasklet in which the calculation is performed.
-        tskl_code: str = self._write_tasklet_code(in_var_names, eqn)
-        tskl_name: str = eqn.primitive.name
-        tskl_map_ranges: list[tuple[str, str]] = [
-            (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
-        ]
-        tskl_output: tuple[str, dace.Memlet] = None  # type: ignore[assignment]
-        tskl_inputs: list[tuple[str, dace.Memlet] | tuple[None, None]] = []
-
-        # Generate the Memlets for the input.
-        for i, dims_to_bcast in zip(range(len(in_var_names)), [dims_to_bcastl, dims_to_bcastr]):
-            if in_var_names[i] is None:  # Literal: No input needed.
-                tskl_inputs.append((None, None))
-                continue
-            if inp_scalars[i]:  # Scalar
-                assert len(dims_to_bcast) == 0
-                i_memlet = dace.Memlet.simple(in_var_names[i], "0")
-            else:  # Array: We may have to broadcast
-                inputs_: list[str] = []
-                for dim, (map_var, _) in enumerate(tskl_map_ranges):
-                    if dim in dims_to_bcast:
-                        inputs_.append("0")
-                    else:
-                        inputs_.append(map_var)
-                i_memlet = dace.Memlet.simple(in_var_names[i], ", ".join(inputs_))
-                del inputs_
-            tskl_inputs.append((f"__in{i}", i_memlet))
-
-        # Now generate the Memlets for the output
-        if is_scalar:
-            tskl_output = ("__out0", dace.Memlet.simple(out_var_names[0], "0"))
-        else:
-            tskl_output = (
-                "__out0",
-                dace.Memlet.simple(out_var_names[0], ", ".join([X[0] for X in tskl_map_ranges])),
-            )
-
-        if is_scalar:
-            tskl_tasklet = eqn_state.add_tasklet(
-                tskl_name,
-                _list_to_dict(tskl_inputs).keys(),
-                _list_to_dict([tskl_output]).keys(),
-                tskl_code,
-            )
-            for in_var, (in_connector, in_memlet) in zip(in_var_names, tskl_inputs, strict=False):
-                if in_var is None:  # So access node for literal
-                    continue
-                eqn_state.add_edge(
-                    eqn_state.add_read(in_var),
-                    None,
-                    tskl_tasklet,
-                    in_connector,
-                    in_memlet,
-                )
-            eqn_state.add_edge(
-                tskl_tasklet,
-                tskl_output[0],
-                eqn_state.add_write(out_var_names[0]),
-                None,
-                tskl_output[1],
-            )
-        else:
-            eqn_state.add_mapped_tasklet(
-                name=tskl_name,
-                map_ranges=_list_to_dict(tskl_map_ranges),
-                inputs=_list_to_dict(tskl_inputs),
-                code=tskl_code,
-                outputs=_list_to_dict([tskl_output]),
-                external_edges=True,
-            )
-
-        return eqn_state
-
-    def _write_tasklet_code(
-        self,
-        in_var_names: Sequence[str | None],
-        eqn: jax_core.JaxprEqn,
-    ) -> str:
-        """This function generates the Tasklet code based on a primitive.
-
-        The function will also perform literal substitution and parameter handling.
-
-        Args:
-            in_var_names:   The list of SDFG variables used as input.
-        """
-
-        t_code = self._prim_tmpl
-
-        # Now we handle Literal substitution
-        for i, in_var_name in enumerate(in_var_names):
-            if in_var_name is not None:
-                continue
-
-            jax_in_var: jax_core.Literal = cast(jax_core.Literal, eqn.invars[i])
-            if jax_in_var.aval.shape == ():
-                t_val = jax_in_var.val
-                if isinstance(t_val, np.ndarray):
-                    t_val = jax_in_var.val.max()  # I do not know a better way in that case
-                t_code = t_code.replace(f"__in{i}", str(t_val))
-            else:
-                raise ValueError(
-                    f"Can not handle the literal case of shape: {jax_in_var.aval.shape}"
-                )
-
-        # Now replace the parameters
-        if len(eqn.params) != 0:
-            t_code = t_code.format(**eqn.params)
-
-        return t_code
-
-
-def _list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
-    """This method turns a `list` of pairs into a `dict` and applies a `None` filter.
-
-    The function will only include pairs whose key, i.e. first element is not `None`.
-    """
-    return {k: v for k, v in inp if k is not None}
-
-
-# Contains all the templates for ALU operations.
-_ALU_OPS_TMPL: Final[dict[str, str]] = {
-    # Unary operations
-    "pos": "__out0 = +(__in0)",
-    "neg": "__out0 = -(__in0)",
-    "not": "__out0 = not (__in0)",
-    "floor": "__out0 = floor(__in0)",
-    "ceil": "__out0 = ceil(__in0)",
-    "round": "__out0 = round(__in0)",
-    "abs": "__out0 = abs(__in0)",
-    "sign": "__out0 = sign(__in0)",
-    "sqrt": "__out0 = sqrt(__in0)",
-    "log": "__out0 = log(__in0)",
-    "exp": "__out0 = exp(__in0)",
-    "integer_pow": "__out0 = (__in0)**({y})",  # 'y' is a parameter of the primitive
-    "sin": "__out0 = sin(__in0)",
-    "asin": "__out0 = asin(__in0)",
-    "cos": "__out0 = cos(__in0)",
-    "acos": "__out0 = acos(__in0)",
-    "tan": "__out0 = tan(__in0)",
-    "atan": "__out0 = atan(__in0)",
-    "tanh": "__out0 = tanh(__in0)",
-    # Binary operations
-    "add": "__out0 = (__in0)+(__in1)",
-    "add_any": "__out0 = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
-    "sub": "__out0 = (__in0)-(__in1)",
-    "mul": "__out0 = (__in0)*(__in1)",
-    "div": "__out0 = (__in0)/(__in1)",
-    "rem": "__out0 = (__in0)%(__in1)",
-    "and": "__out0 = (__in0) and (__in1)",
-    "or": "__out0 = (__in0) or  (__in1)",
-    "pow": "__out0 = (__in0)**(__in1)",
-    "ipow": "__out0 = (__in0)**(int(__in1))",
-    "min": "__out0 = min(__in0, __in1)",
-    "max": "__out0 = max(__in0, __in1)",
-    "eq": "__out0 = __in0 == __in1",
-    "ne": "__out0 = __in0 != __in1",
-    "ge": "__out0 = __in0 >= __in1",
-    "gt": "__out0 = __in0 > __in1",
-    "le": "__out0 = __in0 <= __in1",
-    "lt": "__out0 = __in0 < __in1",
-}
-
-_ = [
-    translator.register_primitive_translator(ALUTranslator(prim_name, prim_tmpl))
-    for prim_name, prim_tmpl in _ALU_OPS_TMPL.items()
-]
diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
new file mode 100644
index 0000000..28c4af0
--- /dev/null
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -0,0 +1,340 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Module containing all translators related to arithmetic logical operations."""
+
+from __future__ import annotations
+
+from abc import abstractmethod
+from collections.abc import MutableSequence, Sequence
+from typing import Final, cast
+
+import dace
+import numpy as np
+from jax import core as jax_core
+from typing_extensions import override
+
+from jace import translator
+
+
+class ALUBaseTranslator(translator.PrimitiveTranslator):
+    """Base for all ALU (arithmetic logical operations) translators.
+
+    The ALU translators make use of the template pattern and this is the main Skeleton.
+    You can think of it as a glorified wrapper around `sdfg::add_mapped_tasklet()`.
+
+    It assumes that Tasklets can be written in the following form:
+    ```
+        __out0 = f(__in0, __in1, ...)
+    ```
+    where `f` is some function like plus, i.e. `__out0 = __in0 + __in1`, where `__in{}` is an input connector name of the Tasklet.
+
+    An instance of this class is constructed with the name of the primitive that it should handle and a template.
+    The template is basically the code that should be inside the Tasklet, i.e. the function `f`.
+
+    A subclass has to implement the `_get_input_memlets()` function which computes the Memlets used as inputs that are used.
+    There are two subclasses:
+    - `UnaryALUTranslator` for all unary operations.
+    - `BinaryALUTranslator` for all binary operations.
+    """
+
+    __slots__ = ("_prim_name", "_tskl_tmpl")
+
+    def __init__(
+        self,
+        prim_name: str,
+        tskl_tmpl: str,
+    ) -> None:
+        """Initialize a base translator for primitive `prim_name` with template `tskl_tmpl`.
+
+        Args:
+            prim_name:      The name of the primitive that should be handled.
+            tskl_tmpl:      Template used for generating the Tasklet code.
+        """
+        self._prim_name = prim_name
+        self._tskl_tmpl = tskl_tmpl
+
+    @property
+    def primitive(self) -> str:
+        """Returns the primitive that should be translated."""
+        return self._prim_name
+
+    @override
+    def __call__(
+        self,
+        driver: translator.JaxprTranslationDriver,
+        in_var_names: Sequence[str | None],
+        out_var_names: MutableSequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        """Perform the translation.
+
+        Deepening on the shapes of the input the function will either create a Tasklet or a mapped Tasklet.
+        The translator is able to handle broadcasting with NumPy rules.
+        The function will always perform the translation inside the provided state.
+
+        Args:
+            driver:         The driver object of the translation.
+            in_var_names:   List of the names of the arrays created inside the SDFG for the inpts or 'None' in case of a literal.
+            out_var_names:  List of the names of the arrays created inside the SDFG for the outputs.
+            eqn:            The Jax equation that is translated.
+            eqn_state:      State into which the primitive's SDFG representation is constructed.
+        """
+        if len(out_var_names) != 1:
+            raise NotImplementedError("'ALUBaseTranslator' only one output is allowed.")
+
+        if eqn.outvars[0].aval.shape != ():
+            tskl_map_ranges: list[tuple[str, str]] = [
+                (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
+            ]
+            tskl_output: dict[str, dace.Memlet] = {
+                "__out0": dace.Memlet.simple(
+                    out_var_names[0],
+                    ", ".join(name for name, _ in tskl_map_ranges),
+                ),
+            }
+        else:
+            # If we have a scalar we will generate a Map, but it will be trivial.
+            tskl_map_ranges = [("__iSCALAR", "0:1")]
+            tskl_output = {"__out0": dace.Memlet.simple(out_var_names[0], "0")}
+
+        # Non size dependent properties
+        tskl_name: str = f"{self.primitive}_{out_var_names[0]}"
+        tskl_code: str = self._get_tasklet_code(in_var_names, eqn)
+        tskl_inputs: dict[str, dace.Memlet] = self._get_input_memlets(
+            tskl_map_ranges, in_var_names, eqn
+        )
+
+        eqn_state.add_mapped_tasklet(
+            name=tskl_name,
+            map_ranges=tskl_map_ranges,
+            inputs=tskl_inputs,
+            code=tskl_code,
+            outputs=tskl_output,
+            external_edges=True,
+        )
+
+        return eqn_state
+
+    def _get_tasklet_code(
+        self,
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        """Return the code that should be put inside the Tasklet, with all parameters and literals substituted with their values.
+
+        Args:
+            in_var_names:   The list of SDFG variables used as input.
+            eqn:            The equation.
+        """
+
+        tskl_code = self._tskl_tmpl
+        for i, in_var_name in enumerate(in_var_names):
+            if in_var_name is not None:
+                continue
+
+            jax_in_var: jax_core.Literal = cast(jax_core.Literal, eqn.invars[i])
+            if jax_in_var.aval.shape == ():
+                t_val = jax_in_var.val
+                if isinstance(t_val, np.ndarray):
+                    t_val = jax_in_var.val.max()  # I do not know a better way in that case
+                tskl_code = tskl_code.replace(f"__in{i}", str(t_val))
+            else:
+                raise ValueError(f"Can not handle non scalar literals: {jax_in_var}")
+        if len(eqn.params) != 0:
+            tskl_code = tskl_code.format(**eqn.params)
+
+        return tskl_code
+
+    @abstractmethod
+    def _get_input_memlets(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        """Generate the input Memlets for the non literal operators of the primitive.
+
+        The returned `dict` maps the input connector of the Tasklet to the Memlet that is used to connect it to the Map entry node.
+
+        Args:
+            tskl_map_ranges:    List of the different map parameter, first element is the name of the dimension,
+                                    second is the range, i.e. `0:SIZE`.
+            in_var_names:       The list of SDFG variables used as input.
+            eqn:                The equation object.
+        """
+        ...
+
+
+class UnaryALUTranslator(ALUBaseTranslator):
+    """Class for all unary operations.
+
+    Thus all Tasklets this class generates have the form:
+    ```python
+        __out0 = f(__in0)
+    ```
+
+    Todo:
+        - Specialize for `integer_pow` to do code unrolling in certain situations.
+    """
+
+    def _get_input_memlets(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        """Generate the input Memlets for non literal data.
+
+        Args:
+            tskl_map_ranges:    List of the different map parameter, first element is the name of the dimension,
+                                    second is the range, i.e. `0:SIZE`.
+            in_var_names:       The list of SDFG variables used as input.
+            eqn:                The equation object.
+        """
+        in_var_name = in_var_names[0]
+        if in_var_name is None:  # Unary operation with literal input -> there is nothing to do.
+            return {}
+        if eqn.outvars[0].aval.shape == ():
+            imemlet = dace.Memlet.simple(in_var_name, "0")
+        else:
+            imemlet = dace.Memlet.simple(in_var_name, ", ".join(name for name, _ in tskl_ranges))
+        return {"__in0": imemlet}
+
+
+class BinaryALUTranslator(ALUBaseTranslator):
+    """Class for all binary ALU operations.
+
+    Thus all Tasklets will have the following form:
+    ```python
+        __out0 = f(__in0, __in1)
+    ```
+
+    The main difference towards the `UnaryALUTranslator` is that this class supports broadcasting.
+    However, this is only possible if both operators have the same rank.
+
+    Notes:
+        The input `__in0` is identified with the left hand side of an operator and `__in1` is identified as the right hand side.
+    """
+
+    def _get_input_memlets(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        out_shps = tuple(eqn.outvars[0].aval.shape)  # Shape of the output
+        inp_shpl = tuple(eqn.invars[0].aval.shape)  # Shape of the left/first input
+        inp_shpr = tuple(eqn.invars[1].aval.shape)  # Shape of the right/second input
+
+        # Which dimensions on which input should be broadcast, i.e. replicated.
+        #  A dimension that is replicated is always accessed with the index `0` in the Memlet.
+        #  If `dims_to_bcast*` is `None` then the corresponding argument is a scalar.
+        dims_to_bcastl: list[int] | None = []
+        dims_to_bcastr: list[int] | None = []
+
+        if out_shps == ():
+            # Output is scalar (thus also the inputs).
+            dims_to_bcastl = None
+            dims_to_bcastr = None
+
+        elif inp_shpl == inp_shpr:
+            # The two have the same shapes and neither is a scalar.
+            pass
+
+        elif inp_shpl == ():
+            # The LHS is a scalar (RHS is not)
+            dims_to_bcastl = None
+
+        elif inp_shpr == ():
+            # The RHS is a scalar (LHS is not)
+            dims_to_bcastr = None
+
+        else:
+            # This is the general broadcasting case
+            #  We assume that both inputs and the output have the same rank, Jax seems to ensure this.
+            assert len(out_shps) == len(inp_shpl) == len(inp_shpr)
+            for dim, shp_lft, shp_rgt in zip(range(len(out_shps)), inp_shpl, inp_shpr):
+                if shp_lft == shp_rgt:
+                    pass  # Needed for cases such as `(10, 1, 3) + (10, 1, 1)`.
+                elif shp_lft == 1:
+                    dims_to_bcastl.append(dim)  # type: ignore[union-attr]  # guaranteed to be not `None`
+                else:
+                    dims_to_bcastr.append(dim)  # type: ignore[union-attr]
+
+        # Now we will generate the input Memlets.
+        tskl_inputs: dict[str, dace.Memlet] = {}
+        for i, in_var_name, dims_to_bcast in zip(
+            range(2), in_var_names, [dims_to_bcastl, dims_to_bcastr]
+        ):
+            if in_var_name is None:  # Input is a literal: No Memlet needed
+                continue
+
+            if dims_to_bcast is None:
+                imemelt = dace.Memlet.simple(in_var_name, "0")  # Scalar
+            else:
+                imemelt = dace.Memlet.simple(
+                    in_var_name,
+                    ", ".join(
+                        ("0" if i in dims_to_bcast else it_var)
+                        for i, (it_var, _) in enumerate(tskl_ranges)
+                    ),
+                )
+            tskl_inputs[f"__in{i}"] = imemelt
+
+        return tskl_inputs
+
+
+# Contains all the templates for ALU operations.
+_ALU_UN_OPS_TMPL: Final[dict[str, str]] = {
+    "pos": "__out0 = +(__in0)",
+    "neg": "__out0 = -(__in0)",
+    "not": "__out0 = not (__in0)",
+    "floor": "__out0 = floor(__in0)",
+    "ceil": "__out0 = ceil(__in0)",
+    "round": "__out0 = round(__in0)",
+    "abs": "__out0 = abs(__in0)",
+    "sign": "__out0 = sign(__in0)",
+    "sqrt": "__out0 = sqrt(__in0)",
+    "log": "__out0 = log(__in0)",
+    "exp": "__out0 = exp(__in0)",
+    "integer_pow": "__out0 = (__in0)**({y})",  # 'y' is a parameter of the primitive
+    "sin": "__out0 = sin(__in0)",
+    "asin": "__out0 = asin(__in0)",
+    "cos": "__out0 = cos(__in0)",
+    "acos": "__out0 = acos(__in0)",
+    "tan": "__out0 = tan(__in0)",
+    "atan": "__out0 = atan(__in0)",
+    "tanh": "__out0 = tanh(__in0)",
+}
+_ALU_BI_OPS_TMPL: Final[dict[str, str]] = {
+    "add": "__out0 = (__in0)+(__in1)",
+    "add_any": "__out0 = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
+    "sub": "__out0 = (__in0)-(__in1)",
+    "mul": "__out0 = (__in0)*(__in1)",
+    "div": "__out0 = (__in0)/(__in1)",
+    "rem": "__out0 = (__in0)%(__in1)",
+    "and": "__out0 = (__in0) and (__in1)",
+    "or": "__out0 = (__in0) or  (__in1)",
+    "pow": "__out0 = (__in0)**(__in1)",
+    "ipow": "__out0 = (__in0)**(int(__in1))",
+    "min": "__out0 = min(__in0, __in1)",
+    "max": "__out0 = max(__in0, __in1)",
+    "eq": "__out0 = __in0 == __in1",
+    "ne": "__out0 = __in0 != __in1",
+    "ge": "__out0 = __in0 >= __in1",
+    "gt": "__out0 = __in0 > __in1",
+    "le": "__out0 = __in0 <= __in1",
+    "lt": "__out0 = __in0 < __in1",
+}
+
+# Create the ALU translators
+for pname, ptmpl in _ALU_UN_OPS_TMPL.items():
+    translator.register_primitive_translator(UnaryALUTranslator(pname, ptmpl))
+for pname, ptmpl in _ALU_BI_OPS_TMPL.items():
+    translator.register_primitive_translator(BinaryALUTranslator(pname, ptmpl))
diff --git a/tests/test_sub_translators_alu.py b/tests/test_sub_translators_alu.py
index 45a5548..5c3a995 100644
--- a/tests/test_sub_translators_alu.py
+++ b/tests/test_sub_translators_alu.py
@@ -9,55 +9,161 @@
 
 from __future__ import annotations
 
+from collections.abc import Callable, Sequence
+from typing import Any
+
 import jax
 import numpy as np
+from jax import numpy as jnp
 
 import jace
 
 
-def test_add():
-    """Simple add function."""
+def _perform_test(testee: Callable, *args: Any) -> None:
+    """General function that just performs the test."""
+    wrapped = jace.jit(testee)
+
+    ref = testee(*args)
+    res = wrapped(*args)
+    assert np.allclose(ref, res), f"Expected '{ref.tolist()}' got '{res.tolist()}'"
+
+
+def mkarr(
+    shape: Sequence[int],
+    dtype=np.float64,
+) -> np.ndarray:
+    return np.array(np.random.random(shape), dtype=dtype)  # noqa: NPY002
+
+
+def test_alu_unary_scalar():
+    """Test unary ALU translator in the scalar case."""
+
+    def testee(A: float) -> float:
+        return jnp.cos(A)
+
+    _perform_test(testee, 1.0)
+
+
+def test_alu_unary_array():
+    """Test unary ALU translator with array argument."""
+
+    def testee(A: np.ndarray) -> np.ndarray:
+        return jnp.sin(A)
+
+    A = mkarr((100, 10, 3))
+
+    _perform_test(testee, A)
+
+
+def test_alu_unary_scalar_literal():
+    """Test unary ALU translator with literal argument"""
+
+    def testee(A: float) -> float:
+        return jnp.sin(1.98) + A
+
+    _perform_test(testee, 10.0)
+
+
+def test_alu_unary_integer_power():
+    """Tests the integer power, which has a parameter."""
+    for exp in [0, 1, 2, 10]:
+
+        def testee(A: np.ndarray) -> np.ndarray:
+            return A ** int(exp)  # noqa: B023 # `exp` is not used in the body
+
+        A = mkarr((10, 2 + exp, 3))
+        _perform_test(testee, A)
+
+
+def test_alu_binary_scalar():
+    """Scalar binary operation."""
+
+    def testee(A: float, B: float) -> float:
+        return A * B
+
+    _perform_test(testee, 1.0, 2.0)
+
+
+def test_alu_binary_scalar_literal():
+    """Scalar binary operation, with a literal."""
+
+    def testee(A: float) -> float:
+        return A * 2.03
+
+    _perform_test(testee, 7.0)
+
+
+def test_alu_binary_array():
+    """Test binary of arrays, with same size."""
 
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
+    A = mkarr((100, 10, 3))
+    B = mkarr((100, 10, 3))
+    _perform_test(testee, A, B)
 
-    ref = testee(A, B)
-    res = jace.jit(testee)(A, B)
 
-    assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
+def test_alu_binary_array_scalar():
+    """Test binary of array with scalar."""
 
+    def testee(A: np.ndarray, B: float) -> np.ndarray:
+        return A + B
 
-def test_add2():
-    """Simple add function, with literal."""
+    A = mkarr((100, 22))
+    B = np.float64(1.34)
+    _perform_test(testee, A, B)
 
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        c = A + 0.01
-        d = B * 0.6
-        e = c / 1.0
-        f = d - 0.1
-        return e + f * d
 
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
+def test_alu_binary_array_literal():
+    """Test binary of array with literal"""
 
-    ref = testee(A, B)
-    res = jace.jit(testee)(A, B)
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A + 1.52
 
-    assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
+    A = mkarr((100, 22))
+    _perform_test(testee, A)
 
 
-def test_add3():
-    """Simple add function, with constant."""
+def test_alu_binary_array_literal_2():
+    """Test binary of array with literal"""
+
+    def testee(A: np.ndarray) -> np.ndarray:
+        return 1.52 + A
+
+    A = mkarr((100, 22))
+    _perform_test(testee, A)
+
+
+def test_alu_binary_array_constants():
+    """Test binary of array with constant."""
 
     def testee(A: np.ndarray) -> np.ndarray:
         return A + jax.numpy.array([[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]])
 
-    A = np.ones((3, 3), dtype=np.float64)
+    A = mkarr((3, 3))
+    _perform_test(testee, A)
+
+
+def test_alu_binary_broadcast_1():
+    """Test broadcasting."""
+
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A + B
+
+    A = mkarr((100, 1, 3))
+    B = mkarr((100, 1, 1))
+    _perform_test(testee, A, B)
+    _perform_test(testee, B, A)
+
 
-    ref = testee(A)
-    res = jace.jit(testee)(A)
+def test_alu_binary_broadcast_2():
+    """Test broadcasting."""
+
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A + B
 
-    assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
+    A = mkarr((100, 1))
+    B = mkarr((100, 10))
+    _perform_test(testee, A, B)
+    _perform_test(testee, B, A)

From 6c0c5e2c358dee307c72e6d06a9320b43b80245c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 22 May 2024 07:29:31 +0200
Subject: [PATCH 207/458] Updated the ALU translators a bit, they now have
 better names.

---
 .../primitive_translators/alu_translators.py  | 38 +++++++++----------
 1 file changed, 19 insertions(+), 19 deletions(-)

diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index 28c4af0..7f3b504 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -36,7 +36,7 @@ class ALUBaseTranslator(translator.PrimitiveTranslator):
     An instance of this class is constructed with the name of the primitive that it should handle and a template.
     The template is basically the code that should be inside the Tasklet, i.e. the function `f`.
 
-    A subclass has to implement the `_get_input_memlets()` function which computes the Memlets used as inputs that are used.
+    A subclass has to implement the `make_input_memlets()` function which computes the Memlets used as inputs that are used.
     There are two subclasses:
     - `UnaryALUTranslator` for all unary operations.
     - `BinaryALUTranslator` for all binary operations.
@@ -80,39 +80,39 @@ def __call__(
 
         Args:
             driver:         The driver object of the translation.
-            in_var_names:   List of the names of the arrays created inside the SDFG for the inpts or 'None' in case of a literal.
+            in_var_names:   List of the names of the arrays created inside the SDFG for the inputs or 'None' in case of a literal.
             out_var_names:  List of the names of the arrays created inside the SDFG for the outputs.
             eqn:            The Jax equation that is translated.
             eqn_state:      State into which the primitive's SDFG representation is constructed.
         """
         if len(out_var_names) != 1:
-            raise NotImplementedError("'ALUBaseTranslator' only one output is allowed.")
+            raise NotImplementedError("'{type(self).__name__}' only one output is allowed.")
 
         if eqn.outvars[0].aval.shape != ():
-            tskl_map_ranges: list[tuple[str, str]] = [
+            tskl_ranges: list[tuple[str, str]] = [
                 (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
             ]
             tskl_output: dict[str, dace.Memlet] = {
                 "__out0": dace.Memlet.simple(
                     out_var_names[0],
-                    ", ".join(name for name, _ in tskl_map_ranges),
+                    ", ".join(name for name, _ in tskl_ranges),
                 ),
             }
         else:
             # If we have a scalar we will generate a Map, but it will be trivial.
-            tskl_map_ranges = [("__iSCALAR", "0:1")]
+            tskl_ranges = [("__jace_iterator_SCALAR", "0:1")]
             tskl_output = {"__out0": dace.Memlet.simple(out_var_names[0], "0")}
 
         # Non size dependent properties
         tskl_name: str = f"{self.primitive}_{out_var_names[0]}"
-        tskl_code: str = self._get_tasklet_code(in_var_names, eqn)
-        tskl_inputs: dict[str, dace.Memlet] = self._get_input_memlets(
-            tskl_map_ranges, in_var_names, eqn
+        tskl_code: str = self.write_tasklet_code(in_var_names, eqn)
+        tskl_inputs: dict[str, dace.Memlet] = self.make_input_memlets(
+            tskl_ranges, in_var_names, eqn
         )
 
         eqn_state.add_mapped_tasklet(
             name=tskl_name,
-            map_ranges=tskl_map_ranges,
+            map_ranges=tskl_ranges,
             inputs=tskl_inputs,
             code=tskl_code,
             outputs=tskl_output,
@@ -121,7 +121,7 @@ def __call__(
 
         return eqn_state
 
-    def _get_tasklet_code(
+    def write_tasklet_code(
         self,
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
@@ -152,7 +152,7 @@ def _get_tasklet_code(
         return tskl_code
 
     @abstractmethod
-    def _get_input_memlets(
+    def make_input_memlets(
         self,
         tskl_ranges: Sequence[tuple[str, str]],
         in_var_names: Sequence[str | None],
@@ -163,7 +163,7 @@ def _get_input_memlets(
         The returned `dict` maps the input connector of the Tasklet to the Memlet that is used to connect it to the Map entry node.
 
         Args:
-            tskl_map_ranges:    List of the different map parameter, first element is the name of the dimension,
+            tskl_ranges:    List of the different map parameter, first element is the name of the dimension,
                                     second is the range, i.e. `0:SIZE`.
             in_var_names:       The list of SDFG variables used as input.
             eqn:                The equation object.
@@ -183,7 +183,7 @@ class UnaryALUTranslator(ALUBaseTranslator):
         - Specialize for `integer_pow` to do code unrolling in certain situations.
     """
 
-    def _get_input_memlets(
+    def make_input_memlets(
         self,
         tskl_ranges: Sequence[tuple[str, str]],
         in_var_names: Sequence[str | None],
@@ -192,10 +192,10 @@ def _get_input_memlets(
         """Generate the input Memlets for non literal data.
 
         Args:
-            tskl_map_ranges:    List of the different map parameter, first element is the name of the dimension,
-                                    second is the range, i.e. `0:SIZE`.
-            in_var_names:       The list of SDFG variables used as input.
-            eqn:                The equation object.
+            tskl_ranges:    List of the different map parameter, first element is the name of the dimension,
+                                second is the range, i.e. `0:SIZE`.
+            in_var_names:   The list of SDFG variables used as input.
+            eqn:            The equation object.
         """
         in_var_name = in_var_names[0]
         if in_var_name is None:  # Unary operation with literal input -> there is nothing to do.
@@ -222,7 +222,7 @@ class BinaryALUTranslator(ALUBaseTranslator):
         The input `__in0` is identified with the left hand side of an operator and `__in1` is identified as the right hand side.
     """
 
-    def _get_input_memlets(
+    def make_input_memlets(
         self,
         tskl_ranges: Sequence[tuple[str, str]],
         in_var_names: Sequence[str | None],

From ab4f60cf0046f6b9d488f82b9e169858ebaca84b Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 22 May 2024 09:07:19 +0200
Subject: [PATCH 208/458] Split the ALU class again.

There is now a more general class that is able to do broadcasting.
However, theunary operation now looks a bit strange, but I am willingly to pay the price.
---
 .../primitive_translators/__init__.py         |   3 +-
 .../primitive_translators/alu_translators.py  | 159 +++--------------
 .../mapped_operation_base_translator.py       | 167 ++++++++++++++++++
 3 files changed, 197 insertions(+), 132 deletions(-)
 create mode 100644 src/jace/translator/primitive_translators/mapped_operation_base_translator.py

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index c01f657..5595589 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -8,11 +8,10 @@
 
 from __future__ import annotations
 
-from .alu_translators import ALUBaseTranslator, BinaryALUTranslator, UnaryALUTranslator
+from .alu_translators import BinaryALUTranslator, UnaryALUTranslator
 
 
 __all__ = [
-    "ALUBaseTranslator",
     "BinaryALUTranslator",
     "UnaryALUTranslator",
 ]
diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index 7f3b504..fd3b442 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -9,8 +9,7 @@
 
 from __future__ import annotations
 
-from abc import abstractmethod
-from collections.abc import MutableSequence, Sequence
+from collections.abc import Sequence
 from typing import Final, cast
 
 import dace
@@ -19,30 +18,24 @@
 from typing_extensions import override
 
 from jace import translator
+from jace.translator.primitive_translators.mapped_operation_base_translator import (
+    MappedOperationBaseTranslator,
+)
 
 
-class ALUBaseTranslator(translator.PrimitiveTranslator):
+class ALUBaseTranslator(MappedOperationBaseTranslator):
     """Base for all ALU (arithmetic logical operations) translators.
 
-    The ALU translators make use of the template pattern and this is the main Skeleton.
-    You can think of it as a glorified wrapper around `sdfg::add_mapped_tasklet()`.
+    This class implements the `MappedOperationBaseTranslator::write_tasklet_code()` function.
+    The tasklet is written based on a template string.
+    In addition to that the function will also do literal substitution.
 
-    It assumes that Tasklets can be written in the following form:
-    ```
-        __out0 = f(__in0, __in1, ...)
-    ```
-    where `f` is some function like plus, i.e. `__out0 = __in0 + __in1`, where `__in{}` is an input connector name of the Tasklet.
-
-    An instance of this class is constructed with the name of the primitive that it should handle and a template.
-    The template is basically the code that should be inside the Tasklet, i.e. the function `f`.
-
-    A subclass has to implement the `make_input_memlets()` function which computes the Memlets used as inputs that are used.
     There are two subclasses:
     - `UnaryALUTranslator` for all unary operations.
     - `BinaryALUTranslator` for all binary operations.
     """
 
-    __slots__ = ("_prim_name", "_tskl_tmpl")
+    __slots__ = "_tskl_tmpl"
 
     def __init__(
         self,
@@ -55,72 +48,10 @@ def __init__(
             prim_name:      The name of the primitive that should be handled.
             tskl_tmpl:      Template used for generating the Tasklet code.
         """
-        self._prim_name = prim_name
+        super().__init__(primitive_name=prim_name)
         self._tskl_tmpl = tskl_tmpl
 
-    @property
-    def primitive(self) -> str:
-        """Returns the primitive that should be translated."""
-        return self._prim_name
-
     @override
-    def __call__(
-        self,
-        driver: translator.JaxprTranslationDriver,
-        in_var_names: Sequence[str | None],
-        out_var_names: MutableSequence[str],
-        eqn: jax_core.JaxprEqn,
-        eqn_state: dace.SDFGState,
-    ) -> None:
-        """Perform the translation.
-
-        Deepening on the shapes of the input the function will either create a Tasklet or a mapped Tasklet.
-        The translator is able to handle broadcasting with NumPy rules.
-        The function will always perform the translation inside the provided state.
-
-        Args:
-            driver:         The driver object of the translation.
-            in_var_names:   List of the names of the arrays created inside the SDFG for the inputs or 'None' in case of a literal.
-            out_var_names:  List of the names of the arrays created inside the SDFG for the outputs.
-            eqn:            The Jax equation that is translated.
-            eqn_state:      State into which the primitive's SDFG representation is constructed.
-        """
-        if len(out_var_names) != 1:
-            raise NotImplementedError("'{type(self).__name__}' only one output is allowed.")
-
-        if eqn.outvars[0].aval.shape != ():
-            tskl_ranges: list[tuple[str, str]] = [
-                (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
-            ]
-            tskl_output: dict[str, dace.Memlet] = {
-                "__out0": dace.Memlet.simple(
-                    out_var_names[0],
-                    ", ".join(name for name, _ in tskl_ranges),
-                ),
-            }
-        else:
-            # If we have a scalar we will generate a Map, but it will be trivial.
-            tskl_ranges = [("__jace_iterator_SCALAR", "0:1")]
-            tskl_output = {"__out0": dace.Memlet.simple(out_var_names[0], "0")}
-
-        # Non size dependent properties
-        tskl_name: str = f"{self.primitive}_{out_var_names[0]}"
-        tskl_code: str = self.write_tasklet_code(in_var_names, eqn)
-        tskl_inputs: dict[str, dace.Memlet] = self.make_input_memlets(
-            tskl_ranges, in_var_names, eqn
-        )
-
-        eqn_state.add_mapped_tasklet(
-            name=tskl_name,
-            map_ranges=tskl_ranges,
-            inputs=tskl_inputs,
-            code=tskl_code,
-            outputs=tskl_output,
-            external_edges=True,
-        )
-
-        return eqn_state
-
     def write_tasklet_code(
         self,
         in_var_names: Sequence[str | None],
@@ -132,7 +63,6 @@ def write_tasklet_code(
             in_var_names:   The list of SDFG variables used as input.
             eqn:            The equation.
         """
-
         tskl_code = self._tskl_tmpl
         for i, in_var_name in enumerate(in_var_names):
             if in_var_name is not None:
@@ -151,72 +81,36 @@ def write_tasklet_code(
 
         return tskl_code
 
-    @abstractmethod
-    def make_input_memlets(
-        self,
-        tskl_ranges: Sequence[tuple[str, str]],
-        in_var_names: Sequence[str | None],
-        eqn: jax_core.JaxprEqn,
-    ) -> dict[str, dace.Memlet]:
-        """Generate the input Memlets for the non literal operators of the primitive.
-
-        The returned `dict` maps the input connector of the Tasklet to the Memlet that is used to connect it to the Map entry node.
-
-        Args:
-            tskl_ranges:    List of the different map parameter, first element is the name of the dimension,
-                                    second is the range, i.e. `0:SIZE`.
-            in_var_names:       The list of SDFG variables used as input.
-            eqn:                The equation object.
-        """
-        ...
-
 
 class UnaryALUTranslator(ALUBaseTranslator):
     """Class for all unary operations.
 
-    Thus all Tasklets this class generates have the form:
-    ```python
-        __out0 = f(__in0)
-    ```
-
     Todo:
         - Specialize for `integer_pow` to do code unrolling in certain situations.
     """
 
-    def make_input_memlets(
+    @override
+    def write_tasklet_code(
         self,
-        tskl_ranges: Sequence[tuple[str, str]],
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
-    ) -> dict[str, dace.Memlet]:
-        """Generate the input Memlets for non literal data.
-
-        Args:
-            tskl_ranges:    List of the different map parameter, first element is the name of the dimension,
-                                second is the range, i.e. `0:SIZE`.
-            in_var_names:   The list of SDFG variables used as input.
-            eqn:            The equation object.
-        """
-        in_var_name = in_var_names[0]
-        if in_var_name is None:  # Unary operation with literal input -> there is nothing to do.
-            return {}
-        if eqn.outvars[0].aval.shape == ():
-            imemlet = dace.Memlet.simple(in_var_name, "0")
-        else:
-            imemlet = dace.Memlet.simple(in_var_name, ", ".join(name for name, _ in tskl_ranges))
-        return {"__in0": imemlet}
+    ) -> str:
+        if len(in_var_names) != 1:
+            raise RuntimeWarning(
+                f"'UnaryALUTranslator' can only handle unary operations.\nEqn: {eqn}"
+            )
+        return super().write_tasklet_code(
+            in_var_names=in_var_names,
+            eqn=eqn,
+        )
 
 
 class BinaryALUTranslator(ALUBaseTranslator):
     """Class for all binary ALU operations.
 
-    Thus all Tasklets will have the following form:
-    ```python
-        __out0 = f(__in0, __in1)
-    ```
-
-    The main difference towards the `UnaryALUTranslator` is that this class supports broadcasting.
-    However, this is only possible if both operators have the same rank.
+    While `MappedOperationBaseTranslator` requires that the inputs must have the same shape,
+    this class lift this restriction and allows to broadcast the operants.
+    However, broadcasting is only possible if both inputs have the same rank.
 
     Notes:
         The input `__in0` is identified with the left hand side of an operator and `__in1` is identified as the right hand side.
@@ -228,6 +122,11 @@ def make_input_memlets(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> dict[str, dace.Memlet]:
+        if len(in_var_names) != 2:
+            raise RuntimeWarning(
+                f"'BinaryALUTranslator' can only handle binary operations.\nEqn: {eqn}"
+            )
+
         out_shps = tuple(eqn.outvars[0].aval.shape)  # Shape of the output
         inp_shpl = tuple(eqn.invars[0].aval.shape)  # Shape of the left/first input
         inp_shpr = tuple(eqn.invars[1].aval.shape)  # Shape of the right/second input
diff --git a/src/jace/translator/primitive_translators/mapped_operation_base_translator.py b/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
new file mode 100644
index 0000000..5f217f1
--- /dev/null
+++ b/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
@@ -0,0 +1,167 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Module containing all translators related to arithmetic logical operations."""
+
+from __future__ import annotations
+
+from abc import abstractmethod
+from collections.abc import MutableSequence, Sequence
+
+import dace
+from jax import core as jax_core
+from typing_extensions import final, override
+
+from jace import translator
+
+
+class MappedOperationBaseTranslator(translator.PrimitiveTranslator):
+    """Implements the base for all "mapped base operations".
+
+    A mapped base operation `f` is an operation that has several inputs arrays that are elementwise combined to a single output array.
+    A prime example for this would be the addition of two arrays of the _same_ size.
+    Essentially it assumes that the Tasklet code can be written as:
+    ```
+        __out0 = f(__in0, __in1, __in3, ...)
+    ```
+    where `__in*` are the connector names of the Tasklet and `__out0` is the output connector.
+    For problems such as this, the SDFG API provides the `SDFGState::add_mapped_tasklet()` function, however, in most cases it can not be directly used.
+    Thus this class acts like a convenience wrapper around it.
+
+    To use this class a user has to overwrite the `write_tasklet_code()` function.
+    This function generates the Python code that should be put inside the Tasklet.
+
+    Notes:
+        This class will always generate a mapped Tasklet, even if a scalar is handled.
+        The class will always map over the entirety of the output and assume that all inputs have the same shape as the output.
+            If you want to override this behaviour you have to override the `make_input_memlets()` method
+            and generate the appropriate Memlets to use as inputs yourself.
+        Only one output is allowed.
+    """
+
+    __slots__ = ("_prim_name",)
+
+    def __init__(
+        self,
+        primitive_name: str,
+    ) -> None:
+        """Bind `self` to the primitive with name `primitive_name`."""
+        self._prim_name = primitive_name
+
+    @property
+    def primitive(self) -> str:
+        """Returns the primitive that should be translated."""
+        return self._prim_name
+
+    @final
+    @override
+    def __call__(
+        self,
+        driver: translator.JaxprTranslationDriver,
+        in_var_names: Sequence[str | None],
+        out_var_names: MutableSequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        """Create the mapped Tasklet.
+
+        The function will create the map ranges and based on the shape of the output array.
+        It will then call `make_input_memlets()` to get the input Memlets.
+        After that it calls `write_tasklet_code()` to get the Tasklet code.
+        After that it will create the mapped Tasklet.
+
+        Args:
+            driver:         The driver object of the translation.
+            in_var_names:   List of the names of the arrays created inside the SDFG for the inputs or 'None' in case of a literal.
+            out_var_names:  List of the names of the arrays created inside the SDFG for the outputs.
+            eqn:            The Jax equation that is translated.
+            eqn_state:      State into which the primitive's SDFG representation is constructed.
+        """
+        if eqn.outvars[0].aval.shape != ():
+            tskl_ranges: list[tuple[str, str]] = [
+                (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
+            ]
+            tskl_output: dict[str, dace.Memlet] = {
+                "__out0": dace.Memlet.simple(
+                    out_var_names[0],
+                    ", ".join(name for name, _ in tskl_ranges),
+                )
+            }
+
+        else:
+            # If we have a scalar we will generate a Map, but it will be trivial.
+            tskl_ranges = [("__jace_iterator_SCALAR", "0:1")]
+            tskl_output = {"__out0": dace.Memlet.simple(out_var_names[0], "0")}
+
+        tskl_inputs: dict[str, dace.Memlet] = self.make_input_memlets(
+            tskl_ranges, in_var_names, eqn
+        )
+        tskl_name: str = f"{self.primitive}_{out_var_names[0]}"
+        tskl_code: str = self.write_tasklet_code(in_var_names, eqn)
+
+        eqn_state.add_mapped_tasklet(
+            name=tskl_name,
+            map_ranges=tskl_ranges,
+            inputs=tskl_inputs,
+            code=tskl_code,
+            outputs=tskl_output,
+            external_edges=True,
+        )
+
+        return eqn_state
+
+    @abstractmethod
+    def write_tasklet_code(
+        self,
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        """Return the code that should be put inside the Tasklet.
+
+        Note that returned code is not processed any further.
+        Thus the function has to apply literal removal on its own.
+
+        Args:
+            in_var_names:   The list of SDFG variables used as input.
+            eqn:            The equation.
+        """
+        ...
+
+    def make_input_memlets(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        """Generate the input Memlets for the non literal operators of the primitive.
+
+        The returned `dict` maps the input connector of the Tasklet to the Memlet that is used to connect it to the Map entry node.
+
+        Args:
+            tskl_ranges:    List of the different map parameter, first element is the name of the dimension,
+                                    second is the range, i.e. `0:SIZE`.
+            in_var_names:       The list of SDFG variables used as input.
+            eqn:                The equation object.
+        """
+        if any(eqn.outvars[0].aval.shape != invar.aval.shape for invar in eqn.invars):
+            # If you want to use this class as base, then you must override this function.
+            raise NotImplementedError(
+                "`MappedOperationBaseTranslator` can only handle inputs and output of the same shape!\nEqn: {eqn}"
+            )
+
+        return {
+            f"__in{i}": dace.Memlet.simple(
+                in_var_name,
+                (
+                    ", ".join(name for name, _ in tskl_ranges)
+                    if eqn.outvars[0].aval.shape != ()
+                    else "0"
+                ),
+            )
+            for i, in_var_name in enumerate(in_var_names)
+            if in_var_name is not None
+        }

From 31f11fc567823958fc45d437edcee4d370bf0690 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 22 May 2024 09:28:31 +0200
Subject: [PATCH 209/458] Small fixes.

---
 src/jace/jax/translation_cache.py | 2 +-
 src/jace/util/jax_helper.py       | 2 +-
 src/jace/util/traits.py           | 2 +-
 3 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/jace/jax/translation_cache.py b/src/jace/jax/translation_cache.py
index 267b7f9..f46cdef 100644
--- a/src/jace/jax/translation_cache.py
+++ b/src/jace/jax/translation_cache.py
@@ -126,7 +126,7 @@ def from_value(
 
         if util.is_array(val):
             if util.is_jax_array(val):
-                val = val.__array__(copy=False)
+                val = val.__array__()  # Passing `copy=False` leads to error in NumPy.
             shape = val.shape
             dtype = util.translate_dtype(val.dtype)
             strides = getattr(val, "strides", None)
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 01eaa8f..1df0334 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -170,7 +170,7 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
     if hasattr(dace.dtypes, dtype_name):
         return getattr(dace.dtypes, dtype_name)
     if hasattr(np, dtype_name):
-        dtype = getattr(np, dtype)
+        dtype = getattr(np, dtype_name)
         return dace.dtype_to_typeclass(dtype)
     raise ValueError(f"Unable to translate '{dtype}' ino a DaCe dtype.")
 
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 6336f6d..44ba097 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -142,5 +142,5 @@ def is_fully_addressable(
             Jax array is on this host.
     """
     if is_jax_array(obj):
-        return obj.is_fully_addressable()
+        return obj.is_fully_addressable
     return True

From 8543e6831ab2027eb1739315560c45488f825348 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 22 May 2024 09:33:17 +0200
Subject: [PATCH 210/458] Added a new note regarding the `x64` Situation.

---
 src/jace/translator/jaxpr_translator_driver.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index a70598b..6e40b33 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -119,6 +119,11 @@ def translate_jaxpr(
         if len(jaxpr.effects) != 0:
             raise NotImplementedError("'Jaxpr' with side effects are not supported.")
         if not _jax.config.read("jax_enable_x64"):
+            # NOTE: What is interesting here is, that the SDFG can be called, but the result is garbage.
+            #  Beside that I think it should not work, I think it should not even call,
+            #  because of a mismatch in data types.
+            #  However, If we work with Jax arrays themselves, it should technically work.
+            #  But currently the best we can do, is forbid it!
             raise NotImplementedError(
                 "You have disabled 'x64' support in Jax, which interferes with the calling of the SDFG. "
                 "SDFG generated in this way will fail to call."

From 3a3ca657cc8b40b13cf237d71151c1bc34c6bb21 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 22 May 2024 09:45:16 +0200
Subject: [PATCH 211/458] Updated the tests, there is now also a test for
 checking the Datatype.

---
 tests/test_caching.py | 24 ++++++++++++++++++++++++
 1 file changed, 24 insertions(+)

diff --git a/tests/test_caching.py b/tests/test_caching.py
index ea31153..67d5e70 100644
--- a/tests/test_caching.py
+++ b/tests/test_caching.py
@@ -185,6 +185,30 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     assert optiCompiled._csdfg.sdfg.number_of_nodes() < unoptiCompiled._csdfg.sdfg.number_of_nodes()
 
 
+def test_caching_dtype():
+    """Tests if the data type is properly included in the test."""
+
+    lowering_cnt = [0]
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        lowering_cnt[0] += 1
+        return A + A
+
+    dtypes = [np.float64, np.float32, np.int32, np.int64]
+    shape = (10, 10)
+
+    for i, dtype in enumerate(dtypes):
+        A = np.array((np.random.random(shape) - 0.5) * 10, dtype=dtype)  # noqa: NPY002
+
+        assert lowering_cnt[0] == i
+        _ = testee(A)
+        assert lowering_cnt[0] == i + 1
+
+        assert np.allclose(testee(A), 2 * A)
+        assert lowering_cnt[0] == i + 1
+
+
 def test_caching_strides() -> None:
     """Test if the cache detects a change in strides."""
 

From e41a7e9b7c4793ed21f4424a524489de1834cef1 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 22 May 2024 09:56:44 +0200
Subject: [PATCH 212/458] Added a test for a possible bug in DaCe.

---
 tests/test_decorator.py |  2 +-
 tests/test_misc.py      | 40 ++++++++++++++++++++++++++++++++++++++++
 2 files changed, 41 insertions(+), 1 deletion(-)
 create mode 100644 tests/test_misc.py

diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index cf1ffaf..7877b07 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -8,7 +8,7 @@
 """Implements tests for the jit decorator.
 
 Also see the `test_jax_api.py` test file, that tests composability.
-."""
+"""
 
 from __future__ import annotations
 
diff --git a/tests/test_misc.py b/tests/test_misc.py
new file mode 100644
index 0000000..ec2a5b2
--- /dev/null
+++ b/tests/test_misc.py
@@ -0,0 +1,40 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements general tests for Jace."""
+
+from __future__ import annotations
+
+import numpy as np
+import pytest
+
+import jace
+
+
+@pytest.mark.skip("Possible bug in DaCe.")
+def test_mismatch_in_datatyte_calling():
+    """Tests compilation and calling with different types.
+
+    Note that this more or less tests the calling implementation of the `CompiledSDFG` class in DaCe.
+    As I understand the `CompiledSDFG::_construct_args()` function this should be detected.
+    However, as evidently it does not do this.
+    """
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        return -A
+
+    # Different types.
+    A1 = np.arange(12, dtype=np.float32).reshape((4, 3))
+    A2 = np.arange(12, dtype=np.int64).reshape((4, 3))
+
+    # Lower and compilation for first type
+    callee = testee.lower(A1).compile()
+
+    # But calling with the second type
+    with pytest.raises(Exception):  # noqa: B017, PT011 # Unknown exception.
+        _ = callee(A2)

From 2fd739100efebd827f7c93ece9269484f36785b5 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 22 May 2024 10:40:40 +0200
Subject: [PATCH 213/458] Updated the `translate_dtype()` function.

I think this make it less magical, okay it is stil very guru level, but it looks a bit more reasonable.
---
 src/jace/util/jax_helper.py | 32 +++++---------------------------
 1 file changed, 5 insertions(+), 27 deletions(-)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 1df0334..5d004ab 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -22,8 +22,6 @@
 
 import dace
 import jax.core as jax_core
-import jax.dtypes as jax_dtypes
-import numpy as np
 
 import jace.util as util
 
@@ -144,35 +142,15 @@ def is_tracing_ongoing(
 
 def translate_dtype(dtype: Any) -> dace.typeclass:
     """Turns a Jax datatype into a DaCe datatype."""
+    if dtype is None:
+        raise NotImplementedError  # Handling a special case in DaCe.
     if isinstance(dtype, dace.typeclass):
         return dtype
-    if dtype is None:
-        # Special behaviour of `dtype_to_typeclass()`
-        raise NotImplementedError()
-
-    # For reasons unknown to me we have to do the dtype conversion this way.
-    #  It is not possible to simply call `dace.typeclass(dtype)` or pass it to
-    #  `dace.dtype_to_typeclass()`, it will generate an error.
-    #  We keep the `dtype_to_typeclass()` function call, in order to handle
-    #  NumPy types as DaCe intended them to be handled.
-    try:
-        return dace.dtype_to_typeclass(dtype)
-    except KeyError:
-        pass
-
     try:
-        dtype_ = jax_dtypes.canonicalize_dtype(dtype)
-        return dace.dtype_to_typeclass(dtype_)
-    except Exception:
+        return dace.typeclass(dtype)
+    except (NameError, KeyError):
         pass
-
-    dtype_name = str(dtype)
-    if hasattr(dace.dtypes, dtype_name):
-        return getattr(dace.dtypes, dtype_name)
-    if hasattr(np, dtype_name):
-        dtype = getattr(np, dtype_name)
-        return dace.dtype_to_typeclass(dtype)
-    raise ValueError(f"Unable to translate '{dtype}' ino a DaCe dtype.")
+    return dace.dtype_to_typeclass(getattr(dtype, "type", dtype))
 
 
 def propose_jax_name(

From e4fb0cb4ab5d3fb5221f911dae65af809ffb4fad Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 22 May 2024 12:37:43 +0200
Subject: [PATCH 214/458] WIP: Testing new translator.

---
 .../primitive_translators/__init__.py         |  2 +
 .../convert_element_type_translator.py        | 91 +++++++++++++++++++
 tests/test_convert_element_type.py            | 18 ++++
 3 files changed, 111 insertions(+)
 create mode 100644 src/jace/translator/primitive_translators/convert_element_type_translator.py
 create mode 100644 tests/test_convert_element_type.py

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 5595589..043661c 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -9,9 +9,11 @@
 from __future__ import annotations
 
 from .alu_translators import BinaryALUTranslator, UnaryALUTranslator
+from .convert_element_type_translator import ConvertElementTypeTranslator
 
 
 __all__ = [
     "BinaryALUTranslator",
     "UnaryALUTranslator",
+    "ConvertElementTypeTranslator",
 ]
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
new file mode 100644
index 0000000..531cc48
--- /dev/null
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -0,0 +1,91 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements the Translator for the `convert_element_type` primitive."""
+
+from __future__ import annotations
+
+import warnings
+from collections.abc import Sequence
+
+import dace
+from jax import core as jax_core
+from typing_extensions import override
+
+from jace.translator.primitive_translators.mapped_operation_base_translator import (
+    MappedOperationBaseTranslator,
+)
+
+
+class ConvertElementTypeTranslator(MappedOperationBaseTranslator):
+    """Implements the `convert_element_type` primitive.
+
+    Copies the input to the output and performs type conversion.
+
+    Notes:
+        This translator ignores the `new_dtype` and `weak_type` parameter of the equation and only performs casting
+
+    Todo:
+        I occasionally Jax converts from the same type to another type.
+            This case should be handled by a Memlet directly, which can then be removed.
+    """
+
+    __slots__ = ()
+
+    def __init__(self) -> None:
+        super().__init__(primitive_name="convert_element_type")
+
+    @override
+    def write_tasklet_code(
+        self,
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        """Return the code that should be put inside the Tasklet.
+
+        Note that returned code is not processed any further.
+        Thus the function has to apply literal removal on its own.
+
+        Args:
+            in_var_names:   The list of SDFG variables used as input.
+            eqn:            The equation.
+        """
+        assert in_var_names[0] is not None
+
+        in_var_name: str = in_var_names[0]
+        in_dtype = eqn.invars[0].aval.dtype
+        out_dtype = eqn.outvars[0].aval.dtype
+
+        if in_var_name is None:
+            raise NotImplementedError("'convert_element_type' is not supported for literals.")
+        if in_dtype == out_dtype:
+            # TODO(phimuell): make this into a pure Memlet such that it can be optimized away by DaCe.
+            # Believe it or not but it happens.
+            warnings.warn(
+                "convert_element_type({eqn}): is useless, because input and output have same type.",
+                stacklevel=1,  # Find a better one
+            )
+
+        # This is the base of the template that we use for conversion.
+        #  You should notice that the Tasklet `__out0 = __in0` will fail, see commit `f5aabc3` of the prototype.
+        #  Thus we have to do it in this way.
+        conv_code = "__in0"
+
+        if str(in_dtype).startswith("bool") and str(out_dtype).startswith("int"):
+            # Interestingly `__out0 = int(__in0)` will fail, Dace will optimize it away.
+            conv_code = f"(1 if {conv_code} else 0)"
+
+        # Now do the actual casting.
+        if hasattr(dace.dtypes, str(out_dtype)):
+            conv_code = f"dace.{out_dtype!s}(__in)"
+        else:
+            raise NotImplementedError(
+                f"Cannot convert '{in_dtype}' to '{out_dtype}' as this type is not known to DaCe."
+            )
+
+        # Now writing the full Tasklet, i.e. with the output.
+        return f"__out0 = {conv_code}"
diff --git a/tests/test_convert_element_type.py b/tests/test_convert_element_type.py
new file mode 100644
index 0000000..8d8a9ca
--- /dev/null
+++ b/tests/test_convert_element_type.py
@@ -0,0 +1,18 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Tests the element type conversion functionality."""
+
+from __future__ import annotations
+
+
+def test_convert_element_type_non_bool():
+    """Tests all conversions with the exception of bool as conversion target."""
+
+
+def test_convert_element_type_bool():
+    """Tests all conversions with the exception of bool as conversion target."""

From 1cd2c1c248a5623e286d9b9e75aa2b4c84699ac0 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 22 May 2024 16:45:02 +0200
Subject: [PATCH 215/458] Added all suggestions by Enrque, at least I think
 that.

---
 src/jace/__init__.py                          |   2 +-
 src/jace/jax/__init__.py                      |   2 +-
 src/jace/jax/api.py                           |  90 ++--------
 src/jace/jax/stages.py                        |  85 ++++-----
 src/jace/jax/translation_cache.py             | 167 +++++++++---------
 .../__init__.py => optimization.py}           |  14 +-
 .../translator/jaxpr_translator_driver.py     |  65 +++----
 src/jace/translator/managing.py               |  93 ++++++----
 src/jace/translator/primitive_translator.py   |  19 +-
 src/jace/translator/translated_jaxpr_sdfg.py  |   4 +-
 src/jace/util/compiling.py                    |   9 +-
 src/jace/util/jax_helper.py                   |  21 +--
 tests/test_jaxpr_translator_driver.py         |  12 +-
 13 files changed, 243 insertions(+), 340 deletions(-)
 rename src/jace/{optimization/__init__.py => optimization.py} (72%)

diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 47f74ed..aad3265 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -11,7 +11,7 @@
 
 import jax as _jax
 
-import jace.translator.primitive_translators  # noqa: F401  # needed to poulate the internal list of translators.
+import jace.translator.primitive_translators as _  # noqa: F401  # Populate the internal registry.
 
 from .__about__ import __author__, __copyright__, __license__, __version__, __version_info__
 from .jax import grad, jacfwd, jacrev, jit
diff --git a/src/jace/jax/__init__.py b/src/jace/jax/__init__.py
index 47bb219..f4df884 100644
--- a/src/jace/jax/__init__.py
+++ b/src/jace/jax/__init__.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""This package mimics parts of the interface of the `jax` package that is supported by JaCe."""
+"""This package mimics the `jax` functions and features supported by JaCe."""
 
 from __future__ import annotations
 
diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
index 7dc27f5..a46702b 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/jax/api.py
@@ -9,33 +9,30 @@
 
 from __future__ import annotations
 
-import functools as ft
+import functools
 from collections.abc import Callable, Mapping
-from typing import TYPE_CHECKING, Any, Literal, overload
+from typing import Any, Literal, overload
 
-import jax as _jax_jax
+from jax import grad, jacfwd, jacrev
 
 from jace import translator
-
-
-if TYPE_CHECKING:
-    from jace.jax import stages
+from jace.jax import stages
 
 
 @overload
 def jit(
     fun: Literal[None] = None,
     /,
-    sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable] | None = None,
+    sub_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> Callable[..., stages.JaceWrapped]: ...
+) -> Callable[[Callable], stages.JaceWrapped]: ...
 
 
 @overload
 def jit(
     fun: Callable,
     /,
-    sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable] | None = None,
+    sub_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
 ) -> stages.JaceWrapped: ...
 
@@ -43,9 +40,9 @@ def jit(
 def jit(
     fun: Callable | None = None,
     /,
-    sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable] | None = None,
+    sub_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> stages.JaceWrapped | Callable[..., stages.JaceWrapped]:
+) -> stages.JaceWrapped | Callable[[Callable], stages.JaceWrapped]:
     """Jace's replacement for `jax.jit` (just-in-time) wrapper.
 
     It works the same way as `jax.jit` does, but instead of using XLA the computation is lowered to DaCe.
@@ -57,17 +54,15 @@ def jit(
 
     Notes:
         If no subtranslators are specified then the ones that are currently active,
-            i.e. the output of `get_regsitered_primitive_translators()`, are used.
-            After construction changes to the passed `sub_translators` have no effect on the returned object.
+        i.e. the output of `get_regsitered_primitive_translators()`, are used.
+        After construction changes to the passed `sub_translators` have no effect on the returned object.
     """
-    if len(kwargs) != 0:
+    if kwargs:
         raise NotImplementedError(
             f"The following arguments of 'jax.jit' are not yet supported by jace: {', '.join(kwargs.keys())}."
         )
 
     def wrapper(f: Callable) -> stages.JaceWrapped:
-        from jace import jax as stages  # Cyclic import
-
         jace_wrapper = stages.JaceWrapped(
             fun=f,
             sub_translators=(
@@ -77,61 +72,14 @@ def wrapper(f: Callable) -> stages.JaceWrapped:
             ),
             jit_ops=kwargs,
         )
-        return ft.wraps(f)(jace_wrapper)
+        return functools.update_wrapper(jace_wrapper, f)
 
     return wrapper if fun is None else wrapper(fun)
 
 
-def vmap(
-    fun: Callable,
-    /,
-    **kwargs: Any,
-) -> stages.JaceWrapped:
-    """Jace wrapper around `jax.vmap`.
-
-    Notes:
-        Currently that is an untested extension.
-    """
-    import warnings
-
-    warnings.warn(
-        "You are using the highly untested 'vamp' interface.",
-        stacklevel=2,
-    )
-    return _jax_jax.vmap(
-        fun,
-        **kwargs,
-    )
-
-
-def grad(
-    fun: Callable | None = None,
-    /,
-    **kwargs: Any,
-) -> Callable:
-    """Jace wrapper for `jax.grad`.
-
-    Notes:
-        Note we can not put it into a `JaceWrapped` object because in autodiff mode
-            control primitives, such as `if` are allowed, but not in `jit`.
-            Thus there need to be this extra layer.
-    """
-    return _jax_jax.grad(fun, **kwargs)
-
-
-def jacfwd(
-    fun: Callable | None = None,
-    /,
-    **kwargs: Any,
-) -> Callable:
-    """Jace wrapper around `jax.jacfwd`."""
-    return _jax_jax.jacfwd(fun, **kwargs)
-
-
-def jacrev(
-    fun: Callable | None = None,
-    /,
-    **kwargs: Any,
-) -> Callable:
-    """Jace wrapper around `jax.jacrev`."""
-    return _jax_jax.jacrev(fun, **kwargs)
+__all__ = [
+    "grad",
+    "jit",
+    "jacfwd",
+    "jacrev",
+]
diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
index ce0ef48..038b66d 100644
--- a/src/jace/jax/stages.py
+++ b/src/jace/jax/stages.py
@@ -24,11 +24,11 @@
 from __future__ import annotations
 
 import copy
-from collections.abc import Callable, Mapping, Sequence
+from collections.abc import Callable, Hashable, Mapping, Sequence
 from typing import Any, Final, TypeAlias
 
 import dace
-import jax as jax_jax
+import jax as _jax
 
 from jace import optimization, translator, util
 from jace.jax import translation_cache as tcache
@@ -36,22 +36,12 @@
 from jace.util import dace_helper as jdace
 
 
-class Stage:
-    """A distinct step in the compilation chain, see module description for more.
+# TODO(phimuell): Turn this into `TypedDict` thing.
+#: Map type to pass compiler options to `JaceLowered.compile()`.
+CompilerOptions: TypeAlias = dict[str, bool | str]
 
-    The concrete steps are implemented in:
-    - JaceWrapped
-    - JaceLowered
-    - JaceCompiled
-    """
-
-
-"""Map type to pass compiler options to `JaceLowered.compile()`.
-"""
-CompilerOptions: TypeAlias = dict[str, tuple[bool, str]]
 
-
-class JaceWrapped(Stage):
+class JaceWrapped(tcache.CachingStage):
     """A function ready to be specialized, lowered, and compiled.
 
     This class represents the output of functions such as `jace.jit()`.
@@ -61,22 +51,20 @@ class JaceWrapped(Stage):
     You should not create `JaceWrapped` instances directly, instead you should use `jace.jit`.
 
     Todo:
-        Handles pytrees.
-        Copy the `jax._src.pjit.make_jit()` functionality to remove `jax.make_jaxpr()`.
+        - Handle pytrees.
     """
 
     _fun: Callable
-    _sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable]
-    _jit_ops: Mapping[str, Any]
-    _cache: tcache.TranslationCache
+    _sub_translators: dict[str, translator.PrimitiveTranslator]
+    _jit_ops: dict[str, Any]
 
     def __init__(
         self,
         fun: Callable,
-        sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable],
+        sub_translators: Mapping[str, translator.PrimitiveTranslator],
         jit_ops: Mapping[str, Any],
     ) -> None:
-        """Creates a wrapped jace jitable object of `jax_prim`.
+        """Creates a wrapped jitable object of `fun`.
 
         You should not create `JaceWrapped` instances directly, instead you should use `jace.jit`.
 
@@ -84,17 +72,14 @@ def __init__(
             fun:                The function that is wrapped.
             sub_translators:    The list of subtranslators that that should be used.
             jit_ops:            All options that we forward to `jax.jit`.
-
-        Notes:
-            Both the `sub_translators` and `jit_ops` are shallow copied.
         """
+        super().__init__()
         # We have to shallow copy both the translator and the jit options.
         #  This prevents that any modifications affect `self`.
         #  Shallow is enough since the translators themselves are immutable.
         self._sub_translators = dict(sub_translators)
         self._jit_ops = dict(jit_ops)
         self._fun = fun
-        self._cache = tcache.get_cache(self)
 
     def __call__(
         self,
@@ -141,7 +126,7 @@ def lower(
         if not all((not util.is_array(arg)) or arg.flags["C_CONTIGUOUS"] for arg in args):
             raise NotImplementedError("Currently can not handle strides beside 'C_CONTIGUOUS'.")
 
-        jaxpr = jax_jax.make_jaxpr(self._fun)(*args)
+        jaxpr = _jax.make_jaxpr(self._fun)(*args)
         driver = translator.JaxprTranslationDriver(sub_translators=self._sub_translators)
         trans_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
         ptrans.postprocess_jaxpr_sdfg(tsdfg=trans_sdfg, fun=self.wrapped_fun)
@@ -153,7 +138,7 @@ def wrapped_fun(self) -> Callable:
         """Returns the wrapped function."""
         return self._fun
 
-    def _make_call_decscription(
+    def _make_call_description(
         self,
         *args: Any,
     ) -> tcache.CachedCallDescription:
@@ -163,21 +148,24 @@ def _make_call_decscription(
         The function will fully abstractify its input arguments.
         This function is used by the cache to generate the key.
         """
-        fargs = tuple(tcache._AbstarctCallArgument.from_value(x) for x in args)
+        fargs = tuple(tcache._AbstractCallArgument.from_value(x) for x in args)
         return tcache.CachedCallDescription(stage_id=id(self), fargs=fargs)
 
 
-class JaceLowered(Stage):
-    """Represents the original computation that was lowered to SDFG."""
+class JaceLowered(tcache.CachingStage):
+    """Represents the original computation that was lowered to SDFG.
 
-    DEF_COMPILER_OPTIONS: Final[dict[str, Any]] = {
+    Todo:
+        - Handle pytrees.
+    """
+
+    DEF_COMPILER_OPTIONS: Final[CompilerOptions] = {
         "auto_optimize": True,
         "simplify": True,
     }
 
     # `self` assumes complete ownership of the
     _trans_sdfg: translator.TranslatedJaxprSDFG
-    _cache: tcache.TranslationCache
 
     def __init__(
         self,
@@ -190,8 +178,8 @@ def __init__(
             raise ValueError("Input names must be defined.")
         if trans_sdfg.out_names is None:
             raise ValueError("Output names must be defined.")
+        super().__init__()
         self._trans_sdfg = trans_sdfg
-        self._cache = tcache.get_cache(self)
 
     @tcache.cached_translation
     def compile(
@@ -207,7 +195,7 @@ def compile(
 
         Notes:
             I am pretty sure that `None` in Jax means "use the default option".
-                See also `CachedCallDescription.make_call_description()`.
+            See also `CachedCallDescription.make_call_description()`.
         """
         # We **must** deepcopy before we do any optimization.
         #  There are many reasons for this but here are the most important ones:
@@ -218,16 +206,17 @@ def compile(
         #  However, if we would now call `jaceWrappedObject.lower()` (with the same arguments as before), we should get `jaceLoweredObject`,
         #  since it was cached, but it would actually contain an already optimized SDFG, which is not what we want.
         #  If you think you can remove this line then do it and run `tests/test_decorator.py::test_decorator_sharing`.
-        fsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._trans_sdfg)
+        tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._trans_sdfg)
         optimization.jace_optimize(
-            fsdfg, **(self.DEF_COMPILER_OPTIONS if compiler_options is None else compiler_options)
+            tsdfg=tsdfg,
+            **(self.DEF_COMPILER_OPTIONS if compiler_options is None else compiler_options),  # type: ignore[arg-type]  # type confusion.
         )
-        csdfg: jdace.CompiledSDFG = util.compile_jax_sdfg(fsdfg)
+        csdfg: jdace.CompiledSDFG = util.compile_jax_sdfg(tsdfg)
 
         return JaceCompiled(
             csdfg=csdfg,
-            inp_names=fsdfg.inp_names,
-            out_names=fsdfg.out_names,
+            inp_names=tsdfg.inp_names,
+            out_names=tsdfg.out_names,
         )
 
     def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
@@ -254,7 +243,7 @@ def as_sdfg(self) -> dace.SDFG:
         """
         return self.compiler_ir().sdfg
 
-    def _make_call_decscription(
+    def _make_call_description(
         self,
         compiler_options: CompilerOptions | None = None,
     ) -> tcache.CachedCallDescription:
@@ -267,7 +256,7 @@ def _make_call_decscription(
         if compiler_options is None:  # Must be the same as in `compile()`!
             compiler_options = self.DEF_COMPILER_OPTIONS
         assert isinstance(compiler_options, dict)
-        fargs: tuple[tuple[str, tcache._ConcreteCallArgument], ...] = tuple(
+        fargs: tuple[tuple[str, Hashable], ...] = tuple(
             sorted(
                 ((argname, argvalue) for argname, argvalue in compiler_options.items()),
                 key=lambda X: X[0],
@@ -276,13 +265,11 @@ def _make_call_decscription(
         return tcache.CachedCallDescription(stage_id=id(self), fargs=fargs)
 
 
-class JaceCompiled(Stage):
+class JaceCompiled:
     """Compiled version of the SDFG.
 
-    Contains all the information to run the associated computation.
-
     Todo:
-        Handle pytrees.
+        - Handle pytrees.
     """
 
     _csdfg: jdace.CompiledSDFG  # The compiled SDFG object.
@@ -316,6 +303,10 @@ def __call__(
         )
 
 
+#: Known compilation stages in Jace.
+Stage = JaceWrapped | JaceLowered | JaceCompiled
+
+
 __all__ = [
     "Stage",
     "CompilerOptions",
diff --git a/src/jace/jax/translation_cache.py b/src/jace/jax/translation_cache.py
index 267b7f9..be4b0a2 100644
--- a/src/jace/jax/translation_cache.py
+++ b/src/jace/jax/translation_cache.py
@@ -16,12 +16,12 @@
 
 from __future__ import annotations
 
-import functools as ft
-from abc import abstractmethod
-from collections import OrderedDict
-from collections.abc import Callable
-from dataclasses import dataclass
-from typing import TYPE_CHECKING, Any, Final, Protocol, TypeAlias, runtime_checkable
+import abc
+import collections
+import dataclasses
+import functools
+from collections.abc import Callable, Hashable
+from typing import TYPE_CHECKING, Any, Final, TypeAlias
 
 import dace
 from jax import core as jax_core
@@ -36,43 +36,58 @@
 _DEF_CACHE_SIZE: Final[int] = 256
 
 # This are the caches that we are using.
-_TRANSLATION_CACHES: dict[type[stages.Stage], TranslationCache] = {}
+_TRANSLATION_CACHES: dict[type[CachingStage], TranslationCache] = {}
 
 
-def cached_translation(
-    action: Callable,
-) -> Callable:
-    """Decorator for making the transfer method, i.e. `JaceWrapped.lower()` and `JaceLowered.compile()` cacheable.
+class CachingStage:
+    """Annotates a stage whose transition to the next one is cacheable.
+
+    This transitions are mainly `JaceWrapped.lower()` and `JaceLowered.compile()` calls.
+    To make a stage cacheable annotate the transition function with the `@cached_translation` decorator.
+
+    Todo:
+        - Make a generic to indicate what the result stage is.
+    """
+
+    _cache: TranslationCache
+
+    def __init__(self) -> None:
+        self._cache = get_cache(self)
+
+    @abc.abstractmethod
+    def _make_call_description(
+        self: CachingStage,
+        *args: Any,
+        **kwargs: Any,
+    ) -> CachedCallDescription:
+        """Generates the key that is used to store/locate the call in the cache."""
+        ...
 
-    The main issue is that we can not simply cache on the actual arguments we pass to them, but on an abstract
-    (or concrete; static arguments + compiling) description on them, and this is what this decorator is for.
-    Based on its argument it will generate a key of the call, see `TranslationCache.make_key()` for more.
-    Then it will check if the result is known and if needed it will perform the actual call.
 
-    Beside this the function will two two things.
-    The first is, that it will set the `_cache` member of `self` to the associated cache.
-    Thus an annotated object need to define such a member.
+def cached_translation(
+    action: Callable[..., stages.Stage],
+) -> Callable:
+    """Decorator for making the transition function of the stage cacheable.
 
-    The second thing it will do is optional, if the call is not cached inside the cache the wrapped function has to be run.
-    In that case the wrapper will first check if the object defines the `_call_description` member.
-    If this is the case the wrapper will set this object to an abstract description of the call, which is also used as key in the cache.
-    After the function return this member is set to `None`.
+    The decorator will call the annotated function only if the call is not stored inside the cache.
+    The key to look up the call in the cache is computed by `self._make_call_description()`.
+    For this the stage must be derived from `CachingStage`.
     """
 
-    @ft.wraps(action)
+    @functools.wraps(action)
     def _action_wrapper(
-        self: stages.JaceWrapped | stages.JaceLowered,
+        self: CachingStage,
         *args: Any,
         **kwargs: Any,
     ) -> stages.Stage:
         # Get the abstract description of the call, that is used as key.
-        key: CachedCallDescription = self._make_call_decscription(*args, **kwargs)
-        if self._cache.has(key):
-            return self._cache.get(key)
+        key: CachedCallDescription = self._make_call_description(*args, **kwargs)
+        if key in self._cache:
+            return self._cache[key]
 
         # We must actually perform the call
         next_stage: stages.Stage = action(self, *args, **kwargs)
-        self._cache.add(key, next_stage)
+        self._cache[key] = next_stage
         return next_stage
 
     return _action_wrapper
@@ -84,7 +99,7 @@ def clear_translation_cache() -> None:
 
 
 def get_cache(
-    stage: stages.Stage,
+    stage: CachingStage,
 ) -> TranslationCache:
     """Returns the cache that is used for `stage`."""
     # The caches are per stage and not per instance basis
@@ -94,8 +109,8 @@ def get_cache(
     return _TRANSLATION_CACHES[tstage]
 
 
-@dataclass(init=True, eq=True, frozen=True)
-class _AbstarctCallArgument:
+@dataclasses.dataclass(frozen=True)
+class _AbstractCallArgument:
     """Class to represent one argument to the call in an abstract way.
 
     It is used as part of the key in the cache.
@@ -112,12 +127,11 @@ class _AbstarctCallArgument:
     def from_value(
         cls,
         val: Any,
-    ) -> _AbstarctCallArgument:
-        """Construct an `_AbstarctCallArgument` from a value.
+    ) -> _AbstractCallArgument:
+        """Construct an `_AbstractCallArgument` from a value.
 
         Todo:
-            Improve, such that NumPy arrays are on CPU, CuPy on GPU and so on.
-            This function also probably fails for scalars.
+            Handle storage location of arrays correctly.
         """
         if not util.is_fully_addressable(val):
             raise NotImplementedError("Distributed arrays are not addressed yet.")
@@ -130,7 +144,7 @@ def from_value(
             shape = val.shape
             dtype = util.translate_dtype(val.dtype)
             strides = getattr(val, "strides", None)
-            # TODO(phimuell): is `CPU_Heap` always okay? There would also be `CPU_Pinned`.
+            # Is `CPU_Heap` always okay? There would also be `CPU_Pinned`.
             storage = (
                 dace.StorageType.GPU_Global if util.is_on_device(val) else dace.StorageType.CPU_Heap
             )
@@ -141,7 +155,7 @@ def from_value(
             shape = ()
             dtype = util.translate_dtype(type(val))
             strides = None
-            # Lets pretend that scalars are always on the CPU, which is a fair assumption.
+            # Scalar arguments are always on the CPU and never on the GPU.
             storage = dace.StorageType.CPU_Heap
 
             return cls(shape=shape, dtype=dtype, strides=strides, storage=storage)
@@ -149,51 +163,34 @@ def from_value(
         raise TypeError(f"Can not make 'an abstract description from '{type(val).__name__}'.")
 
 
-@runtime_checkable
-class _ConcreteCallArgument(Protocol):
-    """Type for encoding a concrete arguments in the cache."""
-
-    @abstractmethod
-    def __hash__(self) -> int:
-        pass
-
-    @abstractmethod
-    def __eq__(self, other: Any) -> bool:
-        pass
-
-
-"""This type is the abstract description of a function call.
-It is part of the key used in the cache.
-"""
+#: This type is the abstract description of a function call.
+#:  It is part of the key used in the cache.
 CallArgsDescription: TypeAlias = tuple[
-    _AbstarctCallArgument
-    | _ConcreteCallArgument
-    | tuple[str, _AbstarctCallArgument]
-    | tuple[str, _ConcreteCallArgument],
+    _AbstractCallArgument | Hashable | tuple[str, _AbstractCallArgument | Hashable],
     ...,
 ]
 
 
-@dataclass(init=True, eq=True, frozen=True)
+@dataclasses.dataclass(frozen=True)
 class CachedCallDescription:
-    """Represents the structure of the entire call in the cache and used as key in the cache.
+    """Represents the full structure of a call in the cache as a key.
 
-    This class represents both the `JaceWrapped.lower()` and `JaceLowered.compile()` calls.
+    This class is the return type of the `CachingStage._make_call_description()` function,
+    which is used by the `@cached_translation` decorator to compute a key of transition.
+    This allows to either retrieve or then store the result of the actual call in the cache.
 
     The actual key is composed of two parts, first the "origin of the call".
     For this we just use the address of the stage object we are caching and hope that the
     address is not reused for another stag anytime soon.
 
     The second part is of the key are a description of the actual arguments, see `CallArgsDescription` type alias.
-    There are two ways for describing the arguments:
-    - `_AbstarctCallArgument`: Which encode only the structure of the arguments.
-        These are essentially the tracer used by Jax.
-    - `_ConcreteCallArgument`: Which represents actual values of the call.
-        These are either the static arguments or compile options.
-
-    While `JaceWrapped.lower()` uses both, `JaceLowered.compile()` will only use concrete arguments.
-    In addition an argument can be positional or a named argument,
-    in which case it consists of a `tuple[str, _AbstarctCallArgument  | _ConcreteCallArgument]`.
+    For this the `_make_call_description()` method of the stage is used.
+    The arguments can be described in two different ways:
+    - Abstract description: In this way, the actual value of the argument is irrelevant,
+        only the structure of them are important, this is similar to the tracers used in Jax.
+    - Concrete description: Here one caches on the actual value of the argument,
+        which is similar to static arguments in Jax.
+        The only restriction is that they are hash able.
 
     Notes:
         The base assumption is that the stages are immutable.
@@ -208,19 +205,15 @@ class CachedCallDescription:
 
 
 class TranslationCache:
-    """The _internal_ cache object.
-
-    It implements a simple LRU cache, for storing the results of the `JaceWrapped.lower()` and `JaceLowered.compile()` calls.
-    You should not use this cache directly but instead use the `cached_translation` decorator.
+    """The cache object used to cache the stage transitions.
 
     Notes:
-        The most recently used entry is at the end of the `OrderedDict`.
-            The reason for this is, because there the new entries are added.
+        The most recently used entry is at the end of the `OrderedDict`, because it puts new entries there.
     """
 
-    __slots__ = ["_memory", "_size"]
+    __slots__ = ("_memory", "_size")
 
-    _memory: OrderedDict[CachedCallDescription, stages.Stage]
+    _memory: collections.OrderedDict[CachedCallDescription, stages.Stage]
     _size: int
 
     def __init__(
@@ -233,17 +226,17 @@ def __init__(
         """
         if size <= 0:
             raise ValueError(f"Invalid cache size of '{size}'")
-        self._memory: OrderedDict[CachedCallDescription, stages.Stage] = OrderedDict()
+        self._memory = collections.OrderedDict()
         self._size = size
 
-    def has(
+    def __contains__(
         self,
         key: CachedCallDescription,
     ) -> bool:
         """Check if `self` have a record of `key`."""
         return key in self._memory
 
-    def get(
+    def __getitem__(
         self,
         key: CachedCallDescription,
     ) -> stages.Stage:
@@ -253,18 +246,18 @@ def get(
             It is an error if `key` does not exist.
             This function will mark `key` as most recently used.
         """
-        if not self.has(key):
+        if key not in self:
             raise KeyError(f"Key '{key}' is unknown.")
         self._memory.move_to_end(key, last=True)
         return self._memory[key]
 
-    def add(
+    def __setitem__(
         self,
         key: CachedCallDescription,
         res: stages.Stage,
     ) -> TranslationCache:
-        """Adds `res` under `key` to `self`."""
-        if self.has(key):
+        """Adds or update `key` to map to `res`."""
+        if key in self:
             # `key` is known, so move it to the end and update the mapped value.
             self._memory.move_to_end(key, last=True)
             self._memory[key] = res
@@ -272,11 +265,11 @@ def add(
         else:
             # `key` is not known so we have to add it
             while len(self._memory) >= self._size:
-                self._evict(None)
+                self.popitem(None)
             self._memory[key] = res
         return self
 
-    def _evict(
+    def popitem(
         self,
         key: CachedCallDescription | None,
     ) -> None:
@@ -288,7 +281,7 @@ def _evict(
             return
         if key is None:
             self._memory.popitem(last=False)
-        elif self.has(key):
+        elif key in self:
             self._memory.move_to_end(key, last=False)
             self._memory.popitem(last=False)
 
diff --git a/src/jace/optimization/__init__.py b/src/jace/optimization.py
similarity index 72%
rename from src/jace/optimization/__init__.py
rename to src/jace/optimization.py
index f841b62..c875009 100644
--- a/src/jace/optimization/__init__.py
+++ b/src/jace/optimization.py
@@ -7,7 +7,7 @@
 
 """Module that will host all optimization functions specific to Jace.
 
-Currently it is just a dummy that exports some functions that do nothing.
+Currently just a dummy existing for the sake of providing some callable function.
 """
 
 from __future__ import annotations
@@ -17,9 +17,8 @@
 
 def jace_optimize(
     tsdfg: translator.TranslatedJaxprSDFG,
-    simplify: bool = False,
+    simplify: bool = True,
     auto_optimize: bool = False,
-    **kwargs: str | bool,  # noqa: ARG001  # Unused argument, for now
 ) -> None:
     """Performs optimization of the `fsdfg` _inplace_.
 
@@ -29,10 +28,6 @@ def jace_optimize(
     Args:
         simplify:       Run the simplification pilepline.
         auto_optimize:  Run the auto optimization pipeline (currently does nothing)
-
-    Notes:
-        All optimization flags must be disabled by default!
-            The reason for this is that `jaceLowered.compile({})` will disable all optimizations.
     """
     if not tsdfg.is_finalized:
         raise ValueError("Can only optimize finalized SDFGs.")
@@ -44,8 +39,3 @@ def jace_optimize(
         pass
 
     tsdfg.validate()
-
-
-__all__ = [
-    "jace_auto_optimize",
-]
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index ab7d905..77da631 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -53,15 +53,14 @@ class JaxprTranslationDriver:
 
     Notes:
         After the main translation has been performed the translator object can be used again.
-        Currently the driver will generate only Array as SDFG variables, however, this is a temporary solution.
-            For more on that see `add_array()`.
+        Currently the driver will generate only Array as SDFG variables, however, this is a temporary solution, see `add_array()`.
     """
 
-    __slots__ = (
-        "_ctx_stack",  # Stack of all contexts
-        "_sub_translators",
-        "_jax_name_map",
-    )
+    __slots__ = ("_ctx_stack", "_sub_translators", "_jax_name_map")
+
+    _sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable]
+    _jax_name_map: dict[jax_core.Var | util.JaCeVar, str]
+    _ctx_stack: list[translator.TranslatedJaxprSDFG]
 
     def __init__(
         self,
@@ -73,28 +72,24 @@ def __init__(
             sub_translators:    Use these subtranslators to perform the translation.
 
         Notes:
-            `sub_translators` is not copied, thus the user has to guarantee,
-                that it will not change during translation.
-                It is highly advised but not required to use the output of
-                `get_regsitered_primitive_translators()` or pass a copy as argument.
+            `sub_translators` is not copied, however, the user has to guarantee, that it does not change during the lifetime of `self`.
         """
 
         # Maps the name of a Jax primitive to the primitive translator that should be used.
         #  Note that the subtranslator is only required to be a callable, and immutable.
-        #  Allocated through the lifetime of `self`, and shared with the outside.
-        self._sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable] = (
-            sub_translators
-        )
+        #  User has to ensure that it does not change.
+        self._sub_translators = sub_translators
 
         # Maps Jax variables to the name of its SDFG equivalent.
         #  Note that it is shared among all translation contexts.
         #  This is done to create consistency between SDFG variables
         #  and the names used pretty printed Jaxprs.
-        self._jax_name_map: dict[jax_core.Var | util.JaCeVar, str] = {}
+        self._jax_name_map = {}
 
         # Context stack and current context.
         #  If it is empty, then no translation process is in process.
-        self._ctx_stack: list[translator.TranslatedJaxprSDFG] = []
+        #  If there is one entry, `self` is the root translator.
+        self._ctx_stack = []
 
     def translate_jaxpr(
         self,
@@ -334,11 +329,11 @@ def add_array(
 
         Notes:
             Currently the function will always create an Array, even if the Jax variable refers to a scalar.
-                This is done to work around some difficulties with scalar return values and so on.
-                This issue should actually handled in the post processing stage, but currently it is not.
-                However, from a point of building an SDFG manually, there is no difference between a Scalar and an Array.
-                According to the dace developer, the majority of the backend, i.e. optimization pipeline, should be handle to handle it.
-                But there are some special parts that might explicitly want a scalar, it also might block certain compiler optimization.
+            This is done to work around some difficulties with scalar return values and so on.
+            This issue should actually handled in the post processing stage, but currently it is not.
+            However, from a point of building an SDFG manually, there is no difference between a Scalar and an Array.
+            According to the dace developer, the majority of the backend, i.e. optimization pipeline, should be handle to handle it.
+            But there are some special parts that might explicitly want a scalar, it also might block certain compiler optimization.
         """
         shape: tuple[int | dace.symbol | str, ...] = util.get_jax_var_shape(arg)
         dtype: dace.typeclass = util.get_jax_var_dtype(arg)
@@ -430,7 +425,7 @@ def create_jax_var_list(  # type: ignore[misc]
             kwargs:             Will be forwarded to `self.add_array()` in case a variable is created.
 
         Todo:
-            Rollback if the creation fails.
+            - Rollback if the creation fails.
         """
         if only_creation and prevent_creation:
             raise ValueError("Specified both 'only_creation' and 'prevent_creation'.")
@@ -459,13 +454,7 @@ def _create_initial_input(
         self,
         jaxpr: jax_core.ClosedJaxpr,
     ) -> Sequence[str]:
-        """This function will create the internal input variables that are used for the SDFG.
-
-        Args:
-            jaxpr:                  The Jaxpr that we want to translate.
-
-        Returns:
-            The list of SDFG variables used as input arguments of `jaxpr` in the same order.
+        """Creates the input variables of `jaxpr` and return a list of their SDFG names.
 
         Notes:
             The function will populate the `inp_names` member of the current context.
@@ -493,13 +482,10 @@ def _create_constants(
         self,
         jaxpr: jax_core.ClosedJaxpr,
     ) -> Sequence[str]:
-        """Creates all constants requested by the `jaxpr`.
+        """Creates all constants requested by the `jaxpr` and return a list with their SDFG names.
 
         The function will create an SDFG variable and add them as constant to the SDFG.
         The value they should have is deepcopied.
-
-        Returns:
-            Names of the SDFG variables created for the constants in the same order.
         """
         from copy import deepcopy
 
@@ -527,8 +513,8 @@ def _allocate_translation_ctx(
     ) -> JaxprTranslationDriver:
         """This function allocates and initialize the members of the translation context of `self`.
 
-        If this function is called and `self` is already allocated, the function will create a new context.
-        This allows the driver to handle nested Jaxpr.
+        If this function is called and `self` is already allocated, the function will create a new context,
+        allowing the driver to handle nested Jaxpr.
         The first context that is created is also known as root translator.
 
         Args:
@@ -561,7 +547,6 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
         Notes:
             While it is allowed for outside code to call this function explicit it is is most likely an error.
             If `self` is not allocated this function acts as a noops.
-            If `self` is a root translator, then the function will also deallocate the shared state of `self`.
         """
         if not self.is_allocated():
             return self
@@ -581,7 +566,7 @@ def _translate_single_eqn(
     ) -> tuple[Sequence[str | None], Sequence[str]]:
         """Translate `eqn` into its SDFG equivalent.
 
-        To do this the function will do the following steps:
+        To do this the function will perform the following steps:
         - Assemble the in and output variables.
         - Select the appropriate subtranslator to use.
         - Create a new empty state terminal state.
@@ -671,9 +656,7 @@ def _translate_jaxpr_internal(
             jaxpr:      The Jaxpr to translate.
 
         Notes:
-            The function will unconditionally handle empty Jaxpr.
-            Equations that store into drop variables, i.e. with name `_`, will be skipped.
-                Jax used such variables to indicate that it is not needed, transformations such as `grad` include them.
+            Equations that store into drop variables, i.e. with name `_`, will be ignored.
         """
         nb_translated_eqn: int = 0
         out_var_names: Sequence[str] = ()
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index 1f16641..b235bb9 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -13,71 +13,86 @@
 
 from __future__ import annotations
 
-from collections.abc import Callable, Mapping
-from typing import TYPE_CHECKING, cast
+from collections.abc import Callable, Mapping, MutableMapping
+from typing import TYPE_CHECKING, Literal, cast, overload
 
 
 if TYPE_CHECKING:
     from jace import translator
 
 # These are the currently active primitive translators of JaCe.
-_PRIMITIVE_TRANSLATORS_DICT: dict[str, translator.PrimitiveTranslatorCallable] = {}
+_PRIMITIVE_TRANSLATORS_DICT: dict[str, translator.PrimitiveTranslator] = {}
 
 
-def register_primitive_translator(
-    prim_translator: translator.PrimitiveTranslator
-    | translator.PrimitiveTranslatorCallable
-    | None = None,
-    *,
-    primitive: str | None = None,
-    overwrite: bool = False,
+@overload
+def make_primitive_translator(
+    primitive: str,
+    prim_translator: Literal[None] = None,
+) -> Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]: ...
+
+
+@overload
+def make_primitive_translator(
+    primitive: str, prim_translator: translator.PrimitiveTranslatorCallable
+) -> translator.PrimitiveTranslator: ...
+
+
+def make_primitive_translator(
+    primitive: str,
+    prim_translator: translator.PrimitiveTranslatorCallable | None = None,
 ) -> (
-    translator.PrimitiveTranslator
-    | Callable[
-        [translator.PrimitiveTranslator | translator.PrimitiveTranslatorCallable],
-        translator.PrimitiveTranslator,
-    ]
+    Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]
+    | translator.PrimitiveTranslator
 ):
-    """Adds the primitive translator `prim_translator` to Jace's internal list of translators.
+    """Decorator to turn a Callable into a `PrimitiveTranslator` for primitive `primitive`.
+
+    This function can be used to decorate functions that should serve as primitive translators.
+    Essentially, the decorator adds a `primitive` property to the decorated function and returns it.
+    However, this function does not register the primitive into the global registry,
+    for this you have to use `register_primitive_translator()`.
+    """
+
+    def wrapper(
+        prim_translator: translator.PrimitiveTranslatorCallable,
+    ) -> translator.PrimitiveTranslator:
+        if getattr(prim_translator, "primitive", primitive) != primitive:
+            raise ValueError(
+                f"Tried to change the 'primitive' property of '{prim_translator}' from '{prim_translator.primitive}' to '{primitive}'."  # type: ignore[attr-defined]
+            )
+        prim_translator.primitive = primitive  # type: ignore[attr-defined]  # we add the attribute, so it is not defined yet.
+        return cast(translator.PrimitiveTranslator, prim_translator)
+
+    return wrapper if prim_translator is None else wrapper(prim_translator)
+
+
+def register_primitive_translator(
+    prim_translator: translator.PrimitiveTranslator,
+    overwrite: bool = False,
+) -> translator.PrimitiveTranslator:
+    """Adds the primitive translator to Jace's internal list of translators and return it again.
 
     If the primitive is already known an error is generated, if `overwrite` is set, it will be replaced.
+    To add a `primitive` property use the `@make_primitive_translator` decorator.
 
     Args:
         prim_translator:    The primitive translator to annotate.
-        primitive:          Name of the primitive `prim_translator` is handled.
-                                If not given will use `prim_translator.primitive`.
         overwrite:          Replace the current primitive translator with `prim_translator`.
-
-    Notes:
-        Can only be used to register instances.
     """
-    from jace import translator
 
     def wrapper(
-        prim_translator: translator.PrimitiveTranslator | translator.PrimitiveTranslatorCallable,
+        prim_translator: translator.PrimitiveTranslator,
     ) -> translator.PrimitiveTranslator:
-        if not hasattr(prim_translator, "primitive"):
-            if not primitive:
-                raise ValueError(f"Missing primitive name for '{prim_translator}'")
-            prim_translator.primitive = primitive  # type: ignore[attr-defined]
-        elif (primitive is not None) and (prim_translator.primitive != primitive):
-            raise TypeError(
-                f"Translator's primitive '{prim_translator.primitive}' doesn't match the supplied '{primitive}'."
-            )
-
         if prim_translator.primitive in _PRIMITIVE_TRANSLATORS_DICT and not overwrite:
             raise ValueError(
                 f"Explicit override=True needed for primitive '{prim_translator.primitive}' to overwrite existing one."
             )
         _PRIMITIVE_TRANSLATORS_DICT[prim_translator.primitive] = prim_translator
-
-        # We add a `.primitive` property, thus it is for sure now no longer just a `PrimitiveTranslatorCallable`.
-        return cast(translator.PrimitiveTranslator, prim_translator)
+        return prim_translator
 
     return wrapper if prim_translator is None else wrapper(prim_translator)
 
 
-def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTranslatorCallable]:
+def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTranslator]:
     """Returns a view of the _currently_ active set of installed primitive translators in Jace.
 
     The returned mapping represents the active primitive translators at the time of calling.
@@ -87,12 +102,12 @@ def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTran
 
 
 def set_active_primitive_translators_to(
-    new_translators: Mapping[str, translator.PrimitiveTranslatorCallable],
-) -> Mapping[str, translator.PrimitiveTranslatorCallable]:
+    new_translators: Mapping[str, translator.PrimitiveTranslator],
+) -> MutableMapping[str, translator.PrimitiveTranslator]:
     """Exchange the currently active subtranslators in Jace with `new_translators` and returns the previous ones.
 
     This function allows you to restore a specific state that was obtained by a previous call to `get_regsitered_primitive_translators()`.
-    The function is mainly intended for debugging.
+    While the function returns a mutable object, any changes to the returned object have no effect on the global state of the registry.
     """
     global _PRIMITIVE_TRANSLATORS_DICT
     assert all(getattr(trans, "primitive", prim) for prim, trans in new_translators.items())
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index 6c350f0..df52f90 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -28,19 +28,12 @@
 
 
 class PrimitiveTranslatorCallable(Protocol):
-    """Interface for all Jax primitive translators, also known as subtranslator.
+    """Callable version of the primitive translators.
 
-    A translator for a primitive translates a single equation of a Jaxpr into its SDFG equivalent.
-    For satisfying this interface a concrete implementation must be immutable after construction.
+    Used for type annotation purposes, classes should be derived from `PrimitiveTranslator` instead.
 
-    Subtranslators are simple, but highly specialized objects that are only able to perform the translation of a single primitive.
-    The overall translation process itself is managed by a driver object, which also owns and manage the subtranslators.
-    In the end this implements the delegation pattern.
-
-    You can use `jace.translator.add_subtranslator()` to register your translator to Jace.
-
-    Notes:
-        Primitive translators that are implemented as a class, should be derived from `PrimitiveTranslator`.
+    Todo:
+        - This split information `__call__()` should be documented in `PrimitiveTranslator` instead and not here.
     """
 
     __slots__ = ()
@@ -111,10 +104,6 @@ class PrimitiveTranslator(PrimitiveTranslatorCallable, Protocol):
     In the end this implements the delegation pattern.
 
     You can use `jace.translator.add_subtranslator()` to register your translator to Jace.
-
-    Notes:
-        The main difference to to `PrimitiveTranslatorCallable` is that this interface specifies the `primitive` property.
-            Thus, it must not be specified during registration.
     """
 
     __slots__ = ()
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index eae6292..1d08fce 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -51,12 +51,10 @@ def __init__(
         """Initializes the context.
 
         The function allocates the SDFG and initializes the members properly.
+        However, a user should never call this function directly.
 
         Args:
             name:       Name of the SDFG object.
-
-        Notes:
-            A user should never need to call this function.
         """
         if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index 31afd59..657ef30 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -86,12 +86,11 @@ def run_jax_sdfg(
         cargs:      All positional arguments of the call.
         ckwargs:    All keyword arguments of the call.
 
-    Notes:
+    Note:
         There is no pytree mechanism jet, thus the return values are returned inside a `tuple`
-            or in case of one value, directly, in the order determined by Jax.
-        Currently, this function does not consider strides in the input,
-            all input must be `C_CONTIGUOUS`.
-        Currently the SDFG must not have any undefined symbols, i.e. no undefined sizes.
+        or in case of one value, directly, in the order determined by Jax.
+        Currently, this function does not consider strides in the input, all input must be `C_CONTIGUOUS`.
+        Currently, the SDFG must not have any undefined symbols, i.e. no undefined sizes.
     """
     from jace import util
 
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 01eaa8f..af2dce8 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -15,9 +15,9 @@
 
 from __future__ import annotations
 
+import dataclasses
 import itertools
 from collections.abc import Mapping
-from dataclasses import dataclass
 from typing import Any
 
 import dace
@@ -28,23 +28,21 @@
 import jace.util as util
 
 
-@dataclass(repr=True, frozen=True, eq=False)
+@dataclasses.dataclass(repr=True, frozen=True, eq=False)
 class JaCeVar:
     """Replacement for the `jax.Var` class.
 
     This class can be seen as some kind of substitute `jax.core.Var`.
-    The main intention of this class is as an internal representation of values,
-    as they are used in Jax, but without the Jax machinery.
+    The main intention of this class is as an internal representation of values, as they are used in Jax, but without the Jax machinery.
     As abstract values in Jax this class has a datatype, which is a `dace.typeclass` instance and a shape.
-    In addition it has an optional name, which allows to create variables with a certain name using `JaxprTranslationDriver::add_array()`.
+    In addition it has an optional name, which allows to create variables with a certain name using `JaxprTranslationDriver.add_array()`.
 
-    Notes:
-        Main intention is to test functionality.
+    Note:
         If the name of a `JaCeVar` is '_' it is considered a drop variable.
         The definitions of `__hash__` and `__eq__` are in accordance how Jax variable works.
 
     Todo:
-        Add support for strides.
+        - Add support for strides.
     """
 
     shape: tuple[int | dace.symbol | str, ...]
@@ -78,9 +76,8 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
 
     Notes:
         If `jax_var` is a `JaCeVar` the function will return, if defined, its `.name` property.
-            Otherwise it will compose a name similar to Jax `Var` objects.
+        Otherwise it will compose a name similar to Jax `Var` objects.
         The returned names are stable, i.e. it will output the same value for the same variable.
-        The returned name passes the `util.VALID_SDFG_VAR_NAME` pattern.
     """
     match jax_var:
         case jax_core.DropVar():
@@ -191,9 +188,9 @@ def propose_jax_name(
         jax_var:        The variable for which a name to propose.
         jax_name_map:   A mapping of all Jax variables that were already named.
 
-    Notes:
+    Note:
         The function guarantees that the returned name passes `VALID_SDFG_VAR_NAME` test
-            and that the name is not part of `util.FORBIDDEN_SDFG_VAR_NAMES`.
+        and that the name is not part of `util.FORBIDDEN_SDFG_VAR_NAMES`.
         Dropped variables will always be named `'_'`.
     """
     if isinstance(jax_var, jax_core.Literal):
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 5a0aaee..96a7419 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -338,7 +338,7 @@ def test_driver_variable_invalid_prefix(
 def test_driver_variable_alloc_list(
     translation_driver: translator.JaxprTranslationDriver,
 ) -> None:
-    """Tests part of the `JaxprTranslationDriver::create_jax_var_list()` api."""
+    """Tests part of the `JaxprTranslationDriver.create_jax_var_list()` api."""
     var_list_1 = [array1, nscal, scal2]
     exp_names_1 = ["a", nscal.name, "c"]
 
@@ -365,7 +365,7 @@ def test_driver_variable_alloc_list(
 def test_driver_variable_alloc_list_cleaning(
     translation_driver: translator.JaxprTranslationDriver,
 ) -> None:
-    """Tests part of the `JaxprTranslationDriver::create_jax_var_list()` api.
+    """Tests part of the `JaxprTranslationDriver.create_jax_var_list()` api.
 
     It will fail because `update_var_mapping=False` thus the third variable will
     cause an error because it is proposed to `a`, which is already used.
@@ -386,7 +386,7 @@ def test_driver_variable_alloc_list_cleaning(
 def test_driver_variable_alloc_list_prevent_creation(
     translation_driver: translator.JaxprTranslationDriver,
 ) -> None:
-    """Tests part of the `JaxprTranslationDriver::create_jax_var_list()` api.
+    """Tests part of the `JaxprTranslationDriver.create_jax_var_list()` api.
 
     It will test the `prevent_creation` flag.
     """
@@ -413,7 +413,7 @@ def test_driver_variable_alloc_list_prevent_creation(
 def test_driver_variable_alloc_list_only_creation(
     translation_driver: translator.JaxprTranslationDriver,
 ) -> None:
-    """Tests part of the `JaxprTranslationDriver::create_jax_var_list()` api.
+    """Tests part of the `JaxprTranslationDriver.create_jax_var_list()` api.
 
     It will test the `only_creation` flag.
     """
@@ -439,7 +439,7 @@ def test_driver_variable_alloc_list_only_creation(
 def test_driver_variable_alloc_list_handle_literal(
     translation_driver: translator.JaxprTranslationDriver,
 ) -> None:
-    """Tests part of the `JaxprTranslationDriver::create_jax_var_list()` api.
+    """Tests part of the `JaxprTranslationDriver.create_jax_var_list()` api.
 
     It will test the `handle_literals` flag.
     """
@@ -473,7 +473,7 @@ def test_driver_variable_alloc_list_handle_literal(
 def test_driver_constants(
     translation_driver: translator.JaxprTranslationDriver,
 ) -> None:
-    """Tests part of the `JaxprTranslationDriver::_create_constants()` api.
+    """Tests part of the `JaxprTranslationDriver._create_constants()` api.
 
     See also the `test_subtranslators_alu.py::test_add3` test.
     """

From 3d867cc070cd21cf6e9d171b726756516a70f36d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 23 May 2024 09:20:42 +0200
Subject: [PATCH 216/458] Forget to change the compiler argument stuff.

---
 src/jace/jax/stages.py          | 65 +++++++++++----------------------
 src/jace/optimization.py        | 43 ++++++++++++++++++++--
 src/jace/translator/__init__.py |  2 +
 src/jace/translator/managing.py | 21 ++++++++++-
 4 files changed, 84 insertions(+), 47 deletions(-)

diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
index 038b66d..5ad907e 100644
--- a/src/jace/jax/stages.py
+++ b/src/jace/jax/stages.py
@@ -24,23 +24,19 @@
 from __future__ import annotations
 
 import copy
-from collections.abc import Callable, Hashable, Mapping, Sequence
-from typing import Any, Final, TypeAlias
+from collections.abc import Callable, Mapping, Sequence
+from typing import Any
 
 import dace
 import jax as _jax
 
 from jace import optimization, translator, util
 from jace.jax import translation_cache as tcache
+from jace.optimization import CompilerOptions
 from jace.translator import post_translation as ptrans
 from jace.util import dace_helper as jdace
 
 
-# TODO(phimuell): Turn this into `TypedDict` thing.
-#: Map type to pass compiler options to `JaceLowered.compile()`.
-CompilerOptions: TypeAlias = dict[str, bool | str]
-
-
 class JaceWrapped(tcache.CachingStage):
     """A function ready to be specialized, lowered, and compiled.
 
@@ -159,11 +155,6 @@ class JaceLowered(tcache.CachingStage):
         - Handle pytrees.
     """
 
-    DEF_COMPILER_OPTIONS: Final[CompilerOptions] = {
-        "auto_optimize": True,
-        "simplify": True,
-    }
-
     # `self` assumes complete ownership of the
     _trans_sdfg: translator.TranslatedJaxprSDFG
 
@@ -188,33 +179,27 @@ def compile(
     ) -> JaceCompiled:
         """Compile the SDFG.
 
-        Returns an Object that encapsulates a compiled SDFG object.
-        You can pass a `dict` as argument which are passed to the `jace_optimize()` routine.
-        If you pass `None` then the default options are used.
-        To disable all optimization, pass an empty `dict`.
+        Returns an object that encapsulates a compiled SDFG object.
+        To influence the various optimizations and compile options of Jace you can use the `compiler_options` argument.
+        This is a `dict` which are used as arguments to `jace_optimize()`.
+
+        If nothing is specified `jace.optimization.DEFAULT_OPTIMIZATIONS` will be used.
+        Before `compiler_options` is forwarded to `jace_optimize()` it is merged with the default options.
 
-        Notes:
-            I am pretty sure that `None` in Jax means "use the default option".
-            See also `CachedCallDescription.make_call_description()`.
+        Note:
+            The result of this function is cached.
         """
         # We **must** deepcopy before we do any optimization.
-        #  There are many reasons for this but here are the most important ones:
-        #  All optimization DaCe functions works in place, if we would not copy the SDFG first, then we would have a problem.
-        #  Because, these optimization would then have a feedback of the SDFG object which is stored inside `self`.
-        #  Thus, if we would run this code `(jaceLoweredObject := jaceWrappedObject.lower()).compile({opti=True})` would return
-        #  an optimized object, which is what we intent to do.
-        #  However, if we would now call `jaceWrappedObject.lower()` (with the same arguments as before), we should get `jaceLoweredObject`,
-        #  since it was cached, but it would actually contain an already optimized SDFG, which is not what we want.
-        #  If you think you can remove this line then do it and run `tests/test_decorator.py::test_decorator_sharing`.
+        #  The reason is `self` is cached and assumed to be immutable.
+        #  Since all optimizations works in place, we would violate this assumption.
         tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._trans_sdfg)
-        optimization.jace_optimize(
-            tsdfg=tsdfg,
-            **(self.DEF_COMPILER_OPTIONS if compiler_options is None else compiler_options),  # type: ignore[arg-type]  # type confusion.
-        )
-        csdfg: jdace.CompiledSDFG = util.compile_jax_sdfg(tsdfg)
+
+        # Must be the same as in `_make_call_description()`!
+        options = optimization.DEFAULT_OPTIMIZATIONS | (compiler_options or {})
+        optimization.jace_optimize(tsdfg=tsdfg, **options)
 
         return JaceCompiled(
-            csdfg=csdfg,
+            csdfg=util.compile_jax_sdfg(tsdfg),
             inp_names=tsdfg.inp_names,
             out_names=tsdfg.out_names,
         )
@@ -253,15 +238,9 @@ def _make_call_description(
         The function will construct a concrete description of the call using `(name, value)` pairs.
         This function is used by the cache.
         """
-        if compiler_options is None:  # Must be the same as in `compile()`!
-            compiler_options = self.DEF_COMPILER_OPTIONS
-        assert isinstance(compiler_options, dict)
-        fargs: tuple[tuple[str, Hashable], ...] = tuple(
-            sorted(
-                ((argname, argvalue) for argname, argvalue in compiler_options.items()),
-                key=lambda X: X[0],
-            )
-        )
+        # Must be the same as in `compile()`!
+        options = optimization.DEFAULT_OPTIMIZATIONS | (compiler_options or {})
+        fargs = tuple(sorted(options.items(), key=lambda X: X[0]))
         return tcache.CachedCallDescription(stage_id=id(self), fargs=fargs)
 
 
@@ -309,7 +288,7 @@ def __call__(
 
 __all__ = [
     "Stage",
-    "CompilerOptions",
+    "CompilerOptions",  # export for compatibility with Jax.
     "JaceWrapped",
     "JaceLowered",
     "JaceCompiled",
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index c875009..bc2bf10 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -12,13 +12,41 @@
 
 from __future__ import annotations
 
-from jace import translator
+from typing import TYPE_CHECKING, Final, TypedDict
+
+from typing_extensions import Unpack
+
+
+if TYPE_CHECKING:
+    from jace import translator
+
+
+class CompilerOptions(TypedDict, total=False):
+    """All known compiler options known to `JaceLowered.compile()`.
+
+    There are some predefined option sets in `jace.jax.stages`:
+    - `DEFAULT_COMPILER_OPTIONS`
+    - `NO_OPTIMIZATIONS`
+    """
+
+    auto_optimize: bool
+    simplify: bool
+
+
+DEFAULT_OPTIMIZATIONS: Final[CompilerOptions] = {
+    "auto_optimize": True,
+    "simplify": True,
+}
+
+NO_OPTIMIZATIONS: Final[CompilerOptions] = {
+    "auto_optimize": False,
+    "simplify": False,
+}
 
 
 def jace_optimize(
     tsdfg: translator.TranslatedJaxprSDFG,
-    simplify: bool = True,
-    auto_optimize: bool = False,
+    **kwargs: Unpack[CompilerOptions],
 ) -> None:
     """Performs optimization of the `fsdfg` _inplace_.
 
@@ -28,9 +56,18 @@ def jace_optimize(
     Args:
         simplify:       Run the simplification pilepline.
         auto_optimize:  Run the auto optimization pipeline (currently does nothing)
+
+    Note:
+        By default all optimizations are disabled and this function acts as a noops.
     """
     if not tsdfg.is_finalized:
         raise ValueError("Can only optimize finalized SDFGs.")
+    if not kwargs:
+        return
+
+    # Unpack the arguments, defaults are such that no optimization is done.
+    simplify = kwargs.get("simplify", False)
+    auto_optimize = kwargs.get("auto_optimize", False)
 
     if simplify:
         tsdfg.sdfg.simplify()
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 341c713..49342be 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -12,6 +12,7 @@
 from .jaxpr_translator_driver import JaxprTranslationDriver
 from .managing import (
     get_regsitered_primitive_translators,
+    make_primitive_translator,
     register_primitive_translator,
     set_active_primitive_translators_to,
 )
@@ -27,4 +28,5 @@
     "register_primitive_translator",
     "get_regsitered_primitive_translators",
     "set_active_primitive_translators_to",
+    "make_primitive_translator",
 ]
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index b235bb9..08ec3f7 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -55,6 +55,8 @@ def make_primitive_translator(
     def wrapper(
         prim_translator: translator.PrimitiveTranslatorCallable,
     ) -> translator.PrimitiveTranslator:
+        from jace import translator  # Cyclic
+
         if getattr(prim_translator, "primitive", primitive) != primitive:
             raise ValueError(
                 f"Tried to change the 'primitive' property of '{prim_translator}' from '{prim_translator.primitive}' to '{primitive}'."  # type: ignore[attr-defined]
@@ -65,10 +67,27 @@ def wrapper(
     return wrapper if prim_translator is None else wrapper(prim_translator)
 
 
+@overload
+def register_primitive_translator(
+    prim_translator: Literal[None] = None,
+    overwrite: bool = False,
+) -> Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]: ...
+
+
+@overload
 def register_primitive_translator(
     prim_translator: translator.PrimitiveTranslator,
     overwrite: bool = False,
-) -> translator.PrimitiveTranslator:
+) -> translator.PrimitiveTranslator: ...
+
+
+def register_primitive_translator(
+    prim_translator: translator.PrimitiveTranslator | None = None,
+    overwrite: bool = False,
+) -> (
+    translator.PrimitiveTranslator
+    | Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]
+):
     """Adds the primitive translator to Jace's internal list of translators and return it again.
 
     If the primitive is already known an error is generated, if `overwrite` is set, it will be replaced.

From 8a9be47d173aa0d2b26f12e05d614af3d15a577a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 23 May 2024 11:03:09 +0200
Subject: [PATCH 217/458] Updated the tests.

---
 tests/test_caching.py              |  30 +++++++--
 tests/test_subtranslator_helper.py | 103 +++++++++++++++++++----------
 2 files changed, 91 insertions(+), 42 deletions(-)

diff --git a/tests/test_caching.py b/tests/test_caching.py
index ea31153..e53b365 100644
--- a/tests/test_caching.py
+++ b/tests/test_caching.py
@@ -17,6 +17,7 @@
 import pytest
 
 import jace
+from jace import optimization
 from jace.jax import stages
 
 
@@ -138,13 +139,20 @@ def wrapped(A, B):
     # These are the known lowerings.
     lowerings: dict[tuple[int, int], stages.JaceLowered] = {}
     lowering_ids: set[int] = set()
+    # These are the known compilations.
+    compilations: dict[tuple[int, int], stages.JaceCompiled] = {}
+    compiled_ids: set[int] = set()
 
     # Generating the lowerings
     for arg1, arg2 in it.permutations([A, B, C, D], 2):
         lower = wrapped.lower(arg1, arg2)
+        compiled = lower.compile()
         assert id(lower) not in lowering_ids
+        assert id(compiled) not in compiled_ids
         lowerings[id(arg1), id(arg2)] = lower
         lowering_ids.add(id(lower))
+        compilations[id(arg1), id(arg2)] = compiled
+        compiled_ids.add(id(compiled))
 
     # Now check if they are still cached.
     for arg1, arg2 in it.permutations([A, B, C, D], 2):
@@ -152,6 +160,12 @@ def wrapped(A, B):
         clower = lowerings[id(arg1), id(arg2)]
         assert clower is lower
 
+        compiled1 = lower.compile()
+        compiled2 = clower.compile()
+        ccompiled = compilations[id(arg1), id(arg2)]
+        assert compiled1 is compiled2
+        assert compiled1 is ccompiled
+
 
 def test_caching_compilation():
     """Tests the compilation cache, this is just very simple, since it uses the same code paths as lowering."""
@@ -170,17 +184,21 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     # Now we lower it.
     jaceLowered = jaceWrapped.lower(A, B)
 
-    # Now we compile it with enabled optimization.
-    optiCompiled = jaceLowered.compile(stages.JaceLowered.DEF_COMPILER_OPTIONS)
+    # Compiling it without any information.
+    optiCompiled = jaceLowered.compile()
+
+    # This should be the same as passing the defaults directly.
+    assert optiCompiled is jaceLowered.compile(optimization.DEFAULT_OPTIMIZATIONS)
 
-    # Passing `None` also means 'default' which is a bit strange, but it is what Jax does.
-    assert optiCompiled is jaceLowered.compile(None)
+    # Also if we pass the empty dict, we should get the default.
+    assert optiCompiled is jaceLowered.compile({})
 
-    # Now we compile it without any optimization.
-    unoptiCompiled = jaceLowered.compile({})
+    # Now we disable all optimizations
+    unoptiCompiled = jaceLowered.compile(optimization.NO_OPTIMIZATIONS)
 
     # Because of the way how things work the optimized must have more than the unoptimized.
     #  If there is sharing, then this would not be the case.
+    assert unoptiCompiled is not optiCompiled
     assert optiCompiled._csdfg.sdfg.number_of_nodes() == 1
     assert optiCompiled._csdfg.sdfg.number_of_nodes() < unoptiCompiled._csdfg.sdfg.number_of_nodes()
 
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 8046e88..612df15 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -19,16 +19,18 @@
 from jace import translator
 from jace.translator import (
     get_regsitered_primitive_translators,
+    make_primitive_translator,
     register_primitive_translator,
+    set_active_primitive_translators_to,
 )
 
 
 @pytest.fixture(autouse=True)
 def _conserve_builtin_translators():
     """Restores the set of registered subtranslators after a test."""
-    initial_translators = translator.get_regsitered_primitive_translators()
+    initial_translators = get_regsitered_primitive_translators()
     yield
-    translator.set_active_primitive_translators_to(initial_translators)
+    set_active_primitive_translators_to(initial_translators)
 
 
 @pytest.fixture()
@@ -58,11 +60,14 @@ def __call__(self) -> None:  # type: ignore[override]  # Arguments
         raise NotImplementedError
 
 
-# fmt: off
+@make_primitive_translator("non_existing_callable_primitive3")
 def SubTrans3_Callable(*args: Any, **kwargs: Any) -> None:
     raise NotImplementedError
-SubTrans3_Callable.primitive = "non_existing_primitive3" # type: ignore[attr-defined]
-# fmt: on
+
+
+@make_primitive_translator("add")
+def fake_add_translator(*args: Any, **kwargs: Any) -> None:
+    raise NotImplementedError
 
 
 def test_are_subtranslators_imported():
@@ -94,49 +99,71 @@ def test_subtranslatior_managing(no_builtin_translators):
     assert len(active_subtrans) == 3
 
 
-def test_subtranslatior_managing_callable(no_builtin_translators):
-    """If we add a callable, and have no `.primitive` property defined."""
+def test_subtranslatior_managing_isolation():
+    """Tests if `get_regsitered_primitive_translators()` protects the internal registry."""
+    assert (
+        get_regsitered_primitive_translators()
+        is not translator.managing._PRIMITIVE_TRANSLATORS_DICT
+    )
 
-    def noname_translator_callable(*args: Any, **kwargs: Any) -> None:
-        raise NotImplementedError
+    initial_primitives = get_regsitered_primitive_translators()
+    assert get_regsitered_primitive_translators() is not initial_primitives
+    assert "add" in initial_primitives, "For this test the 'add' primitive must be registered."
+    org_add_prim = initial_primitives["add"]
 
-    # This will not work because `noname_translator_callable()` does not have a `.primitive` attribute.
-    with pytest.raises(
-        expected_exception=ValueError,
-        match=re.escape(f"Missing primitive name for '{noname_translator_callable}'"),
-    ):
-        register_primitive_translator(noname_translator_callable)
-    assert len(get_regsitered_primitive_translators()) == 0
+    initial_primitives["add"] = fake_add_translator
+    assert org_add_prim is not fake_add_translator
+    assert get_regsitered_primitive_translators()["add"] is org_add_prim
 
-    # This works because there is a primitive specified, it will also update the object.
-    prim_name = "noname_translator_callable_prim"
-    assert register_primitive_translator(noname_translator_callable, primitive=prim_name)
-    assert noname_translator_callable.primitive == prim_name
 
+def test_subtranslatior_managing_swap():
+    """Tests the `set_active_primitive_translators_to()` functionality."""
 
-def test_subtranslatior_managing_failing_wrong_name(no_builtin_translators):
-    """Tests if how it works with wrong name."""
-    sub1 = SubTrans1()
-    sub2 = SubTrans2()
+    # Allows to compare the structure of dicts.
+    def same_structure(d1: dict, d2: dict) -> bool:
+        return d1.keys() == d2.keys() and all(id(d2[k]) == id(d1[k]) for k in d1)
 
-    with pytest.raises(
-        expected_exception=TypeError,
-        match=re.escape(
-            f"Translator's primitive '{sub1.primitive}' doesn't match the supplied '{sub2.primitive}'."
-        ),
-    ):
-        register_primitive_translator(sub1, primitive=sub2.primitive)
+    initial_primitives = get_regsitered_primitive_translators()
+    assert "add" in initial_primitives
+
+    # Now mutate the dict a little bit, shallow copy it first.
+    mutated_primitives = initial_primitives.copy()
+    mutated_primitives["add"] = fake_add_translator
+    assert mutated_primitives.keys() == initial_primitives.keys()
+    assert same_structure(initial_primitives, get_regsitered_primitive_translators())
+    assert not same_structure(mutated_primitives, initial_primitives)
+    assert not same_structure(mutated_primitives, get_regsitered_primitive_translators())
+
+    # Now change the initial one with the mutated one.
+    #  The object is copied but should still have the same structure.
+    old_active = set_active_primitive_translators_to(mutated_primitives)
+    assert mutated_primitives is not translator.managing._PRIMITIVE_TRANSLATORS_DICT
+    assert same_structure(old_active, initial_primitives)
+    assert same_structure(mutated_primitives, get_regsitered_primitive_translators())
+
+
+def test_subtranslatior_managing_callable_annotation(no_builtin_translators):
+    """Test if `make_primitive_translator()` works."""
+
+    prim_name = "non_existing_property"
+
+    @make_primitive_translator(prim_name)
+    def non_existing_translator(*args: Any, **kwargs: Any) -> None:
+        raise NotImplementedError
+
+    assert hasattr(non_existing_translator, "primitive")
+    assert non_existing_translator.primitive == prim_name
+    assert len(get_regsitered_primitive_translators()) == 0
 
 
 def test_subtranslatior_managing_overwriting():
     """Tests if we are able to overwrite something."""
     current_add_translator = get_regsitered_primitive_translators()["add"]
 
+    @make_primitive_translator("add")
     def useless_add_translator(*args: Any, **kwargs: Any) -> None:
         raise NotImplementedError
 
-    useless_add_translator.primitive = "add"
-
     # This will not work because it is not overwritten.
     with pytest.raises(
         expected_exception=ValueError,
@@ -151,6 +178,7 @@ def useless_add_translator(*args: Any, **kwargs: Any) -> None:
     assert useless_add_translator is register_primitive_translator(
         useless_add_translator, overwrite=True
     )
+    assert useless_add_translator is get_regsitered_primitive_translators()["add"]
 
 
 def test_subtranslatior_managing_overwriting_2(no_builtin_translators):
@@ -158,8 +186,9 @@ def test_subtranslatior_managing_overwriting_2(no_builtin_translators):
 
     trans_cnt = [0]
 
-    @register_primitive_translator(primitive="add")
-    def still_but_less_useless_add_translator(*args: Any, **kwargs: Any) -> None:
+    @register_primitive_translator(overwrite=True)
+    @make_primitive_translator("add")
+    def still_useless_but_a_bit_less(*args: Any, **kwargs: Any) -> None:
         trans_cnt[0] += 1
         return
 
@@ -180,6 +209,7 @@ def test_subtranslatior_managing_decoupling():
     I.e. changes to the global state, does not affect already annotated functions.
     """
 
+    # This will use the translators that are currently installed.
     @jace.jit
     def foo(A):
         B = A + 1
@@ -187,7 +217,8 @@ def foo(A):
         D = C + 1
         return D + 1
 
-    @register_primitive_translator(primitive="add", overwrite=True)
+    @register_primitive_translator(overwrite=True)
+    @make_primitive_translator("add")
     def useless_add_translator(*args: Any, **kwargs: Any) -> None:
         raise NotImplementedError("The 'useless_add_translator' was called as expected.")
 

From 9dec076bef637b9b337b9b84a042a07654db6764 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 22 May 2024 09:28:31 +0200
Subject: [PATCH 218/458] Small fixes.

---
 src/jace/jax/translation_cache.py | 2 +-
 src/jace/util/jax_helper.py       | 2 +-
 src/jace/util/traits.py           | 2 +-
 3 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/jace/jax/translation_cache.py b/src/jace/jax/translation_cache.py
index be4b0a2..5bcb948 100644
--- a/src/jace/jax/translation_cache.py
+++ b/src/jace/jax/translation_cache.py
@@ -140,7 +140,7 @@ def from_value(
 
         if util.is_array(val):
             if util.is_jax_array(val):
-                val = val.__array__(copy=False)
+                val = val.__array__()  # Passing `copy=False` leads to error in NumPy.
             shape = val.shape
             dtype = util.translate_dtype(val.dtype)
             strides = getattr(val, "strides", None)
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index af2dce8..eb59fd1 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -167,7 +167,7 @@ def translate_dtype(dtype: Any) -> dace.typeclass:
     if hasattr(dace.dtypes, dtype_name):
         return getattr(dace.dtypes, dtype_name)
     if hasattr(np, dtype_name):
-        dtype = getattr(np, dtype)
+        dtype = getattr(np, dtype_name)
         return dace.dtype_to_typeclass(dtype)
     raise ValueError(f"Unable to translate '{dtype}' ino a DaCe dtype.")
 
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 6336f6d..44ba097 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -142,5 +142,5 @@ def is_fully_addressable(
             Jax array is on this host.
     """
     if is_jax_array(obj):
-        return obj.is_fully_addressable()
+        return obj.is_fully_addressable
     return True

From 5d27e22f807689b5e26df7c7336f362281b24758 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 22 May 2024 09:33:17 +0200
Subject: [PATCH 219/458] Added a new note regarding the `x64` Situation.

---
 src/jace/translator/jaxpr_translator_driver.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 77da631..508322c 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -114,6 +114,11 @@ def translate_jaxpr(
         if len(jaxpr.effects) != 0:
             raise NotImplementedError("'Jaxpr' with side effects are not supported.")
         if not _jax.config.read("jax_enable_x64"):
+            # NOTE: What is interesting here is, that the SDFG can be called, but the result is garbage.
+            #  Beside that I think it should not work, I think it should not even call,
+            #  because of a mismatch in data types.
+            #  However, If we work with Jax arrays themselves, it should technically work.
+            #  But currently the best we can do, is forbid it!
             raise NotImplementedError(
                 "You have disabled 'x64' support in Jax, which interferes with the calling of the SDFG. "
                 "SDFG generated in this way will fail to call."

From ba29b4ed822e24dc3a72e86195f835f1af181fb6 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 22 May 2024 09:45:16 +0200
Subject: [PATCH 220/458] Updated the tests, there is now also a test for
 checking the Datatype.

---
 tests/test_caching.py | 24 ++++++++++++++++++++++++
 1 file changed, 24 insertions(+)

diff --git a/tests/test_caching.py b/tests/test_caching.py
index e53b365..851ebdc 100644
--- a/tests/test_caching.py
+++ b/tests/test_caching.py
@@ -203,6 +203,30 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     assert optiCompiled._csdfg.sdfg.number_of_nodes() < unoptiCompiled._csdfg.sdfg.number_of_nodes()
 
 
+def test_caching_dtype():
+    """Tests if the data type is properly included in the test."""
+
+    lowering_cnt = [0]
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        lowering_cnt[0] += 1
+        return A + A
+
+    dtypes = [np.float64, np.float32, np.int32, np.int64]
+    shape = (10, 10)
+
+    for i, dtype in enumerate(dtypes):
+        A = np.array((np.random.random(shape) - 0.5) * 10, dtype=dtype)  # noqa: NPY002
+
+        assert lowering_cnt[0] == i
+        _ = testee(A)
+        assert lowering_cnt[0] == i + 1
+
+        assert np.allclose(testee(A), 2 * A)
+        assert lowering_cnt[0] == i + 1
+
+
 def test_caching_strides() -> None:
     """Test if the cache detects a change in strides."""
 

From 7d5c64f1bfae30345436e340224a2c08ca430fd4 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 22 May 2024 09:56:44 +0200
Subject: [PATCH 221/458] Added a test for a possible bug in DaCe.

---
 tests/test_decorator.py |  2 +-
 tests/test_misc.py      | 40 ++++++++++++++++++++++++++++++++++++++++
 2 files changed, 41 insertions(+), 1 deletion(-)
 create mode 100644 tests/test_misc.py

diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index cf1ffaf..7877b07 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -8,7 +8,7 @@
 """Implements tests for the jit decorator.
 
 Also see the `test_jax_api.py` test file, that tests composability.
-."""
+"""
 
 from __future__ import annotations
 
diff --git a/tests/test_misc.py b/tests/test_misc.py
new file mode 100644
index 0000000..ec2a5b2
--- /dev/null
+++ b/tests/test_misc.py
@@ -0,0 +1,40 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements general tests for Jace."""
+
+from __future__ import annotations
+
+import numpy as np
+import pytest
+
+import jace
+
+
+@pytest.mark.skip("Possible bug in DaCe.")
+def test_mismatch_in_datatyte_calling():
+    """Tests compilation and calling with different types.
+
+    Note that this more or less tests the calling implementation of the `CompiledSDFG` class in DaCe.
+    As I understand the `CompiledSDFG::_construct_args()` function this should be detected.
+    However, as evidently it does not do this.
+    """
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        return -A
+
+    # Different types.
+    A1 = np.arange(12, dtype=np.float32).reshape((4, 3))
+    A2 = np.arange(12, dtype=np.int64).reshape((4, 3))
+
+    # Lower and compilation for first type
+    callee = testee.lower(A1).compile()
+
+    # But calling with the second type
+    with pytest.raises(Exception):  # noqa: B017, PT011 # Unknown exception.
+        _ = callee(A2)

From 22c144114aae11b7ad7174b55d530f8d779c7146 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 22 May 2024 10:40:40 +0200
Subject: [PATCH 222/458] Updated the `translate_dtype()` function.

I think this make it less magical, okay it is stil very guru level, but it looks a bit more reasonable.
---
 src/jace/util/jax_helper.py | 32 +++++---------------------------
 1 file changed, 5 insertions(+), 27 deletions(-)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index eb59fd1..0832237 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -22,8 +22,6 @@
 
 import dace
 import jax.core as jax_core
-import jax.dtypes as jax_dtypes
-import numpy as np
 
 import jace.util as util
 
@@ -141,35 +139,15 @@ def is_tracing_ongoing(
 
 def translate_dtype(dtype: Any) -> dace.typeclass:
     """Turns a Jax datatype into a DaCe datatype."""
+    if dtype is None:
+        raise NotImplementedError  # Handling a special case in DaCe.
     if isinstance(dtype, dace.typeclass):
         return dtype
-    if dtype is None:
-        # Special behaviour of `dtype_to_typeclass()`
-        raise NotImplementedError()
-
-    # For reasons unknown to me we have to do the dtype conversion this way.
-    #  It is not possible to simply call `dace.typeclass(dtype)` or pass it to
-    #  `dace.dtype_to_typeclass()`, it will generate an error.
-    #  We keep the `dtype_to_typeclass()` function call, in order to handle
-    #  NumPy types as DaCe intended them to be handled.
-    try:
-        return dace.dtype_to_typeclass(dtype)
-    except KeyError:
-        pass
-
     try:
-        dtype_ = jax_dtypes.canonicalize_dtype(dtype)
-        return dace.dtype_to_typeclass(dtype_)
-    except Exception:
+        return dace.typeclass(dtype)
+    except (NameError, KeyError):
         pass
-
-    dtype_name = str(dtype)
-    if hasattr(dace.dtypes, dtype_name):
-        return getattr(dace.dtypes, dtype_name)
-    if hasattr(np, dtype_name):
-        dtype = getattr(np, dtype_name)
-        return dace.dtype_to_typeclass(dtype)
-    raise ValueError(f"Unable to translate '{dtype}' ino a DaCe dtype.")
+    return dace.dtype_to_typeclass(getattr(dtype, "type", dtype))
 
 
 def propose_jax_name(

From e457af14b6f0a6642ebad7ce7e95022a4736f0ce Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 23 May 2024 12:49:14 +0200
Subject: [PATCH 223/458] Fixed a problem in the convert_element_type
 translator.

---
 .../convert_element_type_translator.py             | 14 +++++++++++---
 .../mapped_operation_base_translator.py            |  9 ++++-----
 2 files changed, 15 insertions(+), 8 deletions(-)

diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index 531cc48..e105abc 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -16,6 +16,7 @@
 from jax import core as jax_core
 from typing_extensions import override
 
+from jace import translator
 from jace.translator.primitive_translators.mapped_operation_base_translator import (
     MappedOperationBaseTranslator,
 )
@@ -58,7 +59,9 @@ def write_tasklet_code(
 
         in_var_name: str = in_var_names[0]
         in_dtype = eqn.invars[0].aval.dtype
+        in_dtype_s: str = str(in_dtype)
         out_dtype = eqn.outvars[0].aval.dtype
+        out_dtype_s: str = str(out_dtype)
 
         if in_var_name is None:
             raise NotImplementedError("'convert_element_type' is not supported for literals.")
@@ -75,13 +78,15 @@ def write_tasklet_code(
         #  Thus we have to do it in this way.
         conv_code = "__in0"
 
-        if str(in_dtype).startswith("bool") and str(out_dtype).startswith("int"):
+        if in_dtype_s.startswith("bool") and out_dtype_s.startswith("int"):
             # Interestingly `__out0 = int(__in0)` will fail, Dace will optimize it away.
             conv_code = f"(1 if {conv_code} else 0)"
 
         # Now do the actual casting.
-        if hasattr(dace.dtypes, str(out_dtype)):
-            conv_code = f"dace.{out_dtype!s}(__in)"
+        if out_dtype_s == "bool":
+            conv_code = f"dace.bool_({conv_code})"
+        elif hasattr(dace.dtypes, str(out_dtype)):
+            conv_code = f"dace.{out_dtype!s}({conv_code})"
         else:
             raise NotImplementedError(
                 f"Cannot convert '{in_dtype}' to '{out_dtype}' as this type is not known to DaCe."
@@ -89,3 +94,6 @@ def write_tasklet_code(
 
         # Now writing the full Tasklet, i.e. with the output.
         return f"__out0 = {conv_code}"
+
+
+_ = translator.register_primitive_translator(ConvertElementTypeTranslator())
diff --git a/src/jace/translator/primitive_translators/mapped_operation_base_translator.py b/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
index 5f217f1..6b9f416 100644
--- a/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
+++ b/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
@@ -81,6 +81,7 @@ def __call__(
             eqn:            The Jax equation that is translated.
             eqn_state:      State into which the primitive's SDFG representation is constructed.
         """
+        assert len(out_var_names) == 1
         if eqn.outvars[0].aval.shape != ():
             tskl_ranges: list[tuple[str, str]] = [
                 (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
@@ -156,11 +157,9 @@ def make_input_memlets(
         return {
             f"__in{i}": dace.Memlet.simple(
                 in_var_name,
-                (
-                    ", ".join(name for name, _ in tskl_ranges)
-                    if eqn.outvars[0].aval.shape != ()
-                    else "0"
-                ),
+                ", ".join(name for name, _ in tskl_ranges)
+                if eqn.outvars[0].aval.shape != ()
+                else "0",
             )
             for i, in_var_name in enumerate(in_var_names)
             if in_var_name is not None

From 614ed582340d6511c6170bdbc933a1f374c04ad2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 23 May 2024 12:52:16 +0200
Subject: [PATCH 224/458] The `TranslatedJaxprSDFG.validate()` now also tests
 if there are free symbols.

This is a temporary solution, without it, we would get some strange errors in code generation.
---
 src/jace/translator/translated_jaxpr_sdfg.py | 10 ++++++++++
 1 file changed, 10 insertions(+)

diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 1d08fce..faef510 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -99,5 +99,15 @@ def validate(self) -> bool:
             )
         if not self.is_finalized:
             return True  # More we can not do for an unfinalized SDFG.
+
+        if len(self.sdfg.free_symbols) != 0:
+            # For the moment we require this.
+            #  Without it, we would get some strange error in codegen.
+            raise dace.sdfg.InvalidSDFGError(
+                f"Expected that there are no free symbols in the SDFG, but found: {self.sdfg.free_symbols}.",
+                self.sdfg,
+                self.sdfg.node_id(self.sdfg.start_state),
+            )
+
         self.sdfg.validate()
         return True

From 655db1ba67f4a49410c7442fe4fabddc6c3e7493 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 23 May 2024 13:37:17 +0200
Subject: [PATCH 225/458] Added the tests for the element conversion.

Some are relly heavy, thus there are shorter ones.
---
 tests/test_caching.py              |  1 -
 tests/test_convert_element_type.py | 67 ++++++++++++++++++++++++++++--
 2 files changed, 63 insertions(+), 5 deletions(-)

diff --git a/tests/test_caching.py b/tests/test_caching.py
index 851ebdc..2d34eda 100644
--- a/tests/test_caching.py
+++ b/tests/test_caching.py
@@ -113,7 +113,6 @@ def wrapped(A, B):
     assert compiled1 is not compiled2
 
 
-@pytest.mark.skip(reason="Missing primitive translators")
 def test_caching_different_structure():
     """Now tests if we can handle multiple arguments with different structures.
 
diff --git a/tests/test_convert_element_type.py b/tests/test_convert_element_type.py
index 8d8a9ca..8ed0bbd 100644
--- a/tests/test_convert_element_type.py
+++ b/tests/test_convert_element_type.py
@@ -9,10 +9,69 @@
 
 from __future__ import annotations
 
+from collections.abc import Sequence
+from typing import Final
 
-def test_convert_element_type_non_bool():
-    """Tests all conversions with the exception of bool as conversion target."""
+import numpy as np
+import pytest
+from jax import numpy as jnp
 
+import jace
 
-def test_convert_element_type_bool():
-    """Tests all conversions with the exception of bool as conversion target."""
+
+# fmt: off
+_DACE_TYPES: Final[list[type]] = [
+        np.int_, np.int8, np.int16, np.int32, np.int64,
+        np.uint, np.uint8, np.uint16, np.uint32, np.uint64,
+        np.float64, np.float32, np.float64,
+]
+_DACE_COMPLEX: Final[list[type]] = [
+        np.complex128, np.complex64, np.complex128,
+]
+# fmt: on
+
+
+def _test_convert_element_type_impl(
+    input_types: Sequence,
+    output_types: Sequence,
+) -> bool:
+    """Implementation of the tests of the convert element types primitive."""
+    lowering_cnt = [0, 0]
+    for input_type in input_types:
+        for output_type in output_types:
+            A = np.array(np.random.random((10, 10)), dtype=input_type)  # noqa: NPY002
+            ref = np.array(A, copy=True, dtype=output_type)
+            lowering_cnt[1] += 1
+
+            @jace.jit
+            def converter(A: np.ndarray) -> np.ndarray:
+                lowering_cnt[0] += 1
+                return jnp.array(A, copy=False, dtype=output_type)  # noqa: B023  # Loop variable.
+
+            res = converter(A)
+            assert res.dtype == output_type
+            assert lowering_cnt[0] == lowering_cnt[1]
+            assert np.allclose(ref, res)
+    return True
+
+
+@pytest.mark.skip(reason="Too slow, find way to run only on demand.")
+def test_convert_element_type_main():
+    """Tests all conversions with the exception of conversions from bool and complex."""
+    _test_convert_element_type_impl(_DACE_TYPES, [*_DACE_TYPES, np.bool_])
+
+
+def test_convert_element_type_main_short():
+    """Fast running version of `test_convert_element_type_main()`."""
+    FAST_TYPES = [np.int32, np.int64, np.float64]
+    _test_convert_element_type_impl(FAST_TYPES, [*FAST_TYPES, np.bool_])
+
+
+def test_convert_element_type_complex():
+    """All complex conversions."""
+    _test_convert_element_type_impl(_DACE_COMPLEX, _DACE_COMPLEX)
+
+
+def test_convert_element_type_from_bool():
+    """Tests conversions from bools to any other types."""
+    _test_convert_element_type_impl([np.bool_], _DACE_COMPLEX)

From 69a88bcb7de35b6296e9a9331144cae850132513 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 23 May 2024 14:38:06 +0200
Subject: [PATCH 226/458] Updated the Mapped Translator.

The thing is now able to broadcast by default, which is a bit of a gamble.
---
 .../primitive_translators/__init__.py         |   5 +-
 .../primitive_translators/alu_translators.py  | 137 ++----------------
 .../convert_element_type_translator.py        |   4 +-
 .../mapped_operation_base_translator.py       |  47 +++---
 tests/test_sub_translators_alu.py             |  44 +++++-
 5 files changed, 86 insertions(+), 151 deletions(-)

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 043661c..9372adc 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -8,12 +8,11 @@
 
 from __future__ import annotations
 
-from .alu_translators import BinaryALUTranslator, UnaryALUTranslator
+from .alu_translators import ALUTranslator
 from .convert_element_type_translator import ConvertElementTypeTranslator
 
 
 __all__ = [
-    "BinaryALUTranslator",
-    "UnaryALUTranslator",
+    "ALUTranslator",
     "ConvertElementTypeTranslator",
 ]
diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index fd3b442..22d6376 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -12,27 +12,21 @@
 from collections.abc import Sequence
 from typing import Final, cast
 
-import dace
 import numpy as np
 from jax import core as jax_core
 from typing_extensions import override
 
 from jace import translator
 from jace.translator.primitive_translators.mapped_operation_base_translator import (
-    MappedOperationBaseTranslator,
+    MappedOperationTranslatorBase,
 )
 
 
-class ALUBaseTranslator(MappedOperationBaseTranslator):
-    """Base for all ALU (arithmetic logical operations) translators.
+class ALUTranslator(MappedOperationTranslatorBase):
+    """Translator for all arithmetic and logical operations.
 
-    This class implements the `MappedOperationBaseTranslator::write_tasklet_code()` function.
-    The tasklet is written based on a template string.
-    In addition to that the function will also do literal substitution.
-
-    There are two subclasses:
-    - `UnaryALUTranslator` for all unary operations.
-    - `BinaryALUTranslator` for all binary operations.
+    The class uses `MappedOperationBaseTranslator` for generating the maps.
+    Its `write_tasklet_code()` function will perform replace all literals.
     """
 
     __slots__ = "_tskl_tmpl"
@@ -82,115 +76,10 @@ def write_tasklet_code(
         return tskl_code
 
 
-class UnaryALUTranslator(ALUBaseTranslator):
-    """Class for all unary operations.
-
-    Todo:
-        - Specialize for `integer_pow` to do code unrolling in certain situations.
-    """
-
-    @override
-    def write_tasklet_code(
-        self,
-        in_var_names: Sequence[str | None],
-        eqn: jax_core.JaxprEqn,
-    ) -> str:
-        if len(in_var_names) != 1:
-            raise RuntimeWarning(
-                f"'UnaryALUTranslator' can only handle unary operations.\nEqn: {eqn}"
-            )
-        return super().write_tasklet_code(
-            in_var_names=in_var_names,
-            eqn=eqn,
-        )
-
-
-class BinaryALUTranslator(ALUBaseTranslator):
-    """Class for all binary ALU operations.
-
-    While `MappedOperationBaseTranslator` requires that the inputs must have the same shape,
-    this class lift this restriction and allows to broadcast the operants.
-    However, broadcasting is only possible if both inputs have the same rank.
-
-    Notes:
-        The input `__in0` is identified with the left hand side of an operator and `__in1` is identified as the right hand side.
-    """
-
-    def make_input_memlets(
-        self,
-        tskl_ranges: Sequence[tuple[str, str]],
-        in_var_names: Sequence[str | None],
-        eqn: jax_core.JaxprEqn,
-    ) -> dict[str, dace.Memlet]:
-        if len(in_var_names) != 2:
-            raise RuntimeWarning(
-                f"'BinaryALUTranslator' can only handle binary operations.\nEqn: {eqn}"
-            )
-
-        out_shps = tuple(eqn.outvars[0].aval.shape)  # Shape of the output
-        inp_shpl = tuple(eqn.invars[0].aval.shape)  # Shape of the left/first input
-        inp_shpr = tuple(eqn.invars[1].aval.shape)  # Shape of the right/second input
-
-        # Which dimensions on which input should be broadcast, i.e. replicated.
-        #  A dimension that is replicated is always accessed with the index `0` in the Memlet.
-        #  If `dims_to_bcast*` is `None` then the corresponding argument is a scalar.
-        dims_to_bcastl: list[int] | None = []
-        dims_to_bcastr: list[int] | None = []
-
-        if out_shps == ():
-            # Output is scalar (thus also the inputs).
-            dims_to_bcastl = None
-            dims_to_bcastr = None
-
-        elif inp_shpl == inp_shpr:
-            # The two have the same shapes and neither is a scalar.
-            pass
-
-        elif inp_shpl == ():
-            # The LHS is a scalar (RHS is not)
-            dims_to_bcastl = None
-
-        elif inp_shpr == ():
-            # The RHS is a scalar (LHS is not)
-            dims_to_bcastr = None
-
-        else:
-            # This is the general broadcasting case
-            #  We assume that both inputs and the output have the same rank, Jax seems to ensure this.
-            assert len(out_shps) == len(inp_shpl) == len(inp_shpr)
-            for dim, shp_lft, shp_rgt in zip(range(len(out_shps)), inp_shpl, inp_shpr):
-                if shp_lft == shp_rgt:
-                    pass  # Needed for cases such as `(10, 1, 3) + (10, 1, 1)`.
-                elif shp_lft == 1:
-                    dims_to_bcastl.append(dim)  # type: ignore[union-attr]  # guaranteed to be not `None`
-                else:
-                    dims_to_bcastr.append(dim)  # type: ignore[union-attr]
-
-        # Now we will generate the input Memlets.
-        tskl_inputs: dict[str, dace.Memlet] = {}
-        for i, in_var_name, dims_to_bcast in zip(
-            range(2), in_var_names, [dims_to_bcastl, dims_to_bcastr]
-        ):
-            if in_var_name is None:  # Input is a literal: No Memlet needed
-                continue
-
-            if dims_to_bcast is None:
-                imemelt = dace.Memlet.simple(in_var_name, "0")  # Scalar
-            else:
-                imemelt = dace.Memlet.simple(
-                    in_var_name,
-                    ", ".join(
-                        ("0" if i in dims_to_bcast else it_var)
-                        for i, (it_var, _) in enumerate(tskl_ranges)
-                    ),
-                )
-            tskl_inputs[f"__in{i}"] = imemelt
-
-        return tskl_inputs
-
-
 # Contains all the templates for ALU operations.
-_ALU_UN_OPS_TMPL: Final[dict[str, str]] = {
+# fmt: off
+_ALU_OPS_TMPL: Final[dict[str, str]] = {
+    # Unary operations
     "pos": "__out0 = +(__in0)",
     "neg": "__out0 = -(__in0)",
     "not": "__out0 = not (__in0)",
@@ -210,8 +99,8 @@ def make_input_memlets(
     "tan": "__out0 = tan(__in0)",
     "atan": "__out0 = atan(__in0)",
     "tanh": "__out0 = tanh(__in0)",
-}
-_ALU_BI_OPS_TMPL: Final[dict[str, str]] = {
+
+    # Binary operations
     "add": "__out0 = (__in0)+(__in1)",
     "add_any": "__out0 = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
     "sub": "__out0 = (__in0)-(__in1)",
@@ -233,7 +122,5 @@ def make_input_memlets(
 }
 
 # Create the ALU translators
-for pname, ptmpl in _ALU_UN_OPS_TMPL.items():
-    translator.register_primitive_translator(UnaryALUTranslator(pname, ptmpl))
-for pname, ptmpl in _ALU_BI_OPS_TMPL.items():
-    translator.register_primitive_translator(BinaryALUTranslator(pname, ptmpl))
+for pname, ptmpl in _ALU_OPS_TMPL.items():
+    translator.register_primitive_translator(ALUTranslator(pname, ptmpl))
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index e105abc..3673359 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -18,11 +18,11 @@
 
 from jace import translator
 from jace.translator.primitive_translators.mapped_operation_base_translator import (
-    MappedOperationBaseTranslator,
+    MappedOperationTranslatorBase,
 )
 
 
-class ConvertElementTypeTranslator(MappedOperationBaseTranslator):
+class ConvertElementTypeTranslator(MappedOperationTranslatorBase):
     """Implements the `convert_element_type` primitive.
 
     Copies the input to the output and performs type conversion.
diff --git a/src/jace/translator/primitive_translators/mapped_operation_base_translator.py b/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
index 6b9f416..7e28e87 100644
--- a/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
+++ b/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
@@ -19,28 +19,26 @@
 from jace import translator
 
 
-class MappedOperationBaseTranslator(translator.PrimitiveTranslator):
+class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
     """Implements the base for all "mapped base operations".
 
     A mapped base operation `f` is an operation that has several inputs arrays that are elementwise combined to a single output array.
-    A prime example for this would be the addition of two arrays of the _same_ size.
+    A prime example for this would be the addition of two arrays.
     Essentially it assumes that the Tasklet code can be written as:
     ```
         __out0 = f(__in0, __in1, __in3, ...)
     ```
     where `__in*` are the connector names of the Tasklet and `__out0` is the output connector.
-    For problems such as this, the SDFG API provides the `SDFGState::add_mapped_tasklet()` function, however, in most cases it can not be directly used.
+    For problems such as this, the SDFG API provides the `SDFGState.add_mapped_tasklet()` function, however, in most cases it can not be directly used.
     Thus this class acts like a convenience wrapper around it.
 
     To use this class a user has to overwrite the `write_tasklet_code()` function.
     This function generates the Python code that should be put inside the Tasklet.
 
+    If needed the translator will perform broadcasting of the inputs.
+
     Notes:
         This class will always generate a mapped Tasklet, even if a scalar is handled.
-        The class will always map over the entirety of the output and assume that all inputs have the same shape as the output.
-            If you want to override this behaviour you have to override the `make_input_memlets()` method
-            and generate the appropriate Memlets to use as inputs yourself.
-        Only one output is allowed.
     """
 
     __slots__ = ("_prim_name",)
@@ -148,19 +146,32 @@ def make_input_memlets(
             in_var_names:       The list of SDFG variables used as input.
             eqn:                The equation object.
         """
-        if any(eqn.outvars[0].aval.shape != invar.aval.shape for invar in eqn.invars):
-            # If you want to use this class as base, then you must override this function.
+        out_shp = tuple(eqn.outvars[0].aval.shape)  # Shape of the output
+        out_rank = len(out_shp)
+        if any(len(invar.aval.shape) not in {0, out_rank} for invar in eqn.invars):
             raise NotImplementedError(
-                "`MappedOperationBaseTranslator` can only handle inputs and output of the same shape!\nEqn: {eqn}"
+                f"'MappedOperationTranslatorBase' Inputs must have the same rank as the output! Eqn: {eqn} || {tuple(eqn.outvars[0].aval.shape)}"
             )
 
-        return {
-            f"__in{i}": dace.Memlet.simple(
+        # Now we will generate the input Memlets.
+        tskl_inputs: dict[str, dace.Memlet] = {}
+        for i, (in_var_name, inp_shp) in enumerate(
+            zip(in_var_names, (invar.aval.shape for invar in eqn.invars))
+        ):
+            if in_var_name is None:  # Input is a literal: No Memlet needed
+                continue
+
+            if inp_shp == ():  # Scalars
+                tskl_inputs[f"__in{i}"] = dace.Memlet.simple(in_var_name, "0")  # Scalar
+                continue
+
+            # We have to to broadcasting (combine yes and no together)
+            dims_to_bcast: Sequence[int] = [dim for dim in range(out_rank) if inp_shp[dim] == 1]
+            tskl_inputs[f"__in{i}"] = dace.Memlet.simple(
                 in_var_name,
-                ", ".join(name for name, _ in tskl_ranges)
-                if eqn.outvars[0].aval.shape != ()
-                else "0",
+                ", ".join(
+                    ("0" if i in dims_to_bcast else it_var)
+                    for i, (it_var, _) in enumerate(tskl_ranges)
+                ),
             )
-            for i, in_var_name in enumerate(in_var_names)
-            if in_var_name is not None
-        }
+        return tskl_inputs
diff --git a/tests/test_sub_translators_alu.py b/tests/test_sub_translators_alu.py
index 5c3a995..6ea74b7 100644
--- a/tests/test_sub_translators_alu.py
+++ b/tests/test_sub_translators_alu.py
@@ -10,7 +10,7 @@
 from __future__ import annotations
 
 from collections.abc import Callable, Sequence
-from typing import Any
+from typing import Any, cast
 
 import jax
 import numpy as np
@@ -93,6 +93,15 @@ def testee(A: float) -> float:
     _perform_test(testee, 7.0)
 
 
+def test_alu_binary_scalar_literal_2():
+    """Scalar binary operation, with a literal."""
+
+    def testee(A: float) -> float:
+        return 2.03 * A
+
+    _perform_test(testee, 7.0)
+
+
 def test_alu_binary_array():
     """Test binary of arrays, with same size."""
 
@@ -107,12 +116,13 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 def test_alu_binary_array_scalar():
     """Test binary of array with scalar."""
 
-    def testee(A: np.ndarray, B: float) -> np.ndarray:
-        return A + B
+    def testee(A: np.ndarray | float, B: float | np.ndarray) -> np.ndarray:
+        return cast(np.ndarray, A + B)
 
     A = mkarr((100, 22))
     B = np.float64(1.34)
     _perform_test(testee, A, B)
+    _perform_test(testee, B, A)
 
 
 def test_alu_binary_array_literal():
@@ -167,3 +177,31 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     B = mkarr((100, 10))
     _perform_test(testee, A, B)
     _perform_test(testee, B, A)
+
+
+def test_alu_binary_broadcast_3():
+    """Test broadcasting."""
+
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return A + B
+
+    A = mkarr(
+        (
+            5,
+            1,
+            3,
+            4,
+            1,
+        )
+    )
+    B = mkarr(
+        (
+            5,
+            1,
+            3,
+            1,
+            2,
+        )
+    )
+    _perform_test(testee, A, B)
+    _perform_test(testee, B, A)

From 406b3d54d3a978d1571cf4eab957a8ab1e895e80 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 23 May 2024 14:52:28 +0200
Subject: [PATCH 227/458] Made some small fixes. So we now use `__out` instead
 of `__out0`, since we will always have one output.

---
 .../primitive_translators/alu_translators.py  | 74 +++++++++----------
 .../convert_element_type_translator.py        |  8 +-
 .../mapped_operation_base_translator.py       | 15 ++--
 3 files changed, 50 insertions(+), 47 deletions(-)

diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index 22d6376..79b37da 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -80,45 +80,45 @@ def write_tasklet_code(
 # fmt: off
 _ALU_OPS_TMPL: Final[dict[str, str]] = {
     # Unary operations
-    "pos": "__out0 = +(__in0)",
-    "neg": "__out0 = -(__in0)",
-    "not": "__out0 = not (__in0)",
-    "floor": "__out0 = floor(__in0)",
-    "ceil": "__out0 = ceil(__in0)",
-    "round": "__out0 = round(__in0)",
-    "abs": "__out0 = abs(__in0)",
-    "sign": "__out0 = sign(__in0)",
-    "sqrt": "__out0 = sqrt(__in0)",
-    "log": "__out0 = log(__in0)",
-    "exp": "__out0 = exp(__in0)",
-    "integer_pow": "__out0 = (__in0)**({y})",  # 'y' is a parameter of the primitive
-    "sin": "__out0 = sin(__in0)",
-    "asin": "__out0 = asin(__in0)",
-    "cos": "__out0 = cos(__in0)",
-    "acos": "__out0 = acos(__in0)",
-    "tan": "__out0 = tan(__in0)",
-    "atan": "__out0 = atan(__in0)",
-    "tanh": "__out0 = tanh(__in0)",
+    "pos": "__out = +(__in0)",
+    "neg": "__out = -(__in0)",
+    "not": "__out = not (__in0)",
+    "floor": "__out = floor(__in0)",
+    "ceil": "__out = ceil(__in0)",
+    "round": "__out = round(__in0)",
+    "abs": "__out = abs(__in0)",
+    "sign": "__out = sign(__in0)",
+    "sqrt": "__out = sqrt(__in0)",
+    "log": "__out = log(__in0)",
+    "exp": "__out = exp(__in0)",
+    "integer_pow": "__out = (__in0)**({y})",  # 'y' is a parameter of the primitive
+    "sin": "__out = sin(__in0)",
+    "asin": "__out = asin(__in0)",
+    "cos": "__out = cos(__in0)",
+    "acos": "__out = acos(__in0)",
+    "tan": "__out = tan(__in0)",
+    "atan": "__out = atan(__in0)",
+    "tanh": "__out = tanh(__in0)",
 
     # Binary operations
-    "add": "__out0 = (__in0)+(__in1)",
-    "add_any": "__out0 = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
-    "sub": "__out0 = (__in0)-(__in1)",
-    "mul": "__out0 = (__in0)*(__in1)",
-    "div": "__out0 = (__in0)/(__in1)",
-    "rem": "__out0 = (__in0)%(__in1)",
-    "and": "__out0 = (__in0) and (__in1)",
-    "or": "__out0 = (__in0) or  (__in1)",
-    "pow": "__out0 = (__in0)**(__in1)",
-    "ipow": "__out0 = (__in0)**(int(__in1))",
-    "min": "__out0 = min(__in0, __in1)",
-    "max": "__out0 = max(__in0, __in1)",
-    "eq": "__out0 = __in0 == __in1",
-    "ne": "__out0 = __in0 != __in1",
-    "ge": "__out0 = __in0 >= __in1",
-    "gt": "__out0 = __in0 > __in1",
-    "le": "__out0 = __in0 <= __in1",
-    "lt": "__out0 = __in0 < __in1",
+    "add": "__out = (__in0)+(__in1)",
+    "add_any": "__out = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
+    "sub": "__out = (__in0)-(__in1)",
+    "mul": "__out = (__in0)*(__in1)",
+    "div": "__out = (__in0)/(__in1)",
+    "rem": "__out = (__in0)%(__in1)",
+    "and": "__out = (__in0) and (__in1)",
+    "or": "__out = (__in0) or  (__in1)",
+    "pow": "__out = (__in0)**(__in1)",
+    "ipow": "__out = (__in0)**(int(__in1))",
+    "min": "__out = min(__in0, __in1)",
+    "max": "__out = max(__in0, __in1)",
+    "eq": "__out = __in0 == __in1",
+    "ne": "__out = __in0 != __in1",
+    "ge": "__out = __in0 >= __in1",
+    "gt": "__out = __in0 > __in1",
+    "le": "__out = __in0 <= __in1",
+    "lt": "__out = __in0 < __in1",
 }
 
 # Create the ALU translators
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index 3673359..363f576 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -31,7 +31,7 @@ class ConvertElementTypeTranslator(MappedOperationTranslatorBase):
         This translator ignores the `new_dtype` and `weak_type` parameter of the equation and only performs casting
 
     Todo:
-        I occasionally Jax converts from the same type to another type.
+        Occasionally Jax converts from the same type to another type.
             This case should be handled by a Memlet directly, which can then be removed.
     """
 
@@ -74,12 +74,12 @@ def write_tasklet_code(
             )
 
         # This is the base of the template that we use for conversion.
-        #  You should notice that the Tasklet `__out0 = __in0` will fail, see commit `f5aabc3` of the prototype.
+        #  You should notice that the Tasklet `__out = __in0` will fail, see commit `f5aabc3` of the prototype.
         #  Thus we have to do it in this way.
         conv_code = "__in0"
 
         if in_dtype_s.startswith("bool") and out_dtype_s.startswith("int"):
-            # Interestingly `__out0 = int(__in0)` will fail, Dace will optimize it away.
+            # Interestingly `__out = int(__in0)` will fail, Dace will optimize it away.
             conv_code = f"(1 if {conv_code} else 0)"
 
         # Now do the actual casting.
@@ -93,7 +93,7 @@ def write_tasklet_code(
             )
 
         # Now writing the full Tasklet, i.e. with the output.
-        return f"__out0 = {conv_code}"
+        return f"__out = {conv_code}"
 
 
 _ = translator.register_primitive_translator(ConvertElementTypeTranslator())
diff --git a/src/jace/translator/primitive_translators/mapped_operation_base_translator.py b/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
index 7e28e87..8838693 100644
--- a/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
+++ b/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
@@ -26,9 +26,9 @@ class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
     A prime example for this would be the addition of two arrays.
     Essentially it assumes that the Tasklet code can be written as:
     ```
-        __out0 = f(__in0, __in1, __in3, ...)
+        __out = f(__in0, __in1, __in3, ...)
     ```
-    where `__in*` are the connector names of the Tasklet and `__out0` is the output connector.
+    where `__in*` are the connector names of the Tasklet and `__out` is the output connector.
     For problems such as this, the SDFG API provides the `SDFGState.add_mapped_tasklet()` function, however, in most cases it can not be directly used.
     Thus this class acts like a convenience wrapper around it.
 
@@ -39,6 +39,9 @@ class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
 
     Notes:
         This class will always generate a mapped Tasklet, even if a scalar is handled.
+
+    Todo:
+        - `write_tasklet_code()` should no longer need to also include the `__out = ` part the base should do that.
     """
 
     __slots__ = ("_prim_name",)
@@ -85,7 +88,7 @@ def __call__(
                 (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
             ]
             tskl_output: dict[str, dace.Memlet] = {
-                "__out0": dace.Memlet.simple(
+                "__out": dace.Memlet.simple(
                     out_var_names[0],
                     ", ".join(name for name, _ in tskl_ranges),
                 )
@@ -94,7 +97,7 @@ def __call__(
         else:
             # If we have a scalar we will generate a Map, but it will be trivial.
             tskl_ranges = [("__jace_iterator_SCALAR", "0:1")]
-            tskl_output = {"__out0": dace.Memlet.simple(out_var_names[0], "0")}
+            tskl_output = {"__out": dace.Memlet.simple(out_var_names[0], "0")}
 
         tskl_inputs: dict[str, dace.Memlet] = self.make_input_memlets(
             tskl_ranges, in_var_names, eqn
@@ -143,8 +146,8 @@ def make_input_memlets(
         Args:
             tskl_ranges:    List of the different map parameter, first element is the name of the dimension,
                                     second is the range, i.e. `0:SIZE`.
-            in_var_names:       The list of SDFG variables used as input.
-            eqn:                The equation object.
+            in_var_names:   The list of SDFG variables used as input.
+            eqn:            The equation object.
         """
         out_shp = tuple(eqn.outvars[0].aval.shape)  # Shape of the output
         out_rank = len(out_shp)

From 8ad51473a3617a835f4a443ffeb5c3b5fbcb7a61 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 23 May 2024 15:02:27 +0200
Subject: [PATCH 228/458] Added a new helper function to unify how literal
 values are extracted.

---
 .../primitive_translators/alu_translators.py      | 15 ++++-----------
 src/jace/util/__init__.py                         |  2 ++
 src/jace/util/jax_helper.py                       | 15 +++++++++++++++
 3 files changed, 21 insertions(+), 11 deletions(-)

diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index 79b37da..c9ca10f 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -10,13 +10,12 @@
 from __future__ import annotations
 
 from collections.abc import Sequence
-from typing import Final, cast
+from typing import Final
 
-import numpy as np
 from jax import core as jax_core
 from typing_extensions import override
 
-from jace import translator
+from jace import translator, util
 from jace.translator.primitive_translators.mapped_operation_base_translator import (
     MappedOperationTranslatorBase,
 )
@@ -61,15 +60,9 @@ def write_tasklet_code(
         for i, in_var_name in enumerate(in_var_names):
             if in_var_name is not None:
                 continue
+            t_val = util.get_jax_literal_value(eqn.invars[i])
+            tskl_code = tskl_code.replace(f"__in{i}", str(t_val))
 
-            jax_in_var: jax_core.Literal = cast(jax_core.Literal, eqn.invars[i])
-            if jax_in_var.aval.shape == ():
-                t_val = jax_in_var.val
-                if isinstance(t_val, np.ndarray):
-                    t_val = jax_in_var.val.max()  # I do not know a better way in that case
-                tskl_code = tskl_code.replace(f"__in{i}", str(t_val))
-            else:
-                raise ValueError(f"Can not handle non scalar literals: {jax_in_var}")
         if len(eqn.params) != 0:
             tskl_code = tskl_code.format(**eqn.params)
 
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 6bff211..2cc61ee 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -15,6 +15,7 @@
 )
 from .jax_helper import (
     JaCeVar,
+    get_jax_literal_value,
     get_jax_var_dtype,
     get_jax_var_name,
     get_jax_var_shape,
@@ -60,6 +61,7 @@
     "get_jax_var_dtype",
     "get_jax_var_name",
     "get_jax_var_shape",
+    "get_jax_literal_value",
     "translate_dtype",
     "run_jax_sdfg",
     "propose_jax_name",
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 0832237..bb5523a 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -22,6 +22,7 @@
 
 import dace
 import jax.core as jax_core
+import numpy as np
 
 import jace.util as util
 
@@ -192,3 +193,17 @@ def propose_jax_name(
     if jax_name in util.FORBIDDEN_SDFG_VAR_NAMES:
         jax_name = f"__jace_forbidden_{jax_name}"
     return jax_name
+
+
+def get_jax_literal_value(lit: jax_core.Literal) -> bool | float | int | np.generic:
+    """Returns the value a literal is wrapping.
+
+    The function guarantees to return a scalar value.
+    """
+    val = lit.val
+    if isinstance(val, np.ndarray):
+        assert val.shape == ()
+        return val.max()
+    if isinstance(val, (bool, float, int)):
+        return val
+    raise TypeError(f"Failed to extract value from '{lit}'.")

From aef8f37ca844c207f748cce59e3a5781c23a9368 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 23 May 2024 15:45:29 +0200
Subject: [PATCH 229/458] Started with teh braodcasting translator.

However, tehre are no tests yet.
---
 .../primitive_translators/__init__.py         |  2 +
 .../broadcast_in_dim_translator.py            | 58 +++++++++++++++++++
 2 files changed, 60 insertions(+)
 create mode 100644 src/jace/translator/primitive_translators/broadcast_in_dim_translator.py

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 9372adc..3d9fc07 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -9,10 +9,12 @@
 from __future__ import annotations
 
 from .alu_translators import ALUTranslator
+from .broadcast_in_dim_translator import BroadcastInDimTranslator
 from .convert_element_type_translator import ConvertElementTypeTranslator
 
 
 __all__ = [
     "ALUTranslator",
     "ConvertElementTypeTranslator",
+    "BroadcastInDimTranslator",
 ]
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
new file mode 100644
index 0000000..3ed92a3
--- /dev/null
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -0,0 +1,58 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""This implements the `broadcast_in_dim` primitive."""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+
+import dace
+from jax import core as jax_core
+from typing_extensions import override
+
+from jace import translator, util
+from jace.translator.primitive_translators.mapped_operation_base_translator import (
+    MappedOperationTranslatorBase,
+)
+
+
+class BroadcastInDimTranslator(MappedOperationTranslatorBase):
+    """This handles the `broadcast_in_dim` primitives."""
+
+    __slots__ = ()
+
+    def __init__(self) -> None:
+        super().__init__(primitive_name="broadcast_in_dim")
+
+    @override
+    def write_tasklet_code(
+        self,
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        if in_var_names[0] is None:
+            return f"__out = {util.get_jax_literal_value(eqn.eqn.invars[0])}"
+        return "__out = __in0"
+
+    def make_input_memlets(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        if in_var_names[0] is None:
+            return {}
+        return {
+            "__in0": dace.Memlet.simple(
+                in_var_names[0],
+                ", ".join(tskl_ranges[bdim][0] for bdim in eqn.params["broadcast_dimensions"]),
+            )
+        }
+
+
+translator.register_primitive_translator(BroadcastInDimTranslator())

From 05e4a885441c0cd589c13d90bfb728d8709cf3e3 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 07:17:10 +0200
Subject: [PATCH 230/458] A subclass of the mapped translator no longer needs
 to include the return value assignment.

---
 .../primitive_translators/alu_translators.py  | 74 +++++++++----------
 .../broadcast_in_dim_translator.py            |  4 +-
 .../convert_element_type_translator.py        | 13 +---
 .../mapped_operation_base_translator.py       |  8 +-
 4 files changed, 43 insertions(+), 56 deletions(-)

diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index c9ca10f..5a10006 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -73,45 +73,45 @@ def write_tasklet_code(
 # fmt: off
 _ALU_OPS_TMPL: Final[dict[str, str]] = {
     # Unary operations
-    "pos": "__out = +(__in0)",
-    "neg": "__out = -(__in0)",
-    "not": "__out = not (__in0)",
-    "floor": "__out = floor(__in0)",
-    "ceil": "__out = ceil(__in0)",
-    "round": "__out = round(__in0)",
-    "abs": "__out = abs(__in0)",
-    "sign": "__out = sign(__in0)",
-    "sqrt": "__out = sqrt(__in0)",
-    "log": "__out = log(__in0)",
-    "exp": "__out = exp(__in0)",
-    "integer_pow": "__out = (__in0)**({y})",  # 'y' is a parameter of the primitive
-    "sin": "__out = sin(__in0)",
-    "asin": "__out = asin(__in0)",
-    "cos": "__out = cos(__in0)",
-    "acos": "__out = acos(__in0)",
-    "tan": "__out = tan(__in0)",
-    "atan": "__out = atan(__in0)",
-    "tanh": "__out = tanh(__in0)",
+    "pos": "+(__in0)",
+    "neg": "-(__in0)",
+    "not": "not (__in0)",
+    "floor": "floor(__in0)",
+    "ceil": "ceil(__in0)",
+    "round": "round(__in0)",
+    "abs": "abs(__in0)",
+    "sign": "sign(__in0)",
+    "sqrt": "sqrt(__in0)",
+    "log": "log(__in0)",
+    "exp": "exp(__in0)",
+    "integer_pow": "(__in0)**({y})",  # 'y' is a parameter of the primitive
+    "sin": "sin(__in0)",
+    "asin": "asin(__in0)",
+    "cos": "cos(__in0)",
+    "acos": "acos(__in0)",
+    "tan": "tan(__in0)",
+    "atan": "atan(__in0)",
+    "tanh": "tanh(__in0)",
 
     # Binary operations
-    "add": "__out = (__in0)+(__in1)",
-    "add_any": "__out = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
-    "sub": "__out = (__in0)-(__in1)",
-    "mul": "__out = (__in0)*(__in1)",
-    "div": "__out = (__in0)/(__in1)",
-    "rem": "__out = (__in0)%(__in1)",
-    "and": "__out = (__in0) and (__in1)",
-    "or": "__out = (__in0) or  (__in1)",
-    "pow": "__out = (__in0)**(__in1)",
-    "ipow": "__out = (__in0)**(int(__in1))",
-    "min": "__out = min(__in0, __in1)",
-    "max": "__out = max(__in0, __in1)",
-    "eq": "__out = __in0 == __in1",
-    "ne": "__out = __in0 != __in1",
-    "ge": "__out = __in0 >= __in1",
-    "gt": "__out = __in0 > __in1",
-    "le": "__out = __in0 <= __in1",
-    "lt": "__out = __in0 < __in1",
+    "add": "(__in0)+(__in1)",
+    "add_any": "(__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
+    "sub": "(__in0)-(__in1)",
+    "mul": "(__in0)*(__in1)",
+    "div": "(__in0)/(__in1)",
+    "rem": "(__in0)%(__in1)",
+    "and": "(__in0) and (__in1)",
+    "or": "(__in0) or  (__in1)",
+    "pow": "(__in0)**(__in1)",
+    "ipow": "(__in0)**(int(__in1))",
+    "min": "min(__in0, __in1)",
+    "max": "max(__in0, __in1)",
+    "eq": "__in0 == __in1",
+    "ne": "__in0 != __in1",
+    "ge": "__in0 >= __in1",
+    "gt": "__in0 > __in1",
+    "le": "__in0 <= __in1",
+    "lt": "__in0 < __in1",
 }
 
 # Create the ALU translators
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
index 3ed92a3..c13168d 100644
--- a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -36,8 +36,8 @@ def write_tasklet_code(
         eqn: jax_core.JaxprEqn,
     ) -> str:
         if in_var_names[0] is None:
-            return f"__out = {util.get_jax_literal_value(eqn.eqn.invars[0])}"
-        return "__out = __in0"
+            return f"{util.get_jax_literal_value(eqn.eqn.invars[0])}"
+        return "__in0"
 
     def make_input_memlets(
         self,
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index 363f576..80acde8 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -46,15 +46,6 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        """Return the code that should be put inside the Tasklet.
-
-        Note that returned code is not processed any further.
-        Thus the function has to apply literal removal on its own.
-
-        Args:
-            in_var_names:   The list of SDFG variables used as input.
-            eqn:            The equation.
-        """
         assert in_var_names[0] is not None
 
         in_var_name: str = in_var_names[0]
@@ -91,9 +82,7 @@ def write_tasklet_code(
             raise NotImplementedError(
                 f"Cannot convert '{in_dtype}' to '{out_dtype}' as this type is not known to DaCe."
             )
-
-        # Now writing the full Tasklet, i.e. with the output.
-        return f"__out = {conv_code}"
+        return conv_code
 
 
 _ = translator.register_primitive_translator(ConvertElementTypeTranslator())
diff --git a/src/jace/translator/primitive_translators/mapped_operation_base_translator.py b/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
index 8838693..27610f8 100644
--- a/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
+++ b/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
@@ -39,9 +39,6 @@ class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
 
     Notes:
         This class will always generate a mapped Tasklet, even if a scalar is handled.
-
-    Todo:
-        - `write_tasklet_code()` should no longer need to also include the `__out = ` part the base should do that.
     """
 
     __slots__ = ("_prim_name",)
@@ -109,7 +106,7 @@ def __call__(
             name=tskl_name,
             map_ranges=tskl_ranges,
             inputs=tskl_inputs,
-            code=tskl_code,
+            code=f"__out = {tskl_code}",
             outputs=tskl_output,
             external_edges=True,
         )
@@ -122,10 +119,11 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        """Return the code that should be put inside the Tasklet.
+        """Return the code that should be put at the left hand side of the assignment statement inside the Tasklet.
 
         Note that returned code is not processed any further.
         Thus the function has to apply literal removal on its own.
+        It is important that the function does not need to return the part of the Tasklet code that is the assignment.
 
         Args:
             in_var_names:   The list of SDFG variables used as input.

From 3fefe29b79f258a0bf90b628df08094452d79f15 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 07:18:00 +0200
Subject: [PATCH 231/458] I added more tests, so I have to increase the number.

---
 tests/test_subtranslator_helper.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 612df15..1f197c2 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -73,7 +73,7 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_regsitered_primitive_translators()) == 37
+    assert len(get_regsitered_primitive_translators()) == 39
 
 
 def test_subtranslatior_managing(no_builtin_translators):

From bd92a475995e9b57f067a320a17324e5d12898f8 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 07:34:25 +0200
Subject: [PATCH 232/458] Moved the literal substitution to the mapped base.

---
 .../primitive_translators/alu_translators.py  | 13 ++----
 .../broadcast_in_dim_translator.py            |  4 +-
 .../mapped_operation_base_translator.py       | 42 ++++++++++++++-----
 3 files changed, 37 insertions(+), 22 deletions(-)

diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index 5a10006..6b93f16 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -15,7 +15,7 @@
 from jax import core as jax_core
 from typing_extensions import override
 
-from jace import translator, util
+from jace import translator
 from jace.translator.primitive_translators.mapped_operation_base_translator import (
     MappedOperationTranslatorBase,
 )
@@ -50,22 +50,17 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        """Return the code that should be put inside the Tasklet, with all parameters and literals substituted with their values.
+        """Returns the code for the Tasklet.
+
+        The function does parameter substitution, see `integer_pow`, while literal substitution is left to the base.
 
         Args:
             in_var_names:   The list of SDFG variables used as input.
             eqn:            The equation.
         """
         tskl_code = self._tskl_tmpl
-        for i, in_var_name in enumerate(in_var_names):
-            if in_var_name is not None:
-                continue
-            t_val = util.get_jax_literal_value(eqn.invars[i])
-            tskl_code = tskl_code.replace(f"__in{i}", str(t_val))
-
         if len(eqn.params) != 0:
             tskl_code = tskl_code.format(**eqn.params)
-
         return tskl_code
 
 
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
index c13168d..0a69ee1 100644
--- a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -15,7 +15,7 @@
 from jax import core as jax_core
 from typing_extensions import override
 
-from jace import translator, util
+from jace import translator
 from jace.translator.primitive_translators.mapped_operation_base_translator import (
     MappedOperationTranslatorBase,
 )
@@ -35,8 +35,6 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        if in_var_names[0] is None:
-            return f"{util.get_jax_literal_value(eqn.eqn.invars[0])}"
         return "__in0"
 
     def make_input_memlets(
diff --git a/src/jace/translator/primitive_translators/mapped_operation_base_translator.py b/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
index 27610f8..f76bcbc 100644
--- a/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
+++ b/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
@@ -16,7 +16,7 @@
 from jax import core as jax_core
 from typing_extensions import final, override
 
-from jace import translator
+from jace import translator, util
 
 
 class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
@@ -33,9 +33,8 @@ class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
     Thus this class acts like a convenience wrapper around it.
 
     To use this class a user has to overwrite the `write_tasklet_code()` function.
-    This function generates the Python code that should be put inside the Tasklet.
-
-    If needed the translator will perform broadcasting of the inputs.
+    This function generates the right hand side of the assignment code, i.e. everything after `__out =`.
+    If needed the translator will perform literal substitution on the returned code and broadcast the inputs to match the outputs.
 
     Notes:
         This class will always generate a mapped Tasklet, even if a scalar is handled.
@@ -69,7 +68,8 @@ def __call__(
 
         The function will create the map ranges and based on the shape of the output array.
         It will then call `make_input_memlets()` to get the input Memlets.
-        After that it calls `write_tasklet_code()` to get the Tasklet code.
+        After that it calls `write_tasklet_code()` to get the Tasklet code
+        and perform literal substitution by forwarding it to `self.literal_substitution()`.
         After that it will create the mapped Tasklet.
 
         Args:
@@ -99,8 +99,9 @@ def __call__(
         tskl_inputs: dict[str, dace.Memlet] = self.make_input_memlets(
             tskl_ranges, in_var_names, eqn
         )
-        tskl_name: str = f"{self.primitive}_{out_var_names[0]}"
-        tskl_code: str = self.write_tasklet_code(in_var_names, eqn)
+        tskl_name = f"{self.primitive}_{out_var_names[0]}"
+        tskl_code = self.write_tasklet_code(in_var_names, eqn)
+        tskl_code = self.literal_substitution(tskl_code, in_var_names, eqn)
 
         eqn_state.add_mapped_tasklet(
             name=tskl_name,
@@ -121,9 +122,7 @@ def write_tasklet_code(
     ) -> str:
         """Return the code that should be put at the left hand side of the assignment statement inside the Tasklet.
 
-        Note that returned code is not processed any further.
-        Thus the function has to apply literal removal on its own.
-        It is important that the function does not need to return the part of the Tasklet code that is the assignment.
+        Literal substitution is allied to the returned code.
 
         Args:
             in_var_names:   The list of SDFG variables used as input.
@@ -176,3 +175,26 @@ def make_input_memlets(
                 ),
             )
         return tskl_inputs
+
+    def literal_substitution(
+        self,
+        tskl_code: str,
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        """Perform literal substitution on the proto Tasklet code `tskl_code`.
+
+        Args:
+            tskl_code:      The proto Tasklet code with literal.
+            in_var_names:   The list of SDFG variables used as input.
+            eqn:            The equation.
+
+        Note:
+            It is allowed but not recommended to override this function.
+        """
+        for i, in_var_name in enumerate(in_var_names):
+            if in_var_name is not None:
+                continue
+            t_val = util.get_jax_literal_value(eqn.invars[i])
+            tskl_code = tskl_code.replace(f"__in{i}", str(t_val))
+        return tskl_code

From 53444fa34729151b685e9e2cd01fcf71d91801a7 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 07:50:01 +0200
Subject: [PATCH 233/458] Updated a test.

---
 ...ement_type.py => test_sub_translators_convert_element_type.py} | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 rename tests/{test_convert_element_type.py => test_sub_translators_convert_element_type.py} (100%)

diff --git a/tests/test_convert_element_type.py b/tests/test_sub_translators_convert_element_type.py
similarity index 100%
rename from tests/test_convert_element_type.py
rename to tests/test_sub_translators_convert_element_type.py

From beda8361cd25f2b3459546f29736de0a5a60bc9d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 08:18:32 +0200
Subject: [PATCH 234/458] Found a test that shows that Jax sometimes casts
 between the same type.

---
 .../convert_element_type_translator.py        | 33 ++++++++++---------
 ...st_sub_translators_convert_element_type.py | 23 +++++++++++++
 2 files changed, 41 insertions(+), 15 deletions(-)

diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index 80acde8..ede0977 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -46,34 +46,37 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        assert in_var_names[0] is not None
 
-        in_var_name: str = in_var_names[0]
+        if in_var_names[0] is None:
+            raise NotImplementedError("'convert_element_type' is not supported for literals.")
+
         in_dtype = eqn.invars[0].aval.dtype
         in_dtype_s: str = str(in_dtype)
         out_dtype = eqn.outvars[0].aval.dtype
         out_dtype_s: str = str(out_dtype)
 
-        if in_var_name is None:
-            raise NotImplementedError("'convert_element_type' is not supported for literals.")
-        if in_dtype == out_dtype:
-            # TODO(phimuell): make this into a pure Memlet such that it can be optimized away by DaCe.
-            # Believe it or not but it happens.
-            warnings.warn(
-                "convert_element_type({eqn}): is useless, because input and output have same type.",
-                stacklevel=1,  # Find a better one
-            )
-
         # This is the base of the template that we use for conversion.
         #  You should notice that the Tasklet `__out = __in0` will fail, see commit `f5aabc3` of the prototype.
         #  Thus we have to do it in this way.
         conv_code = "__in0"
 
+        # Handle special cases
+        if in_dtype == out_dtype:
+            # It sounds ridiculously but it can happen.
+            #  See: tests/test_sub_translators_convert_element_type.py::test_convert_element_type_useless_cast
+            # TODO(phimuell): Make this into a pure Memlet such that it can be optimized away by DaCe.
+            warnings.warn(
+                f"convert_element_type({eqn}): is useless, because input and output have same type.",
+                category=UserWarning,
+                stacklevel=1,  # Find a better one
+            )
+            return conv_code
         if in_dtype_s.startswith("bool") and out_dtype_s.startswith("int"):
-            # Interestingly `__out = int(__in0)` will fail, Dace will optimize it away.
-            conv_code = f"(1 if {conv_code} else 0)"
+            # Interestingly `__out = int(__in0)` will at some DaCe processing stage.
+            #  See commit `f5aabc` of the prototype.
+            return f"(1 if {conv_code} else 0)"
 
-        # Now do the actual casting.
+        # The general case
         if out_dtype_s == "bool":
             conv_code = f"dace.bool_({conv_code})"
         elif hasattr(dace.dtypes, str(out_dtype)):
diff --git a/tests/test_sub_translators_convert_element_type.py b/tests/test_sub_translators_convert_element_type.py
index 8ed0bbd..e2635cf 100644
--- a/tests/test_sub_translators_convert_element_type.py
+++ b/tests/test_sub_translators_convert_element_type.py
@@ -75,3 +75,26 @@ def test_convert_element_type_complex():
 def test_convert_element_type_from_bool():
     """Tests conversions from bools to any other types."""
     _test_convert_element_type_impl([np.bool_], _DACE_COMPLEX)
+
+
+def test_convert_element_type_useless_cast():
+    """Broadcast a literal to a matrix.
+
+    This test is here to show, that in certain situation Jax inserts
+    a `convert_element_type` primitive even if it is not needed.
+    """
+
+    def testee(a: float) -> np.ndarray:
+        # For it to work we have to use `numpy` instead of the Jax substitute.
+        return np.broadcast_to(1.0, (10, 10)) + a
+
+    with pytest.warns(
+        expected_warning=UserWarning,
+        match=r"convert_element_type\(.*\): is useless, because input and output have same type.",
+    ):
+        res = jace.jit(testee)(1.0)
+
+    ref = testee(1.0)
+    assert res.shape == ref.shape
+    assert res.dtype == ref.dtype
+    assert np.all(res == ref)

From 1e130a9ec8c11baf7a21354d41a82f2de4525731 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 09:00:31 +0200
Subject: [PATCH 235/458] Fixed a bug in the broadcast translator.

---
 .../primitive_translators/broadcast_in_dim_translator.py      | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
index 0a69ee1..23c1877 100644
--- a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -48,7 +48,9 @@ def make_input_memlets(
         return {
             "__in0": dace.Memlet.simple(
                 in_var_names[0],
-                ", ".join(tskl_ranges[bdim][0] for bdim in eqn.params["broadcast_dimensions"]),
+                ", ".join(tskl_ranges[bdim][0] for bdim in eqn.params["broadcast_dimensions"])
+                if eqn.params["broadcast_dimensions"]
+                else "0",
             )
         }
 

From 2d51b0ca88f0343cea1c17f94660f8eaa742d773 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 09:02:14 +0200
Subject: [PATCH 236/458] Added a test for the broadcast stuff.

---
 .../test_sub_translators_broadcast_in_dim.py  | 90 +++++++++++++++++++
 1 file changed, 90 insertions(+)
 create mode 100644 tests/test_sub_translators_broadcast_in_dim.py

diff --git a/tests/test_sub_translators_broadcast_in_dim.py b/tests/test_sub_translators_broadcast_in_dim.py
new file mode 100644
index 0000000..5f1a2f3
--- /dev/null
+++ b/tests/test_sub_translators_broadcast_in_dim.py
@@ -0,0 +1,90 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements tests for the broadcast in dim translator.
+
+Todo:
+    - `np.meshgrid`
+    - `np.expand_dims`
+    - `np.ix_`
+    - `np.indices`
+"""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+
+import numpy as np
+from jax import numpy as jnp
+
+import jace
+
+
+def test_bid_scalar():
+    """Broadcast a scalar to a matrix."""
+
+    def testee(A: float) -> np.ndarray:
+        return jnp.broadcast_to(A, (2, 2))
+
+    for a in [1, 1.0, 3.1415]:
+        ref = testee(a)
+        res = jace.jit(testee)(a)
+
+        assert res.shape == ref.shape
+        assert res.dtype == ref.dtype
+        assert np.all(res == ref), f"Expected '{ref.tolist()}' got '{res.tolist()}'."
+
+
+def test_bid_literal():
+    """Broadcast a literal to a matrix."""
+
+    def testee(a: float) -> np.ndarray:
+        return jnp.broadcast_to(1.0, (10, 10)) + a
+
+    for a in [1, 1.0, 3.1415]:
+        ref = testee(a)
+        res = jace.jit(testee)(a)
+        assert res.shape == ref.shape
+        assert res.dtype == ref.dtype
+        assert np.all(res == ref)
+
+
+def _expand_dims_test_impl(
+    shape: Sequence[int],
+    axes: Sequence[int | Sequence[int]],
+) -> None:
+    """Implementation of the test for `expand_dims()`.
+
+    Args:
+        shape:  Shape of the input array.
+        axes:   A series of axis that should be tried.
+    """
+    A = np.random.random(shape)  # noqa: NPY002
+    for axis in axes:
+
+        def testee(A):
+            return jnp.expand_dims(A, axis)  # noqa: B023  # Binding loop variable.
+
+        ref = testee(A)
+        res = jace.jit(testee)(A)
+
+        assert ref.shape == res.shape, f"A.shape = {shape}; Expected: {ref.shape}; Got: {res.shape}"
+        assert np.all(ref == res), f"Value error for shape '{shape}' and axis={axis}"
+
+
+def test_expand_dims():
+    """Test various calls to `np.expand_dims()`."""
+    _expand_dims_test_impl((10,), [0, -1, 1])
+    _expand_dims_test_impl(
+        (2, 3, 4, 5),
+        [
+            0,
+            -1,
+            (1, 2, 3),
+            (3, 2, 1),
+        ],
+    )

From a05baa54a0752d597dabf2357e22fc97f545c2a7 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 09:26:19 +0200
Subject: [PATCH 237/458] Make a note about the persistent memory.

---
 src/jace/jax/stages.py            | 4 ++++
 src/jace/jax/translation_cache.py | 4 ++++
 src/jace/optimization.py          | 5 +++++
 3 files changed, 13 insertions(+)

diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
index afa9a19..8c179df 100644
--- a/src/jace/jax/stages.py
+++ b/src/jace/jax/stages.py
@@ -247,6 +247,10 @@ def _make_call_description(
 class JaceCompiled:
     """Compiled version of the SDFG.
 
+    The SDFG handle, is only initialized the first time the function is called.
+    This has implications for persistent data and concurrency.
+    Thus for the time being it is unsafe to use a compiled object in multiple threads.
+
     Todo:
         - Handle pytrees.
     """
diff --git a/src/jace/jax/translation_cache.py b/src/jace/jax/translation_cache.py
index 5bcb948..7877375 100644
--- a/src/jace/jax/translation_cache.py
+++ b/src/jace/jax/translation_cache.py
@@ -47,6 +47,10 @@ class CachingStage:
 
     Todo:
         - Make a generic to indicate what the result stage is.
+        - Currently the cached stages are stored until they are evicted from the cache.
+            Since the default will be "persistent" memory the transients will remain allocated and occupy memory until then.
+            This should not be and we should handle this situation.
+            It sounds like a job for `WeakKeyDictionary`, that maps the caching state to the result, in addition to the cache.
     """
 
     _cache: TranslationCache
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index bc2bf10..ed2f2e3 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -31,16 +31,19 @@ class CompilerOptions(TypedDict, total=False):
 
     auto_optimize: bool
     simplify: bool
+    persistent: bool
 
 
 DEFAULT_OPTIMIZATIONS: Final[CompilerOptions] = {
     "auto_optimize": True,
     "simplify": True,
+    "persistent": True,
 }
 
 NO_OPTIMIZATIONS: Final[CompilerOptions] = {
     "auto_optimize": False,
     "simplify": False,
+    "persistent": False,
 }
 
 
@@ -56,6 +59,8 @@ def jace_optimize(
     Args:
         simplify:       Run the simplification pilepline.
         auto_optimize:  Run the auto optimization pipeline (currently does nothing)
+        persistent:     Make the memory allocation persistent, i.e. allocate the transients only
+                            once at the beginning and then reuse the memory across the lifetime of the SDFG.
 
     Note:
         By default all optimizations are disabled and this function acts as a noops.

From 8e1916b68433c60ef3ffebc902f4853643e16e0c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 10:41:22 +0200
Subject: [PATCH 238/458] Added a reshape translator.

---
 .../primitive_translators/__init__.py         |  4 +-
 .../reshape_translator.py                     | 59 +++++++++++++
 tests/test_sub_translators_reshape.py         | 83 +++++++++++++++++++
 tests/test_subtranslator_helper.py            |  2 +-
 4 files changed, 146 insertions(+), 2 deletions(-)
 create mode 100644 src/jace/translator/primitive_translators/reshape_translator.py
 create mode 100644 tests/test_sub_translators_reshape.py

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 3d9fc07..4349317 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -11,10 +11,12 @@
 from .alu_translators import ALUTranslator
 from .broadcast_in_dim_translator import BroadcastInDimTranslator
 from .convert_element_type_translator import ConvertElementTypeTranslator
+from .reshape_translator import ReshapeTranslator
 
 
 __all__ = [
     "ALUTranslator",
-    "ConvertElementTypeTranslator",
     "BroadcastInDimTranslator",
+    "ConvertElementTypeTranslator",
+    "ReshapeTranslator",
 ]
diff --git a/src/jace/translator/primitive_translators/reshape_translator.py b/src/jace/translator/primitive_translators/reshape_translator.py
new file mode 100644
index 0000000..47a92bf
--- /dev/null
+++ b/src/jace/translator/primitive_translators/reshape_translator.py
@@ -0,0 +1,59 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+from __future__ import annotations
+
+from collections.abc import MutableSequence, Sequence
+
+import dace
+from jax import core as jax_core
+from typing_extensions import override
+
+from jace import translator
+
+
+class ReshapeTranslator(translator.PrimitiveTranslator):
+    """Reshapes an array.
+
+    Todo:
+        - Handle `dimensions` parameter fully.
+        - Find a way to make it as a Map.
+    """
+
+    __slots__ = ()
+
+    @property
+    def primitive(self) -> str:
+        return "reshape"
+
+    @override
+    def __call__(
+        self,
+        driver: translator.JaxprTranslationDriver,
+        in_var_names: Sequence[str | None],
+        out_var_names: MutableSequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        """Performs the reshaping.
+
+        Currently a copy using a Memlet is performed.
+        """
+        if eqn.params["dimensions"] is not None:
+            raise NotImplementedError("Currently 'dimensions' must be 'None'.")
+        eqn_state.add_nedge(
+            eqn_state.add_read(in_var_names[0]),
+            eqn_state.add_write(out_var_names[0]),
+            dace.Memlet(
+                data=in_var_names[0],
+                subset=", ".join(f"0:{size}" for size in eqn.invars[0].aval.shape),
+                other_subset=", ".join(f"0:{size}" for size in eqn.params["new_sizes"]),
+            ),
+        )
+
+
+translator.register_primitive_translator(ReshapeTranslator())
diff --git a/tests/test_sub_translators_reshape.py b/tests/test_sub_translators_reshape.py
new file mode 100644
index 0000000..40844e5
--- /dev/null
+++ b/tests/test_sub_translators_reshape.py
@@ -0,0 +1,83 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Tests the rehaping functionality."""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+
+import numpy as np
+import pytest
+from jax import numpy as jnp
+
+import jace
+
+
+def _test_impl_reshaping(
+    src_shape: Sequence[int],
+    dst_shape: Sequence[int],
+    order: str = "C",
+) -> None:
+    """Performs a reshaping from `src_shape` to `dst_shape`."""
+    A = np.random.random(src_shape)  # noqa: NPY002
+    A = np.array(A, order=order)  # type: ignore[call-overload]  # MyPy wants a literal as order.
+
+    def testee(A: np.ndarray) -> np.ndarray:
+        return jnp.reshape(A, dst_shape)
+
+    print(f"SHAPE: {A.shape} -> {dst_shape}")
+
+    ref = testee(A)
+    res = jace.jit(testee)(A)
+
+    assert res.shape == dst_shape
+    assert np.all(res == ref)
+
+
+@pytest.fixture(
+    params=["C", pytest.param("F", marks=pytest.mark.skip("Non C order is not supported"))]
+)
+def mem_order(request) -> str:
+    """Gets the memory order that we want
+
+    Currently 'F' is skipped because it is not implemented by the logic.
+    """
+    return request.param
+
+
+def test_reshaping_same_rank(mem_order: str):
+    """Keeping the ranke same."""
+    _test_impl_reshaping((12, 2), (6, 4), mem_order)
+
+
+def test_reshaping_adding_rank(mem_order: str):
+    """Adding ranks to an array."""
+    _test_impl_reshaping((12,), (12, 1), mem_order)
+    _test_impl_reshaping((12,), (1, 12), mem_order)
+    _test_impl_reshaping((12,), (1, 1, 12), mem_order)
+    _test_impl_reshaping(
+        (1,),
+        (
+            1,
+            1,
+        ),
+        mem_order,
+    )
+
+
+def test_reshaping_removing_rank(mem_order: str):
+    """Removing ranks from an array."""
+    _test_impl_reshaping((12, 12), (144,), mem_order)
+    _test_impl_reshaping(
+        (
+            1,
+            1,
+        ),
+        (1,),
+        mem_order,
+    )
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 1f197c2..5d197a4 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -73,7 +73,7 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_regsitered_primitive_translators()) == 39
+    assert len(get_regsitered_primitive_translators()) == 40
 
 
 def test_subtranslatior_managing(no_builtin_translators):

From 7faf8dbd4582b219831607eca627695d95741c7e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 11:46:27 +0200
Subject: [PATCH 239/458] Added the `squeeze` transformer.

---
 .../primitive_translators/__init__.py         |  2 +
 .../broadcast_in_dim_translator.py            |  1 +
 .../squeeze_translator.py                     | 62 ++++++++++++++++
 .../test_sub_translators_broadcast_in_dim.py  | 42 +----------
 ...est_sub_translators_squeeze_expand_dims.py | 73 +++++++++++++++++++
 tests/test_subtranslator_helper.py            |  2 +-
 6 files changed, 141 insertions(+), 41 deletions(-)
 create mode 100644 src/jace/translator/primitive_translators/squeeze_translator.py
 create mode 100644 tests/test_sub_translators_squeeze_expand_dims.py

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 4349317..72b4f5d 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -12,6 +12,7 @@
 from .broadcast_in_dim_translator import BroadcastInDimTranslator
 from .convert_element_type_translator import ConvertElementTypeTranslator
 from .reshape_translator import ReshapeTranslator
+from .squeeze_translator import SqueezeTranslator
 
 
 __all__ = [
@@ -19,4 +20,5 @@
     "BroadcastInDimTranslator",
     "ConvertElementTypeTranslator",
     "ReshapeTranslator",
+    "SqueezeTranslator",
 ]
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
index 23c1877..331ec55 100644
--- a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -37,6 +37,7 @@ def write_tasklet_code(
     ) -> str:
         return "__in0"
 
+    @override
     def make_input_memlets(
         self,
         tskl_ranges: Sequence[tuple[str, str]],
diff --git a/src/jace/translator/primitive_translators/squeeze_translator.py b/src/jace/translator/primitive_translators/squeeze_translator.py
new file mode 100644
index 0000000..914bf54
--- /dev/null
+++ b/src/jace/translator/primitive_translators/squeeze_translator.py
@@ -0,0 +1,62 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+from __future__ import annotations
+
+import itertools
+from collections.abc import Sequence
+
+import dace
+from jax import core as jax_core
+from typing_extensions import override
+
+from jace import translator
+from jace.translator.primitive_translators.mapped_operation_base_translator import (
+    MappedOperationTranslatorBase,
+)
+
+
+class SqueezeTranslator(MappedOperationTranslatorBase):
+    """Allows to remove dimensions with size one.
+
+    Essentially equivalent to `np.squeeze` and the inverse to `np.expand_dims()`.
+    """
+
+    __slots__ = ()
+
+    def __init__(self) -> None:
+        super().__init__(primitive_name="squeeze")
+
+    @override
+    def write_tasklet_code(
+        self,
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        return "__in0"
+
+    @override
+    def make_input_memlets(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        to_rem: Sequence[str] = eqn.params["dimensions"]
+        in_rank: int = len(eqn.invars[0].aval.shape)
+        cnt = itertools.count(0)
+        return {
+            "__in0": dace.Memlet.simple(
+                in_var_names[0],
+                ", ".join(
+                    "0" if dim in to_rem else tskl_ranges[next(cnt)][0] for dim in range(in_rank)
+                ),
+            )
+        }
+
+
+translator.register_primitive_translator(SqueezeTranslator())
diff --git a/tests/test_sub_translators_broadcast_in_dim.py b/tests/test_sub_translators_broadcast_in_dim.py
index 5f1a2f3..5a6df27 100644
--- a/tests/test_sub_translators_broadcast_in_dim.py
+++ b/tests/test_sub_translators_broadcast_in_dim.py
@@ -7,17 +7,16 @@
 
 """Implements tests for the broadcast in dim translator.
 
+Parts of the tests are also implemented inside `test_sub_translators_squeeze_expand_dims.py`.
+
 Todo:
     - `np.meshgrid`
-    - `np.expand_dims`
     - `np.ix_`
     - `np.indices`
 """
 
 from __future__ import annotations
 
-from collections.abc import Sequence
-
 import numpy as np
 from jax import numpy as jnp
 
@@ -51,40 +50,3 @@ def testee(a: float) -> np.ndarray:
         assert res.shape == ref.shape
         assert res.dtype == ref.dtype
         assert np.all(res == ref)
-
-
-def _expand_dims_test_impl(
-    shape: Sequence[int],
-    axes: Sequence[int | Sequence[int]],
-) -> None:
-    """Implementation of the test for `expand_dims()`.
-
-    Args:
-        shape:  Shape of the input array.
-        axes:   A series of axis that should be tried.
-    """
-    A = np.random.random(shape)  # noqa: NPY002
-    for axis in axes:
-
-        def testee(A):
-            return jnp.expand_dims(A, axis)  # noqa: B023  # Binding loop variable.
-
-        ref = testee(A)
-        res = jace.jit(testee)(A)
-
-        assert ref.shape == res.shape, f"A.shape = {shape}; Expected: {ref.shape}; Got: {res.shape}"
-        assert np.all(ref == res), f"Value error for shape '{shape}' and axis={axis}"
-
-
-def test_expand_dims():
-    """Test various calls to `np.expand_dims()`."""
-    _expand_dims_test_impl((10,), [0, -1, 1])
-    _expand_dims_test_impl(
-        (2, 3, 4, 5),
-        [
-            0,
-            -1,
-            (1, 2, 3),
-            (3, 2, 1),
-        ],
-    )
diff --git a/tests/test_sub_translators_squeeze_expand_dims.py b/tests/test_sub_translators_squeeze_expand_dims.py
new file mode 100644
index 0000000..5d7503e
--- /dev/null
+++ b/tests/test_sub_translators_squeeze_expand_dims.py
@@ -0,0 +1,73 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements tests for the squeeze translator.
+
+For several reasons parts of the tests related to broadcasting, especially the ones in which a single dimension is added, are also here.
+This is because of the inverse relationship between `expand_dims` and `squeeze`.
+"""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+
+import numpy as np
+import pytest
+from jax import numpy as jnp
+
+import jace
+
+
+def _roundtrip_implementation(
+    shape: Sequence[int],
+    axis: int | Sequence[int],
+) -> None:
+    """Implementation of the test for `expand_dims()` and `squeeze()`.
+
+    It will first add dimensions and then remove them.
+
+    Args:
+        shape:  Shape of the input array.
+        axes:   A series of axis that should be tried.
+    """
+    A = np.random.random(shape)  # noqa: NPY002
+    A_org = A.copy()
+
+    for ops in [jnp.expand_dims, jnp.squeeze]:
+        ref = ops(A, axis)
+        res = jace.jit(lambda A: ops(A, axis))(A)  # noqa: B023  # No capturing
+
+        assert ref.shape == res.shape, f"A.shape = {shape}; Expected: {ref.shape}; Got: {res.shape}"
+        assert np.all(ref == res), f"Value error for shape '{shape}' and axis={axis}"
+        A = np.array(ref, copy=True)  # It is a Jax array, and we have to reverse this.
+    assert A_org.shape == res.shape
+    assert np.all(A_org == res)
+
+
+@pytest.fixture(params=[0, -1, 1])
+def simple_axis(request) -> int:
+    return request.param
+
+
+@pytest.fixture(
+    params=[
+        0,
+        -1,
+        (1, 2, 3),
+        (3, 2, 1),
+    ]
+)
+def hard_axis(request) -> Sequence[int] | int:
+    return request.param
+
+
+def test_expand_squeeze_rountrip_simple(simple_axis):
+    _roundtrip_implementation((10,), simple_axis)
+
+
+def test_expand_squeeze_rountrip_big(hard_axis):
+    _roundtrip_implementation((2, 3, 4, 5), hard_axis)
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 5d197a4..574f6f6 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -73,7 +73,7 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_regsitered_primitive_translators()) == 40
+    assert len(get_regsitered_primitive_translators()) == 41
 
 
 def test_subtranslatior_managing(no_builtin_translators):

From 1d3b166cb2dc4ac7c79354dae72b2b67f60e0f1d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 12:55:17 +0200
Subject: [PATCH 240/458] Realized that in some situations the tasklet ranges
 also have to be passed to the write code function of the mapped base.

---
 .../primitive_translators/alu_translators.py           | 10 ++--------
 .../broadcast_in_dim_translator.py                     |  1 +
 .../convert_element_type_translator.py                 |  2 +-
 .../mapped_operation_base_translator.py                |  5 ++++-
 .../primitive_translators/squeeze_translator.py        |  1 +
 5 files changed, 9 insertions(+), 10 deletions(-)

diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index 6b93f16..29e50eb 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -47,17 +47,11 @@ def __init__(
     @override
     def write_tasklet_code(
         self,
+        tskl_ranges: Sequence[tuple[str, str]],
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        """Returns the code for the Tasklet.
-
-        The function does parameter substitution, see `integer_pow`, while literal substitution is left to the base.
-
-        Args:
-            in_var_names:   The list of SDFG variables used as input.
-            eqn:            The equation.
-        """
+        """Returns the code for the Tasklet, with all parameters replaced."""
         tskl_code = self._tskl_tmpl
         if len(eqn.params) != 0:
             tskl_code = tskl_code.format(**eqn.params)
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
index 331ec55..f85e43f 100644
--- a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -32,6 +32,7 @@ def __init__(self) -> None:
     @override
     def write_tasklet_code(
         self,
+        tskl_ranges: Sequence[tuple[str, str]],
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index ede0977..f8f6683 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -43,10 +43,10 @@ def __init__(self) -> None:
     @override
     def write_tasklet_code(
         self,
+        tskl_ranges: Sequence[tuple[str, str]],
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-
         if in_var_names[0] is None:
             raise NotImplementedError("'convert_element_type' is not supported for literals.")
 
diff --git a/src/jace/translator/primitive_translators/mapped_operation_base_translator.py b/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
index f76bcbc..100f5d9 100644
--- a/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
+++ b/src/jace/translator/primitive_translators/mapped_operation_base_translator.py
@@ -100,7 +100,7 @@ def __call__(
             tskl_ranges, in_var_names, eqn
         )
         tskl_name = f"{self.primitive}_{out_var_names[0]}"
-        tskl_code = self.write_tasklet_code(in_var_names, eqn)
+        tskl_code = self.write_tasklet_code(tskl_ranges, in_var_names, eqn)
         tskl_code = self.literal_substitution(tskl_code, in_var_names, eqn)
 
         eqn_state.add_mapped_tasklet(
@@ -117,6 +117,7 @@ def __call__(
     @abstractmethod
     def write_tasklet_code(
         self,
+        tskl_ranges: Sequence[tuple[str, str]],
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
@@ -125,6 +126,8 @@ def write_tasklet_code(
         Literal substitution is allied to the returned code.
 
         Args:
+            tskl_ranges:    The iteration indexes used by the map, first element is the iteration index itself,
+                                the second index is the iteration range.
             in_var_names:   The list of SDFG variables used as input.
             eqn:            The equation.
         """
diff --git a/src/jace/translator/primitive_translators/squeeze_translator.py b/src/jace/translator/primitive_translators/squeeze_translator.py
index 914bf54..85f7b3d 100644
--- a/src/jace/translator/primitive_translators/squeeze_translator.py
+++ b/src/jace/translator/primitive_translators/squeeze_translator.py
@@ -34,6 +34,7 @@ def __init__(self) -> None:
     @override
     def write_tasklet_code(
         self,
+        tskl_ranges: Sequence[tuple[str, str]],
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:

From 1402924d6ca5dc99e44c3ddd772339aba32ef405 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 13:18:57 +0200
Subject: [PATCH 241/458] Implemented the iota translator.

---
 .../primitive_translators/__init__.py         |  2 +
 .../primitive_translators/iota_translator.py  | 54 +++++++++++++++++++
 tests/test_sub_translators_iota.py            | 47 ++++++++++++++++
 tests/test_subtranslator_helper.py            |  2 +-
 4 files changed, 104 insertions(+), 1 deletion(-)
 create mode 100644 src/jace/translator/primitive_translators/iota_translator.py
 create mode 100644 tests/test_sub_translators_iota.py

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 72b4f5d..7c8cfb1 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -11,6 +11,7 @@
 from .alu_translators import ALUTranslator
 from .broadcast_in_dim_translator import BroadcastInDimTranslator
 from .convert_element_type_translator import ConvertElementTypeTranslator
+from .iota_translator import IotaTranslator
 from .reshape_translator import ReshapeTranslator
 from .squeeze_translator import SqueezeTranslator
 
@@ -19,6 +20,7 @@
     "ALUTranslator",
     "BroadcastInDimTranslator",
     "ConvertElementTypeTranslator",
+    "IotaTranslator",
     "ReshapeTranslator",
     "SqueezeTranslator",
 ]
diff --git a/src/jace/translator/primitive_translators/iota_translator.py b/src/jace/translator/primitive_translators/iota_translator.py
new file mode 100644
index 0000000..218cce8
--- /dev/null
+++ b/src/jace/translator/primitive_translators/iota_translator.py
@@ -0,0 +1,54 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""This implements the `iota` primitive."""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+
+import dace
+from jax import core as jax_core
+from typing_extensions import override
+
+from jace import translator
+from jace.translator.primitive_translators.mapped_operation_base_translator import (
+    MappedOperationTranslatorBase,
+)
+
+
+class IotaTranslator(MappedOperationTranslatorBase):
+    """This handles the `iota` primitives.
+
+    Essentially a very general `jnp.arange()` function.
+    """
+
+    __slots__ = ()
+
+    def __init__(self) -> None:
+        super().__init__(primitive_name="iota")
+
+    @override
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        return f"{tskl_ranges[eqn.params['dimension']][0]}"
+
+    @override
+    def make_input_memlets(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        return {}
+
+
+translator.register_primitive_translator(IotaTranslator())
diff --git a/tests/test_sub_translators_iota.py b/tests/test_sub_translators_iota.py
new file mode 100644
index 0000000..fb35e57
--- /dev/null
+++ b/tests/test_sub_translators_iota.py
@@ -0,0 +1,47 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+from __future__ import annotations
+
+import jax
+import numpy as np
+import pytest
+from jax import numpy as jnp
+
+import jace
+
+
+def test_iota_arange():
+    """Tests `jnp.arange` functionality."""
+
+    def testee(A: int) -> np.ndarray:
+        return jnp.arange(18, dtype=int) + A
+
+    ref = testee(0)
+
+    with pytest.warns(
+        expected_warning=UserWarning,
+        match=r"convert_element_type\(.*\): is useless, because input and output have same type.",
+    ):
+        res = jace.jit(testee)(0)
+    assert np.all(ref == res)
+
+
+def test_iota_broadcast():
+    """Test more iota using the `jax.lax.broadcasted_iota()` function."""
+    shape = (4, 4, 4, 4)
+
+    for d in range(len(shape)):
+
+        def testee(A: np.int32) -> np.ndarray:
+            return jax.lax.broadcasted_iota("int32", shape, d) + A  # noqa: B023  # Variable capturing.
+
+        ref = testee(np.int32(0))
+        res = jace.jit(testee)(np.int32(0))
+
+        assert res.shape == shape
+        assert np.all(ref == res)
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 574f6f6..f108e08 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -73,7 +73,7 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_regsitered_primitive_translators()) == 41
+    assert len(get_regsitered_primitive_translators()) == 42
 
 
 def test_subtranslatior_managing(no_builtin_translators):

From d964719f828a078b36ed2833f8e3967bc2154bfc Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 13:40:16 +0200
Subject: [PATCH 242/458] Updated the tests for the reshaping. They might be a
 bit overblown.

---
 tests/test_sub_translators_reshape.py | 63 +++++++++++++++------------
 1 file changed, 36 insertions(+), 27 deletions(-)

diff --git a/tests/test_sub_translators_reshape.py b/tests/test_sub_translators_reshape.py
index 40844e5..378cf61 100644
--- a/tests/test_sub_translators_reshape.py
+++ b/tests/test_sub_translators_reshape.py
@@ -50,34 +50,43 @@ def mem_order(request) -> str:
     return request.param
 
 
-def test_reshaping_same_rank(mem_order: str):
-    """Keeping the ranke same."""
-    _test_impl_reshaping((12, 2), (6, 4), mem_order)
+@pytest.fixture(params=[(216, 1, 1), (1, 216, 1), (1, 1, 216), (1, 6, 36), (36, 1, 6)])
+def new_shape(request):
+    """New shapes for the `test_reshaping_same_rank()` test."""
+    return request.param
+
+
+@pytest.fixture(params=[(12, 1), (1, 12), (1, 1, 12), (1, 2, 6)])
+def expanded_shape(request):
+    """New shapes for the `test_reshaping_removing_rank()` test."""
+    return request.param
+
+
+@pytest.fixture(params=[(216,), (6, 36), (36, 6), (216, 1)])
+def reduced_shape(request):
+    """New shapes for the `test_reshaping_adding_rank()` test."""
+    return request.param
 
 
-def test_reshaping_adding_rank(mem_order: str):
+def test_reshaping_same_rank(
+    new_shape: Sequence[int],
+    mem_order: str,
+) -> None:
+    """The rank, numbers of dimensions, stays the same,"""
+    _test_impl_reshaping((6, 6, 6), new_shape, mem_order)
+
+
+def test_reshaping_adding_rank(
+    expanded_shape: Sequence[int],
+    mem_order: str,
+) -> None:
     """Adding ranks to an array."""
-    _test_impl_reshaping((12,), (12, 1), mem_order)
-    _test_impl_reshaping((12,), (1, 12), mem_order)
-    _test_impl_reshaping((12,), (1, 1, 12), mem_order)
-    _test_impl_reshaping(
-        (1,),
-        (
-            1,
-            1,
-        ),
-        mem_order,
-    )
-
-
-def test_reshaping_removing_rank(mem_order: str):
+    _test_impl_reshaping((12,), expanded_shape, mem_order)
+
+
+def test_reshaping_removing_rank(
+    reduced_shape: Sequence[int],
+    mem_order: str,
+) -> None:
     """Removing ranks from an array."""
-    _test_impl_reshaping((12, 12), (144,), mem_order)
-    _test_impl_reshaping(
-        (
-            1,
-            1,
-        ),
-        (1,),
-        mem_order,
-    )
+    _test_impl_reshaping((6, 6, 6), reduced_shape, mem_order)

From 6ab2ad743fd16c9714e66a7c463444f2c66bb955 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 14:28:26 +0200
Subject: [PATCH 243/458] Fixed a typo.

---
 .../primitive_translators/convert_element_type_translator.py    | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index f8f6683..bc7304b 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements the Translator for the `convert_element_type` primitive."""
+"""Implements the translator for the `convert_element_type` primitive."""
 
 from __future__ import annotations
 

From 345d1bb031bc79e2d821552f9d6ba9c6cdef4519 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 24 May 2024 14:34:20 +0200
Subject: [PATCH 244/458] Added copy (`copy` and `device_put`) translators,
 however, there is no tests for them yet.

`device_put` is actually a very powerfull operation, such as Memlets, where source and destination are on different devices.
However, we do not support something like that yet, so we will keep it down yet.
---
 .../primitive_translators/__init__.py         |  3 +
 .../primitive_translators/copy_translator.py  | 70 +++++++++++++++++++
 tests/test_subtranslator_helper.py            |  2 +-
 3 files changed, 74 insertions(+), 1 deletion(-)
 create mode 100644 src/jace/translator/primitive_translators/copy_translator.py

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 7c8cfb1..c9e76ce 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -11,6 +11,7 @@
 from .alu_translators import ALUTranslator
 from .broadcast_in_dim_translator import BroadcastInDimTranslator
 from .convert_element_type_translator import ConvertElementTypeTranslator
+from .copy_translator import CopyTranslator, DevicePutTranslator
 from .iota_translator import IotaTranslator
 from .reshape_translator import ReshapeTranslator
 from .squeeze_translator import SqueezeTranslator
@@ -20,6 +21,8 @@
     "ALUTranslator",
     "BroadcastInDimTranslator",
     "ConvertElementTypeTranslator",
+    "CopyTranslator",
+    "DevicePutTranslator",
     "IotaTranslator",
     "ReshapeTranslator",
     "SqueezeTranslator",
diff --git a/src/jace/translator/primitive_translators/copy_translator.py b/src/jace/translator/primitive_translators/copy_translator.py
new file mode 100644
index 0000000..145b146
--- /dev/null
+++ b/src/jace/translator/primitive_translators/copy_translator.py
@@ -0,0 +1,70 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements the translator related to data movement."""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+
+from jax import core as jax_core
+from typing_extensions import override
+
+from jace import translator
+from jace.translator.primitive_translators.mapped_operation_base_translator import (
+    MappedOperationTranslatorBase,
+)
+
+
+class CopyTranslator(MappedOperationTranslatorBase):
+    """Copy operations are implemented as a map to ensure that they can be fused with other maps."""
+
+    __slots__ = ()
+
+    def __init__(self) -> None:
+        super().__init__(primitive_name="copy")
+
+    @override
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        return "__in0"
+
+
+class DevicePutTranslator(MappedOperationTranslatorBase):
+    """The `device_put` primitive is used to transfer data between host and device.
+
+    The current implementation only supports the copying where the data already is.
+    Currently DaCe only knows about the Host and the GPU.
+    Furthermore, currently Jace works in such a way that everything is either put on the host or the device.
+    Because of this, the `DevicePutTranslator` is, currently, just a simple copy operation that should be removed, by the optimization.
+    """
+
+    __slots__ = ()
+
+    def __init__(self) -> None:
+        super().__init__(primitive_name="device_put")
+
+    @override
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        if not (eqn.params["device"] is None and eqn.params["src"] is None):
+            raise NotImplementedError(
+                f"Can only copy on the host, but not from {eqn.params['src']} to {eqn.params['device']}."
+            )
+        return "__in0"
+
+
+_ = translator.register_primitive_translator(CopyTranslator())
+_ = translator.register_primitive_translator(DevicePutTranslator())
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index f108e08..b72bffb 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -73,7 +73,7 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_regsitered_primitive_translators()) == 42
+    assert len(get_regsitered_primitive_translators()) == 44
 
 
 def test_subtranslatior_managing(no_builtin_translators):

From 979f4ec6ded5be6c2b596b73859c3eb1f84eb738 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 27 May 2024 08:30:29 +0200
Subject: [PATCH 245/458] Made some small modifications.

---
 src/jace/util/compiling.py | 9 +++++++--
 tests/test_caching.py      | 4 +---
 2 files changed, 8 insertions(+), 5 deletions(-)

diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index 657ef30..17568e0 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -12,6 +12,8 @@
 
 from __future__ import annotations
 
+import os
+import pathlib
 import time
 from collections.abc import Mapping, Sequence
 from typing import TYPE_CHECKING, Any
@@ -51,13 +53,16 @@ def compile_jax_sdfg(
     try:
         # We need to give the SDFG another name, this is needed to prevent a DaCe error/warning.
         #  This happens if we compile the same lowered SDFG multiple times with different options.
-        sdfg.name = f"{sdfg.name}__comp_{int(time.time() * 1000)}"
+        sdfg.name = f"{sdfg.name}__comp_{int(time.time() * 1000)}_{os.getpid()}"
+        assert len(sdfg.name) < 255
 
         # Actual compiling the stuff; forcing that a recompilation happens
         with dace.config.temporary_config():
+            dace.Config.set("compiler", "use_cache", value=False)
+            dace.Config.set("cache", value="name")
+            dace.Config.set("default_build_folder", value=pathlib.Path(".jacecache").resolve())
             sdfg._recompile = True
             sdfg._regenerate_code = True
-            dace.Config.set("compiler", "use_cache", value=False)
             csdfg: jdace.CompiledSDFG = sdfg.compile()
 
     finally:
diff --git a/tests/test_caching.py b/tests/test_caching.py
index 2d34eda..e19e259 100644
--- a/tests/test_caching.py
+++ b/tests/test_caching.py
@@ -18,7 +18,7 @@
 
 import jace
 from jace import optimization
-from jace.jax import stages
+from jace.jax import stages, translation_cache as tcache
 
 
 @pytest.fixture(autouse=True)
@@ -30,8 +30,6 @@ def _clear_translation_cache():
     Todo:
         Ask Enrique how I can make that fixture apply everywhere not just in the file but the whole test suite.
     """
-    from jace.jax import translation_cache as tcache
-
     tcache.clear_translation_cache()
     yield
     tcache.clear_translation_cache()

From 2d2c160c397c6b085d627300f5cf2cdde088c404 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 27 May 2024 08:40:19 +0200
Subject: [PATCH 246/458] Reloacated some code.

---
 .../mapped_operation_base_translator.py                   | 0
 .../translator/primitive_translators/alu_translators.py   | 6 ++----
 .../primitive_translators/broadcast_in_dim_translator.py  | 6 ++----
 .../convert_element_type_translator.py                    | 6 ++----
 .../translator/primitive_translators/copy_translator.py   | 8 +++-----
 .../translator/primitive_translators/iota_translator.py   | 6 ++----
 .../primitive_translators/squeeze_translator.py           | 6 ++----
 7 files changed, 13 insertions(+), 25 deletions(-)
 rename src/jace/translator/{primitive_translators => }/mapped_operation_base_translator.py (100%)

diff --git a/src/jace/translator/primitive_translators/mapped_operation_base_translator.py b/src/jace/translator/mapped_operation_base_translator.py
similarity index 100%
rename from src/jace/translator/primitive_translators/mapped_operation_base_translator.py
rename to src/jace/translator/mapped_operation_base_translator.py
diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index 29e50eb..f4eb304 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -16,12 +16,10 @@
 from typing_extensions import override
 
 from jace import translator
-from jace.translator.primitive_translators.mapped_operation_base_translator import (
-    MappedOperationTranslatorBase,
-)
+from jace.translator import mapped_operation_base_translator as mapped_base
 
 
-class ALUTranslator(MappedOperationTranslatorBase):
+class ALUTranslator(mapped_base.MappedOperationTranslatorBase):
     """Translator for all arithmetic and logical operations.
 
     The class uses `MappedOperationBaseTranslator` for generating the maps.
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
index f85e43f..9194e57 100644
--- a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -16,12 +16,10 @@
 from typing_extensions import override
 
 from jace import translator
-from jace.translator.primitive_translators.mapped_operation_base_translator import (
-    MappedOperationTranslatorBase,
-)
+from jace.translator import mapped_operation_base_translator as mapped_base
 
 
-class BroadcastInDimTranslator(MappedOperationTranslatorBase):
+class BroadcastInDimTranslator(mapped_base.MappedOperationTranslatorBase):
     """This handles the `broadcast_in_dim` primitives."""
 
     __slots__ = ()
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index bc7304b..cd6da52 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -17,12 +17,10 @@
 from typing_extensions import override
 
 from jace import translator
-from jace.translator.primitive_translators.mapped_operation_base_translator import (
-    MappedOperationTranslatorBase,
-)
+from jace.translator import mapped_operation_base_translator as mapped_base
 
 
-class ConvertElementTypeTranslator(MappedOperationTranslatorBase):
+class ConvertElementTypeTranslator(mapped_base.MappedOperationTranslatorBase):
     """Implements the `convert_element_type` primitive.
 
     Copies the input to the output and performs type conversion.
diff --git a/src/jace/translator/primitive_translators/copy_translator.py b/src/jace/translator/primitive_translators/copy_translator.py
index 145b146..19634ae 100644
--- a/src/jace/translator/primitive_translators/copy_translator.py
+++ b/src/jace/translator/primitive_translators/copy_translator.py
@@ -15,12 +15,10 @@
 from typing_extensions import override
 
 from jace import translator
-from jace.translator.primitive_translators.mapped_operation_base_translator import (
-    MappedOperationTranslatorBase,
-)
+from jace.translator import mapped_operation_base_translator as mapped_base
 
 
-class CopyTranslator(MappedOperationTranslatorBase):
+class CopyTranslator(mapped_base.MappedOperationTranslatorBase):
     """Copy operations are implemented as a map to ensure that they can be fused with other maps."""
 
     __slots__ = ()
@@ -38,7 +36,7 @@ def write_tasklet_code(
         return "__in0"
 
 
-class DevicePutTranslator(MappedOperationTranslatorBase):
+class DevicePutTranslator(mapped_base.MappedOperationTranslatorBase):
     """The `device_put` primitive is used to transfer data between host and device.
 
     The current implementation only supports the copying where the data already is.
diff --git a/src/jace/translator/primitive_translators/iota_translator.py b/src/jace/translator/primitive_translators/iota_translator.py
index 218cce8..6283240 100644
--- a/src/jace/translator/primitive_translators/iota_translator.py
+++ b/src/jace/translator/primitive_translators/iota_translator.py
@@ -16,12 +16,10 @@
 from typing_extensions import override
 
 from jace import translator
-from jace.translator.primitive_translators.mapped_operation_base_translator import (
-    MappedOperationTranslatorBase,
-)
+from jace.translator import mapped_operation_base_translator as mapped_base
 
 
-class IotaTranslator(MappedOperationTranslatorBase):
+class IotaTranslator(mapped_base.MappedOperationTranslatorBase):
     """This handles the `iota` primitives.
 
     Essentially a very general `jnp.arange()` function.
diff --git a/src/jace/translator/primitive_translators/squeeze_translator.py b/src/jace/translator/primitive_translators/squeeze_translator.py
index 85f7b3d..82d9427 100644
--- a/src/jace/translator/primitive_translators/squeeze_translator.py
+++ b/src/jace/translator/primitive_translators/squeeze_translator.py
@@ -15,12 +15,10 @@
 from typing_extensions import override
 
 from jace import translator
-from jace.translator.primitive_translators.mapped_operation_base_translator import (
-    MappedOperationTranslatorBase,
-)
+from jace.translator import mapped_operation_base_translator as mapped_base
 
 
-class SqueezeTranslator(MappedOperationTranslatorBase):
+class SqueezeTranslator(mapped_base.MappedOperationTranslatorBase):
     """Allows to remove dimensions with size one.
 
     Essentially equivalent to `np.squeeze` and the inverse to `np.expand_dims()`.

From 8adae421bdb928d04904e44de16c5536cd7da95e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 27 May 2024 09:56:40 +0200
Subject: [PATCH 247/458] Added a transformation for `slice`.

It is not yet dynamic sclice, but soon.
---
 .../primitive_translators/__init__.py         |   2 +
 .../primitive_translators/slicing.py          |  66 +++++++++
 tests/test_sub_translators_slicing.py         | 136 ++++++++++++++++++
 tests/test_subtranslator_helper.py            |   2 +-
 4 files changed, 205 insertions(+), 1 deletion(-)
 create mode 100644 src/jace/translator/primitive_translators/slicing.py
 create mode 100644 tests/test_sub_translators_slicing.py

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index c9e76ce..8d73695 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -14,6 +14,7 @@
 from .copy_translator import CopyTranslator, DevicePutTranslator
 from .iota_translator import IotaTranslator
 from .reshape_translator import ReshapeTranslator
+from .slicing import SlicingTranslator
 from .squeeze_translator import SqueezeTranslator
 
 
@@ -26,4 +27,5 @@
     "IotaTranslator",
     "ReshapeTranslator",
     "SqueezeTranslator",
+    "SlicingTranslator",
 ]
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
new file mode 100644
index 0000000..d70580f
--- /dev/null
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -0,0 +1,66 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements slicing."""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+
+import dace
+from jax import core as jax_core
+from typing_extensions import override
+
+from jace import translator
+from jace.translator import mapped_operation_base_translator as mapped_base
+
+
+class SlicingTranslator(mapped_base.MappedOperationTranslatorBase):
+    """Implements the classical slicing operation.
+
+    It is basically a copy Tasklet that only copies parts of the input.
+    Note that there is also `dynamic_slice`.
+    """
+
+    __slots__ = ()
+
+    def __init__(self) -> None:
+        super().__init__(primitive_name="slice")
+
+    @override
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        return "__in0"
+
+    @override
+    def make_input_memlets(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        """We have to add the offsets to the Memlet accesses."""
+        if eqn.params["strides"] is not None:
+            raise NotImplementedError("Non 1 strides are not implemented.")
+
+        start_indices = eqn.params["start_indices"]  # Fist index to slice
+        return {
+            "__in0": dace.Memlet.simple(
+                in_var_names[0],
+                ", ".join(
+                    f"{it_idx} + {start_index}"
+                    for (it_idx, _), start_index in zip(tskl_ranges, start_indices)
+                ),
+            )
+        }
+
+
+translator.register_primitive_translator(SlicingTranslator())
diff --git a/tests/test_sub_translators_slicing.py b/tests/test_sub_translators_slicing.py
new file mode 100644
index 0000000..3317da6
--- /dev/null
+++ b/tests/test_sub_translators_slicing.py
@@ -0,0 +1,136 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements tests for slicing translator."""
+
+from __future__ import annotations
+
+import numpy as np
+import pytest
+
+import jace
+
+
+@pytest.fixture()
+def A_4x4():
+    return np.arange(16).reshape((4, 4))
+
+
+def test_slice_sub_view(A_4x4):
+    """Simple extraction of a subsize."""
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A[1:3, 1:3]
+
+    ref = A_4x4[1:3, 1:3]
+    res = testee(A_4x4)
+
+    assert ref.shape == res.shape
+    assert np.all(ref == res)
+
+
+def test_slice_rslice(A_4x4):
+    """Only slicing some rows."""
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A[1:3]
+
+    ref = A_4x4[1:3]
+    res = testee(A_4x4)
+
+    assert ref.shape == res.shape
+    assert np.all(ref == res)
+
+
+def test_slice_cslice(A_4x4):
+    """Slicing some columns."""
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        # NOTE: using `A[..., 1:3]` would trigger the `gather` primitive.
+        return A[:, 1:3]
+
+    ref = A_4x4[:, 1:3]
+    res = testee(A_4x4)
+
+    assert ref.shape == res.shape
+    assert np.all(ref == res)
+
+
+def test_slice_singelton(A_4x4):
+    """Only extracting a single value."""
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A[1:2, 1:2]
+
+    ref = A_4x4[1:2, 1:2]
+    res = testee(A_4x4)
+
+    assert ref.shape == res.shape
+    assert np.all(ref == res)
+
+
+@pytest.mark.skip(reason="Missing 'gather' translator.")
+def test_slice_strides_vec():
+    """Using strides.
+
+    Note:
+        Although we do not support the `strides` parameter of the `stride` primitive,
+        this is not the reason why the test fails.
+        It fails instead because Jax makes some strange gather stuff out of it.
+    """
+
+    A = np.arange(16)
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A[1:15:2]
+
+    ref = A[1:15:2]
+    res = testee(A)
+
+    assert ref.shape == res.shape
+    assert np.all(ref == res)
+
+
+@pytest.mark.skip(reason="Missing 'concatenate' translator.")
+def test_slice_strides(A_4x4):
+    """Using strides in a 2D matrix.
+
+    See `test_slice_strides_vec()` why the test is skipped.
+    """
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A[::2, ::2]
+
+    ref = A_4x4[::2, ::2]
+    res = testee(A_4x4)
+
+    assert ref.shape == res.shape
+    assert np.all(ref == res)
+
+
+def test_slice_too_big(A_4x4):
+    """Tests what happens if we specify a size that is too big.
+
+    Note:
+        It seems that the array is just returned as it is.
+    """
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A[:20]
+
+    res = testee(A_4x4)
+    ref = A_4x4[:20]
+
+    assert ref.shape == res.shape
+    assert np.all(ref == res)
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index b72bffb..174950c 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -73,7 +73,7 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_regsitered_primitive_translators()) == 44
+    assert len(get_regsitered_primitive_translators()) == 45
 
 
 def test_subtranslatior_managing(no_builtin_translators):

From 011a2d6db63dd3c3caeac19db7ada6467099c2ac Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 27 May 2024 10:47:56 +0200
Subject: [PATCH 248/458] Subclasses of mapped base now have to include the
 assignment to return value.

This restirction was removed commit `05e4a885441c0cd`.
However, I realized that it made some higher level translators impossible to write, such as `select_n`.
Thus I removed this restriction again.

Another solution would be to add another layer.
---
 .../mapped_operation_base_translator.py       |  9 ++-
 .../primitive_translators/alu_translators.py  | 74 +++++++++----------
 .../broadcast_in_dim_translator.py            |  2 +-
 .../convert_element_type_translator.py        |  6 +-
 .../primitive_translators/copy_translator.py  |  4 +-
 .../primitive_translators/iota_translator.py  |  2 +-
 .../primitive_translators/slicing.py          |  2 +-
 .../squeeze_translator.py                     |  2 +-
 8 files changed, 51 insertions(+), 50 deletions(-)

diff --git a/src/jace/translator/mapped_operation_base_translator.py b/src/jace/translator/mapped_operation_base_translator.py
index 100f5d9..f4ab189 100644
--- a/src/jace/translator/mapped_operation_base_translator.py
+++ b/src/jace/translator/mapped_operation_base_translator.py
@@ -33,7 +33,7 @@ class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
     Thus this class acts like a convenience wrapper around it.
 
     To use this class a user has to overwrite the `write_tasklet_code()` function.
-    This function generates the right hand side of the assignment code, i.e. everything after `__out =`.
+    This function generates the entire code that should be put into the Tasklet, include the assignment to `__out`.
     If needed the translator will perform literal substitution on the returned code and broadcast the inputs to match the outputs.
 
     Notes:
@@ -107,7 +107,7 @@ def __call__(
             name=tskl_name,
             map_ranges=tskl_ranges,
             inputs=tskl_inputs,
-            code=f"__out = {tskl_code}",
+            code=tskl_code,
             outputs=tskl_output,
             external_edges=True,
         )
@@ -121,9 +121,10 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        """Return the code that should be put at the left hand side of the assignment statement inside the Tasklet.
+        """Return the (Python) code that should be put inside the Tasklet.
 
-        Literal substitution is allied to the returned code.
+        This also includes the assignment statement, i.e. `__out`.
+        However, the base will do literal substitution on the returned object.
 
         Args:
             tskl_ranges:    The iteration indexes used by the map, first element is the iteration index itself,
diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index f4eb304..bb70572 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -60,45 +60,45 @@ def write_tasklet_code(
 # fmt: off
 _ALU_OPS_TMPL: Final[dict[str, str]] = {
     # Unary operations
-    "pos": "+(__in0)",
-    "neg": "-(__in0)",
-    "not": "not (__in0)",
-    "floor": "floor(__in0)",
-    "ceil": "ceil(__in0)",
-    "round": "round(__in0)",
-    "abs": "abs(__in0)",
-    "sign": "sign(__in0)",
-    "sqrt": "sqrt(__in0)",
-    "log": "log(__in0)",
-    "exp": "exp(__in0)",
-    "integer_pow": "(__in0)**({y})",  # 'y' is a parameter of the primitive
-    "sin": "sin(__in0)",
-    "asin": "asin(__in0)",
-    "cos": "cos(__in0)",
-    "acos": "acos(__in0)",
-    "tan": "tan(__in0)",
-    "atan": "atan(__in0)",
-    "tanh": "tanh(__in0)",
+    "pos": "__out = +(__in0)",
+    "neg": "__out = -(__in0)",
+    "not": "__out = not (__in0)",
+    "floor": "__out = floor(__in0)",
+    "ceil": "__out = ceil(__in0)",
+    "round": "__out = round(__in0)",
+    "abs": "__out = abs(__in0)",
+    "sign": "__out = sign(__in0)",
+    "sqrt": "__out = sqrt(__in0)",
+    "log": "__out = log(__in0)",
+    "exp": "__out = exp(__in0)",
+    "integer_pow": "__out = (__in0)**({y})",  # 'y' is a parameter of the primitive
+    "sin": "__out = sin(__in0)",
+    "asin": "__out = asin(__in0)",
+    "cos": "__out = cos(__in0)",
+    "acos": "__out = acos(__in0)",
+    "tan": "__out = tan(__in0)",
+    "atan": "__out = atan(__in0)",
+    "tanh": "__out = tanh(__in0)",
 
     # Binary operations
-    "add": "(__in0)+(__in1)",
-    "add_any": "(__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
-    "sub": "(__in0)-(__in1)",
-    "mul": "(__in0)*(__in1)",
-    "div": "(__in0)/(__in1)",
-    "rem": "(__in0)%(__in1)",
-    "and": "(__in0) and (__in1)",
-    "or": "(__in0) or  (__in1)",
-    "pow": "(__in0)**(__in1)",
-    "ipow": "(__in0)**(int(__in1))",
-    "min": "min(__in0, __in1)",
-    "max": "max(__in0, __in1)",
-    "eq": "__in0 == __in1",
-    "ne": "__in0 != __in1",
-    "ge": "__in0 >= __in1",
-    "gt": "__in0 > __in1",
-    "le": "__in0 <= __in1",
-    "lt": "__in0 < __in1",
+    "add": "__out = (__in0)+(__in1)",
+    "add_any": "__out = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
+    "sub": "__out = (__in0)-(__in1)",
+    "mul": "__out = (__in0)*(__in1)",
+    "div": "__out = (__in0)/(__in1)",
+    "rem": "__out = (__in0)%(__in1)",
+    "and": "__out = (__in0) and (__in1)",
+    "or": "__out = (__in0) or  (__in1)",
+    "pow": "__out = (__in0)**(__in1)",
+    "ipow": "__out = (__in0)**(int(__in1))",
+    "min": "__out = min(__in0, __in1)",
+    "max": "__out = max(__in0, __in1)",
+    "eq": "__out = __in0 == __in1",
+    "ne": "__out = __in0 != __in1",
+    "ge": "__out = __in0 >= __in1",
+    "gt": "__out = __in0 > __in1",
+    "le": "__out = __in0 <= __in1",
+    "lt": "__out = __in0 < __in1",
 }
 
 # Create the ALU translators
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
index 9194e57..e03c0f0 100644
--- a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -34,7 +34,7 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        return "__in0"
+        return "__out = __in0"
 
     @override
     def make_input_memlets(
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index cd6da52..44ba62d 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -68,11 +68,11 @@ def write_tasklet_code(
                 category=UserWarning,
                 stacklevel=1,  # Find a better one
             )
-            return conv_code
+            return f"__out = {conv_code}"
         if in_dtype_s.startswith("bool") and out_dtype_s.startswith("int"):
             # Interestingly `__out = int(__in0)` will at some DaCe processing stage.
             #  See commit `f5aabc` of the prototype.
-            return f"(1 if {conv_code} else 0)"
+            return f"__out = (1 if {conv_code} else 0)"
 
         # The general case
         if out_dtype_s == "bool":
@@ -83,7 +83,7 @@ def write_tasklet_code(
             raise NotImplementedError(
                 f"Cannot convert '{in_dtype}' to '{out_dtype}' as this type is not known to DaCe."
             )
-        return conv_code
+        return f"__out = {conv_code}"
 
 
 _ = translator.register_primitive_translator(ConvertElementTypeTranslator())
diff --git a/src/jace/translator/primitive_translators/copy_translator.py b/src/jace/translator/primitive_translators/copy_translator.py
index 19634ae..1ff170e 100644
--- a/src/jace/translator/primitive_translators/copy_translator.py
+++ b/src/jace/translator/primitive_translators/copy_translator.py
@@ -33,7 +33,7 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        return "__in0"
+        return "__out = __in0"
 
 
 class DevicePutTranslator(mapped_base.MappedOperationTranslatorBase):
@@ -61,7 +61,7 @@ def write_tasklet_code(
             raise NotImplementedError(
                 f"Can only copy on the host, but not from {eqn.params['src']} to {eqn.params['device']}."
             )
-        return "__in0"
+        return "__out = __in0"
 
 
 _ = translator.register_primitive_translator(CopyTranslator())
diff --git a/src/jace/translator/primitive_translators/iota_translator.py b/src/jace/translator/primitive_translators/iota_translator.py
index 6283240..b64c138 100644
--- a/src/jace/translator/primitive_translators/iota_translator.py
+++ b/src/jace/translator/primitive_translators/iota_translator.py
@@ -37,7 +37,7 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        return f"{tskl_ranges[eqn.params['dimension']][0]}"
+        return f"__out = {tskl_ranges[eqn.params['dimension']][0]}"
 
     @override
     def make_input_memlets(
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index d70580f..2f4405e 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -38,7 +38,7 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        return "__in0"
+        return "__out = __in0"
 
     @override
     def make_input_memlets(
diff --git a/src/jace/translator/primitive_translators/squeeze_translator.py b/src/jace/translator/primitive_translators/squeeze_translator.py
index 82d9427..f699a63 100644
--- a/src/jace/translator/primitive_translators/squeeze_translator.py
+++ b/src/jace/translator/primitive_translators/squeeze_translator.py
@@ -36,7 +36,7 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        return "__in0"
+        return "__out = __in0"
 
     @override
     def make_input_memlets(

From a3ac86888fca9ff560b239d779a11eb4fb2fa5ce Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 27 May 2024 11:49:07 +0200
Subject: [PATCH 249/458] Implemented a test for teh `select_n` primitive.

I also observe random failures for the `test_iota_broadcast()` test if I run all tests.
However, if I only run it, then nothing happens, I have no idea why.
---
 .../primitive_translators/__init__.py         |  4 +-
 .../select_n_translator.py                    | 82 +++++++++++++++++
 tests/test_sub_translators_select_n.py        | 91 +++++++++++++++++++
 tests/test_subtranslator_helper.py            |  2 +-
 4 files changed, 177 insertions(+), 2 deletions(-)
 create mode 100644 src/jace/translator/primitive_translators/select_n_translator.py
 create mode 100644 tests/test_sub_translators_select_n.py

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 8d73695..7e86238 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -14,6 +14,7 @@
 from .copy_translator import CopyTranslator, DevicePutTranslator
 from .iota_translator import IotaTranslator
 from .reshape_translator import ReshapeTranslator
+from .select_n_translator import SelectNTranslator
 from .slicing import SlicingTranslator
 from .squeeze_translator import SqueezeTranslator
 
@@ -26,6 +27,7 @@
     "DevicePutTranslator",
     "IotaTranslator",
     "ReshapeTranslator",
-    "SqueezeTranslator",
+    "SelectNTranslator",
     "SlicingTranslator",
+    "SqueezeTranslator",
 ]
diff --git a/src/jace/translator/primitive_translators/select_n_translator.py b/src/jace/translator/primitive_translators/select_n_translator.py
new file mode 100644
index 0000000..75a719b
--- /dev/null
+++ b/src/jace/translator/primitive_translators/select_n_translator.py
@@ -0,0 +1,82 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements `select_n`."""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+
+import dace
+from jax import core as jax_core
+from typing_extensions import override
+
+from jace import translator
+from jace.translator import mapped_operation_base_translator as mapped_base
+
+
+class SelectNTranslator(mapped_base.MappedOperationTranslatorBase):
+    """Implements the `select_n` primitive, which is a generalization of `np.where`
+
+    While `numpy.where` only supports two cases, the Jax primitive supports an arbitrary number of cases.
+    In that sense it is essentially a `C` `switch` statement, only that all cases have to materialize.
+
+    The behaviour is undefined if the predicate is out of bound.
+
+    Note:
+        For a better understanding this function renames its input connectors.
+        The first one, which is the predicate, is renamed to `__cond` and the others are renamed again to `__in{i}`, starting with zero.
+    """
+
+    __slots__ = ()
+
+    def __init__(self) -> None:
+        super().__init__(primitive_name="select_n")
+
+    @override
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        """Writes the selection code.
+
+        Literal substitution is deferred to the base.
+        """
+
+        if len(in_var_names) == 3:
+            # This order is correct, since `False` is interpreted as `0`, which means the first case.
+            #  DaCe seems to have some problems with bools and integer casting around, so we habdle
+            #  the bool case explicitly here; See also the `ConvertElementTypeTranslator`.
+            return "__out = __in1 if __cond else __in0"
+
+        return "\n".join(
+            ["if __cond == 0:  __out = __in0"]
+            + [f"elif __cond == {i}: __out = __in{i}" for i in range(1, len(in_var_names) - 1)]
+        )
+
+    @override
+    def make_input_memlets(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        """We have to add the offsets to the Memlet accesses."""
+        assert all(in_var_names)
+        return {
+            f"__in{i-1}" if i else "__cond": dace.Memlet.simple(
+                in_var_name,
+                ", ".join(f"{it_idx}" for it_idx, _ in tskl_ranges),
+            )
+            for i, in_var_name in enumerate(in_var_names)
+            if in_var_name
+        }
+
+
+translator.register_primitive_translator(SelectNTranslator())
diff --git a/tests/test_sub_translators_select_n.py b/tests/test_sub_translators_select_n.py
new file mode 100644
index 0000000..dd2002c
--- /dev/null
+++ b/tests/test_sub_translators_select_n.py
@@ -0,0 +1,91 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Tests the `select_n` translator."""
+
+from __future__ import annotations
+
+from typing import Any
+
+import jax
+import numpy as np
+import pytest
+from jax import numpy as jnp
+
+import jace
+
+
+@pytest.fixture(autouse=True)
+def _disable_jit():
+    """Decorator that ensures that `select_n` is not put in an implicit `jit`.
+
+    The reason we do this is because we can currently not handle this nested jits.
+    It is important that it also disabled explicit usage of `jax.jit`.
+    However, since Jace does not honor this flag we it does not affect us.
+
+    Todo:
+        Remove as soon as we can handle nested `jit`.
+    """
+    with jax.disable_jit(disable=True):
+        yield
+
+
+@pytest.fixture()
+def Pred() -> np.ndarray:
+    return np.random.random((10, 10)) > 0.5  # noqa: NPY002
+
+
+@pytest.fixture()
+def tbranch() -> np.ndarray:
+    return np.ones((10, 10))
+
+
+@pytest.fixture()
+def fbranch() -> np.ndarray:
+    return np.ones((10, 10))
+
+
+def _perform_test(P: Any, T: Any, F: Any):
+    def testee(P: Any, T: Any, F: Any):
+        return jnp.where(P, T, F)
+
+    res = testee(P, T, F)
+    ref = jace.jit(testee)(P, T, F)
+
+    assert np.all(res == ref)
+
+
+def test_select_n_where(Pred, tbranch, fbranch):
+    """Normal `np.where` test."""
+    _perform_test(Pred, tbranch, fbranch)
+
+
+def test_select_n_where_one_literal(Pred, tbranch, fbranch):
+    """`np.where` where one of the input is a literal."""
+    _perform_test(Pred, 2, fbranch)
+    _perform_test(Pred, tbranch, 3)
+
+
+def test_select_n_where_full_literal(Pred):
+    """`np.where` where all inputs are literals."""
+    _perform_test(Pred, 8, 9)
+
+
+def test_select_n_many_inputs():
+    """Tests the generalized way of using the primitive."""
+    nbcases = 5
+    shape = (10, 10)
+    cases = [np.full(shape, i) for i in range(nbcases)]
+    pred = np.arange(cases[0].size).reshape(shape) % 5
+
+    def testee(pred: np.ndarray, *cases: np.ndarray) -> np.ndarray:
+        return jax.lax.select_n(pred, *cases)
+
+    ref = testee(pred, *cases)
+    res = jace.jit(testee)(pred, *cases)
+
+    assert np.all(ref == res)
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 174950c..5298b1d 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -73,7 +73,7 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_regsitered_primitive_translators()) == 45
+    assert len(get_regsitered_primitive_translators()) == 46
 
 
 def test_subtranslatior_managing(no_builtin_translators):

From 5f186f66144a1dabe1b0d98897ae88ddae6d9466 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 27 May 2024 15:57:33 +0200
Subject: [PATCH 250/458] First, chunk of work.

---
 src/jace/__init__.py                          |   7 -
 src/jace/jax/api.py                           |  40 ++--
 src/jace/jax/stages.py                        | 139 ++++++------
 src/jace/jax/translation_cache.py             | 159 +++++++-------
 .../translator/jaxpr_translator_driver.py     | 200 ++++++++----------
 src/jace/translator/primitive_translator.py   |  74 +++----
 tests/test_jaxpr_translator_driver.py         |  10 +-
 7 files changed, 294 insertions(+), 335 deletions(-)

diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index aad3265..05d9632 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -17,13 +17,6 @@
 from .jax import grad, jacfwd, jacrev, jit
 
 
-# In Jax `float32` is the main datatype, and they go to great lengths to avoid
-#  some aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
-#  However, in this case we will have problems when we call the SDFG, for some reasons
-#  `CompiledSDFG` does not work in that case correctly, thus we enable it now globally.
-_jax.config.update("jax_enable_x64", True)
-
-
 __all__ = [
     "__author__",
     "__copyright__",
diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
index a46702b..a214f5a 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/jax/api.py
@@ -19,11 +19,19 @@
 from jace.jax import stages
 
 
+__all__ = [
+    "grad",
+    "jit",
+    "jacfwd",
+    "jacrev",
+]
+
+
 @overload
 def jit(
     fun: Literal[None] = None,
     /,
-    sub_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
+    primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
 ) -> Callable[[Callable], stages.JaceWrapped]: ...
 
@@ -32,7 +40,7 @@ def jit(
 def jit(
     fun: Callable,
     /,
-    sub_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
+    primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
 ) -> stages.JaceWrapped: ...
 
@@ -40,7 +48,7 @@ def jit(
 def jit(
     fun: Callable | None = None,
     /,
-    sub_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
+    primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
 ) -> stages.JaceWrapped | Callable[[Callable], stages.JaceWrapped]:
     """Jace's replacement for `jax.jit` (just-in-time) wrapper.
@@ -50,36 +58,28 @@ def jit(
     In addition it accepts some Jace specific arguments.
 
     Args:
-        sub_translators:    Use these subtranslators for the lowering to DaCe.
+        primitive_translators:    Use these primitive translators for the lowering to SDFG.
 
     Notes:
-        If no subtranslators are specified then the ones that are currently active,
-        i.e. the output of `get_regsitered_primitive_translators()`, are used.
-        After construction changes to the passed `sub_translators` have no effect on the returned object.
+        If no translators are specified the currently ones currently inside the global registry are used.
+        After construction changes to the passed `primitive_translators` have no effect on the returned object.
     """
     if kwargs:
+        # TODO(phimuell): Add proper name verification and exception type.
         raise NotImplementedError(
-            f"The following arguments of 'jax.jit' are not yet supported by jace: {', '.join(kwargs.keys())}."
+            f"The following arguments to 'jace.jit' are not yet supported: {', '.join(kwargs)}."
         )
 
     def wrapper(f: Callable) -> stages.JaceWrapped:
         jace_wrapper = stages.JaceWrapped(
             fun=f,
-            sub_translators=(
+            primitive_translators=(
                 translator.managing._PRIMITIVE_TRANSLATORS_DICT
-                if sub_translators is None
-                else sub_translators
+                if primitive_translators is None
+                else primitive_translators
             ),
-            jit_ops=kwargs,
+            jit_options=kwargs,
         )
         return functools.update_wrapper(jace_wrapper, f)
 
     return wrapper if fun is None else wrapper(fun)
-
-
-__all__ = [
-    "grad",
-    "jit",
-    "jacfwd",
-    "jacrev",
-]
diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
index 5ad907e..9a0218f 100644
--- a/src/jace/jax/stages.py
+++ b/src/jace/jax/stages.py
@@ -34,47 +34,49 @@
 from jace.jax import translation_cache as tcache
 from jace.optimization import CompilerOptions
 from jace.translator import post_translation as ptrans
-from jace.util import dace_helper as jdace
+from jace.util import dace_helper
 
 
-class JaceWrapped(tcache.CachingStage):
+class JaceWrapped(tcache.CachingStage["JaceLowered"]):
     """A function ready to be specialized, lowered, and compiled.
 
     This class represents the output of functions such as `jace.jit()`.
-    Calling it results in jit (just-in-time) lowering, compilation, and execution.
-    It can also be explicitly lowered prior to compilation, and the result compiled prior to execution.
-
-    You should not create `JaceWrapped` instances directly, instead you should use `jace.jit`.
+    Calling it results in jit (just-in-time) lowering, compilation and execution.
+    It is also possible to lower the function explicitly by calling `self.lower()`.
+    This function can be composed with other Jax transformations.
 
     Todo:
         - Handle pytrees.
+        - Handle all options to `jax.jit`.
+
+    Note:
+        The tracing of function will always happen with enabled `x64` mode, which is implicitly
+        and temporary activated during tracing. Furthermore, the disable JIT config flag is ignored.
     """
 
     _fun: Callable
-    _sub_translators: dict[str, translator.PrimitiveTranslator]
-    _jit_ops: dict[str, Any]
+    _primitive_translators: dict[str, translator.PrimitiveTranslator]
+    _jit_options: dict[str, Any]
 
     def __init__(
         self,
         fun: Callable,
-        sub_translators: Mapping[str, translator.PrimitiveTranslator],
-        jit_ops: Mapping[str, Any],
+        primitive_translators: Mapping[str, translator.PrimitiveTranslator],
+        jit_options: Mapping[str, Any],
     ) -> None:
         """Creates a wrapped jitable object of `fun`.
 
-        You should not create `JaceWrapped` instances directly, instead you should use `jace.jit`.
-
         Args:
-            fun:                The function that is wrapped.
-            sub_translators:    The list of subtranslators that that should be used.
-            jit_ops:            All options that we forward to `jax.jit`.
+            fun:                    The function that is wrapped.
+            primitive_translators:  The list of subtranslators that that should be used.
+            jit_options:            Options to influence the jit process.
         """
         super().__init__()
         # We have to shallow copy both the translator and the jit options.
         #  This prevents that any modifications affect `self`.
         #  Shallow is enough since the translators themselves are immutable.
-        self._sub_translators = dict(sub_translators)
-        self._jit_ops = dict(jit_ops)
+        self._primitive_translators = dict(primitive_translators)
+        self._jit_options = dict(jit_options)
         self._fun = fun
 
     def __call__(
@@ -84,22 +86,16 @@ def __call__(
     ) -> Any:
         """Executes the wrapped function, lowering and compiling as needed in one step."""
 
-        # TODO(phimuell): Handle the `disable_jit` context manager of Jax.
-
-        # This allows us to be composable with Jax transformations.
+        # If we are inside a traced context, then we forward the call to the wrapped function.
+        #  This ensures that Jace is composable with Jax.
         if util.is_tracing_ongoing(*args, **kwargs):
-            # TODO(phimuell): Handle the case of gradients:
-            #                   It seems that this one uses special tracers, since they can handle comparisons.
-            #                   https://jax.readthedocs.io/en/latest/notebooks/Common_Gotchas_in_JAX.html#python-control-flow-autodiff
             return self._fun(*args, **kwargs)
 
-        # TODO(phimuell): Handle static arguments correctly
-        #                   https://jax.readthedocs.io/en/latest/aot.html#lowering-with-static-arguments
         lowered = self.lower(*args, **kwargs)
         compiled = lowered.compile()
         return compiled(*args, **kwargs)
 
-    @tcache.cached_translation
+    @tcache.cached_transition
     def lower(
         self,
         *args: Any,
@@ -107,12 +103,8 @@ def lower(
     ) -> JaceLowered:
         """Lower this function explicitly for the given arguments.
 
-        Performs the first two steps of the AOT steps described above,
-        i.e. transformation into Jaxpr and then to SDFG.
-        The result is encapsulated into a `Lowered` object.
-
-        Todo:
-            - Handle pytrees.
+        Performs the first two steps of the AOT steps described above, i.e. transformation into
+        Jaxpr and then to SDFG. The result is encapsulated into a `Lowered` object.
         """
         if len(kwargs) != 0:
             raise NotImplementedError("Currently only positional arguments are supported.")
@@ -122,12 +114,19 @@ def lower(
         if not all((not util.is_array(arg)) or arg.flags["C_CONTIGUOUS"] for arg in args):
             raise NotImplementedError("Currently can not handle strides beside 'C_CONTIGUOUS'.")
 
-        jaxpr = _jax.make_jaxpr(self._fun)(*args)
-        driver = translator.JaxprTranslationDriver(sub_translators=self._sub_translators)
-        trans_sdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
-        ptrans.postprocess_jaxpr_sdfg(tsdfg=trans_sdfg, fun=self.wrapped_fun)
-        # The `JaceLowered` assumes complete ownership of `trans_sdfg`!
-        return JaceLowered(trans_sdfg)
+        # In Jax `float32` is the main datatype, and they go to great lengths to avoid
+        #  some aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
+        #  However, in this case we will have problems when we call the SDFG, for some reasons
+        #  `CompiledSDFG` does not work in that case correctly, thus we enable it for the tracing.
+        with _jax.experimental.enable_x64():
+            driver = translator.JaxprTranslationDriver(
+                primitive_translators=self._primitive_translators
+            )
+            jaxpr = _jax.make_jaxpr(self._fun)(*args)
+            tsdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
+        ptrans.postprocess_jaxpr_sdfg(tsdfg=tsdfg, fun=self.wrapped_fun)
+
+        return JaceLowered(tsdfg)
 
     @property
     def wrapped_fun(self) -> Callable:
@@ -137,42 +136,47 @@ def wrapped_fun(self) -> Callable:
     def _make_call_description(
         self,
         *args: Any,
-    ) -> tcache.CachedCallDescription:
+    ) -> tcache.StageTransformationDescription:
         """This function computes the key for the `JaceWrapped.lower()` call.
 
         Currently it is only able to handle positional argument and does not support static arguments.
         The function will fully abstractify its input arguments.
         This function is used by the cache to generate the key.
         """
-        fargs = tuple(tcache._AbstractCallArgument.from_value(x) for x in args)
-        return tcache.CachedCallDescription(stage_id=id(self), fargs=fargs)
+        call_args = tuple(tcache._AbstractCallArgument.from_value(x) for x in args)
+        return tcache.StageTransformationDescription(stage_id=id(self), call_args=call_args)
+
 
+class JaceLowered(tcache.CachingStage["JaceCompiled"]):
+    """Represents the original computation as an SDFG.
 
-class JaceLowered(tcache.CachingStage):
-    """Represents the original computation that was lowered to SDFG.
+    Although, `JaceWrapped` is composable with Jax transformations `JaceLowered` is not.
+    A user should never create such an object.
 
     Todo:
         - Handle pytrees.
     """
 
-    # `self` assumes complete ownership of the
-    _trans_sdfg: translator.TranslatedJaxprSDFG
+    _translated_sdfg: translator.TranslatedJaxprSDFG
 
     def __init__(
         self,
-        trans_sdfg: translator.TranslatedJaxprSDFG,
+        tsdfg: translator.TranslatedJaxprSDFG,
     ) -> None:
-        """Constructs the lowered object."""
-        if not trans_sdfg.is_finalized:
+        """Initialize the lowered object.
+
+        Args:
+            tsdfg:      The lowered SDFG with metadata. Must be finalized.
+
+        Notes:
+            The passed `tsdfg` will be managed by `self`.
+        """
+        if not tsdfg.is_finalized:
             raise ValueError("The translated SDFG must be finalized.")
-        if trans_sdfg.inp_names is None:
-            raise ValueError("Input names must be defined.")
-        if trans_sdfg.out_names is None:
-            raise ValueError("Output names must be defined.")
         super().__init__()
-        self._trans_sdfg = trans_sdfg
+        self._translated_sdfg = tsdfg
 
-    @tcache.cached_translation
+    @tcache.cached_transition
     def compile(
         self,
         compiler_options: CompilerOptions | None = None,
@@ -192,11 +196,9 @@ def compile(
         # We **must** deepcopy before we do any optimization.
         #  The reason is `self` is cached and assumed to be immutable.
         #  Since all optimizations works in place, we would violate this assumption.
-        tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._trans_sdfg)
+        tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
 
-        # Must be the same as in `_make_call_description()`!
-        options = optimization.DEFAULT_OPTIMIZATIONS | (compiler_options or {})
-        optimization.jace_optimize(tsdfg=tsdfg, **options)
+        optimization.jace_optimize(tsdfg=tsdfg, **self._make_compiler_options(compiler_options))
 
         return JaceCompiled(
             csdfg=util.compile_jax_sdfg(tsdfg),
@@ -211,7 +213,7 @@ def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprS
         It is important that modifying this object in any ways is considered an error.
         """
         if (dialect is None) or (dialect.upper() == "SDFG"):
-            return self._trans_sdfg
+            return self._translated_sdfg
         raise ValueError(f"Unknown dialect '{dialect}'.")
 
     def as_html(self, filename: str | None = None) -> None:
@@ -231,17 +233,22 @@ def as_sdfg(self) -> dace.SDFG:
     def _make_call_description(
         self,
         compiler_options: CompilerOptions | None = None,
-    ) -> tcache.CachedCallDescription:
+    ) -> tcache.StageTransformationDescription:
         """This function computes the key for the `self.compile()` call.
 
         The function only get one argument that is either a `dict` or a `None`, where `None` means `use default argument.
         The function will construct a concrete description of the call using `(name, value)` pairs.
         This function is used by the cache.
         """
-        # Must be the same as in `compile()`!
-        options = optimization.DEFAULT_OPTIMIZATIONS | (compiler_options or {})
-        fargs = tuple(sorted(options.items(), key=lambda X: X[0]))
-        return tcache.CachedCallDescription(stage_id=id(self), fargs=fargs)
+        options = self._make_compiler_options(compiler_options)
+        call_args = tuple(sorted(options.items(), key=lambda X: X[0]))
+        return tcache.StageTransformationDescription(stage_id=id(self), call_args=call_args)
+
+    def _make_compiler_options(
+        self,
+        compiler_options: CompilerOptions | None,
+    ) -> CompilerOptions:
+        return optimization.DEFAULT_OPTIMIZATIONS | (compiler_options or {})
 
 
 class JaceCompiled:
@@ -251,13 +258,13 @@ class JaceCompiled:
         - Handle pytrees.
     """
 
-    _csdfg: jdace.CompiledSDFG  # The compiled SDFG object.
+    _csdfg: dace_helper.CompiledSDFG  # The compiled SDFG object.
     _inp_names: tuple[str, ...]  # Name of all input arguments.
     _out_names: tuple[str, ...]  # Name of all output arguments.
 
     def __init__(
         self,
-        csdfg: jdace.CompiledSDFG,
+        csdfg: dace_helper.CompiledSDFG,
         inp_names: Sequence[str],
         out_names: Sequence[str],
     ) -> None:
diff --git a/src/jace/jax/translation_cache.py b/src/jace/jax/translation_cache.py
index 5bcb948..b29aa54 100644
--- a/src/jace/jax/translation_cache.py
+++ b/src/jace/jax/translation_cache.py
@@ -21,7 +21,14 @@
 import dataclasses
 import functools
 from collections.abc import Callable, Hashable
-from typing import TYPE_CHECKING, Any, Final, TypeAlias
+from typing import (
+    TYPE_CHECKING,
+    Any,
+    Generic,
+    TypeAlias,
+    TypeVar,
+    cast,
+)
 
 import dace
 from jax import core as jax_core
@@ -32,24 +39,24 @@
 if TYPE_CHECKING:
     from jace.jax import stages
 
-# This is the default cache size we are using
-_DEF_CACHE_SIZE: Final[int] = 256
+#: Caches used to store the state transition.
+#: The states are on a per stage and not per instant basis.
+_TRANSLATION_CACHES: dict[type[CachingStage], StageCache] = {}
 
-# This are the caches that we are using.
-_TRANSLATION_CACHES: dict[type[CachingStage], TranslationCache] = {}
 
+# Denotes the stage that follows the current one.
+#  Used by the `NextStage` Mixin.
+NextStage = TypeVar("NextStage", bound="stages.Stage")
 
-class CachingStage:
-    """Annotates a stage whose transition to the next one is cacheable.
 
-    This transitions are mainly `JaceWrapped.lower()` and `JaceLowered.compile()` calls.
-    To make a stage cacheable annotate the transition function with the `@cached_translation` decorator.
+class CachingStage(Generic[NextStage]):
+    """Annotates a stage whose transition to the next one is cacheable.
 
-    Todo:
-        - Make a generic to indicate what the result stage is.
+    To make a transition function cacheable it must be annotated by the
+    `@cached_transition` decorator.
     """
 
-    _cache: TranslationCache
+    _cache: StageCache[NextStage]
 
     def __init__(self) -> None:
         self._cache = get_cache(self)
@@ -59,14 +66,17 @@ def _make_call_description(
         self: CachingStage,
         *args: Any,
         **kwargs: Any,
-    ) -> CachedCallDescription:
+    ) -> StageTransformationDescription:
         """Generates the key that is used to store/locate the call in the cache."""
         ...
 
 
-def cached_translation(
-    action: Callable[..., stages.Stage],
-) -> Callable:
+Action_T = TypeVar("Action_T", bound=Callable[..., Any])
+
+
+def cached_transition(
+    action: Action_T,
+) -> Action_T:
     """Decorator for making the transition function of the stage cacheable.
 
     The decorator will call the annotated function only if the call is not stored inside the cache.
@@ -79,18 +89,15 @@ def _action_wrapper(
         self: CachingStage,
         *args: Any,
         **kwargs: Any,
-    ) -> stages.Stage:
-        # Get the abstract description of the call, that is used as key.
-        key: CachedCallDescription = self._make_call_description(*args, **kwargs)
+    ):
+        key: StageTransformationDescription = self._make_call_description(*args, **kwargs)
         if key in self._cache:
             return self._cache[key]
-
-        # We must actually perform the call
         next_stage: stages.Stage = action(self, *args, **kwargs)
         self._cache[key] = next_stage
         return next_stage
 
-    return _action_wrapper
+    return cast(Action_T, _action_wrapper)
 
 
 def clear_translation_cache() -> None:
@@ -100,13 +107,12 @@ def clear_translation_cache() -> None:
 
 def get_cache(
     stage: CachingStage,
-) -> TranslationCache:
+) -> StageCache:
     """Returns the cache that is used for `stage`."""
-    # The caches are per stage and not per instance basis
-    tstage = type(stage)
-    if tstage not in _TRANSLATION_CACHES:
-        _TRANSLATION_CACHES[tstage] = TranslationCache(size=_DEF_CACHE_SIZE)
-    return _TRANSLATION_CACHES[tstage]
+    stage_type = type(stage)
+    if stage_type not in _TRANSLATION_CACHES:
+        _TRANSLATION_CACHES[stage_type] = StageCache()
+    return _TRANSLATION_CACHES[stage_type]
 
 
 @dataclasses.dataclass(frozen=True)
@@ -116,6 +122,12 @@ class _AbstractCallArgument:
     It is used as part of the key in the cache.
     It represents the structure of the argument, i.e. its shape, type and so on, but nots its value.
     To construct it you should use the `from_value()` class function which interfere the characteristics from a value.
+
+    Attributes:
+        shape:      In case of an array its shape, in case of a scalar the empty tuple.
+        dtype:      The DaCe type of the argument.
+        strides:    The strides of the argument, or `None` if they are unknown or a scalar.
+        storage:    The storage type where the argument is stored.
     """
 
     shape: tuple[int, ...]
@@ -172,80 +184,69 @@ def from_value(
 
 
 @dataclasses.dataclass(frozen=True)
-class CachedCallDescription:
-    """Represents the full structure of a call in the cache as a key.
-
-    This class is the return type of the `CachingStage._make_call_description()` function,
-    which is used by the `@cached_translation` decorator to compute a key of transition.
-    This allows to either retrieve or then store the result of the actual call in the cache.
-
-    The actual key is composed of two parts, first the "origin of the call".
-    For this we just use the address of the stage object we are caching and hope that the
-    address is not reused for another stag anytime soon.
-
-    The second part is of the key are a description of the actual arguments, see `CallArgsDescription` type alias.
-    For this the `_make_call_description()` method of the stage is used.
-    The arguments can be described in two different ways:
-    - Abstract description: In this way, the actual value of the argument is irrelevant,
-        only the structure of them are important, this is similar to the tracers used in Jax.
-    - Concrete description: Here one caches on the actual value of the argument,
-        which is similar to static arguments in Jax.
-        The only restriction is that they are hash able.
+class StageTransformationDescription:
+    """Represents the call to a state transformation function.
+
+    State transition functions are annotated with `@cached_transition` and stored inside a cache.
+    This class serves as a key inside this cache and is generated by `CachingStage._make_call_description()`.
+    The actual key is consists of two parts.
+
+    Attributes:
+        stage_id:   Origin of the call, for which the id of the stage object should be used.
+        call_args:  Description of the arguments of the call. There are two ways to describe
+            the arguments:
+            - Abstract description: In this way, the actual value of the argument is irrelevant,
+                only the structure of them are important, similar to the tracers used in Jax.
+            - Concrete description: Here one caches on the actual value of the argument.
+                The only requirement is that they can be hashed.
 
     Notes:
         The base assumption is that the stages are immutable.
 
     Todo:
         - pytrees.
-        - Turn the references into week references, Jax does this and I am sure there is a reason for it.
     """
 
     stage_id: int
-    fargs: CallArgsDescription
+    call_args: CallArgsDescription
 
 
-class TranslationCache:
-    """The cache object used to cache the stage transitions.
+# Denotes the stage that is stored inside the cache.
+StageType = TypeVar("StageType", bound="stages.Stage")
+
+
+class StageCache(Generic[StageType]):
+    """LRU cache that is used to cache the stage transitions, i.e. lowering and compiling, in Jace.
 
     Notes:
-        The most recently used entry is at the end of the `OrderedDict`, because it puts new entries there.
+        The most recently used entry is at the end of the `OrderedDict`.
     """
 
-    __slots__ = ("_memory", "_size")
-
-    _memory: collections.OrderedDict[CachedCallDescription, stages.Stage]
+    _memory: collections.OrderedDict[StageTransformationDescription, StageType]
     _size: int
 
     def __init__(
         self,
-        size: int,
+        size: int = 256,
     ) -> None:
-        """Creates a cache instance of size.
+        """Creates a LRU cache with `size` many entries.
 
-        The cache will have size `size` and use `key` as key function.
+        Args:
+            size:   Number of entries the cache holds, defaults to 256.
         """
-        if size <= 0:
-            raise ValueError(f"Invalid cache size of '{size}'")
         self._memory = collections.OrderedDict()
         self._size = size
 
     def __contains__(
         self,
-        key: CachedCallDescription,
+        key: StageTransformationDescription,
     ) -> bool:
-        """Check if `self` have a record of `key`."""
         return key in self._memory
 
     def __getitem__(
         self,
-        key: CachedCallDescription,
-    ) -> stages.Stage:
-        """Get the next stage associated with `key`.
-
-        Notes:
-            It is an error if `key` does not exist.
-            This function will mark `key` as most recently used.
-        """
+        key: StageTransformationDescription,
+    ) -> StageType:
         if key not in self:
             raise KeyError(f"Key '{key}' is unknown.")
         self._memory.move_to_end(key, last=True)
@@ -253,25 +254,20 @@ def __getitem__(
 
     def __setitem__(
         self,
-        key: CachedCallDescription,
-        res: stages.Stage,
-    ) -> TranslationCache:
-        """Adds or update `key` to map to `res`."""
+        key: StageTransformationDescription,
+        res: StageType,
+    ) -> None:
         if key in self:
-            # `key` is known, so move it to the end and update the mapped value.
             self._memory.move_to_end(key, last=True)
             self._memory[key] = res
-
         else:
-            # `key` is not known so we have to add it
-            while len(self._memory) >= self._size:
+            if len(self._memory) == self._size:
                 self.popitem(None)
             self._memory[key] = res
-        return self
 
     def popitem(
         self,
-        key: CachedCallDescription | None,
+        key: StageTransformationDescription | None,
     ) -> None:
         """Evict `key` from `self`.
 
@@ -286,5 +282,4 @@ def popitem(
             self._memory.popitem(last=False)
 
     def __repr__(self) -> str:
-        """Textual representation for debugging."""
-        return f"TranslationCache({len(self._memory)} / {self._size} || {', '.join( '[' + repr(k) + ']' for k in self._memory)})"
+        return f"StageCache({len(self._memory)} / {self._size} || {', '.join( '[' + repr(k) + ']' for k in self._memory)})"
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 508322c..aa794b6 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -33,62 +33,62 @@ class JaxprTranslationDriver:
     - the `arg_names` parameter is not set.
 
     For these reasons the SDFG is not directly usable, and further manipulations have to be performed.
-    Especially, DaCe's validation function will fail and it is unable to be processed by the optimization pipeline.
-    For more information also see `jace.translator.post_translation` module.
+    Especially, DaCe's validation function will fail and it is unable to be processed by the
+    optimization pipeline. For more information also see `jace.translator.post_translation` module.
 
-    The idea of the translator is extremely simple.
-    Since Jaxpr is a list consisting of more or less simple instructions/equations, they get processed one after the other.
-    Each equation is translated into its own state that is appended to the SDFG, thus the SDFG is a long list of states.
-    In certain cases it might be that an equation needs more states, but this is an exception.
+    The idea of the translator is extremely simple. Since Jaxpr is a list consisting of more or less
+    simple instructions/equations, they get processed one after the other.
+    Each equation is translated into its own state that is appended to the SDFG, thus the SDFG is a
+    long list of states. In certain cases it might be that an equation needs more states,
+    but this is an exception.
 
     The actual translation of the equation is not handled by the driver.
-    Instead the request is forwarded to a `PrimitiveTranslator` object, also known as subtranslator.
-    This is a highly specialized object that is able to handle one kind of primitive.
-    For more information on the subtranslators see the documentation of `PrimitiveTranslator`.
+    Instead the request is forwarded to a `PrimitiveTranslator` object, known as primitive translator
+    or subtranslator. This is a highly specialized object that is able to handle one kind of primitive.
+    For more information on them see the documentation of `PrimitiveTranslator`.
 
-    To start a translation the `translate_jaxpr()` function should be called, if this happens it is said that the driver has an ongoing translation.
-    If `translate_jaxpr()` is called on a driver that has an ongoing translation, a new translation context will be set up.
+    To start a translation the `translate_jaxpr()` function should be called, if this happens it is
+    said that the driver has an ongoing translation. If `translate_jaxpr()` is called on a driver
+    that has an ongoing translation, a new translation context will be set up.
     Thus the driver will then translate the supplied (nested) Jaxpr and return the result.
     However, this will have no influence on the translation process that is already going.
 
     Notes:
         After the main translation has been performed the translator object can be used again.
-        Currently the driver will generate only Array as SDFG variables, however, this is a temporary solution, see `add_array()`.
+        Currently the driver will generate only Array as SDFG variables, however, this is a
+        temporary solution, see `add_array()`.
     """
 
-    __slots__ = ("_ctx_stack", "_sub_translators", "_jax_name_map")
+    __slots__ = ("_ctx_stack", "_primitive_translators", "_jax_name_map")
 
-    _sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable]
+    _primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable]
     _jax_name_map: dict[jax_core.Var | util.JaCeVar, str]
     _ctx_stack: list[translator.TranslatedJaxprSDFG]
 
     def __init__(
         self,
-        sub_translators: Mapping[str, translator.PrimitiveTranslatorCallable],
+        primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable],
     ) -> None:
-        """Creates the driver.
+        """Creates the driver ready for translation.
 
         Args:
-            sub_translators:    Use these subtranslators to perform the translation.
+            primitive_translators:    Primitive to use during the translation.
 
-        Notes:
-            `sub_translators` is not copied, however, the user has to guarantee, that it does not change during the lifetime of `self`.
+        Note:
+            The primitive translators are not copied, thus the user has to ensure that the passed mapping
+            does not change during the translation.
         """
-
-        # Maps the name of a Jax primitive to the primitive translator that should be used.
-        #  Note that the subtranslator is only required to be a callable, and immutable.
-        #  User has to ensure that it does not change.
-        self._sub_translators = sub_translators
+        # Maps name of primitives to the associated translator.
+        self._primitive_translators = primitive_translators
 
         # Maps Jax variables to the name of its SDFG equivalent.
-        #  Note that it is shared among all translation contexts.
-        #  This is done to create consistency between SDFG variables
-        #  and the names used pretty printed Jaxprs.
+        #  Shared between all translation contexts, to ensure consecutive
+        #  variable naming as seen as in a pretty printed Jaxpr.
+        #  Will be cleared by `_clear_translation_ctx()` at the end of the translation.
         self._jax_name_map = {}
 
-        # Context stack and current context.
-        #  If it is empty, then no translation process is in process.
-        #  If there is one entry, `self` is the root translator.
+        # Stack of all context, to handle nested Jaxpr instances.
+        #  The first one, i.e. index 0, is known as head translator.
         self._ctx_stack = []
 
     def translate_jaxpr(
@@ -99,30 +99,21 @@ def translate_jaxpr(
     ) -> translator.TranslatedJaxprSDFG:
         """Perform the translation of a Jaxpr into a SDFG.
 
-        In case this function is called and `self` has an ongoing translation process, a new translation context will be created.
-        This means the Jaxpr will be translated independently from the previous one.
+        In case this function is called and `self` has an ongoing translation process, a new
+        translation context will be created. This means the Jaxpr will be translated independently
+        from the previous one.
 
         Returns:
             The function will translate the passed Jaxpr object into an SDFG in canonical form.
-            This SDFG together with additional meta data, that is needed for further processing is encapsulated inside a `TranslatedJaxprSDFG` object.
+            This SDFG together with additional meta data, that is needed for further processing
+            is encapsulated inside a `TranslatedJaxprSDFG` object.
 
         Args:
             name:                   Use this name for the SDFG instead some generated one.
         """
-        import jax as _jax
 
         if len(jaxpr.effects) != 0:
             raise NotImplementedError("'Jaxpr' with side effects are not supported.")
-        if not _jax.config.read("jax_enable_x64"):
-            # NOTE: What is interesting here is, that the SDFG can be called, but the result is garbage.
-            #  Beside that I think it should not work, I think it should not even call,
-            #  because of a mismatch in data types.
-            #  However, If we work with Jax arrays themselves, it should technically work.
-            #  But currently the best we can do, is forbid it!
-            raise NotImplementedError(
-                "You have disabled 'x64' support in Jax, which interferes with the calling of the SDFG. "
-                "SDFG generated in this way will fail to call."
-            )
 
         # NOTE: If `self` is already allocated, i.e. has an ongoing translation process,
         #       the `_allocate_translation_ctx()` function will start a new context.
@@ -136,11 +127,8 @@ def translate_jaxpr(
             jaxpr=jaxpr,
         )
         self._create_initial_input(jaxpr=jaxpr)
-        # Note that `self` and `jsdfg` still share the same underlying memory, i.e. context.
-        jsdfg: translator.TranslatedJaxprSDFG = self._translate_jaxpr_internal(jaxpr)
-        self._clear_translation_ctx()
 
-        return jsdfg
+        return self._translate_jaxpr_internal(jaxpr)
 
     def append_new_state(
         self,
@@ -257,7 +245,7 @@ def map_jax_var_to_sdfg(
     def sdfg(self) -> dace.SDFG:
         """Returns the SDFG that is currently constructed.
 
-        If you want access to the arrays of the SDFG use `self.arrays()`/`self.get_array()`.
+        If you want access to the arrays of the SDFG use `self.arrays`/`self.get_array()`.
         """
         return self._ctx.sdfg
 
@@ -288,8 +276,8 @@ def add_jax_name_mapping(
     ) -> JaxprTranslationDriver:
         """Creates a new mapping between `jax_var` to `sdfg_name`.
 
-        If the mapping already exists an error will be generated.
-        This function is not able to delete a variable mapping that was established before, for this use TBA.
+        If the mapping already exists an error will be generated. This function is not
+        able to delete a variable mapping that was established before, for this use TBA.
 
         Args:
             jax_var:     The Jax variable.
@@ -299,7 +287,8 @@ def add_jax_name_mapping(
 
         if jax_var in self._jax_name_map:
             raise ValueError(
-                f"Tried to create the mapping '{jax_var} -> {sdfg_name}', but the variable is already mapped."
+                f"Cannot change the mapping of '{jax_var}' from"
+                f" '{self.map_jax_var_to_sdfg(jax_var)}' to '{sdfg_name}'."
             )
         if sdfg_name not in self._ctx.sdfg.arrays:
             raise KeyError(f"Mapping '{jax_var} -> {sdfg_name}': SDFG target unknown.")
@@ -320,9 +309,10 @@ def add_array(
 
         The SDFG object is always created as a transient.
 
-        By default the function will use `jace.util.propose_jax_name()` to derive the name that should be used.
-        However, by passing a `JaCeVar` with a name it is possible to suggest a specific name.
-        In addition it is possible to specify `name_prefix` to prefix name that would be used.
+        By default the function will use `jace.util.propose_jax_name()` to derive
+        the name that should be used. However, by passing a `JaCeVar` with a name it
+        is possible to suggest a specific name. In addition it is possible to specify
+        `name_prefix` to prefix name that would be used.
 
         The function will not update the internal variable mapping.
         If this is desired one can set `update_var_mapping`, for forcing this.
@@ -333,12 +323,11 @@ def add_array(
             update_var_mapping: Update the internal variable mapping; by default `False`.
 
         Notes:
-            Currently the function will always create an Array, even if the Jax variable refers to a scalar.
-            This is done to work around some difficulties with scalar return values and so on.
-            This issue should actually handled in the post processing stage, but currently it is not.
-            However, from a point of building an SDFG manually, there is no difference between a Scalar and an Array.
-            According to the dace developer, the majority of the backend, i.e. optimization pipeline, should be handle to handle it.
-            But there are some special parts that might explicitly want a scalar, it also might block certain compiler optimization.
+            As a temporary fix for handling scalar return values, the function will always
+            generate arrays, even if `arg` is a scalar.
+            According to the dace developer, the majority of the backend, i.e. optimization
+            pipeline, should be handle to handle it. But there are some special parts that
+            might explicitly want a scalar, it also might block certain compiler optimization.
         """
         shape: tuple[int | dace.symbol | str, ...] = util.get_jax_var_shape(arg)
         dtype: dace.typeclass = util.get_jax_var_dtype(arg)
@@ -415,12 +404,12 @@ def create_jax_var_list(  # type: ignore[misc]
         If no corresponding SDFG variable is known the function will create one using `add_array()`.
 
         By setting `prevent_creation` the function will not create any new SDFG variables,
-        if no corresponding SDFG variable exists an error is generated.
-        By setting `only_creation` the function will only create new SDFG variables,
-        if a variable already have a corresponding SDFG variable an error will be created.
+        if no corresponding SDFG variable exists an error is generated. By setting `only_creation`
+        the function will only create new SDFG variables, if a variable already have a
+        corresponding SDFG variable an error will be created.
 
-        By default literals cause an error.
-        However, by setting `handle_literals` to `True` literals will will be included in the output with the value `None`.
+        By default literals cause an error. However, by setting `handle_literals` to `True`
+        literals will will be included in the output with the value `None`.
 
         Args:
             jax_var_list:       The list of Jax variables that should be transformed to SDFG names.
@@ -518,8 +507,8 @@ def _allocate_translation_ctx(
     ) -> JaxprTranslationDriver:
         """This function allocates and initialize the members of the translation context of `self`.
 
-        If this function is called and `self` is already allocated, the function will create a new context,
-        allowing the driver to handle nested Jaxpr.
+        If this function is called and `self` is already allocated, the function will create a
+        new context, allowing the driver to handle nested Jaxpr.
         The first context that is created is also known as root translator.
 
         Args:
@@ -534,10 +523,6 @@ def _allocate_translation_ctx(
             )
         )
 
-        if self.is_root_translator():
-            # In the future we will populate the generate state here, i.e. if we are on GPU or not and so on.
-            assert len(self._jax_name_map) == 0
-
         return self
 
     @property
@@ -546,15 +531,13 @@ def _ctx(self) -> translator.TranslatedJaxprSDFG:
         assert len(self._ctx_stack) != 0, "No context is active."
         return self._ctx_stack[-1]
 
-    def _clear_translation_ctx(self) -> JaxprTranslationDriver:
-        """This function deallocate the currently active translation context of `self`.
+    def _clear_translation_ctx(self) -> translator.TranslatedJaxprSDFG | None:
+        """Remove the current active context from `self` and returns its state.
 
-        Notes:
-            While it is allowed for outside code to call this function explicit it is is most likely an error.
-            If `self` is not allocated this function acts as a noops.
+        If `self` is not allocated it will return `None`.
         """
         if not self.is_allocated():
-            return self
+            return None
 
         if self.is_root_translator():
             # The translation as a whole has finished, so restore the driver,
@@ -562,8 +545,7 @@ def _clear_translation_ctx(self) -> JaxprTranslationDriver:
             self._jax_name_map = {}
 
         # Remove the current head stack.
-        _ = self._ctx_stack.pop()
-        return self
+        return self._ctx_stack.pop()
 
     def _translate_single_eqn(
         self,
@@ -573,17 +555,13 @@ def _translate_single_eqn(
 
         To do this the function will perform the following steps:
         - Assemble the in and output variables.
-        - Select the appropriate subtranslator to use.
+        - Select the appropriate primitive translator to use.
         - Create a new empty state terminal state.
-        - Call the subtranslator to perform the translation inside the new state.
+        - Call the primitive translator to perform the translation inside the new state.
 
         Returns:
             The SDFG names that were used as input and output are returned.
             The inputs might contain `None` which indicates that that input was a Jax Literal.
-
-        Notes:
-            The equation, `eqn` must come from the unclosed jaxpr instance.
-            The function will perform some consistency checking after the subtranslator was called.
         """
         if len(eqn.effects) != 0:
             raise NotImplementedError(f"Equation '{eqn}' has side effects.")
@@ -603,24 +581,22 @@ def _translate_single_eqn(
             update_var_mapping=True,
         )
 
-        # Find the subtranslator
-        prim_name: str = eqn.primitive.name
-        if prim_name not in self._sub_translators:
-            raise NotImplementedError(f"No subtranslators known to handle '{prim_name}'.")
-        subtranslator = self._sub_translators[prim_name]
+        pname: str = eqn.primitive.name
+        if pname not in self._primitive_translators:
+            raise NotImplementedError(f"No translator known to handle '{pname}'.")
+        ptranslator = self._primitive_translators[pname]
 
         # Create the state into which the equation should be translated
-        last_term_state: dace.SDFGState = self._terminal_sdfg_state  # noqa: F841 # Will be used later
         eqn_state = self.append_new_state(
-            label=f"{eqn.primitive.name}_{'_'.join(out_var_names)}",
+            label=f"{pname}_{'_'.join(out_var_names)}",
             prev_state=None,  # forces terminal state to use
         )
 
         # Now perform the actual translation of the equation.
-        new_sdfg_term_state = subtranslator(
+        new_sdfg_term_state = ptranslator(
             driver=self,
             in_var_names=in_var_names,
-            out_var_names=out_var_names,  # Might be modified by the subtranslator!
+            out_var_names=out_var_names,  # Might be modified by the translator!
             eqn=eqn,
             eqn_state=eqn_state,
         )
@@ -631,8 +607,8 @@ def _translate_single_eqn(
                 raise RuntimeError("Inconsistent terminal state was detected.")
             new_sdfg_term_state = eqn_state
 
-        # In case a subtranslator decided to not use the variables we created for it, which is allowed
-        #  but it must update the `out_var_names` list correctly, we will now verify this.
+        # In case a translator decided to not use the variables we created for it, which is
+        #  allowed but it must update the `out_var_names` list correctly, we will now verify this.
         for expectedSDFGName, jax_var in zip(out_var_names, eqn.outvars, strict=True):
             mapped_sdfg_name = self.map_jax_var_to_sdfg(jax_var)
             if mapped_sdfg_name != expectedSDFGName:
@@ -654,8 +630,9 @@ def _translate_jaxpr_internal(
         """Performs the actual translation of the Jaxpr into an SDFG.
 
         The function assumes that the context is allocated as well as the initial variables.
-        The function will return the internal state of `self` encapsulated inside a `TranslatedJaxprSDFG` object.
-        However, it will not deallocate the translation context, thus `self` and the return value share the same memory.
+        The function will return the internal state of `self` encapsulated inside a
+        `TranslatedJaxprSDFG` object.
+        The function will also deallocate the current context upon return.
 
         Args:
             jaxpr:      The Jaxpr to translate.
@@ -678,10 +655,10 @@ def _translate_jaxpr_internal(
         if nb_translated_eqn == 0:
             out_var_names = self._handle_null_jaxpr(jaxpr)
 
-        # Set the output names inside the context.
+        # Proper output names in the context.
         self._ctx.out_names = tuple(out_var_names)
 
-        return self._ctx
+        return cast("translator.TranslatedJaxprSDFG", self._clear_translation_ctx())
 
     def _handle_null_jaxpr(
         self,
@@ -689,9 +666,10 @@ def _handle_null_jaxpr(
     ) -> Sequence[str]:
         """This function is called in case a `Jaxpr` with zero equations is encountered.
 
-        A function with zero equation might still have output, in which case an input is copied to an output.
-        This function will handle the copying from the input into the corresponding output variable.
-        It is important that the function will remove the input and output variables from the internal mapping.
+        A function with zero equation might still have output, in which case an input is copied
+        to an output. This function will handle the copying from the input into the corresponding
+        output variable. It is important that the function will remove the variables that are used
+        as input and output from the mapping.
 
         Returns:
             The function returns a list denoting the SDFG variables that refers to the output.
@@ -710,9 +688,9 @@ def _handle_null_jaxpr(
 
         # If we are here then we are dealing with a nested SDFG/Jaxpr, that has output.
         #  Because an input also serves as output, the nested SDFG will have a connector for the
-        #  input and one for the output, but both with the same name.
-        #  This will make node validation fail.
-        #  We have to work around this by introducing some fake copies, which will be removed by DaCe later.
+        #  input and one for the output, but both with the same name. This will make node
+        #  validation fail. We have to work around this by introducing some fake copies, which
+        #  will be removed by DaCe later.
         for jax_out_var in jaxpr.jaxpr.outvars:
             # Since the output is also used as an input the variable mapping must be already known.
             sdfg_in_name: str = self.map_jax_var_to_sdfg(jax_out_var)
@@ -735,11 +713,11 @@ def _handle_null_jaxpr(
                 data=dace.Memlet.from_array(sdfg_in_name, self.get_array(sdfg_in_name)),
             )
 
-            # A Jax variable now has, in some sense, two SDFG equivalent, the input, that was previously created by
-            #  `self._create_initial_input()` and the `sdfg_out_name` we just created.
-            #  But we can not add this to the mapping, because of this situation we will now remove the variable from the mapping all together.
+            # A Jax variable now has, in some sense, two SDFG equivalent, the input, that
+            #  was previously created by `self._create_initial_input()` and the `sdfg_out_name`
+            #  we just created. But we can not add this to the mapping, because of this situation
+            #  we will now remove the variable from the mapping all together.
             #  I am open for different approaches.
-            #  Note that input variables that are not used as outputs, will remain in the mapping.
             self._jax_name_map.pop(jax_out_var)
 
         return tuple(out_var_names)
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index df52f90..8e18a27 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -4,14 +4,7 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
-"""Contains the interface for all primitive subtranslators.
-
-Note the name of this file is because it has to be the first that is imported in the `__init__.py` file.
-If not, we would get a cyclic import error.
-However, all attempts to prevent ruff from mindlessly (rule abiding) destroying this orders failed.
-Thus the name was changed to enforce this.
-If you have the solution, feel free to implement it.
-"""
+"""Contains the interface for all primitive translators."""
 
 from __future__ import annotations
 
@@ -31,9 +24,6 @@ class PrimitiveTranslatorCallable(Protocol):
     """Callable version of the primitive translators.
 
     Used for type annotation purposes, classes should be derived from `PrimitiveTranslator` instead.
-
-    Todo:
-        - This split information `__call__()` should be documented in `PrimitiveTranslator` instead and not here.
     """
 
     __slots__ = ()
@@ -51,33 +41,30 @@ def __call__(
 
         Before the driver calls this function it will perform the following
         preparatory tasks:
-        - It will allocate the SDFG variables that are used as outputs.
-            Their names will be passed through the `out_var_names` argument,
-            in the same order as `eqn.outvars`.
-        - It will collect the names of the SDFG variables that are used as input
-            and place them in `in_var_names`, in the same order as `eqn.invars`.
-            If an input argument refers to a literal no SDFG variable is created
-            for it and `None` is passed to indicate this.
-        - The subtranslator will create variables that are used as output.
-            They are passed as `out_var_names`, same order as in the equation.
-        - The driver will create a new terminal state and pass it as
-            `eqn_state` argument. This state is guaranteed to be empty and
-            `translator.terminal_sdfg_state is eqn_state` holds.
-
-        Then the subtranslator is called.
-        Usually a subtranslator should construct the dataflow graph inside `eqn_state`.
-        It is allowed that the subtranslators creates more states if needed, but this state machinery
-        has to have a single terminal state, which must be returned and reachable from `eqn_state`.
-        If the function returns `None` the driver will assume that subtranslator was able to
-        fully construct the dataflow graph within `eqn_state`.
-
-        While a subtranslator is forbidden from meddling with the input variables mentioned in
-        `in_var_names` in any way, it is allowed to modify the output variables.
-        For example it could create a new SDFG variable, with different strides.
-        But in that case the subtranslator must update the internal mapping of the driver TBA HOW,
-        and modify the mapping specified by `out_var_names`.
-        However, the subtranslator is allowed to create internal temporary variables.
-        It just have to ensure that no name collision will occur, a way to do this is to use a passed variable name as prefix.
+        - It will allocate the SDFG variables that are used as outputs. Their names will be passed
+            through the `out_var_names` argument, in the same order as `eqn.outvars`.
+        - It will collect the names of the SDFG variables that are used as input and place them in
+            `in_var_names`, in the same order as `eqn.invars`. If an input argument refers to a
+            literal no SDFG variable is created for it and `None` is passed to indicate this.
+        - The driver will create variables that are used as output. They are passed as
+            `out_var_names`, same order as in the equation.
+        - The driver will create a new terminal state and pass it as `eqn_state` argument. This
+            state is guaranteed to be empty and `translator.terminal_sdfg_state is eqn_state` holds.
+
+        Then the primitive translator is called.
+        Usually a primitive translator should construct the dataflow graph inside `eqn_state`.
+        It is allowed that the primitive translators creates more states if needed, but this
+        state machinery has to have a single terminal state, which must be returned and reachable
+        from `eqn_state`. If the function returns `None` the driver will assume that primitive
+        translator was able to fully construct the dataflow graph within `eqn_state`.
+
+        While a primitive translator is forbidden from meddling with the input variables mentioned
+        in `in_var_names` in any way, it is allowed to modify the output variables. For example
+        it could create a new SDFG variable, with different strides. But in that case the primitive
+        translator must update the internal mapping of the driver TBA HOW, and modify the mapping
+        specified by `out_var_names`. However, the subtranslator is allowed to create internal
+        temporary variables. It just have to ensure that no name collision will occur, a way to
+        do this is to use a passed variable name as prefix.
 
         Args:
             driver:         The driver object of the translation.
@@ -94,16 +81,17 @@ def __call__(
 
 @runtime_checkable
 class PrimitiveTranslator(PrimitiveTranslatorCallable, Protocol):
-    """Interface for all Jax primitive translators, also known as subtranslator, that are implemented as class.
+    """Interface for all Jax primitive translators.
 
     A translator for a primitive translates a single equation of a Jaxpr into its SDFG equivalent.
     For satisfying this interface a concrete implementation must be immutable after construction.
 
-    Subtranslators are simple, but highly specialized objects that are only able to perform the translation of a single primitive.
-    The overall translation process itself is managed by a driver object, which also owns and manage the subtranslators.
-    In the end this implements the delegation pattern.
+    Primitive translators are simple, but highly specialized objects that are only able to perform
+    the translation of a single primitive. The overall translation process itself is managed by a
+    driver object, which also owns and manage the primitive translators. In the end this implements
+    the delegation pattern.
 
-    You can use `jace.translator.add_subtranslator()` to register your translator to Jace.
+    You can use `jace.translator.register_primitive_translator()` to register your translator to Jace.
     """
 
     __slots__ = ()
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 96a7419..3a16cee 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -42,7 +42,7 @@ def translation_driver():
     """Returns an allocated driver instance."""
     name = "fixture_driver"
     driver = translator.JaxprTranslationDriver(
-        sub_translators=translator.get_regsitered_primitive_translators()
+        primitive_translators=translator.get_regsitered_primitive_translators()
     )
     driver._allocate_translation_ctx(name=name)
     return driver
@@ -54,7 +54,7 @@ def test_driver_alloc() -> None:
     Does not use the fixture because it does it on its own.
     """
     driver = translator.JaxprTranslationDriver(
-        sub_translators=translator.get_regsitered_primitive_translators()
+        primitive_translators=translator.get_regsitered_primitive_translators()
     )
     assert not driver.is_allocated(), "Driver was created allocated."
     assert len(driver._ctx_stack) == 0
@@ -220,9 +220,7 @@ def test_driver_nested(translation_driver: translator.JaxprTranslationDriver) ->
     #  However, it is not able to update the mapping.
     with pytest.raises(
         expected_exception=ValueError,
-        match=re.escape(
-            f"Tried to create the mapping '{array1} -> {name_1}', but the variable is already mapped."
-        ),
+        match=re.escape(f"Cannot change the mapping of '{array1}' from '{name_1}' to '{name_1}'."),
     ):
         _ = translation_driver.add_array(array1, update_var_mapping=True)
     assert name_1 not in translation_driver.sdfg.arrays
@@ -307,7 +305,7 @@ def test_driver_variable_multiple_variables(
     with pytest.raises(
         expected_exception=ValueError,
         match=re.escape(
-            f"Tried to create the mapping '{array1} -> {prefix_expected_name}', but the variable is already mapped."
+            f"Cannot change the mapping of '{array1}' from '{translation_driver.map_jax_var_to_sdfg(array1)}' to '{prefix_expected_name}'."
         ),
     ):
         _ = translation_driver.add_array(array1, update_var_mapping=True, name_prefix=prefix)

From df82038fe1eea24116790a05894e214cab0b1223 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 28 May 2024 07:40:29 +0200
Subject: [PATCH 251/458] Small corrections.

---
 src/jace/jax/stages.py             |  1 -
 src/jace/jax/translation_cache.py  | 12 ++++++------
 src/jace/util/__init__.py          |  2 --
 src/jace/util/util.py              | 26 +-------------------------
 tests/test_subtranslator_helper.py | 13 ++++++++-----
 5 files changed, 15 insertions(+), 39 deletions(-)

diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
index 9a0218f..ea24489 100644
--- a/src/jace/jax/stages.py
+++ b/src/jace/jax/stages.py
@@ -197,7 +197,6 @@ def compile(
         #  The reason is `self` is cached and assumed to be immutable.
         #  Since all optimizations works in place, we would violate this assumption.
         tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
-
         optimization.jace_optimize(tsdfg=tsdfg, **self._make_compiler_options(compiler_options))
 
         return JaceCompiled(
diff --git a/src/jace/jax/translation_cache.py b/src/jace/jax/translation_cache.py
index b29aa54..cf2e2b6 100644
--- a/src/jace/jax/translation_cache.py
+++ b/src/jace/jax/translation_cache.py
@@ -40,7 +40,7 @@
     from jace.jax import stages
 
 #: Caches used to store the state transition.
-#: The states are on a per stage and not per instant basis.
+#: The caches are on a per stage and not per instant basis.
 _TRANSLATION_CACHES: dict[type[CachingStage], StageCache] = {}
 
 
@@ -71,12 +71,12 @@ def _make_call_description(
         ...
 
 
-Action_T = TypeVar("Action_T", bound=Callable[..., Any])
+ActionFunction = TypeVar("ActionFunction", bound=Callable[..., Any])
 
 
 def cached_transition(
-    action: Action_T,
-) -> Action_T:
+    action: ActionFunction,
+) -> ActionFunction:
     """Decorator for making the transition function of the stage cacheable.
 
     The decorator will call the annotated function only if the call is not stored inside the cache.
@@ -85,7 +85,7 @@ def cached_transition(
     """
 
     @functools.wraps(action)
-    def _action_wrapper(
+    def _action_wrapper(  # type: ignore [no-untyped-def]  # return type is deduced from `ActionFunction`
         self: CachingStage,
         *args: Any,
         **kwargs: Any,
@@ -97,7 +97,7 @@ def _action_wrapper(
         self._cache[key] = next_stage
         return next_stage
 
-    return cast(Action_T, _action_wrapper)
+    return cast(ActionFunction, _action_wrapper)
 
 
 def clear_translation_cache() -> None:
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 6bff211..863472e 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -36,7 +36,6 @@
     FORBIDDEN_SDFG_VAR_NAMES,
     VALID_SDFG_OBJ_NAME,
     VALID_SDFG_VAR_NAME,
-    as_sequence,
 )
 
 
@@ -45,7 +44,6 @@
     "VALID_SDFG_VAR_NAME",
     "FORBIDDEN_SDFG_VAR_NAMES",
     "JaCeVar",
-    "as_sequence",
     "compile_jax_sdfg",
     "dataclass_with_default_init",
     "is_array",
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index 342295f..7e02c28 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -8,31 +8,7 @@
 from __future__ import annotations
 
 import re
-from collections.abc import Iterable
-from typing import Final, TypeVar, cast, overload
-
-import jace.util.traits as traits
-
-
-_T = TypeVar("_T")
-
-
-@overload
-def as_sequence(value: str) -> Iterable[str]: ...
-
-
-@overload
-def as_sequence(value: Iterable[_T]) -> Iterable[_T]: ...
-
-
-@overload
-def as_sequence(value: _T) -> Iterable[_T]: ...
-
-
-def as_sequence(value: _T | Iterable[_T]) -> Iterable[_T]:
-    if traits.is_non_string_iterable(value):
-        return value
-    return cast(Iterable[_T], [value])
+from typing import Final
 
 
 # Valid name for an SDFG variable.
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 612df15..3810ab3 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -34,10 +34,10 @@ def _conserve_builtin_translators():
 
 
 @pytest.fixture()
-def no_builtin_translators() -> str:
+def no_builtin_translators():  # noqa: PT004  # This is how you should do it: https://docs.pytest.org/en/7.1.x/how-to/fixtures.html#use-fixtures-in-classes-and-modules-with-usefixtures
     """This fixture can be used if the test does not want any builtin translators."""
     initial_translators = translator.set_active_primitive_translators_to({})
-    yield "DUMMY_VALUE"
+    yield
     translator.set_active_primitive_translators_to(initial_translators)
 
 
@@ -76,7 +76,8 @@ def test_are_subtranslators_imported():
     assert len(get_regsitered_primitive_translators()) == 37
 
 
-def test_subtranslatior_managing(no_builtin_translators):
+@pytest.mark.usefixtures("no_builtin_translators")
+def test_subtranslatior_managing():
     """Basic functionality of the subtranslators."""
     original_active_subtrans = get_regsitered_primitive_translators()
     assert len(original_active_subtrans) == 0
@@ -142,7 +143,8 @@ def same_structure(d1: dict, d2: dict) -> bool:
     assert same_structure(mutated_primitives, get_regsitered_primitive_translators())
 
 
-def test_subtranslatior_managing_callable_annotation(no_builtin_translators):
+@pytest.mark.usefixtures("no_builtin_translators")
+def test_subtranslatior_managing_callable_annotation():
     """Test if `make_primitive_translator()` works."""
 
     prim_name = "non_existing_property"
@@ -181,7 +183,8 @@ def useless_add_translator(*args: Any, **kwargs: Any) -> None:
     assert useless_add_translator is get_regsitered_primitive_translators()["add"]
 
 
-def test_subtranslatior_managing_overwriting_2(no_builtin_translators):
+@pytest.mark.usefixtures("no_builtin_translators")
+def test_subtranslatior_managing_overwriting_2():
     """Again an overwriting test, but this time a bit more complicated."""
 
     trans_cnt = [0]

From 60b7acba2e31d048703d88d9756d7e4267dbd1a4 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 28 May 2024 09:27:41 +0200
Subject: [PATCH 252/458] Size corrections.

---
 src/jace/jax/api.py                           |   8 +-
 src/jace/jax/stages.py                        |  78 ++++++------
 src/jace/jax/translation_cache.py             | 103 +++++++--------
 src/jace/optimization.py                      |   6 +-
 .../translator/jaxpr_translator_driver.py     | 117 +++++++++---------
 src/jace/translator/managing.py               |  91 ++++++++------
 src/jace/translator/post_translation.py       |  11 +-
 src/jace/translator/primitive_translator.py   |   2 +
 src/jace/translator/translated_jaxpr_sdfg.py  |  44 ++++---
 src/jace/util/compiling.py                    |  35 +++---
 src/jace/util/jax_helper.py                   |  57 ++++-----
 src/jace/util/traits.py                       |  28 ++---
 src/jace/util/util.py                         |   6 +-
 13 files changed, 302 insertions(+), 284 deletions(-)

diff --git a/src/jace/jax/api.py b/src/jace/jax/api.py
index a214f5a..bbbfe6a 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/jax/api.py
@@ -53,16 +53,16 @@ def jit(
 ) -> stages.JaceWrapped | Callable[[Callable], stages.JaceWrapped]:
     """Jace's replacement for `jax.jit` (just-in-time) wrapper.
 
-    It works the same way as `jax.jit` does, but instead of using XLA the computation is lowered to DaCe.
-    It supports the same arguments as `jax.jit` (although currently not) does.
+    It works the same way as `jax.jit` does, but instead of using XLA the computation is lowered
+    to DaCe. It supports the same arguments as `jax.jit` (although currently not) does.
     In addition it accepts some Jace specific arguments.
 
     Args:
         primitive_translators:    Use these primitive translators for the lowering to SDFG.
 
     Notes:
-        If no translators are specified the currently ones currently inside the global registry are used.
-        After construction changes to the passed `primitive_translators` have no effect on the returned object.
+        If no translators are specified, the ones in the global registry are implicitly passed
+        as argument. After constructions any change to `primitive_translators` has no effect.
     """
     if kwargs:
         # TODO(phimuell): Add proper name verification and exception type.
diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
index ea24489..5fc9de4 100644
--- a/src/jace/jax/stages.py
+++ b/src/jace/jax/stages.py
@@ -9,12 +9,13 @@
 This module reimplements the public classes of that Jax module.
 However, they are a big different, because Jace uses DaCe as backend.
 
-As in Jax Jace has different stages, the terminology is taken from [Jax' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
+As in Jax Jace has different stages, the terminology is taken from
+[Jax' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
 - Stage out:
     In this phase we translate an executable python function into Jaxpr.
 - Lower:
-    This will transform the Jaxpr into an SDFG equivalent.
-    As a implementation note, currently this and the previous step are handled as a single step.
+    This will transform the Jaxpr into an SDFG equivalent. As a implementation note,
+    currently this and the previous step are handled as a single step.
 - Compile:
     This will turn the SDFG into an executable object, see `dace.codegen.CompiledSDFG`.
 - Execution:
@@ -40,10 +41,13 @@
 class JaceWrapped(tcache.CachingStage["JaceLowered"]):
     """A function ready to be specialized, lowered, and compiled.
 
-    This class represents the output of functions such as `jace.jit()`.
-    Calling it results in jit (just-in-time) lowering, compilation and execution.
-    It is also possible to lower the function explicitly by calling `self.lower()`.
-    This function can be composed with other Jax transformations.
+    This class represents the output of functions such as `jace.jit()` and is the first stage in
+    the translation/compilation chain of Jace. A user should never create a `JaceWrapped` object
+    directly, instead `jace.jit` should be used for that.
+    While it supports just-in-time lowering and compilation these steps can also be performed
+    explicitly. The lowering performed by this stage is cached, thus if a `JaceWrapped` object is
+    lowered later, with the same argument the result is taken from the cache.
+    Furthermore, a `JaceWrapped` object is composable with all Jax transformations.
 
     Todo:
         - Handle pytrees.
@@ -51,7 +55,7 @@ class JaceWrapped(tcache.CachingStage["JaceLowered"]):
 
     Note:
         The tracing of function will always happen with enabled `x64` mode, which is implicitly
-        and temporary activated during tracing. Furthermore, the disable JIT config flag is ignored.
+        and temporary activated during tracing.
     """
 
     _fun: Callable
@@ -103,19 +107,20 @@ def lower(
     ) -> JaceLowered:
         """Lower this function explicitly for the given arguments.
 
-        Performs the first two steps of the AOT steps described above, i.e. transformation into
-        Jaxpr and then to SDFG. The result is encapsulated into a `Lowered` object.
+        Performs the first two steps of the AOT steps described above, i.e. stage out to Jaxpr
+        and then translate to SDFG. The result is encapsulated and returned into a `Lowered` object.
         """
         if len(kwargs) != 0:
             raise NotImplementedError("Currently only positional arguments are supported.")
 
-        # Currently we do not allow memory order beside `C_CONTIGUOUS`.
-        #  This is the best place to check for it.
+        # Currently the SDFG that we build only supports `C_CONTIGUOUS` memory order.
+        #  Since we support the paradigm that "everything passed to `lower` should also be
+        #  accepted as argument to call the result", we forbid other memory orders here.
         if not all((not util.is_array(arg)) or arg.flags["C_CONTIGUOUS"] for arg in args):
             raise NotImplementedError("Currently can not handle strides beside 'C_CONTIGUOUS'.")
 
-        # In Jax `float32` is the main datatype, and they go to great lengths to avoid
-        #  some aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
+        # In Jax `float32` is the main datatype, and they go to great lengths to avoid some
+        #  aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
         #  However, in this case we will have problems when we call the SDFG, for some reasons
         #  `CompiledSDFG` does not work in that case correctly, thus we enable it for the tracing.
         with _jax.experimental.enable_x64():
@@ -137,11 +142,10 @@ def _make_call_description(
         self,
         *args: Any,
     ) -> tcache.StageTransformationDescription:
-        """This function computes the key for the `JaceWrapped.lower()` call.
+        """This function computes the key for the `JaceWrapped.lower()` call to cache it.
 
-        Currently it is only able to handle positional argument and does not support static arguments.
-        The function will fully abstractify its input arguments.
-        This function is used by the cache to generate the key.
+        The function will compute a full abstract description on its argument. Currently it is
+        only able to handle positional argument and does not support static arguments.
         """
         call_args = tuple(tcache._AbstractCallArgument.from_value(x) for x in args)
         return tcache.StageTransformationDescription(stage_id=id(self), call_args=call_args)
@@ -150,8 +154,10 @@ def _make_call_description(
 class JaceLowered(tcache.CachingStage["JaceCompiled"]):
     """Represents the original computation as an SDFG.
 
+    It represents the computation wrapped by a `JaceWrapped` translated and lowered to SDFG.
+    It is followed by the `JaceCompiled` stage.
     Although, `JaceWrapped` is composable with Jax transformations `JaceLowered` is not.
-    A user should never create such an object.
+    A user should never create such an object, instead `JaceWrapped.lower()` should be used.
 
     Todo:
         - Handle pytrees.
@@ -181,21 +187,18 @@ def compile(
         self,
         compiler_options: CompilerOptions | None = None,
     ) -> JaceCompiled:
-        """Compile the SDFG.
-
-        Returns an object that encapsulates a compiled SDFG object.
-        To influence the various optimizations and compile options of Jace you can use the `compiler_options` argument.
-        This is a `dict` which are used as arguments to `jace_optimize()`.
+        """Optimize and compile the lowered SDFG using `compiler_options`.
 
+        Returns an object that encapsulates a compiled SDFG object. To influence the various
+        optimizations and compile options of Jace you can use the `compiler_options` argument.
         If nothing is specified `jace.optimization.DEFAULT_OPTIMIZATIONS` will be used.
-        Before `compiler_options` is forwarded to `jace_optimize()` it is merged with the default options.
 
         Note:
-            The result of this function is cached.
+            Before `compiler_options` is forwarded to `jace_optimize()` it will be merged with
+            the default arguments.
         """
-        # We **must** deepcopy before we do any optimization.
-        #  The reason is `self` is cached and assumed to be immutable.
-        #  Since all optimizations works in place, we would violate this assumption.
+        # We **must** deepcopy before we do any optimization, because all optimizations are in
+        #  place, however, to properly cache stages, they have to be immutable.
         tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
         optimization.jace_optimize(tsdfg=tsdfg, **self._make_compiler_options(compiler_options))
 
@@ -209,23 +212,20 @@ def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprS
         """Returns the internal SDFG.
 
         The function returns a `TranslatedJaxprSDFG` object.
-        It is important that modifying this object in any ways is considered an error.
+        It is important that modifying this object in any way is undefined behavior.
         """
         if (dialect is None) or (dialect.upper() == "SDFG"):
             return self._translated_sdfg
         raise ValueError(f"Unknown dialect '{dialect}'.")
 
     def as_html(self, filename: str | None = None) -> None:
-        """Runs the `view()` method of the underlying SDFG.
-
-        This is a Jace extension.
-        """
+        """Runs the `view()` method of the underlying SDFG."""
         self.compiler_ir().sdfg.view(filename=filename, verbose=False)
 
     def as_sdfg(self) -> dace.SDFG:
         """Returns the encapsulated SDFG.
 
-        It is an error to modify the returned object.
+        Modifying the returned SDFG in any way is undefined behavior.
         """
         return self.compiler_ir().sdfg
 
@@ -233,11 +233,11 @@ def _make_call_description(
         self,
         compiler_options: CompilerOptions | None = None,
     ) -> tcache.StageTransformationDescription:
-        """This function computes the key for the `self.compile()` call.
+        """This function computes the key for the `self.compile()` call to cache it.
 
-        The function only get one argument that is either a `dict` or a `None`, where `None` means `use default argument.
-        The function will construct a concrete description of the call using `(name, value)` pairs.
-        This function is used by the cache.
+        The key that is computed by this function is based on the concrete values of the passed
+        compiler options. This is different from the key computed by `JaceWrapped` which is an
+        abstract description.
         """
         options = self._make_compiler_options(compiler_options)
         call_args = tuple(sorted(options.items(), key=lambda X: X[0]))
diff --git a/src/jace/jax/translation_cache.py b/src/jace/jax/translation_cache.py
index cf2e2b6..3b95594 100644
--- a/src/jace/jax/translation_cache.py
+++ b/src/jace/jax/translation_cache.py
@@ -7,11 +7,10 @@
 
 """This module contains the functionality related to the compilation cache of the stages.
 
-Actually there are two different caches:
-- The lowering cache.
-- And the compilation cache.
-
-Both are implemented as a singleton.
+The cache currently caches the lowering, i.e. the result of `JaceWrapped.lower()` and the
+compilation, i.e. `JaceLowered.compile()`. The caches are on a per stage basis and not on a
+per instant basis. To make a stage cacheable, it must be derived from `CachingStage` and
+its transition function must be decoration with `@cached_transition`.
 """
 
 from __future__ import annotations
@@ -50,10 +49,14 @@
 
 
 class CachingStage(Generic[NextStage]):
-    """Annotates a stage whose transition to the next one is cacheable.
+    """Annotates a stage whose transition to the next stage is cacheable.
+
+    To make the transition of a stage cacheable, the stage must be derived from this class,
+    and its initialization must call `CachingStage.__init__()`. Furthermore, its transition
+    function must be annotated by the `@cached_transition` decorator.
 
-    To make a transition function cacheable it must be annotated by the
-    `@cached_transition` decorator.
+    A class must implement the `_make_call_description()` to compute an abstract description
+    of the call. This is needed to operate the cache to store the stage transitions.
     """
 
     _cache: StageCache[NextStage]
@@ -71,21 +74,21 @@ def _make_call_description(
         ...
 
 
-ActionFunction = TypeVar("ActionFunction", bound=Callable[..., Any])
+# Type of the transition function.
+TransitionFunction = TypeVar("TransitionFunction", bound=Callable[..., Any])
 
 
 def cached_transition(
-    action: ActionFunction,
-) -> ActionFunction:
+    transition: TransitionFunction,
+) -> TransitionFunction:
     """Decorator for making the transition function of the stage cacheable.
 
-    The decorator will call the annotated function only if the call is not stored inside the cache.
-    The key to look up the call in the cache is computed by `self._make_call_description()`.
-    For this the stage must be derived from `CachingStage`.
+    In order to work, the stage must be derived from `CachingStage`. For computing the key of a
+    call the function will use the `_make_call_description()` function of the cache.
     """
 
-    @functools.wraps(action)
-    def _action_wrapper(  # type: ignore [no-untyped-def]  # return type is deduced from `ActionFunction`
+    @functools.wraps(transition)
+    def transition_wrapper(  # type: ignore [no-untyped-def]  # return type is deduced from `TransitionFunction`
         self: CachingStage,
         *args: Any,
         **kwargs: Any,
@@ -93,11 +96,11 @@ def _action_wrapper(  # type: ignore [no-untyped-def]  # return type is deduced
         key: StageTransformationDescription = self._make_call_description(*args, **kwargs)
         if key in self._cache:
             return self._cache[key]
-        next_stage: stages.Stage = action(self, *args, **kwargs)
+        next_stage: stages.Stage = transition(self, *args, **kwargs)
         self._cache[key] = next_stage
         return next_stage
 
-    return cast(ActionFunction, _action_wrapper)
+    return cast(TransitionFunction, transition_wrapper)
 
 
 def clear_translation_cache() -> None:
@@ -108,7 +111,7 @@ def clear_translation_cache() -> None:
 def get_cache(
     stage: CachingStage,
 ) -> StageCache:
-    """Returns the cache that is used for `stage`."""
+    """Returns the cache that should be used for `stage`."""
     stage_type = type(stage)
     if stage_type not in _TRANSLATION_CACHES:
         _TRANSLATION_CACHES[stage_type] = StageCache()
@@ -117,11 +120,15 @@ def get_cache(
 
 @dataclasses.dataclass(frozen=True)
 class _AbstractCallArgument:
-    """Class to represent one argument to the call in an abstract way.
+    """Class to represent a single argument to the transition function in an abstract way.
 
-    It is used as part of the key in the cache.
-    It represents the structure of the argument, i.e. its shape, type and so on, but nots its value.
-    To construct it you should use the `from_value()` class function which interfere the characteristics from a value.
+    As noted in `StageTransformationDescription` there are two ways to describe an argument,
+    either using its concrete value or an abstract description, which is similar to tracers in Jax.
+    This class represents the second way.
+    To create an instance you should use `_AbstractCallArgument.from_value()`.
+
+    Its description is limited to scalars and arrays. To describe more complex types, they
+    should be processed by pytrees first.
 
     Attributes:
         shape:      In case of an array its shape, in case of a scalar the empty tuple.
@@ -138,41 +145,39 @@ class _AbstractCallArgument:
     @classmethod
     def from_value(
         cls,
-        val: Any,
+        value: Any,
     ) -> _AbstractCallArgument:
-        """Construct an `_AbstractCallArgument` from a value.
-
-        Todo:
-            Handle storage location of arrays correctly.
-        """
-        if not util.is_fully_addressable(val):
+        """Construct an `_AbstractCallArgument` from `value`."""
+        if not util.is_fully_addressable(value):
             raise NotImplementedError("Distributed arrays are not addressed yet.")
-        if isinstance(val, jax_core.Literal):
+        if isinstance(value, jax_core.Literal):
             raise TypeError("Jax Literals are not supported as cache keys.")
 
-        if util.is_array(val):
-            if util.is_jax_array(val):
-                val = val.__array__()  # Passing `copy=False` leads to error in NumPy.
-            shape = val.shape
-            dtype = util.translate_dtype(val.dtype)
-            strides = getattr(val, "strides", None)
+        if util.is_array(value):
+            if util.is_jax_array(value):
+                value = value.__array__()  # Passing `copy=False` leads to error in NumPy.
+            shape = value.shape
+            dtype = util.translate_dtype(value.dtype)
+            strides = getattr(value, "strides", None)
             # Is `CPU_Heap` always okay? There would also be `CPU_Pinned`.
             storage = (
-                dace.StorageType.GPU_Global if util.is_on_device(val) else dace.StorageType.CPU_Heap
+                dace.StorageType.GPU_Global
+                if util.is_on_device(value)
+                else dace.StorageType.CPU_Heap
             )
 
             return cls(shape=shape, dtype=dtype, strides=strides, storage=storage)
 
-        if util.is_scalar(val):
+        if util.is_scalar(value):
             shape = ()
-            dtype = util.translate_dtype(type(val))
+            dtype = util.translate_dtype(type(value))
             strides = None
             # Scalar arguments are always on the CPU and never on the GPU.
             storage = dace.StorageType.CPU_Heap
 
             return cls(shape=shape, dtype=dtype, strides=strides, storage=storage)
 
-        raise TypeError(f"Can not make 'an abstract description from '{type(val).__name__}'.")
+        raise TypeError(f"Can not make 'an abstract description from '{type(value).__name__}'.")
 
 
 #: This type is the abstract description of a function call.
@@ -185,11 +190,12 @@ def from_value(
 
 @dataclasses.dataclass(frozen=True)
 class StageTransformationDescription:
-    """Represents the call to a state transformation function.
+    """Represents the entire call to a state transformation function of a stage.
 
-    State transition functions are annotated with `@cached_transition` and stored inside a cache.
-    This class serves as a key inside this cache and is generated by `CachingStage._make_call_description()`.
-    The actual key is consists of two parts.
+    State transition functions are annotated with `@cached_transition` and their result may be
+    cached. They key to locate them inside the cache is represented by this class.
+    The cache will call the `CachingStage._make_call_description()` function to get a key.
+    The actual key is consists of two parts, `stage_id` and `call_args`.
 
     Attributes:
         stage_id:   Origin of the call, for which the id of the stage object should be used.
@@ -200,11 +206,8 @@ class StageTransformationDescription:
             - Concrete description: Here one caches on the actual value of the argument.
                 The only requirement is that they can be hashed.
 
-    Notes:
-        The base assumption is that the stages are immutable.
-
     Todo:
-        - pytrees.
+        In the future pytrees will be used as third part.
     """
 
     stage_id: int
@@ -216,7 +219,7 @@ class StageTransformationDescription:
 
 
 class StageCache(Generic[StageType]):
-    """LRU cache that is used to cache the stage transitions, i.e. lowering and compiling, in Jace.
+    """Simple LRU cache to cache the results of the stage transition function.
 
     Notes:
         The most recently used entry is at the end of the `OrderedDict`.
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index bc2bf10..c719bd4 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -24,6 +24,8 @@
 class CompilerOptions(TypedDict, total=False):
     """All known compiler options known to `JaceLowered.compile()`.
 
+    See `jace_optimize()` for a description of the different options.
+
     There are some predefined option sets in `jace.jax.stages`:
     - `DEFAULT_COMPILER_OPTIONS`
     - `NO_OPTIMIZATIONS`
@@ -48,13 +50,13 @@ def jace_optimize(
     tsdfg: translator.TranslatedJaxprSDFG,
     **kwargs: Unpack[CompilerOptions],
 ) -> None:
-    """Performs optimization of the `fsdfg` _inplace_.
+    """Performs optimization of the `fsdfg` _in place_.
 
     Currently this function only supports simplification.
     Its main job is to exists that we have something that we can call in the tool chain.
 
     Args:
-        simplify:       Run the simplification pilepline.
+        simplify:       Run the simplification pipeline.
         auto_optimize:  Run the auto optimization pipeline (currently does nothing)
 
     Note:
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index aa794b6..b801214 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -32,26 +32,27 @@ class JaxprTranslationDriver:
     - It lacks the special `__return` variable,
     - the `arg_names` parameter is not set.
 
-    For these reasons the SDFG is not directly usable, and further manipulations have to be performed.
-    Especially, DaCe's validation function will fail and it is unable to be processed by the
-    optimization pipeline. For more information also see `jace.translator.post_translation` module.
-
-    The idea of the translator is extremely simple. Since Jaxpr is a list consisting of more or less
-    simple instructions/equations, they get processed one after the other.
-    Each equation is translated into its own state that is appended to the SDFG, thus the SDFG is a
-    long list of states. In certain cases it might be that an equation needs more states,
-    but this is an exception.
-
-    The actual translation of the equation is not handled by the driver.
-    Instead the request is forwarded to a `PrimitiveTranslator` object, known as primitive translator
-    or subtranslator. This is a highly specialized object that is able to handle one kind of primitive.
-    For more information on them see the documentation of `PrimitiveTranslator`.
+    For these reasons the SDFG is not directly usable, and further manipulations have to be
+    performed. Especially, DaCe's validation function will fail and it is unable to be processed
+    by the optimization pipeline. For more information also see `jace.translator.post_translation`
+    module.
+
+    The idea of the translator is extremely simple. Since Jaxpr is a list consisting of more or
+    less simple instructions/equations, they get processed one after the other. Each equation is
+    translated into its own state that is appended to the SDFG, thus the SDFG is a long list of
+    states. In certain cases it might be that an equation needs more states, but this is an
+    exception.
+
+    The actual translation of the equation is not handled by the driver. Instead the request is
+    forwarded to a `PrimitiveTranslator` object, known as primitive translator or subtranslator.
+    This is a highly specialized object that is able to handle one kind of primitive. For more
+    information on them see the documentation of `PrimitiveTranslator`.
 
     To start a translation the `translate_jaxpr()` function should be called, if this happens it is
     said that the driver has an ongoing translation. If `translate_jaxpr()` is called on a driver
-    that has an ongoing translation, a new translation context will be set up.
-    Thus the driver will then translate the supplied (nested) Jaxpr and return the result.
-    However, this will have no influence on the translation process that is already going.
+    that has an ongoing translation, a new translation context will be set up. Thus the driver
+    will then translate the supplied (nested) Jaxpr and return the result. However, this will have
+    no influence on the translation process that is already going.
 
     Notes:
         After the main translation has been performed the translator object can be used again.
@@ -75,8 +76,8 @@ def __init__(
             primitive_translators:    Primitive to use during the translation.
 
         Note:
-            The primitive translators are not copied, thus the user has to ensure that the passed mapping
-            does not change during the translation.
+            The primitive translators are not copied, thus the user has to ensure that the
+            passed mapping does not change during the translation.
         """
         # Maps name of primitives to the associated translator.
         self._primitive_translators = primitive_translators
@@ -118,8 +119,8 @@ def translate_jaxpr(
         # NOTE: If `self` is already allocated, i.e. has an ongoing translation process,
         #       the `_allocate_translation_ctx()` function will start a new context.
         #       Thus the driver will start to translate a second (nested) SDFG.
-        #       Also note that there is no mechanism that forces the integration of the nested SDFG/Jaxpr,
-        #       this must be done manually.
+        #       Also note that there is no mechanism that forces the integration of the nested
+        #       SDFG/Jaxpr, this must be done manually.
         self._allocate_translation_ctx(
             name=name,
         )
@@ -139,11 +140,12 @@ def append_new_state(
     ) -> dace.SDFGState:
         """Creates a new `SDFGState` and adds it to the SDFG.
 
-        By default the new state is appended to the current terminal state,
-        which will also update the terminal state of recorded inside `self`.
+        By default the new state is appended to the current terminal state, which will also update
+        the terminal state inside `self`.
 
-        However, if `prev_state` is specified the state new state will be appended to `prev_state` instead.
-        The terminal state of `self` will only be modified if `prev_state` is the current terminal state.
+        However, if `prev_state` is specified the state new state will be appended to `prev_state`
+        instead. The terminal state of `self` will only be modified if `prev_state` is the current
+        terminal state.
 
         Args:
             label:          The name that should be given to the new `SDFGState`.
@@ -178,8 +180,8 @@ def arrays(self) -> Mapping[str, ddata.Data]:
         """Get all data descriptors that are currently known to the SDFG.
 
         Notes:
-            Essentially a shorthand and preferred way for `self.sdfg.arrays`.
-            For getting a specific data descriptor use `self.get_array()`.
+            Essentially a shorthand and preferred way for `self.sdfg.arrays`. For getting a
+            specific data descriptor use `self.get_array()`.
         """
         return cast(Mapping[str, ddata.Data], self._ctx.sdfg.arrays)
 
@@ -189,8 +191,8 @@ def get_array(
     ) -> ddata.Data:
         """Returns the SDFG `Data` object `name` referees to.
 
-        If `name` is a string it is directly interpreted as the name of an SDFG variable.
-        In other cases it is first translated using `self.map_jax_var_to_sdfg()`.
+        If `name` is a string it is directly interpreted as the name of an SDFG variable. In other
+        cases it is first translated using `self.map_jax_var_to_sdfg()`.
         """
         if isinstance(name, (jax_core.Var, util.JaCeVar)):
             sdfg_name: str = self.map_jax_var_to_sdfg(name)
@@ -259,7 +261,7 @@ def is_allocated(self) -> bool:
         return False
 
     def is_root_translator(self) -> bool:
-        """Tests if `self` is a root translator.
+        """Tests if `self` is the root translator.
 
         The root translator (context) is the very first translator process that was started.
         """
@@ -276,8 +278,8 @@ def add_jax_name_mapping(
     ) -> JaxprTranslationDriver:
         """Creates a new mapping between `jax_var` to `sdfg_name`.
 
-        If the mapping already exists an error will be generated. This function is not
-        able to delete a variable mapping that was established before, for this use TBA.
+        If the mapping already exists an error will be generated. This function is not able to
+        delete a variable mapping that was established before.
 
         Args:
             jax_var:     The Jax variable.
@@ -309,13 +311,13 @@ def add_array(
 
         The SDFG object is always created as a transient.
 
-        By default the function will use `jace.util.propose_jax_name()` to derive
-        the name that should be used. However, by passing a `JaCeVar` with a name it
-        is possible to suggest a specific name. In addition it is possible to specify
-        `name_prefix` to prefix name that would be used.
+        By default the function will use `jace.util.propose_jax_name()` to derive the name that
+        should be used. However, by passing a `JaCeVar` with a name it is possible to suggest a
+        specific name. In addition it is possible to specify `name_prefix` to prefix name that
+        would be used.
 
-        The function will not update the internal variable mapping.
-        If this is desired one can set `update_var_mapping`, for forcing this.
+        The function will not update the internal variable mapping. If this is desired one can
+        set `update_var_mapping`, for forcing this.
 
         Args:
             arg:                The Jax object for which a SDFG equivalent should be created.
@@ -403,10 +405,10 @@ def create_jax_var_list(  # type: ignore[misc]
         If a Jax variable already has a SDFG equivalent then the function will use this variable.
         If no corresponding SDFG variable is known the function will create one using `add_array()`.
 
-        By setting `prevent_creation` the function will not create any new SDFG variables,
-        if no corresponding SDFG variable exists an error is generated. By setting `only_creation`
-        the function will only create new SDFG variables, if a variable already have a
-        corresponding SDFG variable an error will be created.
+        By setting `prevent_creation` the function will not create any new SDFG variables, if no
+        corresponding SDFG variable exists an error is generated. By setting `only_creation` the
+        function will only create new SDFG variables, if a variable already have a corresponding
+        SDFG variable an error will be created.
 
         By default literals cause an error. However, by setting `handle_literals` to `True`
         literals will will be included in the output with the value `None`.
@@ -416,7 +418,7 @@ def create_jax_var_list(  # type: ignore[misc]
             prevent_creation:   Never create a variable, all must already be known.
             only_creation:      Always create a variable, it is an error if one already exist.
             handle_literals:    Allow the processing of literals.
-            kwargs:             Will be forwarded to `self.add_array()` in case a variable is created.
+            kwargs:             Will be forwarded to `self.add_array()` if a variable is created.
 
         Todo:
             - Rollback if the creation fails.
@@ -478,8 +480,8 @@ def _create_constants(
     ) -> Sequence[str]:
         """Creates all constants requested by the `jaxpr` and return a list with their SDFG names.
 
-        The function will create an SDFG variable and add them as constant to the SDFG.
-        The value they should have is deepcopied.
+        The function will create an SDFG variable and add them as constant to the SDFG. Their value
+        is deepcopied.
         """
         from copy import deepcopy
 
@@ -507,16 +509,15 @@ def _allocate_translation_ctx(
     ) -> JaxprTranslationDriver:
         """This function allocates and initialize the members of the translation context of `self`.
 
-        If this function is called and `self` is already allocated, the function will create a
-        new context, allowing the driver to handle nested Jaxpr.
-        The first context that is created is also known as root translator.
+        If this function is called and `self` is already allocated, the function will create a new
+        context, allowing the driver to handle nested Jaxpr.
+        The first context that is created is known as root translator.
 
         Args:
             name:               The name of the SDFG.
         """
         from jace import translator  # Cyclic import
 
-        # Create a new translation context and put it on the stack.
         self._ctx_stack.append(
             translator.TranslatedJaxprSDFG(
                 name=name,
@@ -631,8 +632,8 @@ def _translate_jaxpr_internal(
 
         The function assumes that the context is allocated as well as the initial variables.
         The function will return the internal state of `self` encapsulated inside a
-        `TranslatedJaxprSDFG` object.
-        The function will also deallocate the current context upon return.
+        `TranslatedJaxprSDFG` object. The function will also deallocate the current context
+        upon return.
 
         Args:
             jaxpr:      The Jaxpr to translate.
@@ -643,7 +644,6 @@ def _translate_jaxpr_internal(
         nb_translated_eqn: int = 0
         out_var_names: Sequence[str] = ()
 
-        # Translate the equations one by one.
         for eqn in jaxpr.jaxpr.eqns:
             if any(util.is_drop_var(outVar) for outVar in eqn.outvars):
                 assert all(util.is_drop_var(outVar) for outVar in eqn.outvars)
@@ -651,11 +651,10 @@ def _translate_jaxpr_internal(
             _, out_var_names = self._translate_single_eqn(eqn=eqn)
             nb_translated_eqn += 1
 
-        # There were no equation, so handle the copying of input to output.
+        # There were no (useful) equations; thus the Jaxpr was empty.
         if nb_translated_eqn == 0:
             out_var_names = self._handle_null_jaxpr(jaxpr)
 
-        # Proper output names in the context.
         self._ctx.out_names = tuple(out_var_names)
 
         return cast("translator.TranslatedJaxprSDFG", self._clear_translation_ctx())
@@ -683,7 +682,7 @@ def _handle_null_jaxpr(
         if len(jaxpr.out_avals) == 0:
             return ()
 
-        # List of the output variables.
+        # List of the real output variables.
         out_var_names: list[str] = []
 
         # If we are here then we are dealing with a nested SDFG/Jaxpr, that has output.
@@ -696,7 +695,7 @@ def _handle_null_jaxpr(
             sdfg_in_name: str = self.map_jax_var_to_sdfg(jax_out_var)
 
             # Now we create a variable that serves as true output, however, since the Jax variable
-            #  is already known we can not update the variable mapping.
+            #  is already known we can not update the variable mapping and must use another name.
             sdfg_out_name = self.add_array(
                 jax_out_var,
                 name_prefix="_zero_equation_output_for_",
@@ -713,10 +712,10 @@ def _handle_null_jaxpr(
                 data=dace.Memlet.from_array(sdfg_in_name, self.get_array(sdfg_in_name)),
             )
 
-            # A Jax variable now has, in some sense, two SDFG equivalent, the input, that
+            # `jax_out_var` now has, in some sense, two SDFG equivalents, the input, that
             #  was previously created by `self._create_initial_input()` and the `sdfg_out_name`
-            #  we just created. But we can not add this to the mapping, because of this situation
-            #  we will now remove the variable from the mapping all together.
+            #  we just created. But we can not add this to the mapping. Because it is the best,
+            #  as in least worst, thing we can do we remove it from the mapping.
             #  I am open for different approaches.
             self._jax_name_map.pop(jax_out_var)
 
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index 08ec3f7..b785186 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -4,11 +4,13 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
-"""Module for managing the individual sutranslators.
+"""Module for managing the global primitive translators.
 
-The high level idea is that there is a "list" of instances of `PrimitiveTranslator`,
-which is known as `_PRIMITIVE_TRANSLATORS_DICT`.
-If not specified the content of this list is used to perform the translation.
+The high level idea is that there is a registry of all currently active primitive translators.
+If `primitive_translators` is not given to `jit` it will use this global registry.
+A primitive, i.e. an object that satisfies the `PrimitiveTranslator` interface, can be added
+to the registry by `register_primitive_translator()`. To retrieve the translators that are
+currently active you can use the `get_regsitered_primitive_translators()` function.
 """
 
 from __future__ import annotations
@@ -20,102 +22,112 @@
 if TYPE_CHECKING:
     from jace import translator
 
-# These are the currently active primitive translators of JaCe.
+#: Global registry of the active primitive translators.
+#:  The `dict` maps the name of a primitive to its associated translators.
 _PRIMITIVE_TRANSLATORS_DICT: dict[str, translator.PrimitiveTranslator] = {}
 
 
 @overload
 def make_primitive_translator(
     primitive: str,
-    prim_translator: Literal[None] = None,
+    primitive_translator: Literal[None] = None,
 ) -> Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]: ...
 
 
 @overload
 def make_primitive_translator(
-    primitive: str, prim_translator: translator.PrimitiveTranslatorCallable
+    primitive: str, primitive_translator: translator.PrimitiveTranslatorCallable
 ) -> translator.PrimitiveTranslator: ...
 
 
 def make_primitive_translator(
     primitive: str,
-    prim_translator: translator.PrimitiveTranslatorCallable | None = None,
+    primitive_translator: translator.PrimitiveTranslatorCallable | None = None,
 ) -> (
     Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]
     | translator.PrimitiveTranslator
 ):
-    """Decorator to turn a Callable into a `PrimitiveTranslator` for primitive `primitive`.
+    """Turn `primitive_translator` into a `PrimitiveTranslator` for primitive `primitive`.
 
-    This function can be used to decorate functions that should serve as primitive translators.
-    Essentially, the decorator adds a `primitive` property to the decorated function and returns it.
-    However, this function does not register the primitive into the global registry,
-    for this you have to use `register_primitive_translator()`.
+    Essentially, this function adds the `primitive` property to a callable, such that it satisfy
+    the `PrimitiveTranslator` protocol. However, it does not add it to the registry, for that
+    `register_primitive_translator()` has to be used.
+
+    Notes:
+        This function cal also be used as decorator.
     """
 
     def wrapper(
-        prim_translator: translator.PrimitiveTranslatorCallable,
+        primitive_translator: translator.PrimitiveTranslatorCallable,
     ) -> translator.PrimitiveTranslator:
         from jace import translator  # Cyclic
 
-        if getattr(prim_translator, "primitive", primitive) != primitive:
+        if getattr(primitive_translator, "primitive", primitive) != primitive:
             raise ValueError(
-                f"Tried to change the 'primitive' property of '{prim_translator}' from '{prim_translator.primitive}' to '{primitive}'."  # type: ignore[attr-defined]
+                f"Tried to change the 'primitive' property of '{primitive_translator}' from "
+                f"'{primitive_translator.primitive}' to '{primitive}'."  # type: ignore[attr-defined]
             )
-        prim_translator.primitive = primitive  # type: ignore[attr-defined]  # we add the attribute, so it is not defined yet.
-        return cast(translator.PrimitiveTranslator, prim_translator)
+        primitive_translator.primitive = primitive  # type: ignore[attr-defined]  # We define the attribute.
+        return cast(translator.PrimitiveTranslator, primitive_translator)
 
-    return wrapper if prim_translator is None else wrapper(prim_translator)
+    return wrapper if primitive_translator is None else wrapper(primitive_translator)
 
 
 @overload
 def register_primitive_translator(
-    prim_translator: Literal[None] = None,
+    primitive_translator: Literal[None] = None,
     overwrite: bool = False,
 ) -> Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]: ...
 
 
 @overload
 def register_primitive_translator(
-    prim_translator: translator.PrimitiveTranslator,
+    primitive_translator: translator.PrimitiveTranslator,
     overwrite: bool = False,
 ) -> translator.PrimitiveTranslator: ...
 
 
 def register_primitive_translator(
-    prim_translator: translator.PrimitiveTranslator | None = None,
+    primitive_translator: translator.PrimitiveTranslator | None = None,
     overwrite: bool = False,
 ) -> (
     translator.PrimitiveTranslator
     | Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]
 ):
-    """Adds the primitive translator to Jace's internal list of translators and return it again.
+    """Adds a primitive translator to Jace's global registry.
 
-    If the primitive is already known an error is generated, if `overwrite` is set, it will be replaced.
-    To add a `primitive` property use the `@make_primitive_translator` decorator.
+    If a translator for `primitive` is already registered an error will be generated. However,
+    by specifying `overwrite` `primitive_translator` will replace the current one.
 
     Args:
-        prim_translator:    The primitive translator to annotate.
-        overwrite:          Replace the current primitive translator with `prim_translator`.
+        primitive_translator: The primitive translator to add to the global registry.
+        overwrite:            Replace the current primitive translator with `primitive_translator`.
+
+    Note:
+        To add a `primitive` property use the `@make_primitive_translator` decorator.
+        This function returns `primitive_translator` unmodified, which allows it to be
+        used as decorator.
     """
 
     def wrapper(
-        prim_translator: translator.PrimitiveTranslator,
+        primitive_translator: translator.PrimitiveTranslator,
     ) -> translator.PrimitiveTranslator:
-        if prim_translator.primitive in _PRIMITIVE_TRANSLATORS_DICT and not overwrite:
+        if primitive_translator.primitive in _PRIMITIVE_TRANSLATORS_DICT and not overwrite:
             raise ValueError(
-                f"Explicit override=True needed for primitive '{prim_translator.primitive}' to overwrite existing one."
+                f"Explicit override=True needed for primitive '{primitive_translator.primitive}' "
+                "to overwrite existing one."
             )
-        _PRIMITIVE_TRANSLATORS_DICT[prim_translator.primitive] = prim_translator
-        return prim_translator
+        _PRIMITIVE_TRANSLATORS_DICT[primitive_translator.primitive] = primitive_translator
+        return primitive_translator
 
-    return wrapper if prim_translator is None else wrapper(prim_translator)
+    return wrapper if primitive_translator is None else wrapper(primitive_translator)
 
 
 def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTranslator]:
-    """Returns a view of the _currently_ active set of installed primitive translators in Jace.
+    """Returns a copy of the current state of Jace's global primitive registry.
 
-    The returned mapping represents the active primitive translators at the time of calling.
-    This means that calls to `register_primitive_translator()` or any other mutating call will not affect the returned object.
+    The function returns a mapping that maps the name of a primitive to the associated translator.
+    No change to the global registry will affect the return value and vice versa.
     """
     return _PRIMITIVE_TRANSLATORS_DICT.copy()
 
@@ -123,10 +135,11 @@ def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTran
 def set_active_primitive_translators_to(
     new_translators: Mapping[str, translator.PrimitiveTranslator],
 ) -> MutableMapping[str, translator.PrimitiveTranslator]:
-    """Exchange the currently active subtranslators in Jace with `new_translators` and returns the previous ones.
+    """Exchange the global translator registry of Jace with `new_translators`.
 
-    This function allows you to restore a specific state that was obtained by a previous call to `get_regsitered_primitive_translators()`.
-    While the function returns a mutable object, any changes to the returned object have no effect on the global state of the registry.
+    The function will return the state of the global translator registry just before this call.
+    Any changes to `new_translators` after calling this function will have no effect on the
+    global translator registry and vice versa.
     """
     global _PRIMITIVE_TRANSLATORS_DICT
     assert all(getattr(trans, "primitive", prim) for prim, trans in new_translators.items())
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index fc28160..bfe5125 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -8,6 +8,8 @@
 """This module contains all functions that are related to post processing the SDFG.
 
 Most of them operate on `TranslatedJaxprSDFG` objects.
+
+Currently they mostly exist for the sake of existing.
 """
 
 from __future__ import annotations
@@ -47,9 +49,10 @@ def finalize_jaxpr_sdfg(
 
     This function will turn a non finalized, i.e. canonical, SDFG into a finalized one,
     i.e. after this function `tsdfg.is_finalized` is `True`.
-    Thus the function will:
-    - Mark all input and output variables, i.e. listed in `tsdfg.{inp, out}_names`, as globals.
-    - Deallocate all members of `tsdfg` that are no longer needed.
+    The function will:
+    - mark all input and output variables, i.e. listed in `tsdfg.{inp, out}_names`, as globals,
+    - set the `arg_names` property of the SDFG,
+    - deallocate all members of `tsdfg` that are no longer needed.
     """
     if tsdfg.is_finalized:
         raise ValueError("The supplied SDFG is already finalized.")
@@ -67,7 +70,7 @@ def finalize_jaxpr_sdfg(
         sdfg_arg_names.append(glob_name)
 
     # This forces the signature of the SDFG to include all arguments in order they appear.
-    #  If an argument is reused (donated) then it is only listed once, the first time it appears
+    #  If an argument is used as input and output then it is only listed as input.
     tsdfg.sdfg.arg_names = sdfg_arg_names
 
     # Now we will deallocate the fields and mark `self` as finalized.
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index 8e18a27..bdca3d4 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -24,6 +24,8 @@ class PrimitiveTranslatorCallable(Protocol):
     """Callable version of the primitive translators.
 
     Used for type annotation purposes, classes should be derived from `PrimitiveTranslator` instead.
+    You can use `jace.translator.make_primitive_translator()` to add a `primitive` property to
+    a callable.
     """
 
     __slots__ = ()
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 1d08fce..3196b27 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -15,26 +15,30 @@
 class TranslatedJaxprSDFG:
     """Encapsulates the result of a translation run of the `JaxprTranslationDriver` object.
 
-    The fields used to store the result are:
-    - `sdfg` the SDFG object that was created.
-    - `inp_names` a list of the SDFG variables that are used as input, in the same order as `Jaxpr.invars`.
-    - `out_names` a list of the SDFG variables that are used as output, in the same order as `Jaxpr.outvars`.
-    - `start_state` the first state in the SDFG state machine.
-    - `terminal_state` the last state in the state machine.
-    - `is_finalized` a bool that indicates if `self` represents a finalized or canonical SDFG, see below.
-
-    Note, that it might happen that a name appears in both the `inp_names` and `out_names` lists.
-    This happens if an argument is used both as input and output, and it is not an error.
-    In Jax this is called argument donation.
-
-    By default `self` encapsulates a canonical SDFG, see `JaxprTranslationDriver` for more information on this.
-    However, if `is_finalized` is set, then `self` contains a finalized SDFG, i.e.
-    - all input an output arrays are marked as global,
-    - however, there are no `__return` arrays, i.e. all arguments are passed as arguments,
-    - its `arg_names` are set with set `inp_names + out_names`, however,
-        arguments that are input and outputs are only listed as inputs.
-
-    Furthermore, only `sdfg`, `inp_names` and `out_names` are guaranteed to be allocated, all other fields might be `None`.
+    This class is used by the `JaxprTranslationDriver` to store the context of the SDFG that is
+    currently under construction and the return value of `JaxprTranslationDriver.translate_jaxpr()`.
+    A user should never create a `TranslatedJaxprSDFG` manually.
+
+    It might happen that a name appears in both the `inp_names` and `out_names` lists. This happens
+    if an argument is used both as input and output, and it is not an error. In Jax this is called
+    argument donation.
+
+    By default `self` encapsulates a canonical SDFG, see `JaxprTranslationDriver` for more
+    information on this. However, if `is_finalized` is set, then `self` contains a finalized SDFG,
+    which differs from a canonical SDFG in the following ways:
+    - all input and output arrays are marked as global,
+    - however, there are no `__return` arrays, i.e. all return values are passed as arguments,
+    - its `arg_names` are set with set `inp_names + out_names`, however, arguments that are input
+        and outputs are only listed as inputs,
+    - only the `sdfg`, `inp_names`, `out_names` and `is_finalized` are guaranteed to be not `None`.
+
+    Attributes:
+        sdfg:           The SDFG object that was created.
+        inp_names:      A list of the SDFG variables that are used as input, same order as `Jaxpr.invars`.
+        out_names:      A list of the SDFG variables that are used as output, same order as `Jaxpr.outvars`.
+        start_state:    The first state in the SDFG state machine.
+        terminal_state: The (currently) last state in the state machine.
+        is_finalized:   Indicates if `self` represents a finalized or canonical SDFG.
     """
 
     sdfg: dace.SDFG
diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index 657ef30..c3d7249 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -5,10 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""This module contains functions for debugging the translator.
-
-Everything in this module is experimental and might vanish anytime.
-"""
+"""Contains everything for compiling and running `TranslatedJaxprSDFG` instances."""
 
 from __future__ import annotations
 
@@ -18,20 +15,20 @@
 
 import dace
 import numpy as np
-from dace import data as ddata
+from dace import data as dace_data
 
 
 if TYPE_CHECKING:
     from jace import translator
-    from jace.util import dace_helper as jdace
+    from jace.util import dace_helper
 
 
 def compile_jax_sdfg(
     tsdfg: translator.TranslatedJaxprSDFG,
-) -> jdace.CompiledSDFG:
-    """This function compiles the SDFG embedded in the embedded `tsdfg` (`TranslatedJaxprSDFG`).
+) -> dace_helper.CompiledSDFG:
+    """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object.
 
-    For executing the SDFG, the `run_jax_sdfg()` function, together with the `tsdfg.{inp, out}_names` can be used.
+    The function requires that `tsdfg` is finalized.
     """
     if not tsdfg.is_finalized:
         raise ValueError("Can only compile a finalized SDFG.")
@@ -53,12 +50,11 @@ def compile_jax_sdfg(
         #  This happens if we compile the same lowered SDFG multiple times with different options.
         sdfg.name = f"{sdfg.name}__comp_{int(time.time() * 1000)}"
 
-        # Actual compiling the stuff; forcing that a recompilation happens
         with dace.config.temporary_config():
             sdfg._recompile = True
             sdfg._regenerate_code = True
             dace.Config.set("compiler", "use_cache", value=False)
-            csdfg: jdace.CompiledSDFG = sdfg.compile()
+            csdfg: dace_helper.CompiledSDFG = sdfg.compile()
 
     finally:
         sdfg.name = org_sdfg_name
@@ -69,7 +65,7 @@ def compile_jax_sdfg(
 
 
 def run_jax_sdfg(
-    csdfg: jdace.CompiledSDFG,
+    csdfg: dace_helper.CompiledSDFG,
     inp_names: Sequence[str],
     out_names: Sequence[str],
     cargs: Sequence[Any],
@@ -78,6 +74,8 @@ def run_jax_sdfg(
     """Run the compiled SDFG.
 
     The function assumes that the SDFG was finalized and then compiled by `compile_jax_sdfg()`.
+    For running the SDFG you also have to pass the input names (`inp_names`) and output names
+    (`out_names`) that where inside the `TranslatedJaxprSDFG` from which `csdfg` was compiled from.
 
     Args:
         csdfg:      The `CompiledSDFG` object.
@@ -89,8 +87,13 @@ def run_jax_sdfg(
     Note:
         There is no pytree mechanism jet, thus the return values are returned inside a `tuple`
         or in case of one value, directly, in the order determined by Jax.
-        Currently, this function does not consider strides in the input, all input must be `C_CONTIGUOUS`.
-        Currently, the SDFG must not have any undefined symbols, i.e. no undefined sizes.
+        Currently, this function does not consider strides in the input, all input must be
+        `C_CONTIGUOUS` nor have any undefined symbols.
+
+    Todo:
+        Since we do not have symbols and a fixed size this works and there is no problem.
+        However, if we have symbols or variable sizes, we must ensure that the init function of
+        the SDFG is called every time, or ensure that its exit function runs every time.
     """
     from jace import util
 
@@ -117,8 +120,8 @@ def run_jax_sdfg(
 
     for out_name, sarray in ((name, sdfg.arrays[name]) for name in out_names):
         assert not (out_name in call_args and util.is_jax_array(call_args[out_name]))
-        assert isinstance(sarray, ddata.Array)
-        call_args[out_name] = ddata.make_array_from_descriptor(sarray)
+        assert isinstance(sarray, dace_data.Array)
+        call_args[out_name] = dace_data.make_array_from_descriptor(sarray)
 
     assert len(call_args) == len(csdfg.argnames), (
         "Failed to construct the call arguments,"
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 0832237..1a8ae12 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -7,10 +7,8 @@
 
 """Implements all utility functions that are related to Jax.
 
-Most of the functions defined here allow an unified access to Jax' internals
-in a consistent and stable way.
-It is important that this module is different from the `jace.jax` module, which
-mimics the full `jax` package itself.
+Most of the functions defined here allow an unified access to Jax' internal in a consistent and
+stable way.
 """
 
 from __future__ import annotations
@@ -30,14 +28,15 @@
 class JaCeVar:
     """Replacement for the `jax.Var` class.
 
-    This class can be seen as some kind of substitute `jax.core.Var`.
-    The main intention of this class is as an internal representation of values, as they are used in Jax, but without the Jax machinery.
-    As abstract values in Jax this class has a datatype, which is a `dace.typeclass` instance and a shape.
-    In addition it has an optional name, which allows to create variables with a certain name using `JaxprTranslationDriver.add_array()`.
+    This class can be seen as some kind of substitute `jax.core.Var`. The main intention of this
+    class is as an internal representation of values, as they are used in Jax, but without the Jax
+    machinery. As abstract values in Jax this class has a datatype, which is a `dace.typeclass`
+    instance and a shape. In addition it has an optional name, which allows to create variables
+    with a certain name using `JaxprTranslationDriver.add_array()`.
 
     Note:
         If the name of a `JaCeVar` is '_' it is considered a drop variable.
-        The definitions of `__hash__` and `__eq__` are in accordance how Jax variable works.
+        The definitions of `__hash__` and `__eq__` are in accordance with how Jax variable works.
 
     Todo:
         - Add support for strides.
@@ -74,8 +73,8 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
 
     Notes:
         If `jax_var` is a `JaCeVar` the function will return, if defined, its `.name` property.
-        Otherwise it will compose a name similar to Jax `Var` objects.
-        The returned names are stable, i.e. it will output the same value for the same variable.
+        Otherwise it will compose a name similar to Jax `Var` objects. The returned names are
+        stable, i.e. it will output the same value for the same variable.
     """
     match jax_var:
         case jax_core.DropVar():
@@ -83,22 +82,20 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
         case JaCeVar():
             return jax_var.name if jax_var.name else f"jax{id(jax_var)}"
         case jax_core.Var():
-            # This is not how the pretty printer works nor Jax.Var.__repr__, but leads to stable names that can be used.
+            # This is not how the pretty printer works nor Jax.Var.__repr__,
+            #  but leads to stable and valid names.
             return f"jax{jax_var.count}{jax_var.suffix}"
         case jax_core.Literal():
             raise TypeError("Can not derive a name from a Jax Literal.")
         case _:
             raise TypeError(
-                f"Does not know how to transform '{jax_var}' (type: '{type(jax_var).__name__}') into a string."
+                f"Does not know how to transform '{jax_var}' (type: '{type(jax_var).__name__}') "
+                "into a string."
             )
 
 
 def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symbol | str, ...]:
-    """Returns the shape of a Jax variable.
-
-    Args:
-        jax_var:     The variable to process
-    """
+    """Returns the shape of `jax_var`."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
             return jax_var.aval.shape
@@ -114,7 +111,7 @@ def get_jax_var_dtype(jax_var: jax_core.Atom | JaCeVar) -> dace.typeclass:
         case jax_core.Var() | jax_core.Literal():
             return translate_dtype(jax_var.aval.dtype)
         case JaCeVar():
-            return translate_dtype(jax_var.dtype)
+            return jax_var.dtype
         case _:
             raise TypeError(f"'get_jax_var_dtype()` is not implemented for '{type(jax_var)}'.")
 
@@ -125,11 +122,8 @@ def is_tracing_ongoing(
 ) -> bool:
     """Test if tracing is ongoing.
 
-    While a return value `True` guarantees that a translation is ongoing,
-    a value of `False` does not guarantees that no tracing is active.
-
-    Raises:
-        RuntimeError: If the function fails to make a detection.
+    While a return value `True` guarantees that a translation is ongoing, a value of `False`
+    does not guarantees that no tracing is active.
     """
     # The current implementation only checks the arguments if it contains tracers.
     if (len(args) == 0) and (len(kwargs) == 0):
@@ -156,19 +150,19 @@ def propose_jax_name(
 ) -> str:
     """Proposes a variable name for `jax_var`.
 
-    If `jax_name_map` is `None` then the function will fallback to `get_jax_var_name()`.
+    If `jax_name_map` is `None` the function will fallback to `get_jax_var_name(jax_var)`.
     If `jax_name_map` is supplied the function will:
     - if `jax_var` is stored inside `jax_name_map` this value will be returned.
-    - if `jax_var` is a `JaCeVar` with a set `.name` property it will be returned.
-    - otherwise the function will generate a new name similar to how the pretty printer of Jaxpr works.
+    - if `jax_var` is a `JaCeVar` with a set `.name` property that name will be returned.
+    - otherwise the function will generate a new name in a similar way than pretty printer of Jaxpr.
 
     Args:
         jax_var:        The variable for which a name to propose.
         jax_name_map:   A mapping of all Jax variables that were already named.
 
     Note:
-        The function guarantees that the returned name passes `VALID_SDFG_VAR_NAME` test
-        and that the name is not part of `util.FORBIDDEN_SDFG_VAR_NAMES`.
+        The function guarantees that the returned name passes `VALID_SDFG_VAR_NAME` test and that
+        the name is not inside `util.FORBIDDEN_SDFG_VAR_NAMES`.
         Dropped variables will always be named `'_'`.
     """
     if isinstance(jax_var, jax_core.Literal):
@@ -180,8 +174,9 @@ def propose_jax_name(
     if isinstance(jax_var, JaCeVar) and (jax_var.name is not None):
         return jax_var.name
 
-    # We have the set of all previous names, so we generate names
-    #  in the same way as Jax does:
+    # This code is taken from Jax so it will generate similar ways, the difference is that
+    #  we do the counting differently.
+    #  Note that `z` is followed by `ba` and not `aa` as it is in Excel.
     c = len(jax_name_map)
     jax_name = ""
     while len(jax_name) == 0 or c != 0:
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 44ba097..8e063cc 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -24,12 +24,10 @@
 def is_jaceified(obj: Any) -> TypeGuard[jjax.JaceWrapped]:
     """Tests if `obj` is decorated by JaCe.
 
-    Similar to `jace.util.is_jaxified`, but for JaCe object.
+    Similar to `is_jaxified`, but for JaCe object.
     """
     if util.is_jaxified(obj):
         return False
-    # Currently it is quite simple because we can just check if `obj`
-    #  is derived from `jace.jax.JaceWrapped`, might become harder in the future.
     return isinstance(obj, jjax.JaceWrapped)
 
 
@@ -39,9 +37,7 @@ def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.Dro
     if isinstance(jax_var, jax_core.DropVar):
         return True
     if isinstance(jax_var, util.JaCeVar):
-        # We type narrow it to a pure jax DropVar, because essentially
-        #  you can not do anything with it.
-        return jax_var.name == "_"
+        return jax_var.name == "_" if jax_var.name else False
     return False
 
 
@@ -51,14 +47,12 @@ def is_jaxified(
     """Tests if `obj` is a "jaxified" object.
 
     A "jaxified" object is an object that was processed by Jax.
-    While a return value of `True` guarantees a jaxified object, `False` might not proof the contrary.
-    See also `jace.util.is_jaceified()` to tests if something is a Jace object.
+    While a return value of `True` guarantees a jaxified object, `False` does not proof the
+    contrary. See also `jace.util.is_jaceified()` to tests if something is a Jace object.
     """
-
-    # These are all types we consider as jaxify
     jaxifyed_types = (
         jax_core.Primitive,
-        # jstage.Wrapped is not runtime chakable
+        # jax_core.stage.Wrapped is not runtime chakable
         jax_src.pjit.JitWrapped,
         jax_xe.PjitFunction,
     )
@@ -70,7 +64,7 @@ def is_jax_array(
 ) -> TypeGuard[jax.Array]:
     """Tests if `obj` is a jax array.
 
-    Notes jax array are special, you can not write to them directly.
+    Notes jax array are special as you can not write to them directly.
     Furthermore, they always allocate also on GPU, beside the CPU allocation.
     """
     return isinstance(obj, jax.Array)
@@ -120,8 +114,8 @@ def is_on_device(
 ) -> bool:
     """Tests if `obj` is on a device.
 
-    Jax arrays are always on the CPU and GPU (if there is one).
-    Thus for Jax arrays this function is more of a test, if there is a GPU or not.
+    Jax arrays are always on the CPU and GPU (if there is one). Thus for Jax arrays this
+    function is more of a test, if there is a GPU or not.
     """
     if is_jax_array(obj):
         try:
@@ -135,11 +129,11 @@ def is_on_device(
 def is_fully_addressable(
     obj: Any,
 ) -> bool:
-    """Tests if `obj` is fully addreassable, i.e. is only on this host.
+    """Tests if `obj` is fully addressable, i.e. is only on this host.
 
     Notes:
-        The function (currently) assumes that everything that is not a distributed
-            Jax array is on this host.
+        This function currently assumes that everything that is not a Jax array is always fully
+        addressable.
     """
     if is_jax_array(obj):
         return obj.is_fully_addressable
diff --git a/src/jace/util/util.py b/src/jace/util/util.py
index 7e02c28..d593c70 100644
--- a/src/jace/util/util.py
+++ b/src/jace/util/util.py
@@ -11,15 +11,15 @@
 from typing import Final
 
 
-# Valid name for an SDFG variable.
+#: Valid name for an SDFG variable.
 VALID_SDFG_VAR_NAME: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")
 
-# Valid name for an SDFG itself, includes `SDFGState` objects.
+#: Valid name for an SDFG itself, includes `SDFGState` objects.
 VALID_SDFG_OBJ_NAME: re.Pattern = re.compile("[a-zA-Z_][a-zA-Z0-9_]*")
 
 
 # fmt: off
-# This is a set of all names that are invalid SDFG names.
+#: This is a set of all names that are invalid SDFG names.
 FORBIDDEN_SDFG_VAR_NAMES: Final[set[str]] = {
     # These should be most of the C++ keywords, it is more important to have the short ones.
     #  Taken from 'https://learn.microsoft.com/en-us/cpp/cpp/keywords-cpp?view=msvc-170'

From 2190fafadb1ed343aa708eb30b25623e3d779f82 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 28 May 2024 10:37:12 +0200
Subject: [PATCH 253/458] Moved the description of the constructor arguments
 from `__init__` to the class description.

---
 src/jace/jax/stages.py                        | 37 +++++++++++--------
 src/jace/jax/translation_cache.py             | 13 ++++---
 .../translator/jaxpr_translator_driver.py     | 16 ++++----
 src/jace/translator/translated_jaxpr_sdfg.py  |  3 ++
 src/jace/util/jax_helper.py                   |  5 +++
 5 files changed, 44 insertions(+), 30 deletions(-)

diff --git a/src/jace/jax/stages.py b/src/jace/jax/stages.py
index 5fc9de4..ac8e282 100644
--- a/src/jace/jax/stages.py
+++ b/src/jace/jax/stages.py
@@ -49,6 +49,11 @@ class JaceWrapped(tcache.CachingStage["JaceLowered"]):
     lowered later, with the same argument the result is taken from the cache.
     Furthermore, a `JaceWrapped` object is composable with all Jax transformations.
 
+    Args:
+        fun:                    The function that is wrapped.
+        primitive_translators:  The list of subtranslators that that should be used.
+        jit_options:            Options to influence the jit process.
+
     Todo:
         - Handle pytrees.
         - Handle all options to `jax.jit`.
@@ -68,13 +73,6 @@ def __init__(
         primitive_translators: Mapping[str, translator.PrimitiveTranslator],
         jit_options: Mapping[str, Any],
     ) -> None:
-        """Creates a wrapped jitable object of `fun`.
-
-        Args:
-            fun:                    The function that is wrapped.
-            primitive_translators:  The list of subtranslators that that should be used.
-            jit_options:            Options to influence the jit process.
-        """
         super().__init__()
         # We have to shallow copy both the translator and the jit options.
         #  This prevents that any modifications affect `self`.
@@ -159,6 +157,12 @@ class JaceLowered(tcache.CachingStage["JaceCompiled"]):
     Although, `JaceWrapped` is composable with Jax transformations `JaceLowered` is not.
     A user should never create such an object, instead `JaceWrapped.lower()` should be used.
 
+    Args:
+        tsdfg:  The lowered SDFG with metadata. Must be finalized.
+
+    Note:
+        `self` will manage the passed `tsdfg` object. Modifying it results in undefined behavior.
+
     Todo:
         - Handle pytrees.
     """
@@ -169,14 +173,6 @@ def __init__(
         self,
         tsdfg: translator.TranslatedJaxprSDFG,
     ) -> None:
-        """Initialize the lowered object.
-
-        Args:
-            tsdfg:      The lowered SDFG with metadata. Must be finalized.
-
-        Notes:
-            The passed `tsdfg` will be managed by `self`.
-        """
         if not tsdfg.is_finalized:
             raise ValueError("The translated SDFG must be finalized.")
         super().__init__()
@@ -253,6 +249,17 @@ def _make_compiler_options(
 class JaceCompiled:
     """Compiled version of the SDFG.
 
+    This is the last stage of the jit chain. A user should never create a `JaceCompiled` instance,
+    instead `JaceLowered.compile()` should be used.
+
+    Args:
+        csdfg:      The compiled SDFG object.
+        inp_names:  Names of the SDFG variables used as inputs.
+        out_names:  Names of the SDFG variables used as outputs.
+
+    Note:
+        The class assumes ownership of its input arguments.
+
     Todo:
         - Handle pytrees.
     """
diff --git a/src/jace/jax/translation_cache.py b/src/jace/jax/translation_cache.py
index 3b95594..cf2a970 100644
--- a/src/jace/jax/translation_cache.py
+++ b/src/jace/jax/translation_cache.py
@@ -57,6 +57,9 @@ class CachingStage(Generic[NextStage]):
 
     A class must implement the `_make_call_description()` to compute an abstract description
     of the call. This is needed to operate the cache to store the stage transitions.
+
+    Notes:
+        The `__init__()` function must explicitly be called to fully setup `self`.
     """
 
     _cache: StageCache[NextStage]
@@ -197,7 +200,7 @@ class StageTransformationDescription:
     The cache will call the `CachingStage._make_call_description()` function to get a key.
     The actual key is consists of two parts, `stage_id` and `call_args`.
 
-    Attributes:
+    Args:
         stage_id:   Origin of the call, for which the id of the stage object should be used.
         call_args:  Description of the arguments of the call. There are two ways to describe
             the arguments:
@@ -221,6 +224,9 @@ class StageTransformationDescription:
 class StageCache(Generic[StageType]):
     """Simple LRU cache to cache the results of the stage transition function.
 
+    Args:
+        size:   The size of the cache, defaults to 256.
+
     Notes:
         The most recently used entry is at the end of the `OrderedDict`.
     """
@@ -232,11 +238,6 @@ def __init__(
         self,
         size: int = 256,
     ) -> None:
-        """Creates a LRU cache with `size` many entries.
-
-        Args:
-            size:   Number of entries the cache holds, defaults to 256.
-        """
         self._memory = collections.OrderedDict()
         self._size = size
 
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index b801214..f66407d 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -54,10 +54,17 @@ class JaxprTranslationDriver:
     will then translate the supplied (nested) Jaxpr and return the result. However, this will have
     no influence on the translation process that is already going.
 
+    Args:
+        primitive_translators:    Primitive to use during the translation.
+
     Notes:
+        The `primitive_translators` that is passed at construction is not copied. The user has
+        to ensure that it does not change.
         After the main translation has been performed the translator object can be used again.
         Currently the driver will generate only Array as SDFG variables, however, this is a
         temporary solution, see `add_array()`.
+
+
     """
 
     __slots__ = ("_ctx_stack", "_primitive_translators", "_jax_name_map")
@@ -70,15 +77,6 @@ def __init__(
         self,
         primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable],
     ) -> None:
-        """Creates the driver ready for translation.
-
-        Args:
-            primitive_translators:    Primitive to use during the translation.
-
-        Note:
-            The primitive translators are not copied, thus the user has to ensure that the
-            passed mapping does not change during the translation.
-        """
         # Maps name of primitives to the associated translator.
         self._primitive_translators = primitive_translators
 
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 3196b27..e47d11f 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -39,6 +39,9 @@ class TranslatedJaxprSDFG:
         start_state:    The first state in the SDFG state machine.
         terminal_state: The (currently) last state in the state machine.
         is_finalized:   Indicates if `self` represents a finalized or canonical SDFG.
+
+    Args:
+        name:   The name that should be given to the SDFG, optional.
     """
 
     sdfg: dace.SDFG
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 1a8ae12..bed727e 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -34,6 +34,11 @@ class is as an internal representation of values, as they are used in Jax, but w
     instance and a shape. In addition it has an optional name, which allows to create variables
     with a certain name using `JaxprTranslationDriver.add_array()`.
 
+    Args:
+        shape:      The shape of the variable.
+        dtype:      The dace datatype of the variable.
+        name:       Name the variable should have, optional.
+
     Note:
         If the name of a `JaCeVar` is '_' it is considered a drop variable.
         The definitions of `__hash__` and `__eq__` are in accordance with how Jax variable works.

From 5d6962a7ede31830dd05626080a53064037af1f2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 28 May 2024 12:42:08 +0200
Subject: [PATCH 254/458] Moved the `jax` package.

---
 src/jace/__init__.py                        |  6 +---
 src/jace/{jax => }/api.py                   |  3 +-
 src/jace/jax/__init__.py                    | 34 ---------------------
 src/jace/{jax => }/stages.py                | 11 +++----
 src/jace/util/traits.py                     |  6 ++--
 src/jace/{jax => util}/translation_cache.py | 26 ++++++++--------
 tests/test_caching.py                       |  5 ++-
 tests/test_decorator.py                     |  2 +-
 8 files changed, 26 insertions(+), 67 deletions(-)
 rename src/jace/{jax => }/api.py (97%)
 delete mode 100644 src/jace/jax/__init__.py
 rename src/jace/{jax => }/stages.py (96%)
 rename src/jace/{jax => util}/translation_cache.py (92%)

diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 05d9632..7fed965 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -9,12 +9,10 @@
 
 from __future__ import annotations
 
-import jax as _jax
-
 import jace.translator.primitive_translators as _  # noqa: F401  # Populate the internal registry.
 
 from .__about__ import __author__, __copyright__, __license__, __version__, __version_info__
-from .jax import grad, jacfwd, jacrev, jit
+from .api import grad, jacfwd, jacrev, jit
 
 
 __all__ = [
@@ -28,5 +26,3 @@
     "__version__",
     "__version_info__",
 ]
-
-del _jax
diff --git a/src/jace/jax/api.py b/src/jace/api.py
similarity index 97%
rename from src/jace/jax/api.py
rename to src/jace/api.py
index bbbfe6a..f1600c8 100644
--- a/src/jace/jax/api.py
+++ b/src/jace/api.py
@@ -15,8 +15,7 @@
 
 from jax import grad, jacfwd, jacrev
 
-from jace import translator
-from jace.jax import stages
+from jace import stages, translator
 
 
 __all__ = [
diff --git a/src/jace/jax/__init__.py b/src/jace/jax/__init__.py
deleted file mode 100644
index f4df884..0000000
--- a/src/jace/jax/__init__.py
+++ /dev/null
@@ -1,34 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""This package mimics the `jax` functions and features supported by JaCe."""
-
-from __future__ import annotations
-
-from .api import grad, jacfwd, jacrev, jit
-from .stages import (
-    CompilerOptions,
-    JaceCompiled,
-    JaceLowered,
-    JaceWrapped,
-)
-
-
-__all__ = [
-    "Compiled",
-    "CompilerOptions",
-    "JaceWrapped",
-    "JaceLowered",
-    "JaceCompiled",
-    "Lowered",
-    "Wrapped",
-    "api_helper",
-    "jit",
-    "jacfwd",
-    "jacrev",
-    "grad",
-]
diff --git a/src/jace/jax/stages.py b/src/jace/stages.py
similarity index 96%
rename from src/jace/jax/stages.py
rename to src/jace/stages.py
index ac8e282..52a44fc 100644
--- a/src/jace/jax/stages.py
+++ b/src/jace/stages.py
@@ -32,10 +32,9 @@
 import jax as _jax
 
 from jace import optimization, translator, util
-from jace.jax import translation_cache as tcache
 from jace.optimization import CompilerOptions
 from jace.translator import post_translation as ptrans
-from jace.util import dace_helper
+from jace.util import dace_helper, translation_cache as tcache
 
 
 class JaceWrapped(tcache.CachingStage["JaceLowered"]):
@@ -139,14 +138,14 @@ def wrapped_fun(self) -> Callable:
     def _make_call_description(
         self,
         *args: Any,
-    ) -> tcache.StageTransformationDescription:
+    ) -> tcache.StageTransformationSpec:
         """This function computes the key for the `JaceWrapped.lower()` call to cache it.
 
         The function will compute a full abstract description on its argument. Currently it is
         only able to handle positional argument and does not support static arguments.
         """
         call_args = tuple(tcache._AbstractCallArgument.from_value(x) for x in args)
-        return tcache.StageTransformationDescription(stage_id=id(self), call_args=call_args)
+        return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
 
 
 class JaceLowered(tcache.CachingStage["JaceCompiled"]):
@@ -228,7 +227,7 @@ def as_sdfg(self) -> dace.SDFG:
     def _make_call_description(
         self,
         compiler_options: CompilerOptions | None = None,
-    ) -> tcache.StageTransformationDescription:
+    ) -> tcache.StageTransformationSpec:
         """This function computes the key for the `self.compile()` call to cache it.
 
         The key that is computed by this function is based on the concrete values of the passed
@@ -237,7 +236,7 @@ def _make_call_description(
         """
         options = self._make_compiler_options(compiler_options)
         call_args = tuple(sorted(options.items(), key=lambda X: X[0]))
-        return tcache.StageTransformationDescription(stage_id=id(self), call_args=call_args)
+        return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
 
     def _make_compiler_options(
         self,
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 8e063cc..0355dac 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -17,18 +17,18 @@
 from jax import _src as jax_src, core as jax_core
 from jaxlib import xla_extension as jax_xe
 
-import jace.jax as jjax
 import jace.util as util
+from jace import stages
 
 
-def is_jaceified(obj: Any) -> TypeGuard[jjax.JaceWrapped]:
+def is_jaceified(obj: Any) -> TypeGuard[stages.JaceWrapped]:
     """Tests if `obj` is decorated by JaCe.
 
     Similar to `is_jaxified`, but for JaCe object.
     """
     if util.is_jaxified(obj):
         return False
-    return isinstance(obj, jjax.JaceWrapped)
+    return isinstance(obj, stages.JaceWrapped)
 
 
 def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVarp]:
diff --git a/src/jace/jax/translation_cache.py b/src/jace/util/translation_cache.py
similarity index 92%
rename from src/jace/jax/translation_cache.py
rename to src/jace/util/translation_cache.py
index cf2a970..3bf47c5 100644
--- a/src/jace/jax/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -36,7 +36,7 @@
 
 
 if TYPE_CHECKING:
-    from jace.jax import stages
+    from jace import stages
 
 #: Caches used to store the state transition.
 #: The caches are on a per stage and not per instant basis.
@@ -72,7 +72,7 @@ def _make_call_description(
         self: CachingStage,
         *args: Any,
         **kwargs: Any,
-    ) -> StageTransformationDescription:
+    ) -> StageTransformationSpec:
         """Generates the key that is used to store/locate the call in the cache."""
         ...
 
@@ -96,10 +96,10 @@ def transition_wrapper(  # type: ignore [no-untyped-def]  # return type is deduc
         *args: Any,
         **kwargs: Any,
     ):
-        key: StageTransformationDescription = self._make_call_description(*args, **kwargs)
+        key: StageTransformationSpec = self._make_call_description(*args, **kwargs)
         if key in self._cache:
             return self._cache[key]
-        next_stage: stages.Stage = transition(self, *args, **kwargs)
+        next_stage = transition(self, *args, **kwargs)
         self._cache[key] = next_stage
         return next_stage
 
@@ -125,7 +125,7 @@ def get_cache(
 class _AbstractCallArgument:
     """Class to represent a single argument to the transition function in an abstract way.
 
-    As noted in `StageTransformationDescription` there are two ways to describe an argument,
+    As noted in `StageTransformationSpec` there are two ways to describe an argument,
     either using its concrete value or an abstract description, which is similar to tracers in Jax.
     This class represents the second way.
     To create an instance you should use `_AbstractCallArgument.from_value()`.
@@ -185,14 +185,14 @@ def from_value(
 
 #: This type is the abstract description of a function call.
 #:  It is part of the key used in the cache.
-CallArgsDescription: TypeAlias = tuple[
+CallArgsSpec: TypeAlias = tuple[
     _AbstractCallArgument | Hashable | tuple[str, _AbstractCallArgument | Hashable],
     ...,
 ]
 
 
 @dataclasses.dataclass(frozen=True)
-class StageTransformationDescription:
+class StageTransformationSpec:
     """Represents the entire call to a state transformation function of a stage.
 
     State transition functions are annotated with `@cached_transition` and their result may be
@@ -214,7 +214,7 @@ class StageTransformationDescription:
     """
 
     stage_id: int
-    call_args: CallArgsDescription
+    call_args: CallArgsSpec
 
 
 # Denotes the stage that is stored inside the cache.
@@ -231,7 +231,7 @@ class StageCache(Generic[StageType]):
         The most recently used entry is at the end of the `OrderedDict`.
     """
 
-    _memory: collections.OrderedDict[StageTransformationDescription, StageType]
+    _memory: collections.OrderedDict[StageTransformationSpec, StageType]
     _size: int
 
     def __init__(
@@ -243,13 +243,13 @@ def __init__(
 
     def __contains__(
         self,
-        key: StageTransformationDescription,
+        key: StageTransformationSpec,
     ) -> bool:
         return key in self._memory
 
     def __getitem__(
         self,
-        key: StageTransformationDescription,
+        key: StageTransformationSpec,
     ) -> StageType:
         if key not in self:
             raise KeyError(f"Key '{key}' is unknown.")
@@ -258,7 +258,7 @@ def __getitem__(
 
     def __setitem__(
         self,
-        key: StageTransformationDescription,
+        key: StageTransformationSpec,
         res: StageType,
     ) -> None:
         if key in self:
@@ -271,7 +271,7 @@ def __setitem__(
 
     def popitem(
         self,
-        key: StageTransformationDescription | None,
+        key: StageTransformationSpec | None,
     ) -> None:
         """Evict `key` from `self`.
 
diff --git a/tests/test_caching.py b/tests/test_caching.py
index 851ebdc..9a624a2 100644
--- a/tests/test_caching.py
+++ b/tests/test_caching.py
@@ -17,8 +17,7 @@
 import pytest
 
 import jace
-from jace import optimization
-from jace.jax import stages
+from jace import optimization, stages
 
 
 @pytest.fixture(autouse=True)
@@ -30,7 +29,7 @@ def _clear_translation_cache():
     Todo:
         Ask Enrique how I can make that fixture apply everywhere not just in the file but the whole test suite.
     """
-    from jace.jax import translation_cache as tcache
+    from jace.util import translation_cache as tcache
 
     tcache.clear_translation_cache()
     yield
diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index 7877b07..812ba60 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -27,7 +27,7 @@ def _clear_translation_cache():
     Todo:
         Should be used _everywhere_.
     """
-    from jace.jax import translation_cache as tcache
+    from jace.util import translation_cache as tcache
 
     tcache.clear_translation_cache()
     yield

From 6c980a9e750a37630267c1774b2f999d4a87c446 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 28 May 2024 13:02:05 +0200
Subject: [PATCH 255/458] Fixed the type annotation.

---
 src/jace/util/translation_cache.py | 22 +++++++++++++---------
 1 file changed, 13 insertions(+), 9 deletions(-)

diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 3bf47c5..bc4f0bf 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -23,7 +23,9 @@
 from typing import (
     TYPE_CHECKING,
     Any,
+    Concatenate,
     Generic,
+    ParamSpec,
     TypeAlias,
     TypeVar,
     cast,
@@ -77,13 +79,15 @@ def _make_call_description(
         ...
 
 
-# Type of the transition function.
-TransitionFunction = TypeVar("TransitionFunction", bound=Callable[..., Any])
+# Type annotation of the caching Stuff.
+P = ParamSpec("P")
+TransitionFunction = Callable[Concatenate[CachingStage[NextStage], P], NextStage]
+CachingStageType = TypeVar("CachingStageType", bound=CachingStage)
 
 
 def cached_transition(
-    transition: TransitionFunction,
-) -> TransitionFunction:
+    transition: Callable[Concatenate[CachingStageType, P], NextStage],
+) -> Callable[Concatenate[CachingStage[NextStage], P], NextStage]:
     """Decorator for making the transition function of the stage cacheable.
 
     In order to work, the stage must be derived from `CachingStage`. For computing the key of a
@@ -91,11 +95,11 @@ def cached_transition(
     """
 
     @functools.wraps(transition)
-    def transition_wrapper(  # type: ignore [no-untyped-def]  # return type is deduced from `TransitionFunction`
-        self: CachingStage,
-        *args: Any,
-        **kwargs: Any,
-    ):
+    def transition_wrapper(
+        self: CachingStageType,
+        *args: P.args,
+        **kwargs: P.kwargs,
+    ) -> NextStage:
         key: StageTransformationSpec = self._make_call_description(*args, **kwargs)
         if key in self._cache:
             return self._cache[key]

From 6dd65f3e0442a90dcf14c786f0b5223d4f3871be Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 28 May 2024 13:12:03 +0200
Subject: [PATCH 256/458] Added a todo.

---
 src/jace/stages.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index 52a44fc..020eebc 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -110,9 +110,9 @@ def lower(
         if len(kwargs) != 0:
             raise NotImplementedError("Currently only positional arguments are supported.")
 
-        # Currently the SDFG that we build only supports `C_CONTIGUOUS` memory order.
-        #  Since we support the paradigm that "everything passed to `lower` should also be
-        #  accepted as argument to call the result", we forbid other memory orders here.
+        # TODO(phimuell): Currently the SDFG that we build only supports `C_CONTIGUOUS` memory
+        #  order. Since we support the paradigm that "everything passed to `lower` should also
+        #  be accepted as argument to call the result", we forbid other memory orders here.
         if not all((not util.is_array(arg)) or arg.flags["C_CONTIGUOUS"] for arg in args):
             raise NotImplementedError("Currently can not handle strides beside 'C_CONTIGUOUS'.")
 

From f7fe13d38a69fa5d7b31e261a8c69d1efed996e2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 28 May 2024 14:17:19 +0200
Subject: [PATCH 257/458] Found something interesting in DaCe, but it does not
 fully match the Jax stuff about the primitives.

---
 src/jace/translator/primitive_translators/alu_translators.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index bb70572..43d7a00 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -57,6 +57,8 @@ def write_tasklet_code(
 
 
 # Contains all the templates for ALU operations.
+#  TODO(phimuell): Import them also from `frontend/python/replacements.py`, however, the names
+#   do not fully matches the Jax names, `grep -P '^[a-zA-Z0-9_]+_p[[:space:]]+' -r -o -h | sort -u`
 # fmt: off
 _ALU_OPS_TMPL: Final[dict[str, str]] = {
     # Unary operations

From 7b7b7eff1668904a781e6d3fb49275a2f64db6c8 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 28 May 2024 15:56:54 +0200
Subject: [PATCH 258/458] WIP: Dynamic slicing, it seems to work, but it is not
 nice.

---
 .../primitive_translators/slicing.py          | 92 ++++++++++++++++++-
 tests/test_sub_translators_slicing.py         | 22 +++++
 2 files changed, 112 insertions(+), 2 deletions(-)

diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index 2f4405e..dcf2c07 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -9,13 +9,14 @@
 
 from __future__ import annotations
 
-from collections.abc import Sequence
+import itertools
+from collections.abc import MutableSequence, Sequence
 
 import dace
 from jax import core as jax_core
 from typing_extensions import override
 
-from jace import translator
+from jace import translator, util
 from jace.translator import mapped_operation_base_translator as mapped_base
 
 
@@ -63,4 +64,91 @@ def make_input_memlets(
         }
 
 
+class DynamicSlicingTranslator(translator.PrimitiveTranslator):
+    """Implements the dynamic slicing translator.
+
+    The [dynamic slicing](https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.dynamic_slice.html)
+    performs a slicing of a _fixed_ window, however, the starting indexes are not fix, but are
+    variables that can come from the outside.
+    For this it uses symbols that, but since it uses the "Dynamic Map Ranges" no additional state
+    is needed.
+
+    Unlike the normal slicing primitive, it is not derived from `MappedOperationTranslatorBase`.
+    """
+
+    __slots__ = ()
+
+    @property
+    def primitive(self) -> str:
+        return "dynamic_slice"
+
+    @override
+    def __call__(
+        self,
+        driver: translator.JaxprTranslationDriver,
+        in_var_names: Sequence[str | None],
+        out_var_names: MutableSequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        assert in_var_names[0]
+        assert len(in_var_names) == len(eqn.invars[0].aval.shape) + 1
+
+        # First input to the primitive is the array we slice from, the others are
+
+        in_var_name: str = in_var_names[0]
+        start_indices: Sequence[str | None] = in_var_names[1:]
+
+        tskl_ranges: list[tuple[str, str]] = [
+            (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
+        ]
+        tskl_output: dict[str, dace.Memlet] = {
+            "__out": dace.Memlet.simple(
+                out_var_names[0],
+                ", ".join(name for name, _ in tskl_ranges),
+            )
+        }
+
+        # Maps the symbol that is used inside the Memlet as offset to the variable where it came from.
+        dynamic_map_ranges: dict[str, str] = {}
+        mem_accesses: list[str] = []
+
+        for i, (it_var, _), start_idx in zip(itertools.count(), tskl_ranges, start_indices):
+            if start_idx is None:  # The index is a literal
+                mem_access = f"{it_var} + {util.get_jax_literal_value(eqn.invars[i + 1])}"
+            else:
+                symb_name = f"__jace_dynamic_map_range_{start_idx}"
+                mem_access = f"{it_var} + {symb_name}"
+                dynamic_map_ranges[symb_name] = start_idx
+            mem_accesses.append(mem_access)
+
+        tskl_input: dict[str, dace.Memlet] = {
+            "__in": dace.Memlet.simple(in_var_name, ", ".join(mem_accesses))
+        }
+
+        # Now generating the mapped Tasklet.
+        tskl_name = f"{self.primitive}_{out_var_names[0]}"
+
+        _, map_entry, _ = eqn_state.add_mapped_tasklet(
+            name=tskl_name,
+            map_ranges=tskl_ranges,
+            inputs=tskl_input,
+            code="__out = __in",
+            outputs=tskl_output,
+            external_edges=True,
+        )
+
+        # Now we add the dynamic map indexes.
+        for symb_name, start_idx_name in dynamic_map_ranges.items():
+            eqn_state.add_edge(
+                eqn_state.add_read(start_idx_name),
+                None,
+                map_entry,
+                symb_name,
+                dace.Memlet.simple(start_idx_name, "0"),  # It is always a scalar
+            )
+            map_entry.add_in_connector(symb_name)
+
+
 translator.register_primitive_translator(SlicingTranslator())
+translator.register_primitive_translator(DynamicSlicingTranslator())
diff --git a/tests/test_sub_translators_slicing.py b/tests/test_sub_translators_slicing.py
index 3317da6..357c118 100644
--- a/tests/test_sub_translators_slicing.py
+++ b/tests/test_sub_translators_slicing.py
@@ -9,12 +9,20 @@
 
 from __future__ import annotations
 
+import jax
 import numpy as np
 import pytest
 
 import jace
 
 
+@pytest.fixture(autouse=True)
+def _enable_x64_mode_in_jax():
+    """Ensures that x64 mode in Jax ins enabled."""
+    with jax.experimental.enable_x64():
+        yield
+
+
 @pytest.fixture()
 def A_4x4():
     return np.arange(16).reshape((4, 4))
@@ -134,3 +142,17 @@ def testee(A: np.ndarray) -> np.ndarray:
 
     assert ref.shape == res.shape
     assert np.all(ref == res)
+
+
+def test_dynamic_slice(A_4x4):
+    def testee(A: np.ndarray, s1: int, s2: int) -> np.ndarray:
+        return jax.lax.dynamic_slice(A, (s1, s2), (2, 2))
+
+    ref = testee(A_4x4, 1, 1)
+
+    with pytest.warns(
+        expected_warning=UserWarning,
+    ):
+        res = jace.jit(testee)(A_4x4, 1, 1)
+
+    assert np.all(ref == res)

From 28c77cac11c385c8e2013d6d46cb66aad21e5a80 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 29 May 2024 08:12:39 +0200
Subject: [PATCH 259/458] Tidied up the dynamic slicing, however, it is not yet
 fully compatible.

Jax adjust the start indexes if the window overruns, however, this is not done, instead an out of bound error happens.
---
 .../primitive_translators/slicing.py          | 64 +++++++++---------
 tests/test_sub_translators_slicing.py         | 65 +++++++++++++++++--
 2 files changed, 94 insertions(+), 35 deletions(-)

diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index dcf2c07..7ee28b8 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -9,7 +9,6 @@
 
 from __future__ import annotations
 
-import itertools
 from collections.abc import MutableSequence, Sequence
 
 import dace
@@ -74,6 +73,16 @@ class DynamicSlicingTranslator(translator.PrimitiveTranslator):
     is needed.
 
     Unlike the normal slicing primitive, it is not derived from `MappedOperationTranslatorBase`.
+
+    Note:
+        Jax will adjust the start indexes if the window overrun, however, Jace will not do that.
+        Instead, Jace will consider this as undefined behaviour.
+
+    Todo:
+        Fix the divergence with Jax, for this pre process the start indexes by the following
+        formula $min(s + w, N) - w$, where $s$ is the start index, $w$ the window size and
+        $N$ the length in a particular dimension, for this we need Tasklets, if we want to
+        preserve merge ability.
     """
 
     __slots__ = ()
@@ -94,58 +103,53 @@ def __call__(
         assert in_var_names[0]
         assert len(in_var_names) == len(eqn.invars[0].aval.shape) + 1
 
-        # First input to the primitive is the array we slice from, the others are
-
+        # The first input to the primitive is the array we slice from, the others are the start
+        #  indices of the slice window, each is a scalar, maybe literals
         in_var_name: str = in_var_names[0]
         start_indices: Sequence[str | None] = in_var_names[1:]
 
         tskl_ranges: list[tuple[str, str]] = [
             (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
         ]
-        tskl_output: dict[str, dace.Memlet] = {
-            "__out": dace.Memlet.simple(
-                out_var_names[0],
-                ", ".join(name for name, _ in tskl_ranges),
-            )
-        }
 
-        # Maps the symbol that is used inside the Memlet as offset to the variable where it came from.
+        # We use dynamic map ranges, thus the map entry has entries, not with the typical `IN_*`
+        #  name and the connector name defines a symbol within the map scope. This `dict` maps
+        #  the symbol name to the name of the input variable, that defines the symbol. If the
+        #  input is a literal, than it has no correspondence and the constant is substituted.
         dynamic_map_ranges: dict[str, str] = {}
-        mem_accesses: list[str] = []
+        memlet_accesses: list[str] = []
 
-        for i, (it_var, _), start_idx in zip(itertools.count(), tskl_ranges, start_indices):
-            if start_idx is None:  # The index is a literal
-                mem_access = f"{it_var} + {util.get_jax_literal_value(eqn.invars[i + 1])}"
+        for i, ((it_var, _), start_idx) in enumerate(zip(tskl_ranges, start_indices)):
+            if start_idx is None:
+                offset = str(util.get_jax_literal_value(eqn.invars[i + 1]))
             else:
-                symb_name = f"__jace_dynamic_map_range_{start_idx}"
-                mem_access = f"{it_var} + {symb_name}"
-                dynamic_map_ranges[symb_name] = start_idx
-            mem_accesses.append(mem_access)
-
-        tskl_input: dict[str, dace.Memlet] = {
-            "__in": dace.Memlet.simple(in_var_name, ", ".join(mem_accesses))
-        }
-
-        # Now generating the mapped Tasklet.
-        tskl_name = f"{self.primitive}_{out_var_names[0]}"
+                offset = f"__jace_dynamic_map_range_{out_var_names[0]}_{start_idx}"
+                dynamic_map_ranges[offset] = start_idx
+            memlet_accesses.append(f"{it_var} + {offset}")
+
+        tskl_input = dace.Memlet.simple(in_var_name, ", ".join(memlet_accesses))
+        tskl_output = dace.Memlet.simple(
+            out_var_names[0],
+            ", ".join(name for name, _ in tskl_ranges),
+        )
 
         _, map_entry, _ = eqn_state.add_mapped_tasklet(
-            name=tskl_name,
+            name=f"{self.primitive}_{out_var_names[0]}",
             map_ranges=tskl_ranges,
-            inputs=tskl_input,
+            inputs={"__in": tskl_input},
             code="__out = __in",
-            outputs=tskl_output,
+            outputs={"__out": tskl_output},
             external_edges=True,
         )
 
-        # Now we add the dynamic map indexes.
+        # Creating the inputs for the dynamic map ranges.
         for symb_name, start_idx_name in dynamic_map_ranges.items():
             eqn_state.add_edge(
                 eqn_state.add_read(start_idx_name),
                 None,
                 map_entry,
                 symb_name,
-                dace.Memlet.simple(start_idx_name, "0"),  # It is always a scalar
+                dace.Memlet.simple(start_idx_name, "0"),
             )
             map_entry.add_in_connector(symb_name)
 
diff --git a/tests/test_sub_translators_slicing.py b/tests/test_sub_translators_slicing.py
index 357c118..69fd9ab 100644
--- a/tests/test_sub_translators_slicing.py
+++ b/tests/test_sub_translators_slicing.py
@@ -28,6 +28,31 @@ def A_4x4():
     return np.arange(16).reshape((4, 4))
 
 
+@pytest.fixture()
+def A_4x4x4x4():
+    return np.arange(4**4).reshape((4, 4, 4, 4))
+
+
+@pytest.fixture(
+    params=[
+        (1, 2, 1, 2),
+        (0, 0, 0, 0),
+        pytest.param(
+            (3, 3, 3, 3), marks=pytest.mark.skip("Overrun dynamic windows are not supported.")
+        ),
+    ]
+)
+def full_dynamic_start_idx(request):
+    """Start indexes for the slice window of `test_dynamic_slice_full_dynamic()`.
+
+    Note:
+        The `(3, 3, 3, 3)` is clearly out of bound for the `A_4x4x4x4` case, however, Jax
+        explicitly allows [this](https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.dynamic_slice.html).
+        However, it is not supported in Jace.
+    """
+    return request.param
+
+
 def test_slice_sub_view(A_4x4):
     """Simple extraction of a subsize."""
 
@@ -144,15 +169,45 @@ def testee(A: np.ndarray) -> np.ndarray:
     assert np.all(ref == res)
 
 
-def test_dynamic_slice(A_4x4):
-    def testee(A: np.ndarray, s1: int, s2: int) -> np.ndarray:
-        return jax.lax.dynamic_slice(A, (s1, s2), (2, 2))
+def test_dynamic_slice_full_dynamic(A_4x4x4x4, full_dynamic_start_idx):
+    """Dynamic slicing where all start index are input parameters."""
+
+    def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> np.ndarray:
+        return jax.lax.dynamic_slice(A, (s1, s2, s3, s4), (2, 2, 2, 2))
+
+    # TODO(phimuell): Get rid of this warning, or allow it to disable.
+    with pytest.warns(
+        expected_warning=UserWarning,
+    ):
+        res = jace.jit(testee)(A_4x4x4x4, *full_dynamic_start_idx)
+    ref = testee(A_4x4x4x4, *full_dynamic_start_idx)
 
-    ref = testee(A_4x4, 1, 1)
+    assert np.all(ref == res)
+
+
+def test_dynamic_slice_partially_dynamic(A_4x4x4x4):
+    """Dynamic slicing where some start index are input parameters and others are literals."""
 
+    def testee(A: np.ndarray, s1: int, s2: int) -> np.ndarray:
+        return jax.lax.dynamic_slice(A, (s1, 1, s2, 2), (2, 2, 2, 2))
+
+    # TODO(phimuell): Get rid of this warning, or allow it to disable.
     with pytest.warns(
         expected_warning=UserWarning,
     ):
-        res = jace.jit(testee)(A_4x4, 1, 1)
+        res = jace.jit(testee)(A_4x4x4x4, 1, 2)
+    ref = testee(A_4x4x4x4, 1, 2)
+
+    assert np.all(ref == res)
+
+
+def test_dynamic_slice_full_literal(A_4x4x4x4):
+    """Dynamic slicing where all start indexes are literals."""
+
+    def testee(A: np.ndarray) -> np.ndarray:
+        return jax.lax.dynamic_slice(A, (0, 1, 0, 2), (2, 2, 2, 2))
+
+    res = jace.jit(testee)(A_4x4x4x4)
+    ref = testee(A_4x4x4x4)
 
     assert np.all(ref == res)

From 054bb22c245846cd74fe9a0a4ccdc2c868619159 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 29 May 2024 11:11:06 +0200
Subject: [PATCH 260/458] Dynamic slice now also supports the shifting of
 windows.

During that work I also detected some [issue](https://github.com/spcl/dace/issues/1579) in DaCe's simplification pipeline.
---
 .../primitive_translators/slicing.py          | 93 ++++++++++++++-----
 tests/test_sub_translators_slicing.py         | 13 +--
 2 files changed, 73 insertions(+), 33 deletions(-)

diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index 7ee28b8..babfa08 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -73,16 +73,6 @@ class DynamicSlicingTranslator(translator.PrimitiveTranslator):
     is needed.
 
     Unlike the normal slicing primitive, it is not derived from `MappedOperationTranslatorBase`.
-
-    Note:
-        Jax will adjust the start indexes if the window overrun, however, Jace will not do that.
-        Instead, Jace will consider this as undefined behaviour.
-
-    Todo:
-        Fix the divergence with Jax, for this pre process the start indexes by the following
-        formula $min(s + w, N) - w$, where $s$ is the start index, $w$ the window size and
-        $N$ the length in a particular dimension, for this we need Tasklets, if we want to
-        preserve merge ability.
     """
 
     __slots__ = ()
@@ -103,28 +93,85 @@ def __call__(
         assert in_var_names[0]
         assert len(in_var_names) == len(eqn.invars[0].aval.shape) + 1
 
+        # This is the sizes of the slice window.
+        window_sizes: Sequence[int] = eqn.params["slice_sizes"]
+
         # The first input to the primitive is the array we slice from, the others are the start
-        #  indices of the slice window, each is a scalar, maybe literals
+        #  indices of the slice window, each is a scalar, maybe literals, we might adapt them later.
         in_var_name: str = in_var_names[0]
-        start_indices: Sequence[str | None] = in_var_names[1:]
+        start_indices: list[str | None] = list(in_var_names[1:])
+
+        # For storing the adapted start index, we have to create access nodes, to store them.
+        #  However, to ensure a total order of execution, once we added them as dynamic map ranges
+        #  to the map, we must use the same access nodes.
+        in_access: dict[str, dace.nodes.AccessNode] = {}
+
+        # Jax will adjust the start indexes if the window will overrun.
+        #  The adjustment is based on the formula $min(s + w, N) - w$, where $s$ is the start
+        #  index, $w$ the window size and $N$ the length in a particular dimension.
+        #  To do it we will use Tasklets, because otherwise we can not merge the state.
+        # TODO(phimuell): Make the Tasklet mapped, that they can be merged.
+        for dim, (start_index, dim_size, wsize) in enumerate(
+            zip(start_indices, eqn.invars[0].aval.shape, window_sizes)
+        ):
+            if start_index is None:
+                continue
+
+            tasklet = dace.nodes.Tasklet(
+                label=f"adjustment_of_slice_start_{start_index}_for_{out_var_names[0]}",
+                inputs={"unadjusted_start_idx": None},
+                outputs={"adjusted_start_idx": None},
+                code=f"adjusted_start_idx = min(unadjusted_start_idx + {wsize}, {dim_size}) - {wsize}",
+            )
+
+            # Intermediate value for the adjusted start index.
+            new_start_idx_var_name = driver.add_array(
+                eqn.invars[dim + 1],
+                name_prefix=f"__jace_adapted_start_idx_{start_index}",
+            )
+            new_start_idx_acc = eqn_state.add_access(new_start_idx_var_name)
+
+            # Create the connections to and from the Tasklet.
+            eqn_state.add_edge(
+                eqn_state.add_read(start_index),
+                None,
+                tasklet,
+                "unadjusted_start_idx",
+                dace.Memlet.simple(start_index, "0"),
+            )
+            eqn_state.add_edge(
+                tasklet,
+                "adjusted_start_idx",
+                new_start_idx_acc,
+                None,
+                dace.Memlet.simple(new_start_idx_var_name, "0"),
+            )
+
+            # Now store the result
+            start_indices[dim] = new_start_idx_var_name
+            in_access[new_start_idx_var_name] = new_start_idx_acc
 
         tskl_ranges: list[tuple[str, str]] = [
             (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
         ]
 
-        # We use dynamic map ranges, thus the map entry has entries, not with the typical `IN_*`
-        #  name and the connector name defines a symbol within the map scope. This `dict` maps
-        #  the symbol name to the name of the input variable, that defines the symbol. If the
-        #  input is a literal, than it has no correspondence and the constant is substituted.
+        # We use dynamic map ranges, thus the map entry has input connectors, that does not start
+        #  with `IN_*`, instead the connector name defines a symbol within the map scope. This
+        #  `dict` maps the symbol name to the name of the input variable, that defines the symbol.
+        #  If the input is a literal, than it has no correspondence and the constant is substituted.
         dynamic_map_ranges: dict[str, str] = {}
         memlet_accesses: list[str] = []
 
-        for i, ((it_var, _), start_idx) in enumerate(zip(tskl_ranges, start_indices)):
-            if start_idx is None:
+        for i, ((it_var, _), start_index) in enumerate(zip(tskl_ranges, start_indices)):
+            if start_index is None:
                 offset = str(util.get_jax_literal_value(eqn.invars[i + 1]))
             else:
-                offset = f"__jace_dynamic_map_range_{out_var_names[0]}_{start_idx}"
-                dynamic_map_ranges[offset] = start_idx
+                # Because of [issue 1579](https://github.com/spcl/dace/issues/1579) we have to use
+                #  the same name as the data container for the symbol and can not mangle it.
+                # TODO(phimuell): Activate mangling when the issue is resolved.
+                # offset = f"__jace_dynamic_map_range_{out_var_names[0]}_{start_index}" # noqa: ERA001
+                offset = start_index
+                dynamic_map_ranges[offset] = start_index
             memlet_accesses.append(f"{it_var} + {offset}")
 
         tskl_input = dace.Memlet.simple(in_var_name, ", ".join(memlet_accesses))
@@ -143,13 +190,13 @@ def __call__(
         )
 
         # Creating the inputs for the dynamic map ranges.
-        for symb_name, start_idx_name in dynamic_map_ranges.items():
+        for symb_name, start_index in dynamic_map_ranges.items():
             eqn_state.add_edge(
-                eqn_state.add_read(start_idx_name),
+                in_access[start_index],
                 None,
                 map_entry,
                 symb_name,
-                dace.Memlet.simple(start_idx_name, "0"),
+                dace.Memlet.simple(start_index, "0"),
             )
             map_entry.add_in_connector(symb_name)
 
diff --git a/tests/test_sub_translators_slicing.py b/tests/test_sub_translators_slicing.py
index 69fd9ab..a6f9e6c 100644
--- a/tests/test_sub_translators_slicing.py
+++ b/tests/test_sub_translators_slicing.py
@@ -37,19 +37,12 @@ def A_4x4x4x4():
     params=[
         (1, 2, 1, 2),
         (0, 0, 0, 0),
-        pytest.param(
-            (3, 3, 3, 3), marks=pytest.mark.skip("Overrun dynamic windows are not supported.")
-        ),
+        (3, 3, 3, 3),  # Will lead to readjustment.
+        (3, 1, 3, 0),  # Will lead to readjustment.
     ]
 )
 def full_dynamic_start_idx(request):
-    """Start indexes for the slice window of `test_dynamic_slice_full_dynamic()`.
-
-    Note:
-        The `(3, 3, 3, 3)` is clearly out of bound for the `A_4x4x4x4` case, however, Jax
-        explicitly allows [this](https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.dynamic_slice.html).
-        However, it is not supported in Jace.
-    """
+    """Start indexes for the slice window of `test_dynamic_slice_full_dynamic()`."""
     return request.param
 
 
From c7e8b9feec0e7fe6ddffa42bab11b6147b1c42cd Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 29 May 2024 11:56:56 +0200
Subject: [PATCH 261/458] Some cleaning.

---
 .../mapped_operation_base_translator.py       | 50 +++++++++++--------
 src/jace/translator/primitive_translator.py   |  3 +-
 .../convert_element_type_translator.py        | 14 +++---
 .../primitive_translators/copy_translator.py  | 11 ++--
 .../select_n_translator.py                    | 16 +++---
 ...st_sub_translators_convert_element_type.py |  2 +-
 tests/test_sub_translators_iota.py            |  5 +-
 tests/test_sub_translators_slicing.py         |  8 +--
 tests/test_subtranslator_helper.py            |  2 +-
 9 files changed, 59 insertions(+), 52 deletions(-)

diff --git a/src/jace/translator/mapped_operation_base_translator.py b/src/jace/translator/mapped_operation_base_translator.py
index f4ab189..e7a3941 100644
--- a/src/jace/translator/mapped_operation_base_translator.py
+++ b/src/jace/translator/mapped_operation_base_translator.py
@@ -22,19 +22,28 @@
 class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
     """Implements the base for all "mapped base operations".
 
-    A mapped base operation `f` is an operation that has several inputs arrays that are elementwise combined to a single output array.
-    A prime example for this would be the addition of two arrays.
+    A mapped base operation `f` is an operation that has several inputs arrays that are
+    elementwise combined to a single output array. A prime example for this would be the
+    addition of two arrays.
     Essentially it assumes that the Tasklet code can be written as:
     ```
         __out = f(__in0, __in1, __in3, ...)
     ```
-    where `__in*` are the connector names of the Tasklet and `__out` is the output connector.
-    For problems such as this, the SDFG API provides the `SDFGState.add_mapped_tasklet()` function, however, in most cases it can not be directly used.
+    where `__in*` are the connector names of the Tasklet and `__out` is the output connector. For
+    problems such as this, the SDFG API provides the `SDFGState.add_mapped_tasklet()` function,
+    however, in most cases it can not be directly used, for various reasons.
     Thus this class acts like a convenience wrapper around it.
 
-    To use this class a user has to overwrite the `write_tasklet_code()` function.
-    This function generates the entire code that should be put into the Tasklet, include the assignment to `__out`.
-    If needed the translator will perform literal substitution on the returned code and broadcast the inputs to match the outputs.
+    To use this class a user has to overwrite the `write_tasklet_code()` function. This function
+    generates the entire code that should be put into the Tasklet, include the assignment to
+    `__out`. If needed the translator will perform literal substitution on the returned code and
+    broadcast the inputs to match the outputs.
+
+    If needed a subclass can also override the `make_input_memlets()` function to generate custom
+    input Memlets, such as adding an offset.
+
+    Args:
+        primitive_name:     The name of the primitive `self` should bind to.
 
     Notes:
         This class will always generate a mapped Tasklet, even if a scalar is handled.
@@ -46,7 +55,6 @@ def __init__(
         self,
         primitive_name: str,
     ) -> None:
-        """Bind `self` to the primitive with name `primitive_name`."""
         self._prim_name = primitive_name
 
     @property
@@ -72,12 +80,8 @@ def __call__(
         and perform literal substitution by forwarding it to `self.literal_substitution()`.
         After that it will create the mapped Tasklet.
 
-        Args:
-            driver:         The driver object of the translation.
-            in_var_names:   List of the names of the arrays created inside the SDFG for the inputs or 'None' in case of a literal.
-            out_var_names:  List of the names of the arrays created inside the SDFG for the outputs.
-            eqn:            The Jax equation that is translated.
-            eqn_state:      State into which the primitive's SDFG representation is constructed.
+        Note:
+            For a description of the arguments see `PrimitiveTranslatorCallable`.
         """
         assert len(out_var_names) == 1
         if eqn.outvars[0].aval.shape != ():
@@ -127,9 +131,9 @@ def write_tasklet_code(
         However, the base will do literal substitution on the returned object.
 
         Args:
-            tskl_ranges:    The iteration indexes used by the map, first element is the iteration index itself,
-                                the second index is the iteration range.
-            in_var_names:   The list of SDFG variables used as input.
+            tskl_ranges:    List of pairs used as map parameter, first element is the name
+                iteration index of the dimension, second is its range, i.e. `0:SIZE`.
+            in_var_names:   The list of SDFG variables used as input, `None` if literal.
             eqn:            The equation.
         """
         ...
@@ -142,19 +146,21 @@ def make_input_memlets(
     ) -> dict[str, dace.Memlet]:
         """Generate the input Memlets for the non literal operators of the primitive.
 
-        The returned `dict` maps the input connector of the Tasklet to the Memlet that is used to connect it to the Map entry node.
+        The returned `dict` maps the input connector of the Tasklet to the Memlet that is used
+        to connect it to the Map entry node.
 
         Args:
-            tskl_ranges:    List of the different map parameter, first element is the name of the dimension,
-                                    second is the range, i.e. `0:SIZE`.
-            in_var_names:   The list of SDFG variables used as input.
+            tskl_ranges:    List of pairs used as map parameter, first element is the name
+                iteration index of the dimension, second is its range, i.e. `0:SIZE`.
+            in_var_names:   The list of SDFG variables used as input, `None` if literal.
             eqn:            The equation object.
         """
         out_shp = tuple(eqn.outvars[0].aval.shape)  # Shape of the output
         out_rank = len(out_shp)
         if any(len(invar.aval.shape) not in {0, out_rank} for invar in eqn.invars):
             raise NotImplementedError(
-                f"'MappedOperationTranslatorBase' Inputs must have the same rank as the output! Eqn: {eqn} || {tuple(eqn.outvars[0].aval.shape)}"
+                f"'MappedOperationTranslatorBase' Inputs must have the same rank as the output! "
+                f"Eqn: {eqn} || {tuple(eqn.outvars[0].aval.shape)}"
             )
 
         # Now we will generate the input Memlets.
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index bdca3d4..f748cc0 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -93,7 +93,8 @@ class PrimitiveTranslator(PrimitiveTranslatorCallable, Protocol):
     driver object, which also owns and manage the primitive translators. In the end this implements
     the delegation pattern.
 
-    You can use `jace.translator.register_primitive_translator()` to register your translator to Jace.
+    You can use `jace.translator.register_primitive_translator()` to register your translator to
+    Jace.
     """
 
     __slots__ = ()
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index 44ba62d..a1db547 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -26,11 +26,13 @@ class ConvertElementTypeTranslator(mapped_base.MappedOperationTranslatorBase):
     Copies the input to the output and performs type conversion.
 
     Notes:
-        This translator ignores the `new_dtype` and `weak_type` parameter of the equation and only performs casting
+        This translator ignores the `new_dtype` and `weak_type` parameter the equation
+        and only performs the casting.
 
     Todo:
-        Occasionally Jax converts from the same type to another type.
-            This case should be handled by a Memlet directly, which can then be removed.
+        - Occasionally Jax generates a cast that is not needed, because the types are the same.
+            Currently this is handled, by generating an explicit copy, however, it should be
+            handled by a Memlet.
     """
 
     __slots__ = ()
@@ -54,8 +56,8 @@ def write_tasklet_code(
         out_dtype_s: str = str(out_dtype)
 
         # This is the base of the template that we use for conversion.
-        #  You should notice that the Tasklet `__out = __in0` will fail, see commit `f5aabc3` of the prototype.
-        #  Thus we have to do it in this way.
+        #  You should notice that the Tasklet `__out = __in0` will fail, see commit
+        #  `f5aabc3` of the prototype. Thus we have to do it in this way.
         conv_code = "__in0"
 
         # Handle special cases
@@ -64,7 +66,7 @@ def write_tasklet_code(
             #  See: tests/test_sub_translators_convert_element_type.py::test_convert_element_type_useless_cast
             # TODO(phimuell): Make this into a pure Memlet such that it can be optimized away by DaCe.
             warnings.warn(
-                f"convert_element_type({eqn}): is useless, because input and output have same type.",
+                f"convert_element_type({eqn}): is useless, input and output have same type.",
                 category=UserWarning,
                 stacklevel=1,  # Find a better one
             )
diff --git a/src/jace/translator/primitive_translators/copy_translator.py b/src/jace/translator/primitive_translators/copy_translator.py
index 1ff170e..acab7bd 100644
--- a/src/jace/translator/primitive_translators/copy_translator.py
+++ b/src/jace/translator/primitive_translators/copy_translator.py
@@ -39,10 +39,13 @@ def write_tasklet_code(
 class DevicePutTranslator(mapped_base.MappedOperationTranslatorBase):
     """The `device_put` primitive is used to transfer data between host and device.
 
-    The current implementation only supports the copying where the data already is.
-    Currently DaCe only knows about the Host and the GPU.
-    Furthermore, currently Jace works in such a way that everything is either put on the host or the device.
-    Because of this, the `DevicePutTranslator` is, currently, just a simple copy operation that should be removed, by the optimization.
+    The current implementation only supports the copying where the data already is. Currently DaCe
+    only knows about the Host and the GPU. Furthermore, currently Jace works in such a way that
+    everything is either put on the host or the device. Because of this, the `DevicePutTranslator`
+    is, currently, just a simple copy operation that should be removed, by the optimization.
+
+    Todo:
+        - Make into a Memlet because only the Memlet can handle copying between devices.
     """
 
     __slots__ = ()
diff --git a/src/jace/translator/primitive_translators/select_n_translator.py b/src/jace/translator/primitive_translators/select_n_translator.py
index 75a719b..b2f0e58 100644
--- a/src/jace/translator/primitive_translators/select_n_translator.py
+++ b/src/jace/translator/primitive_translators/select_n_translator.py
@@ -22,14 +22,16 @@
 class SelectNTranslator(mapped_base.MappedOperationTranslatorBase):
     """Implements the `select_n` primitive, which is a generalization of `np.where`
 
-    While `numpy.where` only supports two cases, the Jax primitive supports an arbitrary number of cases.
-    In that sense it is essentially a `C` `switch` statement, only that all cases have to materialize.
+    While `numpy.where` only supports two cases, the Jax primitive supports an arbitrary number
+    of cases. In that sense it is essentially a `C` `switch` statement, only that all cases have
+    to materialize.
 
     The behaviour is undefined if the predicate is out of bound.
 
     Note:
-        For a better understanding this function renames its input connectors.
-        The first one, which is the predicate, is renamed to `__cond` and the others are renamed again to `__in{i}`, starting with zero.
+        For a better understanding this function renames its input connectors. The first one,
+        which is the predicate, is renamed to `__cond` and the others are renamed again to
+        `__in{i}`, starting with zero.
     """
 
     __slots__ = ()
@@ -50,9 +52,9 @@ def write_tasklet_code(
         """
 
         if len(in_var_names) == 3:
-            # This order is correct, since `False` is interpreted as `0`, which means the first case.
-            #  DaCe seems to have some problems with bools and integer casting around, so we habdle
-            #  the bool case explicitly here; See also the `ConvertElementTypeTranslator`.
+            # This order is correct, since `False` is interpreted as `0`, which means the first
+            #  case. DaCe seems to have some problems with bools and integer casting around,
+            #  so we handle the bool case explicitly here; See also `ConvertElementTypeTranslator`.
             return "__out = __in1 if __cond else __in0"
 
         return "\n".join(
diff --git a/tests/test_sub_translators_convert_element_type.py b/tests/test_sub_translators_convert_element_type.py
index e2635cf..2684f34 100644
--- a/tests/test_sub_translators_convert_element_type.py
+++ b/tests/test_sub_translators_convert_element_type.py
@@ -90,7 +90,7 @@ def testee(a: float) -> np.ndarray:
 
     with pytest.warns(
         expected_warning=UserWarning,
-        match=r"convert_element_type\(.*\): is useless, because input and output have same type.",
+        match=r"convert_element_type\(.*\): is useless, input and output have same type.",
     ):
         res = jace.jit(testee)(1.0)
 
diff --git a/tests/test_sub_translators_iota.py b/tests/test_sub_translators_iota.py
index fb35e57..c3ce269 100644
--- a/tests/test_sub_translators_iota.py
+++ b/tests/test_sub_translators_iota.py
@@ -23,10 +23,7 @@ def testee(A: int) -> np.ndarray:
 
     ref = testee(0)
 
-    with pytest.warns(
-        expected_warning=UserWarning,
-        match=r"convert_element_type\(.*\): is useless, because input and output have same type.",
-    ):
+    with pytest.warns(expected_warning=UserWarning):
         res = jace.jit(testee)(0)
     assert np.all(ref == res)
 
diff --git a/tests/test_sub_translators_slicing.py b/tests/test_sub_translators_slicing.py
index a6f9e6c..398c704 100644
--- a/tests/test_sub_translators_slicing.py
+++ b/tests/test_sub_translators_slicing.py
@@ -169,9 +169,7 @@ def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> np.ndarray:
         return jax.lax.dynamic_slice(A, (s1, s2, s3, s4), (2, 2, 2, 2))
 
     # TODO(phimuell): Get rid of this warning, or allow it to disable.
-    with pytest.warns(
-        expected_warning=UserWarning,
-    ):
+    with pytest.warns(expected_warning=UserWarning):
         res = jace.jit(testee)(A_4x4x4x4, *full_dynamic_start_idx)
     ref = testee(A_4x4x4x4, *full_dynamic_start_idx)
 
@@ -185,9 +183,7 @@ def testee(A: np.ndarray, s1: int, s2: int) -> np.ndarray:
         return jax.lax.dynamic_slice(A, (s1, 1, s2, 2), (2, 2, 2, 2))
 
     # TODO(phimuell): Get rid of this warning, or allow it to disable.
-    with pytest.warns(
-        expected_warning=UserWarning,
-    ):
+    with pytest.warns(expected_warning=UserWarning):
         res = jace.jit(testee)(A_4x4x4x4, 1, 2)
     ref = testee(A_4x4x4x4, 1, 2)
 
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 3091282..fb34bcf 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -73,7 +73,7 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_regsitered_primitive_translators()) == 46
+    assert len(get_regsitered_primitive_translators()) == 47
 
 
 @pytest.mark.usefixtures("no_builtin_translators")

From a28a9c82bd2f3f613d67ae379561123c6e76918b Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 29 May 2024 12:57:00 +0200
Subject: [PATCH 262/458] Removed the warning about the useless casting in the
 tests.

---
 .../convert_element_type_translator.py             | 14 +++++---------
 tests/test_sub_translators_convert_element_type.py | 10 ++++++----
 tests/test_sub_translators_iota.py                 |  5 +----
 tests/test_sub_translators_slicing.py              |  8 ++------
 4 files changed, 14 insertions(+), 23 deletions(-)

diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index a1db547..c316bb9 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -9,7 +9,6 @@
 
 from __future__ import annotations
 
-import warnings
 from collections.abc import Sequence
 
 import dace
@@ -62,14 +61,11 @@ def write_tasklet_code(
 
         # Handle special cases
         if in_dtype == out_dtype:
-            # It sounds ridiculously but it can happen.
-            #  See: tests/test_sub_translators_convert_element_type.py::test_convert_element_type_useless_cast
-            # TODO(phimuell): Make this into a pure Memlet such that it can be optimized away by DaCe.
-            warnings.warn(
-                f"convert_element_type({eqn}): is useless, input and output have same type.",
-                category=UserWarning,
-                stacklevel=1,  # Find a better one
-            )
+            # This happens and previously there was a warning here, but that thing got so annoying
+            #  We handle it explicitly because otherwise, DaCe could not remove the Tasklet.
+            #  inside the tests that it was removed, see the `tests/test_sub_translators_convert_element_type.py::test_convert_element_type_useless_cast`
+            #  for more.
+            # TODO(phimuell): Make this into a pure Memlet.
             return f"__out = {conv_code}"
         if in_dtype_s.startswith("bool") and out_dtype_s.startswith("int"):
             # Interestingly `__out = int(__in0)` will at some DaCe processing stage.
diff --git a/tests/test_sub_translators_convert_element_type.py b/tests/test_sub_translators_convert_element_type.py
index 2684f34..cb2e690 100644
--- a/tests/test_sub_translators_convert_element_type.py
+++ b/tests/test_sub_translators_convert_element_type.py
@@ -77,11 +77,13 @@ def test_convert_element_type_from_bool():
     _test_convert_element_type_impl([np.bool_], _DACE_COMPLEX)
 
 
+@pytest.mark.skip(reason="The warning was disabled, so the test is useless.")
 def test_convert_element_type_useless_cast():
-    """Broadcast a literal to a matrix.
+    """Shows that under some conditions there is really a casting from one type to the same.
 
-    This test is here to show, that in certain situation Jax inserts
-    a `convert_element_type` primitive even if it is not needed.
+    In certain cases, also in some slicing tests, this useless cast is inserted by Jax.
+    This test was originally here to show this. However, that thing got so annoying that it was
+    removed. The test is kept here to serve as some kind of a reference.
     """
 
     def testee(a: float) -> np.ndarray:
@@ -90,7 +92,7 @@ def testee(a: float) -> np.ndarray:
 
     with pytest.warns(
         expected_warning=UserWarning,
-        match=r"convert_element_type\(.*\): is useless, input and output have same type.",
+        match=r"convert_element_type\(.*\): is useless, input and output have same type\.",
     ):
         res = jace.jit(testee)(1.0)
 
diff --git a/tests/test_sub_translators_iota.py b/tests/test_sub_translators_iota.py
index c3ce269..696a536 100644
--- a/tests/test_sub_translators_iota.py
+++ b/tests/test_sub_translators_iota.py
@@ -9,7 +9,6 @@
 
 import jax
 import numpy as np
-import pytest
 from jax import numpy as jnp
 
 import jace
@@ -22,9 +21,7 @@ def testee(A: int) -> np.ndarray:
         return jnp.arange(18, dtype=int) + A
 
     ref = testee(0)
-
-    with pytest.warns(expected_warning=UserWarning):
-        res = jace.jit(testee)(0)
+    res = jace.jit(testee)(0)
     assert np.all(ref == res)
 
 
diff --git a/tests/test_sub_translators_slicing.py b/tests/test_sub_translators_slicing.py
index 398c704..7faa930 100644
--- a/tests/test_sub_translators_slicing.py
+++ b/tests/test_sub_translators_slicing.py
@@ -168,9 +168,7 @@ def test_dynamic_slice_full_dynamic(A_4x4x4x4, full_dynamic_start_idx):
     def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> np.ndarray:
         return jax.lax.dynamic_slice(A, (s1, s2, s3, s4), (2, 2, 2, 2))
 
-    # TODO(phimuell): Get rid of this warning, or allow it to disable.
-    with pytest.warns(expected_warning=UserWarning):
-        res = jace.jit(testee)(A_4x4x4x4, *full_dynamic_start_idx)
+    res = jace.jit(testee)(A_4x4x4x4, *full_dynamic_start_idx)
     ref = testee(A_4x4x4x4, *full_dynamic_start_idx)
 
     assert np.all(ref == res)
@@ -182,9 +180,7 @@ def test_dynamic_slice_partially_dynamic(A_4x4x4x4):
     def testee(A: np.ndarray, s1: int, s2: int) -> np.ndarray:
         return jax.lax.dynamic_slice(A, (s1, 1, s2, 2), (2, 2, 2, 2))
 
-    # TODO(phimuell): Get rid of this warning, or allow it to disable.
-    with pytest.warns(expected_warning=UserWarning):
-        res = jace.jit(testee)(A_4x4x4x4, 1, 2)
+    res = jace.jit(testee)(A_4x4x4x4, 1, 2)
     ref = testee(A_4x4x4x4, 1, 2)
 
     assert np.all(ref == res)

From 5bb4b5e557906af0855e95e7bc23d0509e28578a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 29 May 2024 13:35:37 +0200
Subject: [PATCH 263/458] Started to reorganize the tests.

---
 tests/conftest.py                                         | 8 ++++++++
 tests/general_tests/__init__.py                           | 8 ++++++++
 tests/{ => general_tests}/test_caching.py                 | 0
 tests/{ => general_tests}/test_decorator.py               | 0
 tests/{ => general_tests}/test_jax_api.py                 | 0
 tests/{ => general_tests}/test_misc.py                    | 0
 tests/{ => general_tests}/test_package.py                 | 0
 tests/translator_tests/__init__.py                        | 8 ++++++++
 tests/translator_tests/primitive_translators/__init__.py  | 8 ++++++++
 .../primitive_translators}/test_sub_translators_alu.py    | 0
 .../test_sub_translators_broadcast_in_dim.py              | 0
 .../test_sub_translators_convert_element_type.py          | 0
 .../primitive_translators}/test_sub_translators_iota.py   | 0
 .../test_sub_translators_reshape.py                       | 0
 .../test_sub_translators_select_n.py                      | 0
 .../test_sub_translators_slicing.py                       | 0
 .../test_sub_translators_squeeze_expand_dims.py           | 0
 tests/{ => translator_tests}/test_empty_jaxpr.py          | 0
 .../test_jaxpr_translator_driver.py                       | 0
 tests/{ => translator_tests}/test_subtranslator_helper.py | 0
 20 files changed, 32 insertions(+)
 create mode 100644 tests/conftest.py
 create mode 100644 tests/general_tests/__init__.py
 rename tests/{ => general_tests}/test_caching.py (100%)
 rename tests/{ => general_tests}/test_decorator.py (100%)
 rename tests/{ => general_tests}/test_jax_api.py (100%)
 rename tests/{ => general_tests}/test_misc.py (100%)
 rename tests/{ => general_tests}/test_package.py (100%)
 create mode 100644 tests/translator_tests/__init__.py
 create mode 100644 tests/translator_tests/primitive_translators/__init__.py
 rename tests/{ => translator_tests/primitive_translators}/test_sub_translators_alu.py (100%)
 rename tests/{ => translator_tests/primitive_translators}/test_sub_translators_broadcast_in_dim.py (100%)
 rename tests/{ => translator_tests/primitive_translators}/test_sub_translators_convert_element_type.py (100%)
 rename tests/{ => translator_tests/primitive_translators}/test_sub_translators_iota.py (100%)
 rename tests/{ => translator_tests/primitive_translators}/test_sub_translators_reshape.py (100%)
 rename tests/{ => translator_tests/primitive_translators}/test_sub_translators_select_n.py (100%)
 rename tests/{ => translator_tests/primitive_translators}/test_sub_translators_slicing.py (100%)
 rename tests/{ => translator_tests/primitive_translators}/test_sub_translators_squeeze_expand_dims.py (100%)
 rename tests/{ => translator_tests}/test_empty_jaxpr.py (100%)
 rename tests/{ => translator_tests}/test_jaxpr_translator_driver.py (100%)
 rename tests/{ => translator_tests}/test_subtranslator_helper.py (100%)

diff --git a/tests/conftest.py b/tests/conftest.py
new file mode 100644
index 0000000..f2d8b8f
--- /dev/null
+++ b/tests/conftest.py
@@ -0,0 +1,8 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""General configuration for the tests."""
diff --git a/tests/general_tests/__init__.py b/tests/general_tests/__init__.py
new file mode 100644
index 0000000..a2c2edf
--- /dev/null
+++ b/tests/general_tests/__init__.py
@@ -0,0 +1,8 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""General Jace tests."""
diff --git a/tests/test_caching.py b/tests/general_tests/test_caching.py
similarity index 100%
rename from tests/test_caching.py
rename to tests/general_tests/test_caching.py
diff --git a/tests/test_decorator.py b/tests/general_tests/test_decorator.py
similarity index 100%
rename from tests/test_decorator.py
rename to tests/general_tests/test_decorator.py
diff --git a/tests/test_jax_api.py b/tests/general_tests/test_jax_api.py
similarity index 100%
rename from tests/test_jax_api.py
rename to tests/general_tests/test_jax_api.py
diff --git a/tests/test_misc.py b/tests/general_tests/test_misc.py
similarity index 100%
rename from tests/test_misc.py
rename to tests/general_tests/test_misc.py
diff --git a/tests/test_package.py b/tests/general_tests/test_package.py
similarity index 100%
rename from tests/test_package.py
rename to tests/general_tests/test_package.py
diff --git a/tests/translator_tests/__init__.py b/tests/translator_tests/__init__.py
new file mode 100644
index 0000000..a04e6d9
--- /dev/null
+++ b/tests/translator_tests/__init__.py
@@ -0,0 +1,8 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Tests related to the translators."""
diff --git a/tests/translator_tests/primitive_translators/__init__.py b/tests/translator_tests/primitive_translators/__init__.py
new file mode 100644
index 0000000..16abf65
--- /dev/null
+++ b/tests/translator_tests/primitive_translators/__init__.py
@@ -0,0 +1,8 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Tests related to the actual primitive subtranslators."""
diff --git a/tests/test_sub_translators_alu.py b/tests/translator_tests/primitive_translators/test_sub_translators_alu.py
similarity index 100%
rename from tests/test_sub_translators_alu.py
rename to tests/translator_tests/primitive_translators/test_sub_translators_alu.py
diff --git a/tests/test_sub_translators_broadcast_in_dim.py b/tests/translator_tests/primitive_translators/test_sub_translators_broadcast_in_dim.py
similarity index 100%
rename from tests/test_sub_translators_broadcast_in_dim.py
rename to tests/translator_tests/primitive_translators/test_sub_translators_broadcast_in_dim.py
diff --git a/tests/test_sub_translators_convert_element_type.py b/tests/translator_tests/primitive_translators/test_sub_translators_convert_element_type.py
similarity index 100%
rename from tests/test_sub_translators_convert_element_type.py
rename to tests/translator_tests/primitive_translators/test_sub_translators_convert_element_type.py
diff --git a/tests/test_sub_translators_iota.py b/tests/translator_tests/primitive_translators/test_sub_translators_iota.py
similarity index 100%
rename from tests/test_sub_translators_iota.py
rename to tests/translator_tests/primitive_translators/test_sub_translators_iota.py
diff --git a/tests/test_sub_translators_reshape.py b/tests/translator_tests/primitive_translators/test_sub_translators_reshape.py
similarity index 100%
rename from tests/test_sub_translators_reshape.py
rename to tests/translator_tests/primitive_translators/test_sub_translators_reshape.py
diff --git a/tests/test_sub_translators_select_n.py b/tests/translator_tests/primitive_translators/test_sub_translators_select_n.py
similarity index 100%
rename from tests/test_sub_translators_select_n.py
rename to tests/translator_tests/primitive_translators/test_sub_translators_select_n.py
diff --git a/tests/test_sub_translators_slicing.py b/tests/translator_tests/primitive_translators/test_sub_translators_slicing.py
similarity index 100%
rename from tests/test_sub_translators_slicing.py
rename to tests/translator_tests/primitive_translators/test_sub_translators_slicing.py
diff --git a/tests/test_sub_translators_squeeze_expand_dims.py b/tests/translator_tests/primitive_translators/test_sub_translators_squeeze_expand_dims.py
similarity index 100%
rename from tests/test_sub_translators_squeeze_expand_dims.py
rename to tests/translator_tests/primitive_translators/test_sub_translators_squeeze_expand_dims.py
diff --git a/tests/test_empty_jaxpr.py b/tests/translator_tests/test_empty_jaxpr.py
similarity index 100%
rename from tests/test_empty_jaxpr.py
rename to tests/translator_tests/test_empty_jaxpr.py
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/translator_tests/test_jaxpr_translator_driver.py
similarity index 100%
rename from tests/test_jaxpr_translator_driver.py
rename to tests/translator_tests/test_jaxpr_translator_driver.py
diff --git a/tests/test_subtranslator_helper.py b/tests/translator_tests/test_subtranslator_helper.py
similarity index 100%
rename from tests/test_subtranslator_helper.py
rename to tests/translator_tests/test_subtranslator_helper.py

From 959849accb60762665589a653cf5568562ca106f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 29 May 2024 13:47:35 +0200
Subject: [PATCH 264/458] WIP: Started to better organize the tests.

---
 tests/common_fixture.py | 8 ++++++++
 1 file changed, 8 insertions(+)
 create mode 100644 tests/common_fixture.py

diff --git a/tests/common_fixture.py b/tests/common_fixture.py
new file mode 100644
index 0000000..b36f22d
--- /dev/null
+++ b/tests/common_fixture.py
@@ -0,0 +1,8 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Contains all common fixture we need."""

From 047bb4691302d5c84637d9490d8271e1c1093a26 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 29 May 2024 15:08:40 +0200
Subject: [PATCH 265/458] Applied a first version to the new code.

---
 src/jace/api.py                               |  6 ++---
 .../translator/jaxpr_translator_driver.py     | 23 +++++++++----------
 src/jace/util/jax_helper.py                   |  8 ++++---
 src/jace/util/traits.py                       |  8 ++-----
 4 files changed, 21 insertions(+), 24 deletions(-)

diff --git a/src/jace/api.py b/src/jace/api.py
index f1600c8..84b500a 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -11,7 +11,7 @@
 
 import functools
 from collections.abc import Callable, Mapping
-from typing import Any, Literal, overload
+from typing import Any, Literal, cast, overload
 
 from jax import grad, jacfwd, jacrev
 
@@ -20,9 +20,9 @@
 
 __all__ = [
     "grad",
-    "jit",
     "jacfwd",
     "jacrev",
+    "jit",
 ]
 
 
@@ -79,6 +79,6 @@ def wrapper(f: Callable) -> stages.JaceWrapped:
             ),
             jit_options=kwargs,
         )
-        return functools.update_wrapper(jace_wrapper, f)
+        return cast(stages.JaceWrapped, functools.update_wrapper(jace_wrapper, f))
 
     return wrapper if fun is None else wrapper(fun)
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index f66407d..9ab648c 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -67,7 +67,7 @@ class JaxprTranslationDriver:
 
     """
 
-    __slots__ = ("_ctx_stack", "_primitive_translators", "_jax_name_map")
+    __slots__ = ("_ctx_stack", "_jax_name_map", "_primitive_translators")
 
     _primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable]
     _jax_name_map: dict[jax_core.Var | util.JaCeVar, str]
@@ -205,14 +205,13 @@ def get_array(
     @overload
     def map_jax_var_to_sdfg(
         self,
-        jax_var: str | jax_core.Atom | util.JaCeVar,
+        jax_var: jax_core.Atom | util.JaCeVar,
+        allow_fail: Literal[False] = False,
     ) -> str: ...
 
     @overload
     def map_jax_var_to_sdfg(
-        self,
-        jax_var: str | jax_core.Atom | util.JaCeVar,
-        allow_fail: Literal[True],
+        self, jax_var: jax_core.Atom | util.JaCeVar, allow_fail: Literal[True]
     ) -> str | None: ...
 
     def map_jax_var_to_sdfg(
@@ -227,7 +226,7 @@ def map_jax_var_to_sdfg(
             allow_fail:     If mapping is not known return `None` instead of raising `KeyError`.
         """
         if isinstance(jax_var, jax_core.Literal):
-            raise RuntimeError("There is no SDFG variable for literal '{jax_var}'.")
+            raise RuntimeError(f"There is no SDFG variable for literal '{jax_var}'.")
         if jax_var in self._jax_name_map:
             sdfg_name = self._jax_name_map[jax_var]
         elif allow_fail:
@@ -254,9 +253,7 @@ def is_allocated(self) -> bool:
 
         If `self` is allocated then there is also an ongoing translation process.
         """
-        if len(self._ctx_stack) != 0:
-            return True
-        return False
+        return len(self._ctx_stack) != 0
 
     def is_root_translator(self) -> bool:
         """Tests if `self` is the root translator.
@@ -265,9 +262,7 @@ def is_root_translator(self) -> bool:
         """
         if not self.is_allocated():
             raise RuntimeError("Driver is not allocated.")
-        if len(self._ctx_stack) == 1:
-            return True
-        return False
+        return len(self._ctx_stack) == 1
 
     def add_jax_name_mapping(
         self,
@@ -329,6 +324,10 @@ def add_array(
             pipeline, should be handle to handle it. But there are some special parts that
             might explicitly want a scalar, it also might block certain compiler optimization.
         """
+
+        if isinstance(arg, jax_core.Literal):
+            raise ValueError(f"Can not generate an SDFG variable for literal '{arg}'.")
+
         shape: tuple[int | dace.symbol | str, ...] = util.get_jax_var_shape(arg)
         dtype: dace.typeclass = util.get_jax_var_dtype(arg)
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 5641a48..68c31ce 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -104,7 +104,7 @@ def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symb
     """Returns the shape of `jax_var`."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
-            return jax_var.aval.shape
+            return jax_var.aval.shape  # type: ignore[attr-defined]  # AbstractValue is too abstract.
         case JaCeVar():
             return jax_var.shape
         case _:
@@ -115,7 +115,7 @@ def get_jax_var_dtype(jax_var: jax_core.Atom | JaCeVar) -> dace.typeclass:
     """Returns the DaCe equivalent of `jax_var`s datatype."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
-            return translate_dtype(jax_var.aval.dtype)
+            return translate_dtype(jax_var.aval.dtype)  # type: ignore[attr-defined]  # AbstractValue is too abstract.
         case JaCeVar():
             return jax_var.dtype
         case _:
@@ -195,11 +195,13 @@ def propose_jax_name(
     return jax_name
 
 
-def get_jax_literal_value(lit: jax_core.Literal) -> bool | float | int | np.generic:
+def get_jax_literal_value(lit: jax_core.Atom) -> bool | float | int | np.generic:
     """Returns the value a literal is wrapping.
 
     The function guarantees to return a scalar value.
     """
+    if not isinstance(lit, jax_core.Literal):
+        raise ValueError(f"Can only extract literals not '{type(lit)}'.")
     val = lit.val
     if isinstance(val, np.ndarray):
         assert val.shape == ()
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 92ed336..1f51d9e 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -32,7 +32,7 @@ def is_jaceified(obj: Any) -> TypeGuard[stages.JaceWrapped]:
     return isinstance(obj, stages.JaceWrapped)
 
 
-def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVarp]:
+def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVar]:
     """Tests if `jax_var` is a drop variable, i.e. a variable that is not read from in a Jaxpr."""
 
     if isinstance(jax_var, jax_core.DropVar):
@@ -119,11 +119,7 @@ def is_on_device(
     function is more of a test, if there is a GPU or not.
     """
     if is_jax_array(obj):
-        try:
-            _ = obj.__cuda_array_interface__
-            return True
-        except AttributeError:
-            return False
+        return hasattr(obj, "__cuda_array_interface__")
     return dace.is_gpu_array(obj)
 
 
From 64135b9de800a93d9fbadee602bdd3bb01665daf Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 29 May 2024 15:25:55 +0200
Subject: [PATCH 266/458] Second round.

---
 src/jace/__init__.py            |  8 ++++----
 src/jace/stages.py              |  6 +++---
 src/jace/translator/__init__.py |  4 ++--
 src/jace/util/__init__.py       | 20 ++++++++++----------
 4 files changed, 19 insertions(+), 19 deletions(-)

diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 7fed965..de111ec 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -18,11 +18,11 @@
 __all__ = [
     "__author__",
     "__copyright__",
-    "grad",
-    "jit",
-    "jacfwd",
-    "jacrev",
     "__license__",
     "__version__",
     "__version_info__",
+    "grad",
+    "jacfwd",
+    "jacrev",
+    "jit",
 ]
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 43c07c2..1757a77 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -299,9 +299,9 @@ def __call__(
 
 
 __all__ = [
-    "Stage",
     "CompilerOptions",  # export for compatibility with Jax.
-    "JaceWrapped",
-    "JaceLowered",
     "JaceCompiled",
+    "JaceLowered",
+    "JaceWrapped",
+    "Stage",
 ]
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 49342be..1bc0494 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -25,8 +25,8 @@
     "PrimitiveTranslator",
     "PrimitiveTranslatorCallable",
     "TranslatedJaxprSDFG",
-    "register_primitive_translator",
     "get_regsitered_primitive_translators",
-    "set_active_primitive_translators_to",
     "make_primitive_translator",
+    "register_primitive_translator",
+    "set_active_primitive_translators_to",
 ]
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 572561f..7adcf90 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -41,26 +41,26 @@
 
 
 __all__ = [
+    "FORBIDDEN_SDFG_VAR_NAMES",
     "VALID_SDFG_OBJ_NAME",
     "VALID_SDFG_VAR_NAME",
-    "FORBIDDEN_SDFG_VAR_NAMES",
     "JaCeVar",
     "compile_jax_sdfg",
     "dataclass_with_default_init",
+    "get_jax_literal_value",
+    "get_jax_var_dtype",
+    "get_jax_var_name",
+    "get_jax_var_shape",
     "is_array",
     "is_drop_var",
-    "is_tracing_ongoing",
+    "is_fully_addressable",
     "is_jaceified",
-    "is_jaxified",
     "is_jax_array",
-    "is_fully_addressable",
+    "is_jaxified",
     "is_on_device",
     "is_scalar",
-    "get_jax_var_dtype",
-    "get_jax_var_name",
-    "get_jax_var_shape",
-    "get_jax_literal_value",
-    "translate_dtype",
-    "run_jax_sdfg",
+    "is_tracing_ongoing",
     "propose_jax_name",
+    "run_jax_sdfg",
+    "translate_dtype",
 ]

From 5756d1ec43c9b58cc5c47de287524af1b91330a1 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 30 May 2024 07:29:45 +0200
Subject: [PATCH 267/458] Third rounds for updated configuration.

---
 .../translator/mapped_operation_base_translator.py  | 13 +++++++------
 .../convert_element_type_translator.py              |  6 +++---
 .../primitive_translators/reshape_translator.py     |  4 ++--
 .../translator/primitive_translators/slicing.py     |  6 +++---
 .../primitive_translators/squeeze_translator.py     |  4 ++--
 src/jace/util/jax_helper.py                         |  8 ++++++--
 6 files changed, 23 insertions(+), 18 deletions(-)

diff --git a/src/jace/translator/mapped_operation_base_translator.py b/src/jace/translator/mapped_operation_base_translator.py
index e7a3941..7202ef6 100644
--- a/src/jace/translator/mapped_operation_base_translator.py
+++ b/src/jace/translator/mapped_operation_base_translator.py
@@ -84,9 +84,10 @@ def __call__(
             For a description of the arguments see `PrimitiveTranslatorCallable`.
         """
         assert len(out_var_names) == 1
-        if eqn.outvars[0].aval.shape != ():
+        if util.get_jax_var_shape(eqn.outvars[0]) != ():
             tskl_ranges: list[tuple[str, str]] = [
-                (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
+                (f"__i{dim}", f"0:{N}")
+                for dim, N in enumerate(util.get_jax_var_shape(eqn.outvars[0]))
             ]
             tskl_output: dict[str, dace.Memlet] = {
                 "__out": dace.Memlet.simple(
@@ -155,18 +156,18 @@ def make_input_memlets(
             in_var_names:   The list of SDFG variables used as input, `None` if literal.
             eqn:            The equation object.
         """
-        out_shp = tuple(eqn.outvars[0].aval.shape)  # Shape of the output
+        out_shp = tuple(util.get_jax_var_shape(eqn.outvars[0]))  # Shape of the output
         out_rank = len(out_shp)
-        if any(len(invar.aval.shape) not in {0, out_rank} for invar in eqn.invars):
+        if any(len(util.get_jax_var_shape(invar)) not in {0, out_rank} for invar in eqn.invars):
             raise NotImplementedError(
                 f"'MappedOperationTranslatorBase' Inputs must have the same rank as the output! "
-                f"Eqn: {eqn} || {tuple(eqn.outvars[0].aval.shape)}"
+                f"Eqn: {eqn} || {tuple(util.get_jax_var_shape(eqn.outvars[0]))}"
             )
 
         # Now we will generate the input Memlets.
         tskl_inputs: dict[str, dace.Memlet] = {}
         for i, (in_var_name, inp_shp) in enumerate(
-            zip(in_var_names, (invar.aval.shape for invar in eqn.invars))
+            zip(in_var_names, (util.get_jax_var_shape(invar) for invar in eqn.invars))
         ):
             if in_var_name is None:  # Input is a literal: No Memlet needed
                 continue
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index c316bb9..1c6343d 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -15,7 +15,7 @@
 from jax import core as jax_core
 from typing_extensions import override
 
-from jace import translator
+from jace import translator, util
 from jace.translator import mapped_operation_base_translator as mapped_base
 
 
@@ -49,9 +49,9 @@ def write_tasklet_code(
         if in_var_names[0] is None:
             raise NotImplementedError("'convert_element_type' is not supported for literals.")
 
-        in_dtype = eqn.invars[0].aval.dtype
+        in_dtype = util.get_jax_var_dtype(eqn.invars[0])
         in_dtype_s: str = str(in_dtype)
-        out_dtype = eqn.outvars[0].aval.dtype
+        out_dtype = util.get_jax_var_dtype(eqn.outvars[0])
         out_dtype_s: str = str(out_dtype)
 
         # This is the base of the template that we use for conversion.
diff --git a/src/jace/translator/primitive_translators/reshape_translator.py b/src/jace/translator/primitive_translators/reshape_translator.py
index 47a92bf..e5e4894 100644
--- a/src/jace/translator/primitive_translators/reshape_translator.py
+++ b/src/jace/translator/primitive_translators/reshape_translator.py
@@ -13,7 +13,7 @@
 from jax import core as jax_core
 from typing_extensions import override
 
-from jace import translator
+from jace import translator, util
 
 
 class ReshapeTranslator(translator.PrimitiveTranslator):
@@ -50,7 +50,7 @@ def __call__(
             eqn_state.add_write(out_var_names[0]),
             dace.Memlet(
                 data=in_var_names[0],
-                subset=", ".join(f"0:{size}" for size in eqn.invars[0].aval.shape),
+                subset=", ".join(f"0:{size}" for size in util.get_jax_var_shape(eqn.invars[0])),
                 other_subset=", ".join(f"0:{size}" for size in eqn.params["new_sizes"]),
             ),
         )
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index babfa08..1e32f41 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -91,7 +91,7 @@ def __call__(
         eqn_state: dace.SDFGState,
     ) -> None:
         assert in_var_names[0]
-        assert len(in_var_names) == len(eqn.invars[0].aval.shape) + 1
+        assert len(in_var_names) == len(util.get_jax_var_shape(eqn.invars[0])) + 1
 
         # This is the sizes of the slice window.
         window_sizes: Sequence[int] = eqn.params["slice_sizes"]
@@ -112,7 +112,7 @@ def __call__(
         #  To do it we will use Tasklets, because otherwise we can not merge the state.
         # TODO(phimuell): Make the Tasklet mapped, that they can be merged.
         for dim, (start_index, dim_size, wsize) in enumerate(
-            zip(start_indices, eqn.invars[0].aval.shape, window_sizes)
+            zip(start_indices, util.get_jax_var_shape(eqn.invars[0]), window_sizes)
         ):
             if start_index is None:
                 continue
@@ -152,7 +152,7 @@ def __call__(
             in_access[new_start_idx_var_name] = new_start_idx_acc
 
         tskl_ranges: list[tuple[str, str]] = [
-            (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
+            (f"__i{dim}", f"0:{N}") for dim, N in enumerate(util.get_jax_var_shape(eqn.outvars[0]))
         ]
 
         # We use dynamic map ranges, thus the map entry has input connectors, that does not start
diff --git a/src/jace/translator/primitive_translators/squeeze_translator.py b/src/jace/translator/primitive_translators/squeeze_translator.py
index f699a63..fc63607 100644
--- a/src/jace/translator/primitive_translators/squeeze_translator.py
+++ b/src/jace/translator/primitive_translators/squeeze_translator.py
@@ -14,7 +14,7 @@
 from jax import core as jax_core
 from typing_extensions import override
 
-from jace import translator
+from jace import translator, util
 from jace.translator import mapped_operation_base_translator as mapped_base
 
 
@@ -46,7 +46,7 @@ def make_input_memlets(
         eqn: jax_core.JaxprEqn,
     ) -> dict[str, dace.Memlet]:
         to_rem: Sequence[str] = eqn.params["dimensions"]
-        in_rank: int = len(eqn.invars[0].aval.shape)
+        in_rank: int = len(util.get_jax_var_shape(eqn.invars[0]))
         cnt = itertools.count(0)
         return {
             "__in0": dace.Memlet.simple(
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 68c31ce..8cbfb45 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -104,7 +104,9 @@ def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symb
     """Returns the shape of `jax_var`."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
-            return jax_var.aval.shape  # type: ignore[attr-defined]  # AbstractValue is too abstract.
+            # AbstractValue, does not have a `shape` attribute, but in all cases we care, it will.
+            assert hasattr(jax_var.aval, "shape")
+            return jax_var.aval.shape
         case JaCeVar():
             return jax_var.shape
         case _:
@@ -115,7 +117,9 @@ def get_jax_var_dtype(jax_var: jax_core.Atom | JaCeVar) -> dace.typeclass:
     """Returns the DaCe equivalent of `jax_var`s datatype."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
-            return translate_dtype(jax_var.aval.dtype)  # type: ignore[attr-defined]  # AbstractValue is too abstract.
+            # AbstractValue, does not have a `dtype` attribute, but in all cases we care, it will.
+            assert hasattr(jax_var.aval, "dtype")
+            return translate_dtype(jax_var.aval.dtype)
         case JaCeVar():
             return jax_var.dtype
         case _:

From 8b66af8ca8648afe9b4eb7c9c14f84952ae4339f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 30 May 2024 07:56:49 +0200
Subject: [PATCH 268/458] Fourth batch of adapting new configuration.

---
 src/jace/api.py                               | 23 ++++---
 src/jace/optimization.py                      |  4 +-
 src/jace/stages.py                            | 64 ++++++++++---------
 src/jace/translator/managing.py               |  9 +--
 .../mapped_operation_base_translator.py       |  9 ++-
 src/jace/translator/pre_post_translation.py   |  3 +-
 src/jace/translator/primitive_translator.py   | 11 ++--
 .../primitive_translators/alu_translators.py  | 10 ++-
 .../broadcast_in_dim_translator.py            |  9 ++-
 .../convert_element_type_translator.py        | 21 +++---
 .../primitive_translators/copy_translator.py  | 11 +++-
 .../primitive_translators/iota_translator.py  | 11 +++-
 .../reshape_translator.py                     |  9 ++-
 .../select_n_translator.py                    |  9 ++-
 .../primitive_translators/slicing.py          |  9 ++-
 .../squeeze_translator.py                     |  9 ++-
 src/jace/util/compiling.py                    |  3 +-
 src/jace/util/jax_helper.py                   |  7 +-
 src/jace/util/traits.py                       |  6 +-
 src/jace/util/translation_cache.py            |  4 +-
 tests/general_tests/__init__.py               |  2 +-
 tests/general_tests/test_caching.py           | 16 ++---
 tests/general_tests/test_jax_api.py           | 10 +--
 tests/general_tests/test_misc.py              |  2 +-
 .../test_sub_translators_alu.py               | 35 ++++------
 .../test_sub_translators_broadcast_in_dim.py  |  4 +-
 ...st_sub_translators_convert_element_type.py | 10 ++-
 .../test_sub_translators_iota.py              |  4 +-
 .../test_sub_translators_reshape.py           | 11 ++--
 .../test_sub_translators_select_n.py          | 13 +++-
 .../test_sub_translators_slicing.py           |  6 +-
 ...est_sub_translators_squeeze_expand_dims.py | 10 ++-
 .../test_jaxpr_translator_driver.py           |  2 +-
 33 files changed, 217 insertions(+), 149 deletions(-)

diff --git a/src/jace/api.py b/src/jace/api.py
index 84b500a..4aed96c 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -10,14 +10,17 @@
 from __future__ import annotations
 
 import functools
-from collections.abc import Callable, Mapping
-from typing import Any, Literal, cast, overload
+from typing import TYPE_CHECKING, Any, Literal, cast, overload
 
 from jax import grad, jacfwd, jacrev
 
 from jace import stages, translator
 
 
+if TYPE_CHECKING:
+    from collections.abc import Callable, Mapping
+
+
 __all__ = [
     "grad",
     "jacfwd",
@@ -32,7 +35,7 @@ def jit(
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> Callable[[Callable], stages.JaceWrapped]: ...
+) -> Callable[[Callable], stages.JaCeWrapped]: ...
 
 
 @overload
@@ -41,7 +44,7 @@ def jit(
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> stages.JaceWrapped: ...
+) -> stages.JaCeWrapped: ...
 
 
 def jit(
@@ -49,12 +52,12 @@ def jit(
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> stages.JaceWrapped | Callable[[Callable], stages.JaceWrapped]:
-    """Jace's replacement for `jax.jit` (just-in-time) wrapper.
+) -> stages.JaCeWrapped | Callable[[Callable], stages.JaCeWrapped]:
+    """JaCe's replacement for `jax.jit` (just-in-time) wrapper.
 
     It works the same way as `jax.jit` does, but instead of using XLA the computation is lowered
     to DaCe. It supports the same arguments as `jax.jit` (although currently not) does.
-    In addition it accepts some Jace specific arguments.
+    In addition it accepts some JaCe specific arguments.
 
     Args:
         primitive_translators:    Use these primitive translators for the lowering to SDFG.
@@ -69,8 +72,8 @@ def jit(
             f"The following arguments to 'jace.jit' are not yet supported: {', '.join(kwargs)}."
         )
 
-    def wrapper(f: Callable) -> stages.JaceWrapped:
-        jace_wrapper = stages.JaceWrapped(
+    def wrapper(f: Callable) -> stages.JaCeWrapped:
+        jace_wrapper = stages.JaCeWrapped(
             fun=f,
             primitive_translators=(
                 translator.managing._PRIMITIVE_TRANSLATORS_DICT
@@ -79,6 +82,6 @@ def wrapper(f: Callable) -> stages.JaceWrapped:
             ),
             jit_options=kwargs,
         )
-        return cast(stages.JaceWrapped, functools.update_wrapper(jace_wrapper, f))
+        return cast(stages.JaCeWrapped, functools.update_wrapper(jace_wrapper, f))
 
     return wrapper if fun is None else wrapper(fun)
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index d232902..255485d 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Module that will host all optimization functions specific to Jace.
+"""Module that will host all optimization functions specific to JaCe.
 
 Currently just a dummy existing for the sake of providing some callable function.
 """
@@ -22,7 +22,7 @@
 
 
 class CompilerOptions(TypedDict, total=False):
-    """All known compiler options known to `JaceLowered.compile()`.
+    """All known compiler options known to `JaCeLowered.compile()`.
 
     See `jace_optimize()` for a description of the different options.
 
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 1757a77..288b2db 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -7,9 +7,9 @@
 """Reimplementation of the `jax.stages` module.
 
 This module reimplements the public classes of that Jax module.
-However, they are a big different, because Jace uses DaCe as backend.
+However, they are a big different, because JaCe uses DaCe as backend.
 
-As in Jax Jace has different stages, the terminology is taken from
+As in Jax JaCe has different stages, the terminology is taken from
 [Jax' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
 - Stage out:
     In this phase we translate an executable python function into Jaxpr.
@@ -25,10 +25,8 @@
 from __future__ import annotations
 
 import copy
-from collections.abc import Callable, Mapping, Sequence
-from typing import Any
+from typing import TYPE_CHECKING, Any
 
-import dace
 import jax as _jax
 
 from jace import optimization, translator, util
@@ -37,16 +35,22 @@
 from jace.util import dace_helper, translation_cache as tcache
 
 
-class JaceWrapped(tcache.CachingStage["JaceLowered"]):
+if TYPE_CHECKING:
+    from collections.abc import Callable, Mapping, Sequence
+
+    import dace
+
+
+class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
     """A function ready to be specialized, lowered, and compiled.
 
     This class represents the output of functions such as `jace.jit()` and is the first stage in
-    the translation/compilation chain of Jace. A user should never create a `JaceWrapped` object
+    the translation/compilation chain of JaCe. A user should never create a `JaCeWrapped` object
     directly, instead `jace.jit` should be used for that.
     While it supports just-in-time lowering and compilation these steps can also be performed
-    explicitly. The lowering performed by this stage is cached, thus if a `JaceWrapped` object is
+    explicitly. The lowering performed by this stage is cached, thus if a `JaCeWrapped` object is
     lowered later, with the same argument the result is taken from the cache.
-    Furthermore, a `JaceWrapped` object is composable with all Jax transformations.
+    Furthermore, a `JaCeWrapped` object is composable with all Jax transformations.
 
     Args:
         fun:                    The function that is wrapped.
@@ -88,7 +92,7 @@ def __call__(
         """Executes the wrapped function, lowering and compiling as needed in one step."""
 
         # If we are inside a traced context, then we forward the call to the wrapped function.
-        #  This ensures that Jace is composable with Jax.
+        #  This ensures that JaCe is composable with Jax.
         if util.is_tracing_ongoing(*args, **kwargs):
             return self._fun(*args, **kwargs)
 
@@ -101,7 +105,7 @@ def lower(
         self,
         *args: Any,
         **kwargs: Any,
-    ) -> JaceLowered:
+    ) -> JaCeLowered:
         """Lower this function explicitly for the given arguments.
 
         Performs the first two steps of the AOT steps described above, i.e. stage out to Jaxpr
@@ -128,7 +132,7 @@ def lower(
             tsdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
         ptrans.postprocess_jaxpr_sdfg(tsdfg=tsdfg, fun=self.wrapped_fun)
 
-        return JaceLowered(tsdfg)
+        return JaCeLowered(tsdfg)
 
     @property
     def wrapped_fun(self) -> Callable:
@@ -139,7 +143,7 @@ def _make_call_description(
         self,
         *args: Any,
     ) -> tcache.StageTransformationSpec:
-        """This function computes the key for the `JaceWrapped.lower()` call to cache it.
+        """This function computes the key for the `JaCeWrapped.lower()` call to cache it.
 
         The function will compute a full abstract description on its argument. Currently it is
         only able to handle positional argument and does not support static arguments.
@@ -148,13 +152,13 @@ def _make_call_description(
         return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
 
 
-class JaceLowered(tcache.CachingStage["JaceCompiled"]):
+class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
     """Represents the original computation as an SDFG.
 
-    It represents the computation wrapped by a `JaceWrapped` translated and lowered to SDFG.
-    It is followed by the `JaceCompiled` stage.
-    Although, `JaceWrapped` is composable with Jax transformations `JaceLowered` is not.
-    A user should never create such an object, instead `JaceWrapped.lower()` should be used.
+    It represents the computation wrapped by a `JaCeWrapped` translated and lowered to SDFG.
+    It is followed by the `JaCeCompiled` stage.
+    Although, `JaCeWrapped` is composable with Jax transformations `JaCeLowered` is not.
+    A user should never create such an object, instead `JaCeWrapped.lower()` should be used.
 
     Args:
         tsdfg:  The lowered SDFG with metadata. Must be finalized.
@@ -181,11 +185,11 @@ def __init__(
     def compile(
         self,
         compiler_options: CompilerOptions | None = None,
-    ) -> JaceCompiled:
+    ) -> JaCeCompiled:
         """Optimize and compile the lowered SDFG using `compiler_options`.
 
         Returns an object that encapsulates a compiled SDFG object. To influence the various
-        optimizations and compile options of Jace you can use the `compiler_options` argument.
+        optimizations and compile options of JaCe you can use the `compiler_options` argument.
         If nothing is specified `jace.optimization.DEFAULT_OPTIMIZATIONS` will be used.
 
         Note:
@@ -197,7 +201,7 @@ def compile(
         tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
         optimization.jace_optimize(tsdfg=tsdfg, **self._make_compiler_options(compiler_options))
 
-        return JaceCompiled(
+        return JaCeCompiled(
             csdfg=util.compile_jax_sdfg(tsdfg),
             inp_names=tsdfg.inp_names,
             out_names=tsdfg.out_names,
@@ -231,7 +235,7 @@ def _make_call_description(
         """This function computes the key for the `self.compile()` call to cache it.
 
         The key that is computed by this function is based on the concrete values of the passed
-        compiler options. This is different from the key computed by `JaceWrapped` which is an
+        compiler options. This is different from the key computed by `JaCeWrapped` which is an
         abstract description.
         """
         options = self._make_compiler_options(compiler_options)
@@ -245,11 +249,11 @@ def _make_compiler_options(
         return optimization.DEFAULT_OPTIMIZATIONS | (compiler_options or {})
 
 
-class JaceCompiled:
+class JaCeCompiled:
     """Compiled version of the SDFG.
 
-    This is the last stage of the jit chain. A user should never create a `JaceCompiled` instance,
-    instead `JaceLowered.compile()` should be used.
+    This is the last stage of the jit chain. A user should never create a `JaCeCompiled` instance,
+    instead `JaCeLowered.compile()` should be used.
 
     Args:
         csdfg:      The compiled SDFG object.
@@ -294,14 +298,14 @@ def __call__(
         )
 
 
-#: Known compilation stages in Jace.
-Stage = JaceWrapped | JaceLowered | JaceCompiled
+#: Known compilation stages in JaCe.
+Stage = JaCeWrapped | JaCeLowered | JaCeCompiled
 
 
 __all__ = [
     "CompilerOptions",  # export for compatibility with Jax.
-    "JaceCompiled",
-    "JaceLowered",
-    "JaceWrapped",
+    "JaCeCompiled",
+    "JaCeLowered",
+    "JaCeWrapped",
     "Stage",
 ]
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
index b785186..b081321 100644
--- a/src/jace/translator/managing.py
+++ b/src/jace/translator/managing.py
@@ -15,11 +15,12 @@
 
 from __future__ import annotations
 
-from collections.abc import Callable, Mapping, MutableMapping
 from typing import TYPE_CHECKING, Literal, cast, overload
 
 
 if TYPE_CHECKING:
+    from collections.abc import Callable, Mapping, MutableMapping
+
     from jace import translator
 
 #: Global registry of the active primitive translators.
@@ -94,7 +95,7 @@ def register_primitive_translator(
     translator.PrimitiveTranslator
     | Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]
 ):
-    """Adds a primitive translator to Jace's global registry.
+    """Adds a primitive translator to JaCe's global registry.
 
     If a translator for `primitive` is already registered an error will be generated. However,
     by specifying `overwrite` `primitive_translator` will replace the current one.
@@ -124,7 +125,7 @@ def wrapper(
 
 
 def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTranslator]:
-    """Returns a copy of the current state of Jace's global primitive registry.
+    """Returns a copy of the current state of JaCe's global primitive registry.
 
     The function returns a mapping that maps the name of a primitive to the associated translator.
     No change to the global registry will affect the return value and vice versa.
@@ -135,7 +136,7 @@ def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTran
 def set_active_primitive_translators_to(
     new_translators: Mapping[str, translator.PrimitiveTranslator],
 ) -> MutableMapping[str, translator.PrimitiveTranslator]:
-    """Exchange the global translator registry of Jace with `new_translators`.
+    """Exchange the global translator registry of JaCe with `new_translators`.
 
     The function will return the state of the global translator registry just before this call.
     Any changes to `new_translators` after calling this function will have no effect on the
diff --git a/src/jace/translator/mapped_operation_base_translator.py b/src/jace/translator/mapped_operation_base_translator.py
index 7202ef6..e400cfa 100644
--- a/src/jace/translator/mapped_operation_base_translator.py
+++ b/src/jace/translator/mapped_operation_base_translator.py
@@ -10,15 +10,20 @@
 from __future__ import annotations
 
 from abc import abstractmethod
-from collections.abc import MutableSequence, Sequence
+from typing import TYPE_CHECKING
 
 import dace
-from jax import core as jax_core
 from typing_extensions import final, override
 
 from jace import translator, util
 
 
+if TYPE_CHECKING:
+    from collections.abc import MutableSequence, Sequence
+
+    from jax import core as jax_core
+
+
 class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
     """Implements the base for all "mapped base operations".
 
diff --git a/src/jace/translator/pre_post_translation.py b/src/jace/translator/pre_post_translation.py
index bfe5125..5cf8a58 100644
--- a/src/jace/translator/pre_post_translation.py
+++ b/src/jace/translator/pre_post_translation.py
@@ -14,11 +14,12 @@
 
 from __future__ import annotations
 
-from collections.abc import Callable
 from typing import TYPE_CHECKING
 
 
 if TYPE_CHECKING:
+    from collections.abc import Callable
+
     from jace import translator
 
 
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index f748cc0..57b9236 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -9,14 +9,15 @@
 from __future__ import annotations
 
 from abc import abstractmethod
-from collections.abc import MutableSequence, Sequence
 from typing import TYPE_CHECKING, Protocol, runtime_checkable
 
-import dace
-from jax import core as jax_core
-
 
 if TYPE_CHECKING:
+    from collections.abc import MutableSequence, Sequence
+
+    import dace
+    from jax import core as jax_core
+
     from jace import translator
 
 
@@ -94,7 +95,7 @@ class PrimitiveTranslator(PrimitiveTranslatorCallable, Protocol):
     the delegation pattern.
 
     You can use `jace.translator.register_primitive_translator()` to register your translator to
-    Jace.
+    JaCe.
     """
 
     __slots__ = ()
diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index 43d7a00..a6d8bcc 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -9,16 +9,20 @@
 
 from __future__ import annotations
 
-from collections.abc import Sequence
-from typing import Final
+from typing import TYPE_CHECKING, Final
 
-from jax import core as jax_core
 from typing_extensions import override
 
 from jace import translator
 from jace.translator import mapped_operation_base_translator as mapped_base
 
 
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
 class ALUTranslator(mapped_base.MappedOperationTranslatorBase):
     """Translator for all arithmetic and logical operations.
 
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
index e03c0f0..a42c61a 100644
--- a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -9,16 +9,21 @@
 
 from __future__ import annotations
 
-from collections.abc import Sequence
+from typing import TYPE_CHECKING
 
 import dace
-from jax import core as jax_core
 from typing_extensions import override
 
 from jace import translator
 from jace.translator import mapped_operation_base_translator as mapped_base
 
 
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
 class BroadcastInDimTranslator(mapped_base.MappedOperationTranslatorBase):
     """This handles the `broadcast_in_dim` primitives."""
 
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index 1c6343d..7d006e0 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -9,16 +9,21 @@
 
 from __future__ import annotations
 
-from collections.abc import Sequence
+from typing import TYPE_CHECKING
 
 import dace
-from jax import core as jax_core
 from typing_extensions import override
 
 from jace import translator, util
 from jace.translator import mapped_operation_base_translator as mapped_base
 
 
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
 class ConvertElementTypeTranslator(mapped_base.MappedOperationTranslatorBase):
     """Implements the `convert_element_type` primitive.
 
@@ -49,10 +54,10 @@ def write_tasklet_code(
         if in_var_names[0] is None:
             raise NotImplementedError("'convert_element_type' is not supported for literals.")
 
-        in_dtype = util.get_jax_var_dtype(eqn.invars[0])
-        in_dtype_s: str = str(in_dtype)
-        out_dtype = util.get_jax_var_dtype(eqn.outvars[0])
-        out_dtype_s: str = str(out_dtype)
+        in_dtype = util.get_jax_var_dtype(eqn.invars[0]).type
+        in_dtype_s: str = in_dtype.__name__
+        out_dtype = util.get_jax_var_dtype(eqn.outvars[0]).type
+        out_dtype_s: str = out_dtype.__name__
 
         # This is the base of the template that we use for conversion.
         #  You should notice that the Tasklet `__out = __in0` will fail, see commit
@@ -75,8 +80,8 @@ def write_tasklet_code(
         # The general case
         if out_dtype_s == "bool":
             conv_code = f"dace.bool_({conv_code})"
-        elif hasattr(dace.dtypes, str(out_dtype)):
-            conv_code = f"dace.{out_dtype!s}({conv_code})"
+        elif hasattr(dace.dtypes, out_dtype_s):
+            conv_code = f"dace.{out_dtype_s}({conv_code})"
         else:
             raise NotImplementedError(
                 f"Cannot convert '{in_dtype}' to '{out_dtype}' as this type is not known to DaCe."
diff --git a/src/jace/translator/primitive_translators/copy_translator.py b/src/jace/translator/primitive_translators/copy_translator.py
index acab7bd..466016a 100644
--- a/src/jace/translator/primitive_translators/copy_translator.py
+++ b/src/jace/translator/primitive_translators/copy_translator.py
@@ -9,15 +9,20 @@
 
 from __future__ import annotations
 
-from collections.abc import Sequence
+from typing import TYPE_CHECKING
 
-from jax import core as jax_core
 from typing_extensions import override
 
 from jace import translator
 from jace.translator import mapped_operation_base_translator as mapped_base
 
 
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
 class CopyTranslator(mapped_base.MappedOperationTranslatorBase):
     """Copy operations are implemented as a map to ensure that they can be fused with other maps."""
 
@@ -40,7 +45,7 @@ class DevicePutTranslator(mapped_base.MappedOperationTranslatorBase):
     """The `device_put` primitive is used to transfer data between host and device.
 
     The current implementation only supports the copying where the data already is. Currently DaCe
-    only knows about the Host and the GPU. Furthermore, currently Jace works in such a way that
+    only knows about the Host and the GPU. Furthermore, currently JaCe works in such a way that
     everything is either put on the host or the device. Because of this, the `DevicePutTranslator`
     is, currently, just a simple copy operation that should be removed, by the optimization.
 
diff --git a/src/jace/translator/primitive_translators/iota_translator.py b/src/jace/translator/primitive_translators/iota_translator.py
index b64c138..ef2ced6 100644
--- a/src/jace/translator/primitive_translators/iota_translator.py
+++ b/src/jace/translator/primitive_translators/iota_translator.py
@@ -9,16 +9,21 @@
 
 from __future__ import annotations
 
-from collections.abc import Sequence
+from typing import TYPE_CHECKING
 
-import dace
-from jax import core as jax_core
 from typing_extensions import override
 
 from jace import translator
 from jace.translator import mapped_operation_base_translator as mapped_base
 
 
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    import dace
+    from jax import core as jax_core
+
+
 class IotaTranslator(mapped_base.MappedOperationTranslatorBase):
     """This handles the `iota` primitives.
 
diff --git a/src/jace/translator/primitive_translators/reshape_translator.py b/src/jace/translator/primitive_translators/reshape_translator.py
index e5e4894..a1a0381 100644
--- a/src/jace/translator/primitive_translators/reshape_translator.py
+++ b/src/jace/translator/primitive_translators/reshape_translator.py
@@ -7,15 +7,20 @@
 
 from __future__ import annotations
 
-from collections.abc import MutableSequence, Sequence
+from typing import TYPE_CHECKING
 
 import dace
-from jax import core as jax_core
 from typing_extensions import override
 
 from jace import translator, util
 
 
+if TYPE_CHECKING:
+    from collections.abc import MutableSequence, Sequence
+
+    from jax import core as jax_core
+
+
 class ReshapeTranslator(translator.PrimitiveTranslator):
     """Reshapes an array.
 
diff --git a/src/jace/translator/primitive_translators/select_n_translator.py b/src/jace/translator/primitive_translators/select_n_translator.py
index b2f0e58..00447f4 100644
--- a/src/jace/translator/primitive_translators/select_n_translator.py
+++ b/src/jace/translator/primitive_translators/select_n_translator.py
@@ -9,16 +9,21 @@
 
 from __future__ import annotations
 
-from collections.abc import Sequence
+from typing import TYPE_CHECKING
 
 import dace
-from jax import core as jax_core
 from typing_extensions import override
 
 from jace import translator
 from jace.translator import mapped_operation_base_translator as mapped_base
 
 
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
 class SelectNTranslator(mapped_base.MappedOperationTranslatorBase):
     """Implements the `select_n` primitive, which is a generalization of `np.where`
 
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index 1e32f41..14a5582 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -9,16 +9,21 @@
 
 from __future__ import annotations
 
-from collections.abc import MutableSequence, Sequence
+from typing import TYPE_CHECKING
 
 import dace
-from jax import core as jax_core
 from typing_extensions import override
 
 from jace import translator, util
 from jace.translator import mapped_operation_base_translator as mapped_base
 
 
+if TYPE_CHECKING:
+    from collections.abc import MutableSequence, Sequence
+
+    from jax import core as jax_core
+
+
 class SlicingTranslator(mapped_base.MappedOperationTranslatorBase):
     """Implements the classical slicing operation.
 
diff --git a/src/jace/translator/primitive_translators/squeeze_translator.py b/src/jace/translator/primitive_translators/squeeze_translator.py
index fc63607..2b1e6a1 100644
--- a/src/jace/translator/primitive_translators/squeeze_translator.py
+++ b/src/jace/translator/primitive_translators/squeeze_translator.py
@@ -8,16 +8,21 @@
 from __future__ import annotations
 
 import itertools
-from collections.abc import Sequence
+from typing import TYPE_CHECKING
 
 import dace
-from jax import core as jax_core
 from typing_extensions import override
 
 from jace import translator, util
 from jace.translator import mapped_operation_base_translator as mapped_base
 
 
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
 class SqueezeTranslator(mapped_base.MappedOperationTranslatorBase):
     """Allows to remove dimensions with size one.
 
diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index 29f05e5..1402a9a 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -12,7 +12,6 @@
 import os
 import pathlib
 import time
-from collections.abc import Mapping, Sequence
 from typing import TYPE_CHECKING, Any
 
 import dace
@@ -21,6 +20,8 @@
 
 
 if TYPE_CHECKING:
+    from collections.abc import Mapping, Sequence
+
     from jace import translator
     from jace.util import dace_helper
 
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 8cbfb45..d41ffaa 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -15,8 +15,7 @@
 
 import dataclasses
 import itertools
-from collections.abc import Mapping
-from typing import Any
+from typing import TYPE_CHECKING, Any
 
 import dace
 import jax.core as jax_core
@@ -25,6 +24,10 @@
 import jace.util as util
 
 
+if TYPE_CHECKING:
+    from collections.abc import Mapping
+
+
 @dataclasses.dataclass(repr=True, frozen=True, eq=False)
 class JaCeVar:
     """Replacement for the `jax.Var` class.
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 1f51d9e..ae2f41b 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -21,7 +21,7 @@
 from jace import stages
 
 
-def is_jaceified(obj: Any) -> TypeGuard[stages.JaceWrapped]:
+def is_jaceified(obj: Any) -> TypeGuard[stages.JaCeWrapped]:
     """Tests if `obj` is decorated by JaCe.
 
     Similar to `is_jaxified`, but for JaCe object.
@@ -29,7 +29,7 @@ def is_jaceified(obj: Any) -> TypeGuard[stages.JaceWrapped]:
 
     if util.is_jaxified(obj):
         return False
-    return isinstance(obj, stages.JaceWrapped)
+    return isinstance(obj, stages.JaCeWrapped)
 
 
 def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVar]:
@@ -49,7 +49,7 @@ def is_jaxified(
 
     A "jaxified" object is an object that was processed by Jax.
     While a return value of `True` guarantees a jaxified object, `False` does not proof the
-    contrary. See also `jace.util.is_jaceified()` to tests if something is a Jace object.
+    contrary. See also `jace.util.is_jaceified()` to tests if something is a JaCe object.
     """
     jaxifyed_types = (
         jax_core.Primitive,
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index bc4f0bf..73ff4dd 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -7,8 +7,8 @@
 
 """This module contains the functionality related to the compilation cache of the stages.
 
-The cache currently caches the lowering, i.e. the result of `JaceWrapped.lower()` and the
-compilation, i.e. `JaceLowered.compile()`. The caches are on a per stage basis and not on a
+The cache currently caches the lowering, i.e. the result of `JaCeWrapped.lower()` and the
+compilation, i.e. `JaCeLowered.compile()`. The caches are on a per stage basis and not on a
 per instant basis. To make a stage cacheable, it must be derived from `CachingStage` and
 its transition function must be decoration with `@cached_transition`.
 """
diff --git a/tests/general_tests/__init__.py b/tests/general_tests/__init__.py
index a2c2edf..5be01f1 100644
--- a/tests/general_tests/__init__.py
+++ b/tests/general_tests/__init__.py
@@ -5,4 +5,4 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""General Jace tests."""
+"""General JaCe tests."""
diff --git a/tests/general_tests/test_caching.py b/tests/general_tests/test_caching.py
index fb050be..3f5dd0f 100644
--- a/tests/general_tests/test_caching.py
+++ b/tests/general_tests/test_caching.py
@@ -35,7 +35,7 @@ def _clear_translation_cache():
     tcache.clear_translation_cache()
 
 
-def test_caching_same_sizes():
+def test_caching_same_sizes() -> None:
     """The behaviour of the cache if same sizes are used."""
 
     # Counter for how many time it was lowered.
@@ -60,8 +60,8 @@ def wrapped(A, B):
     BB = B + 0.638956
 
     # Now let's lower it once directly and call it.
-    lowered: stages.JaceLowered = wrapped.lower(A, B)
-    compiled: stages.JaceCompiled = lowered.compile()
+    lowered: stages.JaCeLowered = wrapped.lower(A, B)
+    compiled: stages.JaCeCompiled = lowered.compile()
     assert lowering_cnt[0] == 1
     assert np.allclose(testee(A, B), compiled(A, B))
 
@@ -111,7 +111,7 @@ def wrapped(A, B):
     assert compiled1 is not compiled2
 
 
-def test_caching_different_structure():
+def test_caching_different_structure() -> None:
     """Now tests if we can handle multiple arguments with different structures.
 
     Todo:
@@ -134,10 +134,10 @@ def wrapped(A, B):
     # These are the arrays.
     args: dict[int, np.ndarray] = {id(x): x for x in [A, B, C, D]}
     # These are the known lowerings.
-    lowerings: dict[tuple[int, int], stages.JaceLowered] = {}
+    lowerings: dict[tuple[int, int], stages.JaCeLowered] = {}
     lowering_ids: set[int] = set()
     # These are the known compilations.
-    compilations: dict[tuple[int, int], stages.JaceCompiled] = {}
+    compilations: dict[tuple[int, int], stages.JaCeCompiled] = {}
     compiled_ids: set[int] = set()
 
     # Generating the lowerings
@@ -164,7 +164,7 @@ def wrapped(A, B):
         assert compiled1 is ccompiled
 
 
-def test_caching_compilation():
+def test_caching_compilation() -> None:
     """Tests the compilation cache, this is just very simple, since it uses the same code paths as lowering."""
 
     @jace.jit
@@ -255,6 +255,6 @@ def wrapped(A: np.ndarray) -> np.ndarray:
         F_lower = wrapped.lower(F)
         F_res = wrapped(F)
     assert F_lower is None  # Remove later.
-    assert C_res is not F_res  # Remove later
+    assert C_res is not F_res  # type: ignore[unreachable]
     assert np.allclose(F_res, C_res)
     assert F_lower is not C_lower
diff --git a/tests/general_tests/test_jax_api.py b/tests/general_tests/test_jax_api.py
index 221733a..f6c89df 100644
--- a/tests/general_tests/test_jax_api.py
+++ b/tests/general_tests/test_jax_api.py
@@ -45,7 +45,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 
 
 def test_composition_itself():
-    """Tests if Jace is composable with itself."""
+    """Tests if JaCe is composable with itself."""
 
     # Pure Python functions
     def f_ref(x):
@@ -83,7 +83,7 @@ def ddf(x):
 
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_composition_with_jax():
-    """Tests if Jace can interact with Jax and vice versa."""
+    """Tests if JaCe can interact with Jax and vice versa."""
 
     def base_fun(A, B, C):
         return A + B * jnp.sin(C) - A * B
@@ -102,7 +102,7 @@ def jax_fun(A, B, C):
 
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_composition_with_jax_2():
-    """Second test if Jace can interact with Jax and vice versa."""
+    """Second test if JaCe can interact with Jax and vice versa."""
 
     @jax.jit
     def f1_jax(A, B):
@@ -187,7 +187,7 @@ def df(x):
     assert df(x2) == df_x2, f"Failed upper branch, expected '{df_x2}', got '{res_2}'."
 
 
-@pytest.mark.skip(reason="Running Jace with disabled 'x64' support does not work.")
+@pytest.mark.skip(reason="Running JaCe with disabled 'x64' support does not work.")
 def test_disabled_x64():
     """Tests the behaviour of the tool chain if we explicitly disable x64 support in Jax.
 
@@ -203,7 +203,7 @@ def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
 
     # Run them with disabled x64 support
     with disable_x64():
-        # Jace
+        # JaCe
         jace_testee = jace.jit(testee)
         jace_lowered = jace_testee.lower(A, B)
         jace_comp = jace_lowered.compile()
diff --git a/tests/general_tests/test_misc.py b/tests/general_tests/test_misc.py
index ec2a5b2..8870674 100644
--- a/tests/general_tests/test_misc.py
+++ b/tests/general_tests/test_misc.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements general tests for Jace."""
+"""Implements general tests for JaCe."""
 
 from __future__ import annotations
 
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_alu.py b/tests/translator_tests/primitive_translators/test_sub_translators_alu.py
index 6ea74b7..24db139 100644
--- a/tests/translator_tests/primitive_translators/test_sub_translators_alu.py
+++ b/tests/translator_tests/primitive_translators/test_sub_translators_alu.py
@@ -9,8 +9,7 @@
 
 from __future__ import annotations
 
-from collections.abc import Callable, Sequence
-from typing import Any, cast
+from typing import TYPE_CHECKING, Any, cast
 
 import jax
 import numpy as np
@@ -19,6 +18,10 @@
 import jace
 
 
+if TYPE_CHECKING:
+    from collections.abc import Callable, Sequence
+
+
 def _perform_test(testee: Callable, *args: Any) -> None:
     """General function that just performs the test."""
     wrapped = jace.jit(testee)
@@ -38,7 +41,7 @@ def mkarr(
 def test_alu_unary_scalar():
     """Test unary ALU translator in the scalar case."""
 
-    def testee(A: float) -> float:
+    def testee(A: float) -> float | jax.Array:
         return jnp.cos(A)
 
     _perform_test(testee, 1.0)
@@ -47,7 +50,7 @@ def testee(A: float) -> float:
 def test_alu_unary_array():
     """Test unary ALU translator with array argument."""
 
-    def testee(A: np.ndarray) -> np.ndarray:
+    def testee(A: np.ndarray) -> jax.Array:
         return jnp.sin(A)
 
     A = mkarr((100, 10, 3))
@@ -58,7 +61,7 @@ def testee(A: np.ndarray) -> np.ndarray:
 def test_alu_unary_scalar_literal():
     """Test unary ALU translator with literal argument"""
 
-    def testee(A: float) -> float:
+    def testee(A: float) -> float | jax.Array:
         return jnp.sin(1.98) + A
 
     _perform_test(testee, 10.0)
@@ -149,7 +152,7 @@ def test_alu_binary_array_constants():
     """Test binary of array with constant."""
 
     def testee(A: np.ndarray) -> np.ndarray:
-        return A + jax.numpy.array([[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]])
+        return A + jnp.array([[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]])
 
     A = mkarr((3, 3))
     _perform_test(testee, A)
@@ -185,23 +188,7 @@ def test_alu_binary_broadcast_3():
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
-    A = mkarr(
-        (
-            5,
-            1,
-            3,
-            4,
-            1,
-        )
-    )
-    B = mkarr(
-        (
-            5,
-            1,
-            3,
-            1,
-            2,
-        )
-    )
+    A = mkarr((5, 1, 3, 4, 1))
+    B = mkarr((5, 1, 3, 1, 2))
     _perform_test(testee, A, B)
     _perform_test(testee, B, A)
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_broadcast_in_dim.py b/tests/translator_tests/primitive_translators/test_sub_translators_broadcast_in_dim.py
index 28ebae7..7e6add5 100644
--- a/tests/translator_tests/primitive_translators/test_sub_translators_broadcast_in_dim.py
+++ b/tests/translator_tests/primitive_translators/test_sub_translators_broadcast_in_dim.py
@@ -35,7 +35,7 @@ def _enable_x64_mode_in_jax():
 def test_bid_scalar():
     """Broadcast a scalar to a matrix."""
 
-    def testee(A: float) -> np.ndarray:
+    def testee(A: float) -> jax.Array:
         return jnp.broadcast_to(A, (2, 2))
 
     for a in [1, 1.0, 3.1415]:
@@ -50,7 +50,7 @@ def testee(A: float) -> np.ndarray:
 def test_bid_literal():
     """Broadcast a literal to a matrix."""
 
-    def testee(a: float) -> np.ndarray:
+    def testee(a: float) -> np.ndarray | jax.Array:
         return jnp.broadcast_to(1.0, (10, 10)) + a
 
     for a in [1, 1.0, 3.1415]:
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_convert_element_type.py b/tests/translator_tests/primitive_translators/test_sub_translators_convert_element_type.py
index cb2e690..f1d9ec6 100644
--- a/tests/translator_tests/primitive_translators/test_sub_translators_convert_element_type.py
+++ b/tests/translator_tests/primitive_translators/test_sub_translators_convert_element_type.py
@@ -9,9 +9,9 @@
 
 from __future__ import annotations
 
-from collections.abc import Sequence
-from typing import Final
+from typing import TYPE_CHECKING, Final
 
+import jax
 import numpy as np
 import pytest
 from jax import numpy as jnp
@@ -19,6 +19,10 @@
 import jace
 
 
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+
 # fmt: off
 _DACE_TYPES: Final[list[type]] = [
         np.int_, np.int8, np.int16, np.int32, np.int64,
@@ -44,7 +48,7 @@ def _test_convert_element_type_impl(
             lowering_cnt[1] += 1
 
             @jace.jit
-            def converter(A: np.ndarray) -> np.ndarray:
+            def converter(A: np.ndarray) -> jax.Array:
                 lowering_cnt[0] += 1
                 return jnp.array(A, copy=False, dtype=output_type)  # noqa: B023  # Loop variable.
 
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_iota.py b/tests/translator_tests/primitive_translators/test_sub_translators_iota.py
index 696a536..63f790b 100644
--- a/tests/translator_tests/primitive_translators/test_sub_translators_iota.py
+++ b/tests/translator_tests/primitive_translators/test_sub_translators_iota.py
@@ -17,7 +17,7 @@
 def test_iota_arange():
     """Tests `jnp.arange` functionality."""
 
-    def testee(A: int) -> np.ndarray:
+    def testee(A: int) -> jax.Array:
         return jnp.arange(18, dtype=int) + A
 
     ref = testee(0)
@@ -31,7 +31,7 @@ def test_iota_broadcast():
 
     for d in range(len(shape)):
 
-        def testee(A: np.int32) -> np.ndarray:
+        def testee(A: np.int32) -> jax.Array:
             return jax.lax.broadcasted_iota("int32", shape, d) + A  # noqa: B023  # Variable capturing.
 
         ref = testee(np.int32(0))
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_reshape.py b/tests/translator_tests/primitive_translators/test_sub_translators_reshape.py
index 378cf61..80b1e8d 100644
--- a/tests/translator_tests/primitive_translators/test_sub_translators_reshape.py
+++ b/tests/translator_tests/primitive_translators/test_sub_translators_reshape.py
@@ -9,8 +9,9 @@
 
 from __future__ import annotations
 
-from collections.abc import Sequence
+from typing import TYPE_CHECKING
 
+import jax
 import numpy as np
 import pytest
 from jax import numpy as jnp
@@ -18,6 +19,10 @@
 import jace
 
 
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+
 def _test_impl_reshaping(
     src_shape: Sequence[int],
     dst_shape: Sequence[int],
@@ -27,11 +32,9 @@ def _test_impl_reshaping(
     A = np.random.random(src_shape)  # noqa: NPY002
     A = np.array(A, order=order)  # type: ignore[call-overload]  # MyPy wants a literal as order.
 
-    def testee(A: np.ndarray) -> np.ndarray:
+    def testee(A: np.ndarray) -> jax.Array:
         return jnp.reshape(A, dst_shape)
 
-    print(f"SHAPE: {A.shape} -> {dst_shape}")
-
     ref = testee(A)
     res = jace.jit(testee)(A)
 
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_select_n.py b/tests/translator_tests/primitive_translators/test_sub_translators_select_n.py
index dd2002c..576e53f 100644
--- a/tests/translator_tests/primitive_translators/test_sub_translators_select_n.py
+++ b/tests/translator_tests/primitive_translators/test_sub_translators_select_n.py
@@ -25,7 +25,7 @@ def _disable_jit():
 
     The reason we do this is because we can currently not handle this nested jits.
     It is important that it also disabled explicit usage of `jax.jit`.
-    However, since Jace does not honor this flag we it does not affect us.
+    However, since JaCe does not honor this flag we it does not affect us.
 
     Todo:
         Remove as soon as we can handle nested `jit`.
@@ -34,6 +34,13 @@ def _disable_jit():
         yield
 
 
+@pytest.fixture(autouse=True)
+def _enable_x64_mode_in_jax():
+    """Ensures that x64 mode in Jax ins enabled."""
+    with jax.experimental.enable_x64():
+        yield
+
+
 @pytest.fixture()
 def Pred() -> np.ndarray:
     return np.random.random((10, 10)) > 0.5  # noqa: NPY002
@@ -46,7 +53,7 @@ def tbranch() -> np.ndarray:
 
 @pytest.fixture()
 def fbranch() -> np.ndarray:
-    return np.ones((10, 10))
+    return np.zeros((10, 10))
 
 
 def _perform_test(P: Any, T: Any, F: Any):
@@ -82,7 +89,7 @@ def test_select_n_many_inputs():
     cases = [np.full(shape, i) for i in range(nbcases)]
     pred = np.arange(cases[0].size).reshape(shape) % 5
 
-    def testee(pred: np.ndarray, *cases: np.ndarray) -> np.ndarray:
+    def testee(pred: np.ndarray, *cases: np.ndarray) -> jax.Array:
         return jax.lax.select_n(pred, *cases)
 
     ref = testee(pred, *cases)
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_slicing.py b/tests/translator_tests/primitive_translators/test_sub_translators_slicing.py
index 7faa930..75c88a9 100644
--- a/tests/translator_tests/primitive_translators/test_sub_translators_slicing.py
+++ b/tests/translator_tests/primitive_translators/test_sub_translators_slicing.py
@@ -165,7 +165,7 @@ def testee(A: np.ndarray) -> np.ndarray:
 def test_dynamic_slice_full_dynamic(A_4x4x4x4, full_dynamic_start_idx):
     """Dynamic slicing where all start index are input parameters."""
 
-    def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> np.ndarray:
+    def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> jax.Array:
         return jax.lax.dynamic_slice(A, (s1, s2, s3, s4), (2, 2, 2, 2))
 
     res = jace.jit(testee)(A_4x4x4x4, *full_dynamic_start_idx)
@@ -177,7 +177,7 @@ def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> np.ndarray:
 def test_dynamic_slice_partially_dynamic(A_4x4x4x4):
     """Dynamic slicing where some start index are input parameters and others are literals."""
 
-    def testee(A: np.ndarray, s1: int, s2: int) -> np.ndarray:
+    def testee(A: np.ndarray, s1: int, s2: int) -> jax.Array:
         return jax.lax.dynamic_slice(A, (s1, 1, s2, 2), (2, 2, 2, 2))
 
     res = jace.jit(testee)(A_4x4x4x4, 1, 2)
@@ -189,7 +189,7 @@ def testee(A: np.ndarray, s1: int, s2: int) -> np.ndarray:
 def test_dynamic_slice_full_literal(A_4x4x4x4):
     """Dynamic slicing where all start indexes are literals."""
 
-    def testee(A: np.ndarray) -> np.ndarray:
+    def testee(A: np.ndarray) -> jax.Array:
         return jax.lax.dynamic_slice(A, (0, 1, 0, 2), (2, 2, 2, 2))
 
     res = jace.jit(testee)(A_4x4x4x4)
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_squeeze_expand_dims.py b/tests/translator_tests/primitive_translators/test_sub_translators_squeeze_expand_dims.py
index 3137c9f..f76fd3d 100644
--- a/tests/translator_tests/primitive_translators/test_sub_translators_squeeze_expand_dims.py
+++ b/tests/translator_tests/primitive_translators/test_sub_translators_squeeze_expand_dims.py
@@ -13,7 +13,7 @@
 
 from __future__ import annotations
 
-from collections.abc import Sequence
+from typing import TYPE_CHECKING
 
 import jax
 import numpy as np
@@ -23,6 +23,10 @@
 import jace
 
 
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+
 def _roundtrip_implementation(
     shape: Sequence[int],
     axis: int | Sequence[int],
@@ -40,8 +44,8 @@ def _roundtrip_implementation(
 
     for ops in [jnp.expand_dims, jnp.squeeze]:
         with jax.experimental.enable_x64():
-            ref = ops(A, axis)
-            res = jace.jit(lambda A: ops(A, axis))(A)  # noqa: B023  # No capturing
+            ref = ops(A, axis)  # type: ignore[operator]  # Function of unknown type.
+            res = jace.jit(lambda A: ops(A, axis))(A)  # type: ignore[operator]  # noqa: B023
 
         assert ref.shape == res.shape, f"A.shape = {shape}; Expected: {ref.shape}; Got: {res.shape}"
         assert ref.dtype == res.dtype
diff --git a/tests/translator_tests/test_jaxpr_translator_driver.py b/tests/translator_tests/test_jaxpr_translator_driver.py
index 3a16cee..efae90a 100644
--- a/tests/translator_tests/test_jaxpr_translator_driver.py
+++ b/tests/translator_tests/test_jaxpr_translator_driver.py
@@ -21,7 +21,7 @@
 from jace.util import JaCeVar
 
 
-# These are some Jace variables that we use inside the tests
+# These are some JaCe variables that we use inside the tests
 #  Unnamed arrays
 array1 = JaCeVar((10, 12), dace.float64)
 array2 = JaCeVar((10, 13), dace.float32)

From a5826e925ca2130e168a9e2d99c515a472cd53c1 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 30 May 2024 08:42:43 +0200
Subject: [PATCH 269/458] Fixed a bug in the cache.

The cleaning was not correct.
The function essentially created some deatached caches.
---
 src/jace/util/translation_cache.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index bc4f0bf..42f7b6a 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -112,7 +112,8 @@ def transition_wrapper(
 
 def clear_translation_cache() -> None:
     """Clear all caches associated to translation."""
-    _TRANSLATION_CACHES.clear()
+    for stage_caches in _TRANSLATION_CACHES.values():
+        stage_caches.clear()
 
 
 def get_cache(
@@ -289,5 +290,8 @@ def popitem(
             self._memory.move_to_end(key, last=False)
             self._memory.popitem(last=False)
 
+    def clear(self) -> None:
+        self._memory.clear()
+
     def __repr__(self) -> str:
         return f"StageCache({len(self._memory)} / {self._size} || {', '.join( '[' + repr(k) + ']' for k in self._memory)})"

From 6f4c45bdb99cafe1e2772db52e0caf6afbe92b7f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 30 May 2024 08:42:43 +0200
Subject: [PATCH 270/458] Fixed a bug in the cache.

The cleaning was not correct.
The function essentially created some deatached caches.
---
 src/jace/util/translation_cache.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 73ff4dd..c0f6fce 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -112,7 +112,8 @@ def transition_wrapper(
 
 def clear_translation_cache() -> None:
     """Clear all caches associated to translation."""
-    _TRANSLATION_CACHES.clear()
+    for stage_caches in _TRANSLATION_CACHES.values():
+        stage_caches.clear()
 
 
 def get_cache(
@@ -289,5 +290,8 @@ def popitem(
             self._memory.move_to_end(key, last=False)
             self._memory.popitem(last=False)
 
+    def clear(self) -> None:
+        self._memory.clear()
+
     def __repr__(self) -> str:
         return f"StageCache({len(self._memory)} / {self._size} || {', '.join( '[' + repr(k) + ']' for k in self._memory)})"

From 4735092db37767b48ecf0fbcecc512c339eb91c1 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 30 May 2024 10:01:22 +0200
Subject: [PATCH 271/458] Reorganized some stuff.

---
 .../__init__.py                               |   5 +-
 .../primitive_translators/__init__.py         |   0
 .../test_primitive_alu.py}                    |   0
 .../test_primitive_broadcast_in_dim.py}       |   0
 .../test_primitive_convert_element_type.py    | 132 ++++++++++++++++++
 .../test_primitive_iota.py}                   |   0
 .../test_primitive_reshape.py}                |   0
 .../test_primitive_select_n.py}               |   0
 .../test_primitive_slicing.py}                |   0
 .../test_primitive_squeeze_expand_dims.py}    |   0
 .../test_empty_jaxpr.py                       |   5 +-
 .../test_jaxpr_translator_driver.py           |  16 ++-
 .../test_primitive_translator_managing.py}    |   2 +-
 ...st_sub_translators_convert_element_type.py | 106 --------------
 .../{general_tests => unit_tests}/__init__.py |   2 +-
 .../test_caching.py                           |   0
 .../test_decorator.py                         |   0
 .../test_jax_api.py                           |   0
 .../test_misc.py                              |   0
 .../test_package.py                           |   0
 20 files changed, 157 insertions(+), 111 deletions(-)
 rename tests/{translator_tests => integration_tests}/__init__.py (65%)
 rename tests/{translator_tests => integration_tests}/primitive_translators/__init__.py (100%)
 rename tests/{translator_tests/primitive_translators/test_sub_translators_alu.py => integration_tests/primitive_translators/test_primitive_alu.py} (100%)
 rename tests/{translator_tests/primitive_translators/test_sub_translators_broadcast_in_dim.py => integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py} (100%)
 create mode 100644 tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
 rename tests/{translator_tests/primitive_translators/test_sub_translators_iota.py => integration_tests/primitive_translators/test_primitive_iota.py} (100%)
 rename tests/{translator_tests/primitive_translators/test_sub_translators_reshape.py => integration_tests/primitive_translators/test_primitive_reshape.py} (100%)
 rename tests/{translator_tests/primitive_translators/test_sub_translators_select_n.py => integration_tests/primitive_translators/test_primitive_select_n.py} (100%)
 rename tests/{translator_tests/primitive_translators/test_sub_translators_slicing.py => integration_tests/primitive_translators/test_primitive_slicing.py} (100%)
 rename tests/{translator_tests/primitive_translators/test_sub_translators_squeeze_expand_dims.py => integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py} (100%)
 rename tests/{translator_tests => integration_tests}/test_empty_jaxpr.py (90%)
 rename tests/{translator_tests => integration_tests}/test_jaxpr_translator_driver.py (97%)
 rename tests/{translator_tests/test_subtranslator_helper.py => integration_tests/test_primitive_translator_managing.py} (99%)
 delete mode 100644 tests/translator_tests/primitive_translators/test_sub_translators_convert_element_type.py
 rename tests/{general_tests => unit_tests}/__init__.py (87%)
 rename tests/{general_tests => unit_tests}/test_caching.py (100%)
 rename tests/{general_tests => unit_tests}/test_decorator.py (100%)
 rename tests/{general_tests => unit_tests}/test_jax_api.py (100%)
 rename tests/{general_tests => unit_tests}/test_misc.py (100%)
 rename tests/{general_tests => unit_tests}/test_package.py (100%)

diff --git a/tests/translator_tests/__init__.py b/tests/integration_tests/__init__.py
similarity index 65%
rename from tests/translator_tests/__init__.py
rename to tests/integration_tests/__init__.py
index a04e6d9..edaf6ea 100644
--- a/tests/translator_tests/__init__.py
+++ b/tests/integration_tests/__init__.py
@@ -5,4 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Tests related to the translators."""
+"""JaCe's integration tests.
+
+Currently they are mostly related to the primitive translators.
+"""
diff --git a/tests/translator_tests/primitive_translators/__init__.py b/tests/integration_tests/primitive_translators/__init__.py
similarity index 100%
rename from tests/translator_tests/primitive_translators/__init__.py
rename to tests/integration_tests/primitive_translators/__init__.py
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_alu.py b/tests/integration_tests/primitive_translators/test_primitive_alu.py
similarity index 100%
rename from tests/translator_tests/primitive_translators/test_sub_translators_alu.py
rename to tests/integration_tests/primitive_translators/test_primitive_alu.py
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_broadcast_in_dim.py b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
similarity index 100%
rename from tests/translator_tests/primitive_translators/test_sub_translators_broadcast_in_dim.py
rename to tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
diff --git a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
new file mode 100644
index 0000000..482842f
--- /dev/null
+++ b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
@@ -0,0 +1,132 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Tests the element type conversion functionality."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING, Final
+
+import jax
+import numpy as np
+import pytest
+from jax import numpy as jnp
+
+import jace
+from jace.util import translation_cache as tcache
+
+
+if TYPE_CHECKING:
+    pass
+
+
+# fmt: off
+_DACE_REAL_TYPES: Final[list[type]] = [
+        np.int_, np.int8, np.int16, np.int32, np.int64,
+        np.uint, np.uint8, np.uint16, np.uint32, np.uint64,
+        np.float64, np.float32, np.float64,
+]
+_DACE_COMPLEX_TYPES: Final[list[type]] = [
+        np.complex128, np.complex64, np.complex128,
+]
+# fmt: on
+
+
+@pytest.fixture(autouse=True)
+def _clear_translation_cache():
+    """Decorator that clears the translation cache.
+
+    Ensures that a function finds an empty cache and clears up afterwards.
+
+    Todo:
+        Ask Enrique how I can make that fixture apply everywhere not just in the file but the whole test suite.
+    """
+    tcache.clear_translation_cache()
+    yield
+    tcache.clear_translation_cache()
+
+
+@pytest.fixture(params=_DACE_REAL_TYPES)
+def src_type(request) -> type:
+    """All valid source types, with the exception of bool."""
+    return request.param
+
+
+@pytest.fixture(params=_DACE_REAL_TYPES + _DACE_COMPLEX_TYPES)
+def dst_type(request) -> type:
+    """All valid destination types, with the exception of bool.
+
+    Includes also complex types, because going from real to complex is useful, but the other
+    way is not.
+    """
+    return request.param
+
+
+def _convert_element_type_impl(
+    input_type: type,
+    output_type: type,
+) -> bool:
+    """Implementation of the tests of the convert element types primitive."""
+    lowering_cnt = [0]
+    A: np.ndarray = np.array(np.random.random((10, 10)), dtype=input_type)  # noqa: NPY002
+    assert A.dtype == input_type
+    ref: np.ndarray = np.array(A, copy=True, dtype=output_type)
+    assert ref.dtype == output_type
+
+    @jace.jit
+    def converter(A: np.ndarray) -> jax.Array:
+        lowering_cnt[0] += 1
+        return jnp.array(A, copy=False, dtype=output_type)  # Loop variable.
+
+    res = converter(A)
+    assert lowering_cnt[0] == 1
+    assert (
+        res.dtype == output_type
+    ), f"Expected '{output_type}', but got '{res.dtype}', input was '{input_type}'."
+    assert np.allclose(ref, res)
+    return True
+
+
+@pytest.mark.skip(reason="This test is too long, only do it on certain conditions.")
+def test_convert_element_type_main(src_type, dst_type):
+    """Tests all conversions with the exception of conversions from bool and complex."""
+    _convert_element_type_impl(src_type, dst_type)
+
+
+@pytest.mark.skip(reason="This test is too long, only do it on certain conditions.")
+def test_convert_element_type_from_bool(src_type):
+    _convert_element_type_impl(np.bool_, src_type)
+
+
+@pytest.mark.skip(reason="This test is too long, only do it on certain conditions.")
+def test_convert_element_type_to_bool(dst_type):
+    _convert_element_type_impl(dst_type, np.bool_)
+
+
+@pytest.mark.skip(reason="The warning was disabled, so the test is at the moment useless.")
+def test_convert_element_type_useless_cast():
+    """Shows that under some conditions there is really a casting from one type to the same.
+
+    In certain cases, also in some slicing tests, this useless cast is inserted by Jax.
+    This test was originally here to show this. However, that thing got so annoying that it was
+    removed. The test is kept here to serve as some kind of a reference.
+    """
+
+    def testee(a: float) -> np.ndarray:
+        # For it to work we have to use `numpy` instead of the Jax substitute.
+        return np.broadcast_to(1.0, (10, 10)) + a
+
+    with pytest.warns(
+        expected_warning=UserWarning,
+        match=r"convert_element_type\(.*\): is useless, input and output have same type\.",
+    ):
+        res = jace.jit(testee)(1.0)
+
+    ref = testee(1.0)
+    assert res.shape == ref.shape
+    assert res.dtype == ref.dtype
+    assert np.all(res == ref)
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_iota.py b/tests/integration_tests/primitive_translators/test_primitive_iota.py
similarity index 100%
rename from tests/translator_tests/primitive_translators/test_sub_translators_iota.py
rename to tests/integration_tests/primitive_translators/test_primitive_iota.py
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_reshape.py b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
similarity index 100%
rename from tests/translator_tests/primitive_translators/test_sub_translators_reshape.py
rename to tests/integration_tests/primitive_translators/test_primitive_reshape.py
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_select_n.py b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
similarity index 100%
rename from tests/translator_tests/primitive_translators/test_sub_translators_select_n.py
rename to tests/integration_tests/primitive_translators/test_primitive_select_n.py
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_slicing.py b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
similarity index 100%
rename from tests/translator_tests/primitive_translators/test_sub_translators_slicing.py
rename to tests/integration_tests/primitive_translators/test_primitive_slicing.py
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_squeeze_expand_dims.py b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
similarity index 100%
rename from tests/translator_tests/primitive_translators/test_sub_translators_squeeze_expand_dims.py
rename to tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
diff --git a/tests/translator_tests/test_empty_jaxpr.py b/tests/integration_tests/test_empty_jaxpr.py
similarity index 90%
rename from tests/translator_tests/test_empty_jaxpr.py
rename to tests/integration_tests/test_empty_jaxpr.py
index 36e8247..18308f5 100644
--- a/tests/translator_tests/test_empty_jaxpr.py
+++ b/tests/integration_tests/test_empty_jaxpr.py
@@ -6,7 +6,10 @@
 # SPDX-License-Identifier: BSD-3-Clause
 
 """Implements tests for empty jaxprs.
-."""
+
+Todo:
+    Add more tests that are related to `cond`, i.e. not all inputs are needed.
+"""
 
 from __future__ import annotations
 
diff --git a/tests/translator_tests/test_jaxpr_translator_driver.py b/tests/integration_tests/test_jaxpr_translator_driver.py
similarity index 97%
rename from tests/translator_tests/test_jaxpr_translator_driver.py
rename to tests/integration_tests/test_jaxpr_translator_driver.py
index efae90a..5f3659f 100644
--- a/tests/translator_tests/test_jaxpr_translator_driver.py
+++ b/tests/integration_tests/test_jaxpr_translator_driver.py
@@ -499,7 +499,7 @@ def test_driver_constants(
 def test_driver_scalar_return_value(
     translation_driver: translator.JaxprTranslationDriver,
 ) -> None:
-    """Tests if scalars can be returned directly"""
+    """Tests if scalars can be returned directly."""
 
     def scalar_ops(A: float) -> float:
         return A + A - A * A
@@ -519,6 +519,20 @@ def wrapped(A: float) -> float:
     assert lower_cnt[0] == 1
 
 
+@pytest.mark.skip(reason="Currently 'scalar' return values, are actually shape '(1,)' arrays.")
+def test_driver_scalar_return_type(
+    translation_driver: translator.JaxprTranslationDriver,
+) -> None:
+    """Tests if the type is the same, in case of scalar return."""
+
+    @jace.jit
+    def wrapped(A: np.float64) -> np.float64:
+        return A + A - A * A
+
+    A = np.float64(1.0)
+    assert type(A) is np.float64, f"Expected type 'np.float64', but got '{type(A).__name__}'."
+
+
 def test_driver_jace_var() -> None:
     """Simple tests about the `JaCeVar` objects."""
     for iname in ["do", "", "_ _", "9al", "_!"]:
diff --git a/tests/translator_tests/test_subtranslator_helper.py b/tests/integration_tests/test_primitive_translator_managing.py
similarity index 99%
rename from tests/translator_tests/test_subtranslator_helper.py
rename to tests/integration_tests/test_primitive_translator_managing.py
index fb34bcf..51d5e09 100644
--- a/tests/translator_tests/test_subtranslator_helper.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements tests to check if the sorting algorithm is correct."""
+"""Implements tests for managing the primitive subtranslators."""
 
 from __future__ import annotations
 
diff --git a/tests/translator_tests/primitive_translators/test_sub_translators_convert_element_type.py b/tests/translator_tests/primitive_translators/test_sub_translators_convert_element_type.py
deleted file mode 100644
index f1d9ec6..0000000
--- a/tests/translator_tests/primitive_translators/test_sub_translators_convert_element_type.py
+++ /dev/null
@@ -1,106 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Tests the element type conversion functionality."""
-
-from __future__ import annotations
-
-from typing import TYPE_CHECKING, Final
-
-import jax
-import numpy as np
-import pytest
-from jax import numpy as jnp
-
-import jace
-
-
-if TYPE_CHECKING:
-    from collections.abc import Sequence
-
-
-# fmt: off
-_DACE_TYPES: Final[list[type]] = [
-        np.int_, np.int8, np.int16, np.int32, np.int64,
-        np.uint, np.uint8, np.uint16, np.uint32, np.uint64,
-        np.float64, np.float32, np.float64,
-]
-_DACE_COMPLEX: Final[list[type]] = [
-        np.complex128, np.complex64, np.complex128,
-]
-# fmt: on
-
-
-def _test_convert_element_type_impl(
-    input_types: Sequence,
-    output_types: Sequence,
-) -> bool:
-    """Implementation of the tests of the convert element types primitive."""
-    lowering_cnt = [0, 0]
-    for input_type in input_types:
-        for output_type in output_types:
-            A = np.array(np.random.random((10, 10)), dtype=input_type)  # noqa: NPY002
-            ref = np.array(A, copy=True, dtype=output_type)
-            lowering_cnt[1] += 1
-
-            @jace.jit
-            def converter(A: np.ndarray) -> jax.Array:
-                lowering_cnt[0] += 1
-                return jnp.array(A, copy=False, dtype=output_type)  # noqa: B023  # Loop variable.
-
-            res = converter(A)
-            assert res.dtype == output_type
-            assert lowering_cnt[0] == lowering_cnt[1]
-            assert np.allclose(ref, res)
-    return True
-
-
-@pytest.mark.skip(reason="Too slow, find way to run only on demand.")
-def test_convert_element_type_main():
-    """Tests all conversions with the exception of conversions from bool and complex."""
-    _test_convert_element_type_impl(_DACE_TYPES, [*_DACE_TYPES, np.bool_])
-
-
-def test_convert_element_type_main_short():
-    """Fast running version of `test_convert_element_type_main()`."""
-    FAST_TYPES = [np.int32, np.int64, np.float64]
-    _test_convert_element_type_impl(FAST_TYPES, [*FAST_TYPES, np.bool_])
-
-
-def test_convert_element_type_complex():
-    """All complex conversions."""
-    _test_convert_element_type_impl(_DACE_COMPLEX, _DACE_COMPLEX)
-
-
-def test_convert_element_type_from_bool():
-    """Tests conversions from bools to any other types."""
-    _test_convert_element_type_impl([np.bool_], _DACE_COMPLEX)
-
-
-@pytest.mark.skip(reason="The warning was disabled, so the test is useless.")
-def test_convert_element_type_useless_cast():
-    """Shows that under some conditions there is really a casting from one type to the same.
-
-    In certain cases, also in some slicing tests, this useless cast is inserted by Jax.
-    This test was originally here to show this. However, that thing got so annoying that it was
-    removed. The test is kept here to serve as some kind of a reference.
-    """
-
-    def testee(a: float) -> np.ndarray:
-        # For it to work we have to use `numpy` instead of the Jax substitute.
-        return np.broadcast_to(1.0, (10, 10)) + a
-
-    with pytest.warns(
-        expected_warning=UserWarning,
-        match=r"convert_element_type\(.*\): is useless, input and output have same type\.",
-    ):
-        res = jace.jit(testee)(1.0)
-
-    ref = testee(1.0)
-    assert res.shape == ref.shape
-    assert res.dtype == ref.dtype
-    assert np.all(res == ref)
diff --git a/tests/general_tests/__init__.py b/tests/unit_tests/__init__.py
similarity index 87%
rename from tests/general_tests/__init__.py
rename to tests/unit_tests/__init__.py
index 5be01f1..5ce9af1 100644
--- a/tests/general_tests/__init__.py
+++ b/tests/unit_tests/__init__.py
@@ -5,4 +5,4 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""General JaCe tests."""
+"""JaCe's unit tests."""
diff --git a/tests/general_tests/test_caching.py b/tests/unit_tests/test_caching.py
similarity index 100%
rename from tests/general_tests/test_caching.py
rename to tests/unit_tests/test_caching.py
diff --git a/tests/general_tests/test_decorator.py b/tests/unit_tests/test_decorator.py
similarity index 100%
rename from tests/general_tests/test_decorator.py
rename to tests/unit_tests/test_decorator.py
diff --git a/tests/general_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
similarity index 100%
rename from tests/general_tests/test_jax_api.py
rename to tests/unit_tests/test_jax_api.py
diff --git a/tests/general_tests/test_misc.py b/tests/unit_tests/test_misc.py
similarity index 100%
rename from tests/general_tests/test_misc.py
rename to tests/unit_tests/test_misc.py
diff --git a/tests/general_tests/test_package.py b/tests/unit_tests/test_package.py
similarity index 100%
rename from tests/general_tests/test_package.py
rename to tests/unit_tests/test_package.py

From 758adc825b833c41722c5c9ffe0737d7a1b1af06 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 30 May 2024 11:39:01 +0200
Subject: [PATCH 272/458] Improved coverage.

---
 src/jace/util/translation_cache.py            | 21 +++-
 .../test_primitive_copy.py                    | 26 +++++
 tests/unit_tests/test_caching.py              | 96 ++++++++++++++++++-
 3 files changed, 137 insertions(+), 6 deletions(-)
 create mode 100644 tests/integration_tests/primitive_translators/test_primitive_copy.py

diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index c0f6fce..d02320e 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -237,14 +237,14 @@ class StageCache(Generic[StageType]):
     """
 
     _memory: collections.OrderedDict[StageTransformationSpec, StageType]
-    _size: int
+    _capacity: int
 
     def __init__(
         self,
-        size: int = 256,
+        capachity: int = 256,
     ) -> None:
         self._memory = collections.OrderedDict()
-        self._size = size
+        self._capacity = capachity
 
     def __contains__(
         self,
@@ -270,7 +270,7 @@ def __setitem__(
             self._memory.move_to_end(key, last=True)
             self._memory[key] = res
         else:
-            if len(self._memory) == self._size:
+            if len(self._memory) == self._capacity:
                 self.popitem(None)
             self._memory[key] = res
 
@@ -293,5 +293,16 @@ def popitem(
     def clear(self) -> None:
         self._memory.clear()
 
+    def __len__(self) -> int:
+        return len(self._memory)
+
+    @property
+    def capacity(self) -> int:
+        return self._capacity
+
+    def front(self) -> tuple[StageTransformationSpec, StageType]:
+        """Returns the front, i.e. newest entry in the cache."""
+        return next(reversed(self._memory.items()))
+
     def __repr__(self) -> str:
-        return f"StageCache({len(self._memory)} / {self._size} || {', '.join( '[' + repr(k) + ']' for k in self._memory)})"
+        return f"StageCache({len(self._memory)} / {self._capacity} || {', '.join( '[' + repr(k) + ']' for k in self._memory)})"
diff --git a/tests/integration_tests/primitive_translators/test_primitive_copy.py b/tests/integration_tests/primitive_translators/test_primitive_copy.py
new file mode 100644
index 0000000..7fcdaad
--- /dev/null
+++ b/tests/integration_tests/primitive_translators/test_primitive_copy.py
@@ -0,0 +1,26 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+from __future__ import annotations
+
+import jax
+import numpy as np
+from jax import numpy as jnp
+
+import jace
+
+
+def test_copy():
+    @jace.jit
+    def testee(A: np.ndarray) -> jax.Array:
+        return jnp.copy(A)
+
+    A = np.random.random((10, 10, 10))  # noqa: NPY002
+    ref = np.copy(A)
+    res = testee(A)
+    assert ref.dtype == res.dtype
+    assert np.all(ref == res)
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index 3f5dd0f..2ce48e4 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -36,7 +36,7 @@ def _clear_translation_cache():
 
 
 def test_caching_same_sizes() -> None:
-    """The behaviour of the cache if same sizes are used."""
+    """The behaviour of the cache if same sizes are used, in two different functions."""
 
     # Counter for how many time it was lowered.
     lowering_cnt = [0]
@@ -224,6 +224,100 @@ def testee(A: np.ndarray) -> np.ndarray:
         assert lowering_cnt[0] == i + 1
 
 
+def test_caching_eviction_simple():
+    """Simple tests for cache eviction."""
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A + 1.0
+
+    cache: tcache.StageCache = testee._cache
+
+    first_lowered = testee.lower(np.ones(10))
+    first_key = cache.front()[0]
+    second_lowered = testee.lower(np.ones(11))
+    second_key = cache.front()[0]
+    third_lowered = testee.lower(np.ones(12))
+    third_key = cache.front()[0]
+
+    assert first_key != second_key
+    assert first_key != third_key
+    assert second_key != third_key
+
+    assert first_key in cache
+    assert second_key in cache
+    assert third_key in cache
+    assert cache.front()[0] == third_key
+
+    # We now evict the second key, which should not change anything on the order.
+    cache.popitem(second_key)
+    assert first_key in cache
+    assert second_key not in cache
+    assert third_key in cache
+    assert cache.front()[0] == third_key
+
+    # Now we modify first_key, which moves it to the front.
+    cache[first_key] = first_lowered
+    assert first_key in cache
+    assert second_key not in cache
+    assert third_key in cache
+    assert cache.front()[0] == first_key
+
+    # Now we evict the oldest one, which is third_key
+    cache.popitem(None)
+    assert first_key in cache
+    assert second_key not in cache
+    assert third_key not in cache
+    assert cache.front()[0] == first_key
+
+
+def test_caching_eviction_complex():
+    """Tests if the stuff is properly evicted if the cache is full."""
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A + 1.0
+
+    cache: tcache.StageCache = testee._cache
+    capacity = cache.capacity
+    assert len(cache) == 0
+
+    # Lets fill the cache to the brim.
+    for i in range(capacity):
+        A = np.ones(i + 10)
+        lowered = testee.lower(A)
+        assert len(cache) == i + 1
+
+        if i == 0:
+            first_key: tcache.StageTransformationSpec = cache.front()[0]
+            first_lowered = cache[first_key]
+            assert lowered is first_lowered
+        elif i == 1:
+            second_key: tcache.StageTransformationSpec = cache.front()[0]
+            assert second_key != first_key
+            assert cache[second_key] is lowered
+        assert first_key in cache
+
+    assert len(cache) == capacity
+    assert first_key in cache
+    assert second_key in cache
+
+    # Now we will modify the first key, this should make it the newest.
+    assert cache.front()[0] != first_key
+    cache[first_key] = first_lowered
+    assert len(cache) == capacity
+    assert first_key in cache
+    assert second_key in cache
+    assert cache.front()[0] == first_key
+
+    # Now we will add a new entry to the cache, this will evict the second entry.
+    _ = testee.lower(np.ones(capacity + 1000))
+    assert len(cache) == capacity
+    assert cache.front()[0] != first_key
+    assert first_key in cache
+    assert second_key not in cache
+
+
 def test_caching_strides() -> None:
     """Test if the cache detects a change in strides."""
 

From 7fa03c3f890cc0e8f9ef08b81e947c2ed0d2f6ee Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Thu, 30 May 2024 12:17:41 +0200
Subject: [PATCH 273/458] chore: add missing dependencies in the mypy hook for
 pre-commit

---
 .pre-commit-config.yaml | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 97e8d51..1442e7b 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -65,6 +65,8 @@ repos:
     - dace==0.15.1
     - jax[cpu]==0.4.28
     - numpy==1.26.4
+    - pytest==8.2.1
+    - typing-extensions==4.12.0
 - repo: https://github.com/codespell-project/codespell
   rev: "v2.2.6"
   hooks:

From ba854e021d6923733c222e07ac82b259c7ba4255 Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Thu, 30 May 2024 12:20:06 +0200
Subject: [PATCH 274/458] remove typing-extensions

---
 .pre-commit-config.yaml | 1 -
 1 file changed, 1 deletion(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 1442e7b..6ae432a 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -66,7 +66,6 @@ repos:
     - jax[cpu]==0.4.28
     - numpy==1.26.4
     - pytest==8.2.1
-    - typing-extensions==4.12.0
 - repo: https://github.com/codespell-project/codespell
   rev: "v2.2.6"
   hooks:

From 2cdd3fdea22e1d47e7093b22cfd3c3097818a96b Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 30 May 2024 13:35:37 +0200
Subject: [PATCH 275/458] First batch of fixes.

---
 src/jace/api.py                               |   2 +-
 src/jace/stages.py                            |   2 +-
 src/jace/translator/__init__.py               |   5 +-
 .../translator/jaxpr_translator_driver.py     |  19 +--
 src/jace/translator/managing.py               | 148 ------------------
 src/jace/translator/primitive_translator.py   | 144 +++++++++++++++--
 .../primitive_translators/__init__.py         |   2 +-
 .../primitive_translators/alu_translator.py   |   8 +-
 src/jace/util/compiling.py                    |   4 +-
 tests/test_subtranslator_helper.py            |   4 +-
 10 files changed, 153 insertions(+), 185 deletions(-)
 delete mode 100644 src/jace/translator/managing.py

diff --git a/src/jace/api.py b/src/jace/api.py
index f1600c8..7bf4cfa 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -73,7 +73,7 @@ def wrapper(f: Callable) -> stages.JaceWrapped:
         jace_wrapper = stages.JaceWrapped(
             fun=f,
             primitive_translators=(
-                translator.managing._PRIMITIVE_TRANSLATORS_DICT
+                translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
                 if primitive_translators is None
                 else primitive_translators
             ),
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 020eebc..2397bb1 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -50,7 +50,7 @@ class JaceWrapped(tcache.CachingStage["JaceLowered"]):
 
     Args:
         fun:                    The function that is wrapped.
-        primitive_translators:  The list of subtranslators that that should be used.
+        primitive_translators:  The list of primitive translators that that should be used.
         jit_options:            Options to influence the jit process.
 
     Todo:
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 49342be..cda6c85 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -10,13 +10,14 @@
 from __future__ import annotations
 
 from .jaxpr_translator_driver import JaxprTranslationDriver
-from .managing import (
+from .primitive_translator import (
+    PrimitiveTranslator,
+    PrimitiveTranslatorCallable,
     get_regsitered_primitive_translators,
     make_primitive_translator,
     register_primitive_translator,
     set_active_primitive_translators_to,
 )
-from .primitive_translator import PrimitiveTranslator, PrimitiveTranslatorCallable
 from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
 
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index f66407d..4faf45d 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -7,6 +7,7 @@
 
 from __future__ import annotations
 
+import copy
 from collections.abc import Mapping, MutableSequence, Sequence
 from typing import TYPE_CHECKING, Any, Literal, cast, overload
 
@@ -44,9 +45,9 @@ class JaxprTranslationDriver:
     exception.
 
     The actual translation of the equation is not handled by the driver. Instead the request is
-    forwarded to a `PrimitiveTranslator` object, known as primitive translator or subtranslator.
-    This is a highly specialized object that is able to handle one kind of primitive. For more
-    information on them see the documentation of `PrimitiveTranslator`.
+    forwarded to a `PrimitiveTranslator` object, known as primitive translator. This is a highly
+    specialized object that is able to handle one kind of primitive. For more information on them
+    see the documentation of `PrimitiveTranslator`.
 
     To start a translation the `translate_jaxpr()` function should be called, if this happens it is
     said that the driver has an ongoing translation. If `translate_jaxpr()` is called on a driver
@@ -58,17 +59,11 @@ class JaxprTranslationDriver:
         primitive_translators:    Primitive to use during the translation.
 
     Notes:
-        The `primitive_translators` that is passed at construction is not copied. The user has
-        to ensure that it does not change.
         After the main translation has been performed the translator object can be used again.
         Currently the driver will generate only Array as SDFG variables, however, this is a
         temporary solution, see `add_array()`.
-
-
     """
 
-    __slots__ = ("_ctx_stack", "_primitive_translators", "_jax_name_map")
-
     _primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable]
     _jax_name_map: dict[jax_core.Var | util.JaCeVar, str]
     _ctx_stack: list[translator.TranslatedJaxprSDFG]
@@ -78,7 +73,7 @@ def __init__(
         primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable],
     ) -> None:
         # Maps name of primitives to the associated translator.
-        self._primitive_translators = primitive_translators
+        self._primitive_translators = {**primitive_translators}
 
         # Maps Jax variables to the name of its SDFG equivalent.
         #  Shared between all translation contexts, to ensure consecutive
@@ -481,8 +476,6 @@ def _create_constants(
         The function will create an SDFG variable and add them as constant to the SDFG. Their value
         is deepcopied.
         """
-        from copy import deepcopy
-
         if not self.is_allocated():
             raise RuntimeError("Driver is not allocated, can not create constants.")
         if len(jaxpr.consts) == 0:
@@ -497,7 +490,7 @@ def _create_constants(
         )
         for sdfg_name, const_value in zip(sdfg_const_names, jaxpr.consts, strict=True):
             self._ctx.sdfg.add_constant(
-                sdfg_name, deepcopy(const_value), self._ctx.sdfg.arrays[sdfg_name]
+                sdfg_name, copy.deepcopy(const_value), self._ctx.sdfg.arrays[sdfg_name]
             )
         return sdfg_const_names
 
diff --git a/src/jace/translator/managing.py b/src/jace/translator/managing.py
deleted file mode 100644
index b785186..0000000
--- a/src/jace/translator/managing.py
+++ /dev/null
@@ -1,148 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-"""Module for managing the global primitive translators.
-
-The high level idea is that there is a registry of all currently active primitive translators.
-If `primitive_translators` is not given to `jit` it will use this global registry.
-A primitive, i.e. an object that satisfies the `PrimitiveTranslator` interface, can be added
-to the registry by `register_primitive_translator()`. To retrieve the translators that are
-currently active you can use the `get_regsitered_primitive_translators()` function.
-"""
-
-from __future__ import annotations
-
-from collections.abc import Callable, Mapping, MutableMapping
-from typing import TYPE_CHECKING, Literal, cast, overload
-
-
-if TYPE_CHECKING:
-    from jace import translator
-
-#: Global registry of the active primitive translators.
-#:  The `dict` maps the name of a primitive to its associated translators.
-_PRIMITIVE_TRANSLATORS_DICT: dict[str, translator.PrimitiveTranslator] = {}
-
-
-@overload
-def make_primitive_translator(
-    primitive: str,
-    primitive_translator: Literal[None] = None,
-) -> Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]: ...
-
-
-@overload
-def make_primitive_translator(
-    primitive: str, primitive_translator: translator.PrimitiveTranslatorCallable
-) -> translator.PrimitiveTranslator: ...
-
-
-def make_primitive_translator(
-    primitive: str,
-    primitive_translator: translator.PrimitiveTranslatorCallable | None = None,
-) -> (
-    Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]
-    | translator.PrimitiveTranslator
-):
-    """Turn `primitive_translator` into a `PrimitiveTranslator` for primitive `primitive`.
-
-    Essentially, this function adds the `primitive` property to a callable, such that it satisfy
-    the `PrimitiveTranslator` protocol. However, it does not add it to the registry, for that
-    `register_primitive_translator()` has to be used.
-
-    Notes:
-        This function cal also be used as decorator.
-    """
-
-    def wrapper(
-        primitive_translator: translator.PrimitiveTranslatorCallable,
-    ) -> translator.PrimitiveTranslator:
-        from jace import translator  # Cyclic
-
-        if getattr(primitive_translator, "primitive", primitive) != primitive:
-            raise ValueError(
-                f"Tried to change the 'primitive' property of '{primitive_translator}' from "
-                f"'{primitive_translator.primitive}' to '{primitive}'."  # type: ignore[attr-defined]
-            )
-        primitive_translator.primitive = primitive  # type: ignore[attr-defined]  # We define the attribute.
-        return cast(translator.PrimitiveTranslator, primitive_translator)
-
-    return wrapper if primitive_translator is None else wrapper(primitive_translator)
-
-
-@overload
-def register_primitive_translator(
-    primitive_translator: Literal[None] = None,
-    overwrite: bool = False,
-) -> Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]: ...
-
-
-@overload
-def register_primitive_translator(
-    primitive_translator: translator.PrimitiveTranslator,
-    overwrite: bool = False,
-) -> translator.PrimitiveTranslator: ...
-
-
-def register_primitive_translator(
-    primitive_translator: translator.PrimitiveTranslator | None = None,
-    overwrite: bool = False,
-) -> (
-    translator.PrimitiveTranslator
-    | Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]
-):
-    """Adds a primitive translator to Jace's global registry.
-
-    If a translator for `primitive` is already registered an error will be generated. However,
-    by specifying `overwrite` `primitive_translator` will replace the current one.
-
-    Args:
-        primitive_translator: The primitive translator to add to the global registry.
-        overwrite:            Replace the current primitive translator with `primitive_translator`.
-
-    Note:
-        To add a `primitive` property use the `@make_primitive_translator` decorator.
-        This function returns `primitive_translator` unmodified, which allows it to be
-        used as decorator.
-    """
-
-    def wrapper(
-        primitive_translator: translator.PrimitiveTranslator,
-    ) -> translator.PrimitiveTranslator:
-        if primitive_translator.primitive in _PRIMITIVE_TRANSLATORS_DICT and not overwrite:
-            raise ValueError(
-                f"Explicit override=True needed for primitive '{primitive_translator.primitive}' "
-                "to overwrite existing one."
-            )
-        _PRIMITIVE_TRANSLATORS_DICT[primitive_translator.primitive] = primitive_translator
-        return primitive_translator
-
-    return wrapper if primitive_translator is None else wrapper(primitive_translator)
-
-
-def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTranslator]:
-    """Returns a copy of the current state of Jace's global primitive registry.
-
-    The function returns a mapping that maps the name of a primitive to the associated translator.
-    No change to the global registry will affect the return value and vice versa.
-    """
-    return _PRIMITIVE_TRANSLATORS_DICT.copy()
-
-
-def set_active_primitive_translators_to(
-    new_translators: Mapping[str, translator.PrimitiveTranslator],
-) -> MutableMapping[str, translator.PrimitiveTranslator]:
-    """Exchange the global translator registry of Jace with `new_translators`.
-
-    The function will return the state of the global translator registry just before this call.
-    Any changes to `new_translators` after calling this function will have no effect on the
-    global translator registry and vice versa.
-    """
-    global _PRIMITIVE_TRANSLATORS_DICT
-    assert all(getattr(trans, "primitive", prim) for prim, trans in new_translators.items())
-    previous_translators = _PRIMITIVE_TRANSLATORS_DICT
-    _PRIMITIVE_TRANSLATORS_DICT = dict(new_translators)
-    return previous_translators
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index bdca3d4..0ceb1c7 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -4,13 +4,20 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
-"""Contains the interface for all primitive translators."""
+"""Interface for all primitive translators and managing of the global translator registry.
+
+The high level idea is that there is a registry of all currently active primitive translators.
+If `primitive_translators` is not given to `jit` it will use this global registry.
+A primitive, i.e. an object that satisfies the `PrimitiveTranslator` interface, can be added
+to the registry by `register_primitive_translator()`. To retrieve the translators that are
+currently active you can use the `get_regsitered_primitive_translators()` function.
+"""
 
 from __future__ import annotations
 
 from abc import abstractmethod
-from collections.abc import MutableSequence, Sequence
-from typing import TYPE_CHECKING, Protocol, runtime_checkable
+from collections.abc import Callable, Mapping, MutableMapping, MutableSequence, Sequence
+from typing import TYPE_CHECKING, Literal, Protocol, cast, overload, runtime_checkable
 
 import dace
 from jax import core as jax_core
@@ -19,6 +26,10 @@
 if TYPE_CHECKING:
     from jace import translator
 
+#: Global registry of the active primitive translators.
+#:  The `dict` maps the name of a primitive to its associated translators.
+_PRIMITIVE_TRANSLATORS_REGISTRY: dict[str, translator.PrimitiveTranslator] = {}
+
 
 class PrimitiveTranslatorCallable(Protocol):
     """Callable version of the primitive translators.
@@ -28,8 +39,6 @@ class PrimitiveTranslatorCallable(Protocol):
     a callable.
     """
 
-    __slots__ = ()
-
     @abstractmethod
     def __call__(
         self,
@@ -63,8 +72,8 @@ def __call__(
         While a primitive translator is forbidden from meddling with the input variables mentioned
         in `in_var_names` in any way, it is allowed to modify the output variables. For example
         it could create a new SDFG variable, with different strides. But in that case the primitive
-        translator must update the internal mapping of the driver TBA HOW, and modify the mapping
-        specified by `out_var_names`. However, the subtranslator is allowed to create internal
+        translator must update the internal mapping of the driver TBA HOW, and modify the names
+        passed through `out_var_names`. However, the translator is allowed to create internal
         temporary variables. It just have to ensure that no name collision will occur, a way to
         do this is to use a passed variable name as prefix.
 
@@ -96,10 +105,127 @@ class PrimitiveTranslator(PrimitiveTranslatorCallable, Protocol):
     You can use `jace.translator.register_primitive_translator()` to register your translator to Jace.
     """
 
-    __slots__ = ()
-
     @property
     @abstractmethod
     def primitive(self) -> str:
         """Returns the name of the Jax primitive that `self` is able to handle."""
         ...
+
+
+@overload
+def make_primitive_translator(
+    primitive: str,
+    primitive_translator: Literal[None] = None,
+) -> Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]: ...
+
+
+@overload
+def make_primitive_translator(
+    primitive: str, primitive_translator: translator.PrimitiveTranslatorCallable
+) -> translator.PrimitiveTranslator: ...
+
+
+def make_primitive_translator(
+    primitive: str,
+    primitive_translator: translator.PrimitiveTranslatorCallable | None = None,
+) -> (
+    Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]
+    | translator.PrimitiveTranslator
+):
+    """Turn `primitive_translator` into a `PrimitiveTranslator` for primitive `primitive`.
+
+    Essentially, this function adds the `primitive` property to a callable, such that it satisfy
+    the `PrimitiveTranslator` protocol. However, it does not add it to the registry, for that
+    `register_primitive_translator()` has to be used.
+
+    Notes:
+        This function cal also be used as decorator.
+    """
+
+    def wrapper(
+        primitive_translator: translator.PrimitiveTranslatorCallable,
+    ) -> translator.PrimitiveTranslator:
+        if getattr(primitive_translator, "primitive", primitive) != primitive:
+            raise ValueError(
+                f"Tried to change the 'primitive' property of '{primitive_translator}' from "
+                f"'{primitive_translator.primitive}' to '{primitive}'."  # type: ignore[attr-defined]
+            )
+        primitive_translator.primitive = primitive  # type: ignore[attr-defined]  # We define the attribute.
+        return cast("translator.PrimitiveTranslator", primitive_translator)
+
+    return wrapper if primitive_translator is None else wrapper(primitive_translator)
+
+
+@overload
+def register_primitive_translator(
+    primitive_translator: Literal[None] = None,
+    overwrite: bool = False,
+) -> Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]: ...
+
+
+@overload
+def register_primitive_translator(
+    primitive_translator: translator.PrimitiveTranslator,
+    overwrite: bool = False,
+) -> translator.PrimitiveTranslator: ...
+
+
+def register_primitive_translator(
+    primitive_translator: translator.PrimitiveTranslator | None = None,
+    overwrite: bool = False,
+) -> (
+    translator.PrimitiveTranslator
+    | Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]
+):
+    """Adds a primitive translator to Jace's global registry.
+
+    If a translator for `primitive` is already registered an error will be generated. However,
+    by specifying `overwrite` `primitive_translator` will replace the current one.
+
+    Args:
+        primitive_translator: The primitive translator to add to the global registry.
+        overwrite:            Replace the current primitive translator with `primitive_translator`.
+
+    Note:
+        To add a `primitive` property use the `@make_primitive_translator` decorator.
+        This function returns `primitive_translator` unmodified, which allows it to be
+        used as decorator.
+    """
+
+    def wrapper(
+        primitive_translator: translator.PrimitiveTranslator,
+    ) -> translator.PrimitiveTranslator:
+        if primitive_translator.primitive in _PRIMITIVE_TRANSLATORS_REGISTRY and not overwrite:
+            raise ValueError(
+                f"Explicit override=True needed for primitive '{primitive_translator.primitive}' "
+                "to overwrite existing one."
+            )
+        _PRIMITIVE_TRANSLATORS_REGISTRY[primitive_translator.primitive] = primitive_translator
+        return primitive_translator
+
+    return wrapper if primitive_translator is None else wrapper(primitive_translator)
+
+
+def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTranslator]:
+    """Returns a copy of the current state of Jace's global primitive registry.
+
+    The function returns a mapping that maps the name of a primitive to the associated translator.
+    No change to the global registry will affect the return value and vice versa.
+    """
+    return _PRIMITIVE_TRANSLATORS_REGISTRY.copy()
+
+
+def set_active_primitive_translators_to(
+    new_translators: Mapping[str, translator.PrimitiveTranslator],
+) -> MutableMapping[str, translator.PrimitiveTranslator]:
+    """Exchange the global translator registry of Jace with `new_translators`.
+
+    The function will return the state of the global translator registry just before this call.
+    Any changes to `new_translators` after calling this function will have no effect on the
+    global translator registry and vice versa.
+    """
+    global _PRIMITIVE_TRANSLATORS_REGISTRY
+    assert all(getattr(trans, "primitive", prim) for prim, trans in new_translators.items())
+    previous_translators = _PRIMITIVE_TRANSLATORS_REGISTRY
+    _PRIMITIVE_TRANSLATORS_REGISTRY = dict(new_translators)
+    return previous_translators
diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 08bff9d..729134b 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -4,7 +4,7 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
-"""Module collecting all built-in subtranslators."""
+"""Module collecting all built-in primitive translators."""
 
 from __future__ import annotations
 
diff --git a/src/jace/translator/primitive_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
index 0d19973..9b10ca4 100644
--- a/src/jace/translator/primitive_translators/alu_translator.py
+++ b/src/jace/translator/primitive_translators/alu_translator.py
@@ -26,8 +26,6 @@ class ALUTranslator(translator.PrimitiveTranslator):
     This translator will be reworked soon, it just exists that the initial PR can do anything at all!!
     """
 
-    __slots__ = ("_prim_name", "_prim_tmpl")
-
     def __init__(
         self,
         prim_name: str,
@@ -242,7 +240,7 @@ def _list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
 
 
 # Contains all the templates for ALU operations.
-_ALU_OPS_TMPL: Final[dict[str, str]] = {
+_ALU_OPS_TASKLET_TEMPLATES: Final[dict[str, str]] = {
     # Unary operations
     "pos": "__out0 = +(__in0)",
     "neg": "__out0 = -(__in0)",
@@ -284,7 +282,5 @@ def _list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
     "lt": "__out0 = __in0 < __in1",
 }
 
-_ = [
+for prim_name, prim_tmpl in _ALU_OPS_TASKLET_TEMPLATES.items():
     translator.register_primitive_translator(ALUTranslator(prim_name, prim_tmpl))
-    for prim_name, prim_tmpl in _ALU_OPS_TMPL.items()
-]
diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index c3d7249..a9658fb 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -17,6 +17,8 @@
 import numpy as np
 from dace import data as dace_data
 
+from jace import util
+
 
 if TYPE_CHECKING:
     from jace import translator
@@ -95,8 +97,6 @@ def run_jax_sdfg(
         However, if we have symbols or variable sizes, we must ensure that the init function of
         the SDFG is called every time, or ensure that its exit function runs every time.
     """
-    from jace import util
-
     sdfg: dace.SDFG = csdfg.sdfg
 
     if len(ckwargs) != 0:
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 3810ab3..b9c1d4e 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -104,7 +104,7 @@ def test_subtranslatior_managing_isolation():
     """Tests if `get_regsitered_primitive_translators()` protects the internal registry."""
     assert (
         get_regsitered_primitive_translators()
-        is not translator.managing._PRIMITIVE_TRANSLATORS_DICT
+        is not translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
     )
 
     initial_primitives = get_regsitered_primitive_translators()
@@ -138,7 +138,7 @@ def same_structure(d1: dict, d2: dict) -> bool:
     # Now change the initial one with the mutated one.
     #  The object is copied but should still have the same structure.
     old_active = set_active_primitive_translators_to(mutated_primitives)
-    assert mutated_primitives is not translator.managing._PRIMITIVE_TRANSLATORS_DICT
+    assert mutated_primitives is not translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
     assert same_structure(old_active, initial_primitives)
     assert same_structure(mutated_primitives, get_regsitered_primitive_translators())
 

From 37c933cf2a0c8fd025123a8acad96ee75902f57f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 30 May 2024 14:00:11 +0200
Subject: [PATCH 276/458] Integrated some of Enrique's changes.

---
 src/jace/__init__.py                          |   8 +-
 src/jace/api.py                               |  25 ++--
 src/jace/optimization.py                      |   4 +-
 src/jace/stages.py                            |  66 +++++-----
 src/jace/translator/__init__.py               |   4 +-
 .../translator/jaxpr_translator_driver.py     |  21 ++-
 src/jace/translator/post_translation.py       |   3 +-
 src/jace/translator/primitive_translator.py   |  17 +--
 .../primitive_translators/alu_translator.py   |  34 +++--
 src/jace/util/__init__.py                     |  18 +--
 src/jace/util/compiling.py                    |   3 +-
 src/jace/util/jax_helper.py                   |  28 +++-
 src/jace/util/traits.py                       |  15 +--
 src/jace/util/translation_cache.py            |   4 +-
 tests/test_caching.py                         | 121 ++++++++++++++++--
 tests/test_jax_api.py                         |  10 +-
 tests/test_jaxpr_translator_driver.py         |  28 ++--
 tests/test_misc.py                            |   2 +-
 tests/test_subtranslator_helper.py            |  20 +--
 19 files changed, 284 insertions(+), 147 deletions(-)

diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 7fed965..de111ec 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -18,11 +18,11 @@
 __all__ = [
     "__author__",
     "__copyright__",
-    "grad",
-    "jit",
-    "jacfwd",
-    "jacrev",
     "__license__",
     "__version__",
     "__version_info__",
+    "grad",
+    "jacfwd",
+    "jacrev",
+    "jit",
 ]
diff --git a/src/jace/api.py b/src/jace/api.py
index 7bf4cfa..1efacc8 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -10,19 +10,22 @@
 from __future__ import annotations
 
 import functools
-from collections.abc import Callable, Mapping
-from typing import Any, Literal, overload
+from typing import TYPE_CHECKING, Any, Literal, cast, overload
 
 from jax import grad, jacfwd, jacrev
 
 from jace import stages, translator
 
 
+if TYPE_CHECKING:
+    from collections.abc import Callable, Mapping
+
+
 __all__ = [
     "grad",
-    "jit",
     "jacfwd",
     "jacrev",
+    "jit",
 ]
 
 
@@ -32,7 +35,7 @@ def jit(
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> Callable[[Callable], stages.JaceWrapped]: ...
+) -> Callable[[Callable], stages.JaCeWrapped]: ...
 
 
 @overload
@@ -41,7 +44,7 @@ def jit(
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> stages.JaceWrapped: ...
+) -> stages.JaCeWrapped: ...
 
 
 def jit(
@@ -49,12 +52,12 @@ def jit(
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> stages.JaceWrapped | Callable[[Callable], stages.JaceWrapped]:
-    """Jace's replacement for `jax.jit` (just-in-time) wrapper.
+) -> stages.JaCeWrapped | Callable[[Callable], stages.JaCeWrapped]:
+    """JaCe's replacement for `jax.jit` (just-in-time) wrapper.
 
     It works the same way as `jax.jit` does, but instead of using XLA the computation is lowered
     to DaCe. It supports the same arguments as `jax.jit` (although currently not) does.
-    In addition it accepts some Jace specific arguments.
+    In addition it accepts some JaCe specific arguments.
 
     Args:
         primitive_translators:    Use these primitive translators for the lowering to SDFG.
@@ -69,8 +72,8 @@ def jit(
             f"The following arguments to 'jace.jit' are not yet supported: {', '.join(kwargs)}."
         )
 
-    def wrapper(f: Callable) -> stages.JaceWrapped:
-        jace_wrapper = stages.JaceWrapped(
+    def wrapper(f: Callable) -> stages.JaCeWrapped:
+        jace_wrapper = stages.JaCeWrapped(
             fun=f,
             primitive_translators=(
                 translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
@@ -79,6 +82,6 @@ def wrapper(f: Callable) -> stages.JaceWrapped:
             ),
             jit_options=kwargs,
         )
-        return functools.update_wrapper(jace_wrapper, f)
+        return cast(stages.JaCeWrapped, functools.update_wrapper(jace_wrapper, f))
 
     return wrapper if fun is None else wrapper(fun)
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index c719bd4..68f7b1f 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Module that will host all optimization functions specific to Jace.
+"""Module that will host all optimization functions specific to JaCe.
 
 Currently just a dummy existing for the sake of providing some callable function.
 """
@@ -22,7 +22,7 @@
 
 
 class CompilerOptions(TypedDict, total=False):
-    """All known compiler options known to `JaceLowered.compile()`.
+    """All known compiler options known to `JaCeLowered.compile()`.
 
     See `jace_optimize()` for a description of the different options.
 
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 2397bb1..3f42436 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -7,9 +7,9 @@
 """Reimplementation of the `jax.stages` module.
 
 This module reimplements the public classes of that Jax module.
-However, they are a big different, because Jace uses DaCe as backend.
+However, they are a big different, because JaCe uses DaCe as backend.
 
-As in Jax Jace has different stages, the terminology is taken from
+As in Jax JaCe has different stages, the terminology is taken from
 [Jax' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
 - Stage out:
     In this phase we translate an executable python function into Jaxpr.
@@ -25,10 +25,8 @@
 from __future__ import annotations
 
 import copy
-from collections.abc import Callable, Mapping, Sequence
-from typing import Any
+from typing import TYPE_CHECKING, Any
 
-import dace
 import jax as _jax
 
 from jace import optimization, translator, util
@@ -37,16 +35,22 @@
 from jace.util import dace_helper, translation_cache as tcache
 
 
-class JaceWrapped(tcache.CachingStage["JaceLowered"]):
+if TYPE_CHECKING:
+    from collections.abc import Callable, Mapping, Sequence
+
+    import dace
+
+
+class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
     """A function ready to be specialized, lowered, and compiled.
 
     This class represents the output of functions such as `jace.jit()` and is the first stage in
-    the translation/compilation chain of Jace. A user should never create a `JaceWrapped` object
+    the translation/compilation chain of JaCe. A user should never create a `JaCeWrapped` object
     directly, instead `jace.jit` should be used for that.
     While it supports just-in-time lowering and compilation these steps can also be performed
-    explicitly. The lowering performed by this stage is cached, thus if a `JaceWrapped` object is
+    explicitly. The lowering performed by this stage is cached, thus if a `JaCeWrapped` object is
     lowered later, with the same argument the result is taken from the cache.
-    Furthermore, a `JaceWrapped` object is composable with all Jax transformations.
+    Furthermore, a `JaCeWrapped` object is composable with all Jax transformations.
 
     Args:
         fun:                    The function that is wrapped.
@@ -88,7 +92,7 @@ def __call__(
         """Executes the wrapped function, lowering and compiling as needed in one step."""
 
         # If we are inside a traced context, then we forward the call to the wrapped function.
-        #  This ensures that Jace is composable with Jax.
+        #  This ensures that JaCe is composable with Jax.
         if util.is_tracing_ongoing(*args, **kwargs):
             return self._fun(*args, **kwargs)
 
@@ -101,7 +105,7 @@ def lower(
         self,
         *args: Any,
         **kwargs: Any,
-    ) -> JaceLowered:
+    ) -> JaCeLowered:
         """Lower this function explicitly for the given arguments.
 
         Performs the first two steps of the AOT steps described above, i.e. stage out to Jaxpr
@@ -128,7 +132,7 @@ def lower(
             tsdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
         ptrans.postprocess_jaxpr_sdfg(tsdfg=tsdfg, fun=self.wrapped_fun)
 
-        return JaceLowered(tsdfg)
+        return JaCeLowered(tsdfg)
 
     @property
     def wrapped_fun(self) -> Callable:
@@ -139,7 +143,7 @@ def _make_call_description(
         self,
         *args: Any,
     ) -> tcache.StageTransformationSpec:
-        """This function computes the key for the `JaceWrapped.lower()` call to cache it.
+        """This function computes the key for the `JaCeWrapped.lower()` call to cache it.
 
         The function will compute a full abstract description on its argument. Currently it is
         only able to handle positional argument and does not support static arguments.
@@ -148,13 +152,13 @@ def _make_call_description(
         return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
 
 
-class JaceLowered(tcache.CachingStage["JaceCompiled"]):
+class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
     """Represents the original computation as an SDFG.
 
-    It represents the computation wrapped by a `JaceWrapped` translated and lowered to SDFG.
-    It is followed by the `JaceCompiled` stage.
-    Although, `JaceWrapped` is composable with Jax transformations `JaceLowered` is not.
-    A user should never create such an object, instead `JaceWrapped.lower()` should be used.
+    It represents the computation wrapped by a `JaCeWrapped` translated and lowered to SDFG.
+    It is followed by the `JaCeCompiled` stage.
+    Although, `JaCeWrapped` is composable with Jax transformations `JaCeLowered` is not.
+    A user should never create such an object, instead `JaCeWrapped.lower()` should be used.
 
     Args:
         tsdfg:  The lowered SDFG with metadata. Must be finalized.
@@ -181,11 +185,11 @@ def __init__(
     def compile(
         self,
         compiler_options: CompilerOptions | None = None,
-    ) -> JaceCompiled:
+    ) -> JaCeCompiled:
         """Optimize and compile the lowered SDFG using `compiler_options`.
 
         Returns an object that encapsulates a compiled SDFG object. To influence the various
-        optimizations and compile options of Jace you can use the `compiler_options` argument.
+        optimizations and compile options of JaCe you can use the `compiler_options` argument.
         If nothing is specified `jace.optimization.DEFAULT_OPTIMIZATIONS` will be used.
 
         Note:
@@ -197,7 +201,7 @@ def compile(
         tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
         optimization.jace_optimize(tsdfg=tsdfg, **self._make_compiler_options(compiler_options))
 
-        return JaceCompiled(
+        return JaCeCompiled(
             csdfg=util.compile_jax_sdfg(tsdfg),
             inp_names=tsdfg.inp_names,
             out_names=tsdfg.out_names,
@@ -231,7 +235,7 @@ def _make_call_description(
         """This function computes the key for the `self.compile()` call to cache it.
 
         The key that is computed by this function is based on the concrete values of the passed
-        compiler options. This is different from the key computed by `JaceWrapped` which is an
+        compiler options. This is different from the key computed by `JaCeWrapped` which is an
         abstract description.
         """
         options = self._make_compiler_options(compiler_options)
@@ -245,11 +249,11 @@ def _make_compiler_options(
         return optimization.DEFAULT_OPTIMIZATIONS | (compiler_options or {})
 
 
-class JaceCompiled:
+class JaCeCompiled:
     """Compiled version of the SDFG.
 
-    This is the last stage of the jit chain. A user should never create a `JaceCompiled` instance,
-    instead `JaceLowered.compile()` should be used.
+    This is the last stage of the jit chain. A user should never create a `JaCeCompiled` instance,
+    instead `JaCeLowered.compile()` should be used.
 
     Args:
         csdfg:      The compiled SDFG object.
@@ -294,14 +298,14 @@ def __call__(
         )
 
 
-#: Known compilation stages in Jace.
-Stage = JaceWrapped | JaceLowered | JaceCompiled
+#: Known compilation stages in JaCe.
+Stage = JaCeWrapped | JaCeLowered | JaCeCompiled
 
 
 __all__ = [
-    "Stage",
     "CompilerOptions",  # export for compatibility with Jax.
-    "JaceWrapped",
-    "JaceLowered",
-    "JaceCompiled",
+    "JaCeCompiled",
+    "JaCeLowered",
+    "JaCeWrapped",
+    "Stage",
 ]
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index cda6c85..95bf4c7 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -26,8 +26,8 @@
     "PrimitiveTranslator",
     "PrimitiveTranslatorCallable",
     "TranslatedJaxprSDFG",
-    "register_primitive_translator",
     "get_regsitered_primitive_translators",
-    "set_active_primitive_translators_to",
     "make_primitive_translator",
+    "register_primitive_translator",
+    "set_active_primitive_translators_to",
 ]
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index 4faf45d..b00f167 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -200,14 +200,13 @@ def get_array(
     @overload
     def map_jax_var_to_sdfg(
         self,
-        jax_var: str | jax_core.Atom | util.JaCeVar,
+        jax_var: jax_core.Atom | util.JaCeVar,
+        allow_fail: Literal[False] = False,
     ) -> str: ...
 
     @overload
     def map_jax_var_to_sdfg(
-        self,
-        jax_var: str | jax_core.Atom | util.JaCeVar,
-        allow_fail: Literal[True],
+        self, jax_var: jax_core.Atom | util.JaCeVar, allow_fail: Literal[True]
     ) -> str | None: ...
 
     def map_jax_var_to_sdfg(
@@ -222,7 +221,7 @@ def map_jax_var_to_sdfg(
             allow_fail:     If mapping is not known return `None` instead of raising `KeyError`.
         """
         if isinstance(jax_var, jax_core.Literal):
-            raise RuntimeError("There is no SDFG variable for literal '{jax_var}'.")
+            raise RuntimeError(f"There is no SDFG variable for literal '{jax_var}'.")
         if jax_var in self._jax_name_map:
             sdfg_name = self._jax_name_map[jax_var]
         elif allow_fail:
@@ -249,9 +248,7 @@ def is_allocated(self) -> bool:
 
         If `self` is allocated then there is also an ongoing translation process.
         """
-        if len(self._ctx_stack) != 0:
-            return True
-        return False
+        return len(self._ctx_stack) != 0
 
     def is_root_translator(self) -> bool:
         """Tests if `self` is the root translator.
@@ -260,9 +257,7 @@ def is_root_translator(self) -> bool:
         """
         if not self.is_allocated():
             raise RuntimeError("Driver is not allocated.")
-        if len(self._ctx_stack) == 1:
-            return True
-        return False
+        return len(self._ctx_stack) == 1
 
     def add_jax_name_mapping(
         self,
@@ -324,6 +319,10 @@ def add_array(
             pipeline, should be handle to handle it. But there are some special parts that
             might explicitly want a scalar, it also might block certain compiler optimization.
         """
+
+        if isinstance(arg, jax_core.Literal):
+            raise ValueError(f"Can not generate an SDFG variable for literal '{arg}'.")
+
         shape: tuple[int | dace.symbol | str, ...] = util.get_jax_var_shape(arg)
         dtype: dace.typeclass = util.get_jax_var_dtype(arg)
         storage: dace.StorageType = dace.StorageType.Default  # Set at later stages (optimization)
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index bfe5125..5cf8a58 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -14,11 +14,12 @@
 
 from __future__ import annotations
 
-from collections.abc import Callable
 from typing import TYPE_CHECKING
 
 
 if TYPE_CHECKING:
+    from collections.abc import Callable
+
     from jace import translator
 
 
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index 0ceb1c7..e1dbac0 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -16,14 +16,15 @@
 from __future__ import annotations
 
 from abc import abstractmethod
-from collections.abc import Callable, Mapping, MutableMapping, MutableSequence, Sequence
 from typing import TYPE_CHECKING, Literal, Protocol, cast, overload, runtime_checkable
 
-import dace
-from jax import core as jax_core
-
 
 if TYPE_CHECKING:
+    from collections.abc import Callable, Mapping, MutableMapping, MutableSequence, Sequence
+
+    import dace
+    from jax import core as jax_core
+
     from jace import translator
 
 #: Global registry of the active primitive translators.
@@ -102,7 +103,7 @@ class PrimitiveTranslator(PrimitiveTranslatorCallable, Protocol):
     driver object, which also owns and manage the primitive translators. In the end this implements
     the delegation pattern.
 
-    You can use `jace.translator.register_primitive_translator()` to register your translator to Jace.
+    You can use `jace.translator.register_primitive_translator()` to register your translator to JaCe.
     """
 
     @property
@@ -177,7 +178,7 @@ def register_primitive_translator(
     translator.PrimitiveTranslator
     | Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]
 ):
-    """Adds a primitive translator to Jace's global registry.
+    """Adds a primitive translator to JaCe's global registry.
 
     If a translator for `primitive` is already registered an error will be generated. However,
     by specifying `overwrite` `primitive_translator` will replace the current one.
@@ -207,7 +208,7 @@ def wrapper(
 
 
 def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTranslator]:
-    """Returns a copy of the current state of Jace's global primitive registry.
+    """Returns a copy of the current state of JaCe's global primitive registry.
 
     The function returns a mapping that maps the name of a primitive to the associated translator.
     No change to the global registry will affect the return value and vice versa.
@@ -218,7 +219,7 @@ def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTran
 def set_active_primitive_translators_to(
     new_translators: Mapping[str, translator.PrimitiveTranslator],
 ) -> MutableMapping[str, translator.PrimitiveTranslator]:
-    """Exchange the global translator registry of Jace with `new_translators`.
+    """Exchange the global translator registry of JaCe with `new_translators`.
 
     The function will return the state of the global translator registry just before this call.
     Any changes to `new_translators` after calling this function will have no effect on the
diff --git a/src/jace/translator/primitive_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
index 9b10ca4..afce301 100644
--- a/src/jace/translator/primitive_translators/alu_translator.py
+++ b/src/jace/translator/primitive_translators/alu_translator.py
@@ -9,15 +9,18 @@
 
 from __future__ import annotations
 
-from collections.abc import MutableSequence, Sequence
-from typing import Any, Final, cast
+from typing import TYPE_CHECKING, Any, Final, cast
 
 import dace
 import numpy as np
 from jax import core as jax_core
 from typing_extensions import override
 
-from jace import translator
+from jace import translator, util
+
+
+if TYPE_CHECKING:
+    from collections.abc import MutableSequence, Sequence
 
 
 class ALUTranslator(translator.PrimitiveTranslator):
@@ -65,12 +68,13 @@ def __call__(
         assert self._prim_name == eqn.primitive.name
 
         # Determine what kind of input we got and how we should proceed.
-        is_scalar = len(eqn.outvars[0].aval.shape) == 0
-        inp_scalars = [len(Inp.aval.shape) == 0 for i, Inp in enumerate(eqn.invars)]
+        is_scalar = len(util.get_jax_var_shape(eqn.outvars[0])) == 0
+        inp_scalars = [len(util.get_jax_var_shape(Inp)) == 0 for i, Inp in enumerate(eqn.invars)]
         has_scalars_as_inputs = any(inp_scalars)
         has_some_literals = any(x is None for x in in_var_names)
         inps_same_shape = all(
-            eqn.invars[0].aval.shape == eqn.invars[i].aval.shape for i in range(1, len(eqn.invars))
+            util.get_jax_var_shape(eqn.invars[0]) == util.get_jax_var_shape(eqn.invars[i])
+            for i in range(1, len(eqn.invars))
         )
 
         # We will now look which dimensions have to be broadcasted on which operator.
@@ -85,12 +89,12 @@ def __call__(
         elif has_some_literals or has_scalars_as_inputs:
             # This is essentially an array plus a scalar, that is eitehr a literal or a variable.
             assert (not has_some_literals) or all(
-                invar.aval.shape == eqn.outvars[0].aval.shape
+                util.get_jax_var_shape(invar) == util.get_jax_var_shape(eqn.outvars[0])
                 for (invar, x) in zip(eqn.invars, in_var_names, strict=False)
                 if x is not None
             )
             assert (not has_scalars_as_inputs) or all(
-                invar.aval.shape in {eqn.outvars[0].aval.shape, ()}
+                util.get_jax_var_shape(invar) in {util.get_jax_var_shape(eqn.outvars[0]), ()}
                 for (invar, x) in zip(eqn.invars, in_var_names, strict=False)
                 if x is not None
             )
@@ -101,9 +105,11 @@ def __call__(
             #  It seems that Jax ensures this.
             #  We further assume that if the size in a dimension differs then one must have size 1.
             #  This is the size we broadcast over, i.e. conceptually replicated.
-            out_shps = tuple(eqn.outvars[0].aval.shape)  # Shape of the output
-            inp_shpl = tuple(eqn.invars[0].aval.shape)  # Shape of the left/first input
-            inp_shpr = tuple(eqn.invars[1].aval.shape)  # Shape of the right/second input
+            out_shps = tuple(util.get_jax_var_shape(eqn.outvars[0]))  # Shape of the output
+            inp_shpl = tuple(util.get_jax_var_shape(eqn.invars[0]))  # Shape of the left/first input
+            inp_shpr = tuple(
+                util.get_jax_var_shape(eqn.invars[1])
+            )  # Shape of the right/second input
 
             if not ((len(inp_shpl) == len(inp_shpr)) and (len(out_shps) == len(inp_shpr))):
                 raise NotImplementedError("Can not broadcast over different ranks.")
@@ -124,7 +130,7 @@ def __call__(
         tskl_code: str = self._write_tasklet_code(in_var_names, eqn)
         tskl_name: str = eqn.primitive.name
         tskl_map_ranges: list[tuple[str, str]] = [
-            (f"__i{dim}", f"0:{N}") for dim, N in enumerate(eqn.outvars[0].aval.shape)
+            (f"__i{dim}", f"0:{N}") for dim, N in enumerate(util.get_jax_var_shape(eqn.outvars[0]))
         ]
         tskl_output: tuple[str, dace.Memlet] = None  # type: ignore[assignment]
         tskl_inputs: list[tuple[str, dace.Memlet] | tuple[None, None]] = []
@@ -214,14 +220,14 @@ def _write_tasklet_code(
                 continue
 
             jax_in_var: jax_core.Literal = cast(jax_core.Literal, eqn.invars[i])
-            if jax_in_var.aval.shape == ():
+            if util.get_jax_var_shape(jax_in_var) == ():
                 t_val = jax_in_var.val
                 if isinstance(t_val, np.ndarray):
                     t_val = jax_in_var.val.max()  # I do not know a better way in that case
                 t_code = t_code.replace(f"__in{i}", str(t_val))
             else:
                 raise ValueError(
-                    f"Can not handle the literal case of shape: {jax_in_var.aval.shape}"
+                    f"Can not handle the literal case of shape: {util.get_jax_var_shape(jax_in_var)}"
                 )
 
         # Now replace the parameters
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 863472e..51e6b75 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -40,25 +40,25 @@
 
 
 __all__ = [
+    "FORBIDDEN_SDFG_VAR_NAMES",
     "VALID_SDFG_OBJ_NAME",
     "VALID_SDFG_VAR_NAME",
-    "FORBIDDEN_SDFG_VAR_NAMES",
     "JaCeVar",
     "compile_jax_sdfg",
     "dataclass_with_default_init",
+    "get_jax_var_dtype",
+    "get_jax_var_name",
+    "get_jax_var_shape",
     "is_array",
     "is_drop_var",
-    "is_tracing_ongoing",
+    "is_fully_addressable",
     "is_jaceified",
-    "is_jaxified",
     "is_jax_array",
-    "is_fully_addressable",
+    "is_jaxified",
     "is_on_device",
     "is_scalar",
-    "get_jax_var_dtype",
-    "get_jax_var_name",
-    "get_jax_var_shape",
-    "translate_dtype",
-    "run_jax_sdfg",
+    "is_tracing_ongoing",
     "propose_jax_name",
+    "run_jax_sdfg",
+    "translate_dtype",
 ]
diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index a9658fb..f68c22b 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -10,7 +10,6 @@
 from __future__ import annotations
 
 import time
-from collections.abc import Mapping, Sequence
 from typing import TYPE_CHECKING, Any
 
 import dace
@@ -21,6 +20,8 @@
 
 
 if TYPE_CHECKING:
+    from collections.abc import Mapping, Sequence
+
     from jace import translator
     from jace.util import dace_helper
 
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index bed727e..d41ffaa 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -15,15 +15,19 @@
 
 import dataclasses
 import itertools
-from collections.abc import Mapping
-from typing import Any
+from typing import TYPE_CHECKING, Any
 
 import dace
 import jax.core as jax_core
+import numpy as np
 
 import jace.util as util
 
 
+if TYPE_CHECKING:
+    from collections.abc import Mapping
+
+
 @dataclasses.dataclass(repr=True, frozen=True, eq=False)
 class JaCeVar:
     """Replacement for the `jax.Var` class.
@@ -103,6 +107,8 @@ def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symb
     """Returns the shape of `jax_var`."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
+            # AbstractValue, does not have a `shape` attribute, but in all cases we care, it will.
+            assert hasattr(jax_var.aval, "shape")
             return jax_var.aval.shape
         case JaCeVar():
             return jax_var.shape
@@ -114,6 +120,8 @@ def get_jax_var_dtype(jax_var: jax_core.Atom | JaCeVar) -> dace.typeclass:
     """Returns the DaCe equivalent of `jax_var`s datatype."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
+            # AbstractValue, does not have a `dtype` attribute, but in all cases we care, it will.
+            assert hasattr(jax_var.aval, "dtype")
             return translate_dtype(jax_var.aval.dtype)
         case JaCeVar():
             return jax_var.dtype
@@ -192,3 +200,19 @@ def propose_jax_name(
     if jax_name in util.FORBIDDEN_SDFG_VAR_NAMES:
         jax_name = f"__jace_forbidden_{jax_name}"
     return jax_name
+
+
+def get_jax_literal_value(lit: jax_core.Atom) -> bool | float | int | np.generic:
+    """Returns the value a literal is wrapping.
+
+    The function guarantees to return a scalar value.
+    """
+    if not isinstance(lit, jax_core.Literal):
+        raise ValueError(f"Can only extract literals not '{type(lit)}'.")
+    val = lit.val
+    if isinstance(val, np.ndarray):
+        assert val.shape == ()
+        return val.max()
+    if isinstance(val, (bool, float, int)):
+        return val
+    raise TypeError(f"Failed to extract value from '{lit}'.")
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 0355dac..ae2f41b 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -21,17 +21,18 @@
 from jace import stages
 
 
-def is_jaceified(obj: Any) -> TypeGuard[stages.JaceWrapped]:
+def is_jaceified(obj: Any) -> TypeGuard[stages.JaCeWrapped]:
     """Tests if `obj` is decorated by JaCe.
 
     Similar to `is_jaxified`, but for JaCe object.
     """
+
     if util.is_jaxified(obj):
         return False
-    return isinstance(obj, stages.JaceWrapped)
+    return isinstance(obj, stages.JaCeWrapped)
 
 
-def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVarp]:
+def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVar]:
     """Tests if `jax_var` is a drop variable, i.e. a variable that is not read from in a Jaxpr."""
 
     if isinstance(jax_var, jax_core.DropVar):
@@ -48,7 +49,7 @@ def is_jaxified(
 
     A "jaxified" object is an object that was processed by Jax.
     While a return value of `True` guarantees a jaxified object, `False` does not proof the
-    contrary. See also `jace.util.is_jaceified()` to tests if something is a Jace object.
+    contrary. See also `jace.util.is_jaceified()` to tests if something is a JaCe object.
     """
     jaxifyed_types = (
         jax_core.Primitive,
@@ -118,11 +119,7 @@ def is_on_device(
     function is more of a test, if there is a GPU or not.
     """
     if is_jax_array(obj):
-        try:
-            _ = obj.__cuda_array_interface__
-            return True
-        except AttributeError:
-            return False
+        return hasattr(obj, "__cuda_array_interface__")
     return dace.is_gpu_array(obj)
 
 
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 42f7b6a..c0f6fce 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -7,8 +7,8 @@
 
 """This module contains the functionality related to the compilation cache of the stages.
 
-The cache currently caches the lowering, i.e. the result of `JaceWrapped.lower()` and the
-compilation, i.e. `JaceLowered.compile()`. The caches are on a per stage basis and not on a
+The cache currently caches the lowering, i.e. the result of `JaCeWrapped.lower()` and the
+compilation, i.e. `JaCeLowered.compile()`. The caches are on a per stage basis and not on a
 per instant basis. To make a stage cacheable, it must be derived from `CachingStage` and
 its transition function must be decoration with `@cached_transition`.
 """
diff --git a/tests/test_caching.py b/tests/test_caching.py
index 9a624a2..437feee 100644
--- a/tests/test_caching.py
+++ b/tests/test_caching.py
@@ -18,6 +18,7 @@
 
 import jace
 from jace import optimization, stages
+from jace.util import translation_cache as tcache
 
 
 @pytest.fixture(autouse=True)
@@ -29,15 +30,13 @@ def _clear_translation_cache():
     Todo:
         Ask Enrique how I can make that fixture apply everywhere not just in the file but the whole test suite.
     """
-    from jace.util import translation_cache as tcache
-
     tcache.clear_translation_cache()
     yield
     tcache.clear_translation_cache()
 
 
-def test_caching_same_sizes():
-    """The behaviour of the cache if same sizes are used."""
+def test_caching_same_sizes() -> None:
+    """The behaviour of the cache if same sizes are used, in two different functions."""
 
     # Counter for how many time it was lowered.
     lowering_cnt = [0]
@@ -61,8 +60,8 @@ def wrapped(A, B):
     BB = B + 0.638956
 
     # Now let's lower it once directly and call it.
-    lowered: stages.JaceLowered = wrapped.lower(A, B)
-    compiled: stages.JaceCompiled = lowered.compile()
+    lowered: stages.JaCeLowered = wrapped.lower(A, B)
+    compiled: stages.JaCeCompiled = lowered.compile()
     assert lowering_cnt[0] == 1
     assert np.allclose(testee(A, B), compiled(A, B))
 
@@ -112,8 +111,7 @@ def wrapped(A, B):
     assert compiled1 is not compiled2
 
 
-@pytest.mark.skip(reason="Missing primitive translators")
-def test_caching_different_structure():
+def test_caching_different_structure() -> None:
     """Now tests if we can handle multiple arguments with different structures.
 
     Todo:
@@ -133,13 +131,11 @@ def wrapped(A, B):
     C = np.full((5, 3), 14, dtype=np.float64)
     D = np.full((6, 3), 14, dtype=np.int64)
 
-    # These are the arrays.
-    args: dict[int, np.ndarray] = {id(x): x for x in [A, B, C, D]}
     # These are the known lowerings.
-    lowerings: dict[tuple[int, int], stages.JaceLowered] = {}
+    lowerings: dict[tuple[int, int], stages.JaCeLowered] = {}
     lowering_ids: set[int] = set()
     # These are the known compilations.
-    compilations: dict[tuple[int, int], stages.JaceCompiled] = {}
+    compilations: dict[tuple[int, int], stages.JaCeCompiled] = {}
     compiled_ids: set[int] = set()
 
     # Generating the lowerings
@@ -166,7 +162,7 @@ def wrapped(A, B):
         assert compiled1 is ccompiled
 
 
-def test_caching_compilation():
+def test_caching_compilation() -> None:
     """Tests the compilation cache, this is just very simple, since it uses the same code paths as lowering."""
 
     @jace.jit
@@ -226,6 +222,103 @@ def testee(A: np.ndarray) -> np.ndarray:
         assert lowering_cnt[0] == i + 1
 
 
+def test_caching_eviction_simple():
+    """Simple tests for cache eviction."""
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A + 1.0
+
+    cache: tcache.StageCache = testee._cache
+
+    first_lowered = testee.lower(np.ones(10))
+    first_key = cache.front()[0]
+    second_lowered = testee.lower(np.ones(11))
+    second_key = cache.front()[0]
+    third_lowered = testee.lower(np.ones(12))
+    third_key = cache.front()[0]
+
+    assert first_key != second_key
+    assert first_key != third_key
+    assert second_key != third_key
+    assert cache[first_key] is first_lowered
+    assert cache[second_key] is second_lowered
+    assert cache[third_key] is third_lowered
+
+    assert first_key in cache
+    assert second_key in cache
+    assert third_key in cache
+    assert cache.front()[0] == third_key
+
+    # We now evict the second key, which should not change anything on the order.
+    cache.popitem(second_key)
+    assert first_key in cache
+    assert second_key not in cache
+    assert third_key in cache
+    assert cache.front()[0] == third_key
+
+    # Now we modify first_key, which moves it to the front.
+    cache[first_key] = first_lowered
+    assert first_key in cache
+    assert second_key not in cache
+    assert third_key in cache
+    assert cache.front()[0] == first_key
+
+    # Now we evict the oldest one, which is third_key
+    cache.popitem(None)
+    assert first_key in cache
+    assert second_key not in cache
+    assert third_key not in cache
+    assert cache.front()[0] == first_key
+
+
+def test_caching_eviction_complex():
+    """Tests if the stuff is properly evicted if the cache is full."""
+
+    @jace.jit
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A + 1.0
+
+    cache: tcache.StageCache = testee._cache
+    capacity = cache.capacity
+    assert len(cache) == 0
+
+    # Lets fill the cache to the brim.
+    for i in range(capacity):
+        A = np.ones(i + 10)
+        lowered = testee.lower(A)
+        assert len(cache) == i + 1
+
+        if i == 0:
+            first_key: tcache.StageTransformationSpec = cache.front()[0]
+            first_lowered = cache[first_key]
+            assert lowered is first_lowered
+        elif i == 1:
+            second_key: tcache.StageTransformationSpec = cache.front()[0]
+            assert second_key != first_key
+            assert cache[second_key] is lowered
+        assert first_key in cache
+
+    assert len(cache) == capacity
+    assert first_key in cache
+    assert second_key in cache
+
+    # Now we will modify the first key, this should make it the newest.
+    assert cache.front()[0] != first_key
+    cache[first_key] = first_lowered
+    assert len(cache) == capacity
+    assert first_key in cache
+    assert second_key in cache
+    assert cache.front()[0] == first_key
+
+    # Now we will add a new entry to the cache, this will evict the second entry.
+    _ = testee.lower(np.ones(capacity + 1000))
+    assert len(cache) == capacity
+    assert cache.front()[0] != first_key
+    assert first_key in cache
+    assert second_key not in cache
+
+
 def test_caching_strides() -> None:
     """Test if the cache detects a change in strides."""
 
@@ -257,6 +350,6 @@ def wrapped(A: np.ndarray) -> np.ndarray:
         F_lower = wrapped.lower(F)
         F_res = wrapped(F)
     assert F_lower is None  # Remove later.
-    assert C_res is not F_res  # Remove later
+    assert C_res is not F_res  # type: ignore[unreachable]
     assert np.allclose(F_res, C_res)
     assert F_lower is not C_lower
diff --git a/tests/test_jax_api.py b/tests/test_jax_api.py
index 221733a..f6c89df 100644
--- a/tests/test_jax_api.py
+++ b/tests/test_jax_api.py
@@ -45,7 +45,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 
 
 def test_composition_itself():
-    """Tests if Jace is composable with itself."""
+    """Tests if JaCe is composable with itself."""
 
     # Pure Python functions
     def f_ref(x):
@@ -83,7 +83,7 @@ def ddf(x):
 
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_composition_with_jax():
-    """Tests if Jace can interact with Jax and vice versa."""
+    """Tests if JaCe can interact with Jax and vice versa."""
 
     def base_fun(A, B, C):
         return A + B * jnp.sin(C) - A * B
@@ -102,7 +102,7 @@ def jax_fun(A, B, C):
 
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_composition_with_jax_2():
-    """Second test if Jace can interact with Jax and vice versa."""
+    """Second test if JaCe can interact with Jax and vice versa."""
 
     @jax.jit
     def f1_jax(A, B):
@@ -187,7 +187,7 @@ def df(x):
     assert df(x2) == df_x2, f"Failed upper branch, expected '{df_x2}', got '{res_2}'."
 
 
-@pytest.mark.skip(reason="Running Jace with disabled 'x64' support does not work.")
+@pytest.mark.skip(reason="Running JaCe with disabled 'x64' support does not work.")
 def test_disabled_x64():
     """Tests the behaviour of the tool chain if we explicitly disable x64 support in Jax.
 
@@ -203,7 +203,7 @@ def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
 
     # Run them with disabled x64 support
     with disable_x64():
-        # Jace
+        # JaCe
         jace_testee = jace.jit(testee)
         jace_lowered = jace_testee.lower(A, B)
         jace_comp = jace_lowered.compile()
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_driver.py
index 3a16cee..5dafb03 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_driver.py
@@ -21,7 +21,7 @@
 from jace.util import JaCeVar
 
 
-# These are some Jace variables that we use inside the tests
+# These are some JaCe variables that we use inside the tests
 #  Unnamed arrays
 array1 = JaCeVar((10, 12), dace.float64)
 array2 = JaCeVar((10, 13), dace.float32)
@@ -315,6 +315,7 @@ def test_driver_variable_multiple_variables(
     prefix_sdfg_name = translation_driver.add_array(
         array1, update_var_mapping=False, name_prefix=prefix
     )
+    assert prefix_expected_name == prefix_sdfg_name
     assert prefix_expected_name in translation_driver.sdfg.arrays
     assert narray1 == translation_driver.map_jax_var_to_sdfg(array1)
 
@@ -369,13 +370,12 @@ def test_driver_variable_alloc_list_cleaning(
     cause an error because it is proposed to `a`, which is already used.
     """
     var_list = [array1, nscal, scal2]
-    exp_names = ["a", nscal.name, "c"]
 
     with pytest.raises(
         expected_exception=ValueError,
         match=re.escape(f"add_array({scal2}): The proposed name 'a', is used."),
     ):
-        res_names = translation_driver.create_jax_var_list(var_list)
+        _ = translation_driver.create_jax_var_list(var_list)
 
     # This currently fails, because the `create_jax_var_list()` function does not clean up.
     assert len(translation_driver.arrays) == 0
@@ -496,10 +496,8 @@ def test_driver_constants(
     assert np.all(translation_driver.sdfg.constants["__const_a"] == constant)
 
 
-def test_driver_scalar_return_value(
-    translation_driver: translator.JaxprTranslationDriver,
-) -> None:
-    """Tests if scalars can be returned directly"""
+def test_driver_scalar_return_value() -> None:
+    """Tests if scalars can be returned directly."""
 
     def scalar_ops(A: float) -> float:
         return A + A - A * A
@@ -519,6 +517,18 @@ def wrapped(A: float) -> float:
     assert lower_cnt[0] == 1
 
 
+@pytest.mark.skip(reason="Currently 'scalar' return values, are actually shape '(1,)' arrays.")
+def test_driver_scalar_return_type() -> None:
+    """Tests if the type is the same, in case of scalar return."""
+
+    @jace.jit
+    def wrapped(A: np.float64) -> np.float64:
+        return A + A - A * A
+
+    A = np.float64(1.0)
+    assert type(A) is np.float64, f"Expected type 'np.float64', but got '{type(A).__name__}'."
+
+
 def test_driver_jace_var() -> None:
     """Simple tests about the `JaCeVar` objects."""
     for iname in ["do", "", "_ _", "9al", "_!"]:
@@ -529,9 +539,7 @@ def test_driver_jace_var() -> None:
             _ = JaCeVar((), dace.int8, name=iname)
 
 
-def test_driver_F_strides(
-    translation_driver: translator.JaxprTranslationDriver,
-) -> None:
+def test_driver_F_strides() -> None:
     """Tests if we can lower without a standard stride.
 
     Notes:
diff --git a/tests/test_misc.py b/tests/test_misc.py
index ec2a5b2..8870674 100644
--- a/tests/test_misc.py
+++ b/tests/test_misc.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements general tests for Jace."""
+"""Implements general tests for JaCe."""
 
 from __future__ import annotations
 
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index b9c1d4e..3579da6 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements tests to check if the sorting algorithm is correct."""
+"""Implements tests for managing the primitive subtranslators."""
 
 from __future__ import annotations
 
@@ -61,19 +61,19 @@ def __call__(self) -> None:  # type: ignore[override]  # Arguments
 
 
 @make_primitive_translator("non_existing_callable_primitive3")
-def SubTrans3_Callable(*args: Any, **kwargs: Any) -> None:
+def SubTrans3_Callable(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
     raise NotImplementedError
 
 
 @make_primitive_translator("add")
-def fake_add_translator(*args: Any, **kwargs: Any) -> None:
+def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
     raise NotImplementedError
 
 
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_regsitered_primitive_translators()) == 37
+    assert len(get_regsitered_primitive_translators()) == 47
 
 
 @pytest.mark.usefixtures("no_builtin_translators")
@@ -104,7 +104,7 @@ def test_subtranslatior_managing_isolation():
     """Tests if `get_regsitered_primitive_translators()` protects the internal registry."""
     assert (
         get_regsitered_primitive_translators()
-        is not translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
+        is not translator.managing._PRIMITIVE_TRANSLATORS_DICT
     )
 
     initial_primitives = get_regsitered_primitive_translators()
@@ -138,7 +138,7 @@ def same_structure(d1: dict, d2: dict) -> bool:
     # Now change the initial one with the mutated one.
     #  The object is copied but should still have the same structure.
     old_active = set_active_primitive_translators_to(mutated_primitives)
-    assert mutated_primitives is not translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
+    assert mutated_primitives is not translator.managing._PRIMITIVE_TRANSLATORS_DICT
     assert same_structure(old_active, initial_primitives)
     assert same_structure(mutated_primitives, get_regsitered_primitive_translators())
 
@@ -150,7 +150,7 @@ def test_subtranslatior_managing_callable_annotation():
     prim_name = "non_existing_property"
 
     @make_primitive_translator(prim_name)
-    def non_existing_translator(*args: Any, **kwargs: Any) -> None:
+    def non_existing_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
         raise NotImplementedError
 
     assert hasattr(non_existing_translator, "primitive")
@@ -163,7 +163,7 @@ def test_subtranslatior_managing_overwriting():
     current_add_translator = get_regsitered_primitive_translators()["add"]
 
     @make_primitive_translator("add")
-    def useless_add_translator(*args: Any, **kwargs: Any) -> None:
+    def useless_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
         raise NotImplementedError
 
     # This will not work because it is not overwritten.
@@ -191,7 +191,7 @@ def test_subtranslatior_managing_overwriting_2():
 
     @register_primitive_translator(overwrite=True)
     @make_primitive_translator("add")
-    def still_useless_but_a_bit_less(*args: Any, **kwargs: Any) -> None:
+    def still_useless_but_a_bit_less(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
         trans_cnt[0] += 1
         return
 
@@ -222,7 +222,7 @@ def foo(A):
 
     @register_primitive_translator(overwrite=True)
     @make_primitive_translator("add")
-    def useless_add_translator(*args: Any, **kwargs: Any) -> None:
+    def useless_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
         raise NotImplementedError("The 'useless_add_translator' was called as expected.")
 
     # Since `foo` was already constructed, a new registering can not change anything.

From 699b93e6c13b0b75bfd6c30b6259157554394c8f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 30 May 2024 15:04:18 +0200
Subject: [PATCH 277/458] Rereverted Some of Enrique's suggestions.

---
 src/jace/optimization.py                      |   5 +-
 src/jace/stages.py                            |  16 +--
 src/jace/translator/__init__.py               |   3 +-
 .../translator/jaxpr_translator_driver.py     | 115 ++++++++++++++++--
 src/jace/translator/post_translation.py       |  30 ++---
 src/jace/translator/translated_jaxpr_sdfg.py  |  74 ++++-------
 src/jace/util/compiling.py                    |   7 +-
 tests/test_caching.py                         |  98 +--------------
 tests/test_sub_translators_alu.py             |   2 +-
 tests/test_subtranslator_helper.py            |   6 +-
 10 files changed, 163 insertions(+), 193 deletions(-)

diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index 68f7b1f..c90d612 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -50,20 +50,19 @@ def jace_optimize(
     tsdfg: translator.TranslatedJaxprSDFG,
     **kwargs: Unpack[CompilerOptions],
 ) -> None:
-    """Performs optimization of the `fsdfg` _in place_.
+    """Performs optimization of the `tsdfg` _in place_.
 
     Currently this function only supports simplification.
     Its main job is to exists that we have something that we can call in the tool chain.
 
     Args:
+        tsdfg:          The translated SDFG that should be optimized.
         simplify:       Run the simplification pipeline.
         auto_optimize:  Run the auto optimization pipeline (currently does nothing)
 
     Note:
         By default all optimizations are disabled and this function acts as a noops.
     """
-    if not tsdfg.is_finalized:
-        raise ValueError("Can only optimize finalized SDFGs.")
     if not kwargs:
         return
 
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 3f42436..296690a 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -129,8 +129,15 @@ def lower(
                 primitive_translators=self._primitive_translators
             )
             jaxpr = _jax.make_jaxpr(self._fun)(*args)
-            tsdfg: translator.TranslatedJaxprSDFG = driver.translate_jaxpr(jaxpr)
-        ptrans.postprocess_jaxpr_sdfg(tsdfg=tsdfg, fun=self.wrapped_fun)
+            trans_ctx: translator.TranslationContext = driver.translate_jaxpr(jaxpr)
+
+        # Perform the post processing and turn it into a `TranslatedJaxprSDFG` that can be
+        #  compiled and called later.
+        # NOTE: `tsdfg` was deepcopied as a side effect of post processing.
+        tsdfg: translator.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
+            trans_ctx=trans_ctx,
+            fun=self.wrapped_fun,
+        )
 
         return JaCeLowered(tsdfg)
 
@@ -160,9 +167,6 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
     Although, `JaCeWrapped` is composable with Jax transformations `JaCeLowered` is not.
     A user should never create such an object, instead `JaCeWrapped.lower()` should be used.
 
-    Args:
-        tsdfg:  The lowered SDFG with metadata. Must be finalized.
-
     Note:
         `self` will manage the passed `tsdfg` object. Modifying it results in undefined behavior.
 
@@ -176,8 +180,6 @@ def __init__(
         self,
         tsdfg: translator.TranslatedJaxprSDFG,
     ) -> None:
-        if not tsdfg.is_finalized:
-            raise ValueError("The translated SDFG must be finalized.")
         super().__init__()
         self._translated_sdfg = tsdfg
 
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 95bf4c7..31c6db1 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -9,7 +9,7 @@
 
 from __future__ import annotations
 
-from .jaxpr_translator_driver import JaxprTranslationDriver
+from .jaxpr_translator_driver import JaxprTranslationDriver, TranslationContext
 from .primitive_translator import (
     PrimitiveTranslator,
     PrimitiveTranslatorCallable,
@@ -26,6 +26,7 @@
     "PrimitiveTranslator",
     "PrimitiveTranslatorCallable",
     "TranslatedJaxprSDFG",
+    "TranslationContext",
     "get_regsitered_primitive_translators",
     "make_primitive_translator",
     "register_primitive_translator",
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_driver.py
index b00f167..ddbdad8 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_driver.py
@@ -66,7 +66,7 @@ class JaxprTranslationDriver:
 
     _primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable]
     _jax_name_map: dict[jax_core.Var | util.JaCeVar, str]
-    _ctx_stack: list[translator.TranslatedJaxprSDFG]
+    _ctx_stack: list[TranslationContext]
 
     def __init__(
         self,
@@ -90,7 +90,7 @@ def translate_jaxpr(
         jaxpr: jax_core.ClosedJaxpr,
         *,
         name: str | None = None,
-    ) -> translator.TranslatedJaxprSDFG:
+    ) -> TranslationContext:
         """Perform the translation of a Jaxpr into a SDFG.
 
         In case this function is called and `self` has an ongoing translation process, a new
@@ -100,7 +100,7 @@ def translate_jaxpr(
         Returns:
             The function will translate the passed Jaxpr object into an SDFG in canonical form.
             This SDFG together with additional meta data, that is needed for further processing
-            is encapsulated inside a `TranslatedJaxprSDFG` object.
+            is encapsulated inside a `TranslationContext` object.
 
         Args:
             name:                   Use this name for the SDFG instead some generated one.
@@ -506,10 +506,9 @@ def _allocate_translation_ctx(
         Args:
             name:               The name of the SDFG.
         """
-        from jace import translator  # Cyclic import
 
         self._ctx_stack.append(
-            translator.TranslatedJaxprSDFG(
+            TranslationContext(
                 name=name,
             )
         )
@@ -517,12 +516,12 @@ def _allocate_translation_ctx(
         return self
 
     @property
-    def _ctx(self) -> translator.TranslatedJaxprSDFG:
+    def _ctx(self) -> TranslationContext:
         """Returns the currently active translation context."""
         assert len(self._ctx_stack) != 0, "No context is active."
         return self._ctx_stack[-1]
 
-    def _clear_translation_ctx(self) -> translator.TranslatedJaxprSDFG | None:
+    def _clear_translation_ctx(self) -> TranslationContext | None:
         """Remove the current active context from `self` and returns its state.
 
         If `self` is not allocated it will return `None`.
@@ -617,12 +616,12 @@ def _translate_single_eqn(
     def _translate_jaxpr_internal(
         self,
         jaxpr: jax_core.ClosedJaxpr,
-    ) -> translator.TranslatedJaxprSDFG:
+    ) -> TranslationContext:
         """Performs the actual translation of the Jaxpr into an SDFG.
 
         The function assumes that the context is allocated as well as the initial variables.
         The function will return the internal state of `self` encapsulated inside a
-        `TranslatedJaxprSDFG` object. The function will also deallocate the current context
+        `TranslationContext` object. The function will also deallocate the current context
         upon return.
 
         Args:
@@ -647,7 +646,7 @@ def _translate_jaxpr_internal(
 
         self._ctx.out_names = tuple(out_var_names)
 
-        return cast("translator.TranslatedJaxprSDFG", self._clear_translation_ctx())
+        return cast(TranslationContext, self._clear_translation_ctx())
 
     def _handle_null_jaxpr(
         self,
@@ -719,3 +718,99 @@ def _start_state(self) -> dace.SDFGState:
     def _terminal_sdfg_state(self) -> dace.SDFGState:
         """Returns the current terminal state of the SDFG under construction."""
         return cast(dace.SDFGState, self._ctx.terminal_state)
+
+
+class TranslationContext:
+    """Translation context used by the `JaxprTranslationDriver`.
+
+    Essentially it is a `TranslatedJaxprSDFG` object together with some additional meta data,
+    that is needed during translation. It is also returned by the `translate_jaxpr()` function.
+    It is important that the SDFG it encapsulates is not directly usable and should be passed
+    to the post processing stage.
+
+    Attributes:
+        start_state:    The first state in the SDFG state machine.
+        terminal_state: The (currently) last state in the state machine.
+
+    Args:
+        name:       The name of the SDFG, will be forwarded to the encapsulated `TranslatedJaxprSDFG`.
+    """
+
+    jsdfg: translator.TranslatedJaxprSDFG
+    start_state: dace.SDFGState
+    terminal_state: dace.SDFGState
+
+    def __init__(
+        self,
+        name: str | None = None,
+    ) -> None:
+        from jace import translator  # Cyclic import
+
+        self.jsdfg = translator.TranslatedJaxprSDFG(name=name)
+        self.start_state = self.sdfg.add_state(label="initial_state", is_start_block=True)
+        self.terminal_state = self.start_state
+
+    @property
+    def sdfg(self) -> dace.SDFG:
+        return self.jsdfg.sdfg
+
+    @property
+    def inp_names(self) -> tuple[str, ...]:
+        return self.jsdfg.inp_names
+
+    @inp_names.setter
+    def inp_names(self, inp_names: tuple[str, ...]) -> None:
+        if len(inp_names) == 0:
+            raise dace.sdfg.InvalidSDFGError(
+                "There are no input arguments.",
+                self.sdfg,
+                self.sdfg.node_id(self.sdfg.start_state),
+            )
+        if any(inp not in self.sdfg.arrays for inp in inp_names):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Expected to find: {(inp for inp in inp_names if inp not in self.sdfg.arrays)}",
+                self.sdfg,
+                self.sdfg.node_id(self.start_state),
+            )
+        self.jsdfg.inp_names = inp_names
+
+    @property
+    def out_names(self) -> tuple[str, ...]:
+        return self.jsdfg.out_names
+
+    @out_names.setter
+    def out_names(self, out_names: tuple[str, ...]) -> None:
+        if len(out_names) == 0:
+            raise dace.sdfg.InvalidSDFGError(
+                "There are no output arguments.",
+                self.sdfg,
+                self.sdfg.node_id(self.start_state),
+            )
+        if any(out not in self.sdfg.arrays for out in out_names):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Expected to find: {(out for out in out_names if out not in self.sdfg.arrays)}",
+                self.sdfg,
+                self.sdfg.node_id(self.start_state),
+            )
+        self.jsdfg.out_names = out_names
+
+    def validate(self) -> bool:
+        """Validate internal state of `self`.
+
+        This function will not check the embedded SDFG.
+        """
+        if self.start_state and (self.start_state is not self.sdfg.start_block):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Expected to find '{self.start_state}' ({self.sdfg.node_id(self.start_state)}),"
+                f" instead found '{self.sdfg.start_block} ({self.sdfg.node_id(self.sdfg.start_block)}).",
+                self.sdfg,
+                self.sdfg.node_id(self.start_state),
+            )
+        if self.start_state and ({self.terminal_state} != set(self.sdfg.sink_nodes())):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Expected to find '{self.terminal_state}' ({self.sdfg.node_id(self.terminal_state)}),"
+                f" instead found '{self.sdfg.sink_nodes()}.",
+                self.sdfg,
+                self.sdfg.node_id(self.terminal_state),
+            )
+        return True
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index 5cf8a58..aa1cc1a 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -14,6 +14,7 @@
 
 from __future__ import annotations
 
+import copy
 from typing import TYPE_CHECKING
 
 
@@ -24,24 +25,32 @@
 
 
 def postprocess_jaxpr_sdfg(
-    tsdfg: translator.TranslatedJaxprSDFG,
+    trans_ctx: translator.TranslationContext,
     fun: Callable,  # noqa: ARG001  # Currently unused
-) -> None:
-    """Perform the final post processing steps on the SDFG in place.
+) -> translator.TranslatedJaxprSDFG:
+    """Perform the final post processing steps on the `TranslationContext`.
 
-    Afterwards `tsdfg` will be finalized.
+    Returns:
+        The function returns a valid `TranslationContext` that is decoupled from the one
+        that was originally part of `trans_ctx`.
 
     Args:
-        tsdfg:  The translated SDFG object.
-        fun:    The original function that we translated.
+        trans_ctx:  The `TranslationContext` obtained from the `translate_jaxpr()` function.
+        fun:        The original function that was translated.
 
     Todo:
         - Setting correct input names (layer that does not depend on JAX).
         - Setting the correct strides & Storage properties.
     """
     # Currently we do nothing except finalizing.
+    trans_ctx.validate()
+    tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(trans_ctx.jsdfg)
+
     finalize_jaxpr_sdfg(tsdfg)
 
+    tsdfg.validate()
+    return tsdfg
+
 
 def finalize_jaxpr_sdfg(
     tsdfg: translator.TranslatedJaxprSDFG,
@@ -49,14 +58,10 @@ def finalize_jaxpr_sdfg(
     """Finalizes the supplied `tsdfg` object in place.
 
     This function will turn a non finalized, i.e. canonical, SDFG into a finalized one,
-    i.e. after this function `tsdfg.is_finalized` is `True`.
     The function will:
     - mark all input and output variables, i.e. listed in `tsdfg.{inp, out}_names`, as globals,
     - set the `arg_names` property of the SDFG,
-    - deallocate all members of `tsdfg` that are no longer needed.
     """
-    if tsdfg.is_finalized:
-        raise ValueError("The supplied SDFG is already finalized.")
     if not tsdfg.inp_names:
         raise ValueError("Input names are not specified.")
     if not tsdfg.out_names:
@@ -73,8 +78,3 @@ def finalize_jaxpr_sdfg(
     # This forces the signature of the SDFG to include all arguments in order they appear.
     #  If an argument is used as input and output then it is only listed as input.
     tsdfg.sdfg.arg_names = sdfg_arg_names
-
-    # Now we will deallocate the fields and mark `self` as finalized.
-    tsdfg.start_state = None
-    tsdfg.terminal_state = None
-    tsdfg.is_finalized = True
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index e47d11f..1a3fd32 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -15,30 +15,25 @@
 class TranslatedJaxprSDFG:
     """Encapsulates the result of a translation run of the `JaxprTranslationDriver` object.
 
-    This class is used by the `JaxprTranslationDriver` to store the context of the SDFG that is
-    currently under construction and the return value of `JaxprTranslationDriver.translate_jaxpr()`.
-    A user should never create a `TranslatedJaxprSDFG` manually.
+    The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a `TranslationContext`,
+    that was in turn constructed by `JaxprTranslationDriver.translate_jaxpr()` to
+    `postprocess_jaxpr_sdfg()`.
+    This class encapsulates a translated SDFG as well as the meta data needed to run it.
 
-    It might happen that a name appears in both the `inp_names` and `out_names` lists. This happens
-    if an argument is used both as input and output, and it is not an error. In Jax this is called
-    argument donation.
-
-    By default `self` encapsulates a canonical SDFG, see `JaxprTranslationDriver` for more
-    information on this. However, if `is_finalized` is set, then `self` contains a finalized SDFG,
-    which differs from a canonical SDFG in the following ways:
-    - all input and output arrays are marked as global,
-    - however, there are no `__return` arrays, i.e. all return values are passed as arguments,
-    - its `arg_names` are set with set `inp_names + out_names`, however, arguments that are input
-        and outputs are only listed as inputs,
-    - only the `sdfg`, `inp_names`, `out_names` and `is_finalized` are guaranteed to be not `None`.
+    Contrary to the SDFG that is encapsulated inside the `TranslationContext` object, `self`
+    carries a proper SDFG, however:
+    - it does not have `__return*` variables, instead all return arguments are passed by arguments,
+    - its `arg_names` is set to  `inp_names + out_names`, but arguments that are input and outputs
+        are only listed as inputs.
 
     Attributes:
         sdfg:           The SDFG object that was created.
         inp_names:      A list of the SDFG variables that are used as input, same order as `Jaxpr.invars`.
         out_names:      A list of the SDFG variables that are used as output, same order as `Jaxpr.outvars`.
-        start_state:    The first state in the SDFG state machine.
-        terminal_state: The (currently) last state in the state machine.
-        is_finalized:   Indicates if `self` represents a finalized or canonical SDFG.
+
+    It might happen that a name appears in both the `inp_names` and `out_names` lists. This happens
+    if an argument is used both as input and output, and it is not an error. In Jax this is called
+    argument donation.
 
     Args:
         name:   The name that should be given to the SDFG, optional.
@@ -47,64 +42,43 @@ class TranslatedJaxprSDFG:
     sdfg: dace.SDFG
     inp_names: tuple[str, ...]
     out_names: tuple[str, ...]
-    is_finalized: bool
-    start_state: dace.SDFGState | None
-    terminal_state: dace.SDFGState | None
 
     def __init__(
         self,
         name: str | None = None,
     ) -> None:
-        """Initializes the context.
-
-        The function allocates the SDFG and initializes the members properly.
-        However, a user should never call this function directly.
-
-        Args:
-            name:       Name of the SDFG object.
-        """
         if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
         self.sdfg = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
         self.inp_names = ()
         self.out_names = ()
-        self.is_finalized = False
-        self.start_state = self.sdfg.add_state(label="initial_state", is_start_block=True)
-        self.terminal_state = self.start_state
 
     def validate(self) -> bool:
-        """Validate the underlying SDFG.
-
-        The actual SDFG is only validated for finalized SDFGs.
-        """
-        if len(self.inp_names) == 0:
+        """Validate the underlying SDFG."""
+        if not self.inp_names:
             raise dace.sdfg.InvalidSDFGError(
                 "There are no input arguments.",
                 self.sdfg,
                 self.sdfg.node_id(self.sdfg.start_state),
             )
-        if len(self.out_names) == 0:
+        if not all(not self.sdfg.arrays[inp].transient for inp in self.inp_names):
             raise dace.sdfg.InvalidSDFGError(
-                "There are no output arguments.",
+                f"Found transient inputs: {(inp for inp in self.inp_names if self.sdfg.arrays[inp].transient)}",
                 self.sdfg,
-                self.sdfg.node_id(self.start_state),
+                self.sdfg.node_id(self.sdfg.start_state),
             )
-        if self.start_state and (self.start_state is not self.sdfg.start_block):
+        if not self.out_names:
             raise dace.sdfg.InvalidSDFGError(
-                f"Expected to find '{self.start_state}' ({self.sdfg.node_id(self.start_state)}),"
-                f" instead found '{self.sdfg.start_block} ({self.sdfg.node_id(self.sdfg.start_block)}).",
+                "There are no output arguments.",
                 self.sdfg,
-                self.sdfg.node_id(self.start_state),
+                self.sdfg.node_id(self.sdfg.start_state),
             )
-        if self.start_state and ({self.terminal_state} != set(self.sdfg.sink_nodes())):
+        if not all(not self.sdfg.arrays[out].transient for out in self.out_names):
             raise dace.sdfg.InvalidSDFGError(
-                f"Expected to find '{self.terminal_state}' ({self.sdfg.node_id(self.terminal_state)}),"
-                f" instead found '{self.sdfg.sink_nodes()}.",
+                f"Found transient outputs: {(out for out in self.out_names if self.sdfg.arrays[out].transient)}",
                 self.sdfg,
-                self.sdfg.node_id(self.terminal_state),
+                self.sdfg.node_id(self.sdfg.start_state),
             )
-        if not self.is_finalized:
-            return True  # More we can not do for an unfinalized SDFG.
         self.sdfg.validate()
         return True
diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index f68c22b..290eafe 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -29,12 +29,7 @@
 def compile_jax_sdfg(
     tsdfg: translator.TranslatedJaxprSDFG,
 ) -> dace_helper.CompiledSDFG:
-    """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object.
-
-    The function requires that `tsdfg` is finalized.
-    """
-    if not tsdfg.is_finalized:
-        raise ValueError("Can only compile a finalized SDFG.")
+    """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object."""
     if any(  # We do not support the DaCe return mechanism
         arrname.startswith("__return")
         for arrname in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
diff --git a/tests/test_caching.py b/tests/test_caching.py
index 437feee..db568a3 100644
--- a/tests/test_caching.py
+++ b/tests/test_caching.py
@@ -111,6 +111,7 @@ def wrapped(A, B):
     assert compiled1 is not compiled2
 
 
+@pytest.mark.skip("'convert_element_type' primitive is not implemented.")
 def test_caching_different_structure() -> None:
     """Now tests if we can handle multiple arguments with different structures.
 
@@ -222,103 +223,6 @@ def testee(A: np.ndarray) -> np.ndarray:
         assert lowering_cnt[0] == i + 1
 
 
-def test_caching_eviction_simple():
-    """Simple tests for cache eviction."""
-
-    @jace.jit
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A + 1.0
-
-    cache: tcache.StageCache = testee._cache
-
-    first_lowered = testee.lower(np.ones(10))
-    first_key = cache.front()[0]
-    second_lowered = testee.lower(np.ones(11))
-    second_key = cache.front()[0]
-    third_lowered = testee.lower(np.ones(12))
-    third_key = cache.front()[0]
-
-    assert first_key != second_key
-    assert first_key != third_key
-    assert second_key != third_key
-    assert cache[first_key] is first_lowered
-    assert cache[second_key] is second_lowered
-    assert cache[third_key] is third_lowered
-
-    assert first_key in cache
-    assert second_key in cache
-    assert third_key in cache
-    assert cache.front()[0] == third_key
-
-    # We now evict the second key, which should not change anything on the order.
-    cache.popitem(second_key)
-    assert first_key in cache
-    assert second_key not in cache
-    assert third_key in cache
-    assert cache.front()[0] == third_key
-
-    # Now we modify first_key, which moves it to the front.
-    cache[first_key] = first_lowered
-    assert first_key in cache
-    assert second_key not in cache
-    assert third_key in cache
-    assert cache.front()[0] == first_key
-
-    # Now we evict the oldest one, which is third_key
-    cache.popitem(None)
-    assert first_key in cache
-    assert second_key not in cache
-    assert third_key not in cache
-    assert cache.front()[0] == first_key
-
-
-def test_caching_eviction_complex():
-    """Tests if the stuff is properly evicted if the cache is full."""
-
-    @jace.jit
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A + 1.0
-
-    cache: tcache.StageCache = testee._cache
-    capacity = cache.capacity
-    assert len(cache) == 0
-
-    # Lets fill the cache to the brim.
-    for i in range(capacity):
-        A = np.ones(i + 10)
-        lowered = testee.lower(A)
-        assert len(cache) == i + 1
-
-        if i == 0:
-            first_key: tcache.StageTransformationSpec = cache.front()[0]
-            first_lowered = cache[first_key]
-            assert lowered is first_lowered
-        elif i == 1:
-            second_key: tcache.StageTransformationSpec = cache.front()[0]
-            assert second_key != first_key
-            assert cache[second_key] is lowered
-        assert first_key in cache
-
-    assert len(cache) == capacity
-    assert first_key in cache
-    assert second_key in cache
-
-    # Now we will modify the first key, this should make it the newest.
-    assert cache.front()[0] != first_key
-    cache[first_key] = first_lowered
-    assert len(cache) == capacity
-    assert first_key in cache
-    assert second_key in cache
-    assert cache.front()[0] == first_key
-
-    # Now we will add a new entry to the cache, this will evict the second entry.
-    _ = testee.lower(np.ones(capacity + 1000))
-    assert len(cache) == capacity
-    assert cache.front()[0] != first_key
-    assert first_key in cache
-    assert second_key not in cache
-
-
 def test_caching_strides() -> None:
     """Test if the cache detects a change in strides."""
 
diff --git a/tests/test_sub_translators_alu.py b/tests/test_sub_translators_alu.py
index 45a5548..603f57c 100644
--- a/tests/test_sub_translators_alu.py
+++ b/tests/test_sub_translators_alu.py
@@ -46,7 +46,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     ref = testee(A, B)
     res = jace.jit(testee)(A, B)
 
-    assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
+    assert np.allclose(ref, res), f"Expected '{ref.tolist()}' got '{res.tolist()}'."
 
 
 def test_add3():
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 3579da6..0c5faa6 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -73,7 +73,7 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_regsitered_primitive_translators()) == 47
+    assert len(get_regsitered_primitive_translators()) == 37
 
 
 @pytest.mark.usefixtures("no_builtin_translators")
@@ -104,7 +104,7 @@ def test_subtranslatior_managing_isolation():
     """Tests if `get_regsitered_primitive_translators()` protects the internal registry."""
     assert (
         get_regsitered_primitive_translators()
-        is not translator.managing._PRIMITIVE_TRANSLATORS_DICT
+        is not translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
     )
 
     initial_primitives = get_regsitered_primitive_translators()
@@ -138,7 +138,7 @@ def same_structure(d1: dict, d2: dict) -> bool:
     # Now change the initial one with the mutated one.
     #  The object is copied but should still have the same structure.
     old_active = set_active_primitive_translators_to(mutated_primitives)
-    assert mutated_primitives is not translator.managing._PRIMITIVE_TRANSLATORS_DICT
+    assert mutated_primitives is not translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
     assert same_structure(old_active, initial_primitives)
     assert same_structure(mutated_primitives, get_regsitered_primitive_translators())
 

From 53aae7b90f0989a77644fa587c92b6cf7de03972 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 30 May 2024 15:13:34 +0200
Subject: [PATCH 278/458] Made the renaming from driver to builder, that is in
 my view pointless.

---
 src/jace/stages.py                            |   4 +-
 src/jace/translator/__init__.py               |   4 +-
 ..._driver.py => jaxpr_translator_builder.py} |  32 +-
 src/jace/translator/primitive_translator.py   |  16 +-
 .../primitive_translators/alu_translator.py   |   4 +-
 src/jace/translator/translated_jaxpr_sdfg.py  |   4 +-
 src/jace/util/jax_helper.py                   |   2 +-
 ...er.py => test_jaxpr_translator_builder.py} | 288 +++++++++---------
 8 files changed, 177 insertions(+), 177 deletions(-)
 rename src/jace/translator/{jaxpr_translator_driver.py => jaxpr_translator_builder.py} (97%)
 rename tests/{test_jaxpr_translator_driver.py => test_jaxpr_translator_builder.py} (59%)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index 296690a..b130107 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -125,11 +125,11 @@ def lower(
         #  However, in this case we will have problems when we call the SDFG, for some reasons
         #  `CompiledSDFG` does not work in that case correctly, thus we enable it for the tracing.
         with _jax.experimental.enable_x64():
-            driver = translator.JaxprTranslationDriver(
+            builder = translator.JaxprTranslationBuilder(
                 primitive_translators=self._primitive_translators
             )
             jaxpr = _jax.make_jaxpr(self._fun)(*args)
-            trans_ctx: translator.TranslationContext = driver.translate_jaxpr(jaxpr)
+            trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
 
         # Perform the post processing and turn it into a `TranslatedJaxprSDFG` that can be
         #  compiled and called later.
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 31c6db1..a97d3c4 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -9,7 +9,7 @@
 
 from __future__ import annotations
 
-from .jaxpr_translator_driver import JaxprTranslationDriver, TranslationContext
+from .jaxpr_translator_builder import JaxprTranslationBuilder, TranslationContext
 from .primitive_translator import (
     PrimitiveTranslator,
     PrimitiveTranslatorCallable,
@@ -22,7 +22,7 @@
 
 
 __all__ = [
-    "JaxprTranslationDriver",
+    "JaxprTranslationBuilder",
     "PrimitiveTranslator",
     "PrimitiveTranslatorCallable",
     "TranslatedJaxprSDFG",
diff --git a/src/jace/translator/jaxpr_translator_driver.py b/src/jace/translator/jaxpr_translator_builder.py
similarity index 97%
rename from src/jace/translator/jaxpr_translator_driver.py
rename to src/jace/translator/jaxpr_translator_builder.py
index ddbdad8..e41f823 100644
--- a/src/jace/translator/jaxpr_translator_driver.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -22,8 +22,8 @@
 from jace import util
 
 
-class JaxprTranslationDriver:
-    """Internal driver class for creating an SDFG equivalent of a `Jaxpr` instance.
+class JaxprTranslationBuilder:
+    """Internal builder class for creating an SDFG equivalent of a `Jaxpr` instance.
 
     The SDFG that is created by this class has a very particular form, which we consider canonical.
     The main feature of a canonical SDFG are:
@@ -44,14 +44,14 @@ class JaxprTranslationDriver:
     states. In certain cases it might be that an equation needs more states, but this is an
     exception.
 
-    The actual translation of the equation is not handled by the driver. Instead the request is
+    The actual translation of the equation is not handled by the builder. Instead the request is
     forwarded to a `PrimitiveTranslator` object, known as primitive translator. This is a highly
     specialized object that is able to handle one kind of primitive. For more information on them
     see the documentation of `PrimitiveTranslator`.
 
     To start a translation the `translate_jaxpr()` function should be called, if this happens it is
-    said that the driver has an ongoing translation. If `translate_jaxpr()` is called on a driver
-    that has an ongoing translation, a new translation context will be set up. Thus the driver
+    said that the builder has an ongoing translation. If `translate_jaxpr()` is called on a builder
+    that has an ongoing translation, a new translation context will be set up. Thus the builder
     will then translate the supplied (nested) Jaxpr and return the result. However, this will have
     no influence on the translation process that is already going.
 
@@ -60,7 +60,7 @@ class JaxprTranslationDriver:
 
     Notes:
         After the main translation has been performed the translator object can be used again.
-        Currently the driver will generate only Array as SDFG variables, however, this is a
+        Currently the builder will generate only Array as SDFG variables, however, this is a
         temporary solution, see `add_array()`.
     """
 
@@ -111,7 +111,7 @@ def translate_jaxpr(
 
         # NOTE: If `self` is already allocated, i.e. has an ongoing translation process,
         #       the `_allocate_translation_ctx()` function will start a new context.
-        #       Thus the driver will start to translate a second (nested) SDFG.
+        #       Thus the builder will start to translate a second (nested) SDFG.
         #       Also note that there is no mechanism that forces the integration of the nested
         #       SDFG/Jaxpr, this must be done manually.
         self._allocate_translation_ctx(
@@ -256,14 +256,14 @@ def is_root_translator(self) -> bool:
         The root translator (context) is the very first translator process that was started.
         """
         if not self.is_allocated():
-            raise RuntimeError("Driver is not allocated.")
+            raise RuntimeError("Builder is not allocated.")
         return len(self._ctx_stack) == 1
 
     def add_jax_name_mapping(
         self,
         jax_var: jax_core.Var | util.JaCeVar,
         sdfg_name: str,
-    ) -> JaxprTranslationDriver:
+    ) -> JaxprTranslationBuilder:
         """Creates a new mapping between `jax_var` to `sdfg_name`.
 
         If the mapping already exists an error will be generated. This function is not able to
@@ -448,7 +448,7 @@ def _create_initial_input(
             The function will populate the `inp_names` member of the current context.
         """
         if not self.is_allocated():
-            raise RuntimeError("Driver is not allocated, can not create constants.")
+            raise RuntimeError("Builder is not allocated, can not create constants.")
         assert len(self._ctx.inp_names) == 0
 
         # Handle the initial input arguments
@@ -476,7 +476,7 @@ def _create_constants(
         is deepcopied.
         """
         if not self.is_allocated():
-            raise RuntimeError("Driver is not allocated, can not create constants.")
+            raise RuntimeError("Builder is not allocated, can not create constants.")
         if len(jaxpr.consts) == 0:
             return ()
 
@@ -496,11 +496,11 @@ def _create_constants(
     def _allocate_translation_ctx(
         self,
         name: str | None = None,
-    ) -> JaxprTranslationDriver:
+    ) -> JaxprTranslationBuilder:
         """This function allocates and initialize the members of the translation context of `self`.
 
         If this function is called and `self` is already allocated, the function will create a new
-        context, allowing the driver to handle nested Jaxpr.
+        context, allowing the builder to handle nested Jaxpr.
         The first context that is created is known as root translator.
 
         Args:
@@ -530,7 +530,7 @@ def _clear_translation_ctx(self) -> TranslationContext | None:
             return None
 
         if self.is_root_translator():
-            # The translation as a whole has finished, so restore the driver,
+            # The translation as a whole has finished, so restore the builder,
             #  i.e. delete all the shared state.
             self._jax_name_map = {}
 
@@ -584,7 +584,7 @@ def _translate_single_eqn(
 
         # Now perform the actual translation of the equation.
         new_sdfg_term_state = ptranslator(
-            driver=self,
+            builder=self,
             in_var_names=in_var_names,
             out_var_names=out_var_names,  # Might be modified by the translator!
             eqn=eqn,
@@ -721,7 +721,7 @@ def _terminal_sdfg_state(self) -> dace.SDFGState:
 
 
 class TranslationContext:
-    """Translation context used by the `JaxprTranslationDriver`.
+    """Translation context used by the `JaxprTranslationBuilder`.
 
     Essentially it is a `TranslatedJaxprSDFG` object together with some additional meta data,
     that is needed during translation. It is also returned by the `translate_jaxpr()` function.
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index e1dbac0..e50ac73 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -43,7 +43,7 @@ class PrimitiveTranslatorCallable(Protocol):
     @abstractmethod
     def __call__(
         self,
-        driver: translator.JaxprTranslationDriver,
+        builder: translator.JaxprTranslationBuilder,
         in_var_names: Sequence[str | None],
         out_var_names: MutableSequence[str],
         eqn: jax_core.JaxprEqn,
@@ -51,35 +51,35 @@ def __call__(
     ) -> dace.SDFGState | None:
         """Translates the Jax primitive into its SDFG equivalent.
 
-        Before the driver calls this function it will perform the following
+        Before the builder calls this function it will perform the following
         preparatory tasks:
         - It will allocate the SDFG variables that are used as outputs. Their names will be passed
             through the `out_var_names` argument, in the same order as `eqn.outvars`.
         - It will collect the names of the SDFG variables that are used as input and place them in
             `in_var_names`, in the same order as `eqn.invars`. If an input argument refers to a
             literal no SDFG variable is created for it and `None` is passed to indicate this.
-        - The driver will create variables that are used as output. They are passed as
+        - The builder will create variables that are used as output. They are passed as
             `out_var_names`, same order as in the equation.
-        - The driver will create a new terminal state and pass it as `eqn_state` argument. This
+        - The builder will create a new terminal state and pass it as `eqn_state` argument. This
             state is guaranteed to be empty and `translator.terminal_sdfg_state is eqn_state` holds.
 
         Then the primitive translator is called.
         Usually a primitive translator should construct the dataflow graph inside `eqn_state`.
         It is allowed that the primitive translators creates more states if needed, but this
         state machinery has to have a single terminal state, which must be returned and reachable
-        from `eqn_state`. If the function returns `None` the driver will assume that primitive
+        from `eqn_state`. If the function returns `None` the builder will assume that primitive
         translator was able to fully construct the dataflow graph within `eqn_state`.
 
         While a primitive translator is forbidden from meddling with the input variables mentioned
         in `in_var_names` in any way, it is allowed to modify the output variables. For example
         it could create a new SDFG variable, with different strides. But in that case the primitive
-        translator must update the internal mapping of the driver TBA HOW, and modify the names
+        translator must update the internal mapping of the builder TBA HOW, and modify the names
         passed through `out_var_names`. However, the translator is allowed to create internal
         temporary variables. It just have to ensure that no name collision will occur, a way to
         do this is to use a passed variable name as prefix.
 
         Args:
-            driver:         The driver object of the translation.
+            builder:         The builder object of the translation.
             in_var_names:   List of the names of the arrays created inside the
                                 SDFG for the inpts or `None` in case of a literal.
             out_var_names:  List of the names of the arrays created inside the
@@ -100,7 +100,7 @@ class PrimitiveTranslator(PrimitiveTranslatorCallable, Protocol):
 
     Primitive translators are simple, but highly specialized objects that are only able to perform
     the translation of a single primitive. The overall translation process itself is managed by a
-    driver object, which also owns and manage the primitive translators. In the end this implements
+    builder object, which also owns and manage the primitive translators. In the end this implements
     the delegation pattern.
 
     You can use `jace.translator.register_primitive_translator()` to register your translator to JaCe.
diff --git a/src/jace/translator/primitive_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
index afce301..33f5800 100644
--- a/src/jace/translator/primitive_translators/alu_translator.py
+++ b/src/jace/translator/primitive_translators/alu_translator.py
@@ -46,7 +46,7 @@ def primitive(self) -> str:
     @override
     def __call__(
         self,
-        driver: translator.JaxprTranslationDriver,
+        builder: translator.JaxprTranslationBuilder,
         in_var_names: Sequence[str | None],
         out_var_names: MutableSequence[str],
         eqn: jax_core.JaxprEqn,
@@ -59,7 +59,7 @@ def __call__(
         The function will always perform the translation inside the provided state.
 
         Args:
-            driver:         The driver object of the translation.
+            builder:         The builder object of the translation.
             in_var_names:   List of the names of the arrays created inside the SDFG for the inpts or 'None' in case of a literal.
             out_var_names:  List of the names of the arrays created inside the SDFG for the outputs.
             eqn:            The Jax equation that is translated.
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 1a3fd32..13f34dd 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -13,10 +13,10 @@
 
 
 class TranslatedJaxprSDFG:
-    """Encapsulates the result of a translation run of the `JaxprTranslationDriver` object.
+    """Encapsulates the result of a translation run of the `JaxprTranslationBuilder` object.
 
     The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a `TranslationContext`,
-    that was in turn constructed by `JaxprTranslationDriver.translate_jaxpr()` to
+    that was in turn constructed by `JaxprTranslationBuilder.translate_jaxpr()` to
     `postprocess_jaxpr_sdfg()`.
     This class encapsulates a translated SDFG as well as the meta data needed to run it.
 
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index d41ffaa..b7bb2e4 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -36,7 +36,7 @@ class JaCeVar:
     class is as an internal representation of values, as they are used in Jax, but without the Jax
     machinery. As abstract values in Jax this class has a datatype, which is a `dace.typeclass`
     instance and a shape. In addition it has an optional name, which allows to create variables
-    with a certain name using `JaxprTranslationDriver.add_array()`.
+    with a certain name using `JaxprTranslationBuilder.add_array()`.
 
     Args:
         shape:      The shape of the variable.
diff --git a/tests/test_jaxpr_translator_driver.py b/tests/test_jaxpr_translator_builder.py
similarity index 59%
rename from tests/test_jaxpr_translator_driver.py
rename to tests/test_jaxpr_translator_builder.py
index 5dafb03..13a3835 100644
--- a/tests/test_jaxpr_translator_driver.py
+++ b/tests/test_jaxpr_translator_builder.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements some tests of the subtranslator driver."""
+"""Implements some tests of the subtranslator builder."""
 
 from __future__ import annotations
 
@@ -38,67 +38,67 @@
 
 
 @pytest.fixture()
-def translation_driver():
-    """Returns an allocated driver instance."""
-    name = "fixture_driver"
-    driver = translator.JaxprTranslationDriver(
+def translation_builder():
+    """Returns an allocated builder instance."""
+    name = "fixture_builder"
+    builder = translator.JaxprTranslationBuilder(
         primitive_translators=translator.get_regsitered_primitive_translators()
     )
-    driver._allocate_translation_ctx(name=name)
-    return driver
+    builder._allocate_translation_ctx(name=name)
+    return builder
 
 
-def test_driver_alloc() -> None:
+def test_builder_alloc() -> None:
     """Tests the state right after allocation.
 
     Does not use the fixture because it does it on its own.
     """
-    driver = translator.JaxprTranslationDriver(
+    builder = translator.JaxprTranslationBuilder(
         primitive_translators=translator.get_regsitered_primitive_translators()
     )
-    assert not driver.is_allocated(), "Driver was created allocated."
-    assert len(driver._ctx_stack) == 0
+    assert not builder.is_allocated(), "Builder was created allocated."
+    assert len(builder._ctx_stack) == 0
 
-    # The reserved names will be tested in `test_driver_fork()`.
+    # The reserved names will be tested in `test_builder_fork()`.
     sdfg_name = "qwertzuiopasdfghjkl"
-    driver._allocate_translation_ctx(name=sdfg_name)
-    assert len(driver._ctx_stack) == 1
-    assert driver.is_root_translator()
+    builder._allocate_translation_ctx(name=sdfg_name)
+    assert len(builder._ctx_stack) == 1
+    assert builder.is_root_translator()
 
-    sdfg: dace.SDFG = driver.sdfg
+    sdfg: dace.SDFG = builder.sdfg
 
-    assert driver._ctx.sdfg is sdfg
-    assert driver.sdfg.name == sdfg_name
+    assert builder._ctx.sdfg is sdfg
+    assert builder.sdfg.name == sdfg_name
     assert sdfg.number_of_nodes() == 1
     assert sdfg.number_of_edges() == 0
-    assert sdfg.start_block is driver._ctx.start_state
-    assert driver._terminal_sdfg_state is driver._ctx.start_state
+    assert sdfg.start_block is builder._ctx.start_state
+    assert builder._terminal_sdfg_state is builder._ctx.start_state
 
 
-def test_driver_variable_alloc_auto_naming(
-    translation_driver: translator.JaxprTranslationDriver,
+def test_builder_variable_alloc_auto_naming(
+    translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
     """Tests simple variable allocation."""
     for i, var in enumerate([array1, array2, scal1, array3, scal2, scal3]):
-        sdfg_name = translation_driver.add_array(var, update_var_mapping=True)
-        sdfg_var = translation_driver.get_array(sdfg_name)
+        sdfg_name = translation_builder.add_array(var, update_var_mapping=True)
+        sdfg_var = translation_builder.get_array(sdfg_name)
         assert sdfg_name == chr(97 + i)
         assert isinstance(sdfg_var, Array)  # Everything is now an array
         assert sdfg_var.shape == ((1,) if var.shape == () else var.shape)
         assert sdfg_var.dtype == var.dtype
 
 
-def test_driver_variable_alloc_mixed_naming(
-    translation_driver: translator.JaxprTranslationDriver,
+def test_builder_variable_alloc_mixed_naming(
+    translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
     """Tests the naming in a mixed setting.
 
-    If `update_var_mapping=True` is given, then the naming will skip variables, see also `test_driver_variable_alloc_mixed_naming2()`.
+    If `update_var_mapping=True` is given, then the naming will skip variables, see also `test_builder_variable_alloc_mixed_naming2()`.
     """
     #                        *       b       c       d      *      f      g
     for i, var in enumerate([narray, array1, array2, scal1, nscal, scal2, scal3]):
-        sdfg_name = translation_driver.add_array(var, update_var_mapping=True)
-        sdfg_var = translation_driver.get_array(sdfg_name)
+        sdfg_name = translation_builder.add_array(var, update_var_mapping=True)
+        sdfg_var = translation_builder.get_array(sdfg_name)
         if var.name is None:
             assert sdfg_name == chr(97 + i)
         else:
@@ -108,8 +108,8 @@ def test_driver_variable_alloc_mixed_naming(
         assert sdfg_var.dtype == var.dtype
 
 
-def test_driver_variable_alloc_mixed_naming2(
-    translation_driver: translator.JaxprTranslationDriver,
+def test_builder_variable_alloc_mixed_naming2(
+    translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
     """Tests the naming in a mixed setting.
 
@@ -119,8 +119,8 @@ def test_driver_variable_alloc_mixed_naming2(
     letoff = 0
     #             *      a        b       c      *      d     e
     for var in [narray, array1, array2, scal1, nscal, scal2, scal3]:
-        sdfg_name = translation_driver.add_array(var, update_var_mapping=var.name is None)
-        sdfg_var = translation_driver.get_array(sdfg_name)
+        sdfg_name = translation_builder.add_array(var, update_var_mapping=var.name is None)
+        sdfg_var = translation_builder.get_array(sdfg_name)
         if var.name is None:
             assert sdfg_name == chr(97 + letoff)
             letoff += 1
@@ -131,13 +131,13 @@ def test_driver_variable_alloc_mixed_naming2(
         assert sdfg_var.dtype == var.dtype
 
 
-def test_driver_variable_alloc_prefix_naming(
-    translation_driver: translator.JaxprTranslationDriver,
+def test_builder_variable_alloc_prefix_naming(
+    translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
     """Using the prefix to name variables."""
     prefix_1 = "__my_special_prefix"
     exp_name_1 = prefix_1 + "a"
-    sdfg_name_1 = translation_driver.add_array(
+    sdfg_name_1 = translation_builder.add_array(
         array1, name_prefix=prefix_1, update_var_mapping=False
     )
     assert exp_name_1 == sdfg_name_1
@@ -145,7 +145,7 @@ def test_driver_variable_alloc_prefix_naming(
     # Because `update_var_mapping` is `False` above, 'a' will be reused.
     prefix_2 = "__my_special_prefix_second_"
     exp_name_2 = prefix_2 + "a"
-    sdfg_name_2 = translation_driver.add_array(
+    sdfg_name_2 = translation_builder.add_array(
         array1, name_prefix=prefix_2, update_var_mapping=False
     )
     assert exp_name_2 == sdfg_name_2
@@ -153,14 +153,14 @@ def test_driver_variable_alloc_prefix_naming(
     # Now we use a named variables, which are also affected.
     prefix_3 = "__my_special_prefix_third_named_"
     exp_name_3 = prefix_3 + nscal.name  # type: ignore[operator]  # `.name` is not `None`.
-    sdfg_name_3 = translation_driver.add_array(
+    sdfg_name_3 = translation_builder.add_array(
         nscal, name_prefix=prefix_3, update_var_mapping=False
     )
     assert exp_name_3 == sdfg_name_3
 
 
-def test_driver_variable_alloc_auto_naming_wrapped(
-    translation_driver: translator.JaxprTranslationDriver,
+def test_builder_variable_alloc_auto_naming_wrapped(
+    translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
     """Tests the variable naming if we have more than 26 variables."""
     single_letters = [chr(x) for x in range(97, 123)]
@@ -170,8 +170,8 @@ def test_driver_variable_alloc_auto_naming_wrapped(
             i += 1
             # Create a variable and enter it into the variable naming.
             var = JaCeVar(shape=(19, 19), dtype=dace.float64)
-            sdfg_name = translation_driver.add_array(arg=var, update_var_mapping=True)
-            mapped_name = translation_driver.map_jax_var_to_sdfg(var)
+            sdfg_name = translation_builder.add_array(arg=var, update_var_mapping=True)
+            mapped_name = translation_builder.map_jax_var_to_sdfg(var)
             assert (
                 sdfg_name == mapped_name
             ), f"Mapping for '{var}' failed, expected '{sdfg_name}' got '{mapped_name}'."
@@ -185,26 +185,26 @@ def test_driver_variable_alloc_auto_naming_wrapped(
             ), f"Automated naming failed, expected '{exp_name}' but got '{sdfg_name}'."
 
 
-def test_driver_nested(translation_driver: translator.JaxprTranslationDriver) -> None:
-    """Tests the ability of the nesting of the driver."""
+def test_builder_nested(translation_builder: translator.JaxprTranslationBuilder) -> None:
+    """Tests the ability of the nesting of the builder."""
 
     # Now add a variable to the current subtext.
-    name_1 = translation_driver.add_array(array1, update_var_mapping=True)
+    name_1 = translation_builder.add_array(array1, update_var_mapping=True)
     assert name_1 == "a"
-    assert translation_driver.map_jax_var_to_sdfg(array1) == name_1
+    assert translation_builder.map_jax_var_to_sdfg(array1) == name_1
 
     # For the sake of doing it add a new state to the SDFG.
-    translation_driver.append_new_state("sake_state")
-    assert translation_driver.sdfg.number_of_nodes() == 2
-    assert translation_driver.sdfg.number_of_edges() == 1
+    translation_builder.append_new_state("sake_state")
+    assert translation_builder.sdfg.number_of_nodes() == 2
+    assert translation_builder.sdfg.number_of_edges() == 1
 
     # Now we go one subcontext deeper; note we do this manually which should not be done.
-    translation_driver._allocate_translation_ctx("driver")
-    assert len(translation_driver._ctx_stack) == 2
-    assert translation_driver.sdfg.name == "driver"
-    assert translation_driver.sdfg.number_of_nodes() == 1
-    assert translation_driver.sdfg.number_of_edges() == 0
-    assert not translation_driver.is_root_translator()
+    translation_builder._allocate_translation_ctx("builder")
+    assert len(translation_builder._ctx_stack) == 2
+    assert translation_builder.sdfg.name == "builder"
+    assert translation_builder.sdfg.number_of_nodes() == 1
+    assert translation_builder.sdfg.number_of_edges() == 0
+    assert not translation_builder.is_root_translator()
 
     # Because we have a new SDFG the mapping to previous SDFG does not work,
     #  regardless the fact that it still exists.
@@ -214,7 +214,7 @@ def test_driver_nested(translation_driver: translator.JaxprTranslationDriver) ->
             f"Jax variable '{array1}' was supposed to map to '{name_1}', but no such SDFG variable is known."
         ),
     ):
-        _ = translation_driver.map_jax_var_to_sdfg(array1)
+        _ = translation_builder.map_jax_var_to_sdfg(array1)
 
     # Because the SDFGs are distinct it is possible to add `array1` to the nested one.
     #  However, it is not able to update the mapping.
@@ -222,22 +222,22 @@ def test_driver_nested(translation_driver: translator.JaxprTranslationDriver) ->
         expected_exception=ValueError,
         match=re.escape(f"Cannot change the mapping of '{array1}' from '{name_1}' to '{name_1}'."),
     ):
-        _ = translation_driver.add_array(array1, update_var_mapping=True)
-    assert name_1 not in translation_driver.sdfg.arrays
+        _ = translation_builder.add_array(array1, update_var_mapping=True)
+    assert name_1 not in translation_builder.sdfg.arrays
 
     # Without updating the mapping it is possible create the variable.
-    assert name_1 == translation_driver.add_array(array1, update_var_mapping=False)
+    assert name_1 == translation_builder.add_array(array1, update_var_mapping=False)
 
     # Now add a new variable, the map is shared, so a new name will be generated.
-    name_2 = translation_driver.add_array(array2, update_var_mapping=True)
+    name_2 = translation_builder.add_array(array2, update_var_mapping=True)
     assert name_2 == "b"
-    assert name_2 == translation_driver.map_jax_var_to_sdfg(array2)
+    assert name_2 == translation_builder.map_jax_var_to_sdfg(array2)
 
     # Now we go one stack level back.
-    translation_driver._clear_translation_ctx()
-    assert len(translation_driver._ctx_stack) == 1
-    assert translation_driver.sdfg.number_of_nodes() == 2
-    assert translation_driver.sdfg.number_of_edges() == 1
+    translation_builder._clear_translation_ctx()
+    assert len(translation_builder._ctx_stack) == 1
+    assert translation_builder.sdfg.number_of_nodes() == 2
+    assert translation_builder.sdfg.number_of_edges() == 1
 
     # Again the variable that was declared in the last stack is now no longer present.
     #  Note if the nested SDFG was integrated into the parent SDFG it would be accessible
@@ -247,57 +247,57 @@ def test_driver_nested(translation_driver: translator.JaxprTranslationDriver) ->
             f"Jax variable '{array2}' was supposed to map to '{name_2}', but no such SDFG variable is known."
         ),
     ):
-        _ = translation_driver.map_jax_var_to_sdfg(array2)
-    assert name_2 == translation_driver._jax_name_map[array2]
+        _ = translation_builder.map_jax_var_to_sdfg(array2)
+    assert name_2 == translation_builder._jax_name_map[array2]
 
     # Now add a new variable, since the map is shared, we will now get the next name.
-    name_3 = translation_driver.add_array(array3, update_var_mapping=True)
+    name_3 = translation_builder.add_array(array3, update_var_mapping=True)
     assert name_3 == "c"
-    assert name_3 == translation_driver.map_jax_var_to_sdfg(array3)
+    assert name_3 == translation_builder.map_jax_var_to_sdfg(array3)
 
 
-def test_driver_append_state(translation_driver: translator.JaxprTranslationDriver) -> None:
+def test_builder_append_state(translation_builder: translator.JaxprTranslationBuilder) -> None:
     """Tests the functionality of appending states."""
-    sdfg: dace.SDFG = translation_driver.sdfg
+    sdfg: dace.SDFG = translation_builder.sdfg
 
-    terminal_state_1: dace.SDFGState = translation_driver.append_new_state("terminal_state_1")
+    terminal_state_1: dace.SDFGState = translation_builder.append_new_state("terminal_state_1")
     assert sdfg.number_of_nodes() == 2
     assert sdfg.number_of_edges() == 1
-    assert terminal_state_1 is translation_driver._terminal_sdfg_state
-    assert translation_driver._terminal_sdfg_state is translation_driver._ctx.terminal_state
-    assert translation_driver._ctx.start_state is sdfg.start_block
-    assert translation_driver._ctx.start_state is not terminal_state_1
+    assert terminal_state_1 is translation_builder._terminal_sdfg_state
+    assert translation_builder._terminal_sdfg_state is translation_builder._ctx.terminal_state
+    assert translation_builder._ctx.start_state is sdfg.start_block
+    assert translation_builder._ctx.start_state is not terminal_state_1
     assert next(iter(sdfg.edges())).src is sdfg.start_block
     assert next(iter(sdfg.edges())).dst is terminal_state_1
 
-    # Specifying an explicit append state that is the terminal should also update the terminal state of the driver.
-    terminal_state_2: dace.SDFGState = translation_driver.append_new_state(
+    # Specifying an explicit append state that is the terminal should also update the terminal state of the builder.
+    terminal_state_2: dace.SDFGState = translation_builder.append_new_state(
         "terminal_state_2", prev_state=terminal_state_1
     )
     assert sdfg.number_of_nodes() == 3
     assert sdfg.number_of_edges() == 2
-    assert terminal_state_2 is translation_driver._terminal_sdfg_state
+    assert terminal_state_2 is translation_builder._terminal_sdfg_state
     assert sdfg.out_degree(terminal_state_1) == 1
     assert sdfg.out_degree(terminal_state_2) == 0
     assert sdfg.in_degree(terminal_state_2) == 1
     assert next(iter(sdfg.in_edges(terminal_state_2))).src is terminal_state_1
 
     # Specifying a previous node that is not the terminal state should not do anything.
-    non_terminal_state: dace.SDFGState = translation_driver.append_new_state(
+    non_terminal_state: dace.SDFGState = translation_builder.append_new_state(
         "non_terminal_state", prev_state=terminal_state_1
     )
-    assert translation_driver._terminal_sdfg_state is not non_terminal_state
+    assert translation_builder._terminal_sdfg_state is not non_terminal_state
     assert sdfg.in_degree(non_terminal_state) == 1
     assert sdfg.out_degree(non_terminal_state) == 0
     assert next(iter(sdfg.in_edges(non_terminal_state))).src is terminal_state_1
 
 
-def test_driver_variable_multiple_variables(
-    translation_driver: translator.JaxprTranslationDriver,
+def test_builder_variable_multiple_variables(
+    translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
     """A simple test in which we try to add a variable that are known, but with a different name."""
     # Now we will add `array1` and then different ways of updating it.
-    narray1: str = translation_driver.add_array(array1, update_var_mapping=True)
+    narray1: str = translation_builder.add_array(array1, update_var_mapping=True)
 
     # It will fail if we use the prefix, because we also want to update.
     prefix = "__jace_prefix"
@@ -305,23 +305,23 @@ def test_driver_variable_multiple_variables(
     with pytest.raises(
         expected_exception=ValueError,
         match=re.escape(
-            f"Cannot change the mapping of '{array1}' from '{translation_driver.map_jax_var_to_sdfg(array1)}' to '{prefix_expected_name}'."
+            f"Cannot change the mapping of '{array1}' from '{translation_builder.map_jax_var_to_sdfg(array1)}' to '{prefix_expected_name}'."
         ),
     ):
-        _ = translation_driver.add_array(array1, update_var_mapping=True, name_prefix=prefix)
-    assert prefix_expected_name not in translation_driver.sdfg.arrays
+        _ = translation_builder.add_array(array1, update_var_mapping=True, name_prefix=prefix)
+    assert prefix_expected_name not in translation_builder.sdfg.arrays
 
     # But if we do not want to update it then it works.
-    prefix_sdfg_name = translation_driver.add_array(
+    prefix_sdfg_name = translation_builder.add_array(
         array1, update_var_mapping=False, name_prefix=prefix
     )
     assert prefix_expected_name == prefix_sdfg_name
-    assert prefix_expected_name in translation_driver.sdfg.arrays
-    assert narray1 == translation_driver.map_jax_var_to_sdfg(array1)
+    assert prefix_expected_name in translation_builder.sdfg.arrays
+    assert narray1 == translation_builder.map_jax_var_to_sdfg(array1)
 
 
-def test_driver_variable_invalid_prefix(
-    translation_driver: translator.JaxprTranslationDriver,
+def test_builder_variable_invalid_prefix(
+    translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
     """Use invalid prefix."""
     # It will fail if we use the prefix, because we also want to update.
@@ -330,41 +330,41 @@ def test_driver_variable_invalid_prefix(
             expected_exception=ValueError,
             match=re.escape(f"add_array({array1}): Supplied invalid prefix '{iprefix}'."),
         ):
-            _ = translation_driver.add_array(array1, update_var_mapping=False, name_prefix=iprefix)
-        assert len(translation_driver.sdfg.arrays) == 0
+            _ = translation_builder.add_array(array1, update_var_mapping=False, name_prefix=iprefix)
+        assert len(translation_builder.sdfg.arrays) == 0
 
 
-def test_driver_variable_alloc_list(
-    translation_driver: translator.JaxprTranslationDriver,
+def test_builder_variable_alloc_list(
+    translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
-    """Tests part of the `JaxprTranslationDriver.create_jax_var_list()` api."""
+    """Tests part of the `JaxprTranslationBuilder.create_jax_var_list()` api."""
     var_list_1 = [array1, nscal, scal2]
     exp_names_1 = ["a", nscal.name, "c"]
 
-    res_names_1 = translation_driver.create_jax_var_list(
+    res_names_1 = translation_builder.create_jax_var_list(
         var_list_1,
         update_var_mapping=True,
     )
-    assert len(translation_driver.arrays) == 3
+    assert len(translation_builder.arrays) == 3
     assert res_names_1 == exp_names_1
 
     # Now a mixture of the collection and creation.
     var_list_2 = [array2, nscal, scal1]
     exp_names_2 = ["d", nscal.name, "e"]
 
-    res_names_2 = translation_driver.create_jax_var_list(
+    res_names_2 = translation_builder.create_jax_var_list(
         var_list_2,
         update_var_mapping=True,
     )
     assert res_names_2 == exp_names_2
-    assert len(translation_driver.arrays) == 5
+    assert len(translation_builder.arrays) == 5
 
 
 @pytest.mark.skip(reason="'create_jax_var_list()' does not clean up in case of an error.")
-def test_driver_variable_alloc_list_cleaning(
-    translation_driver: translator.JaxprTranslationDriver,
+def test_builder_variable_alloc_list_cleaning(
+    translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
-    """Tests part of the `JaxprTranslationDriver.create_jax_var_list()` api.
+    """Tests part of the `JaxprTranslationBuilder.create_jax_var_list()` api.
 
     It will fail because `update_var_mapping=False` thus the third variable will
     cause an error because it is proposed to `a`, which is already used.
@@ -375,22 +375,22 @@ def test_driver_variable_alloc_list_cleaning(
         expected_exception=ValueError,
         match=re.escape(f"add_array({scal2}): The proposed name 'a', is used."),
     ):
-        _ = translation_driver.create_jax_var_list(var_list)
+        _ = translation_builder.create_jax_var_list(var_list)
 
     # This currently fails, because the `create_jax_var_list()` function does not clean up.
-    assert len(translation_driver.arrays) == 0
+    assert len(translation_builder.arrays) == 0
 
 
-def test_driver_variable_alloc_list_prevent_creation(
-    translation_driver: translator.JaxprTranslationDriver,
+def test_builder_variable_alloc_list_prevent_creation(
+    translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
-    """Tests part of the `JaxprTranslationDriver.create_jax_var_list()` api.
+    """Tests part of the `JaxprTranslationBuilder.create_jax_var_list()` api.
 
     It will test the `prevent_creation` flag.
     """
     # First create a variable.
-    translation_driver.add_array(array1, update_var_mapping=True)
-    assert len(translation_driver.arrays) == 1
+    translation_builder.add_array(array1, update_var_mapping=True)
+    assert len(translation_builder.arrays) == 1
 
     # Now create the variables
     var_list = [array1, array2]
@@ -399,25 +399,25 @@ def test_driver_variable_alloc_list_prevent_creation(
         expected_exception=ValueError,
         match=re.escape(f"'prevent_creation' given but have to create '{array2}'."),
     ):
-        translation_driver.create_jax_var_list(
+        translation_builder.create_jax_var_list(
             var_list,
             prevent_creation=True,
         )
-    assert len(translation_driver.arrays) == 1
-    assert translation_driver.map_jax_var_to_sdfg(array1) == "a"
+    assert len(translation_builder.arrays) == 1
+    assert translation_builder.map_jax_var_to_sdfg(array1) == "a"
 
 
 @pytest.mark.skip(reason="'create_jax_var_list()' does not clean up in case of an error.")
-def test_driver_variable_alloc_list_only_creation(
-    translation_driver: translator.JaxprTranslationDriver,
+def test_builder_variable_alloc_list_only_creation(
+    translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
-    """Tests part of the `JaxprTranslationDriver.create_jax_var_list()` api.
+    """Tests part of the `JaxprTranslationBuilder.create_jax_var_list()` api.
 
     It will test the `only_creation` flag.
     """
     # First create a variable.
-    translation_driver.add_array(array1, update_var_mapping=True)
-    assert len(translation_driver.arrays) == 1
+    translation_builder.add_array(array1, update_var_mapping=True)
+    assert len(translation_builder.arrays) == 1
 
     # Now create the variables
     var_list = [array2, array1]
@@ -426,18 +426,18 @@ def test_driver_variable_alloc_list_only_creation(
         expected_exception=ValueError,
         match=re.escape(f"'only_creation' given '{array1}' already exists."),
     ):
-        translation_driver.create_jax_var_list(
+        translation_builder.create_jax_var_list(
             var_list,
             only_creation=True,
         )
-    assert len(translation_driver.arrays) == 1
-    assert translation_driver.map_jax_var_to_sdfg(array1) == "a"
+    assert len(translation_builder.arrays) == 1
+    assert translation_builder.map_jax_var_to_sdfg(array1) == "a"
 
 
-def test_driver_variable_alloc_list_handle_literal(
-    translation_driver: translator.JaxprTranslationDriver,
+def test_builder_variable_alloc_list_handle_literal(
+    translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
-    """Tests part of the `JaxprTranslationDriver.create_jax_var_list()` api.
+    """Tests part of the `JaxprTranslationBuilder.create_jax_var_list()` api.
 
     It will test the `handle_literals` flag.
     """
@@ -454,24 +454,24 @@ def test_driver_variable_alloc_list_handle_literal(
         expected_exception=ValueError,
         match=re.escape("Encountered a literal but `handle_literals` was `False`."),
     ):
-        translation_driver.create_jax_var_list(
+        translation_builder.create_jax_var_list(
             var_list,
             handle_literals=False,
         )
-    assert len(translation_driver.arrays) == 0
+    assert len(translation_builder.arrays) == 0
 
-    name_list = translation_driver.create_jax_var_list(
+    name_list = translation_builder.create_jax_var_list(
         var_list,
         handle_literals=True,
     )
-    assert len(translation_driver.arrays) == 0
+    assert len(translation_builder.arrays) == 0
     assert name_list == [None]
 
 
-def test_driver_constants(
-    translation_driver: translator.JaxprTranslationDriver,
+def test_builder_constants(
+    translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
-    """Tests part of the `JaxprTranslationDriver._create_constants()` api.
+    """Tests part of the `JaxprTranslationBuilder._create_constants()` api.
 
     See also the `test_subtranslators_alu.py::test_add3` test.
     """
@@ -481,22 +481,22 @@ def test_driver_constants(
     constant = [[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]]
     jaxpr = jax.make_jaxpr(lambda A: A + jax.numpy.array(constant))(1.0)
 
-    # We have to manually allocate the driver context.
+    # We have to manually allocate the builder context.
     #  You should not do that.
-    translation_driver._allocate_translation_ctx(name="Manual_test")
+    translation_builder._allocate_translation_ctx(name="Manual_test")
 
     # No create the constants.
-    translation_driver._create_constants(jaxpr)
+    translation_builder._create_constants(jaxpr)
 
     # Test if it was created with the correct value.
-    assert len(translation_driver.arrays) == 1
-    assert len(translation_driver._jax_name_map) == 1
-    assert next(iter(translation_driver._jax_name_map.values())) == "__const_a"
-    assert len(translation_driver.sdfg.constants) == 1
-    assert np.all(translation_driver.sdfg.constants["__const_a"] == constant)
+    assert len(translation_builder.arrays) == 1
+    assert len(translation_builder._jax_name_map) == 1
+    assert next(iter(translation_builder._jax_name_map.values())) == "__const_a"
+    assert len(translation_builder.sdfg.constants) == 1
+    assert np.all(translation_builder.sdfg.constants["__const_a"] == constant)
 
 
-def test_driver_scalar_return_value() -> None:
+def test_builder_scalar_return_value() -> None:
     """Tests if scalars can be returned directly."""
 
     def scalar_ops(A: float) -> float:
@@ -518,7 +518,7 @@ def wrapped(A: float) -> float:
 
 
 @pytest.mark.skip(reason="Currently 'scalar' return values, are actually shape '(1,)' arrays.")
-def test_driver_scalar_return_type() -> None:
+def test_builder_scalar_return_type() -> None:
     """Tests if the type is the same, in case of scalar return."""
 
     @jace.jit
@@ -529,7 +529,7 @@ def wrapped(A: np.float64) -> np.float64:
     assert type(A) is np.float64, f"Expected type 'np.float64', but got '{type(A).__name__}'."
 
 
-def test_driver_jace_var() -> None:
+def test_builder_jace_var() -> None:
     """Simple tests about the `JaCeVar` objects."""
     for iname in ["do", "", "_ _", "9al", "_!"]:
         with pytest.raises(
@@ -539,7 +539,7 @@ def test_driver_jace_var() -> None:
             _ = JaCeVar((), dace.int8, name=iname)
 
 
-def test_driver_F_strides() -> None:
+def test_builder_F_strides() -> None:
     """Tests if we can lower without a standard stride.
 
     Notes:

From f0ea5b48f27c68a50e86469554cfdb83e4feb29d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 30 May 2024 16:56:37 +0200
Subject: [PATCH 279/458] Made some small changes.

---
 tests/integration_tests/test_jaxpr_translator_builder.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 13a3835..c50d174 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -192,6 +192,8 @@ def test_builder_nested(translation_builder: translator.JaxprTranslationBuilder)
     name_1 = translation_builder.add_array(array1, update_var_mapping=True)
     assert name_1 == "a"
     assert translation_builder.map_jax_var_to_sdfg(array1) == name_1
+    assert translation_builder.sdfg.arrays[name_1] is translation_builder.get_array(array1)
+    assert translation_builder.sdfg.arrays[name_1] is translation_builder.get_array(name_1)
 
     # For the sake of doing it add a new state to the SDFG.
     translation_builder.append_new_state("sake_state")

From fae3ce3a74fbd26509b0c5d5800e2cced9d8ba33 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 31 May 2024 09:15:10 +0200
Subject: [PATCH 280/458] Last screening.

---
 src/jace/api.py                               |  10 +-
 src/jace/optimization.py                      |  19 ++-
 src/jace/stages.py                            |  86 +++++++----
 src/jace/translator/__init__.py               |   6 +-
 .../translator/jaxpr_translator_builder.py    | 142 ++++++++++--------
 src/jace/translator/primitive_translator.py   |  46 +++---
 src/jace/translator/translated_jaxpr_sdfg.py  |  13 +-
 src/jace/util/compiling.py                    |  20 ++-
 src/jace/util/jax_helper.py                   |  18 +--
 src/jace/util/traits.py                       |  30 ++--
 src/jace/util/translation_cache.py            |  16 +-
 tests/test_caching.py                         |   2 +-
 tests/test_jaxpr_translator_builder.py        |   4 +-
 13 files changed, 232 insertions(+), 180 deletions(-)

diff --git a/src/jace/api.py b/src/jace/api.py
index 1efacc8..78d2c65 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Contains the implementation of the jit functioanlity of JaCe."""
+"""Stand in for the `jax.*` namespace."""
 
 from __future__ import annotations
 
@@ -56,15 +56,15 @@ def jit(
     """JaCe's replacement for `jax.jit` (just-in-time) wrapper.
 
     It works the same way as `jax.jit` does, but instead of using XLA the computation is lowered
-    to DaCe. It supports the same arguments as `jax.jit` (although currently not) does.
-    In addition it accepts some JaCe specific arguments.
+    to DaCe. In addition it accepts some JaCe specific arguments, it accepts the same arguments
+    as `jax.jit` does.
 
     Args:
         primitive_translators:    Use these primitive translators for the lowering to SDFG.
+            If not specified the translators in the global registry are used.
 
     Notes:
-        If no translators are specified, the ones in the global registry are implicitly passed
-        as argument. After constructions any change to `primitive_translators` has no effect.
+        After constructions any change to `primitive_translators` has no effect.
     """
     if kwargs:
         # TODO(phimuell): Add proper name verification and exception type.
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index c90d612..249225e 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -5,9 +5,9 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Module that will host all optimization functions specific to JaCe.
+"""JaCe specific optimizations.
 
-Currently just a dummy existing for the sake of providing some callable function.
+Currently just a dummy exists for the sake of providing a callable function.
 """
 
 from __future__ import annotations
@@ -22,13 +22,16 @@
 
 
 class CompilerOptions(TypedDict, total=False):
-    """All known compiler options known to `JaCeLowered.compile()`.
+    """All known compiler options to `JaCeLowered.compile()`.
 
     See `jace_optimize()` for a description of the different options.
 
     There are some predefined option sets in `jace.jax.stages`:
-    - `DEFAULT_COMPILER_OPTIONS`
+    - `DEFAULT_OPTIONS`
     - `NO_OPTIMIZATIONS`
+
+    Todo:
+        - Implement a context manager to dynamically change the default.
     """
 
     auto_optimize: bool
@@ -50,10 +53,10 @@ def jace_optimize(
     tsdfg: translator.TranslatedJaxprSDFG,
     **kwargs: Unpack[CompilerOptions],
 ) -> None:
-    """Performs optimization of the `tsdfg` _in place_.
+    """Performs optimization of the translated SDFG _in place_.
 
-    Currently this function only supports simplification.
-    Its main job is to exists that we have something that we can call in the tool chain.
+    It is recommended to use the `CompilerOptions` `TypedDict` to pass options to the function.
+    However, any option that is not specified will be interpreted as to be disabled.
 
     Args:
         tsdfg:          The translated SDFG that should be optimized.
@@ -61,7 +64,7 @@ def jace_optimize(
         auto_optimize:  Run the auto optimization pipeline (currently does nothing)
 
     Note:
-        By default all optimizations are disabled and this function acts as a noops.
+        Its main job is to exists that we have something that we can call in the tool chain.
     """
     if not kwargs:
         return
diff --git a/src/jace/stages.py b/src/jace/stages.py
index b130107..8941906 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -7,7 +7,7 @@
 """Reimplementation of the `jax.stages` module.
 
 This module reimplements the public classes of that Jax module.
-However, they are a big different, because JaCe uses DaCe as backend.
+However, they are a bit different, because JaCe uses DaCe as backend.
 
 As in Jax JaCe has different stages, the terminology is taken from
 [Jax' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
@@ -20,6 +20,8 @@
     This will turn the SDFG into an executable object, see `dace.codegen.CompiledSDFG`.
 - Execution:
     This is the actual running of the computation.
+
+As in Jax the `stages` module give access to the last three stages, but not the first one.
 """
 
 from __future__ import annotations
@@ -40,6 +42,14 @@
 
     import dace
 
+__all__ = [
+    "CompilerOptions",  # export for compatibility with Jax.
+    "JaCeCompiled",
+    "JaCeLowered",
+    "JaCeWrapped",
+    "Stage",
+]
+
 
 class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
     """A function ready to be specialized, lowered, and compiled.
@@ -47,10 +57,10 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
     This class represents the output of functions such as `jace.jit()` and is the first stage in
     the translation/compilation chain of JaCe. A user should never create a `JaCeWrapped` object
     directly, instead `jace.jit` should be used for that.
-    While it supports just-in-time lowering and compilation these steps can also be performed
-    explicitly. The lowering performed by this stage is cached, thus if a `JaCeWrapped` object is
-    lowered later, with the same argument the result is taken from the cache.
-    Furthermore, a `JaCeWrapped` object is composable with all Jax transformations.
+    While it supports just-in-time lowering and compilation, by just calling it, these steps can
+    also be performed explicitly. The lowering performed by this stage is cached, thus if a
+    `JaCeWrapped` object is lowered later, with the same argument the result is taken from the
+    cache. Furthermore, a `JaCeWrapped` object is composable with all Jax transformations.
 
     Args:
         fun:                    The function that is wrapped.
@@ -63,7 +73,7 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
 
     Note:
         The tracing of function will always happen with enabled `x64` mode, which is implicitly
-        and temporary activated during tracing.
+        and temporary activated while tracing.
     """
 
     _fun: Callable
@@ -81,6 +91,7 @@ def __init__(
         #  This prevents that any modifications affect `self`.
         #  Shallow is enough since the translators themselves are immutable.
         self._primitive_translators = dict(primitive_translators)
+        # TODO(phimuell): Do we need to deepcopy the options?
         self._jit_options = dict(jit_options)
         self._fun = fun
 
@@ -89,7 +100,10 @@ def __call__(
         *args: Any,
         **kwargs: Any,
     ) -> Any:
-        """Executes the wrapped function, lowering and compiling as needed in one step."""
+        """Executes the wrapped function, lowering and compiling as needed in one step.
+
+        The arguments passed to this function are the same as the wrapped function uses.
+        """
 
         # If we are inside a traced context, then we forward the call to the wrapped function.
         #  This ensures that JaCe is composable with Jax.
@@ -108,17 +122,23 @@ def lower(
     ) -> JaCeLowered:
         """Lower this function explicitly for the given arguments.
 
-        Performs the first two steps of the AOT steps described above, i.e. stage out to Jaxpr
-        and then translate to SDFG. The result is encapsulated and returned into a `Lowered` object.
+        Performs the first two steps of the AOT steps described above, i.e. trace the wrapped
+        function with the given arguments and stage it out to a Jaxpr. Then translate it to SDFG.
+        The result is encapsulated inside a `JaCeLowered` object which can later be compiled.
+
+        Note:
+            The call to the function is cached. As key an abstract description of the call,
+            similar to the tracers used by Jax, is used.
+            The tracing is always done with activated `x64` mode.
         """
         if len(kwargs) != 0:
             raise NotImplementedError("Currently only positional arguments are supported.")
 
         # TODO(phimuell): Currently the SDFG that we build only supports `C_CONTIGUOUS` memory
-        #  order. Since we support the paradigm that "everything passed to `lower` should also
+        #  order. Since we support the paradigm that "everything passed to `lower()` should also
         #  be accepted as argument to call the result", we forbid other memory orders here.
         if not all((not util.is_array(arg)) or arg.flags["C_CONTIGUOUS"] for arg in args):
-            raise NotImplementedError("Currently can not handle strides beside 'C_CONTIGUOUS'.")
+            raise NotImplementedError("Currently can not yet handle strides beside 'C_CONTIGUOUS'.")
 
         # In Jax `float32` is the main datatype, and they go to great lengths to avoid some
         #  aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
@@ -150,10 +170,13 @@ def _make_call_description(
         self,
         *args: Any,
     ) -> tcache.StageTransformationSpec:
-        """This function computes the key for the `JaCeWrapped.lower()` call to cache it.
+        """This function computes the key for the `JaCeWrapped.lower()` call inside the cache.
+
+        The function will compute a full abstract description on its argument.
 
-        The function will compute a full abstract description on its argument. Currently it is
-        only able to handle positional argument and does not support static arguments.
+        Todo:
+            - Support keyword arguments and default values of the wrapped function.
+            - Support static arguments.
         """
         call_args = tuple(tcache._AbstractCallArgument.from_value(x) for x in args)
         return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
@@ -162,13 +185,16 @@ def _make_call_description(
 class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
     """Represents the original computation as an SDFG.
 
-    It represents the computation wrapped by a `JaCeWrapped` translated and lowered to SDFG.
-    It is followed by the `JaCeCompiled` stage.
-    Although, `JaCeWrapped` is composable with Jax transformations `JaCeLowered` is not.
-    A user should never create such an object, instead `JaCeWrapped.lower()` should be used.
+    This class represents the output of `JaCeWrapped.lower()` and represents the originally wrapped
+    computation as an SDFG. This stage is followed by the `JaCeCompiled` stage.
+
+    Args:
+        tsdfg:      The translated SDFG object representing the computation.
 
     Note:
         `self` will manage the passed `tsdfg` object. Modifying it results in undefined behavior.
+        Although, `JaCeWrapped` is composable with Jax transformations `JaCeLowered` is not.
+        A user should never create such an object, instead `JaCeWrapped.lower()` should be used.
 
     Todo:
         - Handle pytrees.
@@ -212,8 +238,8 @@ def compile(
     def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
         """Returns the internal SDFG.
 
-        The function returns a `TranslatedJaxprSDFG` object.
-        It is important that modifying this object in any way is undefined behavior.
+        The function returns a `TranslatedJaxprSDFG` object. It is important that modifying this
+        object in any way is undefined behavior.
         """
         if (dialect is None) or (dialect.upper() == "SDFG"):
             return self._translated_sdfg
@@ -234,11 +260,10 @@ def _make_call_description(
         self,
         compiler_options: CompilerOptions | None = None,
     ) -> tcache.StageTransformationSpec:
-        """This function computes the key for the `self.compile()` call to cache it.
+        """This function computes the key for the `self.compile()` call inside the cache.
 
         The key that is computed by this function is based on the concrete values of the passed
-        compiler options. This is different from the key computed by `JaCeWrapped` which is an
-        abstract description.
+        compiler options.
         """
         options = self._make_compiler_options(compiler_options)
         call_args = tuple(sorted(options.items(), key=lambda X: X[0]))
@@ -290,7 +315,11 @@ def __call__(
         *args: Any,
         **kwargs: Any,
     ) -> Any:
-        """Calls the embedded computation."""
+        """Calls the embedded computation.
+
+        The arguments must be the same as for the wrapped function, but with all static arguments
+        removed.
+        """
         return util.run_jax_sdfg(
             self._csdfg,
             self._inp_names,
@@ -302,12 +331,3 @@ def __call__(
 
 #: Known compilation stages in JaCe.
 Stage = JaCeWrapped | JaCeLowered | JaCeCompiled
-
-
-__all__ = [
-    "CompilerOptions",  # export for compatibility with Jax.
-    "JaCeCompiled",
-    "JaCeLowered",
-    "JaCeWrapped",
-    "Stage",
-]
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index a97d3c4..2acbb7f 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -5,7 +5,11 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Subpackage containing all the code related to Jaxpr translation"""
+"""Subpackage containing all the code related to the Jaxpr to SDFG translation.
+
+The concrete primitive translators that ships with JaCe are inside the `primitive_translators`
+subpackage.
+"""
 
 from __future__ import annotations
 
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index e41f823..1cc8265 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -5,6 +5,8 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
+"""Contains the translator that actually builds an SDFG based on a Jaxpr description."""
+
 from __future__ import annotations
 
 import copy
@@ -25,9 +27,10 @@
 class JaxprTranslationBuilder:
     """Internal builder class for creating an SDFG equivalent of a `Jaxpr` instance.
 
-    The SDFG that is created by this class has a very particular form, which we consider canonical.
-    The main feature of a canonical SDFG are:
+    The SDFG created by this class has a very particular form, which we call canonical. The main
+    features of such an SDFG are:
     - the SDFG is a list of states, ideally each state corresponds to single Jax primitive,
+    - it has a single source and sink state.
     - all variable names are derived from Jax names,
     - there are only transient variables inside the SDFG,
     - It lacks the special `__return` variable,
@@ -35,31 +38,31 @@ class JaxprTranslationBuilder:
 
     For these reasons the SDFG is not directly usable, and further manipulations have to be
     performed. Especially, DaCe's validation function will fail and it is unable to be processed
-    by the optimization pipeline. For more information also see `jace.translator.post_translation`
+    by JaCe's optimization pipeline. For more information also see `jace.translator.post_translation`
     module.
 
-    The idea of the translator is extremely simple. Since Jaxpr is a list consisting of more or
-    less simple instructions/equations, they get processed one after the other. Each equation is
-    translated into its own state that is appended to the SDFG, thus the SDFG is a long list of
-    states. In certain cases it might be that an equation needs more states, but this is an
-    exception.
+    The idea of the translator is extremely simple. A Jaxpr is essentially a list consisting of
+    more or less simple instructions/equations, they get processed one after the other. Each
+    equation is translated into its own state that is successively appended to the SDFG, while the
+    SDFG is being build, which explains the particular form of the SDFG.
 
-    The actual translation of the equation is not handled by the builder. Instead the request is
-    forwarded to a `PrimitiveTranslator` object, known as primitive translator. This is a highly
-    specialized object that is able to handle one kind of primitive. For more information on them
-    see the documentation of `PrimitiveTranslator`.
+    However, the actual translation of the equations is not handled by the builder. Instead the
+    request is forwarded to a `PrimitiveTranslator` object, known as primitive translator. This is
+    a highly specialized object that is able to handle one kind of primitive. For more information
+    on them see the documentation of `PrimitiveTranslator`.
 
-    To start a translation the `translate_jaxpr()` function should be called, if this happens it is
-    said that the builder has an ongoing translation. If `translate_jaxpr()` is called on a builder
-    that has an ongoing translation, a new translation context will be set up. Thus the builder
-    will then translate the supplied (nested) Jaxpr and return the result. However, this will have
-    no influence on the translation process that is already going.
+    To start a translation the `translate_jaxpr()` function has to be called, if this happens it is
+    said that the builder has an ongoing translation. The first translator is known as root,
+    translator. If `translate_jaxpr()` is called on a builder that has an ongoing translation,
+    a new translation context will be set up. Thus the builder will then translate the supplied
+    (nested) Jaxpr and return the result. However, this will have no influence on the translation
+    process that is already going.
 
     Args:
         primitive_translators:    Primitive to use during the translation.
 
     Notes:
-        After the main translation has been performed the translator object can be used again.
+        After a translation has been performed the translator object can be used again.
         Currently the builder will generate only Array as SDFG variables, however, this is a
         temporary solution, see `add_array()`.
     """
@@ -76,9 +79,9 @@ def __init__(
         self._primitive_translators = {**primitive_translators}
 
         # Maps Jax variables to the name of its SDFG equivalent.
-        #  Shared between all translation contexts, to ensure consecutive
-        #  variable naming as seen as in a pretty printed Jaxpr.
-        #  Will be cleared by `_clear_translation_ctx()` at the end of the translation.
+        #  Shared between all translation contexts, to ensure consecutive variable naming as
+        #  seen as in a pretty printed Jaxpr.
+        #  Will be cleared by `_clear_translation_ctx()` at the end of the root translation.
         self._jax_name_map = {}
 
         # Stack of all context, to handle nested Jaxpr instances.
@@ -94,16 +97,17 @@ def translate_jaxpr(
         """Perform the translation of a Jaxpr into a SDFG.
 
         In case this function is called and `self` has an ongoing translation process, a new
-        translation context will be created. This means the Jaxpr will be translated independently
-        from the previous one.
+        translation context will be created. This allows to handled nested Jaxprs.
+        However, the variable map is shared among all.
 
         Returns:
             The function will translate the passed Jaxpr object into an SDFG in canonical form.
             This SDFG together with additional meta data, that is needed for further processing
             is encapsulated inside a `TranslationContext` object.
+            For further use it should be passed to `postprocess_jaxpr_sdfg()`.
 
         Args:
-            name:                   Use this name for the SDFG instead some generated one.
+            name:   Use this name for the SDFG instead some generated one.
         """
 
         if len(jaxpr.effects) != 0:
@@ -131,20 +135,23 @@ def append_new_state(
         assignments: Mapping[str, Any] | None = None,
         prev_state: dace.SDFGState | None = None,
     ) -> dace.SDFGState:
-        """Creates a new `SDFGState` and adds it to the SDFG.
-
-        By default the new state is appended to the current terminal state, which will also update
-        the terminal state inside `self`.
+        """Creates a new `SDFGState`, adds it to the SDFG and returns it.
 
-        However, if `prev_state` is specified the state new state will be appended to `prev_state`
-        instead. The terminal state of `self` will only be modified if `prev_state` is the current
-        terminal state.
+        By default the new state is appended to the current terminal state. However, if
+        `prev_state` is specified it will be appended to it.
+        In case the new state is appended to the current terminal state, this will modify the
+        terminal state of `self`.
 
         Args:
             label:          The name that should be given to the new `SDFGState`.
             condition:      The condition of the state transitions used on the `InterstateEdge`.
             assignments:    Symbol assignments that should be done during the transition.
             prev_state:     Alternative `SDFGState` at which we should append the new state.
+
+        Notes:
+            It is potentially dangerous to not append to the current terminal state, as a
+            canonical SDFG only has one sink state. If this is done the user has to ensure,
+            that at the end of the processing the SDFG is back in canonical form.
         """
         if isinstance(label, str) and (not util.VALID_SDFG_OBJ_NAME.fullmatch(label)):
             raise ValueError(f"Can not create state with label '{label}' since it is invalid.")
@@ -184,8 +191,9 @@ def get_array(
     ) -> ddata.Data:
         """Returns the SDFG `Data` object `name` referees to.
 
-        If `name` is a string it is directly interpreted as the name of an SDFG variable. In other
-        cases it is first translated using `self.map_jax_var_to_sdfg()`.
+        `name` can either be a string, in which case it is interpreted as a verbatim SDFG name.
+        If it is a Jax or JaCe variable, the function will first perform a lookup using
+        `self.map_jax_var_to_sdfg(name)`.
         """
         if isinstance(name, (jax_core.Var, util.JaCeVar)):
             sdfg_name: str = self.map_jax_var_to_sdfg(name)
@@ -214,11 +222,11 @@ def map_jax_var_to_sdfg(
         jax_var: jax_core.Atom | util.JaCeVar,
         allow_fail: bool = False,
     ) -> str | None:
-        """Get the _name_ of the SDFG variable to which `jax_var` is referring to.
+        """Get the name of the SDFG variable to which `jax_var` is referring to.
 
         Args:
             jax_var:        The Jax variable to look up.
-            allow_fail:     If mapping is not known return `None` instead of raising `KeyError`.
+            allow_fail:     If no mapping is known return `None` instead of raising `KeyError`.
         """
         if isinstance(jax_var, jax_core.Literal):
             raise RuntimeError(f"There is no SDFG variable for literal '{jax_var}'.")
@@ -272,8 +280,11 @@ def add_jax_name_mapping(
         Args:
             jax_var:     The Jax variable.
             sdfg_name:   The name of the corresponding SDFG variable.
+
+        Todo:
+            - Implement a way to delete or to modify a mapping.
         """
-        assert len(sdfg_name) > 0
+        assert sdfg_name
 
         if jax_var in self._jax_name_map:
             raise ValueError(
@@ -295,17 +306,15 @@ def add_array(
         name_prefix: str | None = None,
         update_var_mapping: bool = False,
     ) -> str:
-        """Creates an SDFG variable for the Jax variable `arg` and returns its SDFG name.
+        """Creates an SDFG variable for Jax variable `arg` and returns its SDFG name.
 
-        The SDFG object is always created as a transient.
+        The SDFG object is always created as a transient. Furthermore, the function will not
+        update the internal variable mapping, by default.
 
         By default the function will use `jace.util.propose_jax_name()` to derive the name that
         should be used. However, by passing a `JaCeVar` with a name it is possible to suggest a
-        specific name. In addition it is possible to specify `name_prefix` to prefix name that
-        would be used.
-
-        The function will not update the internal variable mapping. If this is desired one can
-        set `update_var_mapping`, for forcing this.
+        specific name. In addition it is possible to specify `name_prefix` to supply a prefix
+        to the determined name that should be used.
 
         Args:
             arg:                The Jax object for which a SDFG equivalent should be created.
@@ -330,19 +339,21 @@ def add_array(
         as_transient = True
         strides = None
 
-        if shape == ():  # Shape of a DaCe scalar.
+        if shape == ():  # Temporary fix for handling DaCe scalars, see above for more.
             shape = (1,)
 
         # Propose a name and if needed extend it.
         arg_name = util.propose_jax_name(arg, self._jax_name_map)
-        if name_prefix is not None:
-            if not util.VALID_SDFG_VAR_NAME.fullmatch(name_prefix):
-                raise ValueError(f"add_array({arg}): Supplied invalid prefix '{name_prefix}'.")
+        if name_prefix:
             arg_name = f"{name_prefix}{arg_name}"
 
         # final checks
         if arg_name in self._ctx.sdfg.arrays:
             raise ValueError(f"add_array({arg}): The proposed name '{arg_name}', is used.")
+        if not util.VALID_SDFG_VAR_NAME.fullmatch(arg_name):
+            raise ValueError(f"add_array({arg}): The proposed name '{arg_name}', is invalid.")
+        if arg_name in util.FORBIDDEN_SDFG_VAR_NAMES:
+            raise ValueError(f"add_array({arg}): The proposed name '{arg_name}', is forbidden.")
 
         self._ctx.sdfg.add_array(
             name=arg_name,
@@ -400,7 +411,7 @@ def create_jax_var_list(  # type: ignore[misc]
         By setting `prevent_creation` the function will not create any new SDFG variables, if no
         corresponding SDFG variable exists an error is generated. By setting `only_creation` the
         function will only create new SDFG variables, if a variable already have a corresponding
-        SDFG variable an error will be created.
+        SDFG variable an error will be generated.
 
         By default literals cause an error. However, by setting `handle_literals` to `True`
         literals will will be included in the output with the value `None`.
@@ -431,7 +442,7 @@ def create_jax_var_list(  # type: ignore[misc]
                 if mapped_sdfg_name is None:
                     sdfg_name = self.add_array(arg=jax_var, **kwargs)
                 elif only_creation:
-                    raise ValueError(f"'only_creation' given '{jax_var}' already exists.")
+                    raise ValueError(f"'only_creation' given but '{jax_var}' already exists.")
                 else:
                     sdfg_name = mapped_sdfg_name
             ret_list.append(sdfg_name)
@@ -497,16 +508,11 @@ def _allocate_translation_ctx(
         self,
         name: str | None = None,
     ) -> JaxprTranslationBuilder:
-        """This function allocates and initialize the members of the translation context of `self`.
-
-        If this function is called and `self` is already allocated, the function will create a new
-        context, allowing the builder to handle nested Jaxpr.
-        The first context that is created is known as root translator.
+        """Allocate a new context and activate it.
 
         Args:
             name:               The name of the SDFG.
         """
-
         self._ctx_stack.append(
             TranslationContext(
                 name=name,
@@ -522,7 +528,7 @@ def _ctx(self) -> TranslationContext:
         return self._ctx_stack[-1]
 
     def _clear_translation_ctx(self) -> TranslationContext | None:
-        """Remove the current active context from `self` and returns its state.
+        """Remove the currently active context from `self` and returns it.
 
         If `self` is not allocated it will return `None`.
         """
@@ -530,7 +536,7 @@ def _clear_translation_ctx(self) -> TranslationContext | None:
             return None
 
         if self.is_root_translator():
-            # The translation as a whole has finished, so restore the builder,
+            # The translation, as a whole has finished, so restore the builder,
             #  i.e. delete all the shared state.
             self._jax_name_map = {}
 
@@ -550,8 +556,8 @@ def _translate_single_eqn(
         - Call the primitive translator to perform the translation inside the new state.
 
         Returns:
-            The SDFG names that were used as input and output are returned.
-            The inputs might contain `None` which indicates that that input was a Jax Literal.
+            The SDFG names that were used as inputs and outputs. The inputs might contain `None`
+            which indicates that this particular input was a literal.
         """
         if len(eqn.effects) != 0:
             raise NotImplementedError(f"Equation '{eqn}' has side effects.")
@@ -579,7 +585,7 @@ def _translate_single_eqn(
         # Create the state into which the equation should be translated
         eqn_state = self.append_new_state(
             label=f"{pname}_{'_'.join(out_var_names)}",
-            prev_state=None,  # forces terminal state to use
+            prev_state=None,  # forces the creation of a new terminal state
         )
 
         # Now perform the actual translation of the equation.
@@ -596,6 +602,8 @@ def _translate_single_eqn(
             if eqn_state is not self._ctx.terminal_state:
                 raise RuntimeError("Inconsistent terminal state was detected.")
             new_sdfg_term_state = eqn_state
+        if not self._ctx.validate():
+            raise RuntimeError("Detected an invalid SDFG under construction.")
 
         # In case a translator decided to not use the variables we created for it, which is
         #  allowed but it must update the `out_var_names` list correctly, we will now verify this.
@@ -620,9 +628,7 @@ def _translate_jaxpr_internal(
         """Performs the actual translation of the Jaxpr into an SDFG.
 
         The function assumes that the context is allocated as well as the initial variables.
-        The function will return the internal state of `self` encapsulated inside a
-        `TranslationContext` object. The function will also deallocate the current context
-        upon return.
+        The function removes and returns the currently active translation context.
 
         Args:
             jaxpr:      The Jaxpr to translate.
@@ -662,6 +668,9 @@ def _handle_null_jaxpr(
         Returns:
             The function returns a list denoting the SDFG variables that refers to the output.
             The order of the list is the same as in `jaxpr.jaxpr.outvars`.
+
+        Todo:
+            - Handle the case if if the output is a literal.
         """
         assert self._ctx.terminal_state is self._ctx.start_state
         assert len(self._ctx.inp_names) > 0
@@ -704,7 +713,7 @@ def _handle_null_jaxpr(
             # `jax_out_var` now has, in some sense, two SDFG equivalents, the input, that
             #  was previously created by `self._create_initial_input()` and the `sdfg_out_name`
             #  we just created. But we can not add this to the mapping. Because it is the best,
-            #  as in least worst, thing we can do we remove it from the mapping.
+            #  as in the least worst thing we can do, we remove it from the mapping.
             #  I am open for different approaches.
             self._jax_name_map.pop(jax_out_var)
 
@@ -726,9 +735,12 @@ class TranslationContext:
     Essentially it is a `TranslatedJaxprSDFG` object together with some additional meta data,
     that is needed during translation. It is also returned by the `translate_jaxpr()` function.
     It is important that the SDFG it encapsulates is not directly usable and should be passed
-    to the post processing stage.
+    to the post processing stage, i.e. `postprocess_jaxpr_sdfg()`, which will turn a context into
+    a `TranslatedJaxprSDFG` object.
 
     Attributes:
+        jsdfg:          The wrapped `TranslatedJaxprSDFG` object that stores the SDFG under
+            construction. `self` adds access properties to all attributes of the `TranslatedJaxprSDFG`.
         start_state:    The first state in the SDFG state machine.
         terminal_state: The (currently) last state in the state machine.
 
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index e50ac73..f0b2088 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -6,11 +6,8 @@
 # SPDX-License-Identifier: BSD-3-Clause
 """Interface for all primitive translators and managing of the global translator registry.
 
-The high level idea is that there is a registry of all currently active primitive translators.
-If `primitive_translators` is not given to `jit` it will use this global registry.
-A primitive, i.e. an object that satisfies the `PrimitiveTranslator` interface, can be added
-to the registry by `register_primitive_translator()`. To retrieve the translators that are
-currently active you can use the `get_regsitered_primitive_translators()` function.
+Todo:
+    Implement proper context manager for working with the registry.
 """
 
 from __future__ import annotations
@@ -51,13 +48,12 @@ def __call__(
     ) -> dace.SDFGState | None:
         """Translates the Jax primitive into its SDFG equivalent.
 
-        Before the builder calls this function it will perform the following
-        preparatory tasks:
+        Before the builder calls this function it will perform the following preparatory tasks:
         - It will allocate the SDFG variables that are used as outputs. Their names will be passed
             through the `out_var_names` argument, in the same order as `eqn.outvars`.
-        - It will collect the names of the SDFG variables that are used as input and place them in
+        - It will collect the names of the SDFG variables that are used as inputs and place them in
             `in_var_names`, in the same order as `eqn.invars`. If an input argument refers to a
-            literal no SDFG variable is created for it and `None` is passed to indicate this.
+            literal no SDFG variable is created for it and `None` is used to indicate this.
         - The builder will create variables that are used as output. They are passed as
             `out_var_names`, same order as in the equation.
         - The builder will create a new terminal state and pass it as `eqn_state` argument. This
@@ -65,21 +61,22 @@ def __call__(
 
         Then the primitive translator is called.
         Usually a primitive translator should construct the dataflow graph inside `eqn_state`.
-        It is allowed that the primitive translators creates more states if needed, but this
-        state machinery has to have a single terminal state, which must be returned and reachable
-        from `eqn_state`. If the function returns `None` the builder will assume that primitive
-        translator was able to fully construct the dataflow graph within `eqn_state`.
+        However, it is allowed that the primitive translators creates more states if needed, but
+        this state machinery has to have a single terminal state, which must be returned and
+        reachable from `eqn_state`. If the function returns `None` the builder will assume that
+        primitive translator was able to fully construct the dataflow graph within `eqn_state`.
 
         While a primitive translator is forbidden from meddling with the input variables mentioned
         in `in_var_names` in any way, it is allowed to modify the output variables. For example
-        it could create a new SDFG variable, with different strides. But in that case the primitive
-        translator must update the internal mapping of the builder TBA HOW, and modify the names
-        passed through `out_var_names`. However, the translator is allowed to create internal
-        temporary variables. It just have to ensure that no name collision will occur, a way to
-        do this is to use a passed variable name as prefix.
+        a translator could create a new SDFG variable, with different strides. But in that case
+        the primitive translator must update the internal mapping of the builder TBA HOW, and
+        modify the names passed through `out_var_names`. However, the translator is allowed to
+        create internal temporary variables without registering them to the mapping, as long as it
+        uses the supplied variables as final output. To ensure that there are no collision with
+        further variables, the translator should prefix them.
 
         Args:
-            builder:         The builder object of the translation.
+            builder:        The builder object of the translation.
             in_var_names:   List of the names of the arrays created inside the
                                 SDFG for the inpts or `None` in case of a literal.
             out_var_names:  List of the names of the arrays created inside the
@@ -180,6 +177,9 @@ def register_primitive_translator(
 ):
     """Adds a primitive translator to JaCe's global registry.
 
+    The default set of primitives that are used if nothing is specified to to `jace.jit` are stored
+    inside a global registry. To add a translator to this registry this function can be used.
+
     If a translator for `primitive` is already registered an error will be generated. However,
     by specifying `overwrite` `primitive_translator` will replace the current one.
 
@@ -210,8 +210,8 @@ def wrapper(
 def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTranslator]:
     """Returns a copy of the current state of JaCe's global primitive registry.
 
-    The function returns a mapping that maps the name of a primitive to the associated translator.
-    No change to the global registry will affect the return value and vice versa.
+    The state returned by this function is compatible to what `jace.hit`'s `primitive_translators`
+    argument expects. It is important the the returned object is decoupled from the registry.
     """
     return _PRIMITIVE_TRANSLATORS_REGISTRY.copy()
 
@@ -219,9 +219,9 @@ def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTran
 def set_active_primitive_translators_to(
     new_translators: Mapping[str, translator.PrimitiveTranslator],
 ) -> MutableMapping[str, translator.PrimitiveTranslator]:
-    """Exchange the global translator registry of JaCe with `new_translators`.
+    """Exchange the global translator registry state of JaCe with `new_translators`.
 
-    The function will return the state of the global translator registry just before this call.
+    The function will return the state of the global translator registry prior to this call.
     Any changes to `new_translators` after calling this function will have no effect on the
     global translator registry and vice versa.
     """
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 13f34dd..77c6001 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -16,9 +16,9 @@ class TranslatedJaxprSDFG:
     """Encapsulates the result of a translation run of the `JaxprTranslationBuilder` object.
 
     The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a `TranslationContext`,
-    that was in turn constructed by `JaxprTranslationBuilder.translate_jaxpr()` to
-    `postprocess_jaxpr_sdfg()`.
-    This class encapsulates a translated SDFG as well as the meta data needed to run it.
+    that was in turn constructed by `JaxprTranslationBuilder.translate_jaxpr()`, to the
+    `postprocess_jaxpr_sdfg()` function.
+    This class encapsulates a translated SDFG as well as the meta data needed to compile and run it.
 
     Contrary to the SDFG that is encapsulated inside the `TranslationContext` object, `self`
     carries a proper SDFG, however:
@@ -27,10 +27,11 @@ class TranslatedJaxprSDFG:
         are only listed as inputs.
 
     Attributes:
-        sdfg:           The SDFG object that was created.
-        inp_names:      A list of the SDFG variables that are used as input, same order as `Jaxpr.invars`.
-        out_names:      A list of the SDFG variables that are used as output, same order as `Jaxpr.outvars`.
+        sdfg:           The encapsulated SDFG object.
+        inp_names:      A list of the SDFG variables that are used as input
+        out_names:      A list of the SDFG variables that are used as output.
 
+    The `inp_names` and `out_name` are in the same order as in the original Jaxpr object.
     It might happen that a name appears in both the `inp_names` and `out_names` lists. This happens
     if an argument is used both as input and output, and it is not an error. In Jax this is called
     argument donation.
diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index 290eafe..0e3fcd7 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -29,7 +29,12 @@
 def compile_jax_sdfg(
     tsdfg: translator.TranslatedJaxprSDFG,
 ) -> dace_helper.CompiledSDFG:
-    """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object."""
+    """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object.
+
+    Note:
+        For calling the returned `CompiledSDFG` object you need the `inp_names` and `out_names`
+        of the input `TranslatedJaxprSDFG`.
+    """
     if any(  # We do not support the DaCe return mechanism
         arrname.startswith("__return")
         for arrname in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
@@ -73,7 +78,7 @@ def run_jax_sdfg(
 
     The function assumes that the SDFG was finalized and then compiled by `compile_jax_sdfg()`.
     For running the SDFG you also have to pass the input names (`inp_names`) and output names
-    (`out_names`) that where inside the `TranslatedJaxprSDFG` from which `csdfg` was compiled from.
+    (`out_names`) that were inside the `TranslatedJaxprSDFG` from which `csdfg` was compiled from.
 
     Args:
         csdfg:      The `CompiledSDFG` object.
@@ -85,13 +90,14 @@ def run_jax_sdfg(
     Note:
         There is no pytree mechanism jet, thus the return values are returned inside a `tuple`
         or in case of one value, directly, in the order determined by Jax.
-        Currently, this function does not consider strides in the input, all input must be
-        `C_CONTIGUOUS` nor have any undefined symbols.
+        Furthermore, DaCe does not support scalar return values, thus they are silently converted
+        into arrays of length 1, the same holds for inputs.
 
     Todo:
-        Since we do not have symbols and a fixed size this works and there is no problem.
-        However, if we have symbols or variable sizes, we must ensure that the init function of
-        the SDFG is called every time, or ensure that its exit function runs every time.
+        - Since we do not have symbols and a fixed size this works and there is no problem.
+            However, if we have symbols or variable sizes, we must ensure that the init function of
+            the SDFG is called every time, or ensure that its exit function runs every time.
+        - Implement non C strides.
     """
     sdfg: dace.SDFG = csdfg.sdfg
 
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index b7bb2e4..c5b518d 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -38,6 +38,9 @@ class is as an internal representation of values, as they are used in Jax, but w
     instance and a shape. In addition it has an optional name, which allows to create variables
     with a certain name using `JaxprTranslationBuilder.add_array()`.
 
+    If you are expect to handle both real Jax variables and JaCe variable, you should use the
+    `get_jax_var_*()` functions to access them.
+
     Args:
         shape:      The shape of the variable.
         dtype:      The dace datatype of the variable.
@@ -75,10 +78,7 @@ def __eq__(self, other: Any) -> bool:
 
 
 def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
-    """Returns the name of the Jax variable as a string.
-
-    Args:
-        jax_var:     The variable to stringify.
+    """Returns the name of `jax_var` as a string.
 
     Notes:
         If `jax_var` is a `JaCeVar` the function will return, if defined, its `.name` property.
@@ -91,7 +91,7 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
         case JaCeVar():
             return jax_var.name if jax_var.name else f"jax{id(jax_var)}"
         case jax_core.Var():
-            # This is not how the pretty printer works nor Jax.Var.__repr__,
+            # This is not how the pretty printer works nor `jax.Var.__repr__()`,
             #  but leads to stable and valid names.
             return f"jax{jax_var.count}{jax_var.suffix}"
         case jax_core.Literal():
@@ -136,7 +136,7 @@ def is_tracing_ongoing(
     """Test if tracing is ongoing.
 
     While a return value `True` guarantees that a translation is ongoing, a value of `False`
-    does not guarantees that no tracing is active.
+    does not guarantees that no tracing is ongoing.
     """
     # The current implementation only checks the arguments if it contains tracers.
     if (len(args) == 0) and (len(kwargs) == 0):
@@ -165,9 +165,9 @@ def propose_jax_name(
 
     If `jax_name_map` is `None` the function will fallback to `get_jax_var_name(jax_var)`.
     If `jax_name_map` is supplied the function will:
-    - if `jax_var` is stored inside `jax_name_map` this value will be returned.
-    - if `jax_var` is a `JaCeVar` with a set `.name` property that name will be returned.
-    - otherwise the function will generate a new name in a similar way than pretty printer of Jaxpr.
+    - If `jax_var` is stored inside `jax_name_map`, returns the mapped value.
+    - If `jax_var` is a `JaCeVar` with a set `.name` property that name will be returned.
+    - Otherwise the function will generate a new name in a similar way to the pretty printer of Jaxpr.
 
     Args:
         jax_var:        The variable for which a name to propose.
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index ae2f41b..56f4f7e 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -24,7 +24,7 @@
 def is_jaceified(obj: Any) -> TypeGuard[stages.JaCeWrapped]:
     """Tests if `obj` is decorated by JaCe.
 
-    Similar to `is_jaxified`, but for JaCe object.
+    Similar to `is_jaxified` but for JaCe objects.
     """
 
     if util.is_jaxified(obj):
@@ -32,16 +32,6 @@ def is_jaceified(obj: Any) -> TypeGuard[stages.JaCeWrapped]:
     return isinstance(obj, stages.JaCeWrapped)
 
 
-def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVar]:
-    """Tests if `jax_var` is a drop variable, i.e. a variable that is not read from in a Jaxpr."""
-
-    if isinstance(jax_var, jax_core.DropVar):
-        return True
-    if isinstance(jax_var, util.JaCeVar):
-        return jax_var.name == "_" if jax_var.name else False
-    return False
-
-
 def is_jaxified(
     obj: Any,
 ) -> TypeGuard[jax_core.Primitive | jax_src.pjit.JitWrapped | jax_xe.PjitFunction]:
@@ -60,13 +50,23 @@ def is_jaxified(
     return isinstance(obj, jaxifyed_types)
 
 
+def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVar]:
+    """Tests if `jax_var` is a drop variable, i.e. a variable that is not read from in a Jaxpr."""
+
+    if isinstance(jax_var, jax_core.DropVar):
+        return True
+    if isinstance(jax_var, util.JaCeVar):
+        return jax_var.name == "_" if jax_var.name else False
+    return False
+
+
 def is_jax_array(
     obj: Any,
 ) -> TypeGuard[jax.Array]:
-    """Tests if `obj` is a jax array.
+    """Tests if `obj` is a Jax array.
 
-    Notes jax array are special as you can not write to them directly.
-    Furthermore, they always allocate also on GPU, beside the CPU allocation.
+    Notes Jax array are special as you can not write to them directly.
+    Furthermore, they always allocate on the CPU and if present, also on the GPU.
     """
     return isinstance(obj, jax.Array)
 
@@ -116,7 +116,7 @@ def is_on_device(
     """Tests if `obj` is on a device.
 
     Jax arrays are always on the CPU and GPU (if there is one). Thus for Jax arrays this
-    function is more of a test, if there is a GPU or not.
+    function is more of a test, if there is a GPU at all.
     """
     if is_jax_array(obj):
         return hasattr(obj, "__cuda_array_interface__")
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index c0f6fce..02ba9ef 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -62,6 +62,9 @@ class CachingStage(Generic[NextStage]):
 
     Notes:
         The `__init__()` function must explicitly be called to fully setup `self`.
+
+    Todo:
+        - Handle eviction from the cache due to collecting of unused predecessor stages.
     """
 
     _cache: StageCache[NextStage]
@@ -79,7 +82,7 @@ def _make_call_description(
         ...
 
 
-# Type annotation of the caching Stuff.
+# Type annotation for the caching.
 P = ParamSpec("P")
 TransitionFunction = Callable[Concatenate[CachingStage[NextStage], P], NextStage]
 CachingStageType = TypeVar("CachingStageType", bound=CachingStage)
@@ -92,6 +95,9 @@ def cached_transition(
 
     In order to work, the stage must be derived from `CachingStage`. For computing the key of a
     call the function will use the `_make_call_description()` function of the cache.
+
+    Todo:
+        - Implement a way to temporary disable the cache.
     """
 
     @functools.wraps(transition)
@@ -130,8 +136,8 @@ def get_cache(
 class _AbstractCallArgument:
     """Class to represent a single argument to the transition function in an abstract way.
 
-    As noted in `StageTransformationSpec` there are two ways to describe an argument,
-    either using its concrete value or an abstract description, which is similar to tracers in Jax.
+    As noted in `StageTransformationSpec` there are two ways to describe an argument, either by
+    using its concrete value or an abstract description, which is similar to tracers in Jax.
     This class represents the second way.
     To create an instance you should use `_AbstractCallArgument.from_value()`.
 
@@ -201,8 +207,8 @@ class StageTransformationSpec:
     """Represents the entire call to a state transformation function of a stage.
 
     State transition functions are annotated with `@cached_transition` and their result may be
-    cached. They key to locate them inside the cache is represented by this class.
-    The cache will call the `CachingStage._make_call_description()` function to get a key.
+    cached. They key to locate them inside the cache is represented by this class and computed by
+    the `CachingStage._make_call_description()` function.
     The actual key is consists of two parts, `stage_id` and `call_args`.
 
     Args:
diff --git a/tests/test_caching.py b/tests/test_caching.py
index db568a3..b9d42a9 100644
--- a/tests/test_caching.py
+++ b/tests/test_caching.py
@@ -249,7 +249,7 @@ def wrapped(A: np.ndarray) -> np.ndarray:
     F_res = C_res.copy()  # Remove later
     with pytest.raises(  # noqa: PT012 # Multiple calls
         expected_exception=NotImplementedError,
-        match=re.escape("Currently can not handle strides beside 'C_CONTIGUOUS'."),
+        match=re.escape("Currently can not yet handle strides beside 'C_CONTIGUOUS'."),
     ):
         F_lower = wrapped.lower(F)
         F_res = wrapped(F)
diff --git a/tests/test_jaxpr_translator_builder.py b/tests/test_jaxpr_translator_builder.py
index 13a3835..75e8ded 100644
--- a/tests/test_jaxpr_translator_builder.py
+++ b/tests/test_jaxpr_translator_builder.py
@@ -328,7 +328,7 @@ def test_builder_variable_invalid_prefix(
     for iprefix in ["0_", "_ja ", "_!"]:
         with pytest.raises(
             expected_exception=ValueError,
-            match=re.escape(f"add_array({array1}): Supplied invalid prefix '{iprefix}'."),
+            match=re.escape(f"add_array({array1}): The proposed name '{iprefix}a', is invalid."),
         ):
             _ = translation_builder.add_array(array1, update_var_mapping=False, name_prefix=iprefix)
         assert len(translation_builder.sdfg.arrays) == 0
@@ -555,6 +555,6 @@ def testee(A: np.ndarray) -> np.ndarray:
 
     with pytest.raises(
         expected_exception=NotImplementedError,
-        match=re.escape("Currently can not handle strides beside 'C_CONTIGUOUS'."),
+        match=re.escape("Currently can not yet handle strides beside 'C_CONTIGUOUS'."),
     ):
         _ = testee(F)

From a23f0ab837f7d5ea2eaaeb3f1349f47aa72217d8 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 31 May 2024 11:50:39 +0200
Subject: [PATCH 281/458] Started to restructure the tests.

I also have to reformat them.
---
 tests/conftest.py                             | 64 +++++++++++++-
 .../test_primitive_alu.py                     | 85 +++++++++----------
 .../test_primitive_broadcast_in_dim.py        | 42 ++++++---
 .../test_primitive_convert_element_type.py    | 46 +---------
 .../test_primitive_copy.py                    | 10 ++-
 .../test_primitive_reshape.py                 |  4 +-
 .../test_primitive_select_n.py                | 24 +-----
 .../test_primitive_slicing.py                 | 15 ++--
 .../test_primitive_squeeze_expand_dims.py     |  9 +-
 tests/integration_tests/test_empty_jaxpr.py   | 37 +++++++-
 .../test_jaxpr_translator_builder.py          | 14 +--
 .../test_primitive_translator_managing.py     | 25 +++---
 tests/unit_tests/test_caching.py              | 53 ++++++------
 tests/unit_tests/test_decorator.py            | 25 ++----
 tests/unit_tests/test_jax_api.py              | 15 ++--
 tests/unit_tests/test_misc.py                 | 12 +--
 tests/util.py                                 | 42 +++++++++
 17 files changed, 306 insertions(+), 216 deletions(-)
 create mode 100644 tests/util.py

diff --git a/tests/conftest.py b/tests/conftest.py
index f2d8b8f..e55ad74 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -5,4 +5,66 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""General configuration for the tests."""
+"""General configuration for the tests.
+
+Todo:
+    - Implement some fixture that allows to force validation.
+"""
+
+from __future__ import annotations
+
+import jax
+import numpy as np
+import pytest
+
+from jace.util import translation_cache as tcache
+
+
+@pytest.fixture(autouse=True)
+def _enable_x64_mode_in_jax():
+    """Fixture of enable the `x64` mode in Jax.
+
+    Currently, JaCe requires that `x64` mode is enabled and will do all Jax things with it enabled.
+    However, if we use Jax with the intend to compare it against JaCe we must also enable it for
+    Jax.
+    """
+    with jax.experimental.enable_x64():
+        yield
+
+
+@pytest.fixture(autouse=True)
+def _disable_jit():
+    """Fixture for disable the dynamic jiting in Jax.
+
+    For certain reasons Jax puts certain primitives inside a `pjit` primitive, i.e. nested Jaxpr.
+    The intent is, that these operations can/should run on an accelerator.
+
+    But this is a problem, since JaCe can not handle this primitive, it leads to an error.
+    To overcome this problem, we will globally disable this feature until we can handle `pjit`.
+
+    Todo:
+        Remove as soon as we can handle nested `jit`.
+    """
+    with jax.disable_jit(disable=True):
+        yield
+
+
+@pytest.fixture(autouse=True)
+def _clear_translation_cache():
+    """Decorator that clears the translation cache.
+
+    Ensures that a function finds an empty cache and clears up afterwards.
+    """
+    tcache.clear_translation_cache()
+    yield
+    tcache.clear_translation_cache()
+
+
+@pytest.fixture(autouse=True)
+def _reset_random_seed():
+    """Fixture for resetting the random seed.
+
+    This ensures that for every test the random seed of NumPy is reset.
+    This seed is used by the `util.mkarray()` helper.
+    """
+    np.random.seed(42)  # noqa: NPY002  # We use this seed for the time being.
diff --git a/tests/integration_tests/primitive_translators/test_primitive_alu.py b/tests/integration_tests/primitive_translators/test_primitive_alu.py
index 24db139..51e5a3e 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_alu.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_alu.py
@@ -5,7 +5,11 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements tests for the ALU translator."""
+"""Implements tests for the ALU translator.
+
+Todo:
+    - Add all supported primitives, to see if the template is valid.
+"""
 
 from __future__ import annotations
 
@@ -17,12 +21,14 @@
 
 import jace
 
+from tests import util as testutil
+
 
 if TYPE_CHECKING:
-    from collections.abc import Callable, Sequence
+    from collections.abc import Callable
 
 
-def _perform_test(testee: Callable, *args: Any) -> None:
+def _perform_alu_test(testee: Callable, *args: Any) -> None:
     """General function that just performs the test."""
     wrapped = jace.jit(testee)
 
@@ -31,20 +37,13 @@ def _perform_test(testee: Callable, *args: Any) -> None:
     assert np.allclose(ref, res), f"Expected '{ref.tolist()}' got '{res.tolist()}'"
 
 
-def mkarr(
-    shape: Sequence[int],
-    dtype=np.float64,
-) -> np.ndarray:
-    return np.array(np.random.random(shape), dtype=dtype)  # noqa: NPY002
-
-
 def test_alu_unary_scalar():
     """Test unary ALU translator in the scalar case."""
 
     def testee(A: float) -> float | jax.Array:
         return jnp.cos(A)
 
-    _perform_test(testee, 1.0)
+    _perform_alu_test(testee, 1.0)
 
 
 def test_alu_unary_array():
@@ -53,9 +52,9 @@ def test_alu_unary_array():
     def testee(A: np.ndarray) -> jax.Array:
         return jnp.sin(A)
 
-    A = mkarr((100, 10, 3))
+    A = testutil.mkarray((100, 10, 3))
 
-    _perform_test(testee, A)
+    _perform_alu_test(testee, A)
 
 
 def test_alu_unary_scalar_literal():
@@ -64,7 +63,7 @@ def test_alu_unary_scalar_literal():
     def testee(A: float) -> float | jax.Array:
         return jnp.sin(1.98) + A
 
-    _perform_test(testee, 10.0)
+    _perform_alu_test(testee, 10.0)
 
 
 def test_alu_unary_integer_power():
@@ -74,8 +73,8 @@ def test_alu_unary_integer_power():
         def testee(A: np.ndarray) -> np.ndarray:
             return A ** int(exp)  # noqa: B023 # `exp` is not used in the body
 
-        A = mkarr((10, 2 + exp, 3))
-        _perform_test(testee, A)
+        A = testutil.mkarray((10, 2 + exp, 3))
+        _perform_alu_test(testee, A)
 
 
 def test_alu_binary_scalar():
@@ -84,7 +83,7 @@ def test_alu_binary_scalar():
     def testee(A: float, B: float) -> float:
         return A * B
 
-    _perform_test(testee, 1.0, 2.0)
+    _perform_alu_test(testee, 1.0, 2.0)
 
 
 def test_alu_binary_scalar_literal():
@@ -93,7 +92,7 @@ def test_alu_binary_scalar_literal():
     def testee(A: float) -> float:
         return A * 2.03
 
-    _perform_test(testee, 7.0)
+    _perform_alu_test(testee, 7.0)
 
 
 def test_alu_binary_scalar_literal_2():
@@ -102,7 +101,7 @@ def test_alu_binary_scalar_literal_2():
     def testee(A: float) -> float:
         return 2.03 * A
 
-    _perform_test(testee, 7.0)
+    _perform_alu_test(testee, 7.0)
 
 
 def test_alu_binary_array():
@@ -111,9 +110,9 @@ def test_alu_binary_array():
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
-    A = mkarr((100, 10, 3))
-    B = mkarr((100, 10, 3))
-    _perform_test(testee, A, B)
+    A = testutil.mkarray((100, 10, 3))
+    B = testutil.mkarray((100, 10, 3))
+    _perform_alu_test(testee, A, B)
 
 
 def test_alu_binary_array_scalar():
@@ -122,10 +121,10 @@ def test_alu_binary_array_scalar():
     def testee(A: np.ndarray | float, B: float | np.ndarray) -> np.ndarray:
         return cast(np.ndarray, A + B)
 
-    A = mkarr((100, 22))
+    A = testutil.mkarray((100, 22))
     B = np.float64(1.34)
-    _perform_test(testee, A, B)
-    _perform_test(testee, B, A)
+    _perform_alu_test(testee, A, B)
+    _perform_alu_test(testee, B, A)
 
 
 def test_alu_binary_array_literal():
@@ -134,8 +133,8 @@ def test_alu_binary_array_literal():
     def testee(A: np.ndarray) -> np.ndarray:
         return A + 1.52
 
-    A = mkarr((100, 22))
-    _perform_test(testee, A)
+    A = testutil.mkarray((100, 22))
+    _perform_alu_test(testee, A)
 
 
 def test_alu_binary_array_literal_2():
@@ -144,8 +143,8 @@ def test_alu_binary_array_literal_2():
     def testee(A: np.ndarray) -> np.ndarray:
         return 1.52 + A
 
-    A = mkarr((100, 22))
-    _perform_test(testee, A)
+    A = testutil.mkarray((100, 22))
+    _perform_alu_test(testee, A)
 
 
 def test_alu_binary_array_constants():
@@ -154,8 +153,8 @@ def test_alu_binary_array_constants():
     def testee(A: np.ndarray) -> np.ndarray:
         return A + jnp.array([[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]])
 
-    A = mkarr((3, 3))
-    _perform_test(testee, A)
+    A = testutil.mkarray((3, 3))
+    _perform_alu_test(testee, A)
 
 
 def test_alu_binary_broadcast_1():
@@ -164,10 +163,10 @@ def test_alu_binary_broadcast_1():
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
-    A = mkarr((100, 1, 3))
-    B = mkarr((100, 1, 1))
-    _perform_test(testee, A, B)
-    _perform_test(testee, B, A)
+    A = testutil.mkarray((100, 1, 3))
+    B = testutil.mkarray((100, 1, 1))
+    _perform_alu_test(testee, A, B)
+    _perform_alu_test(testee, B, A)
 
 
 def test_alu_binary_broadcast_2():
@@ -176,10 +175,10 @@ def test_alu_binary_broadcast_2():
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
-    A = mkarr((100, 1))
-    B = mkarr((100, 10))
-    _perform_test(testee, A, B)
-    _perform_test(testee, B, A)
+    A = testutil.mkarray((100, 1))
+    B = testutil.mkarray((100, 10))
+    _perform_alu_test(testee, A, B)
+    _perform_alu_test(testee, B, A)
 
 
 def test_alu_binary_broadcast_3():
@@ -188,7 +187,7 @@ def test_alu_binary_broadcast_3():
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
-    A = mkarr((5, 1, 3, 4, 1))
-    B = mkarr((5, 1, 3, 1, 2))
-    _perform_test(testee, A, B)
-    _perform_test(testee, B, A)
+    A = testutil.mkarray((5, 1, 3, 4, 1))
+    B = testutil.mkarray((5, 1, 3, 1, 2))
+    _perform_alu_test(testee, A, B)
+    _perform_alu_test(testee, B, A)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
index 7e6add5..f49efdc 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
@@ -17,6 +17,8 @@
 
 from __future__ import annotations
 
+from typing import TYPE_CHECKING
+
 import jax
 import numpy as np
 import pytest
@@ -24,12 +26,17 @@
 
 import jace
 
+from tests import util as testutil
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
 
-@pytest.fixture(autouse=True)
-def _enable_x64_mode_in_jax():
-    """Ensures that x64 mode in Jax ins enabled."""
-    with jax.experimental.enable_x64():
-        yield
+@pytest.fixture(params=[(10,), (10, 1), (1, 10)])
+def vector_shape(request) -> tuple[int, ...]:
+    """Shapes used in the `test_bid_vector()` tests."""
+    return request.param
 
 
 def test_bid_scalar():
@@ -53,9 +60,22 @@ def test_bid_literal():
     def testee(a: float) -> np.ndarray | jax.Array:
         return jnp.broadcast_to(1.0, (10, 10)) + a
 
-    for a in [1, 1.0, 3.1415]:
-        ref = testee(a)
-        res = jace.jit(testee)(a)
-        assert res.shape == ref.shape
-        assert res.dtype == ref.dtype
-        assert np.all(res == ref)
+    ref = testee(0.0)
+    res = jace.jit(testee)(0.0)
+    assert res.shape == ref.shape
+    assert res.dtype == ref.dtype
+    assert np.all(res == ref)
+
+
+def test_bid_vector(vector_shape: Sequence[int]):
+    """Broadcast a vector to a tensor."""
+
+    def testee(a: np.ndarray) -> np.ndarray | jax.Array:
+        return jnp.broadcast_to(a, (10, 10)) + a
+
+    a = testutil.mkarray(vector_shape)
+    ref = testee(a)
+    res = jace.jit(testee)(a)
+    assert res.shape == ref.shape
+    assert res.dtype == ref.dtype
+    assert np.all(res == ref)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
index 00d5ec1..a85b145 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
@@ -17,7 +17,8 @@
 from jax import numpy as jnp
 
 import jace
-from jace.util import translation_cache as tcache
+
+from tests import util as testutil
 
 
 # fmt: off
@@ -32,20 +33,6 @@
 # fmt: on
 
 
-@pytest.fixture(autouse=True)
-def _clear_translation_cache():
-    """Decorator that clears the translation cache.
-
-    Ensures that a function finds an empty cache and clears up afterwards.
-
-    Todo:
-        Ask Enrique how I can make that fixture apply everywhere not just in the file but the whole test suite.
-    """
-    tcache.clear_translation_cache()
-    yield
-    tcache.clear_translation_cache()
-
-
 @pytest.fixture(params=_DACE_REAL_TYPES)
 def src_type(request) -> type:
     """All valid source types, with the exception of bool."""
@@ -68,10 +55,8 @@ def _convert_element_type_impl(
 ) -> bool:
     """Implementation of the tests of the convert element types primitive."""
     lowering_cnt = [0]
-    A: np.ndarray = np.array(np.random.random((10, 10)), dtype=input_type)  # noqa: NPY002
-    assert A.dtype == input_type
+    A: np.ndarray = testutil.mkarray((10, 10), input_type)
     ref: np.ndarray = np.array(A, copy=True, dtype=output_type)
-    assert ref.dtype == output_type
 
     @jace.jit
     def converter(A: np.ndarray) -> jax.Array:
@@ -101,28 +86,3 @@ def test_convert_element_type_from_bool(src_type):
 @pytest.mark.skip(reason="This test is too long, only do it on certain conditions.")
 def test_convert_element_type_to_bool(dst_type):
     _convert_element_type_impl(dst_type, np.bool_)
-
-
-@pytest.mark.skip(reason="The warning was disabled, so the test is at the moment useless.")
-def test_convert_element_type_useless_cast():
-    """Shows that under some conditions there is really a casting from one type to the same.
-
-    In certain cases, also in some slicing tests, this useless cast is inserted by Jax.
-    This test was originally here to show this. However, that thing got so annoying that it was
-    removed. The test is kept here to serve as some kind of a reference.
-    """
-
-    def testee(a: float) -> np.ndarray:
-        # For it to work we have to use `numpy` instead of the Jax substitute.
-        return np.broadcast_to(1.0, (10, 10)) + a
-
-    with pytest.warns(
-        expected_warning=UserWarning,
-        match=r"convert_element_type\(.*\): is useless, input and output have same type\.",
-    ):
-        res = jace.jit(testee)(1.0)
-
-    ref = testee(1.0)
-    assert res.shape == ref.shape
-    assert res.dtype == ref.dtype
-    assert np.all(res == ref)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_copy.py b/tests/integration_tests/primitive_translators/test_primitive_copy.py
index 7fcdaad..ecbc3c6 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_copy.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_copy.py
@@ -13,14 +13,16 @@
 
 import jace
 
+from tests import util as testutil
+
 
 def test_copy():
     @jace.jit
     def testee(A: np.ndarray) -> jax.Array:
         return jnp.copy(A)
 
-    A = np.random.random((10, 10, 10))  # noqa: NPY002
-    ref = np.copy(A)
+    A = testutil.mkarray((10, 10, 10))
     res = testee(A)
-    assert ref.dtype == res.dtype
-    assert np.all(ref == res)
+    assert A.dtype == res.dtype
+    assert A.shape == res.shape
+    assert np.all(res == A)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_reshape.py b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
index 80b1e8d..7bd142b 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_reshape.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
@@ -18,6 +18,8 @@
 
 import jace
 
+from tests import util as testutil
+
 
 if TYPE_CHECKING:
     from collections.abc import Sequence
@@ -29,7 +31,7 @@ def _test_impl_reshaping(
     order: str = "C",
 ) -> None:
     """Performs a reshaping from `src_shape` to `dst_shape`."""
-    A = np.random.random(src_shape)  # noqa: NPY002
+    A = testutil.mkarray(src_shape)
     A = np.array(A, order=order)  # type: ignore[call-overload]  # MyPy wants a literal as order.
 
     def testee(A: np.ndarray) -> jax.Array:
diff --git a/tests/integration_tests/primitive_translators/test_primitive_select_n.py b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
index 576e53f..c887b23 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_select_n.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
@@ -18,32 +18,12 @@
 
 import jace
 
-
-@pytest.fixture(autouse=True)
-def _disable_jit():
-    """Decorator that ensures that `select_n` is not put in an implicit `jit`.
-
-    The reason we do this is because we can currently not handle this nested jits.
-    It is important that it also disabled explicit usage of `jax.jit`.
-    However, since JaCe does not honor this flag we it does not affect us.
-
-    Todo:
-        Remove as soon as we can handle nested `jit`.
-    """
-    with jax.disable_jit(disable=True):
-        yield
-
-
-@pytest.fixture(autouse=True)
-def _enable_x64_mode_in_jax():
-    """Ensures that x64 mode in Jax ins enabled."""
-    with jax.experimental.enable_x64():
-        yield
+from tests import util as testutil
 
 
 @pytest.fixture()
 def Pred() -> np.ndarray:
-    return np.random.random((10, 10)) > 0.5  # noqa: NPY002
+    return testutil.mkarray((10, 10)) > 0.5
 
 
 @pytest.fixture()
diff --git a/tests/integration_tests/primitive_translators/test_primitive_slicing.py b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
index 75c88a9..dc5f8be 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_slicing.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
@@ -15,30 +15,25 @@
 
 import jace
 
-
-@pytest.fixture(autouse=True)
-def _enable_x64_mode_in_jax():
-    """Ensures that x64 mode in Jax ins enabled."""
-    with jax.experimental.enable_x64():
-        yield
+from tests import util as testutil
 
 
 @pytest.fixture()
 def A_4x4():
-    return np.arange(16).reshape((4, 4))
+    return testutil.mkarray((4, 4))
 
 
 @pytest.fixture()
 def A_4x4x4x4():
-    return np.arange(4**4).reshape((4, 4, 4, 4))
+    return testutil.mkarray((4, 4, 4, 4))
 
 
 @pytest.fixture(
     params=[
         (1, 2, 1, 2),
         (0, 0, 0, 0),
-        (3, 3, 3, 3),  # Will lead to readjustment.
-        (3, 1, 3, 0),  # Will lead to readjustment.
+        (3, 3, 3, 3),  # Will lead to readjustment of the start index.
+        (3, 1, 3, 0),  # Will lead to readjustment of the start index.
     ]
 )
 def full_dynamic_start_idx(request):
diff --git a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
index f76fd3d..bf9e89f 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
@@ -7,8 +7,9 @@
 
 """Implements tests for the squeeze translator.
 
-For several reasons parts of the tests related to broadcasting, especially the ones in which a single dimension is added, are also here.
-This is because of the inverse relationship between `expand_dims` and `squeeze`.
+For several reasons parts of the tests related to broadcasting, especially the ones in which
+a single dimension is added, are also here. This is because of the inverse relationship between
+`expand_dims` and `squeeze`.
 """
 
 from __future__ import annotations
@@ -22,6 +23,8 @@
 
 import jace
 
+from tests import util as testutil
+
 
 if TYPE_CHECKING:
     from collections.abc import Sequence
@@ -39,7 +42,7 @@ def _roundtrip_implementation(
         shape:  Shape of the input array.
         axes:   A series of axis that should be tried.
     """
-    A = np.random.random(shape)  # noqa: NPY002
+    A = testutil.mkarray(shape)
     A_org = A.copy()
 
     for ops in [jnp.expand_dims, jnp.squeeze]:
diff --git a/tests/integration_tests/test_empty_jaxpr.py b/tests/integration_tests/test_empty_jaxpr.py
index 18308f5..8dfc495 100644
--- a/tests/integration_tests/test_empty_jaxpr.py
+++ b/tests/integration_tests/test_empty_jaxpr.py
@@ -43,9 +43,42 @@ def testee(A: float) -> float:
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_empty_nested():
     @jace.jit
-    def testee3(A: float) -> float:
+    def testee(A: float) -> float:
         return jax.jit(lambda A: A)(A)
 
     A = np.pi
 
-    assert np.all(testee3(A) == A)
+    assert np.all(testee(A) == A)
+
+
+def test_empty_with_drop_vars():
+    """Tests if we can handle an empty input = output case, with present drop variables."""
+
+    @jace.jit
+    @jace.grad
+    def testee(A: float) -> float:
+        return A * A
+
+    A = np.pi
+
+    assert np.all(testee(A) == 2.0 * A)
+
+
+@pytest.mark.skip(reason="Literal return value is not implemented.")
+def test_empty_literal_return():
+    """Tests if we can handle a literal return value.
+
+    Note:
+        Using this test function serves another purpose. Since Jax includes the original
+        computation in the Jaxpr coming from a `grad` annotated function, the result will have
+        only drop variables.
+    """
+
+    @jace.jit
+    @jace.grad
+    def testee(A: float) -> float:
+        return A + A + A
+
+    A = np.e
+
+    assert np.all(testee(A) == 3.0)
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 30fad6d..09ba0b7 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -20,6 +20,8 @@
 from jace import translator, util
 from jace.util import JaCeVar
 
+from tests import util as testutil
+
 
 # These are some JaCe variables that we use inside the tests
 #  Unnamed arrays
@@ -93,7 +95,8 @@ def test_builder_variable_alloc_mixed_naming(
 ) -> None:
     """Tests the naming in a mixed setting.
 
-    If `update_var_mapping=True` is given, then the naming will skip variables, see also `test_builder_variable_alloc_mixed_naming2()`.
+    If `update_var_mapping=True` is given, then the naming will skip variables,
+    see also `test_builder_variable_alloc_mixed_naming2()`.
     """
     #                        *       b       c       d      *      f      g
     for i, var in enumerate([narray, array1, array2, scal1, nscal, scal2, scal3]):
@@ -113,8 +116,8 @@ def test_builder_variable_alloc_mixed_naming2(
 ) -> None:
     """Tests the naming in a mixed setting.
 
-    This time we do not use `update_var_mapping=True`, instead it now depends on the name.
-    This means that automatic naming will now again include all, letters, but not in a linear order.
+    This time we do not use `update_var_mapping=True`, instead it now depends on the name. This
+    means that automatic naming will now again include all, letters, but not in a linear order.
     """
     letoff = 0
     #             *      a        b       c      *      d     e
@@ -272,7 +275,8 @@ def test_builder_append_state(translation_builder: translator.JaxprTranslationBu
     assert next(iter(sdfg.edges())).src is sdfg.start_block
     assert next(iter(sdfg.edges())).dst is terminal_state_1
 
-    # Specifying an explicit append state that is the terminal should also update the terminal state of the builder.
+    # Specifying an explicit append state that is the terminal should also update the terminal
+    #  state of the builder.
     terminal_state_2: dace.SDFGState = translation_builder.append_new_state(
         "terminal_state_2", prev_state=terminal_state_1
     )
@@ -511,7 +515,7 @@ def wrapped(A: float) -> float:
         lower_cnt[0] += 1
         return scalar_ops(A)
 
-    vals = np.random.random(100)  # noqa: NPY002
+    vals = testutil.mkarray(100)
     for i in range(vals.size):
         res = wrapped(vals[i])
         ref = scalar_ops(vals[i])
diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index b804fd7..92db164 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -25,14 +25,6 @@
 )
 
 
-@pytest.fixture(autouse=True)
-def _conserve_builtin_translators():
-    """Restores the set of registered subtranslators after a test."""
-    initial_translators = get_regsitered_primitive_translators()
-    yield
-    set_active_primitive_translators_to(initial_translators)
-
-
 @pytest.fixture()
 def no_builtin_translators():  # noqa: PT004  # This is how you should do it: https://docs.pytest.org/en/7.1.x/how-to/fixtures.html#use-fixtures-in-classes-and-modules-with-usefixtures
     """This fixture can be used if the test does not want any builtin translators."""
@@ -41,6 +33,17 @@ def no_builtin_translators():  # noqa: PT004  # This is how you should do it: ht
     translator.set_active_primitive_translators_to(initial_translators)
 
 
+@pytest.fixture(autouse=True)
+def _conserve_builtin_translators():
+    """Restores the state of the global registry.
+
+    Needed to revert the modifications some tests do to the global registry state.
+    """
+    initial_translators = get_regsitered_primitive_translators()
+    yield
+    set_active_primitive_translators_to(initial_translators)
+
+
 # These are definitions of some Subtranslators that can be used to test things.
 class SubTrans1(translator.PrimitiveTranslator):
     @property
@@ -196,7 +199,7 @@ def still_useless_but_a_bit_less(*args: Any, **kwargs: Any) -> None:  # noqa: AR
         return
 
     @jace.jit
-    def foo(A):
+    def foo(A: int) -> int:
         B = A + 1
         C = B + 1
         D = C + 1
@@ -214,7 +217,7 @@ def test_subtranslatior_managing_decoupling():
 
     # This will use the translators that are currently installed.
     @jace.jit
-    def foo(A):
+    def foo(A: int) -> int:
         B = A + 1
         C = B + 1
         D = C + 1
@@ -225,6 +228,8 @@ def foo(A):
     def useless_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
         raise NotImplementedError("The 'useless_add_translator' was called as expected.")
 
+    assert get_regsitered_primitive_translators()["add"] is useless_add_translator
+
     # Since `foo` was already constructed, a new registering can not change anything.
     A = np.zeros((10, 10))
     assert np.all(foo(A) == 4)
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index 283adec..f593ae4 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -12,27 +12,19 @@
 
 import itertools as it
 import re
+from typing import TYPE_CHECKING
 
 import numpy as np
 import pytest
 
 import jace
 from jace import optimization, stages
-from jace.util import translation_cache as tcache
 
+from tests import util as testutil
 
-@pytest.fixture(autouse=True)
-def _clear_translation_cache():
-    """Decorator that clears the translation cache.
 
-    Ensures that a function finds an empty cache and clears up afterwards.
-
-    Todo:
-        Ask Enrique how I can make that fixture apply everywhere not just in the file but the whole test suite.
-    """
-    tcache.clear_translation_cache()
-    yield
-    tcache.clear_translation_cache()
+if TYPE_CHECKING:
+    from jace.util import translation_cache as tcache
 
 
 def test_caching_same_sizes() -> None:
@@ -52,8 +44,8 @@ def wrapped(A, B):
         return testee(A, B)
 
     # First batch of arguments.
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
+    A = testutil.mkarray((4, 3))
+    B = testutil.mkarray((4, 3))
 
     # The second batch of argument, it is the same size (structurally) but different values.
     AA = A + 1.0362
@@ -91,12 +83,12 @@ def wrapped(A, B):
         return A * B
 
     # First size of arguments
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
+    A = testutil.mkarray((4, 3))
+    B = testutil.mkarray((4, 3))
 
     # Second size of arguments
-    C = np.arange(16, dtype=np.float64).reshape((4, 4))
-    D = np.full((4, 4), 10, dtype=np.float64)
+    C = testutil.mkarray((4, 4))
+    D = testutil.mkarray((4, 4))
 
     # Now lower the function once for each.
     lowered1 = wrapped.lower(A, B)
@@ -126,10 +118,10 @@ def wrapped(A, B):
         lowering_cnt[0] += 1
         return A * 4.0, B + 2.0
 
-    A = np.full((4, 30), 10, dtype=np.float64)
-    B = np.full((4, 3), 10, dtype=np.float64)
-    C = np.full((5, 3), 14, dtype=np.float64)
-    D = np.full((6, 3), 14, dtype=np.int64)
+    A = testutil.mkarray((4, 30), dtype=np.float64)
+    B = testutil.mkarray((4, 3), dtype=np.float64)
+    C = testutil.mkarray((4, 3), dtype=np.int64)
+    D = testutil.mkarray((6, 3), dtype=np.int64)
 
     # These are the known lowerings.
     lowerings: dict[tuple[int, int], stages.JaCeLowered] = {}
@@ -163,7 +155,10 @@ def wrapped(A, B):
 
 
 def test_caching_compilation() -> None:
-    """Tests the compilation cache, this is just very simple, since it uses the same code paths as lowering."""
+    """Tests the compilation cache.
+
+    The actual implementation is simple, because it uses the same code paths as lowering.
+    """
 
     @jace.jit
     def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
@@ -173,8 +168,8 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B + C + D + E
 
     # These are the argument
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
+    A = testutil.mkarray((4, 3))
+    B = testutil.mkarray((4, 3))
 
     # Now we lower it.
     jaceLowered = jaceWrapped.lower(A, B)
@@ -212,12 +207,14 @@ def testee(A: np.ndarray) -> np.ndarray:
     shape = (10, 10)
 
     for i, dtype in enumerate(dtypes):
-        A = np.array((np.random.random(shape) - 0.5) * 10, dtype=dtype)  # noqa: NPY002
+        A = testutil.mkarray(shape, dtype=dtype)
 
+        # First lowering
         assert lowering_cnt[0] == i
         _ = testee(A)
         assert lowering_cnt[0] == i + 1
 
+        # Second, implicit, lowering, which must be cached.
         assert np.allclose(testee(A), 2 * A)
         assert lowering_cnt[0] == i + 1
 
@@ -272,7 +269,7 @@ def testee(A: np.ndarray) -> np.ndarray:
     assert cache.front()[0] == first_key
 
 
-def test_caching_eviction_complex():
+def test_caching_eviction_complex() -> None:
     """Tests if the stuff is properly evicted if the cache is full."""
 
     @jace.jit
@@ -328,7 +325,7 @@ def wrapped(A: np.ndarray) -> np.ndarray:
 
     shape = (10, 100, 1000)
     C = np.array(
-        (np.random.random(shape) - 0.5) * 10,  # noqa: NPY002
+        (testutil.mkarray(shape) - 0.5) * 10,
         order="C",
         dtype=np.float64,
     )
diff --git a/tests/unit_tests/test_decorator.py b/tests/unit_tests/test_decorator.py
index 812ba60..0cffc34 100644
--- a/tests/unit_tests/test_decorator.py
+++ b/tests/unit_tests/test_decorator.py
@@ -13,25 +13,10 @@
 from __future__ import annotations
 
 import numpy as np
-import pytest
 
 import jace
 
-
-@pytest.fixture(autouse=True)
-def _clear_translation_cache():
-    """Decorator that clears the translation cache.
-
-    Ensures that a function finds an empty cache and clears up afterwards.
-
-    Todo:
-        Should be used _everywhere_.
-    """
-    from jace.util import translation_cache as tcache
-
-    tcache.clear_translation_cache()
-    yield
-    tcache.clear_translation_cache()
+from tests import util as testutil
 
 
 def test_decorator_individually():
@@ -47,8 +32,8 @@ def testee(A, B):
         lowering_cnt[0] += 1
         return testee_(A, B)
 
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
+    A = testutil.mkarray((4, 3))
+    B = testutil.mkarray((4, 3))
 
     lowered = testee.lower(A, B)
     compiled = lowered.compile()
@@ -73,8 +58,8 @@ def testee(A, B):
         lowering_cnt[0] += 1
         return testee_(A, B)
 
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
+    A = testutil.mkarray((4, 3))
+    B = testutil.mkarray((4, 3))
 
     ref = testee_(A, B)
     res = testee(A, B)
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index f6c89df..e2f42e2 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -17,8 +17,7 @@
 import jace
 from jace import util as jutil
 
-
-np.random.seed(42)  # noqa: NPY002  # random generator
+from tests import util as testutil
 
 
 def test_jit():
@@ -27,8 +26,8 @@ def test_jit():
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.full((4, 3), 10, dtype=np.float64)
+    A = testutil.mkarray((4, 3))
+    B = testutil.mkarray((4, 3))
 
     jax_testee = jax.jit(testee)
     jace_testee = jace.jit(testee)
@@ -95,7 +94,7 @@ def jace_fun(A, B, C):
     def jax_fun(A, B, C):
         return jace.jit(base_fun)(A, B, C)
 
-    A, B, C = (np.random.random((10, 3, 50)) for _ in range(3))  # noqa: NPY002  # random generator
+    A, B, C = (testutil.mkarray((10, 3, 50)) for _ in range(3))
 
     assert np.allclose(jace_fun(A, B, C), jax_fun(A, B, C))
 
@@ -128,7 +127,7 @@ def f3_jace(A, B, C, D):
 
     assert jutil.is_jaceified(f3_jace)
 
-    A, B, C, D = (np.random.random((10, 3, 50)) for _ in range(4))  # noqa: NPY002  # random generator
+    A, B, C, D = (testutil.mkarray((10, 3, 50)) for _ in range(4))
 
     ref = ((A + B) - C) * D
 
@@ -154,7 +153,7 @@ def jace_ddf(x):
         return jace.grad(jace.grad(f))(x)
 
     # These are the random numbers where we test
-    Xs = (np.random.random(10) - 0.5) * 10  # noqa: NPY002  # Random number generator
+    Xs = (testutil.mkarray(10) - 0.5) * 10
 
     for i in range(Xs.shape[0]):
         x = Xs[i]
@@ -198,7 +197,7 @@ def test_disabled_x64():
     def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
         return A + B
 
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    A = testutil.mkarray((4, 3))
     B = np.float64(10.0)
 
     # Run them with disabled x64 support
diff --git a/tests/unit_tests/test_misc.py b/tests/unit_tests/test_misc.py
index 8870674..6c30783 100644
--- a/tests/unit_tests/test_misc.py
+++ b/tests/unit_tests/test_misc.py
@@ -14,14 +14,16 @@
 
 import jace
 
+from tests import util as testutil
+
 
 @pytest.mark.skip("Possible bug in DaCe.")
 def test_mismatch_in_datatyte_calling():
     """Tests compilation and calling with different types.
 
-    Note that this more or less tests the calling implementation of the `CompiledSDFG` class in DaCe.
-    As I understand the `CompiledSDFG::_construct_args()` function this should be detected.
-    However, as evidently it does not do this.
+    Note that this more or less a test for the calling implementation of the `CompiledSDFG`
+    class in DaCe. As I understand the `CompiledSDFG::_construct_args()` function this should be
+    detected. However, as evidently it does not do this.
     """
 
     @jace.jit
@@ -29,8 +31,8 @@ def testee(A: np.ndarray) -> np.ndarray:
         return -A
 
     # Different types.
-    A1 = np.arange(12, dtype=np.float32).reshape((4, 3))
-    A2 = np.arange(12, dtype=np.int64).reshape((4, 3))
+    A1 = testutil.mkarray((4, 3), dtype=np.float32)
+    A2 = testutil.mkarray((4, 3), dtype=np.int64)
 
     # Lower and compilation for first type
     callee = testee.lower(A1).compile()
diff --git a/tests/util.py b/tests/util.py
new file mode 100644
index 0000000..4069958
--- /dev/null
+++ b/tests/util.py
@@ -0,0 +1,42 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Utility functions for the testing infrastructure."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import numpy as np
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+
+__all__ = [
+    "mkarray",
+]
+
+
+def mkarray(
+    shape: Sequence[int] | int,
+    dtype: type = np.float64,
+) -> np.ndarray:
+    """Generates a NumPy ndarray with shape `shape`.
+
+    The function uses the generator that is managed by the `_reset_random_seed()` fixture.
+    Thus inside a function the value will be deterministic.
+
+    Args:
+        shape:      The shape to use.
+        dtype:      The data type to use.
+    """
+    if isinstance(shape, int):
+        shape = (shape,)
+    assert shape
+    return np.array(np.random.random(shape), dtype=dtype)  # noqa: NPY002

From 555e815ddef2e840e956215b145356f793416204 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 31 May 2024 13:38:03 +0200
Subject: [PATCH 282/458] Screened some primitive translators.

---
 .../primitive_translators/alu_translators.py  |  2 +-
 .../broadcast_in_dim_translator.py            |  2 --
 .../convert_element_type_translator.py        | 16 ++++-----
 .../primitive_translators/copy_translator.py  |  4 ---
 .../primitive_translators/iota_translator.py  |  2 --
 .../reshape_translator.py                     |  2 --
 .../select_n_translator.py                    |  2 --
 .../primitive_translators/slicing.py          | 33 ++++++++-----------
 .../squeeze_translator.py                     |  2 --
 9 files changed, 20 insertions(+), 45 deletions(-)

diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index a6d8bcc..95d7f36 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -30,7 +30,7 @@ class ALUTranslator(mapped_base.MappedOperationTranslatorBase):
     Its `write_tasklet_code()` function will perform replace all literals.
     """
 
-    __slots__ = "_tskl_tmpl"
+    __slots__ = ("_tskl_tmpl",)
 
     def __init__(
         self,
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
index a42c61a..bd5e587 100644
--- a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -27,8 +27,6 @@
 class BroadcastInDimTranslator(mapped_base.MappedOperationTranslatorBase):
     """This handles the `broadcast_in_dim` primitives."""
 
-    __slots__ = ()
-
     def __init__(self) -> None:
         super().__init__(primitive_name="broadcast_in_dim")
 
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index 7d006e0..5228f17 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -39,8 +39,6 @@ class ConvertElementTypeTranslator(mapped_base.MappedOperationTranslatorBase):
             handled by a Memlet.
     """
 
-    __slots__ = ()
-
     def __init__(self) -> None:
         super().__init__(primitive_name="convert_element_type")
 
@@ -66,18 +64,16 @@ def write_tasklet_code(
 
         # Handle special cases
         if in_dtype == out_dtype:
-            # This happens and previously there was a warning here, but that thing got so annoying
-            #  We handle it explicitly because otherwise, DaCe could not remove the Tasklet.
-            #  inside the tests that it was removed, see the `tests/test_sub_translators_convert_element_type.py::test_convert_element_type_useless_cast`
-            #  for more.
+            # This happens and previously there was a warning here, but that thing has become
+            #  so annoying, that it was removed. However, we still handle the case explicitly to
+            #  guarantee that the Tasklet is trivial.
             # TODO(phimuell): Make this into a pure Memlet.
             return f"__out = {conv_code}"
-        if in_dtype_s.startswith("bool") and out_dtype_s.startswith("int"):
-            # Interestingly `__out = int(__in0)` will at some DaCe processing stage.
+        if in_dtype_s.startswith("bool"):
+            # Interestingly `__out = int(__in0)` will not work at some DaCe processing stage.
             #  See commit `f5aabc` of the prototype.
-            return f"__out = (1 if {conv_code} else 0)"
+            conv_code = f"(1 if {conv_code} else 0)"
 
-        # The general case
         if out_dtype_s == "bool":
             conv_code = f"dace.bool_({conv_code})"
         elif hasattr(dace.dtypes, out_dtype_s):
diff --git a/src/jace/translator/primitive_translators/copy_translator.py b/src/jace/translator/primitive_translators/copy_translator.py
index 466016a..69dc923 100644
--- a/src/jace/translator/primitive_translators/copy_translator.py
+++ b/src/jace/translator/primitive_translators/copy_translator.py
@@ -26,8 +26,6 @@
 class CopyTranslator(mapped_base.MappedOperationTranslatorBase):
     """Copy operations are implemented as a map to ensure that they can be fused with other maps."""
 
-    __slots__ = ()
-
     def __init__(self) -> None:
         super().__init__(primitive_name="copy")
 
@@ -53,8 +51,6 @@ class DevicePutTranslator(mapped_base.MappedOperationTranslatorBase):
         - Make into a Memlet because only the Memlet can handle copying between devices.
     """
 
-    __slots__ = ()
-
     def __init__(self) -> None:
         super().__init__(primitive_name="device_put")
 
diff --git a/src/jace/translator/primitive_translators/iota_translator.py b/src/jace/translator/primitive_translators/iota_translator.py
index ef2ced6..b664f53 100644
--- a/src/jace/translator/primitive_translators/iota_translator.py
+++ b/src/jace/translator/primitive_translators/iota_translator.py
@@ -30,8 +30,6 @@ class IotaTranslator(mapped_base.MappedOperationTranslatorBase):
     Essentially a very general `jnp.arange()` function.
     """
 
-    __slots__ = ()
-
     def __init__(self) -> None:
         super().__init__(primitive_name="iota")
 
diff --git a/src/jace/translator/primitive_translators/reshape_translator.py b/src/jace/translator/primitive_translators/reshape_translator.py
index cf9c35f..87d90c1 100644
--- a/src/jace/translator/primitive_translators/reshape_translator.py
+++ b/src/jace/translator/primitive_translators/reshape_translator.py
@@ -29,8 +29,6 @@ class ReshapeTranslator(translator.PrimitiveTranslator):
         - Find a way to make it as a Map.
     """
 
-    __slots__ = ()
-
     @property
     def primitive(self) -> str:
         return "reshape"
diff --git a/src/jace/translator/primitive_translators/select_n_translator.py b/src/jace/translator/primitive_translators/select_n_translator.py
index 00447f4..2057b83 100644
--- a/src/jace/translator/primitive_translators/select_n_translator.py
+++ b/src/jace/translator/primitive_translators/select_n_translator.py
@@ -39,8 +39,6 @@ class SelectNTranslator(mapped_base.MappedOperationTranslatorBase):
         `__in{i}`, starting with zero.
     """
 
-    __slots__ = ()
-
     def __init__(self) -> None:
         super().__init__(primitive_name="select_n")
 
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index c876de3..dc54e35 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -31,8 +31,6 @@ class SlicingTranslator(mapped_base.MappedOperationTranslatorBase):
     Note that there is also `dynamic_slice`.
     """
 
-    __slots__ = ()
-
     def __init__(self) -> None:
         super().__init__(primitive_name="slice")
 
@@ -73,15 +71,13 @@ class DynamicSlicingTranslator(translator.PrimitiveTranslator):
 
     The [dynamic slicing](https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.dynamic_slice.html)
     performs a slicing of a _fixed_ window, however, the starting indexes are not fix, but are
-    variables that can come from the outside.
-    For this it uses symbols that, but since it uses the "Dynamic Map Ranges" no additional state
-    is needed.
+    variables that can come from the outside. Thus, the translator uses "Dynamic Map Ranges".
+    Furthermore, Jax guarantees that if the window overruns the start indexes are adjusted.
 
-    Unlike the normal slicing primitive, it is not derived from `MappedOperationTranslatorBase`.
+    Note:
+        Unlike the normal slicing primitive, it is not derived from `MappedOperationTranslatorBase`.
     """
 
-    __slots__ = ()
-
     @property
     def primitive(self) -> str:
         return "dynamic_slice"
@@ -102,20 +98,19 @@ def __call__(
         window_sizes: Sequence[int] = eqn.params["slice_sizes"]
 
         # The first input to the primitive is the array we slice from, the others are the start
-        #  indices of the slice window, each is a scalar, maybe literals, we might adapt them later.
+        #  indices of the slice window, each is a scalar, maybe literals.
         in_var_name: str = in_var_names[0]
         start_indices: list[str | None] = list(in_var_names[1:])
 
         # For storing the adapted start index, we have to create access nodes, to store them.
-        #  However, to ensure a total order of execution, once we added them as dynamic map ranges
-        #  to the map, we must use the same access nodes.
+        #  To ensure a total order of execution we have to use the same access nodes that are
+        #  used to store the adjusted start index and to feed them into the map.
         in_access: dict[str, dace.nodes.AccessNode] = {}
 
         # Jax will adjust the start indexes if the window will overrun.
         #  The adjustment is based on the formula $min(s + w, N) - w$, where $s$ is the start
-        #  index, $w$ the window size and $N$ the length in a particular dimension.
+        #  index, $w$ the window size and $N$ the length of a particular dimension.
         #  To do it we will use Tasklets, because otherwise we can not merge the state.
-        # TODO(phimuell): Make the Tasklet mapped, that they can be merged.
         for dim, (start_index, dim_size, wsize) in enumerate(
             zip(start_indices, util.get_jax_var_shape(eqn.invars[0]), window_sizes)
         ):
@@ -129,7 +124,7 @@ def __call__(
                 code=f"adjusted_start_idx = min(unadjusted_start_idx + {wsize}, {dim_size}) - {wsize}",
             )
 
-            # Intermediate value for the adjusted start index.
+            # Intermediate value to storing the adjusted start index.
             new_start_idx_var_name = builder.add_array(
                 eqn.invars[dim + 1],
                 name_prefix=f"__jace_adapted_start_idx_{start_index}",
@@ -151,8 +146,6 @@ def __call__(
                 None,
                 dace.Memlet.simple(new_start_idx_var_name, "0"),
             )
-
-            # Now store the result
             start_indices[dim] = new_start_idx_var_name
             in_access[new_start_idx_var_name] = new_start_idx_acc
 
@@ -162,14 +155,14 @@ def __call__(
 
         # We use dynamic map ranges, thus the map entry has input connectors, that does not start
         #  with `IN_*`, instead the connector name defines a symbol within the map scope. This
-        #  `dict` maps the symbol name to the name of the input variable, that defines the symbol.
-        #  If the input is a literal, than it has no correspondence and the constant is substituted.
+        #  `dict` maps the symbol name to the name of the input variable, that has the value of the
+        #  symbol. Literal substitution is done later.
         dynamic_map_ranges: dict[str, str] = {}
         memlet_accesses: list[str] = []
 
-        for i, ((it_var, _), start_index) in enumerate(zip(tskl_ranges, start_indices)):
+        for i, ((it_var, _), start_index) in enumerate(zip(tskl_ranges, start_indices), 1):
             if start_index is None:
-                offset = str(util.get_jax_literal_value(eqn.invars[i + 1]))
+                offset = str(util.get_jax_literal_value(eqn.invars[i]))
             else:
                 # Because of [issue 1579](https://github.com/spcl/dace/issues/1579) we have to use
                 #  the same name as the data container for the symbol and can not mangle it.
diff --git a/src/jace/translator/primitive_translators/squeeze_translator.py b/src/jace/translator/primitive_translators/squeeze_translator.py
index 2b1e6a1..a5a44a6 100644
--- a/src/jace/translator/primitive_translators/squeeze_translator.py
+++ b/src/jace/translator/primitive_translators/squeeze_translator.py
@@ -29,8 +29,6 @@ class SqueezeTranslator(mapped_base.MappedOperationTranslatorBase):
     Essentially equivalent to `np.squeeze` and the inverse to `np.expand_dims()`.
     """
 
-    __slots__ = ()
-
     def __init__(self) -> None:
         super().__init__(primitive_name="squeeze")
 

From fc911560dbb7d783740c4548257840826ed7ebf5 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 31 May 2024 14:56:24 +0200
Subject: [PATCH 283/458] Added more stuff to the ALU translator and discovered
 something about logical operations in Jax.

Long story short, Jax only knows about bitwise operations, which was not handled correctly before.
See the note in the ALU file but also in the convert element code.
---
 .../primitive_translators/alu_translators.py  | 59 ++++++++++++++-----
 .../convert_element_type_translator.py        | 21 +++++--
 .../test_primitive_translator_managing.py     |  2 +-
 3 files changed, 61 insertions(+), 21 deletions(-)

diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index 95d7f36..c64665f 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -63,28 +63,47 @@ def write_tasklet_code(
 # Contains all the templates for ALU operations.
 #  TODO(phimuell): Import them also from `frontend/python/replacements.py`, however, the names
 #   do not fully matches the Jax names, `grep -P '^[a-zA-Z0-9_]+_p[[:space:]]+' -r -o -h | sort -u`
+# NOTES:
+#   - Jax does not seem to have a mod, `%? , operation, instead a nested computation is done.
+#   - Jax has multiple shift operations, only one is implemented.
+#   - The logical operations, i.e. `and`, `xor`, `or` and `not` are bitwise, in Jax.
 # fmt: off
 _ALU_OPS_TMPL: Final[dict[str, str]] = {
     # Unary operations
     "pos": "__out = +(__in0)",
     "neg": "__out = -(__in0)",
-    "not": "__out = not (__in0)",
+
     "floor": "__out = floor(__in0)",
     "ceil": "__out = ceil(__in0)",
     "round": "__out = round(__in0)",
+
     "abs": "__out = abs(__in0)",
     "sign": "__out = sign(__in0)",
-    "sqrt": "__out = sqrt(__in0)",
-    "log": "__out = log(__in0)",
     "exp": "__out = exp(__in0)",
+    "exp2": "__out = exp2(__in0)",
+    "expm1": "__out = expm1(__in0)",
+    "log": "__out = log(__in0)",
+    "log1p": "__out = log1p(__in0)",
+    "conj": "__out = conj(__in0)",
+    "sqrt": "__out = sqrt(__in0)",
+    "cbrt": "__out = cbrt(__in0)",
+
     "integer_pow": "__out = (__in0)**({y})",  # 'y' is a parameter of the primitive
+    "is_finite": "__out = isfinite(__in0)",
+
     "sin": "__out = sin(__in0)",
     "asin": "__out = asin(__in0)",
     "cos": "__out = cos(__in0)",
     "acos": "__out = acos(__in0)",
     "tan": "__out = tan(__in0)",
     "atan": "__out = atan(__in0)",
+
+    "sinh": "__out = sinh(__in0)",
+    "asinh": "__out = asinh(__in0)",
+    "cosh": "__out = cosh(__in0)",
+    "acosh": "__out = acosh(__in0)",
     "tanh": "__out = tanh(__in0)",
+    "atanh": "__out = atanh(__in0)",
 
     # Binary operations
     "add": "__out = (__in0)+(__in1)",
@@ -93,18 +112,30 @@ def write_tasklet_code(
     "mul": "__out = (__in0)*(__in1)",
     "div": "__out = (__in0)/(__in1)",
     "rem": "__out = (__in0)%(__in1)",
-    "and": "__out = (__in0) and (__in1)",
-    "or": "__out = (__in0) or  (__in1)",
     "pow": "__out = (__in0)**(__in1)",
-    "ipow": "__out = (__in0)**(int(__in1))",
-    "min": "__out = min(__in0, __in1)",
-    "max": "__out = max(__in0, __in1)",
-    "eq": "__out = __in0 == __in1",
-    "ne": "__out = __in0 != __in1",
-    "ge": "__out = __in0 >= __in1",
-    "gt": "__out = __in0 > __in1",
-    "le": "__out = __in0 <= __in1",
-    "lt": "__out = __in0 < __in1",
+    "min": "__out = min((__in0), (__in1))",
+    "max": "__out = max((__in0), (__in1))",
+
+    "eq": "__out = (__in0) == (__in1)",
+    "ne": "__out = (__in0) != (__in1)",
+    "ge": "__out = (__in0) >= (__in1)",
+    "gt": "__out = (__in0) > (__in1)",
+    "le": "__out = (__in0) <= (__in1)",
+    "lt": "__out = (__in0) < (__in1)",
+
+    "atan2": "__out = atan2((__in0), (__in1))",
+
+    "left_shift": "__out = (__in0) << (__in1)",
+    "right_shift": "__out = (__in0) >> (__in1)",
+    "nextafter": "__out = nextafter((__in0), (__in1))",
+
+    # Logical operations
+    #  Note in Jax all logical operations are bitwise; for "logical" operations they are first
+    #  turned into "bools" by `ne a 0`.
+    "or": "__out = (__in0) | (__in1)",
+    "not": "__out = ~(__in0)",
+    "and": "__out = (__in0) & (__in1)",
+    "xor": "__out = (__in0) ^ (__in1)",
 }
 
 # Create the ALU translators
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index 5228f17..16e5e78 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -63,15 +63,24 @@ def write_tasklet_code(
         conv_code = "__in0"
 
         # Handle special cases
+        if in_dtype_s.startswith("bool") and in_dtype == out_dtype:
+            #  Second and more importantly, in Jax the casting from bool to bool has a special
+            #  meaning, because in Jax all logical operations are bitwise. If a logical operation
+            #  is used, then Jax first makes it a bool by running `a != 0`.
+            #  Jax does this to ensure that it has either `0` or a `1`, I assume that is because
+            #  XLA does not have a native bool, similar as C.
+            #  However, in C++, that has a native bool, this operation is kind of useless.
+            #  But we keep it as special case to serve as a documentation.
+            return f"__out = {conv_code}"
         if in_dtype == out_dtype:
-            # This happens and previously there was a warning here, but that thing has become
-            #  so annoying, that it was removed. However, we still handle the case explicitly to
-            #  guarantee that the Tasklet is trivial.
-            # TODO(phimuell): Make this into a pure Memlet.
+            # For some odd reason, this conversion also happens if with other types as bool,
+            #  see above. For that reason we also keep it as special case.
+            #  In previous versions we generated a warning here, but it had become so annoying
+            #  that it was removed.
             return f"__out = {conv_code}"
+
         if in_dtype_s.startswith("bool"):
-            # Interestingly `__out = int(__in0)` will not work at some DaCe processing stage.
-            #  See commit `f5aabc` of the prototype.
+            # Interestingly `__out = int(__in0)` will not work, see commit `f5aabc` of the prototype.
             conv_code = f"(1 if {conv_code} else 0)"
 
         if out_dtype_s == "bool":
diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index 92db164..ca19631 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -76,7 +76,7 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_regsitered_primitive_translators()) == 47
+    assert len(get_regsitered_primitive_translators()) == 62
 
 
 @pytest.mark.usefixtures("no_builtin_translators")

From 1be3237322af214353db9894e20bd3de242aa1f9 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 31 May 2024 15:26:27 +0200
Subject: [PATCH 284/458] Because of a bug in the `logical_not` implementation
 of teh ALU it does currently does not work.

---
 .../test_primitive_alu.py                     | 34 +++++++++++++++++++
 tests/util.py                                 |  3 ++
 2 files changed, 37 insertions(+)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_alu.py b/tests/integration_tests/primitive_translators/test_primitive_alu.py
index 51e5a3e..774ebe4 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_alu.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_alu.py
@@ -13,10 +13,12 @@
 
 from __future__ import annotations
 
+from collections.abc import Callable
 from typing import TYPE_CHECKING, Any, cast
 
 import jax
 import numpy as np
+import pytest
 from jax import numpy as jnp
 
 import jace
@@ -28,6 +30,26 @@
     from collections.abc import Callable
 
 
+@pytest.fixture(
+    params=[
+        (jnp.logical_and, 2, np.bool_),
+        (jnp.logical_or, 2, np.bool_),
+        (jnp.logical_xor, 2, np.bool_),
+        (jnp.logical_not, 1, np.bool_),
+        (jnp.bitwise_and, 2, np.int64),
+        (jnp.bitwise_or, 2, np.int64),
+        (jnp.bitwise_xor, 2, np.int64),
+        (jnp.bitwise_not, 1, np.int64),
+    ]
+)
+def logical_ops(request) -> tuple[Callable, tuple[np.ndarray, ...]]:
+    """Returns a logical operation function and inputs."""
+    return (
+        request.param[0],
+        tuple(testutil.mkarray((2, 2), request.param[2]) for _ in range(request.param[1])),
+    )
+
+
 def _perform_alu_test(testee: Callable, *args: Any) -> None:
     """General function that just performs the test."""
     wrapped = jace.jit(testee)
@@ -191,3 +213,15 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     B = testutil.mkarray((5, 1, 3, 1, 2))
     _perform_alu_test(testee, A, B)
     _perform_alu_test(testee, B, A)
+
+
+def test_alu_logical_bitwise_operation(
+    logical_ops: tuple[Callable, tuple[np.ndarray, ...]],
+):
+    """Tests if the logical and bitwise operations works as they do in Jax."""
+    inputs: tuple[np.ndarray, ...] = logical_ops[1]
+
+    def testee(*args: np.ndarray) -> np.ndarray:
+        return logical_ops[0](*args)
+
+    _perform_alu_test(testee, *inputs)
diff --git a/tests/util.py b/tests/util.py
index 4069958..6ea3fe2 100644
--- a/tests/util.py
+++ b/tests/util.py
@@ -39,4 +39,7 @@ def mkarray(
     if isinstance(shape, int):
         shape = (shape,)
     assert shape
+
+    if dtype == np.bool_:
+        return mkarray(shape, np.float32) > 0.5
     return np.array(np.random.random(shape), dtype=dtype)  # noqa: NPY002

From 9ab2e9a04b211451b06f89f300b73cf79c6e9d28 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.paul.mueller@bluemain.ch>
Date: Sat, 1 Jun 2024 14:16:06 +0200
Subject: [PATCH 285/458] Fixed a bug in the `select_n` translator.

This translator does some renaming of the connector names, it has to do literal substitution on its own.
---
 .../select_n_translator.py                    | 22 +++++++---
 .../test_primitive_select_n.py                | 42 +++++++++++++------
 tests/util.py                                 |  3 ++
 3 files changed, 49 insertions(+), 18 deletions(-)

diff --git a/src/jace/translator/primitive_translators/select_n_translator.py b/src/jace/translator/primitive_translators/select_n_translator.py
index 2057b83..084ced2 100644
--- a/src/jace/translator/primitive_translators/select_n_translator.py
+++ b/src/jace/translator/primitive_translators/select_n_translator.py
@@ -14,7 +14,7 @@
 import dace
 from typing_extensions import override
 
-from jace import translator
+from jace import translator, util
 from jace.translator import mapped_operation_base_translator as mapped_base
 
 
@@ -50,10 +50,7 @@ def write_tasklet_code(
         eqn: jax_core.JaxprEqn,
     ) -> str:
         """Writes the selection code.
-
-        Literal substitution is deferred to the base.
         """
-
         if len(in_var_names) == 3:
             # This order is correct, since `False` is interpreted as `0`, which means the first
             #  case. DaCe seems to have some problems with bools and integer casting around,
@@ -73,7 +70,6 @@ def make_input_memlets(
         eqn: jax_core.JaxprEqn,
     ) -> dict[str, dace.Memlet]:
         """We have to add the offsets to the Memlet accesses."""
-        assert all(in_var_names)
         return {
             f"__in{i-1}" if i else "__cond": dace.Memlet.simple(
                 in_var_name,
@@ -84,4 +80,20 @@ def make_input_memlets(
         }
 
 
+    def literal_substitution(
+        self,
+        tskl_code: str,
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        """Can not be done by the base because of the renaming.
+        """
+        for i, in_var_name in enumerate(in_var_names[1:]):
+            if in_var_name is not None:
+                continue
+            t_val = util.get_jax_literal_value(eqn.invars[i + 1])
+            tskl_code = tskl_code.replace(f"__in{i}", str(t_val))
+        return tskl_code
+
+
 translator.register_primitive_translator(SelectNTranslator())
diff --git a/tests/integration_tests/primitive_translators/test_primitive_select_n.py b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
index c887b23..98f6777 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_select_n.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
@@ -9,7 +9,7 @@
 
 from __future__ import annotations
 
-from typing import Any
+from typing import Any, Callable
 
 import jax
 import numpy as np
@@ -36,38 +36,54 @@ def fbranch() -> np.ndarray:
     return np.zeros((10, 10))
 
 
-def _perform_test(P: Any, T: Any, F: Any):
-    def testee(P: Any, T: Any, F: Any):
-        return jnp.where(P, T, F)
+def _perform_test(testee: Callable, *args: Any):
 
-    res = testee(P, T, F)
-    ref = jace.jit(testee)(P, T, F)
+    res = testee(*args)
+    ref = jace.jit(testee)(*args)
 
+    assert args[0].shape == res.shape
     assert np.all(res == ref)
 
 
 def test_select_n_where(Pred, tbranch, fbranch):
     """Normal `np.where` test."""
-    _perform_test(Pred, tbranch, fbranch)
+
+    def testee(P: Any, T: Any, F: Any) -> Any:
+        return jnp.where(P, T, F)
+    _perform_test(testee, Pred, tbranch, fbranch)
 
 
 def test_select_n_where_one_literal(Pred, tbranch, fbranch):
-    """`np.where` where one of the input is a literal."""
-    _perform_test(Pred, 2, fbranch)
-    _perform_test(Pred, tbranch, 3)
+    """`np.where` where one of the input is a literal.
+    """
+
+    def testee1(P: Any, F: Any) -> Any:
+        return jnp.where(P, 2, F)
+
+    def testee2(P: Any, T: Any) -> Any:
+        return jnp.where(P, T, 3)
+
+    _perform_test(testee1, Pred, fbranch)
+    _perform_test(testee2, Pred, tbranch)
 
 
 def test_select_n_where_full_literal(Pred):
     """`np.where` where all inputs are literals."""
-    _perform_test(Pred, 8, 9)
+
+    def testee(P: Any) -> Any:
+        return jnp.where(P, 8, 9)
+
+    # If not a scalar, Jax will do broadcasting and no literal substitution is done.
+    Pred = Pred[0, 0]
+    _perform_test(testee, Pred)
 
 
 def test_select_n_many_inputs():
     """Tests the generalized way of using the primitive."""
-    nbcases = 5
+    nbcases = 10
     shape = (10, 10)
     cases = [np.full(shape, i) for i in range(nbcases)]
-    pred = np.arange(cases[0].size).reshape(shape) % 5
+    pred = np.arange(cases[0].size).reshape(shape) % nbcases
 
     def testee(pred: np.ndarray, *cases: np.ndarray) -> jax.Array:
         return jax.lax.select_n(pred, *cases)
diff --git a/tests/util.py b/tests/util.py
index 6ea3fe2..0a438d7 100644
--- a/tests/util.py
+++ b/tests/util.py
@@ -35,6 +35,9 @@ def mkarray(
     Args:
         shape:      The shape to use.
         dtype:      The data type to use.
+
+    Todo:
+        - Also support integers.
     """
     if isinstance(shape, int):
         shape = (shape,)

From e4a099d06c8b12e27c3be03af4202d9ea529960c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.paul.mueller@bluemain.ch>
Date: Sat, 1 Jun 2024 14:33:50 +0200
Subject: [PATCH 286/458] Updated the `mkarray()` function of the tests, it is
 now able to generate integers as well and scalars.

---
 tests/util.py | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/tests/util.py b/tests/util.py
index 0a438d7..c434666 100644
--- a/tests/util.py
+++ b/tests/util.py
@@ -39,10 +39,14 @@ def mkarray(
     Todo:
         - Also support integers.
     """
+
+    if shape == ():
+        return mkarray((1,), dtype)[0]
     if isinstance(shape, int):
         shape = (shape,)
-    assert shape
 
     if dtype == np.bool_:
-        return mkarray(shape, np.float32) > 0.5
+        return np.random.random(shape) > 0.5  # noqa: NPY002
+    if np.issubdtype(dtype, np.integer):
+        return np.random.randint(low=-2**30, high=2**30, size=shape, dtype=dtype)  # noqa: NPY002
     return np.array(np.random.random(shape), dtype=dtype)  # noqa: NPY002

From 8bdea8238850dd7e7d7dee1753a158ed90a039ab Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.paul.mueller@bluemain.ch>
Date: Sat, 1 Jun 2024 14:34:37 +0200
Subject: [PATCH 287/458] Compacted the tests for select.

---
 .../test_primitive_select_n.py                | 61 +++++++------------
 1 file changed, 22 insertions(+), 39 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_select_n.py b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
index 98f6777..ec2285f 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_select_n.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
@@ -21,39 +21,27 @@
 from tests import util as testutil
 
 
-@pytest.fixture()
-def Pred() -> np.ndarray:
-    return testutil.mkarray((10, 10)) > 0.5
-
-
-@pytest.fixture()
-def tbranch() -> np.ndarray:
-    return np.ones((10, 10))
-
-
-@pytest.fixture()
-def fbranch() -> np.ndarray:
-    return np.zeros((10, 10))
-
-
 def _perform_test(testee: Callable, *args: Any):
 
     res = testee(*args)
     ref = jace.jit(testee)(*args)
-
-    assert args[0].shape == res.shape
     assert np.all(res == ref)
 
 
-def test_select_n_where(Pred, tbranch, fbranch):
+def test_select_n_where():
     """Normal `np.where` test."""
 
     def testee(P: Any, T: Any, F: Any) -> Any:
         return jnp.where(P, T, F)
-    _perform_test(testee, Pred, tbranch, fbranch)
+
+    shape = (10, 10)
+    pred = testutil.mkarray(shape, np.bool_)
+    tbranch = testutil.mkarray(shape)
+    fbranch = testutil.mkarray(shape)
+    _perform_test(testee, pred, tbranch, fbranch)
 
 
-def test_select_n_where_one_literal(Pred, tbranch, fbranch):
+def test_select_n_where_literal():
     """`np.where` where one of the input is a literal.
     """
 
@@ -63,32 +51,27 @@ def testee1(P: Any, F: Any) -> Any:
     def testee2(P: Any, T: Any) -> Any:
         return jnp.where(P, T, 3)
 
-    _perform_test(testee1, Pred, fbranch)
-    _perform_test(testee2, Pred, tbranch)
-
-
-def test_select_n_where_full_literal(Pred):
-    """`np.where` where all inputs are literals."""
-
-    def testee(P: Any) -> Any:
+    def testee3(P: Any) -> Any:
         return jnp.where(P, 8, 9)
 
-    # If not a scalar, Jax will do broadcasting and no literal substitution is done.
-    Pred = Pred[0, 0]
-    _perform_test(testee, Pred)
+    shape = ()
+    pred = testutil.mkarray(shape, np.bool_)
+    tbranch = testutil.mkarray(shape, np.int_)
+    fbranch = testutil.mkarray(shape, np.int_)
+
+    _perform_test(testee1, pred, fbranch)
+    _perform_test(testee2, pred, tbranch)
+    _perform_test(testee3, pred)
 
 
 def test_select_n_many_inputs():
     """Tests the generalized way of using the primitive."""
-    nbcases = 10
-    shape = (10, 10)
-    cases = [np.full(shape, i) for i in range(nbcases)]
-    pred = np.arange(cases[0].size).reshape(shape) % nbcases
 
     def testee(pred: np.ndarray, *cases: np.ndarray) -> jax.Array:
         return jax.lax.select_n(pred, *cases)
 
-    ref = testee(pred, *cases)
-    res = jace.jit(testee)(pred, *cases)
-
-    assert np.all(ref == res)
+    nbcases = 10
+    shape = (10, 10)
+    cases = [np.full(shape, i) for i in range(nbcases)]
+    pred = np.arange(cases[0].size).reshape(shape) % nbcases
+    _perform_test(testee, pred, *cases)

From f5eb441ef6f48d2c99fa81e99e662c09ca15b1de Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.paul.mueller@bluemain.ch>
Date: Sat, 1 Jun 2024 14:41:37 +0200
Subject: [PATCH 288/458] Updated the coverage configuration, however, not yet
 tested.

Following the [doc](https://coverage.readthedocs.io/en/7.5.3/config.html#sample-file) there was clearly an error in the configuration of the `exclude_also` definition, should be inside the run section.
However, I also added some stuff that the page recommended.
---
 pyproject.toml | 31 ++++++++++++++++++++++++++-----
 1 file changed, 26 insertions(+), 5 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index 3556e8a..f85e586 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -46,12 +46,33 @@ Changelog = "https://github.com/GridTools/JaCe/releases"
 Discussions = "https://github.com/GridTools/JaCe/discussions"
 Homepage = "https://github.com/GridTools/JaCe"
 
-[tool.coverage]
-report.exclude_also = [
+[tool.coverage.run]
+branch = true
+source = ["jace"]
+
+[tool.coverage.report]
+# Regexes for lines to exclude from consideration
+exclude_also = [
+  # Don't complain about missing debug-only code:
+  'def __repr__',
+
+  # Don't complain about typechecker includes
+  'if typing.TYPE_CHECKING:',
   '\.\.\.',
-  'if typing.TYPE_CHECKING:'
-]
-run.source = ["jace"]
+  '@overload',
+
+  # Don't complain if tests don't hit defensive assertion code:
+  'raise AssertionError',
+  'raise NotImplementedError',
+
+  # Don't complain if non-runnable code isn't run:
+  'if 0:',
+  'if __name__ == .__main__.:',
+
+  # Don't complain about abstract methods, they aren't run:
+  '@(abc\\.)?abstractmethod',
+  '@(abc\\.)?abstract',
+  ]
 
 # -- mypy  --
 [tool.mypy]

From 4179d40175517802b1cf19819e5cfcd7bee397f4 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 2 Jun 2024 09:07:58 +0200
Subject: [PATCH 289/458] Fixed the `TranslatorContext` and
 `TransltedJaxprSDFG`.

I noticed that the previous implementation was not that nice.
However, I realized that composition is not the correct way of doing it, they should, as I did it originally, be fully seperated.
Which is what I will do next.
---
 src/jace/stages.py                            |  2 +
 .../translator/jaxpr_translator_builder.py    | 83 ++++++-------------
 src/jace/translator/post_translation.py       | 68 ++++++++++-----
 src/jace/translator/translated_jaxpr_sdfg.py  | 48 ++++-------
 4 files changed, 90 insertions(+), 111 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index 8941906..a828e4a 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -157,6 +157,8 @@ def lower(
         tsdfg: translator.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
             trans_ctx=trans_ctx,
             fun=self.wrapped_fun,
+            call_args=args,  # Already linearised, since we only accept positional args.
+            intree=None,  # Not yet implemented.
         )
 
         return JaCeLowered(tsdfg)
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 1cc8265..ae7282a 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -460,7 +460,7 @@ def _create_initial_input(
         """
         if not self.is_allocated():
             raise RuntimeError("Builder is not allocated, can not create constants.")
-        assert len(self._ctx.inp_names) == 0
+        assert len(self._ctx.jsdfg.inp_names) == 0
 
         # Handle the initial input arguments
         init_in_var_names: Sequence[str] = self.create_jax_var_list(
@@ -473,7 +473,7 @@ def _create_initial_input(
         self.sdfg.arg_names = []
 
         # The output list is populated by `self._translate_jaxpr_internal()`
-        self._ctx.inp_names = tuple(init_in_var_names)
+        self._ctx.jsdfg.inp_names = tuple(init_in_var_names)
 
         return init_in_var_names
 
@@ -650,7 +650,7 @@ def _translate_jaxpr_internal(
         if nb_translated_eqn == 0:
             out_var_names = self._handle_null_jaxpr(jaxpr)
 
-        self._ctx.out_names = tuple(out_var_names)
+        self._ctx.jsdfg.out_names = tuple(out_var_names)
 
         return cast(TranslationContext, self._clear_translation_ctx())
 
@@ -673,8 +673,8 @@ def _handle_null_jaxpr(
             - Handle the case if if the output is a literal.
         """
         assert self._ctx.terminal_state is self._ctx.start_state
-        assert len(self._ctx.inp_names) > 0
-        assert len(self._ctx.out_names) == 0
+        assert len(self._ctx.jsdfg.inp_names) > 0
+        assert len(self._ctx.jsdfg.out_names) == 0
 
         # There is not output so we do not have to copy anything around.
         if len(jaxpr.out_avals) == 0:
@@ -734,13 +734,13 @@ class TranslationContext:
 
     Essentially it is a `TranslatedJaxprSDFG` object together with some additional meta data,
     that is needed during translation. It is also returned by the `translate_jaxpr()` function.
-    It is important that the SDFG it encapsulates is not directly usable and should be passed
-    to the post processing stage, i.e. `postprocess_jaxpr_sdfg()`, which will turn a context into
-    a `TranslatedJaxprSDFG` object.
+    It is important that the SDFG it encapsulates is not directly usable and must be passed to the
+    `finalize_translation_context()` function, before it can be passed to the optimization stage.
+    However, it is recommended to pass it to the `postprocess_jaxpr_sdfg()` instead.
 
     Attributes:
         jsdfg:          The wrapped `TranslatedJaxprSDFG` object that stores the SDFG under
-            construction. `self` adds access properties to all attributes of the `TranslatedJaxprSDFG`.
+            construction.
         start_state:    The first state in the SDFG state machine.
         terminal_state: The (currently) last state in the state machine.
 
@@ -758,7 +758,14 @@ def __init__(
     ) -> None:
         from jace import translator  # Cyclic import
 
-        self.jsdfg = translator.TranslatedJaxprSDFG(name=name)
+        if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
+            raise ValueError(f"'{name}' is not a valid SDFG name.")
+
+        self.jsdfg = translator.TranslatedJaxprSDFG(
+            sdfg=dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}")),
+            inp_names=(),
+            out_names=(),
+        )
         self.start_state = self.sdfg.add_state(label="initial_state", is_start_block=True)
         self.terminal_state = self.start_state
 
@@ -766,62 +773,24 @@ def __init__(
     def sdfg(self) -> dace.SDFG:
         return self.jsdfg.sdfg
 
-    @property
-    def inp_names(self) -> tuple[str, ...]:
-        return self.jsdfg.inp_names
-
-    @inp_names.setter
-    def inp_names(self, inp_names: tuple[str, ...]) -> None:
-        if len(inp_names) == 0:
-            raise dace.sdfg.InvalidSDFGError(
-                "There are no input arguments.",
-                self.sdfg,
-                self.sdfg.node_id(self.sdfg.start_state),
-            )
-        if any(inp not in self.sdfg.arrays for inp in inp_names):
-            raise dace.sdfg.InvalidSDFGError(
-                f"Expected to find: {(inp for inp in inp_names if inp not in self.sdfg.arrays)}",
-                self.sdfg,
-                self.sdfg.node_id(self.start_state),
-            )
-        self.jsdfg.inp_names = inp_names
-
-    @property
-    def out_names(self) -> tuple[str, ...]:
-        return self.jsdfg.out_names
-
-    @out_names.setter
-    def out_names(self, out_names: tuple[str, ...]) -> None:
-        if len(out_names) == 0:
-            raise dace.sdfg.InvalidSDFGError(
-                "There are no output arguments.",
-                self.sdfg,
-                self.sdfg.node_id(self.start_state),
-            )
-        if any(out not in self.sdfg.arrays for out in out_names):
-            raise dace.sdfg.InvalidSDFGError(
-                f"Expected to find: {(out for out in out_names if out not in self.sdfg.arrays)}",
-                self.sdfg,
-                self.sdfg.node_id(self.start_state),
-            )
-        self.jsdfg.out_names = out_names
-
     def validate(self) -> bool:
         """Validate internal state of `self`.
 
-        This function will not check the embedded SDFG.
+        Note:
+            The it is not possible to call the validation function of the embedded
+            `TranslatedJaxprSDFG` because the SDFG is still under construction`.
         """
-        if self.start_state and (self.start_state is not self.sdfg.start_block):
+        if self.start_state is not self.sdfg.start_block:
             raise dace.sdfg.InvalidSDFGError(
-                f"Expected to find '{self.start_state}' ({self.sdfg.node_id(self.start_state)}),"
-                f" instead found '{self.sdfg.start_block} ({self.sdfg.node_id(self.sdfg.start_block)}).",
+                f"Expected to find '{self.start_state}' as start state,"
+                f" but instead found '{self.sdfg.start_block}'.",
                 self.sdfg,
                 self.sdfg.node_id(self.start_state),
             )
-        if self.start_state and ({self.terminal_state} != set(self.sdfg.sink_nodes())):
+        if {self.terminal_state} != set(self.sdfg.sink_nodes()):
             raise dace.sdfg.InvalidSDFGError(
-                f"Expected to find '{self.terminal_state}' ({self.sdfg.node_id(self.terminal_state)}),"
-                f" instead found '{self.sdfg.sink_nodes()}.",
+                f"Expected to find as terminal state '{self.terminal_state}',"
+                f" but instead found '{self.sdfg.sink_nodes()}'.",
                 self.sdfg,
                 self.sdfg.node_id(self.terminal_state),
             )
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index aa1cc1a..24d90c2 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -15,11 +15,11 @@
 from __future__ import annotations
 
 import copy
-from typing import TYPE_CHECKING
+from typing import TYPE_CHECKING, Any
 
 
 if TYPE_CHECKING:
-    from collections.abc import Callable
+    from collections.abc import Callable, Sequence
 
     from jace import translator
 
@@ -27,50 +27,67 @@
 def postprocess_jaxpr_sdfg(
     trans_ctx: translator.TranslationContext,
     fun: Callable,  # noqa: ARG001  # Currently unused
+    call_args: Sequence[Any],  # noqa: ARG001  # Currently unused
+    intree: None,  # noqa: ARG001  # Currently unused
 ) -> translator.TranslatedJaxprSDFG:
-    """Perform the final post processing steps on the `TranslationContext`.
+    """Perform the final post processing steps on the `TranslationContext` _in place_.
 
-    Returns:
-        The function returns a valid `TranslationContext` that is decoupled from the one
-        that was originally part of `trans_ctx`.
+    The function will perform post processing stages on the context in place.
+    However, the function will return a decoupled `TranslatedJaxprSDFG` object.
 
     Args:
         trans_ctx:  The `TranslationContext` obtained from the `translate_jaxpr()` function.
         fun:        The original function that was translated.
+        call_args:  The linearized input arguments.
+        intree:     The pytree describing the inputs.
 
     Todo:
         - Setting correct input names (layer that does not depend on JAX).
-        - Setting the correct strides & Storage properties.
+        - Setting the correct strides & storage properties.
+        - Fixing the scalar input problem on GPU.
     """
     # Currently we do nothing except finalizing.
     trans_ctx.validate()
-    tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(trans_ctx.jsdfg)
 
-    finalize_jaxpr_sdfg(tsdfg)
+    #
+    # Assume some post processing here.
+    #
 
-    tsdfg.validate()
-    return tsdfg
+    return finalize_translation_context(trans_ctx, validate=True)
 
 
-def finalize_jaxpr_sdfg(
-    tsdfg: translator.TranslatedJaxprSDFG,
-) -> None:
-    """Finalizes the supplied `tsdfg` object in place.
+def finalize_translation_context(
+    trans_ctx: translator.TranslationContext,
+    validate: bool = True,
+) -> translator.TranslatedJaxprSDFG:
+    """Finalizes the supplied translation context `trans_ctx`.
 
-    This function will turn a non finalized, i.e. canonical, SDFG into a finalized one,
-    The function will:
-    - mark all input and output variables, i.e. listed in `tsdfg.{inp, out}_names`, as globals,
-    - set the `arg_names` property of the SDFG,
+    The function will process the SDFG that is encapsulated inside the context, i.e. a canonical
+    one, into a proper SDFG, as it is described in `TranslatedJaxprSDFG`.
+    It is important to realize that this function does not perform any optimization of the
+    underlying SDFG itself, instead it prepares an SDFG such that it can be passed to the
+    optimization pipeline.
+
+    The function will not mutate the passed translation context and the output is always decoupled
+    from its output.
+
+    Args:
+        trans_ctx:      The context that should be finalized.
+        validate:       Call the validate function after the finalizing.
     """
-    if not tsdfg.inp_names:
+    trans_ctx.validate()
+    if not trans_ctx.jsdfg.inp_names:
         raise ValueError("Input names are not specified.")
-    if not tsdfg.out_names:
+    if not trans_ctx.jsdfg.out_names:
         raise ValueError("Output names are not specified.")
 
-    # Canonical SDFGs do not have global memory, so we must transform it
+    # We guarantee decoupling
+    tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(trans_ctx.jsdfg)
+
+    # Make inputs and outputs to globals.
     sdfg_arg_names: list[str] = []
     for glob_name in tsdfg.inp_names + tsdfg.out_names:
-        if glob_name in sdfg_arg_names:  # Donated arguments
+        if glob_name in sdfg_arg_names:
             continue
         tsdfg.sdfg.arrays[glob_name].transient = False
         sdfg_arg_names.append(glob_name)
@@ -78,3 +95,8 @@ def finalize_jaxpr_sdfg(
     # This forces the signature of the SDFG to include all arguments in order they appear.
     #  If an argument is used as input and output then it is only listed as input.
     tsdfg.sdfg.arg_names = sdfg_arg_names
+
+    if validate:
+        tsdfg.validate()
+
+    return tsdfg
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 77c6001..7eac48e 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -7,54 +7,40 @@
 
 from __future__ import annotations
 
-import dace
+import dataclasses
 
-from jace import util
+import dace
 
 
+@dataclasses.dataclass(kw_only=True)
 class TranslatedJaxprSDFG:
-    """Encapsulates the result of a translation run of the `JaxprTranslationBuilder` object.
-
-    The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a `TranslationContext`,
-    that was in turn constructed by `JaxprTranslationBuilder.translate_jaxpr()`, to the
-    `postprocess_jaxpr_sdfg()` function.
-    This class encapsulates a translated SDFG as well as the meta data needed to compile and run it.
+    """Encapsulates the translated SDFG together with the metadata that is needed to run it.
 
     Contrary to the SDFG that is encapsulated inside the `TranslationContext` object, `self`
     carries a proper SDFG, however:
-    - it does not have `__return*` variables, instead all return arguments are passed by arguments,
-    - its `arg_names` is set to  `inp_names + out_names`, but arguments that are input and outputs
+    - It does not have `__return*` variables, instead all return arguments are passed by arguments.
+    - All input arguments are passed through arguments mentioned in `inp_names`, while the outputs
+        are passed through `out_names`.
+    - Only variables listed as in/outputs are non transient.
+    - The order inside `inp_names` and `out_names` is the same as in the translated Jaxpr.
+    - If inputs are also used as outputs they appear in both `inp_names` and `out_names`.
+    - Its `arg_names` is set to  `inp_names + out_names`, but arguments that are input and outputs
         are only listed as inputs.
 
+    The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a `TranslationContext`,
+    that was in turn constructed by `JaxprTranslationBuilder.translate_jaxpr()`, to the
+    `finalize_translation_context()` or preferably to the `postprocess_jaxpr_sdfg()` function.
+
     Attributes:
         sdfg:           The encapsulated SDFG object.
         inp_names:      A list of the SDFG variables that are used as input
         out_names:      A list of the SDFG variables that are used as output.
-
-    The `inp_names` and `out_name` are in the same order as in the original Jaxpr object.
-    It might happen that a name appears in both the `inp_names` and `out_names` lists. This happens
-    if an argument is used both as input and output, and it is not an error. In Jax this is called
-    argument donation.
-
-    Args:
-        name:   The name that should be given to the SDFG, optional.
     """
 
     sdfg: dace.SDFG
     inp_names: tuple[str, ...]
     out_names: tuple[str, ...]
 
-    def __init__(
-        self,
-        name: str | None = None,
-    ) -> None:
-        if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
-            raise ValueError(f"'{name}' is not a valid SDFG name.")
-
-        self.sdfg = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
-        self.inp_names = ()
-        self.out_names = ()
-
     def validate(self) -> bool:
         """Validate the underlying SDFG."""
         if not self.inp_names:
@@ -63,7 +49,7 @@ def validate(self) -> bool:
                 self.sdfg,
                 self.sdfg.node_id(self.sdfg.start_state),
             )
-        if not all(not self.sdfg.arrays[inp].transient for inp in self.inp_names):
+        if any(self.sdfg.arrays[inp].transient for inp in self.inp_names):
             raise dace.sdfg.InvalidSDFGError(
                 f"Found transient inputs: {(inp for inp in self.inp_names if self.sdfg.arrays[inp].transient)}",
                 self.sdfg,
@@ -75,7 +61,7 @@ def validate(self) -> bool:
                 self.sdfg,
                 self.sdfg.node_id(self.sdfg.start_state),
             )
-        if not all(not self.sdfg.arrays[out].transient for out in self.out_names):
+        if any(self.sdfg.arrays[out].transient for out in self.out_names):
             raise dace.sdfg.InvalidSDFGError(
                 f"Found transient outputs: {(out for out in self.out_names if self.sdfg.arrays[out].transient)}",
                 self.sdfg,

From acfcf394089fcf7b32925280db8b653162c09b65 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 2 Jun 2024 09:34:58 +0200
Subject: [PATCH 290/458] Now the translation conext and the translated sdfg no
 longer share anything.

I realized that they are fundamently too different to compose them.
It might make sense on some theoretical level, but as PEP20 says, it is not practical and realy awkward in doing so.
---
 .../translator/jaxpr_translator_builder.py    | 59 ++++++++++---------
 src/jace/translator/post_translation.py       | 14 +++--
 src/jace/translator/translated_jaxpr_sdfg.py  | 14 +----
 3 files changed, 40 insertions(+), 47 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index ae7282a..9aee655 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -460,7 +460,7 @@ def _create_initial_input(
         """
         if not self.is_allocated():
             raise RuntimeError("Builder is not allocated, can not create constants.")
-        assert len(self._ctx.jsdfg.inp_names) == 0
+        assert self._ctx.inp_names is None
 
         # Handle the initial input arguments
         init_in_var_names: Sequence[str] = self.create_jax_var_list(
@@ -473,7 +473,7 @@ def _create_initial_input(
         self.sdfg.arg_names = []
 
         # The output list is populated by `self._translate_jaxpr_internal()`
-        self._ctx.jsdfg.inp_names = tuple(init_in_var_names)
+        self._ctx.inp_names = tuple(init_in_var_names)
 
         return init_in_var_names
 
@@ -650,7 +650,7 @@ def _translate_jaxpr_internal(
         if nb_translated_eqn == 0:
             out_var_names = self._handle_null_jaxpr(jaxpr)
 
-        self._ctx.jsdfg.out_names = tuple(out_var_names)
+        self._ctx.out_names = tuple(out_var_names)
 
         return cast(TranslationContext, self._clear_translation_ctx())
 
@@ -671,10 +671,13 @@ def _handle_null_jaxpr(
 
         Todo:
             - Handle the case if if the output is a literal.
+
+        Note:
+            The function will _not_ update the `out_names` field of the current context.
         """
         assert self._ctx.terminal_state is self._ctx.start_state
-        assert len(self._ctx.jsdfg.inp_names) > 0
-        assert len(self._ctx.jsdfg.out_names) == 0
+        assert self._ctx.inp_names
+        assert self._ctx.out_names is None
 
         # There is not output so we do not have to copy anything around.
         if len(jaxpr.out_avals) == 0:
@@ -732,23 +735,30 @@ def _terminal_sdfg_state(self) -> dace.SDFGState:
 class TranslationContext:
     """Translation context used by the `JaxprTranslationBuilder`.
 
-    Essentially it is a `TranslatedJaxprSDFG` object together with some additional meta data,
-    that is needed during translation. It is also returned by the `translate_jaxpr()` function.
-    It is important that the SDFG it encapsulates is not directly usable and must be passed to the
-    `finalize_translation_context()` function, before it can be passed to the optimization stage.
-    However, it is recommended to pass it to the `postprocess_jaxpr_sdfg()` instead.
+    Internal representation of the builder of an SDFG under construction together with the needed
+    metadata. Essentially it is an extended version of the `TranslatedJaxprSDFG`, but carrying
+    an unfinished canonical SDFG.
+    A user should consider this class as an opaque object, that represents an invalid
+    `TranslatedJaxprSDFG` object, and the only valid operation a user can do with it is passing it
+    either to `finalize_translation_context()` or the `postprocess_jaxpr_sdfg()` function.
 
     Attributes:
-        jsdfg:          The wrapped `TranslatedJaxprSDFG` object that stores the SDFG under
-            construction.
-        start_state:    The first state in the SDFG state machine.
-        terminal_state: The (currently) last state in the state machine.
+        sdfg:              The encapsulated SDFG object.
+        inp_names:         A list of the SDFG variables that are used as input
+        out_names:         A list of the SDFG variables that are used as output.
+        start_state:       The first state in the SDFG state machine.
+        terminal_state:    The (currently) last state in the state machine.
 
     Args:
         name:       The name of the SDFG, will be forwarded to the encapsulated `TranslatedJaxprSDFG`.
+
+    Note:
+        Access of any attribute of this class by an outside user is considered undefined behaviour.
     """
 
-    jsdfg: translator.TranslatedJaxprSDFG
+    sdfg: dace.SDFG
+    inp_names: tuple[str, ...] | None
+    out_names: tuple[str, ...] | None
     start_state: dace.SDFGState
     terminal_state: dace.SDFGState
 
@@ -756,29 +766,20 @@ def __init__(
         self,
         name: str | None = None,
     ) -> None:
-        from jace import translator  # Cyclic import
-
         if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
-        self.jsdfg = translator.TranslatedJaxprSDFG(
-            sdfg=dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}")),
-            inp_names=(),
-            out_names=(),
-        )
+        self.sdfg = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
+        self.inp_names = None
+        self.out_names = None
         self.start_state = self.sdfg.add_state(label="initial_state", is_start_block=True)
         self.terminal_state = self.start_state
 
-    @property
-    def sdfg(self) -> dace.SDFG:
-        return self.jsdfg.sdfg
-
     def validate(self) -> bool:
         """Validate internal state of `self`.
 
-        Note:
-            The it is not possible to call the validation function of the embedded
-            `TranslatedJaxprSDFG` because the SDFG is still under construction`.
+        Since the SDFG is under construction it will not be validated, instead the meta data
+        will be validated.
         """
         if self.start_state is not self.sdfg.start_block:
             raise dace.sdfg.InvalidSDFGError(
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index 24d90c2..0f86e34 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -17,12 +17,12 @@
 import copy
 from typing import TYPE_CHECKING, Any
 
+from jace import translator
+
 
 if TYPE_CHECKING:
     from collections.abc import Callable, Sequence
 
-    from jace import translator
-
 
 def postprocess_jaxpr_sdfg(
     trans_ctx: translator.TranslationContext,
@@ -76,13 +76,17 @@ def finalize_translation_context(
         validate:       Call the validate function after the finalizing.
     """
     trans_ctx.validate()
-    if not trans_ctx.jsdfg.inp_names:
+    if trans_ctx.inp_names is None:
         raise ValueError("Input names are not specified.")
-    if not trans_ctx.jsdfg.out_names:
+    if trans_ctx.out_names is None:
         raise ValueError("Output names are not specified.")
 
     # We guarantee decoupling
-    tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(trans_ctx.jsdfg)
+    tsdfg = translator.TranslatedJaxprSDFG(
+        sdfg=copy.deepcopy(trans_ctx.sdfg),
+        inp_names=trans_ctx.inp_names,
+        out_names=trans_ctx.out_names,
+    )
 
     # Make inputs and outputs to globals.
     sdfg_arg_names: list[str] = []
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 7eac48e..f3c5d41 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -12,7 +12,7 @@
 import dace
 
 
-@dataclasses.dataclass(kw_only=True)
+@dataclasses.dataclass(kw_only=True, frozen=True)
 class TranslatedJaxprSDFG:
     """Encapsulates the translated SDFG together with the metadata that is needed to run it.
 
@@ -43,24 +43,12 @@ class TranslatedJaxprSDFG:
 
     def validate(self) -> bool:
         """Validate the underlying SDFG."""
-        if not self.inp_names:
-            raise dace.sdfg.InvalidSDFGError(
-                "There are no input arguments.",
-                self.sdfg,
-                self.sdfg.node_id(self.sdfg.start_state),
-            )
         if any(self.sdfg.arrays[inp].transient for inp in self.inp_names):
             raise dace.sdfg.InvalidSDFGError(
                 f"Found transient inputs: {(inp for inp in self.inp_names if self.sdfg.arrays[inp].transient)}",
                 self.sdfg,
                 self.sdfg.node_id(self.sdfg.start_state),
             )
-        if not self.out_names:
-            raise dace.sdfg.InvalidSDFGError(
-                "There are no output arguments.",
-                self.sdfg,
-                self.sdfg.node_id(self.sdfg.start_state),
-            )
         if any(self.sdfg.arrays[out].transient for out in self.out_names):
             raise dace.sdfg.InvalidSDFGError(
                 f"Found transient outputs: {(out for out in self.out_names if self.sdfg.arrays[out].transient)}",

From cf99b028fb7319130b6de250def81ee0997af565 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 2 Jun 2024 10:16:07 +0200
Subject: [PATCH 291/458] Updated the coverage again.

It now also reprorts the contextes.
---
 pyproject.toml | 21 ++++++++++++---------
 1 file changed, 12 insertions(+), 9 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index f85e586..0d3362a 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -46,33 +46,36 @@ Changelog = "https://github.com/GridTools/JaCe/releases"
 Discussions = "https://github.com/GridTools/JaCe/discussions"
 Homepage = "https://github.com/GridTools/JaCe"
 
-[tool.coverage.run]
-branch = true
-source = ["jace"]
+[tool.coverage]
+
+[tool.coverage.html]
+show_contexts = true
 
 [tool.coverage.report]
 # Regexes for lines to exclude from consideration
 exclude_also = [
   # Don't complain about missing debug-only code:
   'def __repr__',
-
   # Don't complain about typechecker includes
   'if typing.TYPE_CHECKING:',
   '\.\.\.',
   '@overload',
-
   # Don't complain if tests don't hit defensive assertion code:
   'raise AssertionError',
   'raise NotImplementedError',
-
   # Don't complain if non-runnable code isn't run:
   'if 0:',
   'if __name__ == .__main__.:',
-
-  # Don't complain about abstract methods, they aren't run:
+  # Don't complain about abstract methods and interfaces.
   '@(abc\\.)?abstractmethod',
   '@(abc\\.)?abstract',
-  ]
+  'class .*\bProtocol\):'
+]
+
+[tool.coverage.run]
+branch = true
+dynamic_context = "test_function"
+source = ["jace"]
 
 # -- mypy  --
 [tool.mypy]

From 7424687d490cb0cb6329e1d2a4fb378443c13c98 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 2 Jun 2024 10:20:20 +0200
Subject: [PATCH 292/458] Made a note about what tests are still needed.

---
 tests/conftest.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/tests/conftest.py b/tests/conftest.py
index e55ad74..936d6be 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -9,6 +9,7 @@
 
 Todo:
     - Implement some fixture that allows to force validation.
+    - Implement fixture to disable and enable optimisation, i.e. doing it twice.
 """
 
 from __future__ import annotations

From b996041e6a68cc80ebaeb8d3c6638361e51923f6 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 2 Jun 2024 12:53:39 +0200
Subject: [PATCH 293/458] Fixed the issue with the logical operations.

---
 .../mapped_operation_base_translator.py       |   2 -
 .../primitive_translators/__init__.py         |   4 +-
 .../primitive_translators/alu_translators.py  | 126 +++++++++++++-----
 3 files changed, 96 insertions(+), 36 deletions(-)

diff --git a/src/jace/translator/mapped_operation_base_translator.py b/src/jace/translator/mapped_operation_base_translator.py
index 6b802fb..fb42ea0 100644
--- a/src/jace/translator/mapped_operation_base_translator.py
+++ b/src/jace/translator/mapped_operation_base_translator.py
@@ -54,8 +54,6 @@ class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
         This class will always generate a mapped Tasklet, even if a scalar is handled.
     """
 
-    __slots__ = ("_prim_name",)
-
     def __init__(
         self,
         primitive_name: str,
diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 61fcc38..a3221d4 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -8,7 +8,7 @@
 
 from __future__ import annotations
 
-from .alu_translators import ALUTranslator
+from .alu_translators import ArithmeticOperationTranslator
 from .broadcast_in_dim_translator import BroadcastInDimTranslator
 from .convert_element_type_translator import ConvertElementTypeTranslator
 from .copy_translator import CopyTranslator, DevicePutTranslator
@@ -20,7 +20,7 @@
 
 
 __all__ = [
-    "ALUTranslator",
+    "ArithmeticOperationTranslator",
     "BroadcastInDimTranslator",
     "ConvertElementTypeTranslator",
     "CopyTranslator",
diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/alu_translators.py
index c64665f..ab0dcf9 100644
--- a/src/jace/translator/primitive_translators/alu_translators.py
+++ b/src/jace/translator/primitive_translators/alu_translators.py
@@ -5,15 +5,20 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Module containing all translators related to arithmetic logical operations."""
+"""Module containing all translators related to arithmetic and logical operations.
+
+Todo:
+    - Hijack Jax to inject a proper modulo operation.
+"""
 
 from __future__ import annotations
 
 from typing import TYPE_CHECKING, Final
 
+import dace
 from typing_extensions import override
 
-from jace import translator
+from jace import translator, util
 from jace.translator import mapped_operation_base_translator as mapped_base
 
 
@@ -23,26 +28,28 @@
     from jax import core as jax_core
 
 
-class ALUTranslator(mapped_base.MappedOperationTranslatorBase):
-    """Translator for all arithmetic and logical operations.
+class ArithmeticOperationTranslator(mapped_base.MappedOperationTranslatorBase):
+    """Translator for all arithmetic operations.
 
-    The class uses `MappedOperationBaseTranslator` for generating the maps.
-    Its `write_tasklet_code()` function will perform replace all literals.
-    """
+    The class makes use of the `MappedOperationTranslatorBase`. It only implements the
+    `write_tasklet_code()` to generate the code for a Tasklet from a template.
 
-    __slots__ = ("_tskl_tmpl",)
+    Args:
+        prim_name:      The name of the primitive that should be handled.
+        tskl_tmpl:      Template used for generating the Tasklet code.
+
+    Note:
+        - It does not implement the logical operations, they are implemented by the
+            `LogicalOperationTranslator` class.
+        - It does not implement `mod` nor `fmod` as they are translated to some nested `pjit`
+            implementation by Jax for unknown reasons.
+    """
 
     def __init__(
         self,
         prim_name: str,
         tskl_tmpl: str,
     ) -> None:
-        """Initialize a base translator for primitive `prim_name` with template `tskl_tmpl`.
-
-        Args:
-            prim_name:      The name of the primitive that should be handled.
-            tskl_tmpl:      Template used for generating the Tasklet code.
-        """
         super().__init__(primitive_name=prim_name)
         self._tskl_tmpl = tskl_tmpl
 
@@ -60,15 +67,61 @@ def write_tasklet_code(
         return tskl_code
 
 
-# Contains all the templates for ALU operations.
-#  TODO(phimuell): Import them also from `frontend/python/replacements.py`, however, the names
-#   do not fully matches the Jax names, `grep -P '^[a-zA-Z0-9_]+_p[[:space:]]+' -r -o -h | sort -u`
-# NOTES:
-#   - Jax does not seem to have a mod, `%? , operation, instead a nested computation is done.
-#   - Jax has multiple shift operations, only one is implemented.
-#   - The logical operations, i.e. `and`, `xor`, `or` and `not` are bitwise, in Jax.
+class LogicalOperationTranslator(mapped_base.MappedOperationTranslatorBase):
+    """Translator for all logical operations.
+
+    The reason why the logical operations are separated from the arithmetic operation is quite
+    complicated, and in fact the whole thing is harder than it should be.
+    NumPy has two kinds of these operations, i.e. `logical_{and, or, xor, not}()` and
+    `bitwise_{and, or, xor, not}()`, but Jax has only a single kind of logical operations, that
+    operate in bitwise mode.
+    The first idea would be to use `ArithmeticOperationTranslator` with a template such as
+    `__out = __in0 & __in1` or `__out = ~__in0`. Since DaCe eventually generates C++ code and C++
+    has a native bool type, and `true` is guaranteed to be `1` and `false` equals `0`, this works
+    for all operations except `not`, as `~true` in C++ is again `true`. Thus the `not` primitive
+    must be handled separately, however, it does not make sense to split the logical operations,
+    thus all of them are handled by this class.
+    I think that in XLA, Jax target language, a bool is either a single bit or either all bits are
+    one or zero.
+
+    The solution to the problem is, to introduce two templates, one used for the bool context
+    and one used in the integer context. This works because depending if the `logical_*()` or
+    `bitwise_*()` functions are used the input is either of type bool or an integer.
+
+    Args:
+        prim_name:      The name of the primitive that should be handled.
+        int_tmpl:       The template used for the integer case.
+        bool_tmpl:      The template used for the bool case.
+
+    Notes:
+        This class does not do parameter substitution as the `ArithmeticOperationTranslator` does.
+    """
+
+    def __init__(
+        self,
+        prim_name: str,
+        int_tmpl: str,
+        bool_tmpl: str,
+    ) -> None:
+        super().__init__(primitive_name=prim_name)
+        self._int_tmpl = int_tmpl
+        self._bool_tmpl = bool_tmpl
+
+    @override
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        if all(util.get_jax_var_dtype(invar) is dace.bool_ for invar in eqn.invars):
+            return self._bool_tmpl
+        return self._int_tmpl
+
+
+# Contains the code templates for all supported arithmetic operations.
 # fmt: off
-_ALU_OPS_TMPL: Final[dict[str, str]] = {
+_ARITMETIC_OPERATION_TEMPLATES: Final[dict[str, str]] = {
     # Unary operations
     "pos": "__out = +(__in0)",
     "neg": "__out = -(__in0)",
@@ -129,15 +182,24 @@ def write_tasklet_code(
     "right_shift": "__out = (__in0) >> (__in1)",
     "nextafter": "__out = nextafter((__in0), (__in1))",
 
-    # Logical operations
-    #  Note in Jax all logical operations are bitwise; for "logical" operations they are first
-    #  turned into "bools" by `ne a 0`.
-    "or": "__out = (__in0) | (__in1)",
-    "not": "__out = ~(__in0)",
-    "and": "__out = (__in0) & (__in1)",
-    "xor": "__out = (__in0) ^ (__in1)",
 }
 
-# Create the ALU translators
-for pname, ptmpl in _ALU_OPS_TMPL.items():
-    translator.register_primitive_translator(ALUTranslator(pname, ptmpl))
+
+# Contains the code templates for all logical operations.
+#  The first one is for the integer case, the second for the bool case.
+_LOGICAL_OPERATION_TEMPLATES: Final[dict[str, tuple[str, str]]] = {
+    "or": ("__out = (__in0) | (__in1)",  "__out = (__in0) or (__in1)"),
+    "not": ("__out = ~(__in0)", "__out = not (__in0)"),
+    "and": ("__out = (__in0) & (__in1)", "__out = (__in0) and (__in1)"),
+    "xor": ("__out = (__in0) ^ (__in1)", "__out = (__in0) != (__in1)"),
+}
+
+
+
+# Create the arithmetic translators
+for pname, ptmpl in _ARITMETIC_OPERATION_TEMPLATES.items():
+    translator.register_primitive_translator(ArithmeticOperationTranslator(pname, ptmpl))
+
+# create the logical translators.
+for pname, (itmpl, btmpl) in _LOGICAL_OPERATION_TEMPLATES.items():
+    translator.register_primitive_translator(LogicalOperationTranslator(pname, itmpl, btmpl))

From bb9d81d8f8a3f4901e9c6a4636fed6161dc5a1ce Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 2 Jun 2024 13:45:45 +0200
Subject: [PATCH 294/458] Updated the ALU tests.

Now we make sure that onyl ALU translators are used.
However, the biggst test, the running of all templates is not yet implemented.
---
 .../test_primitive_alu.py                     | 109 ++++++++++++------
 1 file changed, 74 insertions(+), 35 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_alu.py b/tests/integration_tests/primitive_translators/test_primitive_alu.py
index 774ebe4..d589f07 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_alu.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_alu.py
@@ -5,7 +5,9 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements tests for the ALU translator.
+"""Implements tests for the ALU and the `MappedOperationTranslatorBase` translator.
+
+The function mostly tests the `MappedOperationTranslatorBase` class by performing additions.
 
 Todo:
     - Add all supported primitives, to see if the template is valid.
@@ -14,7 +16,7 @@
 from __future__ import annotations
 
 from collections.abc import Callable
-from typing import TYPE_CHECKING, Any, cast
+from typing import TYPE_CHECKING, Any
 
 import jax
 import numpy as np
@@ -30,6 +32,33 @@
     from collections.abc import Callable
 
 
+@pytest.fixture(autouse=True)
+def _only_alu_translators():
+    """Removes all non arithmetic/logical translator from the registry.
+
+    This ensures that Jax is not doing some stuff that is supposed to be handled by the
+    test class, such as broadcasting. It makes writing tests a bit harder, but it is worth.
+    """
+    from jace.translator.primitive_translators.alu_translators import (
+        _ARITMETIC_OPERATION_TEMPLATES,
+        _LOGICAL_OPERATION_TEMPLATES,
+    )
+
+    # Remove all non ALU translators from the registry
+    all_translators = jace.translator.get_regsitered_primitive_translators()
+    alu_translators_names = (
+        _LOGICAL_OPERATION_TEMPLATES.keys() | _ARITMETIC_OPERATION_TEMPLATES.keys()
+    )
+    jace.translator.set_active_primitive_translators_to(
+        {p: t for p, t in all_translators.items() if p in alu_translators_names}
+    )
+
+    yield
+
+    # Restore the initial state
+    jace.translator.set_active_primitive_translators_to(all_translators)
+
+
 @pytest.fixture(
     params=[
         (jnp.logical_and, 2, np.bool_),
@@ -56,16 +85,25 @@ def _perform_alu_test(testee: Callable, *args: Any) -> None:
 
     ref = testee(*args)
     res = wrapped(*args)
+
+    if jace.util.is_scalar(ref):
+        # Builder hack, only arrays are generated.
+        assert res.shape == (1,)
+    elif ref.shape == ():  # TODO: Investigate
+        assert res.shape == (1,)
+    else:
+        assert ref.shape == res.shape
+    assert ref.dtype == res.dtype
     assert np.allclose(ref, res), f"Expected '{ref.tolist()}' got '{res.tolist()}'"
 
 
 def test_alu_unary_scalar():
     """Test unary ALU translator in the scalar case."""
 
-    def testee(A: float) -> float | jax.Array:
+    def testee(A: np.float64) -> np.float64 | jax.Array:
         return jnp.cos(A)
 
-    _perform_alu_test(testee, 1.0)
+    _perform_alu_test(testee, np.float64(1.0))
 
 
 def test_alu_unary_array():
@@ -90,40 +128,47 @@ def testee(A: float) -> float | jax.Array:
 
 def test_alu_unary_integer_power():
     """Tests the integer power, which has a parameter."""
-    for exp in [0, 1, 2, 10]:
 
-        def testee(A: np.ndarray) -> np.ndarray:
-            return A ** int(exp)  # noqa: B023 # `exp` is not used in the body
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A**3
+
+    A = testutil.mkarray((10, 2, 3))
+    _perform_alu_test(testee, A)
+
 
-        A = testutil.mkarray((10, 2 + exp, 3))
-        _perform_alu_test(testee, A)
+def test_alu_unary_regular_power():
+    """Tests the "normal" power operator, i.e. not with a known integer power."""
+
+    for exp in [3, np.float64(3.1415)]:
+
+        def testee(A: np.ndarray, exp: int | float) -> np.ndarray:
+            return A**exp
+
+        A = testutil.mkarray((10, 2, 3))
+        _perform_alu_test(testee, A, exp)
 
 
 def test_alu_binary_scalar():
     """Scalar binary operation."""
 
-    def testee(A: float, B: float) -> float:
+    def testee(A: np.float64, B: np.float64) -> np.float64:
         return A * B
 
-    _perform_alu_test(testee, 1.0, 2.0)
+    _perform_alu_test(testee, np.float64(1.0), np.float64(2.0))
 
 
 def test_alu_binary_scalar_literal():
     """Scalar binary operation, with a literal."""
 
-    def testee(A: float) -> float:
+    def testeeR(A: np.float64) -> np.float64:
         return A * 2.03
 
-    _perform_alu_test(testee, 7.0)
-
-
-def test_alu_binary_scalar_literal_2():
-    """Scalar binary operation, with a literal."""
-
-    def testee(A: float) -> float:
+    def testeeL(A: np.float64) -> np.float64:
         return 2.03 * A
 
-    _perform_alu_test(testee, 7.0)
+    A = np.float64(7.0)
+    _perform_alu_test(testeeR, A)
+    _perform_alu_test(testeeL, A)
 
 
 def test_alu_binary_array():
@@ -140,8 +185,8 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 def test_alu_binary_array_scalar():
     """Test binary of array with scalar."""
 
-    def testee(A: np.ndarray | float, B: float | np.ndarray) -> np.ndarray:
-        return cast(np.ndarray, A + B)
+    def testee(A: np.ndarray | np.float64, B: np.float64 | np.ndarray) -> np.ndarray:
+        return A + B  # type: ignore[return-value]  # It is always an array.
 
     A = testutil.mkarray((100, 22))
     B = np.float64(1.34)
@@ -152,21 +197,15 @@ def testee(A: np.ndarray | float, B: float | np.ndarray) -> np.ndarray:
 def test_alu_binary_array_literal():
     """Test binary of array with literal"""
 
-    def testee(A: np.ndarray) -> np.ndarray:
+    def testeeR(A: np.ndarray) -> np.ndarray:
         return A + 1.52
 
-    A = testutil.mkarray((100, 22))
-    _perform_alu_test(testee, A)
-
-
-def test_alu_binary_array_literal_2():
-    """Test binary of array with literal"""
-
-    def testee(A: np.ndarray) -> np.ndarray:
+    def testeeL(A: np.ndarray) -> np.ndarray:
         return 1.52 + A
 
     A = testutil.mkarray((100, 22))
-    _perform_alu_test(testee, A)
+    _perform_alu_test(testeeR, A)
+    _perform_alu_test(testeeL, A)
 
 
 def test_alu_binary_array_constants():
@@ -209,15 +248,15 @@ def test_alu_binary_broadcast_3():
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
-    A = testutil.mkarray((5, 1, 3, 4, 1))
-    B = testutil.mkarray((5, 1, 3, 1, 2))
+    A = testutil.mkarray((5, 1, 3, 4, 1, 5))
+    B = testutil.mkarray((5, 1, 3, 1, 2, 5))
     _perform_alu_test(testee, A, B)
     _perform_alu_test(testee, B, A)
 
 
 def test_alu_logical_bitwise_operation(
     logical_ops: tuple[Callable, tuple[np.ndarray, ...]],
-):
+) -> None:
     """Tests if the logical and bitwise operations works as they do in Jax."""
     inputs: tuple[np.ndarray, ...] = logical_ops[1]
 

From 95b34cf0577174e4fa2e9e94ad23fdec9e92a9e1 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 2 Jun 2024 14:00:18 +0200
Subject: [PATCH 295/458] Updated the iota test.

---
 .../primitive_translators/test_primitive_iota.py            | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_iota.py b/tests/integration_tests/primitive_translators/test_primitive_iota.py
index 63f790b..7ae4cfa 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_iota.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_iota.py
@@ -27,10 +27,10 @@ def testee(A: int) -> jax.Array:
 
 def test_iota_broadcast():
     """Test more iota using the `jax.lax.broadcasted_iota()` function."""
-    shape = (4, 4, 4, 4)
+    shape = (2, 2, 2, 2)
 
     for d in range(len(shape)):
-
+        # Must be inside the loop to bypass caching.
         def testee(A: np.int32) -> jax.Array:
             return jax.lax.broadcasted_iota("int32", shape, d) + A  # noqa: B023  # Variable capturing.
 
@@ -38,4 +38,4 @@ def testee(A: np.int32) -> jax.Array:
         res = jace.jit(testee)(np.int32(0))
 
         assert res.shape == shape
-        assert np.all(ref == res)
+        assert np.all(ref == res), f"Expected: {ref.tolist()}; Got: {res.tolist()}"

From 72c055a02c8a9863ccd7e9469bfb2c85dcad8342 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.paul.mueller@bluemain.ch>
Date: Sun, 2 Jun 2024 15:48:40 +0200
Subject: [PATCH 296/458] Fixed an issue in the pyproject configuration
 regarding the `TYPE_CHECKING` exclusion.

---
 pyproject.toml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pyproject.toml b/pyproject.toml
index 0d3362a..d7e3b1d 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -57,7 +57,7 @@ exclude_also = [
   # Don't complain about missing debug-only code:
   'def __repr__',
   # Don't complain about typechecker includes
-  'if typing.TYPE_CHECKING:',
+  'if TYPE_CHECKING:',
   '\.\.\.',
   '@overload',
   # Don't complain if tests don't hit defensive assertion code:

From 66fa0380d99e8c8688539c44aa5303feaf809086 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 3 Jun 2024 08:08:52 +0200
Subject: [PATCH 297/458] Fixed a bug in the builder.

The returtn values where not handled correctly.
It only used the ones that were generated by the last equation that was translated.
---
 .../translator/jaxpr_translator_builder.py     | 18 +++++++++---------
 1 file changed, 9 insertions(+), 9 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 9aee655..0a2a80d 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -546,7 +546,7 @@ def _clear_translation_ctx(self) -> TranslationContext | None:
     def _translate_single_eqn(
         self,
         eqn: jax_core.JaxprEqn,
-    ) -> tuple[Sequence[str | None], Sequence[str]]:
+    ) -> None:
         """Translate `eqn` into its SDFG equivalent.
 
         To do this the function will perform the following steps:
@@ -554,10 +554,6 @@ def _translate_single_eqn(
         - Select the appropriate primitive translator to use.
         - Create a new empty state terminal state.
         - Call the primitive translator to perform the translation inside the new state.
-
-        Returns:
-            The SDFG names that were used as inputs and outputs. The inputs might contain `None`
-            which indicates that this particular input was a literal.
         """
         if len(eqn.effects) != 0:
             raise NotImplementedError(f"Equation '{eqn}' has side effects.")
@@ -619,8 +615,6 @@ def _translate_single_eqn(
         # Modify terminal root state of 'self'
         self._ctx.terminal_state = new_sdfg_term_state
 
-        return (in_var_names, out_var_names)
-
     def _translate_jaxpr_internal(
         self,
         jaxpr: jax_core.ClosedJaxpr,
@@ -643,12 +637,18 @@ def _translate_jaxpr_internal(
             if any(util.is_drop_var(outVar) for outVar in eqn.outvars):
                 assert all(util.is_drop_var(outVar) for outVar in eqn.outvars)
                 continue
-            _, out_var_names = self._translate_single_eqn(eqn=eqn)
+            self._translate_single_eqn(eqn=eqn)
             nb_translated_eqn += 1
 
-        # There were no (useful) equations; thus the Jaxpr was empty.
+        # Handle the output or the case of an empty Jaxpr
         if nb_translated_eqn == 0:
             out_var_names = self._handle_null_jaxpr(jaxpr)
+        else:
+            out_var_names = self.create_jax_var_list(
+                jaxpr.jaxpr.outvars,
+                prevent_creation=True,
+                handle_literals=False,
+            )
 
         self._ctx.out_names = tuple(out_var_names)
 

From fa599c399a7de57ef666b51cb45e32f66103241c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 3 Jun 2024 08:16:19 +0200
Subject: [PATCH 298/458] Added some more tests to the empty case.

---
 tests/integration_tests/test_empty_jaxpr.py | 57 +++++++++++++++++----
 1 file changed, 47 insertions(+), 10 deletions(-)

diff --git a/tests/integration_tests/test_empty_jaxpr.py b/tests/integration_tests/test_empty_jaxpr.py
index 8dfc495..e4dbc09 100644
--- a/tests/integration_tests/test_empty_jaxpr.py
+++ b/tests/integration_tests/test_empty_jaxpr.py
@@ -22,33 +22,67 @@
 
 def test_empty_array():
     @jace.jit
-    def testee(A: np.ndarray) -> np.ndarray:
+    def wrapped(A: np.ndarray) -> np.ndarray:
         return A
 
     A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    res = wrapped(A)
 
-    assert np.all(testee(A) == A)
+    assert np.all(res == A)
+    assert res.__array_interface__["data"][0] != A.__array_interface__["data"][0]
+
+
+def test_empty_multiple():
+    @jace.jit
+    def wrapped(A: np.ndarray, B: np.float64) -> tuple[np.ndarray, np.float64]:
+        return A, B
+
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.float64(30.0)
+    res = wrapped(A, B)
+
+    assert np.all(res[0] == A)
+    assert res[1] == B
+    assert res[0].__array_interface__["data"][0] != A.__array_interface__["data"][0]
+
+
+def test_empty_unused():
+    @jace.jit
+    def wrapped(A: np.ndarray, B: np.float64) -> np.ndarray:  # noqa: ARG001  # Explicitly unused.
+        return A
+
+    A = np.arange(12, dtype=np.float64).reshape((4, 3))
+    B = np.float64(30.0)
+    lowered = wrapped.lower(A, B)
+    compiled = lowered.compile()
+    res = compiled(A, B)
+
+    assert len(lowered._translated_sdfg.inp_names) == 2
+    assert len(compiled._inp_names) == 2
+    assert isinstance(res, np.ndarray)
+    assert np.all(res == A)
+    assert res.__array_interface__["data"][0] != A.__array_interface__["data"][0]
 
 
 def test_empty_scalar():
     @jace.jit
-    def testee(A: float) -> float:
+    def wrapped(A: float) -> float:
         return A
 
     A = np.pi
 
-    assert np.all(testee(A) == A)
+    assert np.all(wrapped(A) == A)
 
 
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_empty_nested():
     @jace.jit
-    def testee(A: float) -> float:
+    def wrapped(A: float) -> float:
         return jax.jit(lambda A: A)(A)
 
     A = np.pi
 
-    assert np.all(testee(A) == A)
+    assert np.all(wrapped(A) == A)
 
 
 def test_empty_with_drop_vars():
@@ -56,12 +90,12 @@ def test_empty_with_drop_vars():
 
     @jace.jit
     @jace.grad
-    def testee(A: float) -> float:
+    def wrapped(A: float) -> float:
         return A * A
 
     A = np.pi
 
-    assert np.all(testee(A) == 2.0 * A)
+    assert np.all(wrapped(A) == 2.0 * A)
 
 
 @pytest.mark.skip(reason="Literal return value is not implemented.")
@@ -72,13 +106,16 @@ def test_empty_literal_return():
         Using this test function serves another purpose. Since Jax includes the original
         computation in the Jaxpr coming from a `grad` annotated function, the result will have
         only drop variables.
+
+    Todo:
+        Add a test if we really have a literal return value, but for that we need the Jaxpr.
     """
 
     @jace.jit
     @jace.grad
-    def testee(A: float) -> float:
+    def wrapped(A: float) -> float:
         return A + A + A
 
     A = np.e
 
-    assert np.all(testee(A) == 3.0)
+    assert np.all(wrapped(A) == 3.0)

From e164d75a61534420aefec716e9fad8c384a373c0 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 3 Jun 2024 08:20:17 +0200
Subject: [PATCH 299/458] Added some more tests to the builder.

Thus I found some new errors that are not yet handled.
---
 .../test_jaxpr_translator_builder.py          | 96 ++++++++++++++++++-
 1 file changed, 95 insertions(+), 1 deletion(-)

diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 09ba0b7..b5a691c 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -532,7 +532,101 @@ def wrapped(A: np.float64) -> np.float64:
         return A + A - A * A
 
     A = np.float64(1.0)
-    assert type(A) is np.float64, f"Expected type 'np.float64', but got '{type(A).__name__}'."
+    res = wrapped(A)
+    assert type(res) is np.float64, f"Expected type 'np.float64', but got '{type(res).__name__}'."
+    assert res == np.float64(0.0)
+
+
+def test_builder_multiple_return_values() -> None:
+    """Tests the case that we return multiple value.
+
+    Currently this is always a tuple.
+    """
+
+    @jace.jit
+    def wrapped(A: np.ndarray, B: np.ndarray) -> tuple[np.ndarray, np.ndarray]:
+        return A + B, A - B
+
+    A = testutil.mkarray((2, 2))
+    B = testutil.mkarray((2, 2))
+
+    lowered = wrapped.lower(A, B)
+    compiled = lowered.compile()
+
+    ref = (A + B, A - B)
+    res = compiled(A, B)
+
+    assert len(lowered._translated_sdfg.inp_names) == 2
+    assert len(compiled._inp_names) == 2
+    assert len(lowered._translated_sdfg.out_names) == 2
+    assert len(compiled._out_names) == 2
+    assert isinstance(res, tuple), f"Expected 'tuple', but got '{type(res).__name__}'."
+    assert len(res) == 2
+    assert np.allclose(ref, res)
+
+
+@pytest.mark.skip(reason="The input is not copied in the output.")
+def test_builder_direct_return() -> None:
+    """Tests the case, when an input value is returned as output."""
+
+    @jace.jit
+    def wrapped(A: np.ndarray, B: np.ndarray) -> tuple[np.ndarray, np.ndarray, np.ndarray]:
+        return A + B, B, A
+
+    A = testutil.mkarray((2, 2))
+    B = testutil.mkarray((2, 2))
+
+    ref0 = A + B
+    res = wrapped(A, B)
+
+    assert isinstance(res, tuple)
+    assert len(res) == 3
+    assert np.allclose(ref0, res[0])
+    assert np.all(res[2] == A)
+    assert res[2].__array_interface__["data"][0] != A.__array_interface__["data"][0]
+    assert np.all(res[1] == B)
+    assert res[1].__array_interface__["data"][0] != B.__array_interface__["data"][0]
+
+
+@pytest.mark.skip(reason="Literal return values are not supported.")
+def test_builder_literal_return_value() -> None:
+    """Tests if there can be literals in the return values."""
+
+    def testee(A: np.ndarray) -> tuple[np.ndarray, np.float64, np.ndarray]:
+        return (A + 1.0, np.float64(1.0), A - 1.0)
+
+    A = testutil.mkarray((2, 2))
+    ref = testee(A)
+    res = jace.jit(testee)(A)
+
+    assert isinstance(res, tuple)
+    assert len(res) == 3
+    assert res[1].dtype is np.float64
+    assert all(np.allclose(ref[i], res[i]) for i in range(3))
+
+
+def test_builder_unused_arg() -> None:
+    """Tests if there is an unused argument."""
+
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:  # noqa: ARG001  # Explicitly unused.
+        return A + 3.0
+
+    A = testutil.mkarray((10, 10))
+    B = testutil.mkarray((11, 11))
+    C = testutil.mkarray((20, 20))
+
+    wrapped = jace.jit(testee)
+    lowered = wrapped.lower(A, B)
+    compiled = lowered.compile()
+
+    ref = testee(A, B)
+    res1 = compiled(A, B)  # Correct call
+    res2 = compiled(A, C)  # wrong call to show that nothing is affected.
+
+    assert len(lowered._translated_sdfg.inp_names) == 2
+    assert len(compiled._inp_names) == 2
+    assert np.all(res1 == res2)
+    assert np.allclose(ref, res1)
 
 
 def test_builder_jace_var() -> None:

From 7fe6f3b19ad5b3cbb98436fac39ca557a10232a9 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 3 Jun 2024 08:08:52 +0200
Subject: [PATCH 300/458] Fixed a bug in the builder.

The returtn values where not handled correctly.
It only used the ones that were generated by the last equation that was translated.
---
 .../translator/jaxpr_translator_builder.py     | 18 +++++++++---------
 1 file changed, 9 insertions(+), 9 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 9aee655..0a2a80d 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -546,7 +546,7 @@ def _clear_translation_ctx(self) -> TranslationContext | None:
     def _translate_single_eqn(
         self,
         eqn: jax_core.JaxprEqn,
-    ) -> tuple[Sequence[str | None], Sequence[str]]:
+    ) -> None:
         """Translate `eqn` into its SDFG equivalent.
 
         To do this the function will perform the following steps:
@@ -554,10 +554,6 @@ def _translate_single_eqn(
         - Select the appropriate primitive translator to use.
         - Create a new empty state terminal state.
         - Call the primitive translator to perform the translation inside the new state.
-
-        Returns:
-            The SDFG names that were used as inputs and outputs. The inputs might contain `None`
-            which indicates that this particular input was a literal.
         """
         if len(eqn.effects) != 0:
             raise NotImplementedError(f"Equation '{eqn}' has side effects.")
@@ -619,8 +615,6 @@ def _translate_single_eqn(
         # Modify terminal root state of 'self'
         self._ctx.terminal_state = new_sdfg_term_state
 
-        return (in_var_names, out_var_names)
-
     def _translate_jaxpr_internal(
         self,
         jaxpr: jax_core.ClosedJaxpr,
@@ -643,12 +637,18 @@ def _translate_jaxpr_internal(
             if any(util.is_drop_var(outVar) for outVar in eqn.outvars):
                 assert all(util.is_drop_var(outVar) for outVar in eqn.outvars)
                 continue
-            _, out_var_names = self._translate_single_eqn(eqn=eqn)
+            self._translate_single_eqn(eqn=eqn)
             nb_translated_eqn += 1
 
-        # There were no (useful) equations; thus the Jaxpr was empty.
+        # Handle the output or the case of an empty Jaxpr
         if nb_translated_eqn == 0:
             out_var_names = self._handle_null_jaxpr(jaxpr)
+        else:
+            out_var_names = self.create_jax_var_list(
+                jaxpr.jaxpr.outvars,
+                prevent_creation=True,
+                handle_literals=False,
+            )
 
         self._ctx.out_names = tuple(out_var_names)
 

From b518ec77e46b964dcf093d02fa0ab313666c795e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 3 Jun 2024 18:00:28 +0200
Subject: [PATCH 301/458] Reenabled the input output functionality in the
 runner function again.

However, there is no full test for that yet.
---
 src/jace/util/compiling.py | 11 ++++++-----
 1 file changed, 6 insertions(+), 5 deletions(-)

diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index 81068fe..3aec681 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -110,8 +110,6 @@ def run_jax_sdfg(
         raise NotImplementedError("No kwargs are supported yet.")
     if len(inp_names) != len(cargs):
         raise RuntimeError("Wrong number of arguments.")
-    if len(set(inp_names).intersection(out_names)) != 0:
-        raise NotImplementedError("Using an input also for output is not yet supported.")
     if len(sdfg.free_symbols) != 0:  # This is a simplification that makes our life simple.
         raise NotImplementedError(
             f"No externally defined symbols are allowed, found: {sdfg.free_symbols}"
@@ -126,9 +124,12 @@ def run_jax_sdfg(
         call_args[in_name] = in_val
 
     for out_name, sarray in ((name, sdfg.arrays[name]) for name in out_names):
-        assert not (out_name in call_args and util.is_jax_array(call_args[out_name]))
-        assert isinstance(sarray, dace_data.Array)
-        call_args[out_name] = dace_data.make_array_from_descriptor(sarray)
+        if out_name in call_args:
+            if util.is_jax_array(call_args[out_name]):
+                # Jax arrays are immutable, so they can not be return values too.
+                raise ValueError("Passed a Jax array as output.")
+        else:
+            call_args[out_name] = dace_data.make_array_from_descriptor(sarray)
 
     assert len(call_args) == len(csdfg.argnames), (
         "Failed to construct the call arguments,"

From 94bdf5744ecd5f9edf4603d81213ce3ecf17c297 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 3 Jun 2024 18:04:37 +0200
Subject: [PATCH 302/458] Updated some tests, especially the x64 test.

---
 .../test_jaxpr_translator_builder.py          |  9 ++-
 tests/unit_tests/test_jax_api.py              | 59 +++++++++++--------
 2 files changed, 42 insertions(+), 26 deletions(-)

diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index b5a691c..463c3fc 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -565,9 +565,14 @@ def wrapped(A: np.ndarray, B: np.ndarray) -> tuple[np.ndarray, np.ndarray]:
     assert np.allclose(ref, res)
 
 
-@pytest.mark.skip(reason="The input is not copied in the output.")
 def test_builder_direct_return() -> None:
-    """Tests the case, when an input value is returned as output."""
+    """Tests the case, when an input value is returned as output.
+
+    Note:
+        The test function below will not return a reference to its input, but perform an actual
+        copy. This behaviour does look strange from a Python point of view, however, it is (at the
+        time of writing) consistent with what Jax does, even when passing Jax arrays directly.
+    """
 
     @jace.jit
     def wrapped(A: np.ndarray, B: np.ndarray) -> tuple[np.ndarray, np.ndarray, np.ndarray]:
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index e2f42e2..7571e7f 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -15,7 +15,8 @@
 from jax import numpy as jnp
 
 import jace
-from jace import util as jutil
+from jace import translator, util
+from jace.translator import pre_post_translation as ptrans
 
 from tests import util as testutil
 
@@ -32,10 +33,10 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     jax_testee = jax.jit(testee)
     jace_testee = jace.jit(testee)
 
-    assert jutil.is_jaxified(jax_testee)
-    assert not jutil.is_jaxified(jace_testee)
-    assert not jutil.is_jaceified(jax_testee)
-    assert jutil.is_jaceified(jace_testee)
+    assert util.is_jaxified(jax_testee)
+    assert not util.is_jaxified(jace_testee)
+    assert not util.is_jaceified(jax_testee)
+    assert util.is_jaceified(jace_testee)
 
     ref = jax_testee(A, B)
     res = jace_testee(A, B)
@@ -71,7 +72,7 @@ def df(x):
     def ddf(x):
         return df(x)
 
-    assert all(jutil.is_jaceified(x) for x in [f, df, ddf])
+    assert all(util.is_jaceified(x) for x in [f, df, ddf])
 
     x = 1.0
     for fun, fref in zip([f, df, ddf], [f_ref, df_ref, ddf_ref]):
@@ -107,25 +108,25 @@ def test_composition_with_jax_2():
     def f1_jax(A, B):
         return A + B
 
-    assert jutil.is_jaxified(f1_jax)
+    assert util.is_jaxified(f1_jax)
 
     @jace.jit
     def f2_jace(A, B, C):
         return f1_jax(A, B) - C
 
-    assert jutil.is_jaceified(f2_jace)
+    assert util.is_jaceified(f2_jace)
 
     @jax.jit
     def f3_jax(A, B, C, D):
         return f2_jace(A, B, C) * D
 
-    assert jutil.is_jaxified(f3_jax)
+    assert util.is_jaxified(f3_jax)
 
     @jace.jit
     def f3_jace(A, B, C, D):
         return f3_jax(A, B, C, D)
 
-    assert jutil.is_jaceified(f3_jace)
+    assert util.is_jaceified(f3_jace)
 
     A, B, C, D = (testutil.mkarray((10, 3, 50)) for _ in range(4))
 
@@ -186,11 +187,11 @@ def df(x):
     assert df(x2) == df_x2, f"Failed upper branch, expected '{df_x2}', got '{res_2}'."
 
 
-@pytest.mark.skip(reason="Running JaCe with disabled 'x64' support does not work.")
 def test_disabled_x64():
-    """Tests the behaviour of the tool chain if we explicitly disable x64 support in Jax.
+    """Tests the behaviour of the tool chain if x64 support is disabled.
 
-    If you want to test, if this restriction still applies, you can enable the test.
+    Notes:
+        Once the x64 issue is resolved make this test a bit more useful.
     """
     from jax.experimental import disable_x64
 
@@ -201,15 +202,25 @@ def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
     B = np.float64(10.0)
 
     # Run them with disabled x64 support
+    #  This is basically a reimplementation of the `JaCeWrapped.lower()` function.
+    #  but we have to do it this way to disable the x64 mode in translation.
     with disable_x64():
-        # JaCe
-        jace_testee = jace.jit(testee)
-        jace_lowered = jace_testee.lower(A, B)
-        jace_comp = jace_lowered.compile()
-        res = jace_comp(A, B)
-
-        # Jax
-        jax_testee = jax.jit(testee)
-        ref = jax_testee(A, B)
-
-    assert np.allclose(ref, res), "Expected that: {ref.tolist()}, but got {res.tolist()}."
+        jaxpr = jax.make_jaxpr(testee)(A, B)
+
+    builder = translator.JaxprTranslationBuilder(
+        primitive_translators=translator.get_regsitered_primitive_translators(),
+    )
+    trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
+
+    tsdfg: translator.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
+        trans_ctx=trans_ctx,
+        fun=testee,
+        call_args=(A, B),  # Already linearised, since we only accept positional args.
+        intree=None,  # Not yet implemented.
+    )
+
+    # Because x64 is disabled Jax traces the input as float32, even if we have passed
+    #  float64 as input! Calling the resulting SDFG with the arguments we used for lowering
+    #  will result in an error, because of the situation, `sizeof(float32) < sizeof(float64)`,
+    #  no out of bound error would result, but the values are garbage.
+    assert tsdfg.sdfg.arrays[tsdfg.inp_names[0]].dtype.as_numpy_dtype().type is np.float32

From 380dca9d5a77d06f3dadecd8e1932ec24ce62daf Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 3 Jun 2024 18:00:28 +0200
Subject: [PATCH 303/458] Reenabled the input output functionality in the
 runner function again.

However, there is no full test for that yet.
---
 src/jace/util/compiling.py | 11 ++++++-----
 1 file changed, 6 insertions(+), 5 deletions(-)

diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index 0e3fcd7..48d6ff4 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -105,8 +105,6 @@ def run_jax_sdfg(
         raise NotImplementedError("No kwargs are supported yet.")
     if len(inp_names) != len(cargs):
         raise RuntimeError("Wrong number of arguments.")
-    if len(set(inp_names).intersection(out_names)) != 0:
-        raise NotImplementedError("Using an input also for output is not yet supported.")
     if len(sdfg.free_symbols) != 0:  # This is a simplification that makes our life simple.
         raise NotImplementedError(
             f"No externally defined symbols are allowed, found: {sdfg.free_symbols}"
@@ -121,9 +119,12 @@ def run_jax_sdfg(
         call_args[in_name] = in_val
 
     for out_name, sarray in ((name, sdfg.arrays[name]) for name in out_names):
-        assert not (out_name in call_args and util.is_jax_array(call_args[out_name]))
-        assert isinstance(sarray, dace_data.Array)
-        call_args[out_name] = dace_data.make_array_from_descriptor(sarray)
+        if out_name in call_args:
+            if util.is_jax_array(call_args[out_name]):
+                # Jax arrays are immutable, so they can not be return values too.
+                raise ValueError("Passed a Jax array as output.")
+        else:
+            call_args[out_name] = dace_data.make_array_from_descriptor(sarray)
 
     assert len(call_args) == len(csdfg.argnames), (
         "Failed to construct the call arguments,"

From 35dc1f10da1fa69000cb005687e3009ef3cf61f3 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 4 Jun 2024 08:19:49 +0200
Subject: [PATCH 304/458] Enrique's comments.

---
 src/jace/api.py                               |  8 +-
 src/jace/optimization.py                      | 11 +--
 src/jace/stages.py                            | 20 ++---
 src/jace/translator/__init__.py               |  4 +-
 .../translator/jaxpr_translator_builder.py    | 76 +++++++------------
 src/jace/translator/primitive_translator.py   | 27 +++----
 .../primitive_translators/alu_translator.py   |  4 +-
 tests/__init__.py                             |  7 ++
 tests/test_jaxpr_translator_builder.py        |  4 +-
 tests/test_subtranslator_helper.py            | 36 ++++-----
 10 files changed, 87 insertions(+), 110 deletions(-)

diff --git a/src/jace/api.py b/src/jace/api.py
index 78d2c65..0fd1d31 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -5,12 +5,12 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Stand in for the `jax.*` namespace."""
+"""Implementation of the `jax.*` namespace."""
 
 from __future__ import annotations
 
 import functools
-from typing import TYPE_CHECKING, Any, Literal, cast, overload
+from typing import TYPE_CHECKING, Any, Literal, overload
 
 from jax import grad, jacfwd, jacrev
 
@@ -73,6 +73,7 @@ def jit(
         )
 
     def wrapper(f: Callable) -> stages.JaCeWrapped:
+        # TODO: Improve typing, such that signature is attached to the `JaCeWrapped`.
         jace_wrapper = stages.JaCeWrapped(
             fun=f,
             primitive_translators=(
@@ -82,6 +83,7 @@ def wrapper(f: Callable) -> stages.JaCeWrapped:
             ),
             jit_options=kwargs,
         )
-        return cast(stages.JaCeWrapped, functools.update_wrapper(jace_wrapper, f))
+        functools.update_wrapper(jace_wrapper, f)
+        return jace_wrapper
 
     return wrapper if fun is None else wrapper(fun)
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index 249225e..6d59926 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -29,15 +29,13 @@ class CompilerOptions(TypedDict, total=False):
     There are some predefined option sets in `jace.jax.stages`:
     - `DEFAULT_OPTIONS`
     - `NO_OPTIMIZATIONS`
-
-    Todo:
-        - Implement a context manager to dynamically change the default.
     """
 
     auto_optimize: bool
     simplify: bool
 
 
+# TODO(phimuell): Add a context manager to modify the default.
 DEFAULT_OPTIMIZATIONS: Final[CompilerOptions] = {
     "auto_optimize": True,
     "simplify": True,
@@ -62,14 +60,9 @@ def jace_optimize(
         tsdfg:          The translated SDFG that should be optimized.
         simplify:       Run the simplification pipeline.
         auto_optimize:  Run the auto optimization pipeline (currently does nothing)
-
-    Note:
-        Its main job is to exists that we have something that we can call in the tool chain.
     """
-    if not kwargs:
-        return
+    # Currently this function exists primarily for the same of existing.
 
-    # Unpack the arguments, defaults are such that no optimization is done.
     simplify = kwargs.get("simplify", False)
     auto_optimize = kwargs.get("auto_optimize", False)
 
diff --git a/src/jace/stages.py b/src/jace/stages.py
index a828e4a..3abe071 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -90,9 +90,9 @@ def __init__(
         # We have to shallow copy both the translator and the jit options.
         #  This prevents that any modifications affect `self`.
         #  Shallow is enough since the translators themselves are immutable.
-        self._primitive_translators = dict(primitive_translators)
+        self._primitive_translators = {**primitive_translators}
         # TODO(phimuell): Do we need to deepcopy the options?
-        self._jit_options = dict(jit_options)
+        self._jit_options = {**jit_options}
         self._fun = fun
 
     def __call__(
@@ -195,7 +195,7 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
 
     Note:
         `self` will manage the passed `tsdfg` object. Modifying it results in undefined behavior.
-        Although, `JaCeWrapped` is composable with Jax transformations `JaCeLowered` is not.
+        Although `JaCeWrapped` is composable with Jax transformations `JaCeLowered` is not.
         A user should never create such an object, instead `JaCeWrapped.lower()` should be used.
 
     Todo:
@@ -227,7 +227,7 @@ def compile(
             the default arguments.
         """
         # We **must** deepcopy before we do any optimization, because all optimizations are in
-        #  place, however, to properly cache stages, they have to be immutable.
+        #  place, however, to properly cache stages, stages needs to be immutable.
         tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
         optimization.jace_optimize(tsdfg=tsdfg, **self._make_compiler_options(compiler_options))
 
@@ -240,8 +240,8 @@ def compile(
     def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
         """Returns the internal SDFG.
 
-        The function returns a `TranslatedJaxprSDFG` object. It is important that modifying this
-        object in any way is undefined behavior.
+        The function returns a `TranslatedJaxprSDFG` object. Direct modification of the returned
+        object is forbidden and will cause undefined behaviour.
         """
         if (dialect is None) or (dialect.upper() == "SDFG"):
             return self._translated_sdfg
@@ -268,7 +268,7 @@ def _make_call_description(
         compiler options.
         """
         options = self._make_compiler_options(compiler_options)
-        call_args = tuple(sorted(options.items(), key=lambda X: X[0]))
+        call_args = tuple(sorted(options.items(), key=lambda x: x[0]))
         return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
 
     def _make_compiler_options(
@@ -296,9 +296,9 @@ class JaCeCompiled:
         - Handle pytrees.
     """
 
-    _csdfg: dace_helper.CompiledSDFG  # The compiled SDFG object.
-    _inp_names: tuple[str, ...]  # Name of all input arguments.
-    _out_names: tuple[str, ...]  # Name of all output arguments.
+    _csdfg: dace_helper.CompiledSDFG
+    _inp_names: tuple[str, ...]
+    _out_names: tuple[str, ...]
 
     def __init__(
         self,
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 2acbb7f..192c178 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -17,7 +17,7 @@
 from .primitive_translator import (
     PrimitiveTranslator,
     PrimitiveTranslatorCallable,
-    get_regsitered_primitive_translators,
+    get_registered_primitive_translators,
     make_primitive_translator,
     register_primitive_translator,
     set_active_primitive_translators_to,
@@ -31,7 +31,7 @@
     "PrimitiveTranslatorCallable",
     "TranslatedJaxprSDFG",
     "TranslationContext",
-    "get_regsitered_primitive_translators",
+    "get_registered_primitive_translators",
     "make_primitive_translator",
     "register_primitive_translator",
     "set_active_primitive_translators_to",
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 0a2a80d..d21b3f7 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -10,19 +10,19 @@
 from __future__ import annotations
 
 import copy
-from collections.abc import Mapping, MutableSequence, Sequence
+from collections.abc import Mapping, Sequence
 from typing import TYPE_CHECKING, Any, Literal, cast, overload
 
 import dace
 from dace import data as ddata, properties as dprop
 from jax import core as jax_core
 
+from jace import util
+
 
 if TYPE_CHECKING:
     from jace import translator
 
-from jace import util
-
 
 class JaxprTranslationBuilder:
     """Internal builder class for creating an SDFG equivalent of a `Jaxpr` instance.
@@ -59,7 +59,7 @@ class JaxprTranslationBuilder:
     process that is already going.
 
     Args:
-        primitive_translators:    Primitive to use during the translation.
+        primitive_translators:      Primitive translators to use in the translation.
 
     Notes:
         After a translation has been performed the translator object can be used again.
@@ -97,7 +97,7 @@ def translate_jaxpr(
         """Perform the translation of a Jaxpr into a SDFG.
 
         In case this function is called and `self` has an ongoing translation process, a new
-        translation context will be created. This allows to handled nested Jaxprs.
+        translation context will be created. This allows to handle nested Jaxprs.
         However, the variable map is shared among all.
 
         Returns:
@@ -235,7 +235,7 @@ def map_jax_var_to_sdfg(
         elif allow_fail:
             return None
         else:
-            KeyError(f"The Jax variable '{jax_var}' was never registered.")
+            raise KeyError(f"The Jax variable '{jax_var}' was never registered.")
         if sdfg_name not in self._ctx.sdfg.arrays:
             raise KeyError(
                 f"Jax variable '{jax_var}' was supposed to map to '{sdfg_name}',"
@@ -280,9 +280,6 @@ def add_jax_name_mapping(
         Args:
             jax_var:     The Jax variable.
             sdfg_name:   The name of the corresponding SDFG variable.
-
-        Todo:
-            - Implement a way to delete or to modify a mapping.
         """
         assert sdfg_name
 
@@ -325,7 +322,7 @@ def add_array(
             As a temporary fix for handling scalar return values, the function will always
             generate arrays, even if `arg` is a scalar.
             According to the dace developer, the majority of the backend, i.e. optimization
-            pipeline, should be handle to handle it. But there are some special parts that
+            pipeline, should be able to handle it. But there are some special parts that
             might explicitly want a scalar, it also might block certain compiler optimization.
         """
 
@@ -339,8 +336,8 @@ def add_array(
         as_transient = True
         strides = None
 
-        if shape == ():  # Temporary fix for handling DaCe scalars, see above for more.
-            shape = (1,)
+        # Temporary fix for handling DaCe scalars, see above for more.
+        shape = shape or (1,)
 
         # Propose a name and if needed extend it.
         arg_name = util.propose_jax_name(arg, self._jax_name_map)
@@ -452,14 +449,13 @@ def create_jax_var_list(  # type: ignore[misc]
     def _create_initial_input(
         self,
         jaxpr: jax_core.ClosedJaxpr,
-    ) -> Sequence[str]:
-        """Creates the input variables of `jaxpr` and return a list of their SDFG names.
+    ) -> None:
+        """Creates the input variables of `jaxpr`.
 
         Notes:
             The function will populate the `inp_names` member of the current context.
         """
-        if not self.is_allocated():
-            raise RuntimeError("Builder is not allocated, can not create constants.")
+        assert self.is_allocated(), "Builder is not allocated, can not create constants."
         assert self._ctx.inp_names is None
 
         # Handle the initial input arguments
@@ -475,21 +471,18 @@ def _create_initial_input(
         # The output list is populated by `self._translate_jaxpr_internal()`
         self._ctx.inp_names = tuple(init_in_var_names)
 
-        return init_in_var_names
-
     def _create_constants(
         self,
         jaxpr: jax_core.ClosedJaxpr,
-    ) -> Sequence[str]:
-        """Creates all constants requested by the `jaxpr` and return a list with their SDFG names.
+    ) -> None:
+        """Creates all constants requested by the `jaxpr`.
 
         The function will create an SDFG variable and add them as constant to the SDFG. Their value
         is deepcopied.
         """
-        if not self.is_allocated():
-            raise RuntimeError("Builder is not allocated, can not create constants.")
+        assert self.is_allocated(), "Builder is not allocated, can not create constants."
         if len(jaxpr.consts) == 0:
-            return ()
+            return
 
         sdfg_const_names: Sequence[str] = self.create_jax_var_list(
             jax_var_list=jaxpr.jaxpr.constvars,
@@ -502,7 +495,6 @@ def _create_constants(
             self._ctx.sdfg.add_constant(
                 sdfg_name, copy.deepcopy(const_value), self._ctx.sdfg.arrays[sdfg_name]
             )
-        return sdfg_const_names
 
     def _allocate_translation_ctx(
         self,
@@ -518,7 +510,6 @@ def _allocate_translation_ctx(
                 name=name,
             )
         )
-
         return self
 
     @property
@@ -560,14 +551,12 @@ def _translate_single_eqn(
 
         # Input/Output variables
         #  Using a tuple for the input ensures that it cannot be modified.
-        in_var_names: Sequence[str | None] = tuple(
-            self.create_jax_var_list(
-                eqn.invars,
-                prevent_creation=True,  # Inputs must already exists.
-                handle_literals=True,  #   but they can be literals.
-            )
+        in_var_names: Sequence[str | None] = self.create_jax_var_list(
+            eqn.invars,
+            prevent_creation=True,  # Inputs must already exists.
+            handle_literals=True,  #   but they can be literals.
         )
-        out_var_names: MutableSequence[str] = self.create_jax_var_list(
+        out_var_names: Sequence[str] = self.create_jax_var_list(
             eqn.outvars,
             only_creation=True,  # Output must not exist yet.
             update_var_mapping=True,
@@ -588,7 +577,7 @@ def _translate_single_eqn(
         new_sdfg_term_state = ptranslator(
             builder=self,
             in_var_names=in_var_names,
-            out_var_names=out_var_names,  # Might be modified by the translator!
+            out_var_names=out_var_names,
             eqn=eqn,
             eqn_state=eqn_state,
         )
@@ -601,17 +590,6 @@ def _translate_single_eqn(
         if not self._ctx.validate():
             raise RuntimeError("Detected an invalid SDFG under construction.")
 
-        # In case a translator decided to not use the variables we created for it, which is
-        #  allowed but it must update the `out_var_names` list correctly, we will now verify this.
-        for expectedSDFGName, jax_var in zip(out_var_names, eqn.outvars, strict=True):
-            mapped_sdfg_name = self.map_jax_var_to_sdfg(jax_var)
-            if mapped_sdfg_name != expectedSDFGName:
-                raise ValueError(
-                    f"Mapping inconsistency detected, expected that Jax variable"
-                    f" '{jax_var}' maps to '{expectedSDFGName}' but it actually"
-                    f" maps to '{mapped_sdfg_name}'."
-                )
-
         # Modify terminal root state of 'self'
         self._ctx.terminal_state = new_sdfg_term_state
 
@@ -657,7 +635,7 @@ def _translate_jaxpr_internal(
     def _handle_null_jaxpr(
         self,
         jaxpr: jax_core.ClosedJaxpr,
-    ) -> Sequence[str]:
+    ) -> list[str]:
         """This function is called in case a `Jaxpr` with zero equations is encountered.
 
         A function with zero equation might still have output, in which case an input is copied
@@ -666,7 +644,7 @@ def _handle_null_jaxpr(
         as input and output from the mapping.
 
         Returns:
-            The function returns a list denoting the SDFG variables that refers to the output.
+            The function returns a tuple containing the SDFG variables that refer to the output.
             The order of the list is the same as in `jaxpr.jaxpr.outvars`.
 
         Todo:
@@ -680,8 +658,8 @@ def _handle_null_jaxpr(
         assert self._ctx.out_names is None
 
         # There is not output so we do not have to copy anything around.
-        if len(jaxpr.out_avals) == 0:
-            return ()
+        if not jaxpr.out_avals:
+            return []
 
         # List of the real output variables.
         out_var_names: list[str] = []
@@ -720,7 +698,7 @@ def _handle_null_jaxpr(
             #  I am open for different approaches.
             self._jax_name_map.pop(jax_out_var)
 
-        return tuple(out_var_names)
+        return out_var_names
 
     @property
     def _start_state(self) -> dace.SDFGState:
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index f0b2088..13d1821 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -12,12 +12,12 @@
 
 from __future__ import annotations
 
-from abc import abstractmethod
+import abc
 from typing import TYPE_CHECKING, Literal, Protocol, cast, overload, runtime_checkable
 
 
 if TYPE_CHECKING:
-    from collections.abc import Callable, Mapping, MutableMapping, MutableSequence, Sequence
+    from collections.abc import Callable, Mapping, MutableMapping, Sequence
 
     import dace
     from jax import core as jax_core
@@ -32,17 +32,17 @@
 class PrimitiveTranslatorCallable(Protocol):
     """Callable version of the primitive translators.
 
-    Used for type annotation purposes, classes should be derived from `PrimitiveTranslator` instead.
+    Used for type annotation purposes, the proper public interface is `PrimitiveTranslator`.
     You can use `jace.translator.make_primitive_translator()` to add a `primitive` property to
     a callable.
     """
 
-    @abstractmethod
+    @abc.abstractmethod
     def __call__(
         self,
         builder: translator.JaxprTranslationBuilder,
         in_var_names: Sequence[str | None],
-        out_var_names: MutableSequence[str],
+        out_var_names: Sequence[str],
         eqn: jax_core.JaxprEqn,
         eqn_state: dace.SDFGState,
     ) -> dace.SDFGState | None:
@@ -66,14 +66,11 @@ def __call__(
         reachable from `eqn_state`. If the function returns `None` the builder will assume that
         primitive translator was able to fully construct the dataflow graph within `eqn_state`.
 
-        While a primitive translator is forbidden from meddling with the input variables mentioned
-        in `in_var_names` in any way, it is allowed to modify the output variables. For example
-        a translator could create a new SDFG variable, with different strides. But in that case
-        the primitive translator must update the internal mapping of the builder TBA HOW, and
-        modify the names passed through `out_var_names`. However, the translator is allowed to
-        create internal temporary variables without registering them to the mapping, as long as it
-        uses the supplied variables as final output. To ensure that there are no collision with
-        further variables, the translator should prefix them.
+        A primitive translator has to use the passed input variables, `in_var_names` and must write
+        its output into the variables indicated by `out_var_names`.
+        But it is allowed that a primitive translator creates intermediate values as needed.
+        To ensure that there are no collision with further variables, the translator should prefix
+        them, see the `name_prefix` argument of `JaxprTranslationBuilder.add_array()`.
 
         Args:
             builder:        The builder object of the translation.
@@ -104,7 +101,7 @@ class PrimitiveTranslator(PrimitiveTranslatorCallable, Protocol):
     """
 
     @property
-    @abstractmethod
+    @abc.abstractmethod
     def primitive(self) -> str:
         """Returns the name of the Jax primitive that `self` is able to handle."""
         ...
@@ -207,7 +204,7 @@ def wrapper(
     return wrapper if primitive_translator is None else wrapper(primitive_translator)
 
 
-def get_regsitered_primitive_translators() -> dict[str, translator.PrimitiveTranslator]:
+def get_registered_primitive_translators() -> dict[str, translator.PrimitiveTranslator]:
     """Returns a copy of the current state of JaCe's global primitive registry.
 
     The state returned by this function is compatible to what `jace.hit`'s `primitive_translators`
diff --git a/src/jace/translator/primitive_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
index 33f5800..8e68a75 100644
--- a/src/jace/translator/primitive_translators/alu_translator.py
+++ b/src/jace/translator/primitive_translators/alu_translator.py
@@ -20,7 +20,7 @@
 
 
 if TYPE_CHECKING:
-    from collections.abc import MutableSequence, Sequence
+    from collections.abc import Sequence
 
 
 class ALUTranslator(translator.PrimitiveTranslator):
@@ -48,7 +48,7 @@ def __call__(
         self,
         builder: translator.JaxprTranslationBuilder,
         in_var_names: Sequence[str | None],
-        out_var_names: MutableSequence[str],
+        out_var_names: Sequence[str],
         eqn: jax_core.JaxprEqn,
         eqn_state: dace.SDFGState,
     ) -> None:
diff --git a/tests/__init__.py b/tests/__init__.py
index 116302a..a5e868c 100644
--- a/tests/__init__.py
+++ b/tests/__init__.py
@@ -4,3 +4,10 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
+
+"""JaCe's tests.
+
+
+Note:
+    This is work in progress.
+"""
diff --git a/tests/test_jaxpr_translator_builder.py b/tests/test_jaxpr_translator_builder.py
index 75e8ded..c769788 100644
--- a/tests/test_jaxpr_translator_builder.py
+++ b/tests/test_jaxpr_translator_builder.py
@@ -42,7 +42,7 @@ def translation_builder():
     """Returns an allocated builder instance."""
     name = "fixture_builder"
     builder = translator.JaxprTranslationBuilder(
-        primitive_translators=translator.get_regsitered_primitive_translators()
+        primitive_translators=translator.get_registered_primitive_translators()
     )
     builder._allocate_translation_ctx(name=name)
     return builder
@@ -54,7 +54,7 @@ def test_builder_alloc() -> None:
     Does not use the fixture because it does it on its own.
     """
     builder = translator.JaxprTranslationBuilder(
-        primitive_translators=translator.get_regsitered_primitive_translators()
+        primitive_translators=translator.get_registered_primitive_translators()
     )
     assert not builder.is_allocated(), "Builder was created allocated."
     assert len(builder._ctx_stack) == 0
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 0c5faa6..c6dd33b 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -18,7 +18,7 @@
 import jace
 from jace import translator
 from jace.translator import (
-    get_regsitered_primitive_translators,
+    get_registered_primitive_translators,
     make_primitive_translator,
     register_primitive_translator,
     set_active_primitive_translators_to,
@@ -28,7 +28,7 @@
 @pytest.fixture(autouse=True)
 def _conserve_builtin_translators():
     """Restores the set of registered subtranslators after a test."""
-    initial_translators = get_regsitered_primitive_translators()
+    initial_translators = get_registered_primitive_translators()
     yield
     set_active_primitive_translators_to(initial_translators)
 
@@ -73,13 +73,13 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_regsitered_primitive_translators()) == 37
+    assert len(get_registered_primitive_translators()) == 37
 
 
 @pytest.mark.usefixtures("no_builtin_translators")
 def test_subtranslatior_managing():
     """Basic functionality of the subtranslators."""
-    original_active_subtrans = get_regsitered_primitive_translators()
+    original_active_subtrans = get_registered_primitive_translators()
     assert len(original_active_subtrans) == 0
 
     # Create the classes.
@@ -94,27 +94,27 @@ def test_subtranslatior_managing():
         assert register_primitive_translator(sub) is sub
 
     # Tests if they were correctly registered
-    active_subtrans = get_regsitered_primitive_translators()
+    active_subtrans = get_registered_primitive_translators()
     for expected in prim_translators:
         assert active_subtrans[expected.primitive] is expected
     assert len(active_subtrans) == 3
 
 
 def test_subtranslatior_managing_isolation():
-    """Tests if `get_regsitered_primitive_translators()` protects the internal registry."""
+    """Tests if `get_registered_primitive_translators()` protects the internal registry."""
     assert (
-        get_regsitered_primitive_translators()
+        get_registered_primitive_translators()
         is not translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
     )
 
-    initial_primitives = get_regsitered_primitive_translators()
-    assert get_regsitered_primitive_translators() is not initial_primitives
+    initial_primitives = get_registered_primitive_translators()
+    assert get_registered_primitive_translators() is not initial_primitives
     assert "add" in initial_primitives, "For this test the 'add' primitive must be registered."
     org_add_prim = initial_primitives["add"]
 
     initial_primitives["add"] = fake_add_translator
     assert org_add_prim is not fake_add_translator
-    assert get_regsitered_primitive_translators()["add"] is org_add_prim
+    assert get_registered_primitive_translators()["add"] is org_add_prim
 
 
 def test_subtranslatior_managing_swap():
@@ -124,23 +124,23 @@ def test_subtranslatior_managing_swap():
     def same_structure(d1: dict, d2: dict) -> bool:
         return d1.keys() == d2.keys() and all(id(d2[k]) == id(d1[k]) for k in d1)
 
-    initial_primitives = get_regsitered_primitive_translators()
+    initial_primitives = get_registered_primitive_translators()
     assert "add" in initial_primitives
 
     # Now mutate the dict a little bit, shallow copy it first.
     mutated_primitives = initial_primitives.copy()
     mutated_primitives["add"] = fake_add_translator
     assert mutated_primitives.keys() == initial_primitives.keys()
-    assert same_structure(initial_primitives, get_regsitered_primitive_translators())
+    assert same_structure(initial_primitives, get_registered_primitive_translators())
     assert not same_structure(mutated_primitives, initial_primitives)
-    assert not same_structure(mutated_primitives, get_regsitered_primitive_translators())
+    assert not same_structure(mutated_primitives, get_registered_primitive_translators())
 
     # Now change the initial one with the mutated one.
     #  The object is copied but should still have the same structure.
     old_active = set_active_primitive_translators_to(mutated_primitives)
     assert mutated_primitives is not translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
     assert same_structure(old_active, initial_primitives)
-    assert same_structure(mutated_primitives, get_regsitered_primitive_translators())
+    assert same_structure(mutated_primitives, get_registered_primitive_translators())
 
 
 @pytest.mark.usefixtures("no_builtin_translators")
@@ -155,12 +155,12 @@ def non_existing_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
 
     assert hasattr(non_existing_translator, "primitive")
     assert non_existing_translator.primitive == prim_name
-    assert len(get_regsitered_primitive_translators()) == 0
+    assert len(get_registered_primitive_translators()) == 0
 
 
 def test_subtranslatior_managing_overwriting():
     """Tests if we are able to overwrite something."""
-    current_add_translator = get_regsitered_primitive_translators()["add"]
+    current_add_translator = get_registered_primitive_translators()["add"]
 
     @make_primitive_translator("add")
     def useless_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
@@ -174,13 +174,13 @@ def useless_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
         ),
     ):
         register_primitive_translator(useless_add_translator)
-    assert current_add_translator is get_regsitered_primitive_translators()["add"]
+    assert current_add_translator is get_registered_primitive_translators()["add"]
 
     # Now we use overwrite, thus it will now work.
     assert useless_add_translator is register_primitive_translator(
         useless_add_translator, overwrite=True
     )
-    assert useless_add_translator is get_regsitered_primitive_translators()["add"]
+    assert useless_add_translator is get_registered_primitive_translators()["add"]
 
 
 @pytest.mark.usefixtures("no_builtin_translators")

From ff6699509149fc031a2d1dba8fe6a9e807fdb209 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 4 Jun 2024 08:52:19 +0200
Subject: [PATCH 305/458] Modified some tests.

---
 tests/integration_tests/test_jaxpr_translator_builder.py      | 1 +
 tests/integration_tests/test_primitive_translator_managing.py | 2 +-
 2 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 3d742ca..e138a37 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -565,6 +565,7 @@ def wrapped(A: np.ndarray, B: np.ndarray) -> tuple[np.ndarray, np.ndarray]:
     assert np.allclose(ref, res)
 
 
+@pytest.mark.skip(reason="Direct returns, in a non empty context does not work yet.")
 def test_builder_direct_return() -> None:
     """Tests the case, when an input value is returned as output.
 
diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index ecae6d1..e4b60b1 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -73,7 +73,7 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_registered_primitive_translators()) == 37
+    assert len(get_registered_primitive_translators()) == 62
 
 
 @pytest.mark.usefixtures("no_builtin_translators")

From 74435a20a457117a0bfc00d46cb53bed960225ae Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 4 Jun 2024 13:45:26 +0200
Subject: [PATCH 306/458] Reorganized some tests.

---
 src/jace/translator/primitive_translators/__init__.py |  6 +++++-
 ...anslators.py => arithmetic_logical_translators.py} |  0
 .../primitive_translators/select_n_translator.py      |  7 ++-----
 ...> test_primitive_arithmetic_logical_operations.py} |  2 +-
 .../primitive_translators/test_primitive_select_n.py  | 11 ++++++-----
 tests/unit_tests/test_jax_api.py                      |  2 +-
 6 files changed, 15 insertions(+), 13 deletions(-)
 rename src/jace/translator/primitive_translators/{alu_translators.py => arithmetic_logical_translators.py} (100%)
 rename tests/integration_tests/primitive_translators/{test_primitive_alu.py => test_primitive_arithmetic_logical_operations.py} (98%)

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index a3221d4..f06a67a 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -8,7 +8,10 @@
 
 from __future__ import annotations
 
-from .alu_translators import ArithmeticOperationTranslator
+from .arithmetic_logical_translators import (
+    ArithmeticOperationTranslator,
+    LogicalOperationTranslator,
+)
 from .broadcast_in_dim_translator import BroadcastInDimTranslator
 from .convert_element_type_translator import ConvertElementTypeTranslator
 from .copy_translator import CopyTranslator, DevicePutTranslator
@@ -26,6 +29,7 @@
     "CopyTranslator",
     "DevicePutTranslator",
     "IotaTranslator",
+    "LogicalOperationTranslator",
     "ReshapeTranslator",
     "SelectNTranslator",
     "SlicingTranslator",
diff --git a/src/jace/translator/primitive_translators/alu_translators.py b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
similarity index 100%
rename from src/jace/translator/primitive_translators/alu_translators.py
rename to src/jace/translator/primitive_translators/arithmetic_logical_translators.py
diff --git a/src/jace/translator/primitive_translators/select_n_translator.py b/src/jace/translator/primitive_translators/select_n_translator.py
index 084ced2..3d21113 100644
--- a/src/jace/translator/primitive_translators/select_n_translator.py
+++ b/src/jace/translator/primitive_translators/select_n_translator.py
@@ -49,8 +49,7 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        """Writes the selection code.
-        """
+        """Writes the selection code."""
         if len(in_var_names) == 3:
             # This order is correct, since `False` is interpreted as `0`, which means the first
             #  case. DaCe seems to have some problems with bools and integer casting around,
@@ -79,15 +78,13 @@ def make_input_memlets(
             if in_var_name
         }
 
-
     def literal_substitution(
         self,
         tskl_code: str,
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        """Can not be done by the base because of the renaming.
-        """
+        """Can not be done by the base because of the renaming."""
         for i, in_var_name in enumerate(in_var_names[1:]):
             if in_var_name is not None:
                 continue
diff --git a/tests/integration_tests/primitive_translators/test_primitive_alu.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
similarity index 98%
rename from tests/integration_tests/primitive_translators/test_primitive_alu.py
rename to tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index 88c4c53..d2acc78 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_alu.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -39,7 +39,7 @@ def _only_alu_translators():
     This ensures that Jax is not doing some stuff that is supposed to be handled by the
     test class, such as broadcasting. It makes writing tests a bit harder, but it is worth.
     """
-    from jace.translator.primitive_translators.alu_translators import (
+    from jace.translator.primitive_translators.arithmetic_logical_translators import (
         _ARITMETIC_OPERATION_TEMPLATES,
         _LOGICAL_OPERATION_TEMPLATES,
     )
diff --git a/tests/integration_tests/primitive_translators/test_primitive_select_n.py b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
index ec2285f..deda424 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_select_n.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
@@ -9,11 +9,10 @@
 
 from __future__ import annotations
 
-from typing import Any, Callable
+from typing import TYPE_CHECKING, Any
 
 import jax
 import numpy as np
-import pytest
 from jax import numpy as jnp
 
 import jace
@@ -21,8 +20,11 @@
 from tests import util as testutil
 
 
-def _perform_test(testee: Callable, *args: Any):
+if TYPE_CHECKING:
+    from collections.abc import Callable
+
 
+def _perform_test(testee: Callable, *args: Any):
     res = testee(*args)
     ref = jace.jit(testee)(*args)
     assert np.all(res == ref)
@@ -42,8 +44,7 @@ def testee(P: Any, T: Any, F: Any) -> Any:
 
 
 def test_select_n_where_literal():
-    """`np.where` where one of the input is a literal.
-    """
+    """`np.where` where one of the input is a literal."""
 
     def testee1(P: Any, F: Any) -> Any:
         return jnp.where(P, 2, F)
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index 41b2f10..d18a228 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -187,7 +187,7 @@ def df(x):
     assert df(x2) == df_x2, f"Failed upper branch, expected '{df_x2}', got '{res_2}'."
 
 
-def test_disabled_x64():
+def test_disabled_x64() -> None:
     """Tests the behaviour of the tool chain if x64 support is disabled.
 
     Notes:

From acb9501948b2a01d690a34d56831a9c5ae9ce5ca Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 4 Jun 2024 17:22:58 +0200
Subject: [PATCH 307/458] Updated the calling code.

---
 src/jace/util/compiling.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index 3aec681..0461883 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -121,12 +121,16 @@ def run_jax_sdfg(
         if util.is_scalar(in_val):
             # Currently the translator makes scalar into arrays, this has to be reflected here
             in_val = np.array([in_val])
+        elif util.is_jax_array(in_val):
+            # TODO(phimuell): Add test for this.
+            if not util.is_fully_addressable(in_val):
+                raise ValueError(f"Passed a not fully addressable Jax array as '{in_name}'")
+            in_val = in_val.__array__()
         call_args[in_name] = in_val
 
     for out_name, sarray in ((name, sdfg.arrays[name]) for name in out_names):
         if out_name in call_args:
             if util.is_jax_array(call_args[out_name]):
-                # Jax arrays are immutable, so they can not be return values too.
                 raise ValueError("Passed a Jax array as output.")
         else:
             call_args[out_name] = dace_data.make_array_from_descriptor(sarray)

From 5373ca9f3376dd49329bfc7316959889029d9549 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 4 Jun 2024 17:24:59 +0200
Subject: [PATCH 308/458] It is now also possible to generate random complex.

---
 tests/util.py | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/tests/util.py b/tests/util.py
index c434666..ba65808 100644
--- a/tests/util.py
+++ b/tests/util.py
@@ -36,8 +36,9 @@ def mkarray(
         shape:      The shape to use.
         dtype:      The data type to use.
 
-    Todo:
-        - Also support integers.
+    Notes:
+        Floating point based values are generated in the range 0 to 1.0, integers are inside the
+        range `-2**16` to `2**16`.
     """
 
     if shape == ():
@@ -48,5 +49,7 @@ def mkarray(
     if dtype == np.bool_:
         return np.random.random(shape) > 0.5  # noqa: NPY002
     if np.issubdtype(dtype, np.integer):
-        return np.random.randint(low=-2**30, high=2**30, size=shape, dtype=dtype)  # noqa: NPY002
+        return np.random.randint(low=-2**16, high=2**16, size=shape, dtype=dtype)  # noqa: NPY002
+    if np.issubdtype(dtype, np.complexfloating):
+        return np.array(mkarray(shape, np.float64) + 1.0j * mkarray(shape, np.float64), dtype=dtype)
     return np.array(np.random.random(shape), dtype=dtype)  # noqa: NPY002

From e9597f2b5356c396fe550d6e15c6dea2c74c7ca0 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 4 Jun 2024 18:01:56 +0200
Subject: [PATCH 309/458] Updated the alu tests.

---
 ...primitive_arithmetic_logical_operations.py | 67 +++++++++++++++++++
 1 file changed, 67 insertions(+)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index d2acc78..96837c2 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -18,6 +18,7 @@
 from collections.abc import Callable
 from typing import TYPE_CHECKING, Any
 
+import dace
 import jax
 import numpy as np
 import pytest
@@ -79,6 +80,47 @@ def logical_ops(request) -> tuple[Callable, tuple[np.ndarray, ...]]:
     )
 
 
+@pytest.fixture(
+    params=[
+        np.float32,
+        pytest.param(
+            np.complex64,
+            marks=pytest.mark.skip("Some complex values operations are not fully supported."),
+        ),
+    ]
+)
+def dtype(request) -> np.generic:
+    """The dtypes that should be used for the full alu tests."""
+    return request.param
+
+
+@pytest.fixture(
+    params=[
+        lambda x: +(x - 1.0),
+        lambda x: -x,
+        jnp.floor,
+        jnp.ceil,
+        jnp.round,
+        jnp.exp2,
+        jnp.exp,
+        lambda x: jnp.abs(x - 0.5),
+        lambda x: jnp.log(x + 1.0),
+        lambda x: jnp.sqrt(x**2),
+        # The following have a restricted input domain, so we use `x = f^{-1}(f(x))`.
+        lambda x: jnp.log1p(jnp.expm1(x)),
+        lambda x: jnp.asin(jnp.sin(x)),
+        lambda x: jnp.acos(jnp.cos(x)),
+        lambda x: jnp.atan(jnp.tan(x)),
+        lambda x: jnp.asinh(jnp.sinh(x)),
+        lambda x: jnp.acosh(jnp.cosh(x)),
+        lambda x: jnp.atanh(jnp.tanh(x)),
+    ]
+)
+def alu_unary_ops(request, dtype) -> tuple[Callable, np.ndarray]:
+    """The inputs and the operation we need for the full test."""
+    return (request.param, testutil.mkarray((2, 2), dtype))
+
+
 def _perform_alu_test(testee: Callable, *args: Any) -> None:
     """General function that just performs the test."""
     wrapped = jace.jit(testee)
@@ -254,6 +296,22 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     _perform_alu_test(testee, B, A)
 
 
+def test_alu_unary_isfinite():
+    def testee(A: np.ndarray) -> np.ndarray:
+        return jnp.isfinite(A)
+
+    A = np.array([np.inf, +np.inf, -np.inf, np.nan, -np.nan, 1.0])
+
+    args = dace.Config.get("compiler", "cpu", "args")
+    try:
+        new_args = args.replace("-ffast-math", "-fno-finite-math-only")
+        dace.Config.set("compiler", "cpu", "args", value=new_args)
+        _perform_alu_test(testee, A)
+
+    finally:
+        dace.Config.set("compiler", "cpu", "args", value=args)
+
+
 def test_alu_logical_bitwise_operation(
     logical_ops: tuple[Callable, tuple[np.ndarray, ...]],
 ) -> None:
@@ -264,3 +322,12 @@ def testee(*args: np.ndarray) -> np.ndarray:
         return logical_ops[0](*args)
 
     _perform_alu_test(testee, *inputs)
+
+
+def test_alu_general_unary(alu_unary_ops: tuple[Callable, np.ndarray]):
+    """General test for the unary operations."""
+
+    def testee(A: np.ndarray) -> np.ndarray:
+        return alu_unary_ops[0](A)
+
+    _perform_alu_test(testee, alu_unary_ops[1])

From 4499cfb3d914d73ff7fefbaf771272626876539a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 5 Jun 2024 07:34:25 +0200
Subject: [PATCH 310/458] Enrique's suggestions/comments.

---
 CODING_GUIDELINES.md                          |   4 +-
 src/jace/api.py                               |  11 +-
 src/jace/optimization.py                      |  11 +-
 src/jace/stages.py                            | 104 ++++----
 src/jace/translator/__init__.py               |   4 +-
 .../translator/jaxpr_translator_builder.py    | 227 +++++++++---------
 src/jace/translator/post_translation.py       |  27 +--
 src/jace/translator/primitive_translator.py   | 115 +++++----
 src/jace/translator/translated_jaxpr_sdfg.py  |  35 ++-
 src/jace/util/__init__.py                     |  14 +-
 src/jace/util/compiling.py                    |  78 +++---
 src/jace/util/jax_helper.py                   |  61 +++--
 src/jace/util/{util.py => misc.py}            |   0
 src/jace/util/traits.py                       |  49 +---
 src/jace/util/translation_cache.py            |  77 +++---
 tests/test_jax_api.py                         |  17 +-
 16 files changed, 401 insertions(+), 433 deletions(-)
 rename src/jace/util/{util.py => misc.py} (100%)

diff --git a/CODING_GUIDELINES.md b/CODING_GUIDELINES.md
index c7c5d3c..582ae00 100644
--- a/CODING_GUIDELINES.md
+++ b/CODING_GUIDELINES.md
@@ -9,15 +9,13 @@ We deviate from the [Google Python Style Guide][google-style-guide] only in the
 - We use [`ruff-linter`][ruff-linter] instead of [`pylint`][pylint].
 - We use [`ruff-formatter`][ruff-formatter] for source code and imports formatting, which may work differently than indicated by the guidelines in section [_3. Python Style Rules_](https://google.github.io/styleguide/pyguide.html#3-python-style-rules). For example, maximum line length is set to 100 instead of 79 (although docstring lines should still be limited to 79).
 - According to subsection [_2.19 Power Features_](https://google.github.io/styleguide/pyguide.html#219-power-features), direct use of _power features_ (e.g. custom metaclasses, import hacks, reflection) should be avoided, but standard library classes that internally use these power features are accepted. Following the same spirit, we allow the use of power features in infrastructure code with similar functionality and scope as the Python standard library.
-- For readability purposes, when a docstring contains more than the required summary line, we prefer indenting the first line at the same cursor position as the first opening quote, although this is not explicitly considered in the doctring conventions described in subsection [_3.8.1 Docstrings_](https://google.github.io/styleguide/pyguide.html#381-docstrings). Example:
 
   ```python
   # single line docstring
   """A one-line summary of the module or program, terminated by a period."""
 
   # multi-line docstring
-  """
-  A one-line summary of the module or program, terminated by a period.
+  """ A one-line summary of the module or program, terminated by a period.
 
   Leave one blank line. The rest of this docstring should contain an
   overall description of the module or program.
diff --git a/src/jace/api.py b/src/jace/api.py
index 0fd1d31..9f128b3 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -55,13 +55,14 @@ def jit(
 ) -> stages.JaCeWrapped | Callable[[Callable], stages.JaCeWrapped]:
     """JaCe's replacement for `jax.jit` (just-in-time) wrapper.
 
-    It works the same way as `jax.jit` does, but instead of using XLA the computation is lowered
-    to DaCe. In addition it accepts some JaCe specific arguments, it accepts the same arguments
-    as `jax.jit` does.
+    It works the same way as `jax.jit` does, but instead of using XLA the
+    computation is lowered to DaCe. In addition it accepts some JaCe specific
+    arguments.
 
     Args:
-        primitive_translators:    Use these primitive translators for the lowering to SDFG.
-            If not specified the translators in the global registry are used.
+        primitive_translators: Use these primitive translators for the lowering
+            to SDFG. If not specified the translators in the global registry are
+            used.
 
     Notes:
         After constructions any change to `primitive_translators` has no effect.
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index 6d59926..7240b79 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -53,13 +53,14 @@ def jace_optimize(
 ) -> None:
     """Performs optimization of the translated SDFG _in place_.
 
-    It is recommended to use the `CompilerOptions` `TypedDict` to pass options to the function.
-    However, any option that is not specified will be interpreted as to be disabled.
+    It is recommended to use the `CompilerOptions` `TypedDict` to pass options
+    to the function. However, any option that is not specified will be
+    interpreted as to be disabled.
 
     Args:
-        tsdfg:          The translated SDFG that should be optimized.
-        simplify:       Run the simplification pipeline.
-        auto_optimize:  Run the auto optimization pipeline (currently does nothing)
+        tsdfg: The translated SDFG that should be optimized.
+        simplify: Run the simplification pipeline.
+        auto_optimize: Run the auto optimization pipeline (currently does nothing)
     """
     # Currently this function exists primarily for the same of existing.
 
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 3abe071..9dbcb7e 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -12,16 +12,17 @@
 As in Jax JaCe has different stages, the terminology is taken from
 [Jax' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
 - Stage out:
-    In this phase we translate an executable python function into Jaxpr.
+    In this phase an executable Python function is translated to Jaxpr.
 - Lower:
-    This will transform the Jaxpr into an SDFG equivalent. As a implementation note,
-    currently this and the previous step are handled as a single step.
+    This will transform the Jaxpr into an SDFG equivalent. As a implementation
+    note, currently this and the previous step are handled as a single step.
 - Compile:
     This will turn the SDFG into an executable object, see `dace.codegen.CompiledSDFG`.
 - Execution:
     This is the actual running of the computation.
 
-As in Jax the `stages` module give access to the last three stages, but not the first one.
+As in Jax the `stages` module give access to the last three stages, but not
+the first one.
 """
 
 from __future__ import annotations
@@ -54,26 +55,28 @@
 class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
     """A function ready to be specialized, lowered, and compiled.
 
-    This class represents the output of functions such as `jace.jit()` and is the first stage in
-    the translation/compilation chain of JaCe. A user should never create a `JaCeWrapped` object
-    directly, instead `jace.jit` should be used for that.
-    While it supports just-in-time lowering and compilation, by just calling it, these steps can
-    also be performed explicitly. The lowering performed by this stage is cached, thus if a
-    `JaCeWrapped` object is lowered later, with the same argument the result is taken from the
-    cache. Furthermore, a `JaCeWrapped` object is composable with all Jax transformations.
+    This class represents the output of functions such as `jace.jit()` and is
+    the first stage in the translation/compilation chain of JaCe. A user should
+    never create a `JaCeWrapped` object directly, instead `jace.jit` should be
+    used for that. While it supports just-in-time lowering and compilation, by
+    just calling it, these steps can also be performed explicitly. The lowering
+    performed by this stage is cached, thus if a `JaCeWrapped` object is lowered
+    later, with the same argument the result is taken from the cache.
+    Furthermore, a `JaCeWrapped` object is composable with all Jax transformations.
 
     Args:
-        fun:                    The function that is wrapped.
-        primitive_translators:  The list of primitive translators that that should be used.
-        jit_options:            Options to influence the jit process.
+        fun: The function that is wrapped.
+        primitive_translators: The list of primitive translators that that should be used.
+        jit_options: Options to influence the jit process.
 
     Todo:
-        - Handle pytrees.
-        - Handle all options to `jax.jit`.
+        - Support pytrees.
+        - Support keyword arguments and default values of the wrapped function.
+        - Support static arguments.
 
     Note:
-        The tracing of function will always happen with enabled `x64` mode, which is implicitly
-        and temporary activated while tracing.
+        The tracing of function will always happen with enabled `x64` mode,
+        which is implicitly and temporary activated while tracing.
     """
 
     _fun: Callable
@@ -122,13 +125,14 @@ def lower(
     ) -> JaCeLowered:
         """Lower this function explicitly for the given arguments.
 
-        Performs the first two steps of the AOT steps described above, i.e. trace the wrapped
-        function with the given arguments and stage it out to a Jaxpr. Then translate it to SDFG.
-        The result is encapsulated inside a `JaCeLowered` object which can later be compiled.
+        Performs the first two steps of the AOT steps described above, i.e.
+        trace the wrapped function with the given arguments and stage it out
+        to a Jaxpr. Then translate it to SDFG. The result is encapsulated
+        inside a `JaCeLowered` object which can later be compiled.
 
         Note:
-            The call to the function is cached. As key an abstract description of the call,
-            similar to the tracers used by Jax, is used.
+            The call to the function is cached. As key an abstract description
+            of the call, similar to the tracers used by Jax, is used.
             The tracing is always done with activated `x64` mode.
         """
         if len(kwargs) != 0:
@@ -175,10 +179,6 @@ def _make_call_description(
         """This function computes the key for the `JaCeWrapped.lower()` call inside the cache.
 
         The function will compute a full abstract description on its argument.
-
-        Todo:
-            - Support keyword arguments and default values of the wrapped function.
-            - Support static arguments.
         """
         call_args = tuple(tcache._AbstractCallArgument.from_value(x) for x in args)
         return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
@@ -187,19 +187,18 @@ def _make_call_description(
 class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
     """Represents the original computation as an SDFG.
 
-    This class represents the output of `JaCeWrapped.lower()` and represents the originally wrapped
-    computation as an SDFG. This stage is followed by the `JaCeCompiled` stage.
+    This class is the output type of `JaCeWrapped.lower()` and represents the
+    originally wrapped computation as an SDFG. This stage is followed by the
+    `JaCeCompiled` stage.
 
     Args:
-        tsdfg:      The translated SDFG object representing the computation.
+        tsdfg: The translated SDFG object representing the computation.
 
     Note:
-        `self` will manage the passed `tsdfg` object. Modifying it results in undefined behavior.
-        Although `JaCeWrapped` is composable with Jax transformations `JaCeLowered` is not.
-        A user should never create such an object, instead `JaCeWrapped.lower()` should be used.
-
-    Todo:
-        - Handle pytrees.
+        `self` will manage the passed `tsdfg` object. Modifying it results in
+        undefined behavior. Although `JaCeWrapped` is composable with Jax
+        transformations `JaCeLowered` is not. A user should never create such
+        an object, instead `JaCeWrapped.lower()` should be used.
     """
 
     _translated_sdfg: translator.TranslatedJaxprSDFG
@@ -218,13 +217,14 @@ def compile(
     ) -> JaCeCompiled:
         """Optimize and compile the lowered SDFG using `compiler_options`.
 
-        Returns an object that encapsulates a compiled SDFG object. To influence the various
-        optimizations and compile options of JaCe you can use the `compiler_options` argument.
-        If nothing is specified `jace.optimization.DEFAULT_OPTIMIZATIONS` will be used.
+        Returns an object that encapsulates a compiled SDFG object. To influence
+        the various optimizations and compile options of JaCe you can use the
+        `compiler_options` argument. If nothing is specified
+        `jace.optimization.DEFAULT_OPTIMIZATIONS` will be used.
 
         Note:
-            Before `compiler_options` is forwarded to `jace_optimize()` it will be merged with
-            the default arguments.
+            Before `compiler_options` is forwarded to `jace_optimize()` it
+            will be merged with the default arguments.
         """
         # We **must** deepcopy before we do any optimization, because all optimizations are in
         #  place, however, to properly cache stages, stages needs to be immutable.
@@ -240,8 +240,8 @@ def compile(
     def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
         """Returns the internal SDFG.
 
-        The function returns a `TranslatedJaxprSDFG` object. Direct modification of the returned
-        object is forbidden and will cause undefined behaviour.
+        The function returns a `TranslatedJaxprSDFG` object. Direct modification
+        of the returned object is forbidden and will cause undefined behaviour.
         """
         if (dialect is None) or (dialect.upper() == "SDFG"):
             return self._translated_sdfg
@@ -264,8 +264,8 @@ def _make_call_description(
     ) -> tcache.StageTransformationSpec:
         """This function computes the key for the `self.compile()` call inside the cache.
 
-        The key that is computed by this function is based on the concrete values of the passed
-        compiler options.
+        The key that is computed by this function is based on the concrete
+        values of the passed compiler options.
         """
         options = self._make_compiler_options(compiler_options)
         call_args = tuple(sorted(options.items(), key=lambda x: x[0]))
@@ -281,13 +281,13 @@ def _make_compiler_options(
 class JaCeCompiled:
     """Compiled version of the SDFG.
 
-    This is the last stage of the jit chain. A user should never create a `JaCeCompiled` instance,
-    instead `JaCeLowered.compile()` should be used.
+    This is the last stage of the jit chain. A user should never create a
+    `JaCeCompiled` instance, instead `JaCeLowered.compile()` should be used.
 
     Args:
-        csdfg:      The compiled SDFG object.
-        inp_names:  Names of the SDFG variables used as inputs.
-        out_names:  Names of the SDFG variables used as outputs.
+        csdfg: The compiled SDFG object.
+        inp_names: Names of the SDFG variables used as inputs.
+        out_names: Names of the SDFG variables used as outputs.
 
     Note:
         The class assumes ownership of its input arguments.
@@ -319,8 +319,8 @@ def __call__(
     ) -> Any:
         """Calls the embedded computation.
 
-        The arguments must be the same as for the wrapped function, but with all static arguments
-        removed.
+        The arguments must be the same as for the wrapped function, but with
+        all static arguments removed.
         """
         return util.run_jax_sdfg(
             self._csdfg,
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 192c178..7c2a1c4 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -7,8 +7,8 @@
 
 """Subpackage containing all the code related to the Jaxpr to SDFG translation.
 
-The concrete primitive translators that ships with JaCe are inside the `primitive_translators`
-subpackage.
+The concrete primitive translators that ships with JaCe are inside the
+`primitive_translators` subpackage.
 """
 
 from __future__ import annotations
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index d21b3f7..4e42262 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -27,8 +27,8 @@
 class JaxprTranslationBuilder:
     """Internal builder class for creating an SDFG equivalent of a `Jaxpr` instance.
 
-    The SDFG created by this class has a very particular form, which we call canonical. The main
-    features of such an SDFG are:
+    The SDFG created by this class has a very particular form, which we call
+    canonical. The main features of such an SDFG are:
     - the SDFG is a list of states, ideally each state corresponds to single Jax primitive,
     - it has a single source and sink state.
     - all variable names are derived from Jax names,
@@ -36,35 +36,38 @@ class JaxprTranslationBuilder:
     - It lacks the special `__return` variable,
     - the `arg_names` parameter is not set.
 
-    For these reasons the SDFG is not directly usable, and further manipulations have to be
-    performed. Especially, DaCe's validation function will fail and it is unable to be processed
-    by JaCe's optimization pipeline. For more information also see `jace.translator.post_translation`
-    module.
-
-    The idea of the translator is extremely simple. A Jaxpr is essentially a list consisting of
-    more or less simple instructions/equations, they get processed one after the other. Each
-    equation is translated into its own state that is successively appended to the SDFG, while the
-    SDFG is being build, which explains the particular form of the SDFG.
-
-    However, the actual translation of the equations is not handled by the builder. Instead the
-    request is forwarded to a `PrimitiveTranslator` object, known as primitive translator. This is
-    a highly specialized object that is able to handle one kind of primitive. For more information
-    on them see the documentation of `PrimitiveTranslator`.
-
-    To start a translation the `translate_jaxpr()` function has to be called, if this happens it is
-    said that the builder has an ongoing translation. The first translator is known as root,
-    translator. If `translate_jaxpr()` is called on a builder that has an ongoing translation,
-    a new translation context will be set up. Thus the builder will then translate the supplied
-    (nested) Jaxpr and return the result. However, this will have no influence on the translation
-    process that is already going.
+    For these reasons the SDFG is not directly usable, and further manipulations
+    have to be performed. Especially, DaCe's validation function will fail and
+    it is unable to be processed by JaCe's optimization pipeline. For more
+    information also see `jace.translator.post_translation` module.
+
+    The idea of the translator is extremely simple. A Jaxpr is essentially a
+    list consisting of more or less simple instructions/equations, they get
+    processed one after the other. Each equation is translated into its own
+    state that is successively appended to the SDFG, while the SDFG is being
+    build, which explains the particular form of the SDFG.
+
+    However, the actual translation of the equations is not handled by the
+    builder. Instead the request is forwarded to a `PrimitiveTranslator`
+    object, known as primitive translator. This is a highly specialized object
+    that is able to handle one kind of primitive. For more information on them
+    see the documentation of `PrimitiveTranslator`.
+
+    To start a translation the `translate_jaxpr()` function has to be called,
+    if this happens it is said that the builder has an ongoing translation.
+    The first translator is known as root, translator. If `translate_jaxpr()`
+    is called on a builder that has an ongoing translation, a new translation
+    context will be set up. Thus the builder will then translate the supplied
+    (nested) Jaxpr and return the result. However, this will have no influence
+    on the translation process that is already going.
 
     Args:
-        primitive_translators:      Primitive translators to use in the translation.
+        primitive_translators: Primitive translators to use in the translation.
 
     Notes:
-        After a translation has been performed the translator object can be used again.
-        Currently the builder will generate only Array as SDFG variables, however, this is a
-        temporary solution, see `add_array()`.
+        After a translation has been performed the translator object can be used
+        again. Currently the builder will generate only Array as SDFG variables,
+        however, this is a temporary solution, see `add_array()`.
     """
 
     _primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable]
@@ -96,18 +99,19 @@ def translate_jaxpr(
     ) -> TranslationContext:
         """Perform the translation of a Jaxpr into a SDFG.
 
-        In case this function is called and `self` has an ongoing translation process, a new
-        translation context will be created. This allows to handle nested Jaxprs.
-        However, the variable map is shared among all.
+        In case this function is called and `self` has an ongoing translation
+        process, a new translation context will be created. This allows to
+        handle nested Jaxprs. However, the variable map is shared among all.
 
         Returns:
-            The function will translate the passed Jaxpr object into an SDFG in canonical form.
-            This SDFG together with additional meta data, that is needed for further processing
-            is encapsulated inside a `TranslationContext` object.
-            For further use it should be passed to `postprocess_jaxpr_sdfg()`.
+            The function will translate the passed Jaxpr object into an SDFG
+            in canonical form. This SDFG together with additional meta data,
+            that is needed for further processing is encapsulated inside a
+            `TranslationContext` object. For further use it should be passed
+            to `postprocess_jaxpr_sdfg()`.
 
         Args:
-            name:   Use this name for the SDFG instead some generated one.
+            name: Use this name for the SDFG instead some generated one.
         """
 
         if len(jaxpr.effects) != 0:
@@ -137,21 +141,22 @@ def append_new_state(
     ) -> dace.SDFGState:
         """Creates a new `SDFGState`, adds it to the SDFG and returns it.
 
-        By default the new state is appended to the current terminal state. However, if
-        `prev_state` is specified it will be appended to it.
-        In case the new state is appended to the current terminal state, this will modify the
-        terminal state of `self`.
+        By default the new state is appended to the current terminal state.
+        However, if `prev_state` is specified it will be appended to it. In
+        case the new state is appended to the current terminal state, this will
+        modify the terminal state of `self`.
 
         Args:
-            label:          The name that should be given to the new `SDFGState`.
-            condition:      The condition of the state transitions used on the `InterstateEdge`.
-            assignments:    Symbol assignments that should be done during the transition.
-            prev_state:     Alternative `SDFGState` at which we should append the new state.
+            label: The name that should be given to the new `SDFGState`.
+            condition: The condition of the state transitions used on the `InterstateEdge`.
+            assignments: Symbol assignments that should be done during the transition.
+            prev_state: Alternative `SDFGState` at which we should append the new state.
 
         Notes:
-            It is potentially dangerous to not append to the current terminal state, as a
-            canonical SDFG only has one sink state. If this is done the user has to ensure,
-            that at the end of the processing the SDFG is back in canonical form.
+            It is potentially dangerous to not append to the current terminal
+            state, as a canonical SDFG only has one sink state. If this is done
+            the user has to ensure, that at the end of the processing the SDFG
+            is back in canonical form.
         """
         if isinstance(label, str) and (not util.VALID_SDFG_OBJ_NAME.fullmatch(label)):
             raise ValueError(f"Can not create state with label '{label}' since it is invalid.")
@@ -180,8 +185,8 @@ def arrays(self) -> Mapping[str, ddata.Data]:
         """Get all data descriptors that are currently known to the SDFG.
 
         Notes:
-            Essentially a shorthand and preferred way for `self.sdfg.arrays`. For getting a
-            specific data descriptor use `self.get_array()`.
+            Essentially a shorthand and preferred way for `self.sdfg.arrays`.
+            For getting a specific data descriptor use `self.get_array()`.
         """
         return cast(Mapping[str, ddata.Data], self._ctx.sdfg.arrays)
 
@@ -191,9 +196,9 @@ def get_array(
     ) -> ddata.Data:
         """Returns the SDFG `Data` object `name` referees to.
 
-        `name` can either be a string, in which case it is interpreted as a verbatim SDFG name.
-        If it is a Jax or JaCe variable, the function will first perform a lookup using
-        `self.map_jax_var_to_sdfg(name)`.
+        `name` can either be a string, in which case it is interpreted as a
+        verbatim SDFG name. If it is a Jax or JaCe variable, the function will
+        first perform a lookup using `self.map_jax_var_to_sdfg(name)`.
         """
         if isinstance(name, (jax_core.Var, util.JaCeVar)):
             sdfg_name: str = self.map_jax_var_to_sdfg(name)
@@ -225,8 +230,8 @@ def map_jax_var_to_sdfg(
         """Get the name of the SDFG variable to which `jax_var` is referring to.
 
         Args:
-            jax_var:        The Jax variable to look up.
-            allow_fail:     If no mapping is known return `None` instead of raising `KeyError`.
+            jax_var: The Jax variable to look up.
+            allow_fail: If no mapping is known return `None` instead of raising `KeyError`.
         """
         if isinstance(jax_var, jax_core.Literal):
             raise RuntimeError(f"There is no SDFG variable for literal '{jax_var}'.")
@@ -245,10 +250,7 @@ def map_jax_var_to_sdfg(
 
     @property
     def sdfg(self) -> dace.SDFG:
-        """Returns the SDFG that is currently constructed.
-
-        If you want access to the arrays of the SDFG use `self.arrays`/`self.get_array()`.
-        """
+        """Returns the SDFG that is currently constructed."""
         return self._ctx.sdfg
 
     def is_allocated(self) -> bool:
@@ -261,7 +263,7 @@ def is_allocated(self) -> bool:
     def is_root_translator(self) -> bool:
         """Tests if `self` is the root translator.
 
-        The root translator (context) is the very first translator process that was started.
+        The root translator (context) is the very first translator process.
         """
         if not self.is_allocated():
             raise RuntimeError("Builder is not allocated.")
@@ -274,12 +276,12 @@ def add_jax_name_mapping(
     ) -> JaxprTranslationBuilder:
         """Creates a new mapping between `jax_var` to `sdfg_name`.
 
-        If the mapping already exists an error will be generated. This function is not able to
-        delete a variable mapping that was established before.
+        If the mapping already exists an error will be generated. This function
+        is not able to delete a variable mapping that was established before.
 
         Args:
-            jax_var:     The Jax variable.
-            sdfg_name:   The name of the corresponding SDFG variable.
+            jax_var: The Jax variable.
+            sdfg_name: The name of the corresponding SDFG variable.
         """
         assert sdfg_name
 
@@ -305,25 +307,27 @@ def add_array(
     ) -> str:
         """Creates an SDFG variable for Jax variable `arg` and returns its SDFG name.
 
-        The SDFG object is always created as a transient. Furthermore, the function will not
-        update the internal variable mapping, by default.
+        The SDFG object is always created as a transient. Furthermore, the
+        function will not update the internal variable mapping, by default.
 
-        By default the function will use `jace.util.propose_jax_name()` to derive the name that
-        should be used. However, by passing a `JaCeVar` with a name it is possible to suggest a
-        specific name. In addition it is possible to specify `name_prefix` to supply a prefix
-        to the determined name that should be used.
+        By default the function will use `jace.util.propose_jax_name()` to derive
+        the name that should be used. However, by passing a `JaCeVar` with a
+        name it is possible to suggest a specific name. In addition it is possible
+        to specify `name_prefix` to supply a prefix to the determined name that
+        should be used.
 
         Args:
-            arg:                The Jax object for which a SDFG equivalent should be created.
-            name_prefix:        If given it will be used as prefix for the name.
+            arg: The Jax object for which a SDFG equivalent should be created.
+            name_prefix: If given it will be used as prefix for the name.
             update_var_mapping: Update the internal variable mapping; by default `False`.
 
         Notes:
-            As a temporary fix for handling scalar return values, the function will always
-            generate arrays, even if `arg` is a scalar.
-            According to the dace developer, the majority of the backend, i.e. optimization
-            pipeline, should be able to handle it. But there are some special parts that
-            might explicitly want a scalar, it also might block certain compiler optimization.
+            As a temporary fix for handling scalar return values, the function
+            will always generate arrays, even if `arg` is a scalar. According to
+            the DaCe developer, the majority of the backend, i.e. optimization
+            pipeline, should be able to handle it. But there are some special
+            parts that might explicitly want a scalar, it also might block
+            certain compiler optimization.
         """
 
         if isinstance(arg, jax_core.Literal):
@@ -402,23 +406,25 @@ def create_jax_var_list(  # type: ignore[misc]
     ) -> list[None | str]:
         """Creates SDFG variables for the listed Jax variables and returns their SDFG names.
 
-        If a Jax variable already has a SDFG equivalent then the function will use this variable.
-        If no corresponding SDFG variable is known the function will create one using `add_array()`.
+        If a Jax variable already has a SDFG equivalent then the function will
+        use this variable. If no corresponding SDFG variable is known the function
+        will create one using `add_array()`.
 
-        By setting `prevent_creation` the function will not create any new SDFG variables, if no
-        corresponding SDFG variable exists an error is generated. By setting `only_creation` the
-        function will only create new SDFG variables, if a variable already have a corresponding
-        SDFG variable an error will be generated.
+        By setting `prevent_creation` the function will not create any new SDFG
+        variables, if no corresponding SDFG variable exists an error is generated.
+        By setting `only_creation` the function will only create new SDFG variables,
+        if a variable already have a corresponding SDFG variable an error will be
+        generated.
 
-        By default literals cause an error. However, by setting `handle_literals` to `True`
-        literals will will be included in the output with the value `None`.
+        By default literals cause an error. However, by setting `handle_literals`
+        to `True` literals will will be included in the output with the value `None`.
 
         Args:
-            jax_var_list:       The list of Jax variables that should be transformed to SDFG names.
-            prevent_creation:   Never create a variable, all must already be known.
-            only_creation:      Always create a variable, it is an error if one already exist.
-            handle_literals:    Allow the processing of literals.
-            kwargs:             Will be forwarded to `self.add_array()` if a variable is created.
+            jax_var_list: The list of Jax variables that should be transformed to SDFG names.
+            prevent_creation: Never create a variable, all must already be known.
+            only_creation: Always create a variable, it is an error if one already exist.
+            handle_literals: Allow the processing of literals.
+            kwargs: Will be forwarded to `self.add_array()` if a variable is created.
 
         Todo:
             - Rollback if the creation fails.
@@ -477,8 +483,8 @@ def _create_constants(
     ) -> None:
         """Creates all constants requested by the `jaxpr`.
 
-        The function will create an SDFG variable and add them as constant to the SDFG. Their value
-        is deepcopied.
+        The function will create an SDFG variable and add them as constant to
+        the SDFG. Their value is deepcopied.
         """
         assert self.is_allocated(), "Builder is not allocated, can not create constants."
         if len(jaxpr.consts) == 0:
@@ -503,7 +509,7 @@ def _allocate_translation_ctx(
         """Allocate a new context and activate it.
 
         Args:
-            name:               The name of the SDFG.
+            name: The name of the SDFG.
         """
         self._ctx_stack.append(
             TranslationContext(
@@ -599,14 +605,16 @@ def _translate_jaxpr_internal(
     ) -> TranslationContext:
         """Performs the actual translation of the Jaxpr into an SDFG.
 
-        The function assumes that the context is allocated as well as the initial variables.
-        The function removes and returns the currently active translation context.
+        The function assumes that the context is allocated as well as the
+        initial variables. The function removes and returns the currently
+        active translation context.
 
         Args:
-            jaxpr:      The Jaxpr to translate.
+            jaxpr: The Jaxpr to translate.
 
         Notes:
-            Equations that store into drop variables, i.e. with name `_`, will be ignored.
+            Equations that store into drop variables, i.e. with name `_`,
+            will be ignored.
         """
         nb_translated_eqn: int = 0
         out_var_names: Sequence[str] = ()
@@ -638,14 +646,16 @@ def _handle_null_jaxpr(
     ) -> list[str]:
         """This function is called in case a `Jaxpr` with zero equations is encountered.
 
-        A function with zero equation might still have output, in which case an input is copied
-        to an output. This function will handle the copying from the input into the corresponding
-        output variable. It is important that the function will remove the variables that are used
-        as input and output from the mapping.
+        A function with zero equation might still have output, in which case
+        an input is copied to an output. This function will handle the copying
+        from the input into the corresponding output variable. It is important
+        that the function will remove the variables that are used as input and
+        output from the mapping.
 
         Returns:
-            The function returns a tuple containing the SDFG variables that refer to the output.
-            The order of the list is the same as in `jaxpr.jaxpr.outvars`.
+            The function returns a tuple containing the SDFG variables that
+            refer to the output. The order of the list is the same as in
+            `jaxpr.jaxpr.outvars`.
 
         Todo:
             - Handle the case if if the output is a literal.
@@ -713,12 +723,13 @@ def _terminal_sdfg_state(self) -> dace.SDFGState:
 class TranslationContext:
     """Translation context used by the `JaxprTranslationBuilder`.
 
-    Internal representation of the builder of an SDFG under construction together with the needed
-    metadata. Essentially it is an extended version of the `TranslatedJaxprSDFG`, but carrying
-    an unfinished canonical SDFG.
-    A user should consider this class as an opaque object, that represents an invalid
-    `TranslatedJaxprSDFG` object, and the only valid operation a user can do with it is passing it
-    either to `finalize_translation_context()` or the `postprocess_jaxpr_sdfg()` function.
+    Internal representation of the builder of an SDFG under construction together
+    with the needed metadata. Essentially it is an extended version of the
+    `TranslatedJaxprSDFG`, but carrying an unfinished canonical SDFG.
+    A user should consider this class as an opaque object, that represents an
+    invalid `TranslatedJaxprSDFG` object, and the only valid operation a user
+    can do with it is passing it either to `finalize_translation_context()` or
+    the `postprocess_jaxpr_sdfg()` function.
 
     Attributes:
         sdfg:              The encapsulated SDFG object.
@@ -728,7 +739,7 @@ class TranslationContext:
         terminal_state:    The (currently) last state in the state machine.
 
     Args:
-        name:       The name of the SDFG, will be forwarded to the encapsulated `TranslatedJaxprSDFG`.
+        name: The name of the SDFG, will be forwarded to the encapsulated `TranslatedJaxprSDFG`.
 
     Note:
         Access of any attribute of this class by an outside user is considered undefined behaviour.
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index 0f86e34..37be078 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -8,7 +8,6 @@
 """This module contains all functions that are related to post processing the SDFG.
 
 Most of them operate on `TranslatedJaxprSDFG` objects.
-
 Currently they mostly exist for the sake of existing.
 """
 
@@ -36,10 +35,10 @@ def postprocess_jaxpr_sdfg(
     However, the function will return a decoupled `TranslatedJaxprSDFG` object.
 
     Args:
-        trans_ctx:  The `TranslationContext` obtained from the `translate_jaxpr()` function.
-        fun:        The original function that was translated.
-        call_args:  The linearized input arguments.
-        intree:     The pytree describing the inputs.
+        trans_ctx: The `TranslationContext` obtained from the `translate_jaxpr()` function.
+        fun: The original function that was translated.
+        call_args: The linearized input arguments.
+        intree: The pytree describing the inputs.
 
     Todo:
         - Setting correct input names (layer that does not depend on JAX).
@@ -62,18 +61,18 @@ def finalize_translation_context(
 ) -> translator.TranslatedJaxprSDFG:
     """Finalizes the supplied translation context `trans_ctx`.
 
-    The function will process the SDFG that is encapsulated inside the context, i.e. a canonical
-    one, into a proper SDFG, as it is described in `TranslatedJaxprSDFG`.
-    It is important to realize that this function does not perform any optimization of the
-    underlying SDFG itself, instead it prepares an SDFG such that it can be passed to the
-    optimization pipeline.
+    The function will process the SDFG that is encapsulated inside the context,
+    i.e. a canonical one, into a proper SDFG, as it is described in
+    `TranslatedJaxprSDFG`. It is important to realize that this function does
+    not perform any optimization of the underlying SDFG itself, instead it
+    prepares an SDFG such that it can be passed to the optimization pipeline.
 
-    The function will not mutate the passed translation context and the output is always decoupled
-    from its output.
+    The function will not mutate the passed translation context and the output
+    is always decoupled from its output.
 
     Args:
-        trans_ctx:      The context that should be finalized.
-        validate:       Call the validate function after the finalizing.
+        trans_ctx: The context that should be finalized.
+        validate: Call the validate function after the finalizing.
     """
     trans_ctx.validate()
     if trans_ctx.inp_names is None:
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index 13d1821..bd149d3 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -33,8 +33,6 @@ class PrimitiveTranslatorCallable(Protocol):
     """Callable version of the primitive translators.
 
     Used for type annotation purposes, the proper public interface is `PrimitiveTranslator`.
-    You can use `jace.translator.make_primitive_translator()` to add a `primitive` property to
-    a callable.
     """
 
     @abc.abstractmethod
@@ -48,39 +46,46 @@ def __call__(
     ) -> dace.SDFGState | None:
         """Translates the Jax primitive into its SDFG equivalent.
 
-        Before the builder calls this function it will perform the following preparatory tasks:
-        - It will allocate the SDFG variables that are used as outputs. Their names will be passed
-            through the `out_var_names` argument, in the same order as `eqn.outvars`.
-        - It will collect the names of the SDFG variables that are used as inputs and place them in
-            `in_var_names`, in the same order as `eqn.invars`. If an input argument refers to a
-            literal no SDFG variable is created for it and `None` is used to indicate this.
-        - The builder will create variables that are used as output. They are passed as
-            `out_var_names`, same order as in the equation.
-        - The builder will create a new terminal state and pass it as `eqn_state` argument. This
-            state is guaranteed to be empty and `translator.terminal_sdfg_state is eqn_state` holds.
+        Before the builder calls this function it will perform the following
+        preparatory tasks:
+        - It will allocate the SDFG variables that are used as outputs. Their
+            names will be passed through the `out_var_names` argument, in the
+            same order as `eqn.outvars`.
+        - It will collect the names of the SDFG variables that are used as
+            inputs and place them in `in_var_names`, in the same order as
+            `eqn.invars`. If an input argument refers to a literal no SDFG
+            variable is created for it and `None` is used to indicate this.
+        - The builder will create variables that are used as output. They are
+            passed as `out_var_names`, same order as in the equation.
+        - The builder will create a new terminal state and pass it as `eqn_state`
+            argument. This state is guaranteed to be empty and
+            `translator.terminal_sdfg_state is eqn_state` holds.
 
         Then the primitive translator is called.
-        Usually a primitive translator should construct the dataflow graph inside `eqn_state`.
-        However, it is allowed that the primitive translators creates more states if needed, but
-        this state machinery has to have a single terminal state, which must be returned and
-        reachable from `eqn_state`. If the function returns `None` the builder will assume that
-        primitive translator was able to fully construct the dataflow graph within `eqn_state`.
-
-        A primitive translator has to use the passed input variables, `in_var_names` and must write
-        its output into the variables indicated by `out_var_names`.
-        But it is allowed that a primitive translator creates intermediate values as needed.
-        To ensure that there are no collision with further variables, the translator should prefix
-        them, see the `name_prefix` argument of `JaxprTranslationBuilder.add_array()`.
+        Usually a primitive translator should construct the dataflow graph
+        inside `eqn_state`. However, it is allowed that the primitive translators
+        creates more states if needed, but this state machinery has to have a
+        single terminal state, which must be returned and reachable from
+        `eqn_state`. If the function returns `None` the builder will assume that
+        primitive translator was able to fully construct the dataflow graph
+        within `eqn_state`.
+
+        A primitive translator has to use the passed input variables,
+        `in_var_names` and must write its output into the variables indicated
+        by `out_var_names`. But it is allowed that a primitive translator
+        creates intermediate values as needed. To ensure that there are no
+        collision with further variables, the translator should prefix them,
+        see the `name_prefix` argument of `JaxprTranslationBuilder.add_array()`.
 
         Args:
-            builder:        The builder object of the translation.
-            in_var_names:   List of the names of the arrays created inside the
-                                SDFG for the inpts or `None` in case of a literal.
-            out_var_names:  List of the names of the arrays created inside the
-                                SDFG for the outputs.
-            eqn:            The Jax primitive that should be translated.
-            eqn_state:      State into which the primitive`s SDFG representation
-                                should be constructed.
+            builder: The builder object of the translation.
+            in_var_names: List of the names of the arrays created inside the
+                SDFG for the inpts or `None` in case of a literal.
+            out_var_names: List of the names of the arrays created inside the
+                SDFG for the outputs.
+            eqn: The Jax primitive that should be translated.
+            eqn_state: State into which the primitive`s SDFG representation
+                should be constructed.
         """
         ...
 
@@ -89,15 +94,18 @@ def __call__(
 class PrimitiveTranslator(PrimitiveTranslatorCallable, Protocol):
     """Interface for all Jax primitive translators.
 
-    A translator for a primitive translates a single equation of a Jaxpr into its SDFG equivalent.
-    For satisfying this interface a concrete implementation must be immutable after construction.
+    A translator for a primitive translates a single equation of a Jaxpr into
+    its SDFG equivalent. For satisfying this interface a concrete implementation
+    must be immutable after construction.
 
-    Primitive translators are simple, but highly specialized objects that are only able to perform
-    the translation of a single primitive. The overall translation process itself is managed by a
-    builder object, which also owns and manage the primitive translators. In the end this implements
-    the delegation pattern.
+    Primitive translators are simple, but highly specialized objects that are
+    only able to perform the translation of a single primitive. The overall
+    translation process itself is managed by a builder object, which also owns
+    and manage the primitive translators. In the end this implements the
+    delegation pattern.
 
-    You can use `jace.translator.register_primitive_translator()` to register your translator to JaCe.
+    The `jace.translator.register_primitive_translator()` function can be used
+    to add a translator to the JaCe global registry.
     """
 
     @property
@@ -129,12 +137,12 @@ def make_primitive_translator(
 ):
     """Turn `primitive_translator` into a `PrimitiveTranslator` for primitive `primitive`.
 
-    Essentially, this function adds the `primitive` property to a callable, such that it satisfy
-    the `PrimitiveTranslator` protocol. However, it does not add it to the registry, for that
-    `register_primitive_translator()` has to be used.
+    Essentially, this function adds the `primitive` property to a callable, such
+    that it satisfy the `PrimitiveTranslator` protocol. However, it does not add
+    it to the registry, for that `register_primitive_translator()` has to be used.
 
     Notes:
-        This function cal also be used as decorator.
+        This function can also be used as decorator.
     """
 
     def wrapper(
@@ -174,15 +182,17 @@ def register_primitive_translator(
 ):
     """Adds a primitive translator to JaCe's global registry.
 
-    The default set of primitives that are used if nothing is specified to to `jace.jit` are stored
-    inside a global registry. To add a translator to this registry this function can be used.
+    The default set of primitives that are used if nothing is specified to to
+    `jace.jit` are stored inside a global registry. To add a translator to this
+    registry this function can be used.
 
-    If a translator for `primitive` is already registered an error will be generated. However,
-    by specifying `overwrite` `primitive_translator` will replace the current one.
+    If a translator for `primitive` is already registered an error will be
+    generated. However, by specifying `overwrite` `primitive_translator` will
+    replace the current one.
 
     Args:
         primitive_translator: The primitive translator to add to the global registry.
-        overwrite:            Replace the current primitive translator with `primitive_translator`.
+        overwrite: Replace the current primitive translator with `primitive_translator`.
 
     Note:
         To add a `primitive` property use the `@make_primitive_translator` decorator.
@@ -207,8 +217,9 @@ def wrapper(
 def get_registered_primitive_translators() -> dict[str, translator.PrimitiveTranslator]:
     """Returns a copy of the current state of JaCe's global primitive registry.
 
-    The state returned by this function is compatible to what `jace.hit`'s `primitive_translators`
-    argument expects. It is important the the returned object is decoupled from the registry.
+    The state returned by this function is compatible to what `jace.jit`'s
+    `primitive_translators` argument expects. It is important the the returned
+    object is decoupled from the registry.
     """
     return _PRIMITIVE_TRANSLATORS_REGISTRY.copy()
 
@@ -218,9 +229,9 @@ def set_active_primitive_translators_to(
 ) -> MutableMapping[str, translator.PrimitiveTranslator]:
     """Exchange the global translator registry state of JaCe with `new_translators`.
 
-    The function will return the state of the global translator registry prior to this call.
-    Any changes to `new_translators` after calling this function will have no effect on the
-    global translator registry and vice versa.
+    The function will return the state of the global translator registry prior
+    to this call. Any changes to `new_translators` after calling this function
+    will have no effect on the global translator registry and vice versa.
     """
     global _PRIMITIVE_TRANSLATORS_REGISTRY
     assert all(getattr(trans, "primitive", prim) for prim, trans in new_translators.items())
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index f3c5d41..811cce9 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -16,25 +16,28 @@
 class TranslatedJaxprSDFG:
     """Encapsulates the translated SDFG together with the metadata that is needed to run it.
 
-    Contrary to the SDFG that is encapsulated inside the `TranslationContext` object, `self`
-    carries a proper SDFG, however:
-    - It does not have `__return*` variables, instead all return arguments are passed by arguments.
-    - All input arguments are passed through arguments mentioned in `inp_names`, while the outputs
-        are passed through `out_names`.
+    Contrary to the SDFG that is encapsulated inside the `TranslationContext`
+    object, `self` carries a proper SDFG, however:
+    - It does not have `__return*` variables, instead all return arguments are
+        passed by arguments.
+    - All input arguments are passed through arguments mentioned in `inp_names`,
+        while the outputs are passed through `out_names`.
     - Only variables listed as in/outputs are non transient.
     - The order inside `inp_names` and `out_names` is the same as in the translated Jaxpr.
     - If inputs are also used as outputs they appear in both `inp_names` and `out_names`.
-    - Its `arg_names` is set to  `inp_names + out_names`, but arguments that are input and outputs
-        are only listed as inputs.
+    - Its `arg_names` is set to  `inp_names + out_names`, but arguments that are
+        input and outputs are only listed as inputs.
 
-    The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a `TranslationContext`,
-    that was in turn constructed by `JaxprTranslationBuilder.translate_jaxpr()`, to the
-    `finalize_translation_context()` or preferably to the `postprocess_jaxpr_sdfg()` function.
+    The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a
+    `TranslationContext`, that was in turn constructed by
+    `JaxprTranslationBuilder.translate_jaxpr()`, to the
+    `finalize_translation_context()` or preferably to the `postprocess_jaxpr_sdfg()`
+    function.
 
     Attributes:
-        sdfg:           The encapsulated SDFG object.
-        inp_names:      A list of the SDFG variables that are used as input
-        out_names:      A list of the SDFG variables that are used as output.
+        sdfg: The encapsulated SDFG object.
+        inp_names: A list of the SDFG variables that are used as input
+        out_names: A list of the SDFG variables that are used as output.
     """
 
     sdfg: dace.SDFG
@@ -55,5 +58,11 @@ def validate(self) -> bool:
                 self.sdfg,
                 self.sdfg.node_id(self.sdfg.start_state),
             )
+        if self.sdfg.free_symbols:  # This is a simplification that makes our life simple.
+            raise dace.sdfg.InvalidSDFGError(
+                f"Found free symbols: {self.sdfg.free_symbols}",
+                self.sdfg,
+                self.sdfg.node_id(self.sdfg.start_state),
+            )
         self.sdfg.validate()
         return True
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 51e6b75..27bd032 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -22,21 +22,19 @@
     propose_jax_name,
     translate_dtype,
 )
+from .misc import (
+    FORBIDDEN_SDFG_VAR_NAMES,
+    VALID_SDFG_OBJ_NAME,
+    VALID_SDFG_VAR_NAME,
+)
 from .traits import (
     is_array,
     is_drop_var,
     is_fully_addressable,
-    is_jaceified,
     is_jax_array,
-    is_jaxified,
     is_on_device,
     is_scalar,
 )
-from .util import (
-    FORBIDDEN_SDFG_VAR_NAMES,
-    VALID_SDFG_OBJ_NAME,
-    VALID_SDFG_VAR_NAME,
-)
 
 
 __all__ = [
@@ -52,9 +50,7 @@
     "is_array",
     "is_drop_var",
     "is_fully_addressable",
-    "is_jaceified",
     "is_jax_array",
-    "is_jaxified",
     "is_on_device",
     "is_scalar",
     "is_tracing_ongoing",
diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
index 48d6ff4..966b09d 100644
--- a/src/jace/util/compiling.py
+++ b/src/jace/util/compiling.py
@@ -29,15 +29,10 @@
 def compile_jax_sdfg(
     tsdfg: translator.TranslatedJaxprSDFG,
 ) -> dace_helper.CompiledSDFG:
-    """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object.
-
-    Note:
-        For calling the returned `CompiledSDFG` object you need the `inp_names` and `out_names`
-        of the input `TranslatedJaxprSDFG`.
-    """
+    """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object."""
     if any(  # We do not support the DaCe return mechanism
-        arrname.startswith("__return")
-        for arrname in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
+        array_name.startswith("__return")
+        for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
     ):
         raise ValueError("Only support SDFGs without '__return' members.")
 
@@ -71,76 +66,73 @@ def run_jax_sdfg(
     csdfg: dace_helper.CompiledSDFG,
     inp_names: Sequence[str],
     out_names: Sequence[str],
-    cargs: Sequence[Any],
-    ckwargs: Mapping[str, Any],
+    call_args: Sequence[Any],
+    call_kwargs: Mapping[str, Any],
 ) -> tuple[Any, ...] | Any:
     """Run the compiled SDFG.
 
-    The function assumes that the SDFG was finalized and then compiled by `compile_jax_sdfg()`.
-    For running the SDFG you also have to pass the input names (`inp_names`) and output names
-    (`out_names`) that were inside the `TranslatedJaxprSDFG` from which `csdfg` was compiled from.
+    The function assumes that the SDFG was finalized and then compiled by
+    `compile_jax_sdfg()`. For running the SDFG you also have to pass the input
+    names (`inp_names`) and output names (`out_names`) that were inside the
+    `TranslatedJaxprSDFG` from which `csdfg` was compiled from.
 
     Args:
-        csdfg:      The `CompiledSDFG` object.
-        inp_names:  List of names of the input arguments.
-        out_names:  List of names of the output arguments.
-        cargs:      All positional arguments of the call.
-        ckwargs:    All keyword arguments of the call.
+        csdfg: The `CompiledSDFG` object.
+        inp_names: List of names of the input arguments.
+        out_names: List of names of the output arguments.
+        call_args: All positional arguments of the call.
+        call_kwargs: All keyword arguments of the call.
 
     Note:
-        There is no pytree mechanism jet, thus the return values are returned inside a `tuple`
-        or in case of one value, directly, in the order determined by Jax.
-        Furthermore, DaCe does not support scalar return values, thus they are silently converted
-        into arrays of length 1, the same holds for inputs.
+        There is no pytree mechanism jet, thus the return values are returned
+        inside a `tuple` or in case of one value, directly, in the order
+        determined by Jax. Furthermore, DaCe does not support scalar return
+        values, thus they are silently converted into arrays of length 1, the
+        same holds for inputs.
 
     Todo:
-        - Since we do not have symbols and a fixed size this works and there is no problem.
-            However, if we have symbols or variable sizes, we must ensure that the init function of
-            the SDFG is called every time, or ensure that its exit function runs every time.
         - Implement non C strides.
     """
     sdfg: dace.SDFG = csdfg.sdfg
 
-    if len(ckwargs) != 0:
+    if len(call_kwargs) != 0:
         raise NotImplementedError("No kwargs are supported yet.")
-    if len(inp_names) != len(cargs):
+    if len(inp_names) != len(call_args):
         raise RuntimeError("Wrong number of arguments.")
-    if len(sdfg.free_symbols) != 0:  # This is a simplification that makes our life simple.
+    if sdfg.free_symbols:  # This is a simplification that makes our life simple.
         raise NotImplementedError(
             f"No externally defined symbols are allowed, found: {sdfg.free_symbols}"
         )
 
     # Build the argument list that we will pass to the compiled object.
-    call_args: dict[str, Any] = {}
-    for in_name, in_val in zip(inp_names, cargs, strict=True):
+    sdfg_call_args: dict[str, Any] = {}
+    for in_name, in_val in zip(inp_names, call_args, strict=True):
         if util.is_scalar(in_val):
             # Currently the translator makes scalar into arrays, this has to be reflected here
             in_val = np.array([in_val])
-        call_args[in_name] = in_val
+        sdfg_call_args[in_name] = in_val
 
-    for out_name, sarray in ((name, sdfg.arrays[name]) for name in out_names):
-        if out_name in call_args:
-            if util.is_jax_array(call_args[out_name]):
+    for out_name, sdfg_array in ((out_name, sdfg.arrays[out_name]) for out_name in out_names):
+        if out_name in sdfg_call_args:
+            if util.is_jax_array(sdfg_call_args[out_name]):
                 # Jax arrays are immutable, so they can not be return values too.
                 raise ValueError("Passed a Jax array as output.")
         else:
-            call_args[out_name] = dace_data.make_array_from_descriptor(sarray)
+            sdfg_call_args[out_name] = dace_data.make_array_from_descriptor(sdfg_array)
 
-    assert len(call_args) == len(csdfg.argnames), (
+    assert len(sdfg_call_args) == len(csdfg.argnames), (
         "Failed to construct the call arguments,"
         f" expected {len(csdfg.argnames)} but got {len(call_args)}."
-        f"\nExpected: {csdfg.argnames}\nGot: {list(call_args.keys())}"
+        f"\nExpected: {csdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
     )
 
     # Calling the SDFG
     with dace.config.temporary_config():
         dace.Config.set("compiler", "allow_view_arguments", value=True)
-        csdfg(**call_args)
+        csdfg(**sdfg_call_args)
 
     # Handling the output (pytrees are missing)
-    if len(out_names) == 0:
+    if not out_names:
         return None
-    ret_val: tuple[Any] = tuple(call_args[out_name] for out_name in out_names)
-    if len(out_names) == 1:
-        return ret_val[0]
-    return ret_val
+    ret_val: tuple[Any] = tuple(sdfg_call_args[out_name] for out_name in out_names)
+    return ret_val[0] if len(out_names) == 1 else ret_val
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index c5b518d..8fa982f 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -7,8 +7,8 @@
 
 """Implements all utility functions that are related to Jax.
 
-Most of the functions defined here allow an unified access to Jax' internal in a consistent and
-stable way.
+Most of the functions defined here allow an unified access to Jax' internal in
+a consistent and stable way.
 """
 
 from __future__ import annotations
@@ -32,23 +32,25 @@
 class JaCeVar:
     """Replacement for the `jax.Var` class.
 
-    This class can be seen as some kind of substitute `jax.core.Var`. The main intention of this
-    class is as an internal representation of values, as they are used in Jax, but without the Jax
-    machinery. As abstract values in Jax this class has a datatype, which is a `dace.typeclass`
-    instance and a shape. In addition it has an optional name, which allows to create variables
-    with a certain name using `JaxprTranslationBuilder.add_array()`.
+    This class can be seen as some kind of substitute `jax.core.Var`. The main
+    intention of this class is as an internal representation of values, as they
+    are used in Jax, but without the Jax machinery. As abstract values in Jax
+    this class has a datatype, which is a `dace.typeclass` instance and a shape.
+    In addition it has an optional name, which allows to create variables with
+    a certain name using `JaxprTranslationBuilder.add_array()`.
 
-    If you are expect to handle both real Jax variables and JaCe variable, you should use the
-    `get_jax_var_*()` functions to access them.
+    If it is expected that code must handle both Jax variables and `JaCeVar`
+    then the `get_jax_var_*()` functions should be used.
 
     Args:
-        shape:      The shape of the variable.
-        dtype:      The dace datatype of the variable.
-        name:       Name the variable should have, optional.
+        shape: The shape of the variable.
+        dtype: The dace datatype of the variable.
+        name: Name the variable should have, optional.
 
     Note:
-        If the name of a `JaCeVar` is '_' it is considered a drop variable.
-        The definitions of `__hash__` and `__eq__` are in accordance with how Jax variable works.
+        If the name of a `JaCeVar` is '_' it is considered a drop variable. The
+        definitions of `__hash__` and `__eq__` are in accordance with how Jax
+        variable works.
 
     Todo:
         - Add support for strides.
@@ -78,13 +80,7 @@ def __eq__(self, other: Any) -> bool:
 
 
 def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
-    """Returns the name of `jax_var` as a string.
-
-    Notes:
-        If `jax_var` is a `JaCeVar` the function will return, if defined, its `.name` property.
-        Otherwise it will compose a name similar to Jax `Var` objects. The returned names are
-        stable, i.e. it will output the same value for the same variable.
-    """
+    """Returns the name of `jax_var` as a string."""
     match jax_var:
         case jax_core.DropVar():
             return "_"
@@ -135,8 +131,8 @@ def is_tracing_ongoing(
 ) -> bool:
     """Test if tracing is ongoing.
 
-    While a return value `True` guarantees that a translation is ongoing, a value of `False`
-    does not guarantees that no tracing is ongoing.
+    While a return value `True` guarantees that a translation is ongoing, a
+    value of `False` does not guarantees that no tracing is ongoing.
     """
     # The current implementation only checks the arguments if it contains tracers.
     if (len(args) == 0) and (len(kwargs) == 0):
@@ -163,19 +159,22 @@ def propose_jax_name(
 ) -> str:
     """Proposes a variable name for `jax_var`.
 
-    If `jax_name_map` is `None` the function will fallback to `get_jax_var_name(jax_var)`.
-    If `jax_name_map` is supplied the function will:
+    If `jax_name_map` is `None` the function will fallback to
+    `get_jax_var_name(jax_var)`. If `jax_name_map` is supplied the function
+    will:
     - If `jax_var` is stored inside `jax_name_map`, returns the mapped value.
-    - If `jax_var` is a `JaCeVar` with a set `.name` property that name will be returned.
-    - Otherwise the function will generate a new name in a similar way to the pretty printer of Jaxpr.
+    - If `jax_var` is a `JaCeVar` with a set `.name` property that name will
+        be returned.
+    - Otherwise the function will generate a new name in a similar way to the
+        pretty printer of Jaxpr.
 
     Args:
-        jax_var:        The variable for which a name to propose.
-        jax_name_map:   A mapping of all Jax variables that were already named.
+        jax_var: The variable for which a name to propose.
+        jax_name_map: A mapping of all Jax variables that were already named.
 
     Note:
-        The function guarantees that the returned name passes `VALID_SDFG_VAR_NAME` test and that
-        the name is not inside `util.FORBIDDEN_SDFG_VAR_NAMES`.
+        The function guarantees that the returned name passes `VALID_SDFG_VAR_NAME`
+        test and that the name is not inside `util.FORBIDDEN_SDFG_VAR_NAMES`.
         Dropped variables will always be named `'_'`.
     """
     if isinstance(jax_var, jax_core.Literal):
diff --git a/src/jace/util/util.py b/src/jace/util/misc.py
similarity index 100%
rename from src/jace/util/util.py
rename to src/jace/util/misc.py
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 56f4f7e..c9e9059 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -14,40 +14,9 @@
 import dace
 import jax
 import numpy as np
-from jax import _src as jax_src, core as jax_core
-from jaxlib import xla_extension as jax_xe
+from jax import core as jax_core
 
 import jace.util as util
-from jace import stages
-
-
-def is_jaceified(obj: Any) -> TypeGuard[stages.JaCeWrapped]:
-    """Tests if `obj` is decorated by JaCe.
-
-    Similar to `is_jaxified` but for JaCe objects.
-    """
-
-    if util.is_jaxified(obj):
-        return False
-    return isinstance(obj, stages.JaCeWrapped)
-
-
-def is_jaxified(
-    obj: Any,
-) -> TypeGuard[jax_core.Primitive | jax_src.pjit.JitWrapped | jax_xe.PjitFunction]:
-    """Tests if `obj` is a "jaxified" object.
-
-    A "jaxified" object is an object that was processed by Jax.
-    While a return value of `True` guarantees a jaxified object, `False` does not proof the
-    contrary. See also `jace.util.is_jaceified()` to tests if something is a JaCe object.
-    """
-    jaxifyed_types = (
-        jax_core.Primitive,
-        # jax_core.stage.Wrapped is not runtime chakable
-        jax_src.pjit.JitWrapped,
-        jax_xe.PjitFunction,
-    )
-    return isinstance(obj, jaxifyed_types)
 
 
 def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVar]:
@@ -65,8 +34,9 @@ def is_jax_array(
 ) -> TypeGuard[jax.Array]:
     """Tests if `obj` is a Jax array.
 
-    Notes Jax array are special as you can not write to them directly.
-    Furthermore, they always allocate on the CPU and if present, also on the GPU.
+    Note:
+     Jax arrays are special as they can not be mutated. Furthermore, they always
+     allocate on the CPU _and_ on the GPU, if present.
     """
     return isinstance(obj, jax.Array)
 
@@ -115,8 +85,8 @@ def is_on_device(
 ) -> bool:
     """Tests if `obj` is on a device.
 
-    Jax arrays are always on the CPU and GPU (if there is one). Thus for Jax arrays this
-    function is more of a test, if there is a GPU at all.
+    Jax arrays are always on the CPU and GPU (if there is one). Thus for Jax
+    arrays this function is more of a test, if there is a GPU at all.
     """
     if is_jax_array(obj):
         return hasattr(obj, "__cuda_array_interface__")
@@ -126,12 +96,7 @@ def is_on_device(
 def is_fully_addressable(
     obj: Any,
 ) -> bool:
-    """Tests if `obj` is fully addressable, i.e. is only on this host.
-
-    Notes:
-        This function currently assumes that everything that is not a Jax array is always fully
-        addressable.
-    """
+    """Tests if `obj` is fully addressable, i.e. is only on this host."""
     if is_jax_array(obj):
         return obj.is_fully_addressable
     return True
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 02ba9ef..54c722b 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -7,10 +7,11 @@
 
 """This module contains the functionality related to the compilation cache of the stages.
 
-The cache currently caches the lowering, i.e. the result of `JaCeWrapped.lower()` and the
-compilation, i.e. `JaCeLowered.compile()`. The caches are on a per stage basis and not on a
-per instant basis. To make a stage cacheable, it must be derived from `CachingStage` and
-its transition function must be decoration with `@cached_transition`.
+The cache currently caches the lowering, i.e. the result of `JaCeWrapped.lower()`
+and the compilation, i.e. `JaCeLowered.compile()`. The caches are on a per stage
+basis and not on a per instant basis. To make a stage cacheable, it must be
+derived from `CachingStage` and its transition function must be decoration with
+`@cached_transition`.
 """
 
 from __future__ import annotations
@@ -53,12 +54,14 @@
 class CachingStage(Generic[NextStage]):
     """Annotates a stage whose transition to the next stage is cacheable.
 
-    To make the transition of a stage cacheable, the stage must be derived from this class,
-    and its initialization must call `CachingStage.__init__()`. Furthermore, its transition
-    function must be annotated by the `@cached_transition` decorator.
+    To make the transition of a stage cacheable, the stage must be derived from
+    this class, and its initialization must call `CachingStage.__init__()`.
+    Furthermore, its transition function must be annotated by the
+    `@cached_transition` decorator.
 
-    A class must implement the `_make_call_description()` to compute an abstract description
-    of the call. This is needed to operate the cache to store the stage transitions.
+    A class must implement the `_make_call_description()` to compute an abstract
+    description of the call. This is needed to operate the cache to store the
+    stage transitions.
 
     Notes:
         The `__init__()` function must explicitly be called to fully setup `self`.
@@ -93,8 +96,9 @@ def cached_transition(
 ) -> Callable[Concatenate[CachingStage[NextStage], P], NextStage]:
     """Decorator for making the transition function of the stage cacheable.
 
-    In order to work, the stage must be derived from `CachingStage`. For computing the key of a
-    call the function will use the `_make_call_description()` function of the cache.
+    In order to work, the stage must be derived from `CachingStage`. For computing
+    the key of a call the function will use the `_make_call_description()`
+    function of the cache.
 
     Todo:
         - Implement a way to temporary disable the cache.
@@ -136,19 +140,19 @@ def get_cache(
 class _AbstractCallArgument:
     """Class to represent a single argument to the transition function in an abstract way.
 
-    As noted in `StageTransformationSpec` there are two ways to describe an argument, either by
-    using its concrete value or an abstract description, which is similar to tracers in Jax.
-    This class represents the second way.
+    As noted in `StageTransformationSpec` there are two ways to describe an
+    argument, either by using its concrete value or an abstract description,
+    which is similar to tracers in Jax. This class represents the second way.
     To create an instance you should use `_AbstractCallArgument.from_value()`.
 
-    Its description is limited to scalars and arrays. To describe more complex types, they
-    should be processed by pytrees first.
+    Its description is limited to scalars and arrays. To describe more complex
+    types, they should be processed by pytrees first.
 
     Attributes:
-        shape:      In case of an array its shape, in case of a scalar the empty tuple.
-        dtype:      The DaCe type of the argument.
-        strides:    The strides of the argument, or `None` if they are unknown or a scalar.
-        storage:    The storage type where the argument is stored.
+        shape: In case of an array its shape, in case of a scalar the empty tuple.
+        dtype: The DaCe type of the argument.
+        strides: The strides of the argument, or `None` if they are unknown or a scalar.
+        storage: The storage type where the argument is stored.
     """
 
     shape: tuple[int, ...]
@@ -206,22 +210,21 @@ def from_value(
 class StageTransformationSpec:
     """Represents the entire call to a state transformation function of a stage.
 
-    State transition functions are annotated with `@cached_transition` and their result may be
-    cached. They key to locate them inside the cache is represented by this class and computed by
-    the `CachingStage._make_call_description()` function.
-    The actual key is consists of two parts, `stage_id` and `call_args`.
+    State transition functions are annotated with `@cached_transition` and their
+    result may be cached. They key to locate them inside the cache is represented
+    by this class and computed by the `CachingStage._make_call_description()`
+    function. The actual key is consists of two parts, `stage_id` and `call_args`.
 
     Args:
-        stage_id:   Origin of the call, for which the id of the stage object should be used.
-        call_args:  Description of the arguments of the call. There are two ways to describe
-            the arguments:
-            - Abstract description: In this way, the actual value of the argument is irrelevant,
-                only the structure of them are important, similar to the tracers used in Jax.
-            - Concrete description: Here one caches on the actual value of the argument.
-                The only requirement is that they can be hashed.
-
-    Todo:
-        In the future pytrees will be used as third part.
+        stage_id: Origin of the call, for which the id of the stage object should
+            be used.
+        call_args: Description of the arguments of the call. There are two ways
+            to describe the arguments:
+            - Abstract description: In this way, the actual value of the argument
+                is irrelevant, only the structure of them are important, similar
+                to the tracers used in Jax.
+            - Concrete description: Here one caches on the actual value of the
+                argument. The only requirement is that they can be hashed.
     """
 
     stage_id: int
@@ -236,12 +239,10 @@ class StageCache(Generic[StageType]):
     """Simple LRU cache to cache the results of the stage transition function.
 
     Args:
-        size:   The size of the cache, defaults to 256.
-
-    Notes:
-        The most recently used entry is at the end of the `OrderedDict`.
+        size: The size of the cache, defaults to 256.
     """
 
+    # The most recently used entry is at the end of the `OrderedDict`.
     _memory: collections.OrderedDict[StageTransformationSpec, StageType]
     _size: int
 
diff --git a/tests/test_jax_api.py b/tests/test_jax_api.py
index f6c89df..80eff4a 100644
--- a/tests/test_jax_api.py
+++ b/tests/test_jax_api.py
@@ -15,7 +15,6 @@
 from jax import numpy as jnp
 
 import jace
-from jace import util as jutil
 
 
 np.random.seed(42)  # noqa: NPY002  # random generator
@@ -33,11 +32,6 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     jax_testee = jax.jit(testee)
     jace_testee = jace.jit(testee)
 
-    assert jutil.is_jaxified(jax_testee)
-    assert not jutil.is_jaxified(jace_testee)
-    assert not jutil.is_jaceified(jax_testee)
-    assert jutil.is_jaceified(jace_testee)
-
     ref = jax_testee(A, B)
     res = jace_testee(A, B)
 
@@ -72,7 +66,7 @@ def df(x):
     def ddf(x):
         return df(x)
 
-    assert all(jutil.is_jaceified(x) for x in [f, df, ddf])
+    assert all(isinstance(x, jace.stages.JaCeWrapped) for x in [f, df, ddf])
 
     x = 1.0
     for fun, fref in zip([f, df, ddf], [f_ref, df_ref, ddf_ref]):
@@ -108,30 +102,21 @@ def test_composition_with_jax_2():
     def f1_jax(A, B):
         return A + B
 
-    assert jutil.is_jaxified(f1_jax)
-
     @jace.jit
     def f2_jace(A, B, C):
         return f1_jax(A, B) - C
 
-    assert jutil.is_jaceified(f2_jace)
-
     @jax.jit
     def f3_jax(A, B, C, D):
         return f2_jace(A, B, C) * D
 
-    assert jutil.is_jaxified(f3_jax)
-
     @jace.jit
     def f3_jace(A, B, C, D):
         return f3_jax(A, B, C, D)
 
-    assert jutil.is_jaceified(f3_jace)
-
     A, B, C, D = (np.random.random((10, 3, 50)) for _ in range(4))  # noqa: NPY002  # random generator
 
     ref = ((A + B) - C) * D
-
     res_jax = f3_jax(A, B, C, D)
     res_jace = f3_jace(A, B, C, D)
 

From 5c1e8c68d1b59697ec9c7efd07cf41472a796961 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 5 Jun 2024 09:19:09 +0200
Subject: [PATCH 311/458] Updated the tests.

---
 .../arithmetic_logical_translators.py         |  3 -
 ...primitive_arithmetic_logical_operations.py | 84 ++++++++++++++++---
 .../test_primitive_convert_element_type.py    |  7 +-
 .../test_primitive_translator_managing.py     |  2 +-
 tests/util.py                                 |  6 +-
 5 files changed, 78 insertions(+), 24 deletions(-)

diff --git a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
index ab0dcf9..d323395 100644
--- a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
+++ b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
@@ -178,10 +178,7 @@ def write_tasklet_code(
 
     "atan2": "__out = atan2((__in0), (__in1))",
 
-    "left_shift": "__out = (__in0) << (__in1)",
-    "right_shift": "__out = (__in0) >> (__in1)",
     "nextafter": "__out = nextafter((__in0), (__in1))",
-
 }
 
 
diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index 3424d20..c1b533d 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -39,6 +39,7 @@ def _only_alu_translators():
 
     This ensures that Jax is not doing some stuff that is supposed to be handled by the
     test class, such as broadcasting. It makes writing tests a bit harder, but it is worth.
+    For some reasons also type conversion s allowed.
     """
     from jace.translator.primitive_translators.arithmetic_logical_translators import (
         _ARITMETIC_OPERATION_TEMPLATES,
@@ -46,18 +47,20 @@ def _only_alu_translators():
     )
 
     # Remove all non ALU translators from the registry
-    all_translators = jace.translator.get_registered_primitive_translators()
-    alu_translators_names = (
-        _LOGICAL_OPERATION_TEMPLATES.keys() | _ARITMETIC_OPERATION_TEMPLATES.keys()
+    primitive_translators = jace.translator.get_registered_primitive_translators()
+    allowed_translators = (
+        _LOGICAL_OPERATION_TEMPLATES.keys()
+        | _ARITMETIC_OPERATION_TEMPLATES.keys()
+        | {"convert_element_type"}
     )
     jace.translator.set_active_primitive_translators_to(
-        {p: t for p, t in all_translators.items() if p in alu_translators_names}
+        {p: t for p, t in primitive_translators.items() if p in allowed_translators}
     )
 
     yield
 
     # Restore the initial state
-    jace.translator.set_active_primitive_translators_to(all_translators)
+    jace.translator.set_active_primitive_translators_to(primitive_translators)
 
 
 @pytest.fixture(
@@ -121,6 +124,44 @@ def alu_unary_ops(request, dtype) -> tuple[Callable, np.ndarray]:
     return (request.param, testutil.mkarray((2, 2), dtype))
 
 
+@pytest.fixture(
+    params=[
+        jnp.add,
+        jnp.multiply,
+        jnp.divide,
+        jnp.minimum,
+        jnp.maximum,
+        jnp.atan2,
+        jnp.nextafter,
+    ]
+)
+def alu_binary_ops_float(request) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
+    """All binary operations that can handle floats, complex values are not tested."""
+    # Getting 0 in the division test is unlikely.
+    return (  # type: ignore[return-value]  # Type confusion.
+        request.param,
+        tuple(testutil.mkarray((2, 2), np.float64) for _ in range(2)),
+    )
+
+
+@pytest.fixture(
+    params=[
+        lambda x, y: x == y,
+        lambda x, y: x != y,
+        lambda x, y: x <= y,
+        lambda x, y: x < y,
+        lambda x, y: x >= y,
+        lambda x, y: x > y,
+    ]
+)
+def alu_binary_compare_ops(request) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
+    """These are the comparison operations, that we test with integers, since it is simpler."""
+    return (
+        request.param,
+        tuple(np.abs(testutil.mkarray((20, 20), np.int32)) % 30 for _ in range(2)),
+    )
+
+
 def _perform_alu_test(testee: Callable, *args: Any) -> None:
     """General function that just performs the test."""
     wrapped = jace.jit(testee)
@@ -178,16 +219,15 @@ def testee(A: np.ndarray) -> np.ndarray:
     _perform_alu_test(testee, A)
 
 
-def test_alu_unary_regular_power():
+def test_alu_binary_power(dtype):
     """Tests the "normal" power operator, i.e. not with a known integer power."""
 
-    for exp in [3, np.float64(3.1415)]:
+    def testee(A: np.ndarray, exp: np.generic) -> np.ndarray:
+        return A**exp
 
-        def testee(A: np.ndarray, exp: int | float) -> np.ndarray:
-            return A**exp
-
-        A = testutil.mkarray((10, 2, 3))
-        _perform_alu_test(testee, A, exp)
+    exp = dtype(3)
+    A = testutil.mkarray((10, 2, 3), dtype=dtype)
+    _perform_alu_test(testee, A, exp)
 
 
 def test_alu_binary_scalar():
@@ -331,3 +371,23 @@ def testee(A: np.ndarray) -> np.ndarray:
         return alu_unary_ops[0](A)
 
     _perform_alu_test(testee, alu_unary_ops[1])
+
+
+def test_alu_general_binary_float(
+    alu_binary_ops_float: tuple[Callable, tuple[np.ndarray, np.ndarray]],
+):
+    """Tests the binary operations that runs on floating points."""
+
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return alu_binary_ops_float[0](A, B)
+
+    _perform_alu_test(testee, *alu_binary_ops_float[1])
+
+
+def test_alu_compare_ops(alu_binary_compare_ops: tuple[Callable, tuple[np.ndarray, np.ndarray]]):
+    """Test all the comparison operations."""
+
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return alu_binary_compare_ops[0](A, B)
+
+    _perform_alu_test(testee, *alu_binary_compare_ops[1])
diff --git a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
index a85b145..dffc125 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
@@ -72,17 +72,14 @@ def converter(A: np.ndarray) -> jax.Array:
     return True
 
 
-@pytest.mark.skip(reason="This test is too long, only do it on certain conditions.")
 def test_convert_element_type_main(src_type, dst_type):
     """Tests all conversions with the exception of conversions from bool and complex."""
     _convert_element_type_impl(src_type, dst_type)
 
 
-@pytest.mark.skip(reason="This test is too long, only do it on certain conditions.")
 def test_convert_element_type_from_bool(src_type):
     _convert_element_type_impl(np.bool_, src_type)
 
 
-@pytest.mark.skip(reason="This test is too long, only do it on certain conditions.")
-def test_convert_element_type_to_bool(dst_type):
-    _convert_element_type_impl(dst_type, np.bool_)
+def test_convert_element_type_to_bool(src_type):
+    _convert_element_type_impl(src_type, np.bool_)
diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index e4b60b1..68b27a6 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -73,7 +73,7 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_registered_primitive_translators()) == 62
+    assert len(get_registered_primitive_translators()) == 60
 
 
 @pytest.mark.usefixtures("no_builtin_translators")
diff --git a/tests/util.py b/tests/util.py
index 902cbd8..c5ff56e 100644
--- a/tests/util.py
+++ b/tests/util.py
@@ -37,8 +37,7 @@ def mkarray(
         dtype:      The data type to use.
 
     Notes:
-        Floating point based values are generated in the range 0 to 1.0, integers are inside the
-        range `-2**16` to `2**16`.
+        Floating point based values are generated in the range 0 to 1.0.
     """
 
     if shape == ():
@@ -49,7 +48,8 @@ def mkarray(
     if dtype == np.bool_:
         return np.random.random(shape) > 0.5  # noqa: NPY002
     if np.issubdtype(dtype, np.integer):
-        return np.random.randint(low=-(2**16), high=2**16, size=shape, dtype=dtype)  # noqa: NPY002
+        iinfo: np.iinfo = np.iinfo(dtype)
+        return np.random.randint(low=iinfo.min, high=iinfo.max, size=shape, dtype=dtype)  # noqa: NPY002
     if np.issubdtype(dtype, np.complexfloating):
         return np.array(mkarray(shape, np.float64) + 1.0j * mkarray(shape, np.float64), dtype=dtype)
     return np.array(np.random.random(shape), dtype=dtype)  # noqa: NPY002

From 01cc7776ea6d0ccaf5d82b5e8a113aa293c5cc15 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 6 Jun 2024 07:24:13 +0200
Subject: [PATCH 312/458] Allied some reformating.

---
 src/jace/stages.py                            |  19 ++-
 .../translator/jaxpr_translator_builder.py    |  16 +-
 src/jace/util/__init__.py                     |   6 -
 src/jace/util/compiling.py                    | 138 -----------------
 src/jace/util/dace_helper.py                  | 142 +++++++++++++++++-
 src/jace/util/jax_helper.py                   |  21 ++-
 src/jace/util/traits.py                       |   4 +-
 7 files changed, 178 insertions(+), 168 deletions(-)
 delete mode 100644 src/jace/util/compiling.py

diff --git a/src/jace/stages.py b/src/jace/stages.py
index 9dbcb7e..224bc00 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -232,12 +232,15 @@ def compile(
         optimization.jace_optimize(tsdfg=tsdfg, **self._make_compiler_options(compiler_options))
 
         return JaCeCompiled(
-            csdfg=util.compile_jax_sdfg(tsdfg),
+            csdfg=dace_helper.compile_jax_sdfg(tsdfg),
             inp_names=tsdfg.inp_names,
             out_names=tsdfg.out_names,
         )
 
-    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
+    def compiler_ir(
+        self,
+        dialect: str | None = None,
+    ) -> translator.TranslatedJaxprSDFG:
         """Returns the internal SDFG.
 
         The function returns a `TranslatedJaxprSDFG` object. Direct modification
@@ -247,8 +250,14 @@ def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprS
             return self._translated_sdfg
         raise ValueError(f"Unknown dialect '{dialect}'.")
 
-    def as_html(self, filename: str | None = None) -> None:
-        """Runs the `view()` method of the underlying SDFG."""
+    def view(
+        self,
+        filename: str | None = None,
+    ) -> None:
+        """Runs the `view()` method of the underlying SDFG.
+
+        This will open a browser and display the SDFG.
+        """
         self.compiler_ir().sdfg.view(filename=filename, verbose=False)
 
     def as_sdfg(self) -> dace.SDFG:
@@ -322,7 +331,7 @@ def __call__(
         The arguments must be the same as for the wrapped function, but with
         all static arguments removed.
         """
-        return util.run_jax_sdfg(
+        return dace_helper.run_jax_sdfg(
             self._csdfg,
             self._inp_names,
             self._out_names,
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 4e42262..437787e 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -219,7 +219,9 @@ def map_jax_var_to_sdfg(
 
     @overload
     def map_jax_var_to_sdfg(
-        self, jax_var: jax_core.Atom | util.JaCeVar, allow_fail: Literal[True]
+        self,
+        jax_var: jax_core.Atom | util.JaCeVar,
+        allow_fail: Literal[True],
     ) -> str | None: ...
 
     def map_jax_var_to_sdfg(
@@ -568,19 +570,19 @@ def _translate_single_eqn(
             update_var_mapping=True,
         )
 
-        pname: str = eqn.primitive.name
-        if pname not in self._primitive_translators:
-            raise NotImplementedError(f"No translator known to handle '{pname}'.")
-        ptranslator = self._primitive_translators[pname]
+        primitive_name: str = eqn.primitive.name
+        if primitive_name not in self._primitive_translators:
+            raise NotImplementedError(f"No translator known to handle '{primitive_name}'.")
+        translator = self._primitive_translators[primitive_name]
 
         # Create the state into which the equation should be translated
         eqn_state = self.append_new_state(
-            label=f"{pname}_{'_'.join(out_var_names)}",
+            label=f"{primitive_name}_{'_'.join(out_var_names)}",
             prev_state=None,  # forces the creation of a new terminal state
         )
 
         # Now perform the actual translation of the equation.
-        new_sdfg_term_state = ptranslator(
+        new_sdfg_term_state = translator(
             builder=self,
             in_var_names=in_var_names,
             out_var_names=out_var_names,
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 27bd032..778c645 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -9,10 +9,6 @@
 
 from __future__ import annotations
 
-from .compiling import (
-    compile_jax_sdfg,
-    run_jax_sdfg,
-)
 from .jax_helper import (
     JaCeVar,
     get_jax_var_dtype,
@@ -42,7 +38,6 @@
     "VALID_SDFG_OBJ_NAME",
     "VALID_SDFG_VAR_NAME",
     "JaCeVar",
-    "compile_jax_sdfg",
     "dataclass_with_default_init",
     "get_jax_var_dtype",
     "get_jax_var_name",
@@ -55,6 +50,5 @@
     "is_scalar",
     "is_tracing_ongoing",
     "propose_jax_name",
-    "run_jax_sdfg",
     "translate_dtype",
 ]
diff --git a/src/jace/util/compiling.py b/src/jace/util/compiling.py
deleted file mode 100644
index 966b09d..0000000
--- a/src/jace/util/compiling.py
+++ /dev/null
@@ -1,138 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Contains everything for compiling and running `TranslatedJaxprSDFG` instances."""
-
-from __future__ import annotations
-
-import time
-from typing import TYPE_CHECKING, Any
-
-import dace
-import numpy as np
-from dace import data as dace_data
-
-from jace import util
-
-
-if TYPE_CHECKING:
-    from collections.abc import Mapping, Sequence
-
-    from jace import translator
-    from jace.util import dace_helper
-
-
-def compile_jax_sdfg(
-    tsdfg: translator.TranslatedJaxprSDFG,
-) -> dace_helper.CompiledSDFG:
-    """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object."""
-    if any(  # We do not support the DaCe return mechanism
-        array_name.startswith("__return")
-        for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
-    ):
-        raise ValueError("Only support SDFGs without '__return' members.")
-
-    # To ensure that the SDFG is compiled and to get rid of a warning we must modify
-    #  some settings of the SDFG. To fake an immutable SDFG, we will restore them later.
-    sdfg = tsdfg.sdfg
-    org_sdfg_name = sdfg.name
-    org_recompile = sdfg._recompile
-    org_regenerate_code = sdfg._regenerate_code
-
-    try:
-        # We need to give the SDFG another name, this is needed to prevent a DaCe error/warning.
-        #  This happens if we compile the same lowered SDFG multiple times with different options.
-        sdfg.name = f"{sdfg.name}__comp_{int(time.time() * 1000)}"
-
-        with dace.config.temporary_config():
-            sdfg._recompile = True
-            sdfg._regenerate_code = True
-            dace.Config.set("compiler", "use_cache", value=False)
-            csdfg: dace_helper.CompiledSDFG = sdfg.compile()
-
-    finally:
-        sdfg.name = org_sdfg_name
-        sdfg._recompile = org_recompile
-        sdfg._regenerate_code = org_regenerate_code
-
-    return csdfg
-
-
-def run_jax_sdfg(
-    csdfg: dace_helper.CompiledSDFG,
-    inp_names: Sequence[str],
-    out_names: Sequence[str],
-    call_args: Sequence[Any],
-    call_kwargs: Mapping[str, Any],
-) -> tuple[Any, ...] | Any:
-    """Run the compiled SDFG.
-
-    The function assumes that the SDFG was finalized and then compiled by
-    `compile_jax_sdfg()`. For running the SDFG you also have to pass the input
-    names (`inp_names`) and output names (`out_names`) that were inside the
-    `TranslatedJaxprSDFG` from which `csdfg` was compiled from.
-
-    Args:
-        csdfg: The `CompiledSDFG` object.
-        inp_names: List of names of the input arguments.
-        out_names: List of names of the output arguments.
-        call_args: All positional arguments of the call.
-        call_kwargs: All keyword arguments of the call.
-
-    Note:
-        There is no pytree mechanism jet, thus the return values are returned
-        inside a `tuple` or in case of one value, directly, in the order
-        determined by Jax. Furthermore, DaCe does not support scalar return
-        values, thus they are silently converted into arrays of length 1, the
-        same holds for inputs.
-
-    Todo:
-        - Implement non C strides.
-    """
-    sdfg: dace.SDFG = csdfg.sdfg
-
-    if len(call_kwargs) != 0:
-        raise NotImplementedError("No kwargs are supported yet.")
-    if len(inp_names) != len(call_args):
-        raise RuntimeError("Wrong number of arguments.")
-    if sdfg.free_symbols:  # This is a simplification that makes our life simple.
-        raise NotImplementedError(
-            f"No externally defined symbols are allowed, found: {sdfg.free_symbols}"
-        )
-
-    # Build the argument list that we will pass to the compiled object.
-    sdfg_call_args: dict[str, Any] = {}
-    for in_name, in_val in zip(inp_names, call_args, strict=True):
-        if util.is_scalar(in_val):
-            # Currently the translator makes scalar into arrays, this has to be reflected here
-            in_val = np.array([in_val])
-        sdfg_call_args[in_name] = in_val
-
-    for out_name, sdfg_array in ((out_name, sdfg.arrays[out_name]) for out_name in out_names):
-        if out_name in sdfg_call_args:
-            if util.is_jax_array(sdfg_call_args[out_name]):
-                # Jax arrays are immutable, so they can not be return values too.
-                raise ValueError("Passed a Jax array as output.")
-        else:
-            sdfg_call_args[out_name] = dace_data.make_array_from_descriptor(sdfg_array)
-
-    assert len(sdfg_call_args) == len(csdfg.argnames), (
-        "Failed to construct the call arguments,"
-        f" expected {len(csdfg.argnames)} but got {len(call_args)}."
-        f"\nExpected: {csdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
-    )
-
-    # Calling the SDFG
-    with dace.config.temporary_config():
-        dace.Config.set("compiler", "allow_view_arguments", value=True)
-        csdfg(**sdfg_call_args)
-
-    # Handling the output (pytrees are missing)
-    if not out_names:
-        return None
-    ret_val: tuple[Any] = tuple(sdfg_call_args[out_name] for out_name in out_names)
-    return ret_val[0] if len(out_names) == 1 else ret_val
diff --git a/src/jace/util/dace_helper.py b/src/jace/util/dace_helper.py
index a380272..613a59c 100644
--- a/src/jace/util/dace_helper.py
+++ b/src/jace/util/dace_helper.py
@@ -5,14 +5,144 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements all utility functions that are related to DaCe.
-
-Most of the functions defined here allow an unified access to DaCe's internals
-in a consistent and stable way.
-"""
+"""Implements all utility functions that are related to DaCe."""
 
 from __future__ import annotations
 
+import time
+from typing import TYPE_CHECKING, Any
+
+import dace
+import numpy as np
+from dace import data as dace_data
+
 # The compiled SDFG is not available in the dace namespace or anywhere else
 #  Thus we import it here directly
-from dace.codegen.compiled_sdfg import CompiledSDFG as CompiledSDFG
+from dace.codegen.compiled_sdfg import CompiledSDFG
+
+from jace import util
+
+
+if TYPE_CHECKING:
+    from collections.abc import Mapping, Sequence
+
+    from jace import translator
+    from jace.util import dace_helper
+
+__all__ = [
+    "CompiledSDFG",
+    "compile_jax_sdfg",
+    "run_jax_sdfg",
+]
+
+
+def compile_jax_sdfg(
+    tsdfg: translator.TranslatedJaxprSDFG,
+) -> dace_helper.CompiledSDFG:
+    """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object."""
+    if any(  # We do not support the DaCe return mechanism
+        array_name.startswith("__return")
+        for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
+    ):
+        raise ValueError("Only support SDFGs without '__return' members.")
+
+    # To ensure that the SDFG is compiled and to get rid of a warning we must modify
+    #  some settings of the SDFG. To fake an immutable SDFG, we will restore them later.
+    sdfg = tsdfg.sdfg
+    org_sdfg_name = sdfg.name
+    org_recompile = sdfg._recompile
+    org_regenerate_code = sdfg._regenerate_code
+
+    try:
+        # We need to give the SDFG another name, this is needed to prevent a DaCe error/warning.
+        #  This happens if we compile the same lowered SDFG multiple times with different options.
+        sdfg.name = f"{sdfg.name}__comp_{int(time.time() * 1000)}"
+
+        with dace.config.temporary_config():
+            sdfg._recompile = True
+            sdfg._regenerate_code = True
+            dace.Config.set("compiler", "use_cache", value=False)
+            csdfg: dace_helper.CompiledSDFG = sdfg.compile()
+
+    finally:
+        sdfg.name = org_sdfg_name
+        sdfg._recompile = org_recompile
+        sdfg._regenerate_code = org_regenerate_code
+
+    return csdfg
+
+
+def run_jax_sdfg(
+    csdfg: dace_helper.CompiledSDFG,
+    inp_names: Sequence[str],
+    out_names: Sequence[str],
+    call_args: Sequence[Any],
+    call_kwargs: Mapping[str, Any],
+) -> tuple[Any, ...] | Any:
+    """Run the compiled SDFG.
+
+    The function assumes that the SDFG was finalized and then compiled by
+    `compile_jax_sdfg()`. For running the SDFG you also have to pass the input
+    names (`inp_names`) and output names (`out_names`) that were inside the
+    `TranslatedJaxprSDFG` from which `csdfg` was compiled from.
+
+    Args:
+        csdfg: The `CompiledSDFG` object.
+        inp_names: List of names of the input arguments.
+        out_names: List of names of the output arguments.
+        call_args: All positional arguments of the call.
+        call_kwargs: All keyword arguments of the call.
+
+    Note:
+        There is no pytree mechanism jet, thus the return values are returned
+        inside a `tuple` or in case of one value, directly, in the order
+        determined by Jax. Furthermore, DaCe does not support scalar return
+        values, thus they are silently converted into arrays of length 1, the
+        same holds for inputs.
+
+    Todo:
+        - Implement non C strides.
+    """
+    sdfg: dace.SDFG = csdfg.sdfg
+
+    if len(call_kwargs) != 0:
+        raise NotImplementedError("No kwargs are supported yet.")
+    if len(inp_names) != len(call_args):
+        raise RuntimeError("Wrong number of arguments.")
+    if sdfg.free_symbols:  # This is a simplification that makes our life simple.
+        raise NotImplementedError(
+            f"No externally defined symbols are allowed, found: {sdfg.free_symbols}"
+        )
+
+    # Build the argument list that we will pass to the compiled object.
+    sdfg_call_args: dict[str, Any] = {}
+    for in_name, in_val in zip(inp_names, call_args, strict=True):
+        if util.is_scalar(in_val):
+            # Currently the translator makes scalar into arrays, this has to be reflected here
+            in_val = np.array([in_val])
+        sdfg_call_args[in_name] = in_val
+
+    for out_name, sdfg_array in ((out_name, sdfg.arrays[out_name]) for out_name in out_names):
+        if out_name in sdfg_call_args:
+            if util.is_jax_array(sdfg_call_args[out_name]):
+                # Jax arrays are immutable, so they can not be return values too.
+                raise ValueError("Passed a Jax array as output.")
+        else:
+            sdfg_call_args[out_name] = dace_data.make_array_from_descriptor(sdfg_array)
+
+    assert len(sdfg_call_args) == len(csdfg.argnames), (
+        "Failed to construct the call arguments,"
+        f" expected {len(csdfg.argnames)} but got {len(call_args)}."
+        f"\nExpected: {csdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
+    )
+
+    # Calling the SDFG
+    with dace.config.temporary_config():
+        dace.Config.set("compiler", "allow_view_arguments", value=True)
+        csdfg(**sdfg_call_args)
+
+    # Handling the output (pytrees are missing)
+    if not out_names:
+        return None
+    ret_val: tuple[Any] = tuple(sdfg_call_args[out_name] for out_name in out_names)
+    return ret_val[0] if len(out_names) == 1 else ret_val
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 8fa982f..ca6f60c 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -73,7 +73,10 @@ def __post_init__(self) -> None:
     def __hash__(self) -> int:
         return id(self)
 
-    def __eq__(self, other: Any) -> bool:
+    def __eq__(
+        self,
+        other: Any,
+    ) -> bool:
         if not isinstance(other, JaCeVar):
             return NotImplemented
         return id(self) == id(other)
@@ -99,7 +102,9 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
             )
 
 
-def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symbol | str, ...]:
+def get_jax_var_shape(
+    jax_var: jax_core.Atom | JaCeVar,
+) -> tuple[int | dace.symbol | str, ...]:
     """Returns the shape of `jax_var`."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
@@ -112,7 +117,9 @@ def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symb
             raise TypeError(f"'get_jax_var_shape()` is not implemented for '{type(jax_var)}'.")
 
 
-def get_jax_var_dtype(jax_var: jax_core.Atom | JaCeVar) -> dace.typeclass:
+def get_jax_var_dtype(
+    jax_var: jax_core.Atom | JaCeVar,
+) -> dace.typeclass:
     """Returns the DaCe equivalent of `jax_var`s datatype."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
@@ -140,7 +147,9 @@ def is_tracing_ongoing(
     return any(isinstance(x, jax_core.Tracer) for x in itertools.chain(args, kwargs.values()))
 
 
-def translate_dtype(dtype: Any) -> dace.typeclass:
+def translate_dtype(
+    dtype: Any,
+) -> dace.typeclass:
     """Turns a Jax datatype into a DaCe datatype."""
     if dtype is None:
         raise NotImplementedError  # Handling a special case in DaCe.
@@ -201,7 +210,9 @@ def propose_jax_name(
     return jax_name
 
 
-def get_jax_literal_value(lit: jax_core.Atom) -> bool | float | int | np.generic:
+def get_jax_literal_value(
+    lit: jax_core.Atom,
+) -> bool | float | int | np.generic:
     """Returns the value a literal is wrapping.
 
     The function guarantees to return a scalar value.
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index c9e9059..acada34 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -19,7 +19,9 @@
 import jace.util as util
 
 
-def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVar]:
+def is_drop_var(
+    jax_var: jax_core.Atom | util.JaCeVar,
+) -> TypeGuard[jax_core.DropVar]:
     """Tests if `jax_var` is a drop variable, i.e. a variable that is not read from in a Jaxpr."""
 
     if isinstance(jax_var, jax_core.DropVar):

From c8b9763d87515a08fbe8ba068f03bb409bf8de1e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 6 Jun 2024 08:14:07 +0200
Subject: [PATCH 313/458] Reapplied some stuff.

---
 src/jace/optimization.py                      |  5 +-
 .../mapped_operation_base_translator.py       | 52 ++++++++++---------
 src/jace/translator/primitive_translator.py   |  6 +--
 .../arithmetic_logical_translators.py         | 45 ++++++++--------
 .../convert_element_type_translator.py        | 10 ++--
 .../primitive_translators/copy_translator.py  | 17 +++---
 .../select_n_translator.py                    | 12 ++---
 .../primitive_translators/slicing.py          | 10 ++--
 8 files changed, 84 insertions(+), 73 deletions(-)

diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index 21f33a0..63528db 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -64,8 +64,9 @@ def jace_optimize(
         tsdfg: The translated SDFG that should be optimized.
         simplify: Run the simplification pipeline.
         auto_optimize: Run the auto optimization pipeline (currently does nothing)
-        persistent:  Make the memory allocation persistent, i.e. allocate the transients only
-            once at the beginning and then reuse the memory across the lifetime of the SDFG.
+        persistent:  Make the memory allocation persistent, i.e. allocate the
+            transients only once at the beginning and then reuse the memory across
+            the lifetime of the SDFG.
     """
     # Currently this function exists primarily for the same of existing.
 
diff --git a/src/jace/translator/mapped_operation_base_translator.py b/src/jace/translator/mapped_operation_base_translator.py
index bc814ec..2b70f30 100644
--- a/src/jace/translator/mapped_operation_base_translator.py
+++ b/src/jace/translator/mapped_operation_base_translator.py
@@ -27,25 +27,27 @@
 class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
     """Implements the base for all "mapped base operations".
 
-    A mapped base operation `f` is an operation that has several inputs arrays that are
-    elementwise combined to a single output array. A prime example for this would be the
-    addition of two arrays.
-    Essentially it assumes that the Tasklet code can be written as:
+    A mapped base operation `f` is an operation that has several inputs arrays
+    that are elementwise combined to a single output array. A prime example for
+    this would be the addition of two arrays. Essentially it assumes that the
+    Tasklet code can be written as:
     ```
         __out = f(__in0, __in1, __in3, ...)
     ```
-    where `__in*` are the connector names of the Tasklet and `__out` is the output connector. For
-    problems such as this, the SDFG API provides the `SDFGState.add_mapped_tasklet()` function,
-    however, in most cases it can not be directly used, for various reasons.
-    Thus this class acts like a convenience wrapper around it.
+    where `__in*` are the connector names of the Tasklet and `__out` is the
+    output connector. For problems such as this, the SDFG API provides the
+    `SDFGState.add_mapped_tasklet()` function, however, in most cases it can not
+    be directly used, for various reasons. Thus this class acts like a
+    convenience wrapper around it.
 
-    To use this class a user has to overwrite the `write_tasklet_code()` function. This function
-    generates the entire code that should be put into the Tasklet, include the assignment to
-    `__out`. If needed the translator will perform literal substitution on the returned code and
-    broadcast the inputs to match the outputs.
+    To use this class a user has to overwrite the `write_tasklet_code()` function.
+    This function generates the entire code that should be put into the Tasklet,
+    include the assignment to `__out`. If needed the translator will perform
+    literal substitution on the returned code and broadcast the inputs to match
+    the outputs.
 
-    If needed a subclass can also override the `make_input_memlets()` function to generate custom
-    input Memlets, such as adding an offset.
+    If needed a subclass can also override the `make_input_memlets()` function
+    to generate custom input Memlets, such as adding an offset.
 
     Args:
         primitive_name:     The name of the primitive `self` should bind to.
@@ -77,11 +79,11 @@ def __call__(
     ) -> None:
         """Create the mapped Tasklet.
 
-        The function will create the map ranges and based on the shape of the output array.
-        It will then call `make_input_memlets()` to get the input Memlets.
-        After that it calls `write_tasklet_code()` to get the Tasklet code
-        and perform literal substitution by forwarding it to `self.literal_substitution()`.
-        After that it will create the mapped Tasklet.
+        The function will create the map ranges and based on the shape of the
+        output array. It will then call `make_input_memlets()` to get the input
+        Memlets. After that it calls `write_tasklet_code()` to get the Tasklet
+        code and perform literal substitution by forwarding it to
+        `self.literal_substitution()`. After that it will create the mapped Tasklet.
 
         Note:
             For a description of the arguments see `PrimitiveTranslatorCallable`.
@@ -135,8 +137,8 @@ def write_tasklet_code(
         However, the base will do literal substitution on the returned object.
 
         Args:
-            tskl_ranges:    List of pairs used as map parameter, first element is the name
-                iteration index of the dimension, second is its range, i.e. `0:SIZE`.
+            tskl_ranges:    List of pairs used as map parameter, first element
+                is the name iteration index of the dimension, second is its range.
             in_var_names:   The list of SDFG variables used as input, `None` if literal.
             eqn:            The equation.
         """
@@ -150,12 +152,12 @@ def make_input_memlets(
     ) -> dict[str, dace.Memlet]:
         """Generate the input Memlets for the non literal operators of the primitive.
 
-        The returned `dict` maps the input connector of the Tasklet to the Memlet that is used
-        to connect it to the Map entry node.
+        The returned `dict` maps the input connector of the Tasklet to the Memlet
+        that is used to connect it to the Map entry node.
 
         Args:
-            tskl_ranges:    List of pairs used as map parameter, first element is the name
-                iteration index of the dimension, second is its range, i.e. `0:SIZE`.
+            tskl_ranges:    List of pairs used as map parameter, first element
+                is the name iteration index of the dimension, second is its range
             in_var_names:   The list of SDFG variables used as input, `None` if literal.
             eqn:            The equation object.
         """
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index bd149d3..aaf164f 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -195,9 +195,9 @@ def register_primitive_translator(
         overwrite: Replace the current primitive translator with `primitive_translator`.
 
     Note:
-        To add a `primitive` property use the `@make_primitive_translator` decorator.
-        This function returns `primitive_translator` unmodified, which allows it to be
-        used as decorator.
+        To add a `primitive` property use the `@make_primitive_translator`
+        decorator. This function returns `primitive_translator` unmodified,
+        which allows it to be used as decorator.
     """
 
     def wrapper(
diff --git a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
index d323395..a344c4a 100644
--- a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
+++ b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
@@ -31,18 +31,18 @@
 class ArithmeticOperationTranslator(mapped_base.MappedOperationTranslatorBase):
     """Translator for all arithmetic operations.
 
-    The class makes use of the `MappedOperationTranslatorBase`. It only implements the
-    `write_tasklet_code()` to generate the code for a Tasklet from a template.
+    The class makes use of the `MappedOperationTranslatorBase`. It only implements
+    the `write_tasklet_code()` to generate the code for a Tasklet from a template.
 
     Args:
         prim_name:      The name of the primitive that should be handled.
         tskl_tmpl:      Template used for generating the Tasklet code.
 
     Note:
-        - It does not implement the logical operations, they are implemented by the
-            `LogicalOperationTranslator` class.
-        - It does not implement `mod` nor `fmod` as they are translated to some nested `pjit`
-            implementation by Jax for unknown reasons.
+        - It does not implement the logical operations, they are implemented by
+            the `LogicalOperationTranslator` class.
+        - It does not implement `mod` nor `fmod` as they are translated to some
+            nested `pjit` implementation by Jax for unknown reasons.
     """
 
     def __init__(
@@ -70,23 +70,23 @@ def write_tasklet_code(
 class LogicalOperationTranslator(mapped_base.MappedOperationTranslatorBase):
     """Translator for all logical operations.
 
-    The reason why the logical operations are separated from the arithmetic operation is quite
-    complicated, and in fact the whole thing is harder than it should be.
-    NumPy has two kinds of these operations, i.e. `logical_{and, or, xor, not}()` and
-    `bitwise_{and, or, xor, not}()`, but Jax has only a single kind of logical operations, that
-    operate in bitwise mode.
-    The first idea would be to use `ArithmeticOperationTranslator` with a template such as
-    `__out = __in0 & __in1` or `__out = ~__in0`. Since DaCe eventually generates C++ code and C++
-    has a native bool type, and `true` is guaranteed to be `1` and `false` equals `0`, this works
-    for all operations except `not`, as `~true` in C++ is again `true`. Thus the `not` primitive
-    must be handled separately, however, it does not make sense to split the logical operations,
+    The reason why the logical operations are separated from the arithmetic
+    operation is quite complicated, and in fact the whole thing is harder than
+    it should be. NumPy has two kinds of these operations, i.e.
+    `logical_{and, or, xor, not}()` and `bitwise_{and, or, xor, not}()`, but Jax
+    has only a single kind of logical operations, that operate in bitwise mode.
+    The first idea would be to use `ArithmeticOperationTranslator` with a template
+    such as `__out = __in0 & __in1` or `__out = ~__in0`. Since DaCe eventually
+    generates C++ code and C++ has a native bool type, and `true` is guaranteed
+    to be `1` and `false` equals `0`, this works for all operations except `not`,
+    as `~true` in C++ is again `true`. Thus the `not` primitive must be handled
+    separately, however, it does not make sense to split the logical operations,
     thus all of them are handled by this class.
-    I think that in XLA, Jax target language, a bool is either a single bit or either all bits are
-    one or zero.
 
-    The solution to the problem is, to introduce two templates, one used for the bool context
-    and one used in the integer context. This works because depending if the `logical_*()` or
-    `bitwise_*()` functions are used the input is either of type bool or an integer.
+    The solution to the problem is, to introduce two templates, one used for the
+    bool context and one used in the integer context. This works because depending
+    if the `logical_*()` or `bitwise_*()` functions are used the input is either
+    of type bool or an integer.
 
     Args:
         prim_name:      The name of the primitive that should be handled.
@@ -94,7 +94,8 @@ class LogicalOperationTranslator(mapped_base.MappedOperationTranslatorBase):
         bool_tmpl:      The template used for the bool case.
 
     Notes:
-        This class does not do parameter substitution as the `ArithmeticOperationTranslator` does.
+        This class does not do parameter substitution as the
+        `ArithmeticOperationTranslator` does.
     """
 
     def __init__(
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index 16e5e78..59230d8 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -30,13 +30,13 @@ class ConvertElementTypeTranslator(mapped_base.MappedOperationTranslatorBase):
     Copies the input to the output and performs type conversion.
 
     Notes:
-        This translator ignores the `new_dtype` and `weak_type` parameter the equation
-        and only performs the casting.
+        This translator ignores the `new_dtype` and `weak_type` parameter the
+        equation and only performs the casting.
 
     Todo:
-        - Occasionally Jax generates a cast that is not needed, because the types are the same.
-            Currently this is handled, by generating an explicit copy, however, it should be
-            handled by a Memlet.
+        Occasionally Jax generates a cast that is not needed, because the types
+        are the same. Currently this is handled, by generating an explicit copy,
+        however, it should be handled by a Memlet.
     """
 
     def __init__(self) -> None:
diff --git a/src/jace/translator/primitive_translators/copy_translator.py b/src/jace/translator/primitive_translators/copy_translator.py
index 69dc923..c1afb34 100644
--- a/src/jace/translator/primitive_translators/copy_translator.py
+++ b/src/jace/translator/primitive_translators/copy_translator.py
@@ -24,7 +24,11 @@
 
 
 class CopyTranslator(mapped_base.MappedOperationTranslatorBase):
-    """Copy operations are implemented as a map to ensure that they can be fused with other maps."""
+    """Implements the `copy` primitive.
+
+    Copy operations are implemented as a map to ensure that they can be fused
+    with other maps
+    ."""
 
     def __init__(self) -> None:
         super().__init__(primitive_name="copy")
@@ -42,13 +46,14 @@ def write_tasklet_code(
 class DevicePutTranslator(mapped_base.MappedOperationTranslatorBase):
     """The `device_put` primitive is used to transfer data between host and device.
 
-    The current implementation only supports the copying where the data already is. Currently DaCe
-    only knows about the Host and the GPU. Furthermore, currently JaCe works in such a way that
-    everything is either put on the host or the device. Because of this, the `DevicePutTranslator`
-    is, currently, just a simple copy operation that should be removed, by the optimization.
+    The current implementation only supports the copying where the data already
+    is. Currently DaCe only knows about the Host and the GPU. Furthermore,
+    currently JaCe works in such a way that everything is either put on the host
+    or the device. Because of this, the `DevicePutTranslator` is, currently,
+    just a simple copy operation that should be removed, by the optimization.
 
     Todo:
-        - Make into a Memlet because only the Memlet can handle copying between devices.
+        Make into a Memlet because only the Memlet can handle copying between devices.
     """
 
     def __init__(self) -> None:
diff --git a/src/jace/translator/primitive_translators/select_n_translator.py b/src/jace/translator/primitive_translators/select_n_translator.py
index 3d21113..ee5eb5c 100644
--- a/src/jace/translator/primitive_translators/select_n_translator.py
+++ b/src/jace/translator/primitive_translators/select_n_translator.py
@@ -27,16 +27,16 @@
 class SelectNTranslator(mapped_base.MappedOperationTranslatorBase):
     """Implements the `select_n` primitive, which is a generalization of `np.where`
 
-    While `numpy.where` only supports two cases, the Jax primitive supports an arbitrary number
-    of cases. In that sense it is essentially a `C` `switch` statement, only that all cases have
-    to materialize.
+    While `numpy.where` only supports two cases, the Jax primitive supports an
+    arbitrary number of cases. In that sense it is essentially a `C` `switch`
+    statement, only that all cases have to materialize.
 
     The behaviour is undefined if the predicate is out of bound.
 
     Note:
-        For a better understanding this function renames its input connectors. The first one,
-        which is the predicate, is renamed to `__cond` and the others are renamed again to
-        `__in{i}`, starting with zero.
+        For a better understanding this function renames its input connectors.
+        The first one, which is the predicate, is renamed to `__cond` and the
+        others are renamed again to `__in{i}`, starting with zero.
     """
 
     def __init__(self) -> None:
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index c900f06..fb16040 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -70,12 +70,14 @@ class DynamicSlicingTranslator(translator.PrimitiveTranslator):
     """Implements the dynamic slicing translator.
 
     The [dynamic slicing](https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.dynamic_slice.html)
-    performs a slicing of a _fixed_ window, however, the starting indexes are not fix, but are
-    variables that can come from the outside. Thus, the translator uses "Dynamic Map Ranges".
-    Furthermore, Jax guarantees that if the window overruns the start indexes are adjusted.
+    performs a slicing of a _fixed_ window, however, the starting indexes are
+    not fix, but are variables that can come from the outside. Thus, the
+    translator uses "Dynamic Map Ranges". Furthermore, Jax guarantees that if
+    the window overruns the start indexes are adjusted.
 
     Note:
-        Unlike the normal slicing primitive, it is not derived from `MappedOperationTranslatorBase`.
+        Unlike the normal slicing primitive, it is not derived from
+        `MappedOperationTranslatorBase`.
     """
 
     @property

From f5b7ccc102149c4635abf34a2799b125c12a0ef4 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 6 Jun 2024 08:42:34 +0200
Subject: [PATCH 314/458] Adapted formating in the tests, however, they are so
 ugly.

---
 tests/conftest.py                             | 24 ++++---
 ...primitive_arithmetic_logical_operations.py | 70 ++++++++++++-------
 .../test_primitive_broadcast_in_dim.py        | 12 ++--
 .../test_primitive_convert_element_type.py    | 21 ++++--
 .../test_primitive_copy.py                    |  2 +-
 .../test_primitive_iota.py                    |  4 +-
 .../test_primitive_reshape.py                 | 16 +++--
 .../test_primitive_select_n.py                | 11 +--
 .../test_primitive_slicing.py                 | 47 +++++++++----
 .../test_primitive_squeeze_expand_dims.py     | 16 +++--
 tests/integration_tests/test_empty_jaxpr.py   | 14 ++--
 .../test_jaxpr_translator_builder.py          | 10 ++-
 .../test_primitive_translator_managing.py     | 31 ++++----
 tests/unit_tests/test_caching.py              |  6 +-
 tests/unit_tests/test_decorator.py            |  7 +-
 tests/unit_tests/test_jax_api.py              | 12 ++--
 tests/unit_tests/test_misc.py                 |  2 +-
 tests/unit_tests/test_package.py              |  2 +-
 18 files changed, 197 insertions(+), 110 deletions(-)

diff --git a/tests/conftest.py b/tests/conftest.py
index 936d6be..df8e75c 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -22,26 +22,28 @@
 
 
 @pytest.fixture(autouse=True)
-def _enable_x64_mode_in_jax():
+def _enable_x64_mode_in_jax() -> None:
     """Fixture of enable the `x64` mode in Jax.
 
-    Currently, JaCe requires that `x64` mode is enabled and will do all Jax things with it enabled.
-    However, if we use Jax with the intend to compare it against JaCe we must also enable it for
-    Jax.
+    Currently, JaCe requires that `x64` mode is enabled and will do all Jax
+    things with it enabled. However, if we use Jax with the intend to compare
+    it against JaCe we must also enable it for Jax.
     """
     with jax.experimental.enable_x64():
         yield
 
 
 @pytest.fixture(autouse=True)
-def _disable_jit():
+def _disable_jit() -> None:
     """Fixture for disable the dynamic jiting in Jax.
 
-    For certain reasons Jax puts certain primitives inside a `pjit` primitive, i.e. nested Jaxpr.
-    The intent is, that these operations can/should run on an accelerator.
+    For certain reasons Jax puts certain primitives inside a `pjit` primitive,
+    i.e. nested Jaxpr. The intent is, that these operations can/should run on
+    an accelerator.
 
-    But this is a problem, since JaCe can not handle this primitive, it leads to an error.
-    To overcome this problem, we will globally disable this feature until we can handle `pjit`.
+    But this is a problem, since JaCe can not handle this primitive, it leads
+    to an error. To overcome this problem, we will globally disable this feature
+    until we can handle `pjit`.
 
     Todo:
         Remove as soon as we can handle nested `jit`.
@@ -51,7 +53,7 @@ def _disable_jit():
 
 
 @pytest.fixture(autouse=True)
-def _clear_translation_cache():
+def _clear_translation_cache() -> None:
     """Decorator that clears the translation cache.
 
     Ensures that a function finds an empty cache and clears up afterwards.
@@ -62,7 +64,7 @@ def _clear_translation_cache():
 
 
 @pytest.fixture(autouse=True)
-def _reset_random_seed():
+def _reset_random_seed() -> None:
     """Fixture for resetting the random seed.
 
     This ensures that for every test the random seed of NumPy is reset.
diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index c1b533d..f2bf813 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -34,7 +34,7 @@
 
 
 @pytest.fixture(autouse=True)
-def _only_alu_translators():
+def _only_alu_translators() -> None:
     """Removes all non arithmetic/logical translator from the registry.
 
     This ensures that Jax is not doing some stuff that is supposed to be handled by the
@@ -75,7 +75,9 @@ def _only_alu_translators():
         (jnp.bitwise_not, 1, np.int64),
     ]
 )
-def logical_ops(request) -> tuple[Callable, tuple[np.ndarray, ...]]:
+def logical_ops(
+    request,
+) -> tuple[Callable, tuple[np.ndarray, ...]]:
     """Returns a logical operation function and inputs."""
     return (
         request.param[0],
@@ -92,7 +94,9 @@ def logical_ops(request) -> tuple[Callable, tuple[np.ndarray, ...]]:
         ),
     ]
 )
-def dtype(request) -> np.generic:
+def dtype(
+    request,
+) -> np.generic:
     """The dtypes that should be used for the full alu tests."""
     return request.param
 
@@ -119,7 +123,10 @@ def dtype(request) -> np.generic:
         lambda x: jnp.atanh(jnp.tanh(x)),
     ]
 )
-def alu_unary_ops(request, dtype) -> tuple[Callable, np.ndarray]:
+def alu_unary_ops(
+    request,
+    dtype: type,
+) -> tuple[Callable, np.ndarray]:
     """The inputs and the operation we need for the full test."""
     return (request.param, testutil.mkarray((2, 2), dtype))
 
@@ -135,7 +142,9 @@ def alu_unary_ops(request, dtype) -> tuple[Callable, np.ndarray]:
         jnp.nextafter,
     ]
 )
-def alu_binary_ops_float(request) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
+def alu_binary_ops_float(
+    request,
+) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
     """All binary operations that can handle floats, complex values are not tested."""
     # Getting 0 in the division test is unlikely.
     return (  # type: ignore[return-value]  # Type confusion.
@@ -154,7 +163,9 @@ def alu_binary_ops_float(request) -> tuple[Callable, tuple[np.ndarray, np.ndarra
         lambda x, y: x > y,
     ]
 )
-def alu_binary_compare_ops(request) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
+def alu_binary_compare_ops(
+    request,
+) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
     """These are the comparison operations, that we test with integers, since it is simpler."""
     return (
         request.param,
@@ -162,7 +173,10 @@ def alu_binary_compare_ops(request) -> tuple[Callable, tuple[np.ndarray, np.ndar
     )
 
 
-def _perform_alu_test(testee: Callable, *args: Any) -> None:
+def _perform_alu_test(
+    testee: Callable,
+    *args: Any,
+) -> None:
     """General function that just performs the test."""
     wrapped = jace.jit(testee)
 
@@ -180,7 +194,7 @@ def _perform_alu_test(testee: Callable, *args: Any) -> None:
     assert np.allclose(ref, res), f"Expected '{ref.tolist()}' got '{res.tolist()}'"
 
 
-def test_alu_unary_scalar():
+def test_alu_unary_scalar() -> None:
     """Test unary ALU translator in the scalar case."""
 
     def testee(A: np.float64) -> np.float64 | jax.Array:
@@ -189,7 +203,7 @@ def testee(A: np.float64) -> np.float64 | jax.Array:
     _perform_alu_test(testee, np.float64(1.0))
 
 
-def test_alu_unary_array():
+def test_alu_unary_array() -> None:
     """Test unary ALU translator with array argument."""
 
     def testee(A: np.ndarray) -> jax.Array:
@@ -200,7 +214,7 @@ def testee(A: np.ndarray) -> jax.Array:
     _perform_alu_test(testee, A)
 
 
-def test_alu_unary_scalar_literal():
+def test_alu_unary_scalar_literal() -> None:
     """Test unary ALU translator with literal argument"""
 
     def testee(A: float) -> float | jax.Array:
@@ -209,7 +223,7 @@ def testee(A: float) -> float | jax.Array:
     _perform_alu_test(testee, 10.0)
 
 
-def test_alu_unary_integer_power():
+def test_alu_unary_integer_power() -> None:
     """Tests the integer power, which has a parameter."""
 
     def testee(A: np.ndarray) -> np.ndarray:
@@ -219,7 +233,9 @@ def testee(A: np.ndarray) -> np.ndarray:
     _perform_alu_test(testee, A)
 
 
-def test_alu_binary_power(dtype):
+def test_alu_binary_power(
+    dtype: type,
+):
     """Tests the "normal" power operator, i.e. not with a known integer power."""
 
     def testee(A: np.ndarray, exp: np.generic) -> np.ndarray:
@@ -230,7 +246,7 @@ def testee(A: np.ndarray, exp: np.generic) -> np.ndarray:
     _perform_alu_test(testee, A, exp)
 
 
-def test_alu_binary_scalar():
+def test_alu_binary_scalar() -> None:
     """Scalar binary operation."""
 
     def testee(A: np.float64, B: np.float64) -> np.float64:
@@ -239,7 +255,7 @@ def testee(A: np.float64, B: np.float64) -> np.float64:
     _perform_alu_test(testee, np.float64(1.0), np.float64(2.0))
 
 
-def test_alu_binary_scalar_literal():
+def test_alu_binary_scalar_literal() -> None:
     """Scalar binary operation, with a literal."""
 
     def testeeR(A: np.float64) -> np.float64:
@@ -253,7 +269,7 @@ def testeeL(A: np.float64) -> np.float64:
     _perform_alu_test(testeeL, A)
 
 
-def test_alu_binary_array():
+def test_alu_binary_array() -> None:
     """Test binary of arrays, with same size."""
 
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
@@ -264,7 +280,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     _perform_alu_test(testee, A, B)
 
 
-def test_alu_binary_array_scalar():
+def test_alu_binary_array_scalar() -> None:
     """Test binary of array with scalar."""
 
     def testee(A: np.ndarray | np.float64, B: np.float64 | np.ndarray) -> np.ndarray:
@@ -276,7 +292,7 @@ def testee(A: np.ndarray | np.float64, B: np.float64 | np.ndarray) -> np.ndarray
     _perform_alu_test(testee, B, A)
 
 
-def test_alu_binary_array_literal():
+def test_alu_binary_array_literal() -> None:
     """Test binary of array with literal"""
 
     def testeeR(A: np.ndarray) -> np.ndarray:
@@ -290,7 +306,7 @@ def testeeL(A: np.ndarray) -> np.ndarray:
     _perform_alu_test(testeeL, A)
 
 
-def test_alu_binary_array_constants():
+def test_alu_binary_array_constants() -> None:
     """Test binary of array with constant."""
 
     def testee(A: np.ndarray) -> np.ndarray:
@@ -300,7 +316,7 @@ def testee(A: np.ndarray) -> np.ndarray:
     _perform_alu_test(testee, A)
 
 
-def test_alu_binary_broadcast_1():
+def test_alu_binary_broadcast_1() -> None:
     """Test broadcasting."""
 
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
@@ -312,7 +328,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     _perform_alu_test(testee, B, A)
 
 
-def test_alu_binary_broadcast_2():
+def test_alu_binary_broadcast_2() -> None:
     """Test broadcasting."""
 
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
@@ -324,7 +340,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     _perform_alu_test(testee, B, A)
 
 
-def test_alu_binary_broadcast_3():
+def test_alu_binary_broadcast_3() -> None:
     """Test broadcasting."""
 
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
@@ -336,7 +352,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     _perform_alu_test(testee, B, A)
 
 
-def test_alu_unary_isfinite():
+def test_alu_unary_isfinite() -> None:
     def testee(A: np.ndarray) -> jax.Array:
         return jnp.isfinite(A)
 
@@ -364,7 +380,9 @@ def testee(*args: np.ndarray) -> np.ndarray:
     _perform_alu_test(testee, *inputs)
 
 
-def test_alu_general_unary(alu_unary_ops: tuple[Callable, np.ndarray]):
+def test_alu_general_unary(
+    alu_unary_ops: tuple[Callable, np.ndarray],
+) -> None:
     """General test for the unary operations."""
 
     def testee(A: np.ndarray) -> np.ndarray:
@@ -375,7 +393,7 @@ def testee(A: np.ndarray) -> np.ndarray:
 
 def test_alu_general_binary_float(
     alu_binary_ops_float: tuple[Callable, tuple[np.ndarray, np.ndarray]],
-):
+) -> None:
     """Tests the binary operations that runs on floating points."""
 
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
@@ -384,7 +402,9 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     _perform_alu_test(testee, *alu_binary_ops_float[1])
 
 
-def test_alu_compare_ops(alu_binary_compare_ops: tuple[Callable, tuple[np.ndarray, np.ndarray]]):
+def test_alu_compare_ops(
+    alu_binary_compare_ops: tuple[Callable, tuple[np.ndarray, np.ndarray]],
+) -> None:
     """Test all the comparison operations."""
 
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
diff --git a/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
index f49efdc..ae85c81 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
@@ -34,12 +34,14 @@
 
 
 @pytest.fixture(params=[(10,), (10, 1), (1, 10)])
-def vector_shape(request) -> tuple[int, ...]:
+def vector_shape(
+    request,
+) -> tuple[int, ...]:
     """Shapes used in the `test_bid_vector()` tests."""
     return request.param
 
 
-def test_bid_scalar():
+def test_bid_scalar() -> None:
     """Broadcast a scalar to a matrix."""
 
     def testee(A: float) -> jax.Array:
@@ -54,7 +56,7 @@ def testee(A: float) -> jax.Array:
         assert np.all(res == ref), f"Expected '{ref.tolist()}' got '{res.tolist()}'."
 
 
-def test_bid_literal():
+def test_bid_literal() -> None:
     """Broadcast a literal to a matrix."""
 
     def testee(a: float) -> np.ndarray | jax.Array:
@@ -67,7 +69,9 @@ def testee(a: float) -> np.ndarray | jax.Array:
     assert np.all(res == ref)
 
 
-def test_bid_vector(vector_shape: Sequence[int]):
+def test_bid_vector(
+    vector_shape: Sequence[int],
+) -> None:
     """Broadcast a vector to a tensor."""
 
     def testee(a: np.ndarray) -> np.ndarray | jax.Array:
diff --git a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
index dffc125..ef98e72 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
@@ -34,13 +34,17 @@
 
 
 @pytest.fixture(params=_DACE_REAL_TYPES)
-def src_type(request) -> type:
+def src_type(
+    request,
+) -> type:
     """All valid source types, with the exception of bool."""
     return request.param
 
 
 @pytest.fixture(params=_DACE_REAL_TYPES + _DACE_COMPLEX_TYPES)
-def dst_type(request) -> type:
+def dst_type(
+    request,
+) -> type:
     """All valid destination types, with the exception of bool.
 
     Includes also complex types, because going from real to complex is useful, but the other
@@ -72,14 +76,21 @@ def converter(A: np.ndarray) -> jax.Array:
     return True
 
 
-def test_convert_element_type_main(src_type, dst_type):
+def test_convert_element_type_main(
+    src_type: type,
+    dst_type: type,
+) -> None:
     """Tests all conversions with the exception of conversions from bool and complex."""
     _convert_element_type_impl(src_type, dst_type)
 
 
-def test_convert_element_type_from_bool(src_type):
+def test_convert_element_type_from_bool(
+    src_type: type,
+) -> None:
     _convert_element_type_impl(np.bool_, src_type)
 
 
-def test_convert_element_type_to_bool(src_type):
+def test_convert_element_type_to_bool(
+    src_type: type,
+) -> None:
     _convert_element_type_impl(src_type, np.bool_)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_copy.py b/tests/integration_tests/primitive_translators/test_primitive_copy.py
index ecbc3c6..c4a3d62 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_copy.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_copy.py
@@ -16,7 +16,7 @@
 from tests import util as testutil
 
 
-def test_copy():
+def test_copy() -> None:
     @jace.jit
     def testee(A: np.ndarray) -> jax.Array:
         return jnp.copy(A)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_iota.py b/tests/integration_tests/primitive_translators/test_primitive_iota.py
index 7ae4cfa..0e27734 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_iota.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_iota.py
@@ -14,7 +14,7 @@
 import jace
 
 
-def test_iota_arange():
+def test_iota_arange() -> None:
     """Tests `jnp.arange` functionality."""
 
     def testee(A: int) -> jax.Array:
@@ -25,7 +25,7 @@ def testee(A: int) -> jax.Array:
     assert np.all(ref == res)
 
 
-def test_iota_broadcast():
+def test_iota_broadcast() -> None:
     """Test more iota using the `jax.lax.broadcasted_iota()` function."""
     shape = (2, 2, 2, 2)
 
diff --git a/tests/integration_tests/primitive_translators/test_primitive_reshape.py b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
index 7bd142b..209057c 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_reshape.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
@@ -47,7 +47,9 @@ def testee(A: np.ndarray) -> jax.Array:
 @pytest.fixture(
     params=["C", pytest.param("F", marks=pytest.mark.skip("Non C order is not supported"))]
 )
-def mem_order(request) -> str:
+def mem_order(
+    request,
+) -> str:
     """Gets the memory order that we want
 
     Currently 'F' is skipped because it is not implemented by the logic.
@@ -56,19 +58,25 @@ def mem_order(request) -> str:
 
 
 @pytest.fixture(params=[(216, 1, 1), (1, 216, 1), (1, 1, 216), (1, 6, 36), (36, 1, 6)])
-def new_shape(request):
+def new_shape(
+    request,
+) -> None:
     """New shapes for the `test_reshaping_same_rank()` test."""
     return request.param
 
 
 @pytest.fixture(params=[(12, 1), (1, 12), (1, 1, 12), (1, 2, 6)])
-def expanded_shape(request):
+def expanded_shape(
+    request,
+) -> None:
     """New shapes for the `test_reshaping_removing_rank()` test."""
     return request.param
 
 
 @pytest.fixture(params=[(216,), (6, 36), (36, 6), (216, 1)])
-def reduced_shape(request):
+def reduced_shape(
+    request,
+) -> None:
     """New shapes for the `test_reshaping_adding_rank()` test."""
     return request.param
 
diff --git a/tests/integration_tests/primitive_translators/test_primitive_select_n.py b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
index deda424..16ca0ee 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_select_n.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
@@ -24,13 +24,16 @@
     from collections.abc import Callable
 
 
-def _perform_test(testee: Callable, *args: Any):
+def _perform_test(
+    testee: Callable,
+    *args: Any,
+) -> None:
     res = testee(*args)
     ref = jace.jit(testee)(*args)
     assert np.all(res == ref)
 
 
-def test_select_n_where():
+def test_select_n_where() -> None:
     """Normal `np.where` test."""
 
     def testee(P: Any, T: Any, F: Any) -> Any:
@@ -43,7 +46,7 @@ def testee(P: Any, T: Any, F: Any) -> Any:
     _perform_test(testee, pred, tbranch, fbranch)
 
 
-def test_select_n_where_literal():
+def test_select_n_where_literal() -> None:
     """`np.where` where one of the input is a literal."""
 
     def testee1(P: Any, F: Any) -> Any:
@@ -65,7 +68,7 @@ def testee3(P: Any) -> Any:
     _perform_test(testee3, pred)
 
 
-def test_select_n_many_inputs():
+def test_select_n_many_inputs() -> None:
     """Tests the generalized way of using the primitive."""
 
     def testee(pred: np.ndarray, *cases: np.ndarray) -> jax.Array:
diff --git a/tests/integration_tests/primitive_translators/test_primitive_slicing.py b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
index dc5f8be..735cfed 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_slicing.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
@@ -19,12 +19,12 @@
 
 
 @pytest.fixture()
-def A_4x4():
+def A_4x4() -> np.ndarray:
     return testutil.mkarray((4, 4))
 
 
 @pytest.fixture()
-def A_4x4x4x4():
+def A_4x4x4x4() -> np.ndarray:
     return testutil.mkarray((4, 4, 4, 4))
 
 
@@ -36,12 +36,16 @@ def A_4x4x4x4():
         (3, 1, 3, 0),  # Will lead to readjustment of the start index.
     ]
 )
-def full_dynamic_start_idx(request):
+def full_dynamic_start_idx(
+    request,
+) -> None:
     """Start indexes for the slice window of `test_dynamic_slice_full_dynamic()`."""
     return request.param
 
 
-def test_slice_sub_view(A_4x4):
+def test_slice_sub_view(
+    A_4x4,
+) -> None:
     """Simple extraction of a subsize."""
 
     @jace.jit
@@ -55,7 +59,9 @@ def testee(A: np.ndarray) -> np.ndarray:
     assert np.all(ref == res)
 
 
-def test_slice_rslice(A_4x4):
+def test_slice_rslice(
+    A_4x4,
+) -> None:
     """Only slicing some rows."""
 
     @jace.jit
@@ -69,7 +75,9 @@ def testee(A: np.ndarray) -> np.ndarray:
     assert np.all(ref == res)
 
 
-def test_slice_cslice(A_4x4):
+def test_slice_cslice(
+    A_4x4,
+) -> None:
     """Slicing some columns."""
 
     @jace.jit
@@ -84,7 +92,9 @@ def testee(A: np.ndarray) -> np.ndarray:
     assert np.all(ref == res)
 
 
-def test_slice_singelton(A_4x4):
+def test_slice_singelton(
+    A_4x4,
+) -> None:
     """Only extracting a single value."""
 
     @jace.jit
@@ -99,7 +109,7 @@ def testee(A: np.ndarray) -> np.ndarray:
 
 
 @pytest.mark.skip(reason="Missing 'gather' translator.")
-def test_slice_strides_vec():
+def test_slice_strides_vec() -> None:
     """Using strides.
 
     Note:
@@ -122,7 +132,9 @@ def testee(A: np.ndarray) -> np.ndarray:
 
 
 @pytest.mark.skip(reason="Missing 'concatenate' translator.")
-def test_slice_strides(A_4x4):
+def test_slice_strides(
+    A_4x4,
+) -> None:
     """Using strides in a 2D matrix.
 
     See `test_slice_strides_vec()` why the test is skipped.
@@ -139,7 +151,9 @@ def testee(A: np.ndarray) -> np.ndarray:
     assert np.all(ref == res)
 
 
-def test_slice_too_big(A_4x4):
+def test_slice_too_big(
+    A_4x4,
+) -> None:
     """Tests what happens if we specify a size that is too big.
 
     Note:
@@ -157,7 +171,10 @@ def testee(A: np.ndarray) -> np.ndarray:
     assert np.all(ref == res)
 
 
-def test_dynamic_slice_full_dynamic(A_4x4x4x4, full_dynamic_start_idx):
+def test_dynamic_slice_full_dynamic(
+    A_4x4x4x4,
+    full_dynamic_start_idx,
+) -> None:
     """Dynamic slicing where all start index are input parameters."""
 
     def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> jax.Array:
@@ -169,7 +186,9 @@ def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> jax.Array:
     assert np.all(ref == res)
 
 
-def test_dynamic_slice_partially_dynamic(A_4x4x4x4):
+def test_dynamic_slice_partially_dynamic(
+    A_4x4x4x4,
+) -> None:
     """Dynamic slicing where some start index are input parameters and others are literals."""
 
     def testee(A: np.ndarray, s1: int, s2: int) -> jax.Array:
@@ -181,7 +200,9 @@ def testee(A: np.ndarray, s1: int, s2: int) -> jax.Array:
     assert np.all(ref == res)
 
 
-def test_dynamic_slice_full_literal(A_4x4x4x4):
+def test_dynamic_slice_full_literal(
+    A_4x4x4x4,
+) -> None:
     """Dynamic slicing where all start indexes are literals."""
 
     def testee(A: np.ndarray) -> jax.Array:
diff --git a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
index bf9e89f..a37557d 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
@@ -59,7 +59,9 @@ def _roundtrip_implementation(
 
 
 @pytest.fixture(params=[0, -1, 1])
-def simple_axis(request) -> int:
+def simple_axis(
+    request,
+) -> int:
     return request.param
 
 
@@ -71,13 +73,19 @@ def simple_axis(request) -> int:
         (3, 2, 1),
     ]
 )
-def hard_axis(request) -> Sequence[int] | int:
+def hard_axis(
+    request,
+) -> Sequence[int] | int:
     return request.param
 
 
-def test_expand_squeeze_rountrip_simple(simple_axis):
+def test_expand_squeeze_rountrip_simple(
+    simple_axis,
+) -> None:
     _roundtrip_implementation((10,), simple_axis)
 
 
-def test_expand_squeeze_rountrip_big(hard_axis):
+def test_expand_squeeze_rountrip_big(
+    hard_axis,
+) -> None:
     _roundtrip_implementation((2, 3, 4, 5), hard_axis)
diff --git a/tests/integration_tests/test_empty_jaxpr.py b/tests/integration_tests/test_empty_jaxpr.py
index e4dbc09..b2e2207 100644
--- a/tests/integration_tests/test_empty_jaxpr.py
+++ b/tests/integration_tests/test_empty_jaxpr.py
@@ -20,7 +20,7 @@
 import jace
 
 
-def test_empty_array():
+def test_empty_array() -> None:
     @jace.jit
     def wrapped(A: np.ndarray) -> np.ndarray:
         return A
@@ -32,7 +32,7 @@ def wrapped(A: np.ndarray) -> np.ndarray:
     assert res.__array_interface__["data"][0] != A.__array_interface__["data"][0]
 
 
-def test_empty_multiple():
+def test_empty_multiple() -> None:
     @jace.jit
     def wrapped(A: np.ndarray, B: np.float64) -> tuple[np.ndarray, np.float64]:
         return A, B
@@ -46,7 +46,7 @@ def wrapped(A: np.ndarray, B: np.float64) -> tuple[np.ndarray, np.float64]:
     assert res[0].__array_interface__["data"][0] != A.__array_interface__["data"][0]
 
 
-def test_empty_unused():
+def test_empty_unused() -> None:
     @jace.jit
     def wrapped(A: np.ndarray, B: np.float64) -> np.ndarray:  # noqa: ARG001  # Explicitly unused.
         return A
@@ -64,7 +64,7 @@ def wrapped(A: np.ndarray, B: np.float64) -> np.ndarray:  # noqa: ARG001  # Expl
     assert res.__array_interface__["data"][0] != A.__array_interface__["data"][0]
 
 
-def test_empty_scalar():
+def test_empty_scalar() -> None:
     @jace.jit
     def wrapped(A: float) -> float:
         return A
@@ -75,7 +75,7 @@ def wrapped(A: float) -> float:
 
 
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
-def test_empty_nested():
+def test_empty_nested() -> None:
     @jace.jit
     def wrapped(A: float) -> float:
         return jax.jit(lambda A: A)(A)
@@ -85,7 +85,7 @@ def wrapped(A: float) -> float:
     assert np.all(wrapped(A) == A)
 
 
-def test_empty_with_drop_vars():
+def test_empty_with_drop_vars() -> None:
     """Tests if we can handle an empty input = output case, with present drop variables."""
 
     @jace.jit
@@ -99,7 +99,7 @@ def wrapped(A: float) -> float:
 
 
 @pytest.mark.skip(reason="Literal return value is not implemented.")
-def test_empty_literal_return():
+def test_empty_literal_return() -> None:
     """Tests if we can handle a literal return value.
 
     Note:
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index e138a37..9222f52 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -40,7 +40,7 @@
 
 
 @pytest.fixture()
-def translation_builder():
+def translation_builder() -> translator.JaxprTranslationBuilder:
     """Returns an allocated builder instance."""
     name = "fixture_builder"
     builder = translator.JaxprTranslationBuilder(
@@ -188,7 +188,9 @@ def test_builder_variable_alloc_auto_naming_wrapped(
             ), f"Automated naming failed, expected '{exp_name}' but got '{sdfg_name}'."
 
 
-def test_builder_nested(translation_builder: translator.JaxprTranslationBuilder) -> None:
+def test_builder_nested(
+    translation_builder: translator.JaxprTranslationBuilder,
+) -> None:
     """Tests the ability of the nesting of the builder."""
 
     # Now add a variable to the current subtext.
@@ -261,7 +263,9 @@ def test_builder_nested(translation_builder: translator.JaxprTranslationBuilder)
     assert name_3 == translation_builder.map_jax_var_to_sdfg(array3)
 
 
-def test_builder_append_state(translation_builder: translator.JaxprTranslationBuilder) -> None:
+def test_builder_append_state(
+    translation_builder: translator.JaxprTranslationBuilder,
+) -> None:
     """Tests the functionality of appending states."""
     sdfg: dace.SDFG = translation_builder.sdfg
 
diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index 68b27a6..22021c9 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -10,7 +10,7 @@
 from __future__ import annotations
 
 import re
-from typing import Any
+from typing import TYPE_CHECKING, Any
 
 import numpy as np
 import pytest
@@ -25,8 +25,12 @@
 )
 
 
+if TYPE_CHECKING:
+    from collections.abc import Mapping
+
+
 @pytest.fixture(autouse=True)
-def _conserve_builtin_translators():
+def _conserve_builtin_translators() -> None:
     """Restores the set of registered subtranslators after a test."""
     initial_translators = get_registered_primitive_translators()
     yield
@@ -34,7 +38,7 @@ def _conserve_builtin_translators():
 
 
 @pytest.fixture()
-def no_builtin_translators():  # noqa: PT004  # This is how you should do it: https://docs.pytest.org/en/7.1.x/how-to/fixtures.html#use-fixtures-in-classes-and-modules-with-usefixtures
+def no_builtin_translators() -> None:  # noqa: PT004  # This is how you should do it: https://docs.pytest.org/en/7.1.x/how-to/fixtures.html#use-fixtures-in-classes-and-modules-with-usefixtures
     """This fixture can be used if the test does not want any builtin translators."""
     initial_translators = translator.set_active_primitive_translators_to({})
     yield
@@ -70,14 +74,14 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
     raise NotImplementedError
 
 
-def test_are_subtranslators_imported():
+def test_are_subtranslators_imported() -> None:
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
     assert len(get_registered_primitive_translators()) == 60
 
 
 @pytest.mark.usefixtures("no_builtin_translators")
-def test_subtranslatior_managing():
+def test_subtranslatior_managing() -> None:
     """Basic functionality of the subtranslators."""
     original_active_subtrans = get_registered_primitive_translators()
     assert len(original_active_subtrans) == 0
@@ -100,7 +104,7 @@ def test_subtranslatior_managing():
     assert len(active_subtrans) == 3
 
 
-def test_subtranslatior_managing_isolation():
+def test_subtranslatior_managing_isolation() -> None:
     """Tests if `get_registered_primitive_translators()` protects the internal registry."""
     assert (
         get_registered_primitive_translators()
@@ -117,11 +121,14 @@ def test_subtranslatior_managing_isolation():
     assert get_registered_primitive_translators()["add"] is org_add_prim
 
 
-def test_subtranslatior_managing_swap():
+def test_subtranslatior_managing_swap() -> None:
     """Tests the `set_active_primitive_translators_to()` functionality."""
 
     # Allows to compare the structure of dicts.
-    def same_structure(d1: dict, d2: dict) -> bool:
+    def same_structure(
+        d1: Mapping,
+        d2: Mapping,
+    ) -> bool:
         return d1.keys() == d2.keys() and all(id(d2[k]) == id(d1[k]) for k in d1)
 
     initial_primitives = get_registered_primitive_translators()
@@ -144,7 +151,7 @@ def same_structure(d1: dict, d2: dict) -> bool:
 
 
 @pytest.mark.usefixtures("no_builtin_translators")
-def test_subtranslatior_managing_callable_annotation():
+def test_subtranslatior_managing_callable_annotation() -> None:
     """Test if `make_primitive_translator()` works."""
 
     prim_name = "non_existing_property"
@@ -158,7 +165,7 @@ def non_existing_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
     assert len(get_registered_primitive_translators()) == 0
 
 
-def test_subtranslatior_managing_overwriting():
+def test_subtranslatior_managing_overwriting() -> None:
     """Tests if we are able to overwrite something."""
     current_add_translator = get_registered_primitive_translators()["add"]
 
@@ -184,7 +191,7 @@ def useless_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
 
 
 @pytest.mark.usefixtures("no_builtin_translators")
-def test_subtranslatior_managing_overwriting_2():
+def test_subtranslatior_managing_overwriting_2() -> None:
     """Again an overwriting test, but this time a bit more complicated."""
 
     trans_cnt = [0]
@@ -206,7 +213,7 @@ def foo(A: int) -> int:
     assert trans_cnt[0] == 4
 
 
-def test_subtranslatior_managing_decoupling():
+def test_subtranslatior_managing_decoupling() -> None:
     """Shows that we have proper decoupling.
 
     I.e. changes to the global state, does not affect already annotated functions.
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index f593ae4..e615ee3 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -70,7 +70,7 @@ def wrapped(A, B):
     assert lowering_cnt[0] == 1
 
 
-def test_caching_different_sizes():
+def test_caching_different_sizes() -> None:
     """The behaviour of the cache if different sizes where used."""
 
     # Counter for how many time it was lowered.
@@ -193,7 +193,7 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     assert optiCompiled._csdfg.sdfg.number_of_nodes() < unoptiCompiled._csdfg.sdfg.number_of_nodes()
 
 
-def test_caching_dtype():
+def test_caching_dtype() -> None:
     """Tests if the data type is properly included in the test."""
 
     lowering_cnt = [0]
@@ -219,7 +219,7 @@ def testee(A: np.ndarray) -> np.ndarray:
         assert lowering_cnt[0] == i + 1
 
 
-def test_caching_eviction_simple():
+def test_caching_eviction_simple() -> None:
     """Simple tests for cache eviction."""
 
     @jace.jit
diff --git a/tests/unit_tests/test_decorator.py b/tests/unit_tests/test_decorator.py
index 0cffc34..ca6a0de 100644
--- a/tests/unit_tests/test_decorator.py
+++ b/tests/unit_tests/test_decorator.py
@@ -19,7 +19,7 @@
 from tests import util as testutil
 
 
-def test_decorator_individually():
+def test_decorator_individually() -> None:
     """Tests the compilation steps individually."""
 
     def testee_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
@@ -45,7 +45,7 @@ def testee(A, B):
     assert lowering_cnt[0] == 1
 
 
-def test_decorator_one_go():
+def test_decorator_one_go() -> None:
     """Tests the compilation steps in one go."""
 
     def testee_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
@@ -68,7 +68,7 @@ def testee(A, B):
     assert lowering_cnt[0] == 1
 
 
-def test_decorator_wrapped():
+def test_decorator_wrapped() -> None:
     """Tests if some properties are set correctly."""
 
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
@@ -77,4 +77,3 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     wrapped = jace.jit(testee)
 
     assert wrapped.wrapped_fun is testee
-    assert wrapped.__wrapped__ is testee
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index cacc6f8..a10aef3 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -21,7 +21,7 @@
 from tests import util as testutil
 
 
-def test_jit():
+def test_jit() -> None:
     """Simple add function."""
 
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
@@ -39,7 +39,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
 
 
-def test_composition_itself():
+def test_composition_itself() -> None:
     """Tests if JaCe is composable with itself."""
 
     # Pure Python functions
@@ -77,7 +77,7 @@ def ddf(x):
 
 
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
-def test_composition_with_jax():
+def test_composition_with_jax() -> None:
     """Tests if JaCe can interact with Jax and vice versa."""
 
     def base_fun(A, B, C):
@@ -96,7 +96,7 @@ def jax_fun(A, B, C):
 
 
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
-def test_composition_with_jax_2():
+def test_composition_with_jax_2() -> None:
     """Second test if JaCe can interact with Jax and vice versa."""
 
     @jax.jit
@@ -125,7 +125,7 @@ def f3_jace(A, B, C, D):
     assert np.allclose(ref, res_jace), "JaCe Failed."
 
 
-def test_grad_annotation_direct():
+def test_grad_annotation_direct() -> None:
     """Test if `jace.grad` works directly."""
 
     def f(x):
@@ -149,7 +149,7 @@ def jace_ddf(x):
         assert np.allclose(res, ref)
 
 
-def test_grad_control_flow():
+def test_grad_control_flow() -> None:
     """Tests if `grad` and controlflow works.
 
     This requirement is mentioned in `https://jax.readthedocs.io/en/latest/notebooks/Common_Gotchas_in_JAX.html#python-control-flow-autodiff`.
diff --git a/tests/unit_tests/test_misc.py b/tests/unit_tests/test_misc.py
index 6c30783..d595498 100644
--- a/tests/unit_tests/test_misc.py
+++ b/tests/unit_tests/test_misc.py
@@ -18,7 +18,7 @@
 
 
 @pytest.mark.skip("Possible bug in DaCe.")
-def test_mismatch_in_datatyte_calling():
+def test_mismatch_in_datatyte_calling() -> None:
     """Tests compilation and calling with different types.
 
     Note that this more or less a test for the calling implementation of the `CompiledSDFG`
diff --git a/tests/unit_tests/test_package.py b/tests/unit_tests/test_package.py
index 5237aeb..4d63fcc 100644
--- a/tests/unit_tests/test_package.py
+++ b/tests/unit_tests/test_package.py
@@ -15,5 +15,5 @@
 
 
 @pytest.mark.skip(reason="This does not work yet.")
-def test_version():
+def test_version() -> None:
     assert importlib.metadata.version("jace") == m.__version__

From 1c3d3a633cacac23ac929396bf24e44cdb6bb791 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 6 Jun 2024 09:07:45 +0200
Subject: [PATCH 315/458] Updated the ALT tests.

---
 ...primitive_arithmetic_logical_operations.py | 244 +++++++++---------
 1 file changed, 115 insertions(+), 129 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index f2bf813..c50ff65 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -5,12 +5,20 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements tests for the ALU and the `MappedOperationTranslatorBase` translator.
+"""Tests for `MappedOperationTranslatorBase` class and arithmetic & logical operations.
 
-The function mostly tests the `MappedOperationTranslatorBase` class by performing additions.
+The `MappedOperationTranslatorBase` can not be tested on its own, since it does
+not generate a Tasklet. For that reason it is thoroughly tested together with
+the arithmetic and logical translators (ALT).
 
-Todo:
-    - Add all supported primitives, to see if the template is valid.
+Thus the first tests tests the behaviour of the `MappedOperationTranslatorBase`
+class such as
+- broadcasting,
+- literal substitution,
+- scalar vs array computation.
+
+Followed by tests that are specific to the ALTs, which mostly focuses
+on the validity of the template of the ALT.
 """
 
 from __future__ import annotations
@@ -34,7 +42,7 @@
 
 
 @pytest.fixture(autouse=True)
-def _only_alu_translators() -> None:
+def _only_alt_translators() -> None:
     """Removes all non arithmetic/logical translator from the registry.
 
     This ensures that Jax is not doing some stuff that is supposed to be handled by the
@@ -96,8 +104,8 @@ def logical_ops(
 )
 def dtype(
     request,
-) -> np.generic:
-    """The dtypes that should be used for the full alu tests."""
+) -> type:
+    """Data types that should be used for the numerical tests of the ALT translators."""
     return request.param
 
 
@@ -123,7 +131,7 @@ def dtype(
         lambda x: jnp.atanh(jnp.tanh(x)),
     ]
 )
-def alu_unary_ops(
+def alt_unary_ops(
     request,
     dtype: type,
 ) -> tuple[Callable, np.ndarray]:
@@ -142,10 +150,10 @@ def alu_unary_ops(
         jnp.nextafter,
     ]
 )
-def alu_binary_ops_float(
+def alt_binary_ops_float(
     request,
 ) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
-    """All binary operations that can handle floats, complex values are not tested."""
+    """Binary ALT operations that operates on floats."""
     # Getting 0 in the division test is unlikely.
     return (  # type: ignore[return-value]  # Type confusion.
         request.param,
@@ -163,17 +171,31 @@ def alu_binary_ops_float(
         lambda x, y: x > y,
     ]
 )
-def alu_binary_compare_ops(
+def alt_binary_compare_ops(
     request,
 ) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
-    """These are the comparison operations, that we test with integers, since it is simpler."""
+    """Comparison operations, operates on integers."""
     return (
         request.param,
         tuple(np.abs(testutil.mkarray((20, 20), np.int32)) % 30 for _ in range(2)),
     )
 
 
-def _perform_alu_test(
+@pytest.fixture(
+    params=[
+        [(100, 1), (100, 10)],
+        [(100, 1, 3), (100, 1, 1)],
+        [(5, 1, 3, 4, 1, 5), (5, 1, 3, 1, 2, 5)],
+    ]
+)
+def broadcast_input(
+    request,
+) -> tuple[np.ndarray, np.ndarray]:
+    """Inputs to be used for the broadcast test."""
+    return tuple(testutil.mkarray(shape) for shape in request.param)  # type: ignore[return-value] # can not deduce that it is only size 2.
+
+
+def _perform_alt_test(
     testee: Callable,
     *args: Any,
 ) -> None:
@@ -194,70 +216,40 @@ def _perform_alu_test(
     assert np.allclose(ref, res), f"Expected '{ref.tolist()}' got '{res.tolist()}'"
 
 
-def test_alu_unary_scalar() -> None:
-    """Test unary ALU translator in the scalar case."""
+# <------------ Tests for `MappedOperationTranslatorBase`
+
 
+def test_mapped_unary_scalar() -> None:
     def testee(A: np.float64) -> np.float64 | jax.Array:
         return jnp.cos(A)
 
-    _perform_alu_test(testee, np.float64(1.0))
+    _perform_alt_test(testee, np.float64(1.0))
 
 
-def test_alu_unary_array() -> None:
-    """Test unary ALU translator with array argument."""
-
+def test_mapped_unary_array() -> None:
     def testee(A: np.ndarray) -> jax.Array:
         return jnp.sin(A)
 
     A = testutil.mkarray((100, 10, 3))
 
-    _perform_alu_test(testee, A)
-
+    _perform_alt_test(testee, A)
 
-def test_alu_unary_scalar_literal() -> None:
-    """Test unary ALU translator with literal argument"""
 
+def test_mapped_unary_scalar_literal() -> None:
     def testee(A: float) -> float | jax.Array:
         return jnp.sin(1.98) + A
 
-    _perform_alu_test(testee, 10.0)
-
-
-def test_alu_unary_integer_power() -> None:
-    """Tests the integer power, which has a parameter."""
-
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A**3
-
-    A = testutil.mkarray((10, 2, 3))
-    _perform_alu_test(testee, A)
-
-
-def test_alu_binary_power(
-    dtype: type,
-):
-    """Tests the "normal" power operator, i.e. not with a known integer power."""
-
-    def testee(A: np.ndarray, exp: np.generic) -> np.ndarray:
-        return A**exp
+    _perform_alt_test(testee, 10.0)
 
-    exp = dtype(3)
-    A = testutil.mkarray((10, 2, 3), dtype=dtype)
-    _perform_alu_test(testee, A, exp)
-
-
-def test_alu_binary_scalar() -> None:
-    """Scalar binary operation."""
 
+def test_mapped_binary_scalar() -> None:
     def testee(A: np.float64, B: np.float64) -> np.float64:
         return A * B
 
-    _perform_alu_test(testee, np.float64(1.0), np.float64(2.0))
-
+    _perform_alt_test(testee, np.float64(1.0), np.float64(2.0))
 
-def test_alu_binary_scalar_literal() -> None:
-    """Scalar binary operation, with a literal."""
 
+def test_mapped_binary_scalar_partial_literal() -> None:
     def testeeR(A: np.float64) -> np.float64:
         return A * 2.03
 
@@ -265,11 +257,11 @@ def testeeL(A: np.float64) -> np.float64:
         return 2.03 * A
 
     A = np.float64(7.0)
-    _perform_alu_test(testeeR, A)
-    _perform_alu_test(testeeL, A)
+    _perform_alt_test(testeeR, A)
+    _perform_alt_test(testeeL, A)
 
 
-def test_alu_binary_array() -> None:
+def test_mapped_binary_array() -> None:
     """Test binary of arrays, with same size."""
 
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
@@ -277,24 +269,20 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 
     A = testutil.mkarray((100, 10, 3))
     B = testutil.mkarray((100, 10, 3))
-    _perform_alu_test(testee, A, B)
+    _perform_alt_test(testee, A, B)
 
 
-def test_alu_binary_array_scalar() -> None:
-    """Test binary of array with scalar."""
-
+def test_mapped_binary_array_scalar() -> None:
     def testee(A: np.ndarray | np.float64, B: np.float64 | np.ndarray) -> np.ndarray:
         return A + B  # type: ignore[return-value]  # It is always an array.
 
     A = testutil.mkarray((100, 22))
     B = np.float64(1.34)
-    _perform_alu_test(testee, A, B)
-    _perform_alu_test(testee, B, A)
-
+    _perform_alt_test(testee, A, B)
+    _perform_alt_test(testee, B, A)
 
-def test_alu_binary_array_literal() -> None:
-    """Test binary of array with literal"""
 
+def test_mapped_binary_array_partial_literal() -> None:
     def testeeR(A: np.ndarray) -> np.ndarray:
         return A + 1.52
 
@@ -302,73 +290,67 @@ def testeeL(A: np.ndarray) -> np.ndarray:
         return 1.52 + A
 
     A = testutil.mkarray((100, 22))
-    _perform_alu_test(testeeR, A)
-    _perform_alu_test(testeeL, A)
+    _perform_alt_test(testeeR, A)
+    _perform_alt_test(testeeL, A)
 
 
-def test_alu_binary_array_constants() -> None:
-    """Test binary of array with constant."""
-
+def test_mapped_binary_array_constants() -> None:
     def testee(A: np.ndarray) -> np.ndarray:
         return A + jnp.array([[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]])
 
     A = testutil.mkarray((3, 3))
-    _perform_alu_test(testee, A)
-
+    _perform_alt_test(testee, A)
 
-def test_alu_binary_broadcast_1() -> None:
-    """Test broadcasting."""
 
+def test_mapped_broadcast(
+    broadcast_input: tuple[np.ndarray, np.ndarray],
+) -> None:
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
-    A = testutil.mkarray((100, 1, 3))
-    B = testutil.mkarray((100, 1, 1))
-    _perform_alu_test(testee, A, B)
-    _perform_alu_test(testee, B, A)
+    A = broadcast_input[0]
+    B = broadcast_input[1]
+    _perform_alt_test(testee, A, B)
+    _perform_alt_test(testee, B, A)
 
 
-def test_alu_binary_broadcast_2() -> None:
-    """Test broadcasting."""
+# <------------ Tests for ALT
 
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A + B
 
-    A = testutil.mkarray((100, 1))
-    B = testutil.mkarray((100, 10))
-    _perform_alu_test(testee, A, B)
-    _perform_alu_test(testee, B, A)
+def test_alt_general_unary(
+    alt_unary_ops: tuple[Callable, np.ndarray],
+) -> None:
+    """General test for the unary operations."""
 
+    def testee(A: np.ndarray) -> np.ndarray:
+        return alt_unary_ops[0](A)
 
-def test_alu_binary_broadcast_3() -> None:
-    """Test broadcasting."""
+    _perform_alt_test(testee, alt_unary_ops[1])
 
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A + B
 
-    A = testutil.mkarray((5, 1, 3, 4, 1, 5))
-    B = testutil.mkarray((5, 1, 3, 1, 2, 5))
-    _perform_alu_test(testee, A, B)
-    _perform_alu_test(testee, B, A)
+def test_alt_general_binary_float(
+    alt_binary_ops_float: tuple[Callable, tuple[np.ndarray, np.ndarray]],
+) -> None:
+    """Tests the binary operations that runs on floating points."""
 
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return alt_binary_ops_float[0](A, B)
 
-def test_alu_unary_isfinite() -> None:
-    def testee(A: np.ndarray) -> jax.Array:
-        return jnp.isfinite(A)
+    _perform_alt_test(testee, *alt_binary_ops_float[1])
 
-    A = np.array([np.inf, +np.inf, -np.inf, np.nan, -np.nan, 1.0])
 
-    args = dace.Config.get("compiler", "cpu", "args")
-    try:
-        new_args = args.replace("-ffast-math", "-fno-finite-math-only")
-        dace.Config.set("compiler", "cpu", "args", value=new_args)
-        _perform_alu_test(testee, A)
+def test_alt_compare_ops(
+    alt_binary_compare_ops: tuple[Callable, tuple[np.ndarray, np.ndarray]],
+) -> None:
+    """Test all the comparison operations."""
 
-    finally:
-        dace.Config.set("compiler", "cpu", "args", value=args)
+    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return alt_binary_compare_ops[0](A, B)
 
+    _perform_alt_test(testee, *alt_binary_compare_ops[1])
 
-def test_alu_logical_bitwise_operation(
+
+def test_alt_logical_bitwise_operation(
     logical_ops: tuple[Callable, tuple[np.ndarray, ...]],
 ) -> None:
     """Tests if the logical and bitwise operations works as they do in Jax."""
@@ -377,37 +359,41 @@ def test_alu_logical_bitwise_operation(
     def testee(*args: np.ndarray) -> np.ndarray:
         return logical_ops[0](*args)
 
-    _perform_alu_test(testee, *inputs)
+    _perform_alt_test(testee, *inputs)
 
 
-def test_alu_general_unary(
-    alu_unary_ops: tuple[Callable, np.ndarray],
-) -> None:
-    """General test for the unary operations."""
+def test_alt_unary_isfinite() -> None:
+    def testee(A: np.ndarray) -> jax.Array:
+        return jnp.isfinite(A)
 
-    def testee(A: np.ndarray) -> np.ndarray:
-        return alu_unary_ops[0](A)
+    A = np.array([np.inf, +np.inf, -np.inf, np.nan, -np.nan, 1.0])
 
-    _perform_alu_test(testee, alu_unary_ops[1])
+    args = dace.Config.get("compiler", "cpu", "args")
+    try:
+        new_args = args.replace("-ffast-math", "-fno-finite-math-only")
+        dace.Config.set("compiler", "cpu", "args", value=new_args)
+        _perform_alt_test(testee, A)
 
+    finally:
+        dace.Config.set("compiler", "cpu", "args", value=args)
 
-def test_alu_general_binary_float(
-    alu_binary_ops_float: tuple[Callable, tuple[np.ndarray, np.ndarray]],
-) -> None:
-    """Tests the binary operations that runs on floating points."""
 
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return alu_binary_ops_float[0](A, B)
+def test_alt_unary_integer_power() -> None:
+    def testee(A: np.ndarray) -> np.ndarray:
+        return A**3
 
-    _perform_alu_test(testee, *alu_binary_ops_float[1])
+    A = testutil.mkarray((10, 2, 3))
+    _perform_alt_test(testee, A)
 
 
-def test_alu_compare_ops(
-    alu_binary_compare_ops: tuple[Callable, tuple[np.ndarray, np.ndarray]],
-) -> None:
-    """Test all the comparison operations."""
+def test_alt_binary_power(
+    dtype: type,
+):
+    """Tests the "normal" power operator, i.e. not with a known integer power."""
 
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return alu_binary_compare_ops[0](A, B)
+    def testee(A: np.ndarray, exp: np.generic) -> np.ndarray:
+        return A**exp
 
-    _perform_alu_test(testee, *alu_binary_compare_ops[1])
+    exp = dtype(3)
+    A = testutil.mkarray((10, 2, 3), dtype=dtype)
+    _perform_alt_test(testee, A, exp)

From 7990569960aa2df7d6b92819c1a780c533482237 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 6 Jun 2024 13:54:39 +0200
Subject: [PATCH 316/458] Updated the ALT tests.

---
 ...primitive_arithmetic_logical_operations.py | 78 +++++++------------
 1 file changed, 30 insertions(+), 48 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index c50ff65..0854dea 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -23,7 +23,6 @@ class such as
 
 from __future__ import annotations
 
-from collections.abc import Callable
 from typing import TYPE_CHECKING, Any
 
 import dace
@@ -38,11 +37,11 @@ class such as
 
 
 if TYPE_CHECKING:
-    from collections.abc import Callable
+    from collections.abc import Callable, Generator
 
 
 @pytest.fixture(autouse=True)
-def _only_alt_translators() -> None:
+def _only_alt_translators() -> Generator[None, None, None]:
     """Removes all non arithmetic/logical translator from the registry.
 
     This ensures that Jax is not doing some stuff that is supposed to be handled by the
@@ -111,17 +110,15 @@ def dtype(
 
 @pytest.fixture(
     params=[
-        lambda x: +(x - 1.0),
+        lambda x: +(x - 0.5),
         lambda x: -x,
         jnp.floor,
         jnp.ceil,
         jnp.round,
         jnp.exp2,
-        jnp.exp,
-        lambda x: jnp.abs(x - 0.5),
-        lambda x: jnp.log(x + 1.0),
-        lambda x: jnp.sqrt(x**2),
-        # The following have a restricted input domain, so we use `x = f^{-1}(f(x))`.
+        lambda x: jnp.abs(-x),
+        lambda x: jnp.sqrt(x**2),  # includes integer power.
+        lambda x: jnp.log(jnp.exp(x)),
         lambda x: jnp.log1p(jnp.expm1(x)),
         lambda x: jnp.asin(jnp.sin(x)),
         lambda x: jnp.acos(jnp.cos(x)),
@@ -135,7 +132,11 @@ def alt_unary_ops(
     request,
     dtype: type,
 ) -> tuple[Callable, np.ndarray]:
-    """The inputs and the operation we need for the full test."""
+    """The inputs and the operation we need for the full test.
+
+    Some of the unary operations are combined to ensure that they will succeed.
+    An example is `asin()` which only takes values in the range `[-1, 1]`.
+    """
     return (request.param, testutil.mkarray((2, 2), dtype))
 
 
@@ -148,6 +149,7 @@ def alt_unary_ops(
         jnp.maximum,
         jnp.atan2,
         jnp.nextafter,
+        lambda x, y: x**y,
     ]
 )
 def alt_binary_ops_float(
@@ -314,36 +316,46 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     _perform_alt_test(testee, B, A)
 
 
-# <------------ Tests for ALT
+# <------------ Tests for arithmetic and logical translators/operations
 
 
 def test_alt_general_unary(
     alt_unary_ops: tuple[Callable, np.ndarray],
 ) -> None:
-    """General test for the unary operations."""
-
     def testee(A: np.ndarray) -> np.ndarray:
         return alt_unary_ops[0](A)
 
     _perform_alt_test(testee, alt_unary_ops[1])
 
 
+def test_alt_unary_isfinite() -> None:
+    def testee(A: np.ndarray) -> jax.Array:
+        return jnp.isfinite(A)
+
+    A = np.array([np.inf, +np.inf, -np.inf, np.nan, -np.nan, 1.0])
+
+    args = dace.Config.get("compiler", "cpu", "args")
+    try:
+        new_args = args.replace("-ffast-math", "-fno-finite-math-only")
+        dace.Config.set("compiler", "cpu", "args", value=new_args)
+        _perform_alt_test(testee, A)
+
+    finally:
+        dace.Config.set("compiler", "cpu", "args", value=args)
+
+
 def test_alt_general_binary_float(
     alt_binary_ops_float: tuple[Callable, tuple[np.ndarray, np.ndarray]],
 ) -> None:
-    """Tests the binary operations that runs on floating points."""
-
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return alt_binary_ops_float[0](A, B)
 
     _perform_alt_test(testee, *alt_binary_ops_float[1])
 
 
-def test_alt_compare_ops(
+def test_alt_compare_operation(
     alt_binary_compare_ops: tuple[Callable, tuple[np.ndarray, np.ndarray]],
 ) -> None:
-    """Test all the comparison operations."""
-
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return alt_binary_compare_ops[0](A, B)
 
@@ -353,7 +365,6 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 def test_alt_logical_bitwise_operation(
     logical_ops: tuple[Callable, tuple[np.ndarray, ...]],
 ) -> None:
-    """Tests if the logical and bitwise operations works as they do in Jax."""
     inputs: tuple[np.ndarray, ...] = logical_ops[1]
 
     def testee(*args: np.ndarray) -> np.ndarray:
@@ -362,38 +373,9 @@ def testee(*args: np.ndarray) -> np.ndarray:
     _perform_alt_test(testee, *inputs)
 
 
-def test_alt_unary_isfinite() -> None:
-    def testee(A: np.ndarray) -> jax.Array:
-        return jnp.isfinite(A)
-
-    A = np.array([np.inf, +np.inf, -np.inf, np.nan, -np.nan, 1.0])
-
-    args = dace.Config.get("compiler", "cpu", "args")
-    try:
-        new_args = args.replace("-ffast-math", "-fno-finite-math-only")
-        dace.Config.set("compiler", "cpu", "args", value=new_args)
-        _perform_alt_test(testee, A)
-
-    finally:
-        dace.Config.set("compiler", "cpu", "args", value=args)
-
-
 def test_alt_unary_integer_power() -> None:
     def testee(A: np.ndarray) -> np.ndarray:
         return A**3
 
     A = testutil.mkarray((10, 2, 3))
     _perform_alt_test(testee, A)
-
-
-def test_alt_binary_power(
-    dtype: type,
-):
-    """Tests the "normal" power operator, i.e. not with a known integer power."""
-
-    def testee(A: np.ndarray, exp: np.generic) -> np.ndarray:
-        return A**exp
-
-    exp = dtype(3)
-    A = testutil.mkarray((10, 2, 3), dtype=dtype)
-    _perform_alt_test(testee, A, exp)

From 972c9c0f96f058822ca98bb5e34e81cce890dba9 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 08:10:23 +0200
Subject: [PATCH 317/458] Updated the tests a little bit.

They are still a mess.
---
 .../test_primitive_broadcast_in_dim.py        |  29 ++---
 .../test_primitive_convert_element_type.py    |  16 +--
 .../test_primitive_iota.py                    |   3 -
 .../test_primitive_reshape.py                 |  10 +-
 .../test_primitive_select_n.py                |  14 +--
 .../test_primitive_slicing.py                 |  59 ++++------
 .../test_primitive_squeeze_expand_dims.py     |  22 ++--
 tests/integration_tests/test_empty_jaxpr.py   |  49 ++++----
 .../test_jaxpr_translator_builder.py          | 106 ++++++++++--------
 .../test_primitive_translator_managing.py     |  78 +++++--------
 tests/unit_tests/test_caching.py              |  64 ++++++-----
 tests/unit_tests/test_jax_api.py              |   7 +-
 tests/unit_tests/test_misc.py                 |   9 +-
 13 files changed, 224 insertions(+), 242 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
index ae85c81..088e5d6 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
@@ -5,9 +5,10 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements tests for the broadcast in dim translator.
+"""Implements tests for the `broadcast_in_dim` primitive.
 
-Parts of the tests are also implemented inside `test_sub_translators_squeeze_expand_dims.py`.
+Parts of the tests are also implemented inside `test_sub_translators_squeeze_expand_dims.py`,
+because this primitive has a relation to `squeeze`.
 
 Todo:
     - `np.meshgrid`
@@ -47,19 +48,19 @@ def test_bid_scalar() -> None:
     def testee(A: float) -> jax.Array:
         return jnp.broadcast_to(A, (2, 2))
 
-    for a in [1, 1.0, 3.1415]:
-        ref = testee(a)
-        res = jace.jit(testee)(a)
+    A = 1.032
+    ref = testee(A)
+    res = jace.jit(testee)(A)
 
-        assert res.shape == ref.shape
-        assert res.dtype == ref.dtype
-        assert np.all(res == ref), f"Expected '{ref.tolist()}' got '{res.tolist()}'."
+    assert res.shape == ref.shape
+    assert res.dtype == ref.dtype
+    assert np.all(res == ref), f"Expected '{ref.tolist()}' got '{res.tolist()}'."
 
 
 def test_bid_literal() -> None:
     """Broadcast a literal to a matrix."""
 
-    def testee(a: float) -> np.ndarray | jax.Array:
+    def testee(a: float) -> jax.Array:
         return jnp.broadcast_to(1.0, (10, 10)) + a
 
     ref = testee(0.0)
@@ -74,12 +75,12 @@ def test_bid_vector(
 ) -> None:
     """Broadcast a vector to a tensor."""
 
-    def testee(a: np.ndarray) -> np.ndarray | jax.Array:
-        return jnp.broadcast_to(a, (10, 10)) + a
+    def testee(A: np.ndarray) -> jax.Array:
+        return jnp.broadcast_to(A, (10, 10))
 
-    a = testutil.mkarray(vector_shape)
-    ref = testee(a)
-    res = jace.jit(testee)(a)
+    A = testutil.mkarray(vector_shape)
+    ref = testee(A)
+    res = jace.jit(testee)(A)
     assert res.shape == ref.shape
     assert res.dtype == ref.dtype
     assert np.all(res == ref)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
index ef98e72..181b384 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
@@ -5,7 +5,11 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Tests the element type conversion functionality."""
+"""Tests the element type conversion functionality.
+
+Todo:
+    The tests should only run on certain occasion.
+"""
 
 from __future__ import annotations
 
@@ -47,8 +51,8 @@ def dst_type(
 ) -> type:
     """All valid destination types, with the exception of bool.
 
-    Includes also complex types, because going from real to complex is useful, but the other
-    way is not.
+    Includes also complex types, because going from real to complex is useful,
+    but the other way is not.
     """
     return request.param
 
@@ -56,7 +60,7 @@ def dst_type(
 def _convert_element_type_impl(
     input_type: type,
     output_type: type,
-) -> bool:
+) -> None:
     """Implementation of the tests of the convert element types primitive."""
     lowering_cnt = [0]
     A: np.ndarray = testutil.mkarray((10, 10), input_type)
@@ -65,7 +69,7 @@ def _convert_element_type_impl(
     @jace.jit
     def converter(A: np.ndarray) -> jax.Array:
         lowering_cnt[0] += 1
-        return jnp.array(A, copy=False, dtype=output_type)  # Loop variable.
+        return jnp.array(A, copy=False, dtype=output_type)
 
     res = converter(A)
     assert lowering_cnt[0] == 1
@@ -73,14 +77,12 @@ def converter(A: np.ndarray) -> jax.Array:
         res.dtype == output_type
     ), f"Expected '{output_type}', but got '{res.dtype}', input was '{input_type}'."
     assert np.allclose(ref, res)
-    return True
 
 
 def test_convert_element_type_main(
     src_type: type,
     dst_type: type,
 ) -> None:
-    """Tests all conversions with the exception of conversions from bool and complex."""
     _convert_element_type_impl(src_type, dst_type)
 
 
diff --git a/tests/integration_tests/primitive_translators/test_primitive_iota.py b/tests/integration_tests/primitive_translators/test_primitive_iota.py
index 0e27734..10ba671 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_iota.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_iota.py
@@ -15,8 +15,6 @@
 
 
 def test_iota_arange() -> None:
-    """Tests `jnp.arange` functionality."""
-
     def testee(A: int) -> jax.Array:
         return jnp.arange(18, dtype=int) + A
 
@@ -26,7 +24,6 @@ def testee(A: int) -> jax.Array:
 
 
 def test_iota_broadcast() -> None:
-    """Test more iota using the `jax.lax.broadcasted_iota()` function."""
     shape = (2, 2, 2, 2)
 
     for d in range(len(shape)):
diff --git a/tests/integration_tests/primitive_translators/test_primitive_reshape.py b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
index 209057c..a63b3f3 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_reshape.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
@@ -45,15 +45,15 @@ def testee(A: np.ndarray) -> jax.Array:
 
 
 @pytest.fixture(
-    params=["C", pytest.param("F", marks=pytest.mark.skip("Non C order is not supported"))]
+    params=[
+        "C",
+        pytest.param("F", marks=pytest.mark.skip("Non C order is not supported")),
+    ]
 )
 def mem_order(
     request,
 ) -> str:
-    """Gets the memory order that we want
-
-    Currently 'F' is skipped because it is not implemented by the logic.
-    """
+    """Gets the memory order that we want."""
     return request.param
 
 
diff --git a/tests/integration_tests/primitive_translators/test_primitive_select_n.py b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
index 16ca0ee..e9871bf 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_select_n.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
@@ -34,9 +34,7 @@ def _perform_test(
 
 
 def test_select_n_where() -> None:
-    """Normal `np.where` test."""
-
-    def testee(P: Any, T: Any, F: Any) -> Any:
+    def testee(P: np.ndarray, T: np.ndarray, F: np.ndarray) -> jax.Array:
         return jnp.where(P, T, F)
 
     shape = (10, 10)
@@ -47,21 +45,19 @@ def testee(P: Any, T: Any, F: Any) -> Any:
 
 
 def test_select_n_where_literal() -> None:
-    """`np.where` where one of the input is a literal."""
-
-    def testee1(P: Any, F: Any) -> Any:
+    def testee1(P: np.ndarray, F: np.ndarray) -> jax.Array:
         return jnp.where(P, 2, F)
 
-    def testee2(P: Any, T: Any) -> Any:
+    def testee2(P: np.ndarray, T: np.ndarray) -> jax.Array:
         return jnp.where(P, T, 3)
 
-    def testee3(P: Any) -> Any:
+    def testee3(P: np.ndarray) -> jax.Array:
         return jnp.where(P, 8, 9)
 
     shape = ()
     pred = testutil.mkarray(shape, np.bool_)
     tbranch = testutil.mkarray(shape, np.int_)
-    fbranch = testutil.mkarray(shape, np.int_)
+    fbranch = tbranch + 1
 
     _perform_test(testee1, pred, fbranch)
     _perform_test(testee2, pred, tbranch)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_slicing.py b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
index 735cfed..b0c5dd1 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_slicing.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
@@ -38,16 +38,14 @@ def A_4x4x4x4() -> np.ndarray:
 )
 def full_dynamic_start_idx(
     request,
-) -> None:
+) -> tuple[int, int, int, int]:
     """Start indexes for the slice window of `test_dynamic_slice_full_dynamic()`."""
     return request.param
 
 
 def test_slice_sub_view(
-    A_4x4,
+    A_4x4: np.ndarray,
 ) -> None:
-    """Simple extraction of a subsize."""
-
     @jace.jit
     def testee(A: np.ndarray) -> np.ndarray:
         return A[1:3, 1:3]
@@ -60,9 +58,9 @@ def testee(A: np.ndarray) -> np.ndarray:
 
 
 def test_slice_rslice(
-    A_4x4,
+    A_4x4: np.ndarray,
 ) -> None:
-    """Only slicing some rows."""
+    """Only extracting rows."""
 
     @jace.jit
     def testee(A: np.ndarray) -> np.ndarray:
@@ -76,7 +74,7 @@ def testee(A: np.ndarray) -> np.ndarray:
 
 
 def test_slice_cslice(
-    A_4x4,
+    A_4x4: np.ndarray,
 ) -> None:
     """Slicing some columns."""
 
@@ -93,7 +91,7 @@ def testee(A: np.ndarray) -> np.ndarray:
 
 
 def test_slice_singelton(
-    A_4x4,
+    A_4x4: np.ndarray,
 ) -> None:
     """Only extracting a single value."""
 
@@ -110,22 +108,18 @@ def testee(A: np.ndarray) -> np.ndarray:
 
 @pytest.mark.skip(reason="Missing 'gather' translator.")
 def test_slice_strides_vec() -> None:
-    """Using strides.
+    """Slice with strides.
 
-    Note:
-        Although we do not support the `strides` parameter of the `stride` primitive,
-        this is not the reason why the test fails.
-        It fails instead because Jax makes some strange gather stuff out of it.
+    Although the translator (and the primitive) would support a stride, for some
+    reason Jax makes a `gather` operation out of it, that is not yet supported.
     """
 
-    A = np.arange(16)
-
-    @jace.jit
     def testee(A: np.ndarray) -> np.ndarray:
         return A[1:15:2]
 
-    ref = A[1:15:2]
-    res = testee(A)
+    A = np.arange(16)
+    ref = testee(A)
+    res = jace.jit(testee)(A)
 
     assert ref.shape == res.shape
     assert np.all(ref == res)
@@ -133,7 +127,7 @@ def testee(A: np.ndarray) -> np.ndarray:
 
 @pytest.mark.skip(reason="Missing 'concatenate' translator.")
 def test_slice_strides(
-    A_4x4,
+    A_4x4: np.ndarray,
 ) -> None:
     """Using strides in a 2D matrix.
 
@@ -152,31 +146,24 @@ def testee(A: np.ndarray) -> np.ndarray:
 
 
 def test_slice_too_big(
-    A_4x4,
+    A_4x4: np.ndarray,
 ) -> None:
-    """Tests what happens if we specify a size that is too big.
+    """Tests what happens if we specify a size that is too big."""
 
-    Note:
-        It seems that the array is just returned as it is.
-    """
-
-    @jace.jit
     def testee(A: np.ndarray) -> np.ndarray:
         return A[:20]
 
-    res = testee(A_4x4)
-    ref = A_4x4[:20]
+    ref = testee(A_4x4)
+    res = jace.jit(testee)(A_4x4)
 
     assert ref.shape == res.shape
     assert np.all(ref == res)
 
 
 def test_dynamic_slice_full_dynamic(
-    A_4x4x4x4,
-    full_dynamic_start_idx,
+    A_4x4x4x4: np.ndarray,
+    full_dynamic_start_idx: tuple[int, int, int, int],
 ) -> None:
-    """Dynamic slicing where all start index are input parameters."""
-
     def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> jax.Array:
         return jax.lax.dynamic_slice(A, (s1, s2, s3, s4), (2, 2, 2, 2))
 
@@ -187,10 +174,8 @@ def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> jax.Array:
 
 
 def test_dynamic_slice_partially_dynamic(
-    A_4x4x4x4,
+    A_4x4x4x4: np.ndarray,
 ) -> None:
-    """Dynamic slicing where some start index are input parameters and others are literals."""
-
     def testee(A: np.ndarray, s1: int, s2: int) -> jax.Array:
         return jax.lax.dynamic_slice(A, (s1, 1, s2, 2), (2, 2, 2, 2))
 
@@ -201,10 +186,8 @@ def testee(A: np.ndarray, s1: int, s2: int) -> jax.Array:
 
 
 def test_dynamic_slice_full_literal(
-    A_4x4x4x4,
+    A_4x4x4x4: np.ndarray,
 ) -> None:
-    """Dynamic slicing where all start indexes are literals."""
-
     def testee(A: np.ndarray) -> jax.Array:
         return jax.lax.dynamic_slice(A, (0, 1, 0, 2), (2, 2, 2, 2))
 
diff --git a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
index a37557d..cc5f56e 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
@@ -5,11 +5,11 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements tests for the squeeze translator.
+"""Tests about the `squeeze` primitive.
 
-For several reasons parts of the tests related to broadcasting, especially the ones in which
-a single dimension is added, are also here. This is because of the inverse relationship between
-`expand_dims` and `squeeze`.
+For several reasons parts of the tests related to broadcasting, especially the
+ones in which a single dimension is added, are also here. This is because of
+the inverse relationship between `expand_dims` and `squeeze`.
 """
 
 from __future__ import annotations
@@ -59,7 +59,7 @@ def _roundtrip_implementation(
 
 
 @pytest.fixture(params=[0, -1, 1])
-def simple_axis(
+def single_axis(
     request,
 ) -> int:
     return request.param
@@ -73,19 +73,19 @@ def simple_axis(
         (3, 2, 1),
     ]
 )
-def hard_axis(
+def multiple_axis(
     request,
-) -> Sequence[int] | int:
+) -> tuple[int, ...] | int:
     return request.param
 
 
 def test_expand_squeeze_rountrip_simple(
-    simple_axis,
+    single_axis: int,
 ) -> None:
-    _roundtrip_implementation((10,), simple_axis)
+    _roundtrip_implementation((10,), single_axis)
 
 
 def test_expand_squeeze_rountrip_big(
-    hard_axis,
+    multiple_axis: Sequence[int],
 ) -> None:
-    _roundtrip_implementation((2, 3, 4, 5), hard_axis)
+    _roundtrip_implementation((2, 3, 4, 5), multiple_axis)
diff --git a/tests/integration_tests/test_empty_jaxpr.py b/tests/integration_tests/test_empty_jaxpr.py
index b2e2207..22a1be3 100644
--- a/tests/integration_tests/test_empty_jaxpr.py
+++ b/tests/integration_tests/test_empty_jaxpr.py
@@ -20,7 +20,7 @@
 import jace
 
 
-def test_empty_array() -> None:
+def test_empty_single_return() -> None:
     @jace.jit
     def wrapped(A: np.ndarray) -> np.ndarray:
         return A
@@ -32,7 +32,7 @@ def wrapped(A: np.ndarray) -> np.ndarray:
     assert res.__array_interface__["data"][0] != A.__array_interface__["data"][0]
 
 
-def test_empty_multiple() -> None:
+def test_empty_multiple_return() -> None:
     @jace.jit
     def wrapped(A: np.ndarray, B: np.float64) -> tuple[np.ndarray, np.float64]:
         return A, B
@@ -46,7 +46,9 @@ def wrapped(A: np.ndarray, B: np.float64) -> tuple[np.ndarray, np.float64]:
     assert res[0].__array_interface__["data"][0] != A.__array_interface__["data"][0]
 
 
-def test_empty_unused() -> None:
+def test_empty_unused_argument() -> None:
+    """Empty body and an unused input argument."""
+
     @jace.jit
     def wrapped(A: np.ndarray, B: np.float64) -> np.ndarray:  # noqa: ARG001  # Explicitly unused.
         return A
@@ -66,7 +68,7 @@ def wrapped(A: np.ndarray, B: np.float64) -> np.ndarray:  # noqa: ARG001  # Expl
 
 def test_empty_scalar() -> None:
     @jace.jit
-    def wrapped(A: float) -> float:
+    def wrapped(A: np.float64) -> np.float64:
         return A
 
     A = np.pi
@@ -77,7 +79,7 @@ def wrapped(A: float) -> float:
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_empty_nested() -> None:
     @jace.jit
-    def wrapped(A: float) -> float:
+    def wrapped(A: np.float64) -> np.float64:
         return jax.jit(lambda A: A)(A)
 
     A = np.pi
@@ -85,37 +87,32 @@ def wrapped(A: float) -> float:
     assert np.all(wrapped(A) == A)
 
 
-def test_empty_with_drop_vars() -> None:
-    """Tests if we can handle an empty input = output case, with present drop variables."""
+def test_empty_literal_return() -> None:
+    """An empty Jaxpr that only contains a literal return value."""
 
-    @jace.jit
-    @jace.grad
-    def wrapped(A: float) -> float:
-        return A * A
+    def testee() -> np.float64:
+        return np.float64(3.1415)
 
-    A = np.pi
+    ref = testee()
+    res = jace.jit(testee)()
 
-    assert np.all(wrapped(A) == 2.0 * A)
+    assert np.all(res == ref)
 
 
 @pytest.mark.skip(reason="Literal return value is not implemented.")
-def test_empty_literal_return() -> None:
-    """Tests if we can handle a literal return value.
-
-    Note:
-        Using this test function serves another purpose. Since Jax includes the original
-        computation in the Jaxpr coming from a `grad` annotated function, the result will have
-        only drop variables.
+def test_empty_with_drop_vars() -> None:
+    """Jaxpr only containing drop variables.
 
-    Todo:
-        Add a test if we really have a literal return value, but for that we need the Jaxpr.
+    Notes:
+        As a side effect the Jaxpr also has a literal return value.
     """
 
-    @jace.jit
     @jace.grad
-    def wrapped(A: float) -> float:
-        return A + A + A
+    def testee(a: np.float64, b: np.float64) -> np.float64:
+        return a + b
 
     A = np.e
+    ref = testee(A)
+    res = jace.jit(testee)(A)
 
-    assert np.all(wrapped(A) == 3.0)
+    assert np.all(ref == res)
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 9222f52..53bd65a 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -5,16 +5,22 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements some tests of the subtranslator builder."""
+"""Tests for the `JaxprTranslationBuilder` object.
+
+Although this is an integration test, the tests here manipulate the builder on
+a low and direct level.
+"""
 
 from __future__ import annotations
 
 import re
 
 import dace
+import jax
 import numpy as np
 import pytest
 from dace.data import Array
+from jax import numpy as jnp
 
 import jace
 from jace import translator, util
@@ -51,10 +57,7 @@ def translation_builder() -> translator.JaxprTranslationBuilder:
 
 
 def test_builder_alloc() -> None:
-    """Tests the state right after allocation.
-
-    Does not use the fixture because it does it on its own.
-    """
+    """Tests for correct allocation."""
     builder = translator.JaxprTranslationBuilder(
         primitive_translators=translator.get_registered_primitive_translators()
     )
@@ -80,7 +83,7 @@ def test_builder_alloc() -> None:
 def test_builder_variable_alloc_auto_naming(
     translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
-    """Tests simple variable allocation."""
+    """Tests if autonaming of variables works."""
     for i, var in enumerate([array1, array2, scal1, array3, scal2, scal3]):
         sdfg_name = translation_builder.add_array(var, update_var_mapping=True)
         sdfg_var = translation_builder.get_array(sdfg_name)
@@ -93,10 +96,9 @@ def test_builder_variable_alloc_auto_naming(
 def test_builder_variable_alloc_mixed_naming(
     translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
-    """Tests the naming in a mixed setting.
+    """Test automatic naming if there are variables with a given name.
 
-    If `update_var_mapping=True` is given, then the naming will skip variables,
-    see also `test_builder_variable_alloc_mixed_naming2()`.
+    See also `test_builder_variable_alloc_mixed_naming2()`.
     """
     #                        *       b       c       d      *      f      g
     for i, var in enumerate([narray, array1, array2, scal1, nscal, scal2, scal3]):
@@ -114,11 +116,7 @@ def test_builder_variable_alloc_mixed_naming(
 def test_builder_variable_alloc_mixed_naming2(
     translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
-    """Tests the naming in a mixed setting.
-
-    This time we do not use `update_var_mapping=True`, instead it now depends on the name. This
-    means that automatic naming will now again include all, letters, but not in a linear order.
-    """
+    """Test automatic naming if there are variables with a given name."""
     letoff = 0
     #             *      a        b       c      *      d     e
     for var in [narray, array1, array2, scal1, nscal, scal2, scal3]:
@@ -134,6 +132,32 @@ def test_builder_variable_alloc_mixed_naming2(
         assert sdfg_var.dtype == var.dtype
 
 
+def test_builder_variable_alloc_auto_naming_wrapped(
+    translation_builder: translator.JaxprTranslationBuilder,
+) -> None:
+    """Tests the variable naming if we have more than 26 variables."""
+    single_letters = [chr(x) for x in range(97, 123)]
+    i = 0
+    for let1 in ["", *single_letters[1:]]:  # Note `z` is followed by `ba` and not by `aa`.
+        for let2 in single_letters:
+            i += 1
+            # Create a variable and enter it into the variable naming.
+            var = JaCeVar(shape=(19, 19), dtype=dace.float64)
+            sdfg_name = translation_builder.add_array(arg=var, update_var_mapping=True)
+            mapped_name = translation_builder.map_jax_var_to_sdfg(var)
+            assert (
+                sdfg_name == mapped_name
+            ), f"Mapping for '{var}' failed, expected '{sdfg_name}' got '{mapped_name}'."
+
+            # Get the name that we really expect, we must also handle some situations.
+            exp_name = let1 + let2
+            if exp_name in util.FORBIDDEN_SDFG_VAR_NAMES:
+                exp_name = "__jace_forbidden_" + exp_name
+            assert (
+                exp_name == sdfg_name
+            ), f"Automated naming failed, expected '{exp_name}' but got '{sdfg_name}'."
+
+
 def test_builder_variable_alloc_prefix_naming(
     translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
@@ -162,32 +186,6 @@ def test_builder_variable_alloc_prefix_naming(
     assert exp_name_3 == sdfg_name_3
 
 
-def test_builder_variable_alloc_auto_naming_wrapped(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
-    """Tests the variable naming if we have more than 26 variables."""
-    single_letters = [chr(x) for x in range(97, 123)]
-    i = 0
-    for let1 in ["", *single_letters[1:]]:  # Note `z` is followed by `ba` and not by `aa`.
-        for let2 in single_letters:
-            i += 1
-            # Create a variable and enter it into the variable naming.
-            var = JaCeVar(shape=(19, 19), dtype=dace.float64)
-            sdfg_name = translation_builder.add_array(arg=var, update_var_mapping=True)
-            mapped_name = translation_builder.map_jax_var_to_sdfg(var)
-            assert (
-                sdfg_name == mapped_name
-            ), f"Mapping for '{var}' failed, expected '{sdfg_name}' got '{mapped_name}'."
-
-            # Get the name that we really expect, we must also handle some situations.
-            exp_name = let1 + let2
-            if exp_name in util.FORBIDDEN_SDFG_VAR_NAMES:
-                exp_name = "__jace_forbidden_" + exp_name
-            assert (
-                exp_name == sdfg_name
-            ), f"Automated naming failed, expected '{exp_name}' but got '{sdfg_name}'."
-
-
 def test_builder_nested(
     translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
@@ -246,8 +244,7 @@ def test_builder_nested(
     assert translation_builder.sdfg.number_of_nodes() == 2
     assert translation_builder.sdfg.number_of_edges() == 1
 
-    # Again the variable that was declared in the last stack is now no longer present.
-    #  Note if the nested SDFG was integrated into the parent SDFG it would be accessible
+    # Again the variable that was declared in the nested context is now no longer present.
     with pytest.raises(
         expected_exception=KeyError,
         match=re.escape(
@@ -302,10 +299,10 @@ def test_builder_append_state(
     assert next(iter(sdfg.in_edges(non_terminal_state))).src is terminal_state_1
 
 
-def test_builder_variable_multiple_variables(
+def test_builder_variable_multiple_versions(
     translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
-    """A simple test in which we try to add a variable that are known, but with a different name."""
+    """A simple test in which we try to add a variable that is known, but with a different name."""
     # Now we will add `array1` and then different ways of updating it.
     narray1: str = translation_builder.add_array(array1, update_var_mapping=True)
 
@@ -574,9 +571,10 @@ def test_builder_direct_return() -> None:
     """Tests the case, when an input value is returned as output.
 
     Note:
-        The test function below will not return a reference to its input, but perform an actual
-        copy. This behaviour does look strange from a Python point of view, however, it is (at the
-        time of writing) consistent with what Jax does, even when passing Jax arrays directly.
+        The test function below will not return a reference to its input,
+        but perform an actual copy. This behaviour does look strange from a
+        Python point of view, however, it is (at the time of writing)
+        consistent with what Jax does, even when passing Jax arrays directly.
     """
 
     @jace.jit
@@ -668,3 +666,17 @@ def testee(A: np.ndarray) -> np.ndarray:
         match=re.escape("Currently can not yet handle strides beside 'C_CONTIGUOUS'."),
     ):
         _ = testee(F)
+
+
+def test_builder_drop_variables() -> None:
+    """Tests if the builder can handle drop variables."""
+
+    @jace.grad
+    def testee(A: np.float64) -> jax.Array:
+        return jnp.exp(jnp.sin(jnp.tan(A**3))) ** 2
+
+    A = np.e
+    ref = testee(A)
+    res = jace.jit(testee)(A)
+
+    assert np.allclose(ref, res)
diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index 22021c9..60497d7 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -26,11 +26,11 @@
 
 
 if TYPE_CHECKING:
-    from collections.abc import Mapping
+    from collections.abc import Generator, Mapping
 
 
 @pytest.fixture(autouse=True)
-def _conserve_builtin_translators() -> None:
+def _conserve_builtin_translators() -> Generator[None, None, None]:
     """Restores the set of registered subtranslators after a test."""
     initial_translators = get_registered_primitive_translators()
     yield
@@ -38,14 +38,16 @@ def _conserve_builtin_translators() -> None:
 
 
 @pytest.fixture()
-def no_builtin_translators() -> None:  # noqa: PT004  # This is how you should do it: https://docs.pytest.org/en/7.1.x/how-to/fixtures.html#use-fixtures-in-classes-and-modules-with-usefixtures
+def no_builtin_translators() -> Generator[None, None, None]:  # noqa: PT004  # This is how you should do it: https://docs.pytest.org/en/7.1.x/how-to/fixtures.html#use-fixtures-in-classes-and-modules-with-usefixtures
     """This fixture can be used if the test does not want any builtin translators."""
     initial_translators = translator.set_active_primitive_translators_to({})
     yield
     translator.set_active_primitive_translators_to(initial_translators)
 
 
-# These are definitions of some Subtranslators that can be used to test things.
+# <------------- Definitions needed for the test
+
+
 class SubTrans1(translator.PrimitiveTranslator):
     @property
     def primitive(self):
@@ -71,13 +73,7 @@ def SubTrans3_Callable(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
 
 @make_primitive_translator("add")
 def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
-    raise NotImplementedError
-
-
-def test_are_subtranslators_imported() -> None:
-    """Tests if something is inside the list of subtranslators."""
-    # Must be adapted if new primitives are implemented.
-    assert len(get_registered_primitive_translators()) == 60
+    raise NotImplementedError("'fake_add_translator()' was called.")
 
 
 @pytest.mark.usefixtures("no_builtin_translators")
@@ -134,23 +130,19 @@ def same_structure(
     initial_primitives = get_registered_primitive_translators()
     assert "add" in initial_primitives
 
-    # Now mutate the dict a little bit, shallow copy it first.
-    mutated_primitives = initial_primitives.copy()
-    mutated_primitives["add"] = fake_add_translator
-    assert mutated_primitives.keys() == initial_primitives.keys()
-    assert same_structure(initial_primitives, get_registered_primitive_translators())
-    assert not same_structure(mutated_primitives, initial_primitives)
-    assert not same_structure(mutated_primitives, get_registered_primitive_translators())
-
-    # Now change the initial one with the mutated one.
-    #  The object is copied but should still have the same structure.
-    old_active = set_active_primitive_translators_to(mutated_primitives)
-    assert mutated_primitives is not translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
+    # Generate a set of translators that we swap in
+    new_active_primitives = initial_primitives.copy()
+    new_active_primitives["add"] = fake_add_translator
+
+    # Now perform the changes.
+    old_active = set_active_primitive_translators_to(new_active_primitives)
+    assert (
+        new_active_primitives is not translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
+    )
     assert same_structure(old_active, initial_primitives)
-    assert same_structure(mutated_primitives, get_registered_primitive_translators())
+    assert same_structure(new_active_primitives, get_registered_primitive_translators())
 
 
-@pytest.mark.usefixtures("no_builtin_translators")
 def test_subtranslatior_managing_callable_annotation() -> None:
     """Test if `make_primitive_translator()` works."""
 
@@ -162,37 +154,33 @@ def non_existing_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
 
     assert hasattr(non_existing_translator, "primitive")
     assert non_existing_translator.primitive == prim_name
-    assert len(get_registered_primitive_translators()) == 0
 
 
 def test_subtranslatior_managing_overwriting() -> None:
-    """Tests if we are able to overwrite something."""
+    """Tests if we are able to overwrite a translator in the global registry."""
     current_add_translator = get_registered_primitive_translators()["add"]
 
-    @make_primitive_translator("add")
-    def useless_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
-        raise NotImplementedError
-
-    # This will not work because it is not overwritten.
+    # This will not work because overwriting is not activated.
     with pytest.raises(
         expected_exception=ValueError,
         match=re.escape(
             "Explicit override=True needed for primitive 'add' to overwrite existing one."
         ),
     ):
-        register_primitive_translator(useless_add_translator)
+        register_primitive_translator(fake_add_translator)
     assert current_add_translator is get_registered_primitive_translators()["add"]
 
-    # Now we use overwrite, thus it will now work.
-    assert useless_add_translator is register_primitive_translator(
-        useless_add_translator, overwrite=True
-    )
-    assert useless_add_translator is get_registered_primitive_translators()["add"]
+    # Now we use overwrite.
+    assert fake_add_translator is register_primitive_translator(fake_add_translator, overwrite=True)
+    assert fake_add_translator is get_registered_primitive_translators()["add"]
 
 
 @pytest.mark.usefixtures("no_builtin_translators")
 def test_subtranslatior_managing_overwriting_2() -> None:
-    """Again an overwriting test, but this time a bit more complicated."""
+    """Again an overwriting test, but this time a bit more complicated.
+
+    It also shows if the translator was actually called.
+    """
 
     trans_cnt = [0]
 
@@ -227,18 +215,14 @@ def foo(A: int) -> int:
         D = C + 1
         return D + 1
 
-    @register_primitive_translator(overwrite=True)
-    @make_primitive_translator("add")
-    def useless_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
-        raise NotImplementedError("The 'useless_add_translator' was called as expected.")
-
-    assert get_registered_primitive_translators()["add"] is useless_add_translator
+    # Now register the add translator.
+    register_primitive_translator(fake_add_translator, overwrite=True)
 
     # Since `foo` was already constructed, a new registering can not change anything.
     A = np.zeros((10, 10))
     assert np.all(foo(A) == 4)
 
-    # But if we now annotate a new function, then we will get the uselss translator
+    # But if we now annotate a new function, then we will get fake translator
     @jace.jit
     def foo_fail(A):
         B = A + 1
@@ -246,6 +230,6 @@ def foo_fail(A):
 
     with pytest.raises(
         expected_exception=NotImplementedError,
-        match=re.escape("The 'useless_add_translator' was called as expected."),
+        match=re.escape("'fake_add_translator()' was called."),
     ):
         _ = foo_fail.lower(A)
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index e615ee3..c633f24 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -58,7 +58,7 @@ def wrapped(A, B):
     assert np.allclose(testee(A, B), compiled(A, B))
 
     # Now lets call the wrapped object directly, since we already did the lowering
-    #  no longering (and compiling) is needed.
+    #  no lowering (and compiling) is needed.
     assert np.allclose(testee(A, B), wrapped(A, B))
     assert lowering_cnt[0] == 1
 
@@ -123,10 +123,10 @@ def wrapped(A, B):
     C = testutil.mkarray((4, 3), dtype=np.int64)
     D = testutil.mkarray((6, 3), dtype=np.int64)
 
-    # These are the known lowerings.
+    # These are the known lowered instances.
     lowerings: dict[tuple[int, int], stages.JaCeLowered] = {}
     lowering_ids: set[int] = set()
-    # These are the known compilations.
+    # These are the known compilation instances.
     compilations: dict[tuple[int, int], stages.JaCeCompiled] = {}
     compiled_ids: set[int] = set()
 
@@ -174,16 +174,8 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     # Now we lower it.
     jaceLowered = jaceWrapped.lower(A, B)
 
-    # Compiling it without any information.
+    # Compiling it with and without optimizations enabled
     optiCompiled = jaceLowered.compile()
-
-    # This should be the same as passing the defaults directly.
-    assert optiCompiled is jaceLowered.compile(optimization.DEFAULT_OPTIMIZATIONS)
-
-    # Also if we pass the empty dict, we should get the default.
-    assert optiCompiled is jaceLowered.compile({})
-
-    # Now we disable all optimizations
     unoptiCompiled = jaceLowered.compile(optimization.NO_OPTIMIZATIONS)
 
     # Because of the way how things work the optimized must have more than the unoptimized.
@@ -192,6 +184,11 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     assert optiCompiled._csdfg.sdfg.number_of_nodes() == 1
     assert optiCompiled._csdfg.sdfg.number_of_nodes() < unoptiCompiled._csdfg.sdfg.number_of_nodes()
 
+    # Now we check if they are still inside the cache.
+    assert optiCompiled is jaceLowered.compile(optimization.DEFAULT_OPTIMIZATIONS)
+    assert optiCompiled is jaceLowered.compile({})
+    assert unoptiCompiled is jaceLowered.compile(optimization.NO_OPTIMIZATIONS)
+
 
 def test_caching_dtype() -> None:
     """Tests if the data type is properly included in the test."""
@@ -227,28 +224,35 @@ def testee(A: np.ndarray) -> np.ndarray:
         return A + 1.0
 
     cache: tcache.StageCache = testee._cache
+    assert len(cache) == 0
 
     first_lowered = testee.lower(np.ones(10))
     first_key = cache.front()[0]
+    assert len(cache) == 1
+
     second_lowered = testee.lower(np.ones(11))
     second_key = cache.front()[0]
+    assert len(cache) == 2
+    assert second_key != first_key
+
     third_lowered = testee.lower(np.ones(12))
     third_key = cache.front()[0]
+    assert len(cache) == 3
+    assert third_key != second_key
+    assert third_key != first_key
 
-    assert first_key != second_key
-    assert first_key != third_key
-    assert second_key != third_key
-    assert cache[first_key] is first_lowered
-    assert cache[second_key] is second_lowered
+    # Test if the key association is correct.
+    #  Since reading does not modify the order, third key must be still at the front.
+    #  To test this we also have this strange order.
+    assert cache.front()[0] == third_key
     assert cache[third_key] is third_lowered
-
-    assert first_key in cache
-    assert second_key in cache
-    assert third_key in cache
+    assert cache[second_key] is second_lowered
+    assert cache[first_key] is first_lowered
     assert cache.front()[0] == third_key
 
     # We now evict the second key, which should not change anything on the order.
     cache.popitem(second_key)
+    assert len(cache) == 2
     assert first_key in cache
     assert second_key not in cache
     assert third_key in cache
@@ -256,16 +260,15 @@ def testee(A: np.ndarray) -> np.ndarray:
 
     # Now we modify first_key, which moves it to the front.
     cache[first_key] = first_lowered
+    assert len(cache) == 2
     assert first_key in cache
-    assert second_key not in cache
     assert third_key in cache
     assert cache.front()[0] == first_key
 
     # Now we evict the oldest one, which is third_key
     cache.popitem(None)
+    assert len(cache) == 1
     assert first_key in cache
-    assert second_key not in cache
-    assert third_key not in cache
     assert cache.front()[0] == first_key
 
 
@@ -316,11 +319,15 @@ def testee(A: np.ndarray) -> np.ndarray:
     assert second_key not in cache
 
 
+@pytest.mark.skip("Non C order is not supported")
 def test_caching_strides() -> None:
     """Test if the cache detects a change in strides."""
 
+    lower_cnt = [0]
+
     @jace.jit
     def wrapped(A: np.ndarray) -> np.ndarray:
+        lower_cnt[0] += 1
         return A + 10.0
 
     shape = (10, 100, 1000)
@@ -338,15 +345,14 @@ def wrapped(A: np.ndarray) -> np.ndarray:
     # Now we run it with FORTRAN strides.
     #  However, this does not work because we do not support strides at all.
     #  But the cache is aware of this, which helps catch some nasty bugs.
-    F_lower = None  # Remove later
-    F_res = C_res.copy()  # Remove later
-    with pytest.raises(  # noqa: PT012 # Multiple calls
+    with pytest.raises(
         expected_exception=NotImplementedError,
         match=re.escape("Currently can not yet handle strides beside 'C_CONTIGUOUS'."),
     ):
         F_lower = wrapped.lower(F)
-        F_res = wrapped(F)
-    assert F_lower is None  # Remove later.
+    F_res = F_lower.compile()(F)
+
     assert C_res is not F_res
     assert np.allclose(F_res, C_res)
     assert F_lower is not C_lower
+    assert lower_cnt[0] == 2
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index a10aef3..d36e326 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -152,7 +152,7 @@ def jace_ddf(x):
 def test_grad_control_flow() -> None:
     """Tests if `grad` and controlflow works.
 
-    This requirement is mentioned in `https://jax.readthedocs.io/en/latest/notebooks/Common_Gotchas_in_JAX.html#python-control-flow-autodiff`.
+    This requirement is mentioned in the [documentation](https://jax.readthedocs.io/en/latest/notebooks/Common_Gotchas_in_JAX.html#python-control-flow-autodiff).
     """
 
     @jace.grad
@@ -209,4 +209,7 @@ def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
     #  float64 as input! Calling the resulting SDFG with the arguments we used for lowering
     #  will result in an error, because of the situation, `sizeof(float32) < sizeof(float64)`,
     #  no out of bound error would result, but the values are garbage.
-    assert tsdfg.sdfg.arrays[tsdfg.inp_names[0]].dtype.as_numpy_dtype().type is np.float32
+    assert all(
+        tsdfg.sdfg.arrays[inp_name].dtype.as_numpy_dtype().type is np.float32
+        for inp_name in tsdfg.inp_names
+    )
diff --git a/tests/unit_tests/test_misc.py b/tests/unit_tests/test_misc.py
index d595498..d53a428 100644
--- a/tests/unit_tests/test_misc.py
+++ b/tests/unit_tests/test_misc.py
@@ -18,12 +18,13 @@
 
 
 @pytest.mark.skip("Possible bug in DaCe.")
-def test_mismatch_in_datatyte_calling() -> None:
+def test_mismatch_in_datatype_calling() -> None:
     """Tests compilation and calling with different types.
 
-    Note that this more or less a test for the calling implementation of the `CompiledSDFG`
-    class in DaCe. As I understand the `CompiledSDFG::_construct_args()` function this should be
-    detected. However, as evidently it does not do this.
+    Note that this is more or less a test for the calling implementation of
+    the `CompiledSDFG` class in DaCe. As I understand the
+    `CompiledSDFG::_construct_args()` function this should be detected.
+    However, as evidently it does not do this.
     """
 
     @jace.jit

From 95f04bebdf439fac0fca8300b186133ad279fcc6 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 09:50:40 +0200
Subject: [PATCH 318/458] Updated how `is_tracing_ongoing()` works.

Before we simply relied on the inspection of the input arguments.
However, now we also inspect the tracing stack of jax.
Since this is a very complex variable that should be considered the internal of the internal, accessing it is actually a very stupid idea.
---
 src/jace/stages.py          |  1 -
 src/jace/util/jax_helper.py | 18 ++++++++++++++----
 2 files changed, 14 insertions(+), 5 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index c07d736..0670f7e 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -116,7 +116,6 @@ def __call__(
 
         The arguments passed to this function are the same as the wrapped function uses.
         """
-
         # If we are inside a traced context, then we forward the call to the wrapped function.
         #  This ensures that JaCe is composable with Jax.
         if util.is_tracing_ongoing(*args, **kwargs):
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index ca6f60c..cbc25d7 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -18,6 +18,7 @@
 from typing import TYPE_CHECKING, Any
 
 import dace
+import jax
 import jax.core as jax_core
 import numpy as np
 
@@ -141,10 +142,19 @@ def is_tracing_ongoing(
     While a return value `True` guarantees that a translation is ongoing, a
     value of `False` does not guarantees that no tracing is ongoing.
     """
-    # The current implementation only checks the arguments if it contains tracers.
-    if (len(args) == 0) and (len(kwargs) == 0):
-        raise RuntimeError("Failed to determine if tracing is ongoing.")
-    return any(isinstance(x, jax_core.Tracer) for x in itertools.chain(args, kwargs.values()))
+    # To detect if there is tracing ongoing, we check the internal tracing stack of Jax.
+    #  Note that this is highly internal and depends on the precise implementation of Jax.
+    #  For that reason we first look at all arguments and check if they are tracers.
+    #  Furthermore, it seems that Jax always have a bottom interpreter on the stack,
+    #  this is because we empty is `len(...) == 1`!
+    #  See also: https://github.com/google/jax/pull/3370
+    if any(isinstance(x, jax_core.Tracer) for x in itertools.chain(args, kwargs.values())):
+        return True
+    if len(jax._src.core.thread_local_state.trace_state.trace_stack.stack) == 1:
+        return False
+    if len(jax._src.core.thread_local_state.trace_state.trace_stack.stack) > 1:
+        return True
+    raise RuntimeError("Failed to determine if tracing is ongoing.")
 
 
 def translate_dtype(

From bbc51d0644af9a26276d5e6f6e949e5f16c011d2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 10:11:56 +0200
Subject: [PATCH 319/458] The translator is now also able to handle cases with
 no input arguments.

---
 src/jace/stages.py                            |  7 +++++--
 .../translator/jaxpr_translator_builder.py    | 20 ++++++++++++++++++-
 2 files changed, 24 insertions(+), 3 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index 0670f7e..c3032a6 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -326,8 +326,11 @@ def __init__(
         inp_names: Sequence[str],
         out_names: Sequence[str],
     ) -> None:
-        if (not inp_names) or (not out_names):
-            raise ValueError("Input and output can not be empty.")
+        # NOTE: We only check that we have output, we do not care about the input, since the
+        #  function `def foo(): return 1.0` is still a pure function, but we require that we have
+        #  output.
+        if not out_names:
+            raise ValueError("A jited function needs at least one output.")
         self._csdfg = csdfg
         self._inp_names = tuple(inp_names)
         self._out_names = tuple(out_names)
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 437787e..d00f110 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -666,7 +666,7 @@ def _handle_null_jaxpr(
             The function will _not_ update the `out_names` field of the current context.
         """
         assert self._ctx.terminal_state is self._ctx.start_state
-        assert self._ctx.inp_names
+        assert isinstance(self._ctx.inp_names, tuple)
         assert self._ctx.out_names is None
 
         # There is not output so we do not have to copy anything around.
@@ -786,4 +786,22 @@ def validate(self) -> bool:
                 self.sdfg,
                 self.sdfg.node_id(self.terminal_state),
             )
+        if not (
+            self.inp_names is None
+            or all(inp_name in self.sdfg.arrays for inp_name in self.inp_names)
+        ):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Missing input arguments: {(inp_name for inp_name in self.inp_names if inp_name not in self.sdfg.arrays)}",
+                self.sdfg,
+                self.sdfg.node_id(self.terminal_state),
+            )
+        if not (
+            self.out_names is None
+            or all(out_name in self.sdfg.arrays for out_name in self.out_names)
+        ):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Missing output arguments: {(out_name for out_name in self.out_names if out_name not in self.sdfg.arrays)}",
+                self.sdfg,
+                self.sdfg.node_id(self.terminal_state),
+            )
         return True

From f1846eb7eb02b9989fa6cbc39e341d81e5383724 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 10:21:39 +0200
Subject: [PATCH 320/458] Updated the tests.

---
 tests/conftest.py                           | 25 +++++++++++--
 tests/integration_tests/test_empty_jaxpr.py |  1 +
 tests/unit_tests/test_caching.py            | 38 +++++++++++++++++---
 tests/unit_tests/test_jax_api.py            | 40 ++++++++++++++++++++-
 4 files changed, 96 insertions(+), 8 deletions(-)

diff --git a/tests/conftest.py b/tests/conftest.py
index df8e75c..4bd941f 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -14,6 +14,8 @@
 
 from __future__ import annotations
 
+from typing import TYPE_CHECKING
+
 import jax
 import numpy as np
 import pytest
@@ -21,8 +23,12 @@
 from jace.util import translation_cache as tcache
 
 
+if TYPE_CHECKING:
+    from collections.abc import Generator
+
+
 @pytest.fixture(autouse=True)
-def _enable_x64_mode_in_jax() -> None:
+def _enable_x64_mode_in_jax() -> Generator[None, None, None]:
     """Fixture of enable the `x64` mode in Jax.
 
     Currently, JaCe requires that `x64` mode is enabled and will do all Jax
@@ -34,7 +40,7 @@ def _enable_x64_mode_in_jax() -> None:
 
 
 @pytest.fixture(autouse=True)
-def _disable_jit() -> None:
+def _disable_jit() -> Generator[None, None, None]:
     """Fixture for disable the dynamic jiting in Jax.
 
     For certain reasons Jax puts certain primitives inside a `pjit` primitive,
@@ -45,6 +51,9 @@ def _disable_jit() -> None:
     to an error. To overcome this problem, we will globally disable this feature
     until we can handle `pjit`.
 
+    Note this essentially disable the `jax.jit` decorator, however, the `jace.jit`
+    decorator is still working.
+
     Todo:
         Remove as soon as we can handle nested `jit`.
     """
@@ -52,8 +61,18 @@ def _disable_jit() -> None:
         yield
 
 
+@pytest.fixture()
+def _enable_jit() -> Generator[None, None, None]:
+    """Fixture to enable jit compilation.
+
+    Essentially it undoes the effects of the `_disable_jit()` fixture.
+    """
+    with jax.disable_jit(disable=False):
+        yield
+
+
 @pytest.fixture(autouse=True)
-def _clear_translation_cache() -> None:
+def _clear_translation_cache() -> Generator[None, None, None]:
     """Decorator that clears the translation cache.
 
     Ensures that a function finds an empty cache and clears up afterwards.
diff --git a/tests/integration_tests/test_empty_jaxpr.py b/tests/integration_tests/test_empty_jaxpr.py
index 22a1be3..b877471 100644
--- a/tests/integration_tests/test_empty_jaxpr.py
+++ b/tests/integration_tests/test_empty_jaxpr.py
@@ -87,6 +87,7 @@ def wrapped(A: np.float64) -> np.float64:
     assert np.all(wrapped(A) == A)
 
 
+@pytest.mark.skip(reason="Literal return value is not implemented.")
 def test_empty_literal_return() -> None:
     """An empty Jaxpr that only contains a literal return value."""
 
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index c633f24..9e856b3 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -14,8 +14,10 @@
 import re
 from typing import TYPE_CHECKING
 
+import jax
 import numpy as np
 import pytest
+from jax import numpy as jnp
 
 import jace
 from jace import optimization, stages
@@ -27,6 +29,33 @@
     from jace.util import translation_cache as tcache
 
 
+def test_caching_working() -> None:
+    """Simple test if the caching actually works."""
+
+    lowering_cnt = [0]
+
+    @jace.jit
+    def wrapped(A: np.ndarray) -> jax.Array:
+        lowering_cnt[0] += 1
+        return jnp.sin(A)
+
+    A = testutil.mkarray((10, 10))
+    ref = np.sin(A)
+    res_ids: set[int] = set()
+    # We have to store the array, because numpy does reuse the memory.
+    res_set: list[np.ndarray] = []
+
+    for _ in range(10):
+        res = wrapped(A)
+        res_id = res.__array_interface__["data"][0]
+
+        assert np.allclose(res, ref)
+        assert lowering_cnt[0] == 1
+        assert res_id not in res_ids
+        res_ids.add(res_id)
+        res_set.append(res)
+
+
 def test_caching_same_sizes() -> None:
     """The behaviour of the cache if same sizes are used, in two different functions."""
 
@@ -242,12 +271,13 @@ def testee(A: np.ndarray) -> np.ndarray:
     assert third_key != first_key
 
     # Test if the key association is correct.
-    #  Since reading does not modify the order, third key must be still at the front.
-    #  To test this we also have this strange order.
+    #  We have to do it in this order, because reading the key modifies the order.
     assert cache.front()[0] == third_key
-    assert cache[third_key] is third_lowered
-    assert cache[second_key] is second_lowered
     assert cache[first_key] is first_lowered
+    assert cache.front()[0] == first_key
+    assert cache[second_key] is second_lowered
+    assert cache.front()[0] == second_key
+    assert cache[third_key] is third_lowered
     assert cache.front()[0] == third_key
 
     # We now evict the second key, which should not change anything on the order.
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index d36e326..434c983 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -15,7 +15,7 @@
 from jax import numpy as jnp
 
 import jace
-from jace import translator
+from jace import translator, util
 from jace.translator import pre_post_translation as ptrans
 
 from tests import util as testutil
@@ -213,3 +213,41 @@ def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
         tsdfg.sdfg.arrays[inp_name].dtype.as_numpy_dtype().type is np.float32
         for inp_name in tsdfg.inp_names
     )
+
+
+@pytest.mark.usefixtures("_enable_jit")
+def test_tracing_detection() -> None:
+    """Tests our ability to detect if tracing is going on."""
+    expected_tracing_state = False
+
+    def testee(a: float, b: int) -> float:
+        c = a + b
+        assert util.is_tracing_ongoing(a, b) == expected_tracing_state
+        assert util.is_tracing_ongoing() == expected_tracing_state
+        return a + c
+
+    # We do not expect tracing to happen.
+    _ = testee(1.0, 1)
+
+    # Now tracing is going on
+    expected_tracing_state = True
+    _ = jax.jit(testee)(1.0, 1)
+    _ = jace.jit(testee)(1.0, 1)
+
+    # Tracing should now again be disabled
+    expected_tracing_state = False
+    _ = testee
+
+
+def test_no_input() -> None:
+    """Tests if we can handle the case of no input."""
+
+    @jace.jit
+    def ones10x10() -> jax.Array:
+        return jnp.ones((10, 10), dtype=np.int32)
+
+    res = ones10x10()
+
+    assert res.shape == (10, 10)
+    assert res.dtype == np.int32
+    assert np.all(res == 1)

From bf6802183e94911c1a2155609710d22b35924908 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 11:32:12 +0200
Subject: [PATCH 321/458] Updated the element type conversion translator.

---
 .../convert_element_type_translator.py        | 25 ++++++-------------
 1 file changed, 7 insertions(+), 18 deletions(-)

diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index 59230d8..6dd7576 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -57,33 +57,22 @@ def write_tasklet_code(
         out_dtype = util.get_jax_var_dtype(eqn.outvars[0]).type
         out_dtype_s: str = out_dtype.__name__
 
-        # This is the base of the template that we use for conversion.
-        #  You should notice that the Tasklet `__out = __in0` will fail, see commit
-        #  `f5aabc3` of the prototype. Thus we have to do it in this way.
+        # This is the base of the template that we use for conversion. You should notice that
+        #  the Tasklet `__out = __in0` will fail, see commit `f5aabc3` of the prototype. Thus
+        #  we have to do it in this way.
         conv_code = "__in0"
 
-        # Handle special cases
-        if in_dtype_s.startswith("bool") and in_dtype == out_dtype:
-            #  Second and more importantly, in Jax the casting from bool to bool has a special
-            #  meaning, because in Jax all logical operations are bitwise. If a logical operation
-            #  is used, then Jax first makes it a bool by running `a != 0`.
-            #  Jax does this to ensure that it has either `0` or a `1`, I assume that is because
-            #  XLA does not have a native bool, similar as C.
-            #  However, in C++, that has a native bool, this operation is kind of useless.
-            #  But we keep it as special case to serve as a documentation.
-            return f"__out = {conv_code}"
         if in_dtype == out_dtype:
-            # For some odd reason, this conversion also happens if with other types as bool,
-            #  see above. For that reason we also keep it as special case.
-            #  In previous versions we generated a warning here, but it had become so annoying
-            #  that it was removed.
+            # For some reason Jax sometimes adds conversions where no are needed. I think
+            #  that the reason for this is the special type system that Jax made. In these cases
+            #  we do not add a cast, because such a Tasklet is not trivial and DaCe can not remove it.
             return f"__out = {conv_code}"
 
         if in_dtype_s.startswith("bool"):
             # Interestingly `__out = int(__in0)` will not work, see commit `f5aabc` of the prototype.
             conv_code = f"(1 if {conv_code} else 0)"
 
-        if out_dtype_s == "bool":
+        if out_dtype_s.startswith("bool"):
             conv_code = f"dace.bool_({conv_code})"
         elif hasattr(dace.dtypes, out_dtype_s):
             conv_code = f"dace.{out_dtype_s}({conv_code})"

From a376aadd9fd194be26a9f371572eddfce7533b6f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 11:35:01 +0200
Subject: [PATCH 322/458] Updated the slicing primitive and tests.

It is now able to handle strides and there is a test for that.
---
 .../primitive_translators/slicing.py          |  11 +-
 .../test_primitive_slicing.py                 | 119 +++---------------
 2 files changed, 23 insertions(+), 107 deletions(-)

diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index fb16040..1b708d4 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -51,16 +51,17 @@ def make_input_memlets(
         eqn: jax_core.JaxprEqn,
     ) -> dict[str, dace.Memlet]:
         """We have to add the offsets to the Memlet accesses."""
-        if eqn.params["strides"] is not None:
-            raise NotImplementedError("Non 1 strides are not implemented.")
 
-        start_indices = eqn.params["start_indices"]  # Fist index to slice
+        strides: Sequence[int] = (
+            ((1,) * len(tskl_ranges)) if eqn.params["strides"] is None else eqn.params["strides"]
+        )
+        start_indices: Sequence[int] = eqn.params["start_indices"]  # Fist index to slice
         return {
             "__in0": dace.Memlet.simple(
                 in_var_names[0],
                 ", ".join(
-                    f"{it_idx} + {start_index}"
-                    for (it_idx, _), start_index in zip(tskl_ranges, start_indices)
+                    f"{start_index} + {it_idx} * {stride}"
+                    for (it_idx, _), start_index, stride in zip(tskl_ranges, start_indices, strides)
                 ),
             )
         }
diff --git a/tests/integration_tests/primitive_translators/test_primitive_slicing.py b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
index b0c5dd1..2f6bf40 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_slicing.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
@@ -19,8 +19,8 @@
 
 
 @pytest.fixture()
-def A_4x4() -> np.ndarray:
-    return testutil.mkarray((4, 4))
+def A_20x20x20() -> np.ndarray:
+    return testutil.mkarray((20, 20, 20))
 
 
 @pytest.fixture()
@@ -43,118 +43,33 @@ def full_dynamic_start_idx(
     return request.param
 
 
-def test_slice_sub_view(
-    A_4x4: np.ndarray,
+def test_slice_no_strides(
+    A_20x20x20: np.ndarray,
 ) -> None:
-    @jace.jit
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A[1:3, 1:3]
+    """Test without strides."""
 
-    ref = A_4x4[1:3, 1:3]
-    res = testee(A_4x4)
-
-    assert ref.shape == res.shape
-    assert np.all(ref == res)
-
-
-def test_slice_rslice(
-    A_4x4: np.ndarray,
-) -> None:
-    """Only extracting rows."""
-
-    @jace.jit
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A[1:3]
-
-    ref = A_4x4[1:3]
-    res = testee(A_4x4)
-
-    assert ref.shape == res.shape
-    assert np.all(ref == res)
-
-
-def test_slice_cslice(
-    A_4x4: np.ndarray,
-) -> None:
-    """Slicing some columns."""
-
-    @jace.jit
-    def testee(A: np.ndarray) -> np.ndarray:
-        # NOTE: using `A[..., 1:3]` would trigger the `gather` primitive.
-        return A[:, 1:3]
-
-    ref = A_4x4[:, 1:3]
-    res = testee(A_4x4)
-
-    assert ref.shape == res.shape
-    assert np.all(ref == res)
-
-
-def test_slice_singelton(
-    A_4x4: np.ndarray,
-) -> None:
-    """Only extracting a single value."""
-
-    @jace.jit
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A[1:2, 1:2]
-
-    ref = A_4x4[1:2, 1:2]
-    res = testee(A_4x4)
-
-    assert ref.shape == res.shape
-    assert np.all(ref == res)
-
-
-@pytest.mark.skip(reason="Missing 'gather' translator.")
-def test_slice_strides_vec() -> None:
-    """Slice with strides.
-
-    Although the translator (and the primitive) would support a stride, for some
-    reason Jax makes a `gather` operation out of it, that is not yet supported.
-    """
-
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A[1:15:2]
+    def testee(A: np.ndarray) -> jax.Array:
+        # Read as: A[2:18, 3:19, 4:17]
+        return jax.lax.slice(A, (2, 3, 4), (18, 19, 17), None)
 
-    A = np.arange(16)
-    ref = testee(A)
-    res = jace.jit(testee)(A)
+    ref = testee(A_20x20x20)
+    res = jace.jit(testee)(A_20x20x20)
 
     assert ref.shape == res.shape
     assert np.all(ref == res)
 
 
-@pytest.mark.skip(reason="Missing 'concatenate' translator.")
 def test_slice_strides(
-    A_4x4: np.ndarray,
+    A_20x20x20: np.ndarray,
 ) -> None:
-    """Using strides in a 2D matrix.
+    """Test with strides."""
 
-    See `test_slice_strides_vec()` why the test is skipped.
-    """
-
-    @jace.jit
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A[::2, ::2]
-
-    ref = A_4x4[::2, ::2]
-    res = testee(A_4x4)
-
-    assert ref.shape == res.shape
-    assert np.all(ref == res)
-
-
-def test_slice_too_big(
-    A_4x4: np.ndarray,
-) -> None:
-    """Tests what happens if we specify a size that is too big."""
-
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A[:20]
+    def testee(A: np.ndarray) -> jax.Array:
+        # Read as: A[2:18:1, 3:19:2, 4:17:3]
+        return jax.lax.slice(A, (2, 3, 4), (18, 19, 17), (1, 2, 3))
 
-    ref = testee(A_4x4)
-    res = jace.jit(testee)(A_4x4)
+    ref = testee(A_20x20x20)
+    res = jace.jit(testee)(A_20x20x20)
 
     assert ref.shape == res.shape
     assert np.all(ref == res)

From 8a79f834d20d74cd6b9bc6810e68347e0387eb3c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 12:35:40 +0200
Subject: [PATCH 323/458] It is now also possible that Jax arrays can be used.

---
 src/jace/stages.py               |  2 +-
 src/jace/util/__init__.py        |  2 ++
 src/jace/util/traits.py          | 11 +++++++++
 tests/unit_tests/test_caching.py | 38 +++++++++++++++++++++++++++-----
 tests/unit_tests/test_jax_api.py | 16 ++++++++++++++
 5 files changed, 63 insertions(+), 6 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index c3032a6..94276c7 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -149,7 +149,7 @@ def lower(
         # TODO(phimuell): Currently the SDFG that we build only supports `C_CONTIGUOUS` memory
         #  order. Since we support the paradigm that "everything passed to `lower()` should also
         #  be accepted as argument to call the result", we forbid other memory orders here.
-        if not all((not util.is_array(arg)) or arg.flags["C_CONTIGUOUS"] for arg in args):
+        if not all((not util.is_array(arg)) or util.is_c_contiguous(arg) for arg in args):
             raise NotImplementedError("Currently can not yet handle strides beside 'C_CONTIGUOUS'.")
 
         # In Jax `float32` is the main datatype, and they go to great lengths to avoid some
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 1c1c8d4..c2f2031 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -26,6 +26,7 @@
 )
 from .traits import (
     is_array,
+    is_c_contiguous,
     is_drop_var,
     is_fully_addressable,
     is_jax_array,
@@ -45,6 +46,7 @@
     "get_jax_var_name",
     "get_jax_var_shape",
     "is_array",
+    "is_c_contiguous",
     "is_drop_var",
     "is_fully_addressable",
     "is_jax_array",
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index acada34..984f794 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -102,3 +102,14 @@ def is_fully_addressable(
     if is_jax_array(obj):
         return obj.is_fully_addressable
     return True
+
+
+def is_c_contiguous(
+    obj: Any,
+) -> bool:
+    """Tests if `obj` is in C order."""
+    if not is_array(obj):
+        return False
+    if is_jax_array(obj):
+        obj = obj.__array__()
+    return obj.flags["C_CONTIGUOUS"]
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index 9e856b3..fb50c6b 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -12,7 +12,6 @@
 
 import itertools as it
 import re
-from typing import TYPE_CHECKING
 
 import jax
 import numpy as np
@@ -21,14 +20,11 @@
 
 import jace
 from jace import optimization, stages
+from jace.util import translation_cache as tcache
 
 from tests import util as testutil
 
 
-if TYPE_CHECKING:
-    from jace.util import translation_cache as tcache
-
-
 def test_caching_working() -> None:
     """Simple test if the caching actually works."""
 
@@ -386,3 +382,35 @@ def wrapped(A: np.ndarray) -> np.ndarray:
     assert np.allclose(F_res, C_res)
     assert F_lower is not C_lower
     assert lower_cnt[0] == 2
+
+
+def test_caching_jax_numpy_array() -> None:
+    """Tests if jax arrays are handled the same way as numpy array."""
+
+    def _test_impl(
+        for_lowering: np.ndarray | jax.Array,
+        for_calling: np.ndarray | jax.Array,
+    ) -> None:
+        tcache.clear_translation_cache()
+        lowering_cnt = [0]
+
+        @jace.jit
+        def wrapped(A: np.ndarray | jax.Array) -> np.ndarray | jax.Array:
+            lowering_cnt[0] += 1
+            return A + 1.0
+
+        # Explicit lowering.
+        _ = wrapped(for_lowering)
+        assert lowering_cnt[0] == 1
+
+        # Now calling with the second argument, it should not longer again.
+        _ = wrapped(for_calling)
+        assert lowering_cnt[0] == 1, "Expected no further lowering."
+        return
+
+    A_numpy = testutil.mkarray((10, 10))
+    A_jax = jnp.array(A_numpy, copy=True)
+    assert A_numpy.dtype == A_jax.dtype
+
+    _test_impl(A_numpy, A_jax)
+    _test_impl(A_jax, A_numpy)
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index 434c983..a9beae2 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -251,3 +251,19 @@ def ones10x10() -> jax.Array:
     assert res.shape == (10, 10)
     assert res.dtype == np.int32
     assert np.all(res == 1)
+
+
+def test_jax_array_as_input() -> None:
+    """This function tests if we use Jax arrays as inputs."""
+
+    def testee(A: jax.Array) -> jax.Array:
+        return jnp.sin(A + 1.0)
+
+    A = jnp.array(testutil.mkarray((10, 19)))
+
+    ref = testee(A)
+    res = jace.jit(testee)(A)
+
+    assert res.shape == ref.shape
+    assert res.dtype == ref.dtype
+    assert np.allclose(res, ref)

From a4697bed2daa50d59a4638523c657606fed7dddd Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 12:42:12 +0200
Subject: [PATCH 324/458] Removed some direct import.

---
 .../test_primitive_translator_managing.py     | 60 +++++++++----------
 1 file changed, 28 insertions(+), 32 deletions(-)

diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index 60497d7..2a6ca33 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -17,12 +17,6 @@
 
 import jace
 from jace import translator
-from jace.translator import (
-    get_registered_primitive_translators,
-    make_primitive_translator,
-    register_primitive_translator,
-    set_active_primitive_translators_to,
-)
 
 
 if TYPE_CHECKING:
@@ -32,9 +26,9 @@
 @pytest.fixture(autouse=True)
 def _conserve_builtin_translators() -> Generator[None, None, None]:
     """Restores the set of registered subtranslators after a test."""
-    initial_translators = get_registered_primitive_translators()
+    initial_translators = translator.get_registered_primitive_translators()
     yield
-    set_active_primitive_translators_to(initial_translators)
+    translator.set_active_primitive_translators_to(initial_translators)
 
 
 @pytest.fixture()
@@ -66,12 +60,12 @@ def __call__(self) -> None:  # type: ignore[override]  # Arguments
         raise NotImplementedError
 
 
-@make_primitive_translator("non_existing_callable_primitive3")
+@translator.make_primitive_translator("non_existing_callable_primitive3")
 def SubTrans3_Callable(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
     raise NotImplementedError
 
 
-@make_primitive_translator("add")
+@translator.make_primitive_translator("add")
 def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
     raise NotImplementedError("'fake_add_translator()' was called.")
 
@@ -79,7 +73,7 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
 @pytest.mark.usefixtures("no_builtin_translators")
 def test_subtranslatior_managing() -> None:
     """Basic functionality of the subtranslators."""
-    original_active_subtrans = get_registered_primitive_translators()
+    original_active_subtrans = translator.get_registered_primitive_translators()
     assert len(original_active_subtrans) == 0
 
     # Create the classes.
@@ -91,34 +85,34 @@ def test_subtranslatior_managing() -> None:
 
     # Add the instances.
     for sub in prim_translators:
-        assert register_primitive_translator(sub) is sub
+        assert translator.register_primitive_translator(sub) is sub
 
     # Tests if they were correctly registered
-    active_subtrans = get_registered_primitive_translators()
+    active_subtrans = translator.get_registered_primitive_translators()
     for expected in prim_translators:
         assert active_subtrans[expected.primitive] is expected
     assert len(active_subtrans) == 3
 
 
 def test_subtranslatior_managing_isolation() -> None:
-    """Tests if `get_registered_primitive_translators()` protects the internal registry."""
+    """Tests if `translator.get_registered_primitive_translators()` protects the internal registry."""
     assert (
-        get_registered_primitive_translators()
+        translator.get_registered_primitive_translators()
         is not translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
     )
 
-    initial_primitives = get_registered_primitive_translators()
-    assert get_registered_primitive_translators() is not initial_primitives
+    initial_primitives = translator.get_registered_primitive_translators()
+    assert translator.get_registered_primitive_translators() is not initial_primitives
     assert "add" in initial_primitives, "For this test the 'add' primitive must be registered."
     org_add_prim = initial_primitives["add"]
 
     initial_primitives["add"] = fake_add_translator
     assert org_add_prim is not fake_add_translator
-    assert get_registered_primitive_translators()["add"] is org_add_prim
+    assert translator.get_registered_primitive_translators()["add"] is org_add_prim
 
 
 def test_subtranslatior_managing_swap() -> None:
-    """Tests the `set_active_primitive_translators_to()` functionality."""
+    """Tests the `translator.set_active_primitive_translators_to()` functionality."""
 
     # Allows to compare the structure of dicts.
     def same_structure(
@@ -127,7 +121,7 @@ def same_structure(
     ) -> bool:
         return d1.keys() == d2.keys() and all(id(d2[k]) == id(d1[k]) for k in d1)
 
-    initial_primitives = get_registered_primitive_translators()
+    initial_primitives = translator.get_registered_primitive_translators()
     assert "add" in initial_primitives
 
     # Generate a set of translators that we swap in
@@ -135,20 +129,20 @@ def same_structure(
     new_active_primitives["add"] = fake_add_translator
 
     # Now perform the changes.
-    old_active = set_active_primitive_translators_to(new_active_primitives)
+    old_active = translator.set_active_primitive_translators_to(new_active_primitives)
     assert (
         new_active_primitives is not translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
     )
     assert same_structure(old_active, initial_primitives)
-    assert same_structure(new_active_primitives, get_registered_primitive_translators())
+    assert same_structure(new_active_primitives, translator.get_registered_primitive_translators())
 
 
 def test_subtranslatior_managing_callable_annotation() -> None:
-    """Test if `make_primitive_translator()` works."""
+    """Test if `translator.make_primitive_translator()` works."""
 
     prim_name = "non_existing_property"
 
-    @make_primitive_translator(prim_name)
+    @translator.make_primitive_translator(prim_name)
     def non_existing_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
         raise NotImplementedError
 
@@ -158,7 +152,7 @@ def non_existing_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
 
 def test_subtranslatior_managing_overwriting() -> None:
     """Tests if we are able to overwrite a translator in the global registry."""
-    current_add_translator = get_registered_primitive_translators()["add"]
+    current_add_translator = translator.get_registered_primitive_translators()["add"]
 
     # This will not work because overwriting is not activated.
     with pytest.raises(
@@ -167,12 +161,14 @@ def test_subtranslatior_managing_overwriting() -> None:
             "Explicit override=True needed for primitive 'add' to overwrite existing one."
         ),
     ):
-        register_primitive_translator(fake_add_translator)
-    assert current_add_translator is get_registered_primitive_translators()["add"]
+        translator.register_primitive_translator(fake_add_translator)
+    assert current_add_translator is translator.get_registered_primitive_translators()["add"]
 
     # Now we use overwrite.
-    assert fake_add_translator is register_primitive_translator(fake_add_translator, overwrite=True)
-    assert fake_add_translator is get_registered_primitive_translators()["add"]
+    assert fake_add_translator is translator.register_primitive_translator(
+        fake_add_translator, overwrite=True
+    )
+    assert fake_add_translator is translator.get_registered_primitive_translators()["add"]
 
 
 @pytest.mark.usefixtures("no_builtin_translators")
@@ -184,8 +180,8 @@ def test_subtranslatior_managing_overwriting_2() -> None:
 
     trans_cnt = [0]
 
-    @register_primitive_translator(overwrite=True)
-    @make_primitive_translator("add")
+    @translator.register_primitive_translator(overwrite=True)
+    @translator.make_primitive_translator("add")
     def still_useless_but_a_bit_less(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
         trans_cnt[0] += 1
         return
@@ -216,7 +212,7 @@ def foo(A: int) -> int:
         return D + 1
 
     # Now register the add translator.
-    register_primitive_translator(fake_add_translator, overwrite=True)
+    translator.register_primitive_translator(fake_add_translator, overwrite=True)
 
     # Since `foo` was already constructed, a new registering can not change anything.
     A = np.zeros((10, 10))

From b64b666f34a135ac4c9db2e00b5bfb2abd10a33b Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 13:30:37 +0200
Subject: [PATCH 325/458] Implemented a way to modify the set of
 compilation/optimization options that are currently used.

---
 src/jace/optimization.py         |  5 +--
 src/jace/stages.py               | 71 ++++++++++++++++++++++----------
 tests/unit_tests/test_caching.py | 43 +++++++++++++++++++
 3 files changed, 94 insertions(+), 25 deletions(-)

diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index 63528db..94a8f36 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -5,10 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""JaCe specific optimizations.
-
-Currently just a dummy exists for the sake of providing a callable function.
-"""
+"""JaCe specific optimizations."""
 
 from __future__ import annotations
 
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 94276c7..b64e5d6 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -51,14 +51,14 @@
     "Stage",
 ]
 
+_JACELOWERED_ACTIVE_COMPILE_OPTIONS: CompilerOptions = optimization.DEFAULT_OPTIMIZATIONS.copy()
+"""Global set of currently active compilation/optimization options.
 
-__all__ = [
-    "CompilerOptions",  # export for compatibility with Jax.
-    "JaCeCompiled",
-    "JaCeLowered",
-    "JaCeWrapped",
-    "Stage",
-]
+These options are used by `JaCeLowered.compile()` to determine which options
+are forwarded to the underlying `jace_optimize()` function. It is initialized
+to `jace.optimization.DEFAULT_OPTIMIZATIONS` and can be managed through
+`update_active_compiler_options()`.
+"""
 
 
 class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
@@ -197,10 +197,10 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
 
     This class is the output type of `JaCeWrapped.lower()` and represents the
     originally wrapped computation as an SDFG. This stage is followed by the
-    `JaCeCompiled` stage.
+    `JaCeCompiled` stage, by calling `self.compile()`.
 
-    Args:
-        tsdfg: The translated SDFG object representing the computation.
+    Before the SDFG is optimized the SDFG is optimized, see `JaCeLowered.compile()`
+    for more information on this topic.
 
     Args:
         tsdfg:  The lowered SDFG with metadata. Must be finalized.
@@ -226,16 +226,18 @@ def compile(
         self,
         compiler_options: CompilerOptions | None = None,
     ) -> JaCeCompiled:
-        """Optimize and compile the lowered SDFG using `compiler_options`.
-
-        Returns an object that encapsulates a compiled SDFG object. To influence
-        the various optimizations and compile options of JaCe you can use the
-        `compiler_options` argument. If nothing is specified
-        `jace.optimization.DEFAULT_OPTIMIZATIONS` will be used.
-
-        Note:
-            Before `compiler_options` is forwarded to `jace_optimize()` it
-            will be merged with the default arguments.
+        """Optimize and compile the lowered SDFG and return a `JaCeCompiled` object.
+
+        This is the transition function of this stage. Before the SDFG is
+        compiled, it will be optimized using `jace_optimize()`. The options
+        used for this consists of two parts. First there is the (global) set of
+        currently active compiler options, which is then merged with the options
+        passed through `compiler_options`, which take precedence. Thus
+        `compiler_options` describes the delta from the current active set of options.
+
+        See also:
+            `get_active_compiler_options()` to inspect the set of currently active
+            options and `update_active_compiler_options()` to modify the set.
         """
         # We **must** deepcopy before we do any optimization, because all optimizations are in
         #  place, however, to properly cache stages, stages needs to be immutable.
@@ -295,7 +297,34 @@ def _make_compiler_options(
         self,
         compiler_options: CompilerOptions | None,
     ) -> CompilerOptions:
-        return optimization.DEFAULT_OPTIMIZATIONS | (compiler_options or {})
+        """Return the compilation options that should be used for compilation.
+
+        See `JaCeLowered.compile()` to see how to influence them.
+        """
+        return get_active_compiler_options() | (compiler_options or {})
+
+
+def update_active_compiler_options(
+    new_active_options: CompilerOptions,
+) -> CompilerOptions:
+    """Updates the set of active compiler options.
+
+    Merges the options passed as `new_active_options` with the currently active
+    compiler options. This set is used by `JaCeLowered.compile()` to determine
+    which options should be used for optimization.
+    The function will return the set of options that was active before the call.
+    """
+    previous_active_options = _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
+    _JACELOWERED_ACTIVE_COMPILE_OPTIONS.update(new_active_options)
+    return previous_active_options
+
+
+def get_active_compiler_options() -> CompilerOptions:
+    """Returns the set of currently active compiler options.
+
+    By default the set is initialized with `jace.optimization.DEFAULT_OPTIMIZATIONS`.
+    """
+    return _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
 
 
 class JaCeCompiled:
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index fb50c6b..306b244 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -215,6 +215,49 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     assert unoptiCompiled is jaceLowered.compile(optimization.NO_OPTIMIZATIONS)
 
 
+def test_caching_compilation_options() -> None:
+    """Tests if the global optimization managing works."""
+    original_compile_options = stages.get_active_compiler_options()
+    try:
+        lowering_cnt = [0]
+
+        @jace.jit
+        def wrapped(A: float) -> float:
+            lowering_cnt[0] += 1
+            return A + 1.0
+
+        lower_cache = wrapped._cache
+        lowered = wrapped.lower(1.0)
+        compile_cache = lowered._cache
+
+        assert len(lower_cache) == 1
+        assert len(compile_cache) == 0
+        assert lowering_cnt[0] == 1
+
+        # Using the first set of options.
+        stages.update_active_compiler_options(optimization.NO_OPTIMIZATIONS)
+        _ = wrapped(2.0)
+
+        # Except from one entry in the compile cache, nothing should have changed.
+        assert len(lower_cache) == 1
+        assert len(compile_cache) == 1
+        assert compile_cache.front()[0].stage_id == id(lowered)
+        assert lowering_cnt[0] == 1
+
+        # Now we change the options again which then will lead to another compilation,
+        #  but not to another lowering.
+        stages.update_active_compiler_options(optimization.DEFAULT_OPTIMIZATIONS)
+        _ = wrapped(2.0)
+
+        assert len(lower_cache) == 1
+        assert len(compile_cache) == 2
+        assert compile_cache.front()[0].stage_id == id(lowered)
+        assert lowering_cnt[0] == 1
+
+    finally:
+        stages.update_active_compiler_options(original_compile_options)
+
+
 def test_caching_dtype() -> None:
     """Tests if the data type is properly included in the test."""
 

From ed23d49d74dd24be8c3d20e9aa2eea25591b6cc8 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 14:34:11 +0200
Subject: [PATCH 326/458] Added a fixture that allows to select which options
 are used.

By default no optimizations are used.
However, inside the primitive tests, in the future most likely also in more places, it is overwritten such that also optimized and unoptimized options are used.
This doubles the number of tests.
---
 tests/conftest.py                             | 15 ++++++-
 .../primitive_translators/conftest.py         | 40 +++++++++++++++++++
 2 files changed, 54 insertions(+), 1 deletion(-)
 create mode 100644 tests/integration_tests/primitive_translators/conftest.py

diff --git a/tests/conftest.py b/tests/conftest.py
index 4bd941f..f5c9a23 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -9,7 +9,6 @@
 
 Todo:
     - Implement some fixture that allows to force validation.
-    - Implement fixture to disable and enable optimisation, i.e. doing it twice.
 """
 
 from __future__ import annotations
@@ -20,6 +19,7 @@
 import numpy as np
 import pytest
 
+from jace import optimization, stages
 from jace.util import translation_cache as tcache
 
 
@@ -90,3 +90,16 @@ def _reset_random_seed() -> None:
     This seed is used by the `util.mkarray()` helper.
     """
     np.random.seed(42)  # noqa: NPY002  # We use this seed for the time being.
+
+
+@pytest.fixture(autouse=True)
+def _set_compile_options() -> Generator[None, None, None]:
+    """Disable all optimizations of jitted code.
+
+    Without explicitly supplied arguments `JaCeLowered.compile()` will not
+    perform any optimizations.
+    Please not that certain tests might override this fixture.
+    """
+    initial_compile_options = stages.update_active_compiler_options(optimization.NO_OPTIMIZATIONS)
+    yield
+    stages.update_active_compiler_options(initial_compile_options)
diff --git a/tests/integration_tests/primitive_translators/conftest.py b/tests/integration_tests/primitive_translators/conftest.py
new file mode 100644
index 0000000..f51af06
--- /dev/null
+++ b/tests/integration_tests/primitive_translators/conftest.py
@@ -0,0 +1,40 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""General configuration for the tests of the primitive translators."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import pytest
+
+from jace import optimization, stages
+
+
+if TYPE_CHECKING:
+    from collections.abc import Generator
+
+
+@pytest.fixture(
+    autouse=True,
+    params=[
+        optimization.NO_OPTIMIZATIONS,
+        optimization.DEFAULT_OPTIMIZATIONS,
+    ],
+)
+def _set_compile_options(request) -> Generator[None, None, None]:
+    """Set the options used for testing the primitive translators.
+
+    This fixture override the global defined fixture.
+
+    Todo:
+        Implement a system that only runs the optimization case in CI.
+    """
+    initial_compile_options = stages.update_active_compiler_options(request.param)
+    yield
+    stages.update_active_compiler_options(initial_compile_options)

From 3518bdc5b90aeff7e3690e169f297a1774959400 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 14:51:52 +0200
Subject: [PATCH 327/458] Dynamic slicing can not run with disabled
 optimization.

The reason for this is quite interesting actually and there are several things that interact together to create the bug.
One part of the problem is, that we do not use scalars but only arrays and one part is probably a bug inside the code generator.
With enabled optimizations, start indexes of the dynamic slices are turned into symbols, which are implemented as (C) scalars.
However, if optimizations are disabled the start index is stored inside an array with length one.
In the Memlet, that we use to extract we essentially write something like `iteration_variable + start_index` which implies that `start_index` is a scalar, and if such an SDFG is compiled, then the code generator will generate `a[iteration_variable + start_index]`, but this is a compilation error, since `start_index` is a pointer and not a scalar.
The simple fix just to write `iteration_variable + start_index[0]` also does not work, as this seems to violate SDFG semantic because the code generator generates something like `a[iteration_variable + start_index(0)]` which is an error because `start_index` is obvious not a function.

Because there is no simple solution, this commit disables the tests for the slicing as a temporary solution.
The proper solution, which I will now implement, is to support scalars inside the translator.
In fact this will solve a lot of other problems.
---
 src/jace/translator/primitive_translators/slicing.py     | 6 ++++--
 .../primitive_translators/test_primitive_slicing.py      | 9 +++++++++
 2 files changed, 13 insertions(+), 2 deletions(-)

diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index 1b708d4..ee415f4 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -97,8 +97,10 @@ def __call__(
         assert in_var_names[0]
         assert len(in_var_names) == len(util.get_jax_var_shape(eqn.invars[0])) + 1
 
+        raise NotImplementedError("This translator needs true scalars to correctly work.")
+
         # This is the sizes of the slice window.
-        window_sizes: Sequence[int] = eqn.params["slice_sizes"]
+        window_sizes: Sequence[int] = eqn.params["slice_sizes"]  # type: ignore[unreachable]
 
         # The first input to the primitive is the array we slice from, the others are the start
         #  indices of the slice window, each is a scalar, maybe literals.
@@ -130,7 +132,7 @@ def __call__(
             # Intermediate value to storing the adjusted start index.
             new_start_idx_var_name = builder.add_array(
                 eqn.invars[dim + 1],
-                name_prefix=f"__jace_adapted_start_idx_{start_index}",
+                name_prefix="__jace_adapted_start_idx_",
             )
             new_start_idx_acc = eqn_state.add_access(new_start_idx_var_name)
 
diff --git a/tests/integration_tests/primitive_translators/test_primitive_slicing.py b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
index 2f6bf40..95778da 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_slicing.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
@@ -75,6 +75,9 @@ def testee(A: np.ndarray) -> jax.Array:
     assert np.all(ref == res)
 
 
+@pytest.mark.skip(
+    "In unoptimized mode there is an error, that is caused because we have an array insteadof a scalar."
+)
 def test_dynamic_slice_full_dynamic(
     A_4x4x4x4: np.ndarray,
     full_dynamic_start_idx: tuple[int, int, int, int],
@@ -88,6 +91,9 @@ def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> jax.Array:
     assert np.all(ref == res)
 
 
+@pytest.mark.skip(
+    "In unoptimized mode there is an error, that is caused because we have an array insteadof a scalar."
+)
 def test_dynamic_slice_partially_dynamic(
     A_4x4x4x4: np.ndarray,
 ) -> None:
@@ -100,6 +106,9 @@ def testee(A: np.ndarray, s1: int, s2: int) -> jax.Array:
     assert np.all(ref == res)
 
 
+@pytest.mark.skip(
+    "In unoptimized mode there is an error, that is caused because we have an array insteadof a scalar."
+)
 def test_dynamic_slice_full_literal(
     A_4x4x4x4: np.ndarray,
 ) -> None:

From 7d6cc9ccf97188ae94d5ba323a6c2fe17393b0ef Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 15:01:19 +0200
Subject: [PATCH 328/458] For the time being disabled the optimized tests in
 the primitive translators tests.

They should be conditionally enabled.
---
 tests/integration_tests/primitive_translators/conftest.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/tests/integration_tests/primitive_translators/conftest.py b/tests/integration_tests/primitive_translators/conftest.py
index f51af06..73b2699 100644
--- a/tests/integration_tests/primitive_translators/conftest.py
+++ b/tests/integration_tests/primitive_translators/conftest.py
@@ -24,7 +24,8 @@
     autouse=True,
     params=[
         optimization.NO_OPTIMIZATIONS,
-        optimization.DEFAULT_OPTIMIZATIONS,
+        # TODO(phimuell): find a way to conditionally enable.
+        # optimization.DEFAULT_OPTIMIZATIONS,
     ],
 )
 def _set_compile_options(request) -> Generator[None, None, None]:

From 630fcce7b69f14beabac460b849be6a8950bbe7d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 15:13:34 +0200
Subject: [PATCH 329/458] First stepe, in fixing the array/scalar stuff.

Now the builder will generate again scalars inbstead of arrays.
It is important to note, that this will essentially break everything, because essentially everything assumes that there are no sclars.
---
 .../translator/jaxpr_translator_builder.py    | 44 +++++++++----------
 1 file changed, 21 insertions(+), 23 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index d00f110..ab7f582 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -34,7 +34,9 @@ class JaxprTranslationBuilder:
     - all variable names are derived from Jax names,
     - there are only transient variables inside the SDFG,
     - It lacks the special `__return` variable,
-    - the `arg_names` parameter is not set.
+    - the `arg_names` parameter is not set,
+    - scalar variables that are used as return value are SDFG scalars, thus they
+        can not directly be used to return something.
 
     For these reasons the SDFG is not directly usable, and further manipulations
     have to be performed. Especially, DaCe's validation function will fail and
@@ -66,8 +68,7 @@ class JaxprTranslationBuilder:
 
     Notes:
         After a translation has been performed the translator object can be used
-        again. Currently the builder will generate only Array as SDFG variables,
-        however, this is a temporary solution, see `add_array()`.
+        again.
     """
 
     _primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable]
@@ -322,14 +323,6 @@ def add_array(
             arg: The Jax object for which a SDFG equivalent should be created.
             name_prefix: If given it will be used as prefix for the name.
             update_var_mapping: Update the internal variable mapping; by default `False`.
-
-        Notes:
-            As a temporary fix for handling scalar return values, the function
-            will always generate arrays, even if `arg` is a scalar. According to
-            the DaCe developer, the majority of the backend, i.e. optimization
-            pipeline, should be able to handle it. But there are some special
-            parts that might explicitly want a scalar, it also might block
-            certain compiler optimization.
         """
 
         if isinstance(arg, jax_core.Literal):
@@ -342,9 +335,6 @@ def add_array(
         as_transient = True
         strides = None
 
-        # Temporary fix for handling DaCe scalars, see above for more.
-        shape = shape or (1,)
-
         # Propose a name and if needed extend it.
         arg_name = util.propose_jax_name(arg, self._jax_name_map)
         if name_prefix:
@@ -358,15 +348,23 @@ def add_array(
         if arg_name in util.FORBIDDEN_SDFG_VAR_NAMES:
             raise ValueError(f"add_array({arg}): The proposed name '{arg_name}', is forbidden.")
 
-        self._ctx.sdfg.add_array(
-            name=arg_name,
-            shape=shape,
-            strides=strides,
-            offset=offset,
-            storage=storage,
-            dtype=dtype,
-            transient=as_transient,
-        )
+        if shape == ():
+            self._ctx.sdfg.add_scalar(
+                name=arg_name,
+                storage=storage,
+                dtype=dtype,
+                transient=as_transient,
+            )
+        else:
+            self._ctx.sdfg.add_array(
+                name=arg_name,
+                shape=shape,
+                strides=strides,
+                offset=offset,
+                storage=storage,
+                dtype=dtype,
+                transient=as_transient,
+            )
 
         if update_var_mapping:
             try:

From e46637d033648e1ba8d366feb05604f439e0979e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 15:15:17 +0200
Subject: [PATCH 330/458] The Jaxpr is not also included in the translation
 context, do I need that?

---
 .../translator/jaxpr_translator_builder.py    | 21 ++++++++++++-------
 1 file changed, 14 insertions(+), 7 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index ab7f582..1312321 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -125,6 +125,7 @@ def translate_jaxpr(
         #       SDFG/Jaxpr, this must be done manually.
         self._allocate_translation_ctx(
             name=name,
+            jaxpr=jaxpr,
         )
         self._create_constants(
             jaxpr=jaxpr,
@@ -504,7 +505,8 @@ def _create_constants(
 
     def _allocate_translation_ctx(
         self,
-        name: str | None = None,
+        name: str | None,
+        jaxpr: jax_core.ClosedJaxpr,
     ) -> JaxprTranslationBuilder:
         """Allocate a new context and activate it.
 
@@ -514,6 +516,7 @@ def _allocate_translation_ctx(
         self._ctx_stack.append(
             TranslationContext(
                 name=name,
+                jaxpr=jaxpr,
             )
         )
         return self
@@ -732,11 +735,12 @@ class TranslationContext:
     the `postprocess_jaxpr_sdfg()` function.
 
     Attributes:
-        sdfg:              The encapsulated SDFG object.
-        inp_names:         A list of the SDFG variables that are used as input
-        out_names:         A list of the SDFG variables that are used as output.
-        start_state:       The first state in the SDFG state machine.
-        terminal_state:    The (currently) last state in the state machine.
+        sdfg: The encapsulated SDFG object.
+        inp_names: A list of the SDFG variables that are used as input
+        out_names: A list of the SDFG variables that are used as output.
+        start_state: The first state in the SDFG state machine.
+        terminal_state: The (currently) last state in the state machine.
+        jaxpr: The Jaxpr that was used to translate.
 
     Args:
         name: The name of the SDFG, will be forwarded to the encapsulated `TranslatedJaxprSDFG`.
@@ -750,10 +754,12 @@ class TranslationContext:
     out_names: tuple[str, ...] | None
     start_state: dace.SDFGState
     terminal_state: dace.SDFGState
+    jaxpr: jax_core.ClosedJaxpr
 
     def __init__(
         self,
-        name: str | None = None,
+        name: str | None,
+        jaxpr: jax_core.ClosedJaxpr,
     ) -> None:
         if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
@@ -763,6 +769,7 @@ def __init__(
         self.out_names = None
         self.start_state = self.sdfg.add_state(label="initial_state", is_start_block=True)
         self.terminal_state = self.start_state
+        self.jaxpr = jaxpr
 
     def validate(self) -> bool:
         """Validate internal state of `self`.

From c7f6cc9465102b4baa04b64cc1a7c4ae5721e879 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 15:51:40 +0200
Subject: [PATCH 331/458] Fixed some missed up formating.

---
 src/jace/translator/jaxpr_translator_builder.py | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 437787e..3053dd9 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -734,11 +734,11 @@ class TranslationContext:
     the `postprocess_jaxpr_sdfg()` function.
 
     Attributes:
-        sdfg:              The encapsulated SDFG object.
-        inp_names:         A list of the SDFG variables that are used as input
-        out_names:         A list of the SDFG variables that are used as output.
-        start_state:       The first state in the SDFG state machine.
-        terminal_state:    The (currently) last state in the state machine.
+        sdfg: The encapsulated SDFG object.
+        inp_names: A list of the SDFG variables that are used as input
+        out_names: A list of the SDFG variables that are used as output.
+        start_state: The first state in the SDFG state machine.
+        terminal_state: The (currently) last state in the state machine.
 
     Args:
         name: The name of the SDFG, will be forwarded to the encapsulated `TranslatedJaxprSDFG`.

From 73f011693f08c1622d9a3120b4cff015963271ed Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 15:58:37 +0200
Subject: [PATCH 332/458] I have now disabled the magic comma in ruff.

I do not like it, but it is fully in line with what the black manpage tells:
	By using it, you agree to cede control over minutiae of hand-formatting.
	In return, Black gives you speed, determinism, and freedom from pycodestyle nagging about formatting.
	You will save time and mental energy for more important matters.
---
 docs/conf.py                                  | 22 +----
 noxfile.py                                    |  8 +-
 pyproject.toml                                |  1 +
 src/jace/api.py                               |  7 +-
 src/jace/optimization.py                      |  5 +-
 src/jace/stages.py                            | 68 +++------------
 .../translator/jaxpr_translator_builder.py    | 86 ++++---------------
 .../mapped_operation_base_translator.py       | 13 +--
 src/jace/translator/pre_post_translation.py   |  3 +-
 src/jace/translator/primitive_translator.py   | 15 ++--
 .../arithmetic_logical_translators.py         | 13 +--
 .../select_n_translator.py                    |  8 +-
 .../primitive_translators/slicing.py          |  6 +-
 src/jace/util/__init__.py                     |  6 +-
 src/jace/util/dace_helper.py                  | 10 +--
 src/jace/util/jax_helper.py                   | 26 ++----
 src/jace/util/traits.py                       | 28 ++----
 src/jace/util/translation_cache.py            | 59 +++----------
 .../primitive_translators/conftest.py         |  2 +-
 ...primitive_arithmetic_logical_operations.py | 38 ++------
 .../test_primitive_broadcast_in_dim.py        |  8 +-
 .../test_primitive_convert_element_type.py    | 26 ++----
 .../test_primitive_reshape.py                 | 40 ++-------
 .../test_primitive_select_n.py                |  5 +-
 .../test_primitive_slicing.py                 | 23 ++---
 .../test_primitive_squeeze_expand_dims.py     | 30 ++-----
 .../test_jaxpr_translator_builder.py          | 45 +++-------
 .../test_primitive_translator_managing.py     |  5 +-
 tests/unit_tests/test_caching.py              |  9 +-
 tests/unit_tests/test_jax_api.py              |  2 +-
 tests/util.py                                 |  9 +-
 31 files changed, 138 insertions(+), 488 deletions(-)

diff --git a/docs/conf.py b/docs/conf.py
index cb0bb09..e902d98 100644
--- a/docs/conf.py
+++ b/docs/conf.py
@@ -26,28 +26,14 @@
 ]
 
 source_suffix = [".rst", ".md"]
-exclude_patterns = [
-    "_build",
-    "**.ipynb_checkpoints",
-    "Thumbs.db",
-    ".DS_Store",
-    ".env",
-    ".venv",
-]
+exclude_patterns = ["_build", "**.ipynb_checkpoints", "Thumbs.db", ".DS_Store", ".env", ".venv"]
 
 html_theme = "furo"
 
-myst_enable_extensions = [
-    "colon_fence",
-]
+myst_enable_extensions = ["colon_fence"]
 
-intersphinx_mapping = {
-    "python": ("https://docs.python.org/3", None),
-}
+intersphinx_mapping = {"python": ("https://docs.python.org/3", None)}
 
-nitpick_ignore = [
-    ("py:class", "_io.StringIO"),
-    ("py:class", "_io.BytesIO"),
-]
+nitpick_ignore = [("py:class", "_io.StringIO"), ("py:class", "_io.BytesIO")]
 
 always_document_param_types = True
diff --git a/noxfile.py b/noxfile.py
index 3772f2d..2154c16 100644
--- a/noxfile.py
+++ b/noxfile.py
@@ -79,13 +79,7 @@ def build_api_docs(session: nox.Session) -> None:
     session.install("sphinx")
     session.chdir("docs")
     session.run(
-        "sphinx-apidoc",
-        "-o",
-        "api/",
-        "--module-first",
-        "--no-toc",
-        "--force",
-        "../src/jace",
+        "sphinx-apidoc", "-o", "api/", "--module-first", "--no-toc", "--force", "../src/jace"
     )
 
 
diff --git a/pyproject.toml b/pyproject.toml
index d7e3b1d..62987e1 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -126,6 +126,7 @@ src = ["src"]
 
 [tool.ruff.format]
 docstring-code-format = true
+skip-magic-trailing-comma = true
 
 [tool.ruff.lint]
 extend-select = [
diff --git a/src/jace/api.py b/src/jace/api.py
index 9f128b3..46e15b2 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -21,12 +21,7 @@
     from collections.abc import Callable, Mapping
 
 
-__all__ = [
-    "grad",
-    "jacfwd",
-    "jacrev",
-    "jit",
-]
+__all__ = ["grad", "jacfwd", "jacrev", "jit"]
 
 
 @overload
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index 94a8f36..612929b 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -47,10 +47,7 @@ class CompilerOptions(TypedDict, total=False):
 }
 
 
-def jace_optimize(
-    tsdfg: translator.TranslatedJaxprSDFG,
-    **kwargs: Unpack[CompilerOptions],
-) -> None:
+def jace_optimize(tsdfg: translator.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOptions]) -> None:
     """Performs optimization of the translated SDFG _in place_.
 
     It is recommended to use the `CompilerOptions` `TypedDict` to pass options
diff --git a/src/jace/stages.py b/src/jace/stages.py
index b64e5d6..66d1e51 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -107,11 +107,7 @@ def __init__(
         self._jit_options = {**jit_options}
         self._fun = fun
 
-    def __call__(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> Any:
+    def __call__(self, *args: Any, **kwargs: Any) -> Any:
         """Executes the wrapped function, lowering and compiling as needed in one step.
 
         The arguments passed to this function are the same as the wrapped function uses.
@@ -126,11 +122,7 @@ def __call__(
         return compiled(*args, **kwargs)
 
     @tcache.cached_transition
-    def lower(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> JaCeLowered:
+    def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
         """Lower this function explicitly for the given arguments.
 
         Performs the first two steps of the AOT steps described above, i.e.
@@ -180,10 +172,7 @@ def wrapped_fun(self) -> Callable:
         """Returns the wrapped function."""
         return self._fun
 
-    def _make_call_description(
-        self,
-        *args: Any,
-    ) -> tcache.StageTransformationSpec:
+    def _make_call_description(self, *args: Any) -> tcache.StageTransformationSpec:
         """This function computes the key for the `JaCeWrapped.lower()` call inside the cache.
 
         The function will compute a full abstract description on its argument.
@@ -214,18 +203,12 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
 
     _translated_sdfg: translator.TranslatedJaxprSDFG
 
-    def __init__(
-        self,
-        tsdfg: translator.TranslatedJaxprSDFG,
-    ) -> None:
+    def __init__(self, tsdfg: translator.TranslatedJaxprSDFG) -> None:
         super().__init__()
         self._translated_sdfg = tsdfg
 
     @tcache.cached_transition
-    def compile(
-        self,
-        compiler_options: CompilerOptions | None = None,
-    ) -> JaCeCompiled:
+    def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled:
         """Optimize and compile the lowered SDFG and return a `JaCeCompiled` object.
 
         This is the transition function of this stage. Before the SDFG is
@@ -250,10 +233,7 @@ def compile(
             out_names=tsdfg.out_names,
         )
 
-    def compiler_ir(
-        self,
-        dialect: str | None = None,
-    ) -> translator.TranslatedJaxprSDFG:
+    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
         """Returns the internal SDFG.
 
         The function returns a `TranslatedJaxprSDFG` object. Direct modification
@@ -263,10 +243,7 @@ def compiler_ir(
             return self._translated_sdfg
         raise ValueError(f"Unknown dialect '{dialect}'.")
 
-    def view(
-        self,
-        filename: str | None = None,
-    ) -> None:
+    def view(self, filename: str | None = None) -> None:
         """Runs the `view()` method of the underlying SDFG.
 
         This will open a browser and display the SDFG.
@@ -281,8 +258,7 @@ def as_sdfg(self) -> dace.SDFG:
         return self.compiler_ir().sdfg
 
     def _make_call_description(
-        self,
-        compiler_options: CompilerOptions | None = None,
+        self, compiler_options: CompilerOptions | None = None
     ) -> tcache.StageTransformationSpec:
         """This function computes the key for the `self.compile()` call inside the cache.
 
@@ -293,10 +269,7 @@ def _make_call_description(
         call_args = tuple(sorted(options.items(), key=lambda x: x[0]))
         return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
 
-    def _make_compiler_options(
-        self,
-        compiler_options: CompilerOptions | None,
-    ) -> CompilerOptions:
+    def _make_compiler_options(self, compiler_options: CompilerOptions | None) -> CompilerOptions:
         """Return the compilation options that should be used for compilation.
 
         See `JaCeLowered.compile()` to see how to influence them.
@@ -304,9 +277,7 @@ def _make_compiler_options(
         return get_active_compiler_options() | (compiler_options or {})
 
 
-def update_active_compiler_options(
-    new_active_options: CompilerOptions,
-) -> CompilerOptions:
+def update_active_compiler_options(new_active_options: CompilerOptions) -> CompilerOptions:
     """Updates the set of active compiler options.
 
     Merges the options passed as `new_active_options` with the currently active
@@ -350,10 +321,7 @@ class JaCeCompiled:
     _out_names: tuple[str, ...]
 
     def __init__(
-        self,
-        csdfg: dace_helper.CompiledSDFG,
-        inp_names: Sequence[str],
-        out_names: Sequence[str],
+        self, csdfg: dace_helper.CompiledSDFG, inp_names: Sequence[str], out_names: Sequence[str]
     ) -> None:
         # NOTE: We only check that we have output, we do not care about the input, since the
         #  function `def foo(): return 1.0` is still a pure function, but we require that we have
@@ -364,23 +332,13 @@ def __init__(
         self._inp_names = tuple(inp_names)
         self._out_names = tuple(out_names)
 
-    def __call__(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> Any:
+    def __call__(self, *args: Any, **kwargs: Any) -> Any:
         """Calls the embedded computation.
 
         The arguments must be the same as for the wrapped function, but with
         all static arguments removed.
         """
-        return dace_helper.run_jax_sdfg(
-            self._csdfg,
-            self._inp_names,
-            self._out_names,
-            args,
-            kwargs,
-        )
+        return dace_helper.run_jax_sdfg(self._csdfg, self._inp_names, self._out_names, args, kwargs)
 
 
 #: Known compilation stages in JaCe.
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index d00f110..69091b8 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -75,8 +75,7 @@ class JaxprTranslationBuilder:
     _ctx_stack: list[TranslationContext]
 
     def __init__(
-        self,
-        primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable],
+        self, primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable]
     ) -> None:
         # Maps name of primitives to the associated translator.
         self._primitive_translators = {**primitive_translators}
@@ -92,10 +91,7 @@ def __init__(
         self._ctx_stack = []
 
     def translate_jaxpr(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-        *,
-        name: str | None = None,
+        self, jaxpr: jax_core.ClosedJaxpr, *, name: str | None = None
     ) -> TranslationContext:
         """Perform the translation of a Jaxpr into a SDFG.
 
@@ -122,12 +118,8 @@ def translate_jaxpr(
         #       Thus the builder will start to translate a second (nested) SDFG.
         #       Also note that there is no mechanism that forces the integration of the nested
         #       SDFG/Jaxpr, this must be done manually.
-        self._allocate_translation_ctx(
-            name=name,
-        )
-        self._create_constants(
-            jaxpr=jaxpr,
-        )
+        self._allocate_translation_ctx(name=name)
+        self._create_constants(jaxpr=jaxpr)
         self._create_initial_input(jaxpr=jaxpr)
 
         return self._translate_jaxpr_internal(jaxpr)
@@ -190,10 +182,7 @@ def arrays(self) -> Mapping[str, ddata.Data]:
         """
         return cast(Mapping[str, ddata.Data], self._ctx.sdfg.arrays)
 
-    def get_array(
-        self,
-        name: str | jax_core.Atom | util.JaCeVar,
-    ) -> ddata.Data:
+    def get_array(self, name: str | jax_core.Atom | util.JaCeVar) -> ddata.Data:
         """Returns the SDFG `Data` object `name` referees to.
 
         `name` can either be a string, in which case it is interpreted as a
@@ -212,22 +201,16 @@ def get_array(
 
     @overload
     def map_jax_var_to_sdfg(
-        self,
-        jax_var: jax_core.Atom | util.JaCeVar,
-        allow_fail: Literal[False] = False,
+        self, jax_var: jax_core.Atom | util.JaCeVar, allow_fail: Literal[False] = False
     ) -> str: ...
 
     @overload
     def map_jax_var_to_sdfg(
-        self,
-        jax_var: jax_core.Atom | util.JaCeVar,
-        allow_fail: Literal[True],
+        self, jax_var: jax_core.Atom | util.JaCeVar, allow_fail: Literal[True]
     ) -> str | None: ...
 
     def map_jax_var_to_sdfg(
-        self,
-        jax_var: jax_core.Atom | util.JaCeVar,
-        allow_fail: bool = False,
+        self, jax_var: jax_core.Atom | util.JaCeVar, allow_fail: bool = False
     ) -> str | None:
         """Get the name of the SDFG variable to which `jax_var` is referring to.
 
@@ -272,9 +255,7 @@ def is_root_translator(self) -> bool:
         return len(self._ctx_stack) == 1
 
     def add_jax_name_mapping(
-        self,
-        jax_var: jax_core.Var | util.JaCeVar,
-        sdfg_name: str,
+        self, jax_var: jax_core.Var | util.JaCeVar, sdfg_name: str
     ) -> JaxprTranslationBuilder:
         """Creates a new mapping between `jax_var` to `sdfg_name`.
 
@@ -454,10 +435,7 @@ def create_jax_var_list(  # type: ignore[misc]
 
         return ret_list
 
-    def _create_initial_input(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-    ) -> None:
+    def _create_initial_input(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         """Creates the input variables of `jaxpr`.
 
         Notes:
@@ -479,10 +457,7 @@ def _create_initial_input(
         # The output list is populated by `self._translate_jaxpr_internal()`
         self._ctx.inp_names = tuple(init_in_var_names)
 
-    def _create_constants(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-    ) -> None:
+    def _create_constants(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         """Creates all constants requested by the `jaxpr`.
 
         The function will create an SDFG variable and add them as constant to
@@ -504,20 +479,13 @@ def _create_constants(
                 sdfg_name, copy.deepcopy(const_value), self._ctx.sdfg.arrays[sdfg_name]
             )
 
-    def _allocate_translation_ctx(
-        self,
-        name: str | None = None,
-    ) -> JaxprTranslationBuilder:
+    def _allocate_translation_ctx(self, name: str | None = None) -> JaxprTranslationBuilder:
         """Allocate a new context and activate it.
 
         Args:
             name: The name of the SDFG.
         """
-        self._ctx_stack.append(
-            TranslationContext(
-                name=name,
-            )
-        )
+        self._ctx_stack.append(TranslationContext(name=name))
         return self
 
     @property
@@ -542,10 +510,7 @@ def _clear_translation_ctx(self) -> TranslationContext | None:
         # Remove the current head stack.
         return self._ctx_stack.pop()
 
-    def _translate_single_eqn(
-        self,
-        eqn: jax_core.JaxprEqn,
-    ) -> None:
+    def _translate_single_eqn(self, eqn: jax_core.JaxprEqn) -> None:
         """Translate `eqn` into its SDFG equivalent.
 
         To do this the function will perform the following steps:
@@ -601,10 +566,7 @@ def _translate_single_eqn(
         # Modify terminal root state of 'self'
         self._ctx.terminal_state = new_sdfg_term_state
 
-    def _translate_jaxpr_internal(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-    ) -> TranslationContext:
+    def _translate_jaxpr_internal(self, jaxpr: jax_core.ClosedJaxpr) -> TranslationContext:
         """Performs the actual translation of the Jaxpr into an SDFG.
 
         The function assumes that the context is allocated as well as the
@@ -633,19 +595,14 @@ def _translate_jaxpr_internal(
             out_var_names = self._handle_null_jaxpr(jaxpr)
         else:
             out_var_names = self.create_jax_var_list(
-                jaxpr.jaxpr.outvars,
-                prevent_creation=True,
-                handle_literals=False,
+                jaxpr.jaxpr.outvars, prevent_creation=True, handle_literals=False
             )
 
         self._ctx.out_names = tuple(out_var_names)
 
         return cast(TranslationContext, self._clear_translation_ctx())
 
-    def _handle_null_jaxpr(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-    ) -> list[str]:
+    def _handle_null_jaxpr(self, jaxpr: jax_core.ClosedJaxpr) -> list[str]:
         """This function is called in case a `Jaxpr` with zero equations is encountered.
 
         A function with zero equation might still have output, in which case
@@ -688,9 +645,7 @@ def _handle_null_jaxpr(
             # Now we create a variable that serves as true output, however, since the Jax variable
             #  is already known we can not update the variable mapping and must use another name.
             sdfg_out_name = self.add_array(
-                jax_out_var,
-                name_prefix="_zero_equation_output_for_",
-                update_var_mapping=False,
+                jax_out_var, name_prefix="_zero_equation_output_for_", update_var_mapping=False
             )
             out_var_names.append(sdfg_out_name)
 
@@ -753,10 +708,7 @@ class TranslationContext:
     start_state: dace.SDFGState
     terminal_state: dace.SDFGState
 
-    def __init__(
-        self,
-        name: str | None = None,
-    ) -> None:
+    def __init__(self, name: str | None = None) -> None:
         if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
diff --git a/src/jace/translator/mapped_operation_base_translator.py b/src/jace/translator/mapped_operation_base_translator.py
index 2b70f30..4cb915c 100644
--- a/src/jace/translator/mapped_operation_base_translator.py
+++ b/src/jace/translator/mapped_operation_base_translator.py
@@ -56,10 +56,7 @@ class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
         This class will always generate a mapped Tasklet, even if a scalar is handled.
     """
 
-    def __init__(
-        self,
-        primitive_name: str,
-    ) -> None:
+    def __init__(self, primitive_name: str) -> None:
         self._prim_name = primitive_name
 
     @property
@@ -96,8 +93,7 @@ def __call__(
             ]
             tskl_output: dict[str, dace.Memlet] = {
                 "__out": dace.Memlet.simple(
-                    out_var_names[0],
-                    ", ".join(name for name, _ in tskl_ranges),
+                    out_var_names[0], ", ".join(name for name, _ in tskl_ranges)
                 )
             }
 
@@ -193,10 +189,7 @@ def make_input_memlets(
         return tskl_inputs
 
     def literal_substitution(
-        self,
-        tskl_code: str,
-        in_var_names: Sequence[str | None],
-        eqn: jax_core.JaxprEqn,
+        self, tskl_code: str, in_var_names: Sequence[str | None], eqn: jax_core.JaxprEqn
     ) -> str:
         """Perform literal substitution on the proto Tasklet code `tskl_code`.
 
diff --git a/src/jace/translator/pre_post_translation.py b/src/jace/translator/pre_post_translation.py
index 37be078..1e3f69f 100644
--- a/src/jace/translator/pre_post_translation.py
+++ b/src/jace/translator/pre_post_translation.py
@@ -56,8 +56,7 @@ def postprocess_jaxpr_sdfg(
 
 
 def finalize_translation_context(
-    trans_ctx: translator.TranslationContext,
-    validate: bool = True,
+    trans_ctx: translator.TranslationContext, validate: bool = True
 ) -> translator.TranslatedJaxprSDFG:
     """Finalizes the supplied translation context `trans_ctx`.
 
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index aaf164f..b452fee 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -117,8 +117,7 @@ def primitive(self) -> str:
 
 @overload
 def make_primitive_translator(
-    primitive: str,
-    primitive_translator: Literal[None] = None,
+    primitive: str, primitive_translator: Literal[None] = None
 ) -> Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]: ...
 
 
@@ -129,8 +128,7 @@ def make_primitive_translator(
 
 
 def make_primitive_translator(
-    primitive: str,
-    primitive_translator: translator.PrimitiveTranslatorCallable | None = None,
+    primitive: str, primitive_translator: translator.PrimitiveTranslatorCallable | None = None
 ) -> (
     Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]
     | translator.PrimitiveTranslator
@@ -161,21 +159,18 @@ def wrapper(
 
 @overload
 def register_primitive_translator(
-    primitive_translator: Literal[None] = None,
-    overwrite: bool = False,
+    primitive_translator: Literal[None] = None, overwrite: bool = False
 ) -> Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]: ...
 
 
 @overload
 def register_primitive_translator(
-    primitive_translator: translator.PrimitiveTranslator,
-    overwrite: bool = False,
+    primitive_translator: translator.PrimitiveTranslator, overwrite: bool = False
 ) -> translator.PrimitiveTranslator: ...
 
 
 def register_primitive_translator(
-    primitive_translator: translator.PrimitiveTranslator | None = None,
-    overwrite: bool = False,
+    primitive_translator: translator.PrimitiveTranslator | None = None, overwrite: bool = False
 ) -> (
     translator.PrimitiveTranslator
     | Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]
diff --git a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
index a344c4a..dfafa7b 100644
--- a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
+++ b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
@@ -45,11 +45,7 @@ class ArithmeticOperationTranslator(mapped_base.MappedOperationTranslatorBase):
             nested `pjit` implementation by Jax for unknown reasons.
     """
 
-    def __init__(
-        self,
-        prim_name: str,
-        tskl_tmpl: str,
-    ) -> None:
+    def __init__(self, prim_name: str, tskl_tmpl: str) -> None:
         super().__init__(primitive_name=prim_name)
         self._tskl_tmpl = tskl_tmpl
 
@@ -98,12 +94,7 @@ class LogicalOperationTranslator(mapped_base.MappedOperationTranslatorBase):
         `ArithmeticOperationTranslator` does.
     """
 
-    def __init__(
-        self,
-        prim_name: str,
-        int_tmpl: str,
-        bool_tmpl: str,
-    ) -> None:
+    def __init__(self, prim_name: str, int_tmpl: str, bool_tmpl: str) -> None:
         super().__init__(primitive_name=prim_name)
         self._int_tmpl = int_tmpl
         self._bool_tmpl = bool_tmpl
diff --git a/src/jace/translator/primitive_translators/select_n_translator.py b/src/jace/translator/primitive_translators/select_n_translator.py
index ee5eb5c..240375a 100644
--- a/src/jace/translator/primitive_translators/select_n_translator.py
+++ b/src/jace/translator/primitive_translators/select_n_translator.py
@@ -71,18 +71,14 @@ def make_input_memlets(
         """We have to add the offsets to the Memlet accesses."""
         return {
             f"__in{i-1}" if i else "__cond": dace.Memlet.simple(
-                in_var_name,
-                ", ".join(f"{it_idx}" for it_idx, _ in tskl_ranges),
+                in_var_name, ", ".join(f"{it_idx}" for it_idx, _ in tskl_ranges)
             )
             for i, in_var_name in enumerate(in_var_names)
             if in_var_name
         }
 
     def literal_substitution(
-        self,
-        tskl_code: str,
-        in_var_names: Sequence[str | None],
-        eqn: jax_core.JaxprEqn,
+        self, tskl_code: str, in_var_names: Sequence[str | None], eqn: jax_core.JaxprEqn
     ) -> str:
         """Can not be done by the base because of the renaming."""
         for i, in_var_name in enumerate(in_var_names[1:]):
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index ee415f4..5a04b3c 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -131,8 +131,7 @@ def __call__(
 
             # Intermediate value to storing the adjusted start index.
             new_start_idx_var_name = builder.add_array(
-                eqn.invars[dim + 1],
-                name_prefix="__jace_adapted_start_idx_",
+                eqn.invars[dim + 1], name_prefix="__jace_adapted_start_idx_"
             )
             new_start_idx_acc = eqn_state.add_access(new_start_idx_var_name)
 
@@ -179,8 +178,7 @@ def __call__(
 
         tskl_input = dace.Memlet.simple(in_var_name, ", ".join(memlet_accesses))
         tskl_output = dace.Memlet.simple(
-            out_var_names[0],
-            ", ".join(name for name, _ in tskl_ranges),
+            out_var_names[0], ", ".join(name for name, _ in tskl_ranges)
         )
 
         _, map_entry, _ = eqn_state.add_mapped_tasklet(
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index c2f2031..bfff733 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -19,11 +19,7 @@
     propose_jax_name,
     translate_dtype,
 )
-from .misc import (
-    FORBIDDEN_SDFG_VAR_NAMES,
-    VALID_SDFG_OBJ_NAME,
-    VALID_SDFG_VAR_NAME,
-)
+from .misc import FORBIDDEN_SDFG_VAR_NAMES, VALID_SDFG_OBJ_NAME, VALID_SDFG_VAR_NAME
 from .traits import (
     is_array,
     is_c_contiguous,
diff --git a/src/jace/util/dace_helper.py b/src/jace/util/dace_helper.py
index d3929e5..cbbb417 100644
--- a/src/jace/util/dace_helper.py
+++ b/src/jace/util/dace_helper.py
@@ -31,16 +31,10 @@
     from jace import translator
     from jace.util import dace_helper
 
-__all__ = [
-    "CompiledSDFG",
-    "compile_jax_sdfg",
-    "run_jax_sdfg",
-]
+__all__ = ["CompiledSDFG", "compile_jax_sdfg", "run_jax_sdfg"]
 
 
-def compile_jax_sdfg(
-    tsdfg: translator.TranslatedJaxprSDFG,
-) -> dace_helper.CompiledSDFG:
+def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> dace_helper.CompiledSDFG:
     """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object."""
     if any(  # We do not support the DaCe return mechanism
         array_name.startswith("__return")
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index cbc25d7..b2e0d75 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -74,10 +74,7 @@ def __post_init__(self) -> None:
     def __hash__(self) -> int:
         return id(self)
 
-    def __eq__(
-        self,
-        other: Any,
-    ) -> bool:
+    def __eq__(self, other: Any) -> bool:
         if not isinstance(other, JaCeVar):
             return NotImplemented
         return id(self) == id(other)
@@ -103,9 +100,7 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
             )
 
 
-def get_jax_var_shape(
-    jax_var: jax_core.Atom | JaCeVar,
-) -> tuple[int | dace.symbol | str, ...]:
+def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symbol | str, ...]:
     """Returns the shape of `jax_var`."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
@@ -118,9 +113,7 @@ def get_jax_var_shape(
             raise TypeError(f"'get_jax_var_shape()` is not implemented for '{type(jax_var)}'.")
 
 
-def get_jax_var_dtype(
-    jax_var: jax_core.Atom | JaCeVar,
-) -> dace.typeclass:
+def get_jax_var_dtype(jax_var: jax_core.Atom | JaCeVar) -> dace.typeclass:
     """Returns the DaCe equivalent of `jax_var`s datatype."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
@@ -133,10 +126,7 @@ def get_jax_var_dtype(
             raise TypeError(f"'get_jax_var_dtype()` is not implemented for '{type(jax_var)}'.")
 
 
-def is_tracing_ongoing(
-    *args: Any,
-    **kwargs: Any,
-) -> bool:
+def is_tracing_ongoing(*args: Any, **kwargs: Any) -> bool:
     """Test if tracing is ongoing.
 
     While a return value `True` guarantees that a translation is ongoing, a
@@ -157,9 +147,7 @@ def is_tracing_ongoing(
     raise RuntimeError("Failed to determine if tracing is ongoing.")
 
 
-def translate_dtype(
-    dtype: Any,
-) -> dace.typeclass:
+def translate_dtype(dtype: Any) -> dace.typeclass:
     """Turns a Jax datatype into a DaCe datatype."""
     if dtype is None:
         raise NotImplementedError  # Handling a special case in DaCe.
@@ -220,9 +208,7 @@ def propose_jax_name(
     return jax_name
 
 
-def get_jax_literal_value(
-    lit: jax_core.Atom,
-) -> bool | float | int | np.generic:
+def get_jax_literal_value(lit: jax_core.Atom) -> bool | float | int | np.generic:
     """Returns the value a literal is wrapping.
 
     The function guarantees to return a scalar value.
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 984f794..18c975f 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -19,9 +19,7 @@
 import jace.util as util
 
 
-def is_drop_var(
-    jax_var: jax_core.Atom | util.JaCeVar,
-) -> TypeGuard[jax_core.DropVar]:
+def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVar]:
     """Tests if `jax_var` is a drop variable, i.e. a variable that is not read from in a Jaxpr."""
 
     if isinstance(jax_var, jax_core.DropVar):
@@ -31,9 +29,7 @@ def is_drop_var(
     return False
 
 
-def is_jax_array(
-    obj: Any,
-) -> TypeGuard[jax.Array]:
+def is_jax_array(obj: Any) -> TypeGuard[jax.Array]:
     """Tests if `obj` is a Jax array.
 
     Note:
@@ -43,16 +39,12 @@ def is_jax_array(
     return isinstance(obj, jax.Array)
 
 
-def is_array(
-    obj: Any,
-) -> bool:
+def is_array(obj: Any) -> bool:
     """Identifies arrays, this also includes Jax arrays."""
     return dace.is_array(obj) or is_jax_array(obj)
 
 
-def is_scalar(
-    obj: Any,
-) -> bool:
+def is_scalar(obj: Any) -> bool:
     """Tests if `obj` is a scalar."""
     # These are the type known to DaCe; Taken from `dace.dtypes`.
     known_types = {
@@ -82,9 +74,7 @@ def is_scalar(
     return type(obj) in known_types
 
 
-def is_on_device(
-    obj: Any,
-) -> bool:
+def is_on_device(obj: Any) -> bool:
     """Tests if `obj` is on a device.
 
     Jax arrays are always on the CPU and GPU (if there is one). Thus for Jax
@@ -95,18 +85,14 @@ def is_on_device(
     return dace.is_gpu_array(obj)
 
 
-def is_fully_addressable(
-    obj: Any,
-) -> bool:
+def is_fully_addressable(obj: Any) -> bool:
     """Tests if `obj` is fully addressable, i.e. is only on this host."""
     if is_jax_array(obj):
         return obj.is_fully_addressable
     return True
 
 
-def is_c_contiguous(
-    obj: Any,
-) -> bool:
+def is_c_contiguous(obj: Any) -> bool:
     """Tests if `obj` is in C order."""
     if not is_array(obj):
         return False
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 6dab94c..7ded2d1 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -21,16 +21,7 @@
 import dataclasses
 import functools
 from collections.abc import Callable, Hashable
-from typing import (
-    TYPE_CHECKING,
-    Any,
-    Concatenate,
-    Generic,
-    ParamSpec,
-    TypeAlias,
-    TypeVar,
-    cast,
-)
+from typing import TYPE_CHECKING, Any, Concatenate, Generic, ParamSpec, TypeAlias, TypeVar, cast
 
 import dace
 from jax import core as jax_core
@@ -77,9 +68,7 @@ def __init__(self) -> None:
 
     @abc.abstractmethod
     def _make_call_description(
-        self: CachingStage,
-        *args: Any,
-        **kwargs: Any,
+        self: CachingStage, *args: Any, **kwargs: Any
     ) -> StageTransformationSpec:
         """Generates the key that is used to store/locate the call in the cache."""
         ...
@@ -105,11 +94,7 @@ def cached_transition(
     """
 
     @functools.wraps(transition)
-    def transition_wrapper(
-        self: CachingStageType,
-        *args: P.args,
-        **kwargs: P.kwargs,
-    ) -> NextStage:
+    def transition_wrapper(self: CachingStageType, *args: P.args, **kwargs: P.kwargs) -> NextStage:
         key: StageTransformationSpec = self._make_call_description(*args, **kwargs)
         if key in self._cache:
             return self._cache[key]
@@ -126,9 +111,7 @@ def clear_translation_cache() -> None:
         stage_caches.clear()
 
 
-def get_cache(
-    stage: CachingStage,
-) -> StageCache:
+def get_cache(stage: CachingStage) -> StageCache:
     """Returns the cache that should be used for `stage`."""
     stage_type = type(stage)
     if stage_type not in _TRANSLATION_CACHES:
@@ -161,10 +144,7 @@ class _AbstractCallArgument:
     storage: dace.StorageType
 
     @classmethod
-    def from_value(
-        cls,
-        value: Any,
-    ) -> _AbstractCallArgument:
+    def from_value(cls, value: Any) -> _AbstractCallArgument:
         """Construct an `_AbstractCallArgument` from `value`."""
         if not util.is_fully_addressable(value):
             raise NotImplementedError("Distributed arrays are not addressed yet.")
@@ -201,8 +181,7 @@ def from_value(
 #: This type is the abstract description of a function call.
 #:  It is part of the key used in the cache.
 CallArgsSpec: TypeAlias = tuple[
-    _AbstractCallArgument | Hashable | tuple[str, _AbstractCallArgument | Hashable],
-    ...,
+    _AbstractCallArgument | Hashable | tuple[str, _AbstractCallArgument | Hashable], ...
 ]
 
 
@@ -246,33 +225,20 @@ class StageCache(Generic[StageType]):
     _memory: collections.OrderedDict[StageTransformationSpec, StageType]
     _capacity: int
 
-    def __init__(
-        self,
-        capachity: int = 256,
-    ) -> None:
+    def __init__(self, capachity: int = 256) -> None:
         self._memory = collections.OrderedDict()
         self._capacity = capachity
 
-    def __contains__(
-        self,
-        key: StageTransformationSpec,
-    ) -> bool:
+    def __contains__(self, key: StageTransformationSpec) -> bool:
         return key in self._memory
 
-    def __getitem__(
-        self,
-        key: StageTransformationSpec,
-    ) -> StageType:
+    def __getitem__(self, key: StageTransformationSpec) -> StageType:
         if key not in self:
             raise KeyError(f"Key '{key}' is unknown.")
         self._memory.move_to_end(key, last=True)
         return self._memory[key]
 
-    def __setitem__(
-        self,
-        key: StageTransformationSpec,
-        res: StageType,
-    ) -> None:
+    def __setitem__(self, key: StageTransformationSpec, res: StageType) -> None:
         if key in self:
             self._memory.move_to_end(key, last=True)
             self._memory[key] = res
@@ -281,10 +247,7 @@ def __setitem__(
                 self.popitem(None)
             self._memory[key] = res
 
-    def popitem(
-        self,
-        key: StageTransformationSpec | None,
-    ) -> None:
+    def popitem(self, key: StageTransformationSpec | None) -> None:
         """Evict `key` from `self`.
 
         If `key` is `None` the oldest entry is evicted.
diff --git a/tests/integration_tests/primitive_translators/conftest.py b/tests/integration_tests/primitive_translators/conftest.py
index 73b2699..3c79e98 100644
--- a/tests/integration_tests/primitive_translators/conftest.py
+++ b/tests/integration_tests/primitive_translators/conftest.py
@@ -23,7 +23,7 @@
 @pytest.fixture(
     autouse=True,
     params=[
-        optimization.NO_OPTIMIZATIONS,
+        optimization.NO_OPTIMIZATIONS
         # TODO(phimuell): find a way to conditionally enable.
         # optimization.DEFAULT_OPTIMIZATIONS,
     ],
diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index 0854dea..b062a66 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -82,9 +82,7 @@ def _only_alt_translators() -> Generator[None, None, None]:
         (jnp.bitwise_not, 1, np.int64),
     ]
 )
-def logical_ops(
-    request,
-) -> tuple[Callable, tuple[np.ndarray, ...]]:
+def logical_ops(request) -> tuple[Callable, tuple[np.ndarray, ...]]:
     """Returns a logical operation function and inputs."""
     return (
         request.param[0],
@@ -101,9 +99,7 @@ def logical_ops(
         ),
     ]
 )
-def dtype(
-    request,
-) -> type:
+def dtype(request) -> type:
     """Data types that should be used for the numerical tests of the ALT translators."""
     return request.param
 
@@ -128,10 +124,7 @@ def dtype(
         lambda x: jnp.atanh(jnp.tanh(x)),
     ]
 )
-def alt_unary_ops(
-    request,
-    dtype: type,
-) -> tuple[Callable, np.ndarray]:
+def alt_unary_ops(request, dtype: type) -> tuple[Callable, np.ndarray]:
     """The inputs and the operation we need for the full test.
 
     Some of the unary operations are combined to ensure that they will succeed.
@@ -152,9 +145,7 @@ def alt_unary_ops(
         lambda x, y: x**y,
     ]
 )
-def alt_binary_ops_float(
-    request,
-) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
+def alt_binary_ops_float(request) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
     """Binary ALT operations that operates on floats."""
     # Getting 0 in the division test is unlikely.
     return (  # type: ignore[return-value]  # Type confusion.
@@ -173,9 +164,7 @@ def alt_binary_ops_float(
         lambda x, y: x > y,
     ]
 )
-def alt_binary_compare_ops(
-    request,
-) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
+def alt_binary_compare_ops(request) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
     """Comparison operations, operates on integers."""
     return (
         request.param,
@@ -190,17 +179,12 @@ def alt_binary_compare_ops(
         [(5, 1, 3, 4, 1, 5), (5, 1, 3, 1, 2, 5)],
     ]
 )
-def broadcast_input(
-    request,
-) -> tuple[np.ndarray, np.ndarray]:
+def broadcast_input(request) -> tuple[np.ndarray, np.ndarray]:
     """Inputs to be used for the broadcast test."""
     return tuple(testutil.mkarray(shape) for shape in request.param)  # type: ignore[return-value] # can not deduce that it is only size 2.
 
 
-def _perform_alt_test(
-    testee: Callable,
-    *args: Any,
-) -> None:
+def _perform_alt_test(testee: Callable, *args: Any) -> None:
     """General function that just performs the test."""
     wrapped = jace.jit(testee)
 
@@ -304,9 +288,7 @@ def testee(A: np.ndarray) -> np.ndarray:
     _perform_alt_test(testee, A)
 
 
-def test_mapped_broadcast(
-    broadcast_input: tuple[np.ndarray, np.ndarray],
-) -> None:
+def test_mapped_broadcast(broadcast_input: tuple[np.ndarray, np.ndarray]) -> None:
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
@@ -319,9 +301,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 # <------------ Tests for arithmetic and logical translators/operations
 
 
-def test_alt_general_unary(
-    alt_unary_ops: tuple[Callable, np.ndarray],
-) -> None:
+def test_alt_general_unary(alt_unary_ops: tuple[Callable, np.ndarray]) -> None:
     def testee(A: np.ndarray) -> np.ndarray:
         return alt_unary_ops[0](A)
 
diff --git a/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
index 088e5d6..9300254 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
@@ -35,9 +35,7 @@
 
 
 @pytest.fixture(params=[(10,), (10, 1), (1, 10)])
-def vector_shape(
-    request,
-) -> tuple[int, ...]:
+def vector_shape(request) -> tuple[int, ...]:
     """Shapes used in the `test_bid_vector()` tests."""
     return request.param
 
@@ -70,9 +68,7 @@ def testee(a: float) -> jax.Array:
     assert np.all(res == ref)
 
 
-def test_bid_vector(
-    vector_shape: Sequence[int],
-) -> None:
+def test_bid_vector(vector_shape: Sequence[int]) -> None:
     """Broadcast a vector to a tensor."""
 
     def testee(A: np.ndarray) -> jax.Array:
diff --git a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
index 181b384..fe86b4b 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
@@ -38,17 +38,13 @@
 
 
 @pytest.fixture(params=_DACE_REAL_TYPES)
-def src_type(
-    request,
-) -> type:
+def src_type(request) -> type:
     """All valid source types, with the exception of bool."""
     return request.param
 
 
 @pytest.fixture(params=_DACE_REAL_TYPES + _DACE_COMPLEX_TYPES)
-def dst_type(
-    request,
-) -> type:
+def dst_type(request) -> type:
     """All valid destination types, with the exception of bool.
 
     Includes also complex types, because going from real to complex is useful,
@@ -57,10 +53,7 @@ def dst_type(
     return request.param
 
 
-def _convert_element_type_impl(
-    input_type: type,
-    output_type: type,
-) -> None:
+def _convert_element_type_impl(input_type: type, output_type: type) -> None:
     """Implementation of the tests of the convert element types primitive."""
     lowering_cnt = [0]
     A: np.ndarray = testutil.mkarray((10, 10), input_type)
@@ -79,20 +72,13 @@ def converter(A: np.ndarray) -> jax.Array:
     assert np.allclose(ref, res)
 
 
-def test_convert_element_type_main(
-    src_type: type,
-    dst_type: type,
-) -> None:
+def test_convert_element_type_main(src_type: type, dst_type: type) -> None:
     _convert_element_type_impl(src_type, dst_type)
 
 
-def test_convert_element_type_from_bool(
-    src_type: type,
-) -> None:
+def test_convert_element_type_from_bool(src_type: type) -> None:
     _convert_element_type_impl(np.bool_, src_type)
 
 
-def test_convert_element_type_to_bool(
-    src_type: type,
-) -> None:
+def test_convert_element_type_to_bool(src_type: type) -> None:
     _convert_element_type_impl(src_type, np.bool_)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_reshape.py b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
index a63b3f3..ac4ad50 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_reshape.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
@@ -26,9 +26,7 @@
 
 
 def _test_impl_reshaping(
-    src_shape: Sequence[int],
-    dst_shape: Sequence[int],
-    order: str = "C",
+    src_shape: Sequence[int], dst_shape: Sequence[int], order: str = "C"
 ) -> None:
     """Performs a reshaping from `src_shape` to `dst_shape`."""
     A = testutil.mkarray(src_shape)
@@ -45,61 +43,41 @@ def testee(A: np.ndarray) -> jax.Array:
 
 
 @pytest.fixture(
-    params=[
-        "C",
-        pytest.param("F", marks=pytest.mark.skip("Non C order is not supported")),
-    ]
+    params=["C", pytest.param("F", marks=pytest.mark.skip("Non C order is not supported"))]
 )
-def mem_order(
-    request,
-) -> str:
+def mem_order(request) -> str:
     """Gets the memory order that we want."""
     return request.param
 
 
 @pytest.fixture(params=[(216, 1, 1), (1, 216, 1), (1, 1, 216), (1, 6, 36), (36, 1, 6)])
-def new_shape(
-    request,
-) -> None:
+def new_shape(request) -> None:
     """New shapes for the `test_reshaping_same_rank()` test."""
     return request.param
 
 
 @pytest.fixture(params=[(12, 1), (1, 12), (1, 1, 12), (1, 2, 6)])
-def expanded_shape(
-    request,
-) -> None:
+def expanded_shape(request) -> None:
     """New shapes for the `test_reshaping_removing_rank()` test."""
     return request.param
 
 
 @pytest.fixture(params=[(216,), (6, 36), (36, 6), (216, 1)])
-def reduced_shape(
-    request,
-) -> None:
+def reduced_shape(request) -> None:
     """New shapes for the `test_reshaping_adding_rank()` test."""
     return request.param
 
 
-def test_reshaping_same_rank(
-    new_shape: Sequence[int],
-    mem_order: str,
-) -> None:
+def test_reshaping_same_rank(new_shape: Sequence[int], mem_order: str) -> None:
     """The rank, numbers of dimensions, stays the same,"""
     _test_impl_reshaping((6, 6, 6), new_shape, mem_order)
 
 
-def test_reshaping_adding_rank(
-    expanded_shape: Sequence[int],
-    mem_order: str,
-) -> None:
+def test_reshaping_adding_rank(expanded_shape: Sequence[int], mem_order: str) -> None:
     """Adding ranks to an array."""
     _test_impl_reshaping((12,), expanded_shape, mem_order)
 
 
-def test_reshaping_removing_rank(
-    reduced_shape: Sequence[int],
-    mem_order: str,
-) -> None:
+def test_reshaping_removing_rank(reduced_shape: Sequence[int], mem_order: str) -> None:
     """Removing ranks from an array."""
     _test_impl_reshaping((6, 6, 6), reduced_shape, mem_order)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_select_n.py b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
index e9871bf..a5faa44 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_select_n.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
@@ -24,10 +24,7 @@
     from collections.abc import Callable
 
 
-def _perform_test(
-    testee: Callable,
-    *args: Any,
-) -> None:
+def _perform_test(testee: Callable, *args: Any) -> None:
     res = testee(*args)
     ref = jace.jit(testee)(*args)
     assert np.all(res == ref)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_slicing.py b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
index 95778da..6c70c4e 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_slicing.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
@@ -36,16 +36,12 @@ def A_4x4x4x4() -> np.ndarray:
         (3, 1, 3, 0),  # Will lead to readjustment of the start index.
     ]
 )
-def full_dynamic_start_idx(
-    request,
-) -> tuple[int, int, int, int]:
+def full_dynamic_start_idx(request) -> tuple[int, int, int, int]:
     """Start indexes for the slice window of `test_dynamic_slice_full_dynamic()`."""
     return request.param
 
 
-def test_slice_no_strides(
-    A_20x20x20: np.ndarray,
-) -> None:
+def test_slice_no_strides(A_20x20x20: np.ndarray) -> None:
     """Test without strides."""
 
     def testee(A: np.ndarray) -> jax.Array:
@@ -59,9 +55,7 @@ def testee(A: np.ndarray) -> jax.Array:
     assert np.all(ref == res)
 
 
-def test_slice_strides(
-    A_20x20x20: np.ndarray,
-) -> None:
+def test_slice_strides(A_20x20x20: np.ndarray) -> None:
     """Test with strides."""
 
     def testee(A: np.ndarray) -> jax.Array:
@@ -79,8 +73,7 @@ def testee(A: np.ndarray) -> jax.Array:
     "In unoptimized mode there is an error, that is caused because we have an array insteadof a scalar."
 )
 def test_dynamic_slice_full_dynamic(
-    A_4x4x4x4: np.ndarray,
-    full_dynamic_start_idx: tuple[int, int, int, int],
+    A_4x4x4x4: np.ndarray, full_dynamic_start_idx: tuple[int, int, int, int]
 ) -> None:
     def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> jax.Array:
         return jax.lax.dynamic_slice(A, (s1, s2, s3, s4), (2, 2, 2, 2))
@@ -94,9 +87,7 @@ def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> jax.Array:
 @pytest.mark.skip(
     "In unoptimized mode there is an error, that is caused because we have an array insteadof a scalar."
 )
-def test_dynamic_slice_partially_dynamic(
-    A_4x4x4x4: np.ndarray,
-) -> None:
+def test_dynamic_slice_partially_dynamic(A_4x4x4x4: np.ndarray) -> None:
     def testee(A: np.ndarray, s1: int, s2: int) -> jax.Array:
         return jax.lax.dynamic_slice(A, (s1, 1, s2, 2), (2, 2, 2, 2))
 
@@ -109,9 +100,7 @@ def testee(A: np.ndarray, s1: int, s2: int) -> jax.Array:
 @pytest.mark.skip(
     "In unoptimized mode there is an error, that is caused because we have an array insteadof a scalar."
 )
-def test_dynamic_slice_full_literal(
-    A_4x4x4x4: np.ndarray,
-) -> None:
+def test_dynamic_slice_full_literal(A_4x4x4x4: np.ndarray) -> None:
     def testee(A: np.ndarray) -> jax.Array:
         return jax.lax.dynamic_slice(A, (0, 1, 0, 2), (2, 2, 2, 2))
 
diff --git a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
index cc5f56e..c82e4bb 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
@@ -30,10 +30,7 @@
     from collections.abc import Sequence
 
 
-def _roundtrip_implementation(
-    shape: Sequence[int],
-    axis: int | Sequence[int],
-) -> None:
+def _roundtrip_implementation(shape: Sequence[int], axis: int | Sequence[int]) -> None:
     """Implementation of the test for `expand_dims()` and `squeeze()`.
 
     It will first add dimensions and then remove them.
@@ -59,33 +56,18 @@ def _roundtrip_implementation(
 
 
 @pytest.fixture(params=[0, -1, 1])
-def single_axis(
-    request,
-) -> int:
+def single_axis(request) -> int:
     return request.param
 
 
-@pytest.fixture(
-    params=[
-        0,
-        -1,
-        (1, 2, 3),
-        (3, 2, 1),
-    ]
-)
-def multiple_axis(
-    request,
-) -> tuple[int, ...] | int:
+@pytest.fixture(params=[0, -1, (1, 2, 3), (3, 2, 1)])
+def multiple_axis(request) -> tuple[int, ...] | int:
     return request.param
 
 
-def test_expand_squeeze_rountrip_simple(
-    single_axis: int,
-) -> None:
+def test_expand_squeeze_rountrip_simple(single_axis: int) -> None:
     _roundtrip_implementation((10,), single_axis)
 
 
-def test_expand_squeeze_rountrip_big(
-    multiple_axis: Sequence[int],
-) -> None:
+def test_expand_squeeze_rountrip_big(multiple_axis: Sequence[int]) -> None:
     _roundtrip_implementation((2, 3, 4, 5), multiple_axis)
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 53bd65a..17253b5 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -186,9 +186,7 @@ def test_builder_variable_alloc_prefix_naming(
     assert exp_name_3 == sdfg_name_3
 
 
-def test_builder_nested(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
+def test_builder_nested(translation_builder: translator.JaxprTranslationBuilder) -> None:
     """Tests the ability of the nesting of the builder."""
 
     # Now add a variable to the current subtext.
@@ -260,9 +258,7 @@ def test_builder_nested(
     assert name_3 == translation_builder.map_jax_var_to_sdfg(array3)
 
 
-def test_builder_append_state(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
+def test_builder_append_state(translation_builder: translator.JaxprTranslationBuilder) -> None:
     """Tests the functionality of appending states."""
     sdfg: dace.SDFG = translation_builder.sdfg
 
@@ -348,10 +344,7 @@ def test_builder_variable_alloc_list(
     var_list_1 = [array1, nscal, scal2]
     exp_names_1 = ["a", nscal.name, "c"]
 
-    res_names_1 = translation_builder.create_jax_var_list(
-        var_list_1,
-        update_var_mapping=True,
-    )
+    res_names_1 = translation_builder.create_jax_var_list(var_list_1, update_var_mapping=True)
     assert len(translation_builder.arrays) == 3
     assert res_names_1 == exp_names_1
 
@@ -359,10 +352,7 @@ def test_builder_variable_alloc_list(
     var_list_2 = [array2, nscal, scal1]
     exp_names_2 = ["d", nscal.name, "e"]
 
-    res_names_2 = translation_builder.create_jax_var_list(
-        var_list_2,
-        update_var_mapping=True,
-    )
+    res_names_2 = translation_builder.create_jax_var_list(var_list_2, update_var_mapping=True)
     assert res_names_2 == exp_names_2
     assert len(translation_builder.arrays) == 5
 
@@ -406,10 +396,7 @@ def test_builder_variable_alloc_list_prevent_creation(
         expected_exception=ValueError,
         match=re.escape(f"'prevent_creation' given but have to create '{array2}'."),
     ):
-        translation_builder.create_jax_var_list(
-            var_list,
-            prevent_creation=True,
-        )
+        translation_builder.create_jax_var_list(var_list, prevent_creation=True)
     assert len(translation_builder.arrays) == 1
     assert translation_builder.map_jax_var_to_sdfg(array1) == "a"
 
@@ -433,10 +420,7 @@ def test_builder_variable_alloc_list_only_creation(
         expected_exception=ValueError,
         match=re.escape(f"'only_creation' given '{array1}' already exists."),
     ):
-        translation_builder.create_jax_var_list(
-            var_list,
-            only_creation=True,
-        )
+        translation_builder.create_jax_var_list(var_list, only_creation=True)
     assert len(translation_builder.arrays) == 1
     assert translation_builder.map_jax_var_to_sdfg(array1) == "a"
 
@@ -461,23 +445,15 @@ def test_builder_variable_alloc_list_handle_literal(
         expected_exception=ValueError,
         match=re.escape("Encountered a literal but `handle_literals` was `False`."),
     ):
-        translation_builder.create_jax_var_list(
-            var_list,
-            handle_literals=False,
-        )
+        translation_builder.create_jax_var_list(var_list, handle_literals=False)
     assert len(translation_builder.arrays) == 0
 
-    name_list = translation_builder.create_jax_var_list(
-        var_list,
-        handle_literals=True,
-    )
+    name_list = translation_builder.create_jax_var_list(var_list, handle_literals=True)
     assert len(translation_builder.arrays) == 0
     assert name_list == [None]
 
 
-def test_builder_constants(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
+def test_builder_constants(translation_builder: translator.JaxprTranslationBuilder) -> None:
     """Tests part of the `JaxprTranslationBuilder._create_constants()` api.
 
     See also the `test_subtranslators_alu.py::test_add3` test.
@@ -641,8 +617,7 @@ def test_builder_jace_var() -> None:
     """Simple tests about the `JaCeVar` objects."""
     for iname in ["do", "", "_ _", "9al", "_!"]:
         with pytest.raises(
-            expected_exception=ValueError,
-            match=re.escape(f"Supplied the invalid name '{iname}'."),
+            expected_exception=ValueError, match=re.escape(f"Supplied the invalid name '{iname}'.")
         ):
             _ = JaCeVar((), dace.int8, name=iname)
 
diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index 2a6ca33..2c1f005 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -115,10 +115,7 @@ def test_subtranslatior_managing_swap() -> None:
     """Tests the `translator.set_active_primitive_translators_to()` functionality."""
 
     # Allows to compare the structure of dicts.
-    def same_structure(
-        d1: Mapping,
-        d2: Mapping,
-    ) -> bool:
+    def same_structure(d1: Mapping, d2: Mapping) -> bool:
         return d1.keys() == d2.keys() and all(id(d2[k]) == id(d1[k]) for k in d1)
 
     initial_primitives = translator.get_registered_primitive_translators()
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index 306b244..29ec75e 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -400,11 +400,7 @@ def wrapped(A: np.ndarray) -> np.ndarray:
         return A + 10.0
 
     shape = (10, 100, 1000)
-    C = np.array(
-        (testutil.mkarray(shape) - 0.5) * 10,
-        order="C",
-        dtype=np.float64,
-    )
+    C = np.array((testutil.mkarray(shape) - 0.5) * 10, order="C", dtype=np.float64)
     F = np.array(C, copy=True, order="F")
 
     # First we compile run it with C strides.
@@ -431,8 +427,7 @@ def test_caching_jax_numpy_array() -> None:
     """Tests if jax arrays are handled the same way as numpy array."""
 
     def _test_impl(
-        for_lowering: np.ndarray | jax.Array,
-        for_calling: np.ndarray | jax.Array,
+        for_lowering: np.ndarray | jax.Array, for_calling: np.ndarray | jax.Array
     ) -> None:
         tcache.clear_translation_cache()
         lowering_cnt = [0]
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index a9beae2..7d06a2d 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -194,7 +194,7 @@ def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
         jaxpr = jax.make_jaxpr(testee)(A, B)
 
     builder = translator.JaxprTranslationBuilder(
-        primitive_translators=translator.get_registered_primitive_translators(),
+        primitive_translators=translator.get_registered_primitive_translators()
     )
     trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
 
diff --git a/tests/util.py b/tests/util.py
index c5ff56e..f7e5d7a 100644
--- a/tests/util.py
+++ b/tests/util.py
@@ -18,15 +18,10 @@
     from collections.abc import Sequence
 
 
-__all__ = [
-    "mkarray",
-]
+__all__ = ["mkarray"]
 
 
-def mkarray(
-    shape: Sequence[int] | int,
-    dtype: type = np.float64,
-) -> np.ndarray:
+def mkarray(shape: Sequence[int] | int, dtype: type = np.float64) -> np.ndarray:
     """Generates a NumPy ndarray with shape `shape`.
 
     The function uses the generator that is managed by the `_reset_random_seed()` fixture.

From ca7f32a4f41d0958b4b9df2855aca4f56c3af2cf Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 16:00:22 +0200
Subject: [PATCH 333/458] I have now disabled the magic comma in ruff.

I do not like it, but it is fully in line with what the black manpage tells:
	By using it, you agree to cede control over minutiae of hand-formatting.
	In return, Black gives you speed, determinism, and freedom from pycodestyle nagging about formatting.
	You will save time and mental energy for more important matters.
---
 docs/conf.py                                  | 22 +----
 noxfile.py                                    |  8 +-
 pyproject.toml                                |  1 +
 src/jace/api.py                               |  7 +-
 src/jace/optimization.py                      |  5 +-
 src/jace/stages.py                            | 68 +++-----------
 .../translator/jaxpr_translator_builder.py    | 93 ++++---------------
 .../mapped_operation_base_translator.py       | 13 +--
 src/jace/translator/pre_post_translation.py   |  3 +-
 src/jace/translator/primitive_translator.py   | 15 +--
 .../arithmetic_logical_translators.py         | 13 +--
 .../select_n_translator.py                    |  8 +-
 .../primitive_translators/slicing.py          |  6 +-
 src/jace/util/__init__.py                     |  6 +-
 src/jace/util/dace_helper.py                  | 10 +-
 src/jace/util/jax_helper.py                   | 26 ++----
 src/jace/util/traits.py                       | 28 ++----
 src/jace/util/translation_cache.py            | 59 +++---------
 .../primitive_translators/conftest.py         |  2 +-
 ...primitive_arithmetic_logical_operations.py | 38 ++------
 .../test_primitive_broadcast_in_dim.py        |  8 +-
 .../test_primitive_convert_element_type.py    | 26 ++----
 .../test_primitive_reshape.py                 | 40 ++------
 .../test_primitive_select_n.py                |  5 +-
 .../test_primitive_slicing.py                 | 23 ++---
 .../test_primitive_squeeze_expand_dims.py     | 30 ++----
 .../test_jaxpr_translator_builder.py          | 45 ++-------
 .../test_primitive_translator_managing.py     |  5 +-
 tests/unit_tests/test_caching.py              |  9 +-
 tests/unit_tests/test_jax_api.py              |  2 +-
 tests/util.py                                 |  9 +-
 31 files changed, 139 insertions(+), 494 deletions(-)

diff --git a/docs/conf.py b/docs/conf.py
index cb0bb09..e902d98 100644
--- a/docs/conf.py
+++ b/docs/conf.py
@@ -26,28 +26,14 @@
 ]
 
 source_suffix = [".rst", ".md"]
-exclude_patterns = [
-    "_build",
-    "**.ipynb_checkpoints",
-    "Thumbs.db",
-    ".DS_Store",
-    ".env",
-    ".venv",
-]
+exclude_patterns = ["_build", "**.ipynb_checkpoints", "Thumbs.db", ".DS_Store", ".env", ".venv"]
 
 html_theme = "furo"
 
-myst_enable_extensions = [
-    "colon_fence",
-]
+myst_enable_extensions = ["colon_fence"]
 
-intersphinx_mapping = {
-    "python": ("https://docs.python.org/3", None),
-}
+intersphinx_mapping = {"python": ("https://docs.python.org/3", None)}
 
-nitpick_ignore = [
-    ("py:class", "_io.StringIO"),
-    ("py:class", "_io.BytesIO"),
-]
+nitpick_ignore = [("py:class", "_io.StringIO"), ("py:class", "_io.BytesIO")]
 
 always_document_param_types = True
diff --git a/noxfile.py b/noxfile.py
index 3772f2d..2154c16 100644
--- a/noxfile.py
+++ b/noxfile.py
@@ -79,13 +79,7 @@ def build_api_docs(session: nox.Session) -> None:
     session.install("sphinx")
     session.chdir("docs")
     session.run(
-        "sphinx-apidoc",
-        "-o",
-        "api/",
-        "--module-first",
-        "--no-toc",
-        "--force",
-        "../src/jace",
+        "sphinx-apidoc", "-o", "api/", "--module-first", "--no-toc", "--force", "../src/jace"
     )
 
 
diff --git a/pyproject.toml b/pyproject.toml
index d7e3b1d..62987e1 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -126,6 +126,7 @@ src = ["src"]
 
 [tool.ruff.format]
 docstring-code-format = true
+skip-magic-trailing-comma = true
 
 [tool.ruff.lint]
 extend-select = [
diff --git a/src/jace/api.py b/src/jace/api.py
index 9f128b3..46e15b2 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -21,12 +21,7 @@
     from collections.abc import Callable, Mapping
 
 
-__all__ = [
-    "grad",
-    "jacfwd",
-    "jacrev",
-    "jit",
-]
+__all__ = ["grad", "jacfwd", "jacrev", "jit"]
 
 
 @overload
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index 94a8f36..612929b 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -47,10 +47,7 @@ class CompilerOptions(TypedDict, total=False):
 }
 
 
-def jace_optimize(
-    tsdfg: translator.TranslatedJaxprSDFG,
-    **kwargs: Unpack[CompilerOptions],
-) -> None:
+def jace_optimize(tsdfg: translator.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOptions]) -> None:
     """Performs optimization of the translated SDFG _in place_.
 
     It is recommended to use the `CompilerOptions` `TypedDict` to pass options
diff --git a/src/jace/stages.py b/src/jace/stages.py
index b64e5d6..66d1e51 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -107,11 +107,7 @@ def __init__(
         self._jit_options = {**jit_options}
         self._fun = fun
 
-    def __call__(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> Any:
+    def __call__(self, *args: Any, **kwargs: Any) -> Any:
         """Executes the wrapped function, lowering and compiling as needed in one step.
 
         The arguments passed to this function are the same as the wrapped function uses.
@@ -126,11 +122,7 @@ def __call__(
         return compiled(*args, **kwargs)
 
     @tcache.cached_transition
-    def lower(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> JaCeLowered:
+    def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
         """Lower this function explicitly for the given arguments.
 
         Performs the first two steps of the AOT steps described above, i.e.
@@ -180,10 +172,7 @@ def wrapped_fun(self) -> Callable:
         """Returns the wrapped function."""
         return self._fun
 
-    def _make_call_description(
-        self,
-        *args: Any,
-    ) -> tcache.StageTransformationSpec:
+    def _make_call_description(self, *args: Any) -> tcache.StageTransformationSpec:
         """This function computes the key for the `JaCeWrapped.lower()` call inside the cache.
 
         The function will compute a full abstract description on its argument.
@@ -214,18 +203,12 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
 
     _translated_sdfg: translator.TranslatedJaxprSDFG
 
-    def __init__(
-        self,
-        tsdfg: translator.TranslatedJaxprSDFG,
-    ) -> None:
+    def __init__(self, tsdfg: translator.TranslatedJaxprSDFG) -> None:
         super().__init__()
         self._translated_sdfg = tsdfg
 
     @tcache.cached_transition
-    def compile(
-        self,
-        compiler_options: CompilerOptions | None = None,
-    ) -> JaCeCompiled:
+    def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled:
         """Optimize and compile the lowered SDFG and return a `JaCeCompiled` object.
 
         This is the transition function of this stage. Before the SDFG is
@@ -250,10 +233,7 @@ def compile(
             out_names=tsdfg.out_names,
         )
 
-    def compiler_ir(
-        self,
-        dialect: str | None = None,
-    ) -> translator.TranslatedJaxprSDFG:
+    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
         """Returns the internal SDFG.
 
         The function returns a `TranslatedJaxprSDFG` object. Direct modification
@@ -263,10 +243,7 @@ def compiler_ir(
             return self._translated_sdfg
         raise ValueError(f"Unknown dialect '{dialect}'.")
 
-    def view(
-        self,
-        filename: str | None = None,
-    ) -> None:
+    def view(self, filename: str | None = None) -> None:
         """Runs the `view()` method of the underlying SDFG.
 
         This will open a browser and display the SDFG.
@@ -281,8 +258,7 @@ def as_sdfg(self) -> dace.SDFG:
         return self.compiler_ir().sdfg
 
     def _make_call_description(
-        self,
-        compiler_options: CompilerOptions | None = None,
+        self, compiler_options: CompilerOptions | None = None
     ) -> tcache.StageTransformationSpec:
         """This function computes the key for the `self.compile()` call inside the cache.
 
@@ -293,10 +269,7 @@ def _make_call_description(
         call_args = tuple(sorted(options.items(), key=lambda x: x[0]))
         return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
 
-    def _make_compiler_options(
-        self,
-        compiler_options: CompilerOptions | None,
-    ) -> CompilerOptions:
+    def _make_compiler_options(self, compiler_options: CompilerOptions | None) -> CompilerOptions:
         """Return the compilation options that should be used for compilation.
 
         See `JaCeLowered.compile()` to see how to influence them.
@@ -304,9 +277,7 @@ def _make_compiler_options(
         return get_active_compiler_options() | (compiler_options or {})
 
 
-def update_active_compiler_options(
-    new_active_options: CompilerOptions,
-) -> CompilerOptions:
+def update_active_compiler_options(new_active_options: CompilerOptions) -> CompilerOptions:
     """Updates the set of active compiler options.
 
     Merges the options passed as `new_active_options` with the currently active
@@ -350,10 +321,7 @@ class JaCeCompiled:
     _out_names: tuple[str, ...]
 
     def __init__(
-        self,
-        csdfg: dace_helper.CompiledSDFG,
-        inp_names: Sequence[str],
-        out_names: Sequence[str],
+        self, csdfg: dace_helper.CompiledSDFG, inp_names: Sequence[str], out_names: Sequence[str]
     ) -> None:
         # NOTE: We only check that we have output, we do not care about the input, since the
         #  function `def foo(): return 1.0` is still a pure function, but we require that we have
@@ -364,23 +332,13 @@ def __init__(
         self._inp_names = tuple(inp_names)
         self._out_names = tuple(out_names)
 
-    def __call__(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> Any:
+    def __call__(self, *args: Any, **kwargs: Any) -> Any:
         """Calls the embedded computation.
 
         The arguments must be the same as for the wrapped function, but with
         all static arguments removed.
         """
-        return dace_helper.run_jax_sdfg(
-            self._csdfg,
-            self._inp_names,
-            self._out_names,
-            args,
-            kwargs,
-        )
+        return dace_helper.run_jax_sdfg(self._csdfg, self._inp_names, self._out_names, args, kwargs)
 
 
 #: Known compilation stages in JaCe.
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 1312321..1dd1b5b 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -76,8 +76,7 @@ class JaxprTranslationBuilder:
     _ctx_stack: list[TranslationContext]
 
     def __init__(
-        self,
-        primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable],
+        self, primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable]
     ) -> None:
         # Maps name of primitives to the associated translator.
         self._primitive_translators = {**primitive_translators}
@@ -93,10 +92,7 @@ def __init__(
         self._ctx_stack = []
 
     def translate_jaxpr(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-        *,
-        name: str | None = None,
+        self, jaxpr: jax_core.ClosedJaxpr, *, name: str | None = None
     ) -> TranslationContext:
         """Perform the translation of a Jaxpr into a SDFG.
 
@@ -123,13 +119,8 @@ def translate_jaxpr(
         #       Thus the builder will start to translate a second (nested) SDFG.
         #       Also note that there is no mechanism that forces the integration of the nested
         #       SDFG/Jaxpr, this must be done manually.
-        self._allocate_translation_ctx(
-            name=name,
-            jaxpr=jaxpr,
-        )
-        self._create_constants(
-            jaxpr=jaxpr,
-        )
+        self._allocate_translation_ctx(name=name, jaxpr=jaxpr)
+        self._create_constants(jaxpr=jaxpr)
         self._create_initial_input(jaxpr=jaxpr)
 
         return self._translate_jaxpr_internal(jaxpr)
@@ -192,10 +183,7 @@ def arrays(self) -> Mapping[str, ddata.Data]:
         """
         return cast(Mapping[str, ddata.Data], self._ctx.sdfg.arrays)
 
-    def get_array(
-        self,
-        name: str | jax_core.Atom | util.JaCeVar,
-    ) -> ddata.Data:
+    def get_array(self, name: str | jax_core.Atom | util.JaCeVar) -> ddata.Data:
         """Returns the SDFG `Data` object `name` referees to.
 
         `name` can either be a string, in which case it is interpreted as a
@@ -214,22 +202,16 @@ def get_array(
 
     @overload
     def map_jax_var_to_sdfg(
-        self,
-        jax_var: jax_core.Atom | util.JaCeVar,
-        allow_fail: Literal[False] = False,
+        self, jax_var: jax_core.Atom | util.JaCeVar, allow_fail: Literal[False] = False
     ) -> str: ...
 
     @overload
     def map_jax_var_to_sdfg(
-        self,
-        jax_var: jax_core.Atom | util.JaCeVar,
-        allow_fail: Literal[True],
+        self, jax_var: jax_core.Atom | util.JaCeVar, allow_fail: Literal[True]
     ) -> str | None: ...
 
     def map_jax_var_to_sdfg(
-        self,
-        jax_var: jax_core.Atom | util.JaCeVar,
-        allow_fail: bool = False,
+        self, jax_var: jax_core.Atom | util.JaCeVar, allow_fail: bool = False
     ) -> str | None:
         """Get the name of the SDFG variable to which `jax_var` is referring to.
 
@@ -274,9 +256,7 @@ def is_root_translator(self) -> bool:
         return len(self._ctx_stack) == 1
 
     def add_jax_name_mapping(
-        self,
-        jax_var: jax_core.Var | util.JaCeVar,
-        sdfg_name: str,
+        self, jax_var: jax_core.Var | util.JaCeVar, sdfg_name: str
     ) -> JaxprTranslationBuilder:
         """Creates a new mapping between `jax_var` to `sdfg_name`.
 
@@ -351,10 +331,7 @@ def add_array(
 
         if shape == ():
             self._ctx.sdfg.add_scalar(
-                name=arg_name,
-                storage=storage,
-                dtype=dtype,
-                transient=as_transient,
+                name=arg_name, storage=storage, dtype=dtype, transient=as_transient
             )
         else:
             self._ctx.sdfg.add_array(
@@ -453,10 +430,7 @@ def create_jax_var_list(  # type: ignore[misc]
 
         return ret_list
 
-    def _create_initial_input(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-    ) -> None:
+    def _create_initial_input(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         """Creates the input variables of `jaxpr`.
 
         Notes:
@@ -478,10 +452,7 @@ def _create_initial_input(
         # The output list is populated by `self._translate_jaxpr_internal()`
         self._ctx.inp_names = tuple(init_in_var_names)
 
-    def _create_constants(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-    ) -> None:
+    def _create_constants(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         """Creates all constants requested by the `jaxpr`.
 
         The function will create an SDFG variable and add them as constant to
@@ -504,21 +475,14 @@ def _create_constants(
             )
 
     def _allocate_translation_ctx(
-        self,
-        name: str | None,
-        jaxpr: jax_core.ClosedJaxpr,
+        self, name: str | None, jaxpr: jax_core.ClosedJaxpr
     ) -> JaxprTranslationBuilder:
         """Allocate a new context and activate it.
 
         Args:
             name: The name of the SDFG.
         """
-        self._ctx_stack.append(
-            TranslationContext(
-                name=name,
-                jaxpr=jaxpr,
-            )
-        )
+        self._ctx_stack.append(TranslationContext(name=name, jaxpr=jaxpr))
         return self
 
     @property
@@ -543,10 +507,7 @@ def _clear_translation_ctx(self) -> TranslationContext | None:
         # Remove the current head stack.
         return self._ctx_stack.pop()
 
-    def _translate_single_eqn(
-        self,
-        eqn: jax_core.JaxprEqn,
-    ) -> None:
+    def _translate_single_eqn(self, eqn: jax_core.JaxprEqn) -> None:
         """Translate `eqn` into its SDFG equivalent.
 
         To do this the function will perform the following steps:
@@ -602,10 +563,7 @@ def _translate_single_eqn(
         # Modify terminal root state of 'self'
         self._ctx.terminal_state = new_sdfg_term_state
 
-    def _translate_jaxpr_internal(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-    ) -> TranslationContext:
+    def _translate_jaxpr_internal(self, jaxpr: jax_core.ClosedJaxpr) -> TranslationContext:
         """Performs the actual translation of the Jaxpr into an SDFG.
 
         The function assumes that the context is allocated as well as the
@@ -634,19 +592,14 @@ def _translate_jaxpr_internal(
             out_var_names = self._handle_null_jaxpr(jaxpr)
         else:
             out_var_names = self.create_jax_var_list(
-                jaxpr.jaxpr.outvars,
-                prevent_creation=True,
-                handle_literals=False,
+                jaxpr.jaxpr.outvars, prevent_creation=True, handle_literals=False
             )
 
         self._ctx.out_names = tuple(out_var_names)
 
         return cast(TranslationContext, self._clear_translation_ctx())
 
-    def _handle_null_jaxpr(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-    ) -> list[str]:
+    def _handle_null_jaxpr(self, jaxpr: jax_core.ClosedJaxpr) -> list[str]:
         """This function is called in case a `Jaxpr` with zero equations is encountered.
 
         A function with zero equation might still have output, in which case
@@ -689,9 +642,7 @@ def _handle_null_jaxpr(
             # Now we create a variable that serves as true output, however, since the Jax variable
             #  is already known we can not update the variable mapping and must use another name.
             sdfg_out_name = self.add_array(
-                jax_out_var,
-                name_prefix="_zero_equation_output_for_",
-                update_var_mapping=False,
+                jax_out_var, name_prefix="_zero_equation_output_for_", update_var_mapping=False
             )
             out_var_names.append(sdfg_out_name)
 
@@ -756,11 +707,7 @@ class TranslationContext:
     terminal_state: dace.SDFGState
     jaxpr: jax_core.ClosedJaxpr
 
-    def __init__(
-        self,
-        name: str | None,
-        jaxpr: jax_core.ClosedJaxpr,
-    ) -> None:
+    def __init__(self, name: str | None, jaxpr: jax_core.ClosedJaxpr) -> None:
         if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
diff --git a/src/jace/translator/mapped_operation_base_translator.py b/src/jace/translator/mapped_operation_base_translator.py
index 2b70f30..4cb915c 100644
--- a/src/jace/translator/mapped_operation_base_translator.py
+++ b/src/jace/translator/mapped_operation_base_translator.py
@@ -56,10 +56,7 @@ class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
         This class will always generate a mapped Tasklet, even if a scalar is handled.
     """
 
-    def __init__(
-        self,
-        primitive_name: str,
-    ) -> None:
+    def __init__(self, primitive_name: str) -> None:
         self._prim_name = primitive_name
 
     @property
@@ -96,8 +93,7 @@ def __call__(
             ]
             tskl_output: dict[str, dace.Memlet] = {
                 "__out": dace.Memlet.simple(
-                    out_var_names[0],
-                    ", ".join(name for name, _ in tskl_ranges),
+                    out_var_names[0], ", ".join(name for name, _ in tskl_ranges)
                 )
             }
 
@@ -193,10 +189,7 @@ def make_input_memlets(
         return tskl_inputs
 
     def literal_substitution(
-        self,
-        tskl_code: str,
-        in_var_names: Sequence[str | None],
-        eqn: jax_core.JaxprEqn,
+        self, tskl_code: str, in_var_names: Sequence[str | None], eqn: jax_core.JaxprEqn
     ) -> str:
         """Perform literal substitution on the proto Tasklet code `tskl_code`.
 
diff --git a/src/jace/translator/pre_post_translation.py b/src/jace/translator/pre_post_translation.py
index 37be078..1e3f69f 100644
--- a/src/jace/translator/pre_post_translation.py
+++ b/src/jace/translator/pre_post_translation.py
@@ -56,8 +56,7 @@ def postprocess_jaxpr_sdfg(
 
 
 def finalize_translation_context(
-    trans_ctx: translator.TranslationContext,
-    validate: bool = True,
+    trans_ctx: translator.TranslationContext, validate: bool = True
 ) -> translator.TranslatedJaxprSDFG:
     """Finalizes the supplied translation context `trans_ctx`.
 
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index aaf164f..b452fee 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -117,8 +117,7 @@ def primitive(self) -> str:
 
 @overload
 def make_primitive_translator(
-    primitive: str,
-    primitive_translator: Literal[None] = None,
+    primitive: str, primitive_translator: Literal[None] = None
 ) -> Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]: ...
 
 
@@ -129,8 +128,7 @@ def make_primitive_translator(
 
 
 def make_primitive_translator(
-    primitive: str,
-    primitive_translator: translator.PrimitiveTranslatorCallable | None = None,
+    primitive: str, primitive_translator: translator.PrimitiveTranslatorCallable | None = None
 ) -> (
     Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]
     | translator.PrimitiveTranslator
@@ -161,21 +159,18 @@ def wrapper(
 
 @overload
 def register_primitive_translator(
-    primitive_translator: Literal[None] = None,
-    overwrite: bool = False,
+    primitive_translator: Literal[None] = None, overwrite: bool = False
 ) -> Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]: ...
 
 
 @overload
 def register_primitive_translator(
-    primitive_translator: translator.PrimitiveTranslator,
-    overwrite: bool = False,
+    primitive_translator: translator.PrimitiveTranslator, overwrite: bool = False
 ) -> translator.PrimitiveTranslator: ...
 
 
 def register_primitive_translator(
-    primitive_translator: translator.PrimitiveTranslator | None = None,
-    overwrite: bool = False,
+    primitive_translator: translator.PrimitiveTranslator | None = None, overwrite: bool = False
 ) -> (
     translator.PrimitiveTranslator
     | Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]
diff --git a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
index a344c4a..dfafa7b 100644
--- a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
+++ b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
@@ -45,11 +45,7 @@ class ArithmeticOperationTranslator(mapped_base.MappedOperationTranslatorBase):
             nested `pjit` implementation by Jax for unknown reasons.
     """
 
-    def __init__(
-        self,
-        prim_name: str,
-        tskl_tmpl: str,
-    ) -> None:
+    def __init__(self, prim_name: str, tskl_tmpl: str) -> None:
         super().__init__(primitive_name=prim_name)
         self._tskl_tmpl = tskl_tmpl
 
@@ -98,12 +94,7 @@ class LogicalOperationTranslator(mapped_base.MappedOperationTranslatorBase):
         `ArithmeticOperationTranslator` does.
     """
 
-    def __init__(
-        self,
-        prim_name: str,
-        int_tmpl: str,
-        bool_tmpl: str,
-    ) -> None:
+    def __init__(self, prim_name: str, int_tmpl: str, bool_tmpl: str) -> None:
         super().__init__(primitive_name=prim_name)
         self._int_tmpl = int_tmpl
         self._bool_tmpl = bool_tmpl
diff --git a/src/jace/translator/primitive_translators/select_n_translator.py b/src/jace/translator/primitive_translators/select_n_translator.py
index ee5eb5c..240375a 100644
--- a/src/jace/translator/primitive_translators/select_n_translator.py
+++ b/src/jace/translator/primitive_translators/select_n_translator.py
@@ -71,18 +71,14 @@ def make_input_memlets(
         """We have to add the offsets to the Memlet accesses."""
         return {
             f"__in{i-1}" if i else "__cond": dace.Memlet.simple(
-                in_var_name,
-                ", ".join(f"{it_idx}" for it_idx, _ in tskl_ranges),
+                in_var_name, ", ".join(f"{it_idx}" for it_idx, _ in tskl_ranges)
             )
             for i, in_var_name in enumerate(in_var_names)
             if in_var_name
         }
 
     def literal_substitution(
-        self,
-        tskl_code: str,
-        in_var_names: Sequence[str | None],
-        eqn: jax_core.JaxprEqn,
+        self, tskl_code: str, in_var_names: Sequence[str | None], eqn: jax_core.JaxprEqn
     ) -> str:
         """Can not be done by the base because of the renaming."""
         for i, in_var_name in enumerate(in_var_names[1:]):
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index ee415f4..5a04b3c 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -131,8 +131,7 @@ def __call__(
 
             # Intermediate value to storing the adjusted start index.
             new_start_idx_var_name = builder.add_array(
-                eqn.invars[dim + 1],
-                name_prefix="__jace_adapted_start_idx_",
+                eqn.invars[dim + 1], name_prefix="__jace_adapted_start_idx_"
             )
             new_start_idx_acc = eqn_state.add_access(new_start_idx_var_name)
 
@@ -179,8 +178,7 @@ def __call__(
 
         tskl_input = dace.Memlet.simple(in_var_name, ", ".join(memlet_accesses))
         tskl_output = dace.Memlet.simple(
-            out_var_names[0],
-            ", ".join(name for name, _ in tskl_ranges),
+            out_var_names[0], ", ".join(name for name, _ in tskl_ranges)
         )
 
         _, map_entry, _ = eqn_state.add_mapped_tasklet(
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index c2f2031..bfff733 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -19,11 +19,7 @@
     propose_jax_name,
     translate_dtype,
 )
-from .misc import (
-    FORBIDDEN_SDFG_VAR_NAMES,
-    VALID_SDFG_OBJ_NAME,
-    VALID_SDFG_VAR_NAME,
-)
+from .misc import FORBIDDEN_SDFG_VAR_NAMES, VALID_SDFG_OBJ_NAME, VALID_SDFG_VAR_NAME
 from .traits import (
     is_array,
     is_c_contiguous,
diff --git a/src/jace/util/dace_helper.py b/src/jace/util/dace_helper.py
index d3929e5..cbbb417 100644
--- a/src/jace/util/dace_helper.py
+++ b/src/jace/util/dace_helper.py
@@ -31,16 +31,10 @@
     from jace import translator
     from jace.util import dace_helper
 
-__all__ = [
-    "CompiledSDFG",
-    "compile_jax_sdfg",
-    "run_jax_sdfg",
-]
+__all__ = ["CompiledSDFG", "compile_jax_sdfg", "run_jax_sdfg"]
 
 
-def compile_jax_sdfg(
-    tsdfg: translator.TranslatedJaxprSDFG,
-) -> dace_helper.CompiledSDFG:
+def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> dace_helper.CompiledSDFG:
     """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object."""
     if any(  # We do not support the DaCe return mechanism
         array_name.startswith("__return")
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index cbc25d7..b2e0d75 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -74,10 +74,7 @@ def __post_init__(self) -> None:
     def __hash__(self) -> int:
         return id(self)
 
-    def __eq__(
-        self,
-        other: Any,
-    ) -> bool:
+    def __eq__(self, other: Any) -> bool:
         if not isinstance(other, JaCeVar):
             return NotImplemented
         return id(self) == id(other)
@@ -103,9 +100,7 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
             )
 
 
-def get_jax_var_shape(
-    jax_var: jax_core.Atom | JaCeVar,
-) -> tuple[int | dace.symbol | str, ...]:
+def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symbol | str, ...]:
     """Returns the shape of `jax_var`."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
@@ -118,9 +113,7 @@ def get_jax_var_shape(
             raise TypeError(f"'get_jax_var_shape()` is not implemented for '{type(jax_var)}'.")
 
 
-def get_jax_var_dtype(
-    jax_var: jax_core.Atom | JaCeVar,
-) -> dace.typeclass:
+def get_jax_var_dtype(jax_var: jax_core.Atom | JaCeVar) -> dace.typeclass:
     """Returns the DaCe equivalent of `jax_var`s datatype."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
@@ -133,10 +126,7 @@ def get_jax_var_dtype(
             raise TypeError(f"'get_jax_var_dtype()` is not implemented for '{type(jax_var)}'.")
 
 
-def is_tracing_ongoing(
-    *args: Any,
-    **kwargs: Any,
-) -> bool:
+def is_tracing_ongoing(*args: Any, **kwargs: Any) -> bool:
     """Test if tracing is ongoing.
 
     While a return value `True` guarantees that a translation is ongoing, a
@@ -157,9 +147,7 @@ def is_tracing_ongoing(
     raise RuntimeError("Failed to determine if tracing is ongoing.")
 
 
-def translate_dtype(
-    dtype: Any,
-) -> dace.typeclass:
+def translate_dtype(dtype: Any) -> dace.typeclass:
     """Turns a Jax datatype into a DaCe datatype."""
     if dtype is None:
         raise NotImplementedError  # Handling a special case in DaCe.
@@ -220,9 +208,7 @@ def propose_jax_name(
     return jax_name
 
 
-def get_jax_literal_value(
-    lit: jax_core.Atom,
-) -> bool | float | int | np.generic:
+def get_jax_literal_value(lit: jax_core.Atom) -> bool | float | int | np.generic:
     """Returns the value a literal is wrapping.
 
     The function guarantees to return a scalar value.
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 984f794..18c975f 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -19,9 +19,7 @@
 import jace.util as util
 
 
-def is_drop_var(
-    jax_var: jax_core.Atom | util.JaCeVar,
-) -> TypeGuard[jax_core.DropVar]:
+def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVar]:
     """Tests if `jax_var` is a drop variable, i.e. a variable that is not read from in a Jaxpr."""
 
     if isinstance(jax_var, jax_core.DropVar):
@@ -31,9 +29,7 @@ def is_drop_var(
     return False
 
 
-def is_jax_array(
-    obj: Any,
-) -> TypeGuard[jax.Array]:
+def is_jax_array(obj: Any) -> TypeGuard[jax.Array]:
     """Tests if `obj` is a Jax array.
 
     Note:
@@ -43,16 +39,12 @@ def is_jax_array(
     return isinstance(obj, jax.Array)
 
 
-def is_array(
-    obj: Any,
-) -> bool:
+def is_array(obj: Any) -> bool:
     """Identifies arrays, this also includes Jax arrays."""
     return dace.is_array(obj) or is_jax_array(obj)
 
 
-def is_scalar(
-    obj: Any,
-) -> bool:
+def is_scalar(obj: Any) -> bool:
     """Tests if `obj` is a scalar."""
     # These are the type known to DaCe; Taken from `dace.dtypes`.
     known_types = {
@@ -82,9 +74,7 @@ def is_scalar(
     return type(obj) in known_types
 
 
-def is_on_device(
-    obj: Any,
-) -> bool:
+def is_on_device(obj: Any) -> bool:
     """Tests if `obj` is on a device.
 
     Jax arrays are always on the CPU and GPU (if there is one). Thus for Jax
@@ -95,18 +85,14 @@ def is_on_device(
     return dace.is_gpu_array(obj)
 
 
-def is_fully_addressable(
-    obj: Any,
-) -> bool:
+def is_fully_addressable(obj: Any) -> bool:
     """Tests if `obj` is fully addressable, i.e. is only on this host."""
     if is_jax_array(obj):
         return obj.is_fully_addressable
     return True
 
 
-def is_c_contiguous(
-    obj: Any,
-) -> bool:
+def is_c_contiguous(obj: Any) -> bool:
     """Tests if `obj` is in C order."""
     if not is_array(obj):
         return False
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 6dab94c..7ded2d1 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -21,16 +21,7 @@
 import dataclasses
 import functools
 from collections.abc import Callable, Hashable
-from typing import (
-    TYPE_CHECKING,
-    Any,
-    Concatenate,
-    Generic,
-    ParamSpec,
-    TypeAlias,
-    TypeVar,
-    cast,
-)
+from typing import TYPE_CHECKING, Any, Concatenate, Generic, ParamSpec, TypeAlias, TypeVar, cast
 
 import dace
 from jax import core as jax_core
@@ -77,9 +68,7 @@ def __init__(self) -> None:
 
     @abc.abstractmethod
     def _make_call_description(
-        self: CachingStage,
-        *args: Any,
-        **kwargs: Any,
+        self: CachingStage, *args: Any, **kwargs: Any
     ) -> StageTransformationSpec:
         """Generates the key that is used to store/locate the call in the cache."""
         ...
@@ -105,11 +94,7 @@ def cached_transition(
     """
 
     @functools.wraps(transition)
-    def transition_wrapper(
-        self: CachingStageType,
-        *args: P.args,
-        **kwargs: P.kwargs,
-    ) -> NextStage:
+    def transition_wrapper(self: CachingStageType, *args: P.args, **kwargs: P.kwargs) -> NextStage:
         key: StageTransformationSpec = self._make_call_description(*args, **kwargs)
         if key in self._cache:
             return self._cache[key]
@@ -126,9 +111,7 @@ def clear_translation_cache() -> None:
         stage_caches.clear()
 
 
-def get_cache(
-    stage: CachingStage,
-) -> StageCache:
+def get_cache(stage: CachingStage) -> StageCache:
     """Returns the cache that should be used for `stage`."""
     stage_type = type(stage)
     if stage_type not in _TRANSLATION_CACHES:
@@ -161,10 +144,7 @@ class _AbstractCallArgument:
     storage: dace.StorageType
 
     @classmethod
-    def from_value(
-        cls,
-        value: Any,
-    ) -> _AbstractCallArgument:
+    def from_value(cls, value: Any) -> _AbstractCallArgument:
         """Construct an `_AbstractCallArgument` from `value`."""
         if not util.is_fully_addressable(value):
             raise NotImplementedError("Distributed arrays are not addressed yet.")
@@ -201,8 +181,7 @@ def from_value(
 #: This type is the abstract description of a function call.
 #:  It is part of the key used in the cache.
 CallArgsSpec: TypeAlias = tuple[
-    _AbstractCallArgument | Hashable | tuple[str, _AbstractCallArgument | Hashable],
-    ...,
+    _AbstractCallArgument | Hashable | tuple[str, _AbstractCallArgument | Hashable], ...
 ]
 
 
@@ -246,33 +225,20 @@ class StageCache(Generic[StageType]):
     _memory: collections.OrderedDict[StageTransformationSpec, StageType]
     _capacity: int
 
-    def __init__(
-        self,
-        capachity: int = 256,
-    ) -> None:
+    def __init__(self, capachity: int = 256) -> None:
         self._memory = collections.OrderedDict()
         self._capacity = capachity
 
-    def __contains__(
-        self,
-        key: StageTransformationSpec,
-    ) -> bool:
+    def __contains__(self, key: StageTransformationSpec) -> bool:
         return key in self._memory
 
-    def __getitem__(
-        self,
-        key: StageTransformationSpec,
-    ) -> StageType:
+    def __getitem__(self, key: StageTransformationSpec) -> StageType:
         if key not in self:
             raise KeyError(f"Key '{key}' is unknown.")
         self._memory.move_to_end(key, last=True)
         return self._memory[key]
 
-    def __setitem__(
-        self,
-        key: StageTransformationSpec,
-        res: StageType,
-    ) -> None:
+    def __setitem__(self, key: StageTransformationSpec, res: StageType) -> None:
         if key in self:
             self._memory.move_to_end(key, last=True)
             self._memory[key] = res
@@ -281,10 +247,7 @@ def __setitem__(
                 self.popitem(None)
             self._memory[key] = res
 
-    def popitem(
-        self,
-        key: StageTransformationSpec | None,
-    ) -> None:
+    def popitem(self, key: StageTransformationSpec | None) -> None:
         """Evict `key` from `self`.
 
         If `key` is `None` the oldest entry is evicted.
diff --git a/tests/integration_tests/primitive_translators/conftest.py b/tests/integration_tests/primitive_translators/conftest.py
index 73b2699..3c79e98 100644
--- a/tests/integration_tests/primitive_translators/conftest.py
+++ b/tests/integration_tests/primitive_translators/conftest.py
@@ -23,7 +23,7 @@
 @pytest.fixture(
     autouse=True,
     params=[
-        optimization.NO_OPTIMIZATIONS,
+        optimization.NO_OPTIMIZATIONS
         # TODO(phimuell): find a way to conditionally enable.
         # optimization.DEFAULT_OPTIMIZATIONS,
     ],
diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index 0854dea..b062a66 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -82,9 +82,7 @@ def _only_alt_translators() -> Generator[None, None, None]:
         (jnp.bitwise_not, 1, np.int64),
     ]
 )
-def logical_ops(
-    request,
-) -> tuple[Callable, tuple[np.ndarray, ...]]:
+def logical_ops(request) -> tuple[Callable, tuple[np.ndarray, ...]]:
     """Returns a logical operation function and inputs."""
     return (
         request.param[0],
@@ -101,9 +99,7 @@ def logical_ops(
         ),
     ]
 )
-def dtype(
-    request,
-) -> type:
+def dtype(request) -> type:
     """Data types that should be used for the numerical tests of the ALT translators."""
     return request.param
 
@@ -128,10 +124,7 @@ def dtype(
         lambda x: jnp.atanh(jnp.tanh(x)),
     ]
 )
-def alt_unary_ops(
-    request,
-    dtype: type,
-) -> tuple[Callable, np.ndarray]:
+def alt_unary_ops(request, dtype: type) -> tuple[Callable, np.ndarray]:
     """The inputs and the operation we need for the full test.
 
     Some of the unary operations are combined to ensure that they will succeed.
@@ -152,9 +145,7 @@ def alt_unary_ops(
         lambda x, y: x**y,
     ]
 )
-def alt_binary_ops_float(
-    request,
-) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
+def alt_binary_ops_float(request) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
     """Binary ALT operations that operates on floats."""
     # Getting 0 in the division test is unlikely.
     return (  # type: ignore[return-value]  # Type confusion.
@@ -173,9 +164,7 @@ def alt_binary_ops_float(
         lambda x, y: x > y,
     ]
 )
-def alt_binary_compare_ops(
-    request,
-) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
+def alt_binary_compare_ops(request) -> tuple[Callable, tuple[np.ndarray, np.ndarray]]:
     """Comparison operations, operates on integers."""
     return (
         request.param,
@@ -190,17 +179,12 @@ def alt_binary_compare_ops(
         [(5, 1, 3, 4, 1, 5), (5, 1, 3, 1, 2, 5)],
     ]
 )
-def broadcast_input(
-    request,
-) -> tuple[np.ndarray, np.ndarray]:
+def broadcast_input(request) -> tuple[np.ndarray, np.ndarray]:
     """Inputs to be used for the broadcast test."""
     return tuple(testutil.mkarray(shape) for shape in request.param)  # type: ignore[return-value] # can not deduce that it is only size 2.
 
 
-def _perform_alt_test(
-    testee: Callable,
-    *args: Any,
-) -> None:
+def _perform_alt_test(testee: Callable, *args: Any) -> None:
     """General function that just performs the test."""
     wrapped = jace.jit(testee)
 
@@ -304,9 +288,7 @@ def testee(A: np.ndarray) -> np.ndarray:
     _perform_alt_test(testee, A)
 
 
-def test_mapped_broadcast(
-    broadcast_input: tuple[np.ndarray, np.ndarray],
-) -> None:
+def test_mapped_broadcast(broadcast_input: tuple[np.ndarray, np.ndarray]) -> None:
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
@@ -319,9 +301,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 # <------------ Tests for arithmetic and logical translators/operations
 
 
-def test_alt_general_unary(
-    alt_unary_ops: tuple[Callable, np.ndarray],
-) -> None:
+def test_alt_general_unary(alt_unary_ops: tuple[Callable, np.ndarray]) -> None:
     def testee(A: np.ndarray) -> np.ndarray:
         return alt_unary_ops[0](A)
 
diff --git a/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
index 088e5d6..9300254 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
@@ -35,9 +35,7 @@
 
 
 @pytest.fixture(params=[(10,), (10, 1), (1, 10)])
-def vector_shape(
-    request,
-) -> tuple[int, ...]:
+def vector_shape(request) -> tuple[int, ...]:
     """Shapes used in the `test_bid_vector()` tests."""
     return request.param
 
@@ -70,9 +68,7 @@ def testee(a: float) -> jax.Array:
     assert np.all(res == ref)
 
 
-def test_bid_vector(
-    vector_shape: Sequence[int],
-) -> None:
+def test_bid_vector(vector_shape: Sequence[int]) -> None:
     """Broadcast a vector to a tensor."""
 
     def testee(A: np.ndarray) -> jax.Array:
diff --git a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
index 181b384..fe86b4b 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
@@ -38,17 +38,13 @@
 
 
 @pytest.fixture(params=_DACE_REAL_TYPES)
-def src_type(
-    request,
-) -> type:
+def src_type(request) -> type:
     """All valid source types, with the exception of bool."""
     return request.param
 
 
 @pytest.fixture(params=_DACE_REAL_TYPES + _DACE_COMPLEX_TYPES)
-def dst_type(
-    request,
-) -> type:
+def dst_type(request) -> type:
     """All valid destination types, with the exception of bool.
 
     Includes also complex types, because going from real to complex is useful,
@@ -57,10 +53,7 @@ def dst_type(
     return request.param
 
 
-def _convert_element_type_impl(
-    input_type: type,
-    output_type: type,
-) -> None:
+def _convert_element_type_impl(input_type: type, output_type: type) -> None:
     """Implementation of the tests of the convert element types primitive."""
     lowering_cnt = [0]
     A: np.ndarray = testutil.mkarray((10, 10), input_type)
@@ -79,20 +72,13 @@ def converter(A: np.ndarray) -> jax.Array:
     assert np.allclose(ref, res)
 
 
-def test_convert_element_type_main(
-    src_type: type,
-    dst_type: type,
-) -> None:
+def test_convert_element_type_main(src_type: type, dst_type: type) -> None:
     _convert_element_type_impl(src_type, dst_type)
 
 
-def test_convert_element_type_from_bool(
-    src_type: type,
-) -> None:
+def test_convert_element_type_from_bool(src_type: type) -> None:
     _convert_element_type_impl(np.bool_, src_type)
 
 
-def test_convert_element_type_to_bool(
-    src_type: type,
-) -> None:
+def test_convert_element_type_to_bool(src_type: type) -> None:
     _convert_element_type_impl(src_type, np.bool_)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_reshape.py b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
index a63b3f3..ac4ad50 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_reshape.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
@@ -26,9 +26,7 @@
 
 
 def _test_impl_reshaping(
-    src_shape: Sequence[int],
-    dst_shape: Sequence[int],
-    order: str = "C",
+    src_shape: Sequence[int], dst_shape: Sequence[int], order: str = "C"
 ) -> None:
     """Performs a reshaping from `src_shape` to `dst_shape`."""
     A = testutil.mkarray(src_shape)
@@ -45,61 +43,41 @@ def testee(A: np.ndarray) -> jax.Array:
 
 
 @pytest.fixture(
-    params=[
-        "C",
-        pytest.param("F", marks=pytest.mark.skip("Non C order is not supported")),
-    ]
+    params=["C", pytest.param("F", marks=pytest.mark.skip("Non C order is not supported"))]
 )
-def mem_order(
-    request,
-) -> str:
+def mem_order(request) -> str:
     """Gets the memory order that we want."""
     return request.param
 
 
 @pytest.fixture(params=[(216, 1, 1), (1, 216, 1), (1, 1, 216), (1, 6, 36), (36, 1, 6)])
-def new_shape(
-    request,
-) -> None:
+def new_shape(request) -> None:
     """New shapes for the `test_reshaping_same_rank()` test."""
     return request.param
 
 
 @pytest.fixture(params=[(12, 1), (1, 12), (1, 1, 12), (1, 2, 6)])
-def expanded_shape(
-    request,
-) -> None:
+def expanded_shape(request) -> None:
     """New shapes for the `test_reshaping_removing_rank()` test."""
     return request.param
 
 
 @pytest.fixture(params=[(216,), (6, 36), (36, 6), (216, 1)])
-def reduced_shape(
-    request,
-) -> None:
+def reduced_shape(request) -> None:
     """New shapes for the `test_reshaping_adding_rank()` test."""
     return request.param
 
 
-def test_reshaping_same_rank(
-    new_shape: Sequence[int],
-    mem_order: str,
-) -> None:
+def test_reshaping_same_rank(new_shape: Sequence[int], mem_order: str) -> None:
     """The rank, numbers of dimensions, stays the same,"""
     _test_impl_reshaping((6, 6, 6), new_shape, mem_order)
 
 
-def test_reshaping_adding_rank(
-    expanded_shape: Sequence[int],
-    mem_order: str,
-) -> None:
+def test_reshaping_adding_rank(expanded_shape: Sequence[int], mem_order: str) -> None:
     """Adding ranks to an array."""
     _test_impl_reshaping((12,), expanded_shape, mem_order)
 
 
-def test_reshaping_removing_rank(
-    reduced_shape: Sequence[int],
-    mem_order: str,
-) -> None:
+def test_reshaping_removing_rank(reduced_shape: Sequence[int], mem_order: str) -> None:
     """Removing ranks from an array."""
     _test_impl_reshaping((6, 6, 6), reduced_shape, mem_order)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_select_n.py b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
index e9871bf..a5faa44 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_select_n.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
@@ -24,10 +24,7 @@
     from collections.abc import Callable
 
 
-def _perform_test(
-    testee: Callable,
-    *args: Any,
-) -> None:
+def _perform_test(testee: Callable, *args: Any) -> None:
     res = testee(*args)
     ref = jace.jit(testee)(*args)
     assert np.all(res == ref)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_slicing.py b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
index 95778da..6c70c4e 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_slicing.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
@@ -36,16 +36,12 @@ def A_4x4x4x4() -> np.ndarray:
         (3, 1, 3, 0),  # Will lead to readjustment of the start index.
     ]
 )
-def full_dynamic_start_idx(
-    request,
-) -> tuple[int, int, int, int]:
+def full_dynamic_start_idx(request) -> tuple[int, int, int, int]:
     """Start indexes for the slice window of `test_dynamic_slice_full_dynamic()`."""
     return request.param
 
 
-def test_slice_no_strides(
-    A_20x20x20: np.ndarray,
-) -> None:
+def test_slice_no_strides(A_20x20x20: np.ndarray) -> None:
     """Test without strides."""
 
     def testee(A: np.ndarray) -> jax.Array:
@@ -59,9 +55,7 @@ def testee(A: np.ndarray) -> jax.Array:
     assert np.all(ref == res)
 
 
-def test_slice_strides(
-    A_20x20x20: np.ndarray,
-) -> None:
+def test_slice_strides(A_20x20x20: np.ndarray) -> None:
     """Test with strides."""
 
     def testee(A: np.ndarray) -> jax.Array:
@@ -79,8 +73,7 @@ def testee(A: np.ndarray) -> jax.Array:
     "In unoptimized mode there is an error, that is caused because we have an array insteadof a scalar."
 )
 def test_dynamic_slice_full_dynamic(
-    A_4x4x4x4: np.ndarray,
-    full_dynamic_start_idx: tuple[int, int, int, int],
+    A_4x4x4x4: np.ndarray, full_dynamic_start_idx: tuple[int, int, int, int]
 ) -> None:
     def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> jax.Array:
         return jax.lax.dynamic_slice(A, (s1, s2, s3, s4), (2, 2, 2, 2))
@@ -94,9 +87,7 @@ def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> jax.Array:
 @pytest.mark.skip(
     "In unoptimized mode there is an error, that is caused because we have an array insteadof a scalar."
 )
-def test_dynamic_slice_partially_dynamic(
-    A_4x4x4x4: np.ndarray,
-) -> None:
+def test_dynamic_slice_partially_dynamic(A_4x4x4x4: np.ndarray) -> None:
     def testee(A: np.ndarray, s1: int, s2: int) -> jax.Array:
         return jax.lax.dynamic_slice(A, (s1, 1, s2, 2), (2, 2, 2, 2))
 
@@ -109,9 +100,7 @@ def testee(A: np.ndarray, s1: int, s2: int) -> jax.Array:
 @pytest.mark.skip(
     "In unoptimized mode there is an error, that is caused because we have an array insteadof a scalar."
 )
-def test_dynamic_slice_full_literal(
-    A_4x4x4x4: np.ndarray,
-) -> None:
+def test_dynamic_slice_full_literal(A_4x4x4x4: np.ndarray) -> None:
     def testee(A: np.ndarray) -> jax.Array:
         return jax.lax.dynamic_slice(A, (0, 1, 0, 2), (2, 2, 2, 2))
 
diff --git a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
index cc5f56e..c82e4bb 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
@@ -30,10 +30,7 @@
     from collections.abc import Sequence
 
 
-def _roundtrip_implementation(
-    shape: Sequence[int],
-    axis: int | Sequence[int],
-) -> None:
+def _roundtrip_implementation(shape: Sequence[int], axis: int | Sequence[int]) -> None:
     """Implementation of the test for `expand_dims()` and `squeeze()`.
 
     It will first add dimensions and then remove them.
@@ -59,33 +56,18 @@ def _roundtrip_implementation(
 
 
 @pytest.fixture(params=[0, -1, 1])
-def single_axis(
-    request,
-) -> int:
+def single_axis(request) -> int:
     return request.param
 
 
-@pytest.fixture(
-    params=[
-        0,
-        -1,
-        (1, 2, 3),
-        (3, 2, 1),
-    ]
-)
-def multiple_axis(
-    request,
-) -> tuple[int, ...] | int:
+@pytest.fixture(params=[0, -1, (1, 2, 3), (3, 2, 1)])
+def multiple_axis(request) -> tuple[int, ...] | int:
     return request.param
 
 
-def test_expand_squeeze_rountrip_simple(
-    single_axis: int,
-) -> None:
+def test_expand_squeeze_rountrip_simple(single_axis: int) -> None:
     _roundtrip_implementation((10,), single_axis)
 
 
-def test_expand_squeeze_rountrip_big(
-    multiple_axis: Sequence[int],
-) -> None:
+def test_expand_squeeze_rountrip_big(multiple_axis: Sequence[int]) -> None:
     _roundtrip_implementation((2, 3, 4, 5), multiple_axis)
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 53bd65a..17253b5 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -186,9 +186,7 @@ def test_builder_variable_alloc_prefix_naming(
     assert exp_name_3 == sdfg_name_3
 
 
-def test_builder_nested(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
+def test_builder_nested(translation_builder: translator.JaxprTranslationBuilder) -> None:
     """Tests the ability of the nesting of the builder."""
 
     # Now add a variable to the current subtext.
@@ -260,9 +258,7 @@ def test_builder_nested(
     assert name_3 == translation_builder.map_jax_var_to_sdfg(array3)
 
 
-def test_builder_append_state(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
+def test_builder_append_state(translation_builder: translator.JaxprTranslationBuilder) -> None:
     """Tests the functionality of appending states."""
     sdfg: dace.SDFG = translation_builder.sdfg
 
@@ -348,10 +344,7 @@ def test_builder_variable_alloc_list(
     var_list_1 = [array1, nscal, scal2]
     exp_names_1 = ["a", nscal.name, "c"]
 
-    res_names_1 = translation_builder.create_jax_var_list(
-        var_list_1,
-        update_var_mapping=True,
-    )
+    res_names_1 = translation_builder.create_jax_var_list(var_list_1, update_var_mapping=True)
     assert len(translation_builder.arrays) == 3
     assert res_names_1 == exp_names_1
 
@@ -359,10 +352,7 @@ def test_builder_variable_alloc_list(
     var_list_2 = [array2, nscal, scal1]
     exp_names_2 = ["d", nscal.name, "e"]
 
-    res_names_2 = translation_builder.create_jax_var_list(
-        var_list_2,
-        update_var_mapping=True,
-    )
+    res_names_2 = translation_builder.create_jax_var_list(var_list_2, update_var_mapping=True)
     assert res_names_2 == exp_names_2
     assert len(translation_builder.arrays) == 5
 
@@ -406,10 +396,7 @@ def test_builder_variable_alloc_list_prevent_creation(
         expected_exception=ValueError,
         match=re.escape(f"'prevent_creation' given but have to create '{array2}'."),
     ):
-        translation_builder.create_jax_var_list(
-            var_list,
-            prevent_creation=True,
-        )
+        translation_builder.create_jax_var_list(var_list, prevent_creation=True)
     assert len(translation_builder.arrays) == 1
     assert translation_builder.map_jax_var_to_sdfg(array1) == "a"
 
@@ -433,10 +420,7 @@ def test_builder_variable_alloc_list_only_creation(
         expected_exception=ValueError,
         match=re.escape(f"'only_creation' given '{array1}' already exists."),
     ):
-        translation_builder.create_jax_var_list(
-            var_list,
-            only_creation=True,
-        )
+        translation_builder.create_jax_var_list(var_list, only_creation=True)
     assert len(translation_builder.arrays) == 1
     assert translation_builder.map_jax_var_to_sdfg(array1) == "a"
 
@@ -461,23 +445,15 @@ def test_builder_variable_alloc_list_handle_literal(
         expected_exception=ValueError,
         match=re.escape("Encountered a literal but `handle_literals` was `False`."),
     ):
-        translation_builder.create_jax_var_list(
-            var_list,
-            handle_literals=False,
-        )
+        translation_builder.create_jax_var_list(var_list, handle_literals=False)
     assert len(translation_builder.arrays) == 0
 
-    name_list = translation_builder.create_jax_var_list(
-        var_list,
-        handle_literals=True,
-    )
+    name_list = translation_builder.create_jax_var_list(var_list, handle_literals=True)
     assert len(translation_builder.arrays) == 0
     assert name_list == [None]
 
 
-def test_builder_constants(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
+def test_builder_constants(translation_builder: translator.JaxprTranslationBuilder) -> None:
     """Tests part of the `JaxprTranslationBuilder._create_constants()` api.
 
     See also the `test_subtranslators_alu.py::test_add3` test.
@@ -641,8 +617,7 @@ def test_builder_jace_var() -> None:
     """Simple tests about the `JaCeVar` objects."""
     for iname in ["do", "", "_ _", "9al", "_!"]:
         with pytest.raises(
-            expected_exception=ValueError,
-            match=re.escape(f"Supplied the invalid name '{iname}'."),
+            expected_exception=ValueError, match=re.escape(f"Supplied the invalid name '{iname}'.")
         ):
             _ = JaCeVar((), dace.int8, name=iname)
 
diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index 2a6ca33..2c1f005 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -115,10 +115,7 @@ def test_subtranslatior_managing_swap() -> None:
     """Tests the `translator.set_active_primitive_translators_to()` functionality."""
 
     # Allows to compare the structure of dicts.
-    def same_structure(
-        d1: Mapping,
-        d2: Mapping,
-    ) -> bool:
+    def same_structure(d1: Mapping, d2: Mapping) -> bool:
         return d1.keys() == d2.keys() and all(id(d2[k]) == id(d1[k]) for k in d1)
 
     initial_primitives = translator.get_registered_primitive_translators()
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index 306b244..29ec75e 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -400,11 +400,7 @@ def wrapped(A: np.ndarray) -> np.ndarray:
         return A + 10.0
 
     shape = (10, 100, 1000)
-    C = np.array(
-        (testutil.mkarray(shape) - 0.5) * 10,
-        order="C",
-        dtype=np.float64,
-    )
+    C = np.array((testutil.mkarray(shape) - 0.5) * 10, order="C", dtype=np.float64)
     F = np.array(C, copy=True, order="F")
 
     # First we compile run it with C strides.
@@ -431,8 +427,7 @@ def test_caching_jax_numpy_array() -> None:
     """Tests if jax arrays are handled the same way as numpy array."""
 
     def _test_impl(
-        for_lowering: np.ndarray | jax.Array,
-        for_calling: np.ndarray | jax.Array,
+        for_lowering: np.ndarray | jax.Array, for_calling: np.ndarray | jax.Array
     ) -> None:
         tcache.clear_translation_cache()
         lowering_cnt = [0]
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index a9beae2..7d06a2d 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -194,7 +194,7 @@ def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
         jaxpr = jax.make_jaxpr(testee)(A, B)
 
     builder = translator.JaxprTranslationBuilder(
-        primitive_translators=translator.get_registered_primitive_translators(),
+        primitive_translators=translator.get_registered_primitive_translators()
     )
     trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
 
diff --git a/tests/util.py b/tests/util.py
index c5ff56e..f7e5d7a 100644
--- a/tests/util.py
+++ b/tests/util.py
@@ -18,15 +18,10 @@
     from collections.abc import Sequence
 
 
-__all__ = [
-    "mkarray",
-]
+__all__ = ["mkarray"]
 
 
-def mkarray(
-    shape: Sequence[int] | int,
-    dtype: type = np.float64,
-) -> np.ndarray:
+def mkarray(shape: Sequence[int] | int, dtype: type = np.float64) -> np.ndarray:
     """Generates a NumPy ndarray with shape `shape`.
 
     The function uses the generator that is managed by the `_reset_random_seed()` fixture.

From 3c6194ae31abd884766925e8299538ebb5178bab Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 7 Jun 2024 15:56:14 +0200
Subject: [PATCH 334/458] I have now disabled the magic comma in ruff.

I do not like it, but it is fully in line with what the black manpage tells:
	By using it, you agree to cede control over minutiae of hand-formatting.
	In return, Black gives you speed, determinism, and freedom from pycodestyle nagging about formatting.
	You will save time and mental energy for more important matters.

This follows the mantra "what the formater does on the _big scale_ is _always_ correct regardless how it looks".
Disabeling it, is still allowed locally.
---
 docs/conf.py                                  | 22 +----
 noxfile.py                                    |  8 +-
 pyproject.toml                                |  1 +
 src/jace/api.py                               |  7 +-
 src/jace/optimization.py                      | 15 +---
 src/jace/stages.py                            | 64 +++-----------
 .../translator/jaxpr_translator_builder.py    | 86 ++++---------------
 src/jace/translator/post_translation.py       |  3 +-
 src/jace/translator/primitive_translator.py   | 15 ++--
 .../primitive_translators/__init__.py         |  4 +-
 .../primitive_translators/alu_translator.py   | 16 +---
 src/jace/util/__init__.py                     |  6 +-
 src/jace/util/dace_helper.py                  | 10 +--
 src/jace/util/jax_helper.py                   | 26 ++----
 src/jace/util/traits.py                       | 24 ++----
 src/jace/util/translation_cache.py            | 59 +++----------
 tests/test_jaxpr_translator_builder.py        | 37 ++------
 17 files changed, 85 insertions(+), 318 deletions(-)

diff --git a/docs/conf.py b/docs/conf.py
index cb0bb09..e902d98 100644
--- a/docs/conf.py
+++ b/docs/conf.py
@@ -26,28 +26,14 @@
 ]
 
 source_suffix = [".rst", ".md"]
-exclude_patterns = [
-    "_build",
-    "**.ipynb_checkpoints",
-    "Thumbs.db",
-    ".DS_Store",
-    ".env",
-    ".venv",
-]
+exclude_patterns = ["_build", "**.ipynb_checkpoints", "Thumbs.db", ".DS_Store", ".env", ".venv"]
 
 html_theme = "furo"
 
-myst_enable_extensions = [
-    "colon_fence",
-]
+myst_enable_extensions = ["colon_fence"]
 
-intersphinx_mapping = {
-    "python": ("https://docs.python.org/3", None),
-}
+intersphinx_mapping = {"python": ("https://docs.python.org/3", None)}
 
-nitpick_ignore = [
-    ("py:class", "_io.StringIO"),
-    ("py:class", "_io.BytesIO"),
-]
+nitpick_ignore = [("py:class", "_io.StringIO"), ("py:class", "_io.BytesIO")]
 
 always_document_param_types = True
diff --git a/noxfile.py b/noxfile.py
index 3772f2d..2154c16 100644
--- a/noxfile.py
+++ b/noxfile.py
@@ -79,13 +79,7 @@ def build_api_docs(session: nox.Session) -> None:
     session.install("sphinx")
     session.chdir("docs")
     session.run(
-        "sphinx-apidoc",
-        "-o",
-        "api/",
-        "--module-first",
-        "--no-toc",
-        "--force",
-        "../src/jace",
+        "sphinx-apidoc", "-o", "api/", "--module-first", "--no-toc", "--force", "../src/jace"
     )
 
 
diff --git a/pyproject.toml b/pyproject.toml
index 3556e8a..1746b5a 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -102,6 +102,7 @@ src = ["src"]
 
 [tool.ruff.format]
 docstring-code-format = true
+skip-magic-trailing-comma = true
 
 [tool.ruff.lint]
 extend-select = [
diff --git a/src/jace/api.py b/src/jace/api.py
index 9f128b3..46e15b2 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -21,12 +21,7 @@
     from collections.abc import Callable, Mapping
 
 
-__all__ = [
-    "grad",
-    "jacfwd",
-    "jacrev",
-    "jit",
-]
+__all__ = ["grad", "jacfwd", "jacrev", "jit"]
 
 
 @overload
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index 7240b79..92b52e4 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -36,21 +36,12 @@ class CompilerOptions(TypedDict, total=False):
 
 
 # TODO(phimuell): Add a context manager to modify the default.
-DEFAULT_OPTIMIZATIONS: Final[CompilerOptions] = {
-    "auto_optimize": True,
-    "simplify": True,
-}
+DEFAULT_OPTIMIZATIONS: Final[CompilerOptions] = {"auto_optimize": True, "simplify": True}
 
-NO_OPTIMIZATIONS: Final[CompilerOptions] = {
-    "auto_optimize": False,
-    "simplify": False,
-}
+NO_OPTIMIZATIONS: Final[CompilerOptions] = {"auto_optimize": False, "simplify": False}
 
 
-def jace_optimize(
-    tsdfg: translator.TranslatedJaxprSDFG,
-    **kwargs: Unpack[CompilerOptions],
-) -> None:
+def jace_optimize(tsdfg: translator.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOptions]) -> None:
     """Performs optimization of the translated SDFG _in place_.
 
     It is recommended to use the `CompilerOptions` `TypedDict` to pass options
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 224bc00..81ebe61 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -98,11 +98,7 @@ def __init__(
         self._jit_options = {**jit_options}
         self._fun = fun
 
-    def __call__(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> Any:
+    def __call__(self, *args: Any, **kwargs: Any) -> Any:
         """Executes the wrapped function, lowering and compiling as needed in one step.
 
         The arguments passed to this function are the same as the wrapped function uses.
@@ -118,11 +114,7 @@ def __call__(
         return compiled(*args, **kwargs)
 
     @tcache.cached_transition
-    def lower(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> JaCeLowered:
+    def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
         """Lower this function explicitly for the given arguments.
 
         Performs the first two steps of the AOT steps described above, i.e.
@@ -172,10 +164,7 @@ def wrapped_fun(self) -> Callable:
         """Returns the wrapped function."""
         return self._fun
 
-    def _make_call_description(
-        self,
-        *args: Any,
-    ) -> tcache.StageTransformationSpec:
+    def _make_call_description(self, *args: Any) -> tcache.StageTransformationSpec:
         """This function computes the key for the `JaCeWrapped.lower()` call inside the cache.
 
         The function will compute a full abstract description on its argument.
@@ -203,18 +192,12 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
 
     _translated_sdfg: translator.TranslatedJaxprSDFG
 
-    def __init__(
-        self,
-        tsdfg: translator.TranslatedJaxprSDFG,
-    ) -> None:
+    def __init__(self, tsdfg: translator.TranslatedJaxprSDFG) -> None:
         super().__init__()
         self._translated_sdfg = tsdfg
 
     @tcache.cached_transition
-    def compile(
-        self,
-        compiler_options: CompilerOptions | None = None,
-    ) -> JaCeCompiled:
+    def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled:
         """Optimize and compile the lowered SDFG using `compiler_options`.
 
         Returns an object that encapsulates a compiled SDFG object. To influence
@@ -237,10 +220,7 @@ def compile(
             out_names=tsdfg.out_names,
         )
 
-    def compiler_ir(
-        self,
-        dialect: str | None = None,
-    ) -> translator.TranslatedJaxprSDFG:
+    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
         """Returns the internal SDFG.
 
         The function returns a `TranslatedJaxprSDFG` object. Direct modification
@@ -250,10 +230,7 @@ def compiler_ir(
             return self._translated_sdfg
         raise ValueError(f"Unknown dialect '{dialect}'.")
 
-    def view(
-        self,
-        filename: str | None = None,
-    ) -> None:
+    def view(self, filename: str | None = None) -> None:
         """Runs the `view()` method of the underlying SDFG.
 
         This will open a browser and display the SDFG.
@@ -268,8 +245,7 @@ def as_sdfg(self) -> dace.SDFG:
         return self.compiler_ir().sdfg
 
     def _make_call_description(
-        self,
-        compiler_options: CompilerOptions | None = None,
+        self, compiler_options: CompilerOptions | None = None
     ) -> tcache.StageTransformationSpec:
         """This function computes the key for the `self.compile()` call inside the cache.
 
@@ -280,10 +256,7 @@ def _make_call_description(
         call_args = tuple(sorted(options.items(), key=lambda x: x[0]))
         return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
 
-    def _make_compiler_options(
-        self,
-        compiler_options: CompilerOptions | None,
-    ) -> CompilerOptions:
+    def _make_compiler_options(self, compiler_options: CompilerOptions | None) -> CompilerOptions:
         return optimization.DEFAULT_OPTIMIZATIONS | (compiler_options or {})
 
 
@@ -310,10 +283,7 @@ class JaCeCompiled:
     _out_names: tuple[str, ...]
 
     def __init__(
-        self,
-        csdfg: dace_helper.CompiledSDFG,
-        inp_names: Sequence[str],
-        out_names: Sequence[str],
+        self, csdfg: dace_helper.CompiledSDFG, inp_names: Sequence[str], out_names: Sequence[str]
     ) -> None:
         if (not inp_names) or (not out_names):
             raise ValueError("Input and output can not be empty.")
@@ -321,23 +291,13 @@ def __init__(
         self._inp_names = tuple(inp_names)
         self._out_names = tuple(out_names)
 
-    def __call__(
-        self,
-        *args: Any,
-        **kwargs: Any,
-    ) -> Any:
+    def __call__(self, *args: Any, **kwargs: Any) -> Any:
         """Calls the embedded computation.
 
         The arguments must be the same as for the wrapped function, but with
         all static arguments removed.
         """
-        return dace_helper.run_jax_sdfg(
-            self._csdfg,
-            self._inp_names,
-            self._out_names,
-            args,
-            kwargs,
-        )
+        return dace_helper.run_jax_sdfg(self._csdfg, self._inp_names, self._out_names, args, kwargs)
 
 
 #: Known compilation stages in JaCe.
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 3053dd9..6c9c488 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -75,8 +75,7 @@ class JaxprTranslationBuilder:
     _ctx_stack: list[TranslationContext]
 
     def __init__(
-        self,
-        primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable],
+        self, primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable]
     ) -> None:
         # Maps name of primitives to the associated translator.
         self._primitive_translators = {**primitive_translators}
@@ -92,10 +91,7 @@ def __init__(
         self._ctx_stack = []
 
     def translate_jaxpr(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-        *,
-        name: str | None = None,
+        self, jaxpr: jax_core.ClosedJaxpr, *, name: str | None = None
     ) -> TranslationContext:
         """Perform the translation of a Jaxpr into a SDFG.
 
@@ -122,12 +118,8 @@ def translate_jaxpr(
         #       Thus the builder will start to translate a second (nested) SDFG.
         #       Also note that there is no mechanism that forces the integration of the nested
         #       SDFG/Jaxpr, this must be done manually.
-        self._allocate_translation_ctx(
-            name=name,
-        )
-        self._create_constants(
-            jaxpr=jaxpr,
-        )
+        self._allocate_translation_ctx(name=name)
+        self._create_constants(jaxpr=jaxpr)
         self._create_initial_input(jaxpr=jaxpr)
 
         return self._translate_jaxpr_internal(jaxpr)
@@ -190,10 +182,7 @@ def arrays(self) -> Mapping[str, ddata.Data]:
         """
         return cast(Mapping[str, ddata.Data], self._ctx.sdfg.arrays)
 
-    def get_array(
-        self,
-        name: str | jax_core.Atom | util.JaCeVar,
-    ) -> ddata.Data:
+    def get_array(self, name: str | jax_core.Atom | util.JaCeVar) -> ddata.Data:
         """Returns the SDFG `Data` object `name` referees to.
 
         `name` can either be a string, in which case it is interpreted as a
@@ -212,22 +201,16 @@ def get_array(
 
     @overload
     def map_jax_var_to_sdfg(
-        self,
-        jax_var: jax_core.Atom | util.JaCeVar,
-        allow_fail: Literal[False] = False,
+        self, jax_var: jax_core.Atom | util.JaCeVar, allow_fail: Literal[False] = False
     ) -> str: ...
 
     @overload
     def map_jax_var_to_sdfg(
-        self,
-        jax_var: jax_core.Atom | util.JaCeVar,
-        allow_fail: Literal[True],
+        self, jax_var: jax_core.Atom | util.JaCeVar, allow_fail: Literal[True]
     ) -> str | None: ...
 
     def map_jax_var_to_sdfg(
-        self,
-        jax_var: jax_core.Atom | util.JaCeVar,
-        allow_fail: bool = False,
+        self, jax_var: jax_core.Atom | util.JaCeVar, allow_fail: bool = False
     ) -> str | None:
         """Get the name of the SDFG variable to which `jax_var` is referring to.
 
@@ -272,9 +255,7 @@ def is_root_translator(self) -> bool:
         return len(self._ctx_stack) == 1
 
     def add_jax_name_mapping(
-        self,
-        jax_var: jax_core.Var | util.JaCeVar,
-        sdfg_name: str,
+        self, jax_var: jax_core.Var | util.JaCeVar, sdfg_name: str
     ) -> JaxprTranslationBuilder:
         """Creates a new mapping between `jax_var` to `sdfg_name`.
 
@@ -454,10 +435,7 @@ def create_jax_var_list(  # type: ignore[misc]
 
         return ret_list
 
-    def _create_initial_input(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-    ) -> None:
+    def _create_initial_input(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         """Creates the input variables of `jaxpr`.
 
         Notes:
@@ -479,10 +457,7 @@ def _create_initial_input(
         # The output list is populated by `self._translate_jaxpr_internal()`
         self._ctx.inp_names = tuple(init_in_var_names)
 
-    def _create_constants(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-    ) -> None:
+    def _create_constants(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         """Creates all constants requested by the `jaxpr`.
 
         The function will create an SDFG variable and add them as constant to
@@ -504,20 +479,13 @@ def _create_constants(
                 sdfg_name, copy.deepcopy(const_value), self._ctx.sdfg.arrays[sdfg_name]
             )
 
-    def _allocate_translation_ctx(
-        self,
-        name: str | None = None,
-    ) -> JaxprTranslationBuilder:
+    def _allocate_translation_ctx(self, name: str | None = None) -> JaxprTranslationBuilder:
         """Allocate a new context and activate it.
 
         Args:
             name: The name of the SDFG.
         """
-        self._ctx_stack.append(
-            TranslationContext(
-                name=name,
-            )
-        )
+        self._ctx_stack.append(TranslationContext(name=name))
         return self
 
     @property
@@ -542,10 +510,7 @@ def _clear_translation_ctx(self) -> TranslationContext | None:
         # Remove the current head stack.
         return self._ctx_stack.pop()
 
-    def _translate_single_eqn(
-        self,
-        eqn: jax_core.JaxprEqn,
-    ) -> None:
+    def _translate_single_eqn(self, eqn: jax_core.JaxprEqn) -> None:
         """Translate `eqn` into its SDFG equivalent.
 
         To do this the function will perform the following steps:
@@ -601,10 +566,7 @@ def _translate_single_eqn(
         # Modify terminal root state of 'self'
         self._ctx.terminal_state = new_sdfg_term_state
 
-    def _translate_jaxpr_internal(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-    ) -> TranslationContext:
+    def _translate_jaxpr_internal(self, jaxpr: jax_core.ClosedJaxpr) -> TranslationContext:
         """Performs the actual translation of the Jaxpr into an SDFG.
 
         The function assumes that the context is allocated as well as the
@@ -633,19 +595,14 @@ def _translate_jaxpr_internal(
             out_var_names = self._handle_null_jaxpr(jaxpr)
         else:
             out_var_names = self.create_jax_var_list(
-                jaxpr.jaxpr.outvars,
-                prevent_creation=True,
-                handle_literals=False,
+                jaxpr.jaxpr.outvars, prevent_creation=True, handle_literals=False
             )
 
         self._ctx.out_names = tuple(out_var_names)
 
         return cast(TranslationContext, self._clear_translation_ctx())
 
-    def _handle_null_jaxpr(
-        self,
-        jaxpr: jax_core.ClosedJaxpr,
-    ) -> list[str]:
+    def _handle_null_jaxpr(self, jaxpr: jax_core.ClosedJaxpr) -> list[str]:
         """This function is called in case a `Jaxpr` with zero equations is encountered.
 
         A function with zero equation might still have output, in which case
@@ -688,9 +645,7 @@ def _handle_null_jaxpr(
             # Now we create a variable that serves as true output, however, since the Jax variable
             #  is already known we can not update the variable mapping and must use another name.
             sdfg_out_name = self.add_array(
-                jax_out_var,
-                name_prefix="_zero_equation_output_for_",
-                update_var_mapping=False,
+                jax_out_var, name_prefix="_zero_equation_output_for_", update_var_mapping=False
             )
             out_var_names.append(sdfg_out_name)
 
@@ -753,10 +708,7 @@ class TranslationContext:
     start_state: dace.SDFGState
     terminal_state: dace.SDFGState
 
-    def __init__(
-        self,
-        name: str | None = None,
-    ) -> None:
+    def __init__(self, name: str | None = None) -> None:
         if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index 37be078..1e3f69f 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -56,8 +56,7 @@ def postprocess_jaxpr_sdfg(
 
 
 def finalize_translation_context(
-    trans_ctx: translator.TranslationContext,
-    validate: bool = True,
+    trans_ctx: translator.TranslationContext, validate: bool = True
 ) -> translator.TranslatedJaxprSDFG:
     """Finalizes the supplied translation context `trans_ctx`.
 
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index bd149d3..ca2c2fe 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -117,8 +117,7 @@ def primitive(self) -> str:
 
 @overload
 def make_primitive_translator(
-    primitive: str,
-    primitive_translator: Literal[None] = None,
+    primitive: str, primitive_translator: Literal[None] = None
 ) -> Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]: ...
 
 
@@ -129,8 +128,7 @@ def make_primitive_translator(
 
 
 def make_primitive_translator(
-    primitive: str,
-    primitive_translator: translator.PrimitiveTranslatorCallable | None = None,
+    primitive: str, primitive_translator: translator.PrimitiveTranslatorCallable | None = None
 ) -> (
     Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]
     | translator.PrimitiveTranslator
@@ -161,21 +159,18 @@ def wrapper(
 
 @overload
 def register_primitive_translator(
-    primitive_translator: Literal[None] = None,
-    overwrite: bool = False,
+    primitive_translator: Literal[None] = None, overwrite: bool = False
 ) -> Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]: ...
 
 
 @overload
 def register_primitive_translator(
-    primitive_translator: translator.PrimitiveTranslator,
-    overwrite: bool = False,
+    primitive_translator: translator.PrimitiveTranslator, overwrite: bool = False
 ) -> translator.PrimitiveTranslator: ...
 
 
 def register_primitive_translator(
-    primitive_translator: translator.PrimitiveTranslator | None = None,
-    overwrite: bool = False,
+    primitive_translator: translator.PrimitiveTranslator | None = None, overwrite: bool = False
 ) -> (
     translator.PrimitiveTranslator
     | Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]
diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 729134b..65f9153 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -11,6 +11,4 @@
 from .alu_translator import ALUTranslator
 
 
-__all__ = [
-    "ALUTranslator",
-]
+__all__ = ["ALUTranslator"]
diff --git a/src/jace/translator/primitive_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
index 8e68a75..079139d 100644
--- a/src/jace/translator/primitive_translators/alu_translator.py
+++ b/src/jace/translator/primitive_translators/alu_translator.py
@@ -29,11 +29,7 @@ class ALUTranslator(translator.PrimitiveTranslator):
     This translator will be reworked soon, it just exists that the initial PR can do anything at all!!
     """
 
-    def __init__(
-        self,
-        prim_name: str,
-        prim_tmpl: str,
-    ) -> None:
+    def __init__(self, prim_name: str, prim_tmpl: str) -> None:
         """Initialize the `ALUTranslator`."""
         self._prim_name = prim_name
         self._prim_tmpl = prim_tmpl
@@ -174,11 +170,7 @@ def __call__(
                 if in_var is None:  # So access node for literal
                     continue
                 eqn_state.add_edge(
-                    eqn_state.add_read(in_var),
-                    None,
-                    tskl_tasklet,
-                    in_connector,
-                    in_memlet,
+                    eqn_state.add_read(in_var), None, tskl_tasklet, in_connector, in_memlet
                 )
             eqn_state.add_edge(
                 tskl_tasklet,
@@ -200,9 +192,7 @@ def __call__(
         return eqn_state
 
     def _write_tasklet_code(
-        self,
-        in_var_names: Sequence[str | None],
-        eqn: jax_core.JaxprEqn,
+        self, in_var_names: Sequence[str | None], eqn: jax_core.JaxprEqn
     ) -> str:
         """This function generates the Tasklet code based on a primitive.
 
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 778c645..1d67340 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -18,11 +18,7 @@
     propose_jax_name,
     translate_dtype,
 )
-from .misc import (
-    FORBIDDEN_SDFG_VAR_NAMES,
-    VALID_SDFG_OBJ_NAME,
-    VALID_SDFG_VAR_NAME,
-)
+from .misc import FORBIDDEN_SDFG_VAR_NAMES, VALID_SDFG_OBJ_NAME, VALID_SDFG_VAR_NAME
 from .traits import (
     is_array,
     is_drop_var,
diff --git a/src/jace/util/dace_helper.py b/src/jace/util/dace_helper.py
index 613a59c..5ce559b 100644
--- a/src/jace/util/dace_helper.py
+++ b/src/jace/util/dace_helper.py
@@ -29,16 +29,10 @@
     from jace import translator
     from jace.util import dace_helper
 
-__all__ = [
-    "CompiledSDFG",
-    "compile_jax_sdfg",
-    "run_jax_sdfg",
-]
+__all__ = ["CompiledSDFG", "compile_jax_sdfg", "run_jax_sdfg"]
 
 
-def compile_jax_sdfg(
-    tsdfg: translator.TranslatedJaxprSDFG,
-) -> dace_helper.CompiledSDFG:
+def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> dace_helper.CompiledSDFG:
     """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object."""
     if any(  # We do not support the DaCe return mechanism
         array_name.startswith("__return")
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index ca6f60c..a4cd8fa 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -73,10 +73,7 @@ def __post_init__(self) -> None:
     def __hash__(self) -> int:
         return id(self)
 
-    def __eq__(
-        self,
-        other: Any,
-    ) -> bool:
+    def __eq__(self, other: Any) -> bool:
         if not isinstance(other, JaCeVar):
             return NotImplemented
         return id(self) == id(other)
@@ -102,9 +99,7 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
             )
 
 
-def get_jax_var_shape(
-    jax_var: jax_core.Atom | JaCeVar,
-) -> tuple[int | dace.symbol | str, ...]:
+def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symbol | str, ...]:
     """Returns the shape of `jax_var`."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
@@ -117,9 +112,7 @@ def get_jax_var_shape(
             raise TypeError(f"'get_jax_var_shape()` is not implemented for '{type(jax_var)}'.")
 
 
-def get_jax_var_dtype(
-    jax_var: jax_core.Atom | JaCeVar,
-) -> dace.typeclass:
+def get_jax_var_dtype(jax_var: jax_core.Atom | JaCeVar) -> dace.typeclass:
     """Returns the DaCe equivalent of `jax_var`s datatype."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
@@ -132,10 +125,7 @@ def get_jax_var_dtype(
             raise TypeError(f"'get_jax_var_dtype()` is not implemented for '{type(jax_var)}'.")
 
 
-def is_tracing_ongoing(
-    *args: Any,
-    **kwargs: Any,
-) -> bool:
+def is_tracing_ongoing(*args: Any, **kwargs: Any) -> bool:
     """Test if tracing is ongoing.
 
     While a return value `True` guarantees that a translation is ongoing, a
@@ -147,9 +137,7 @@ def is_tracing_ongoing(
     return any(isinstance(x, jax_core.Tracer) for x in itertools.chain(args, kwargs.values()))
 
 
-def translate_dtype(
-    dtype: Any,
-) -> dace.typeclass:
+def translate_dtype(dtype: Any) -> dace.typeclass:
     """Turns a Jax datatype into a DaCe datatype."""
     if dtype is None:
         raise NotImplementedError  # Handling a special case in DaCe.
@@ -210,9 +198,7 @@ def propose_jax_name(
     return jax_name
 
 
-def get_jax_literal_value(
-    lit: jax_core.Atom,
-) -> bool | float | int | np.generic:
+def get_jax_literal_value(lit: jax_core.Atom) -> bool | float | int | np.generic:
     """Returns the value a literal is wrapping.
 
     The function guarantees to return a scalar value.
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index acada34..ef918c3 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -19,9 +19,7 @@
 import jace.util as util
 
 
-def is_drop_var(
-    jax_var: jax_core.Atom | util.JaCeVar,
-) -> TypeGuard[jax_core.DropVar]:
+def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVar]:
     """Tests if `jax_var` is a drop variable, i.e. a variable that is not read from in a Jaxpr."""
 
     if isinstance(jax_var, jax_core.DropVar):
@@ -31,9 +29,7 @@ def is_drop_var(
     return False
 
 
-def is_jax_array(
-    obj: Any,
-) -> TypeGuard[jax.Array]:
+def is_jax_array(obj: Any) -> TypeGuard[jax.Array]:
     """Tests if `obj` is a Jax array.
 
     Note:
@@ -43,16 +39,12 @@ def is_jax_array(
     return isinstance(obj, jax.Array)
 
 
-def is_array(
-    obj: Any,
-) -> bool:
+def is_array(obj: Any) -> bool:
     """Identifies arrays, this also includes Jax arrays."""
     return dace.is_array(obj) or is_jax_array(obj)
 
 
-def is_scalar(
-    obj: Any,
-) -> bool:
+def is_scalar(obj: Any) -> bool:
     """Tests if `obj` is a scalar."""
     # These are the type known to DaCe; Taken from `dace.dtypes`.
     known_types = {
@@ -82,9 +74,7 @@ def is_scalar(
     return type(obj) in known_types
 
 
-def is_on_device(
-    obj: Any,
-) -> bool:
+def is_on_device(obj: Any) -> bool:
     """Tests if `obj` is on a device.
 
     Jax arrays are always on the CPU and GPU (if there is one). Thus for Jax
@@ -95,9 +85,7 @@ def is_on_device(
     return dace.is_gpu_array(obj)
 
 
-def is_fully_addressable(
-    obj: Any,
-) -> bool:
+def is_fully_addressable(obj: Any) -> bool:
     """Tests if `obj` is fully addressable, i.e. is only on this host."""
     if is_jax_array(obj):
         return obj.is_fully_addressable
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 54c722b..2320d46 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -21,16 +21,7 @@
 import dataclasses
 import functools
 from collections.abc import Callable, Hashable
-from typing import (
-    TYPE_CHECKING,
-    Any,
-    Concatenate,
-    Generic,
-    ParamSpec,
-    TypeAlias,
-    TypeVar,
-    cast,
-)
+from typing import TYPE_CHECKING, Any, Concatenate, Generic, ParamSpec, TypeAlias, TypeVar, cast
 
 import dace
 from jax import core as jax_core
@@ -77,9 +68,7 @@ def __init__(self) -> None:
 
     @abc.abstractmethod
     def _make_call_description(
-        self: CachingStage,
-        *args: Any,
-        **kwargs: Any,
+        self: CachingStage, *args: Any, **kwargs: Any
     ) -> StageTransformationSpec:
         """Generates the key that is used to store/locate the call in the cache."""
         ...
@@ -105,11 +94,7 @@ def cached_transition(
     """
 
     @functools.wraps(transition)
-    def transition_wrapper(
-        self: CachingStageType,
-        *args: P.args,
-        **kwargs: P.kwargs,
-    ) -> NextStage:
+    def transition_wrapper(self: CachingStageType, *args: P.args, **kwargs: P.kwargs) -> NextStage:
         key: StageTransformationSpec = self._make_call_description(*args, **kwargs)
         if key in self._cache:
             return self._cache[key]
@@ -126,9 +111,7 @@ def clear_translation_cache() -> None:
         stage_caches.clear()
 
 
-def get_cache(
-    stage: CachingStage,
-) -> StageCache:
+def get_cache(stage: CachingStage) -> StageCache:
     """Returns the cache that should be used for `stage`."""
     stage_type = type(stage)
     if stage_type not in _TRANSLATION_CACHES:
@@ -161,10 +144,7 @@ class _AbstractCallArgument:
     storage: dace.StorageType
 
     @classmethod
-    def from_value(
-        cls,
-        value: Any,
-    ) -> _AbstractCallArgument:
+    def from_value(cls, value: Any) -> _AbstractCallArgument:
         """Construct an `_AbstractCallArgument` from `value`."""
         if not util.is_fully_addressable(value):
             raise NotImplementedError("Distributed arrays are not addressed yet.")
@@ -201,8 +181,7 @@ def from_value(
 #: This type is the abstract description of a function call.
 #:  It is part of the key used in the cache.
 CallArgsSpec: TypeAlias = tuple[
-    _AbstractCallArgument | Hashable | tuple[str, _AbstractCallArgument | Hashable],
-    ...,
+    _AbstractCallArgument | Hashable | tuple[str, _AbstractCallArgument | Hashable], ...
 ]
 
 
@@ -246,33 +225,20 @@ class StageCache(Generic[StageType]):
     _memory: collections.OrderedDict[StageTransformationSpec, StageType]
     _size: int
 
-    def __init__(
-        self,
-        size: int = 256,
-    ) -> None:
+    def __init__(self, size: int = 256) -> None:
         self._memory = collections.OrderedDict()
         self._size = size
 
-    def __contains__(
-        self,
-        key: StageTransformationSpec,
-    ) -> bool:
+    def __contains__(self, key: StageTransformationSpec) -> bool:
         return key in self._memory
 
-    def __getitem__(
-        self,
-        key: StageTransformationSpec,
-    ) -> StageType:
+    def __getitem__(self, key: StageTransformationSpec) -> StageType:
         if key not in self:
             raise KeyError(f"Key '{key}' is unknown.")
         self._memory.move_to_end(key, last=True)
         return self._memory[key]
 
-    def __setitem__(
-        self,
-        key: StageTransformationSpec,
-        res: StageType,
-    ) -> None:
+    def __setitem__(self, key: StageTransformationSpec, res: StageType) -> None:
         if key in self:
             self._memory.move_to_end(key, last=True)
             self._memory[key] = res
@@ -281,10 +247,7 @@ def __setitem__(
                 self.popitem(None)
             self._memory[key] = res
 
-    def popitem(
-        self,
-        key: StageTransformationSpec | None,
-    ) -> None:
+    def popitem(self, key: StageTransformationSpec | None) -> None:
         """Evict `key` from `self`.
 
         If `key` is `None` the oldest entry is evicted.
diff --git a/tests/test_jaxpr_translator_builder.py b/tests/test_jaxpr_translator_builder.py
index c769788..a2337f6 100644
--- a/tests/test_jaxpr_translator_builder.py
+++ b/tests/test_jaxpr_translator_builder.py
@@ -341,10 +341,7 @@ def test_builder_variable_alloc_list(
     var_list_1 = [array1, nscal, scal2]
     exp_names_1 = ["a", nscal.name, "c"]
 
-    res_names_1 = translation_builder.create_jax_var_list(
-        var_list_1,
-        update_var_mapping=True,
-    )
+    res_names_1 = translation_builder.create_jax_var_list(var_list_1, update_var_mapping=True)
     assert len(translation_builder.arrays) == 3
     assert res_names_1 == exp_names_1
 
@@ -352,10 +349,7 @@ def test_builder_variable_alloc_list(
     var_list_2 = [array2, nscal, scal1]
     exp_names_2 = ["d", nscal.name, "e"]
 
-    res_names_2 = translation_builder.create_jax_var_list(
-        var_list_2,
-        update_var_mapping=True,
-    )
+    res_names_2 = translation_builder.create_jax_var_list(var_list_2, update_var_mapping=True)
     assert res_names_2 == exp_names_2
     assert len(translation_builder.arrays) == 5
 
@@ -399,10 +393,7 @@ def test_builder_variable_alloc_list_prevent_creation(
         expected_exception=ValueError,
         match=re.escape(f"'prevent_creation' given but have to create '{array2}'."),
     ):
-        translation_builder.create_jax_var_list(
-            var_list,
-            prevent_creation=True,
-        )
+        translation_builder.create_jax_var_list(var_list, prevent_creation=True)
     assert len(translation_builder.arrays) == 1
     assert translation_builder.map_jax_var_to_sdfg(array1) == "a"
 
@@ -426,10 +417,7 @@ def test_builder_variable_alloc_list_only_creation(
         expected_exception=ValueError,
         match=re.escape(f"'only_creation' given '{array1}' already exists."),
     ):
-        translation_builder.create_jax_var_list(
-            var_list,
-            only_creation=True,
-        )
+        translation_builder.create_jax_var_list(var_list, only_creation=True)
     assert len(translation_builder.arrays) == 1
     assert translation_builder.map_jax_var_to_sdfg(array1) == "a"
 
@@ -454,23 +442,15 @@ def test_builder_variable_alloc_list_handle_literal(
         expected_exception=ValueError,
         match=re.escape("Encountered a literal but `handle_literals` was `False`."),
     ):
-        translation_builder.create_jax_var_list(
-            var_list,
-            handle_literals=False,
-        )
+        translation_builder.create_jax_var_list(var_list, handle_literals=False)
     assert len(translation_builder.arrays) == 0
 
-    name_list = translation_builder.create_jax_var_list(
-        var_list,
-        handle_literals=True,
-    )
+    name_list = translation_builder.create_jax_var_list(var_list, handle_literals=True)
     assert len(translation_builder.arrays) == 0
     assert name_list == [None]
 
 
-def test_builder_constants(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
+def test_builder_constants(translation_builder: translator.JaxprTranslationBuilder) -> None:
     """Tests part of the `JaxprTranslationBuilder._create_constants()` api.
 
     See also the `test_subtranslators_alu.py::test_add3` test.
@@ -533,8 +513,7 @@ def test_builder_jace_var() -> None:
     """Simple tests about the `JaCeVar` objects."""
     for iname in ["do", "", "_ _", "9al", "_!"]:
         with pytest.raises(
-            expected_exception=ValueError,
-            match=re.escape(f"Supplied the invalid name '{iname}'."),
+            expected_exception=ValueError, match=re.escape(f"Supplied the invalid name '{iname}'.")
         ):
             _ = JaCeVar((), dace.int8, name=iname)
 

From c5ebe96fee1108a6b06ffa5cf6be2c98e0c4722e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.paul.mueller@bluemain.ch>
Date: Sun, 9 Jun 2024 11:14:43 +0200
Subject: [PATCH 335/458] Renamed a file.

---
 src/jace/util/__init__.py                 | 2 +-
 src/jace/util/{misc.py => definitions.py} | 0
 2 files changed, 1 insertion(+), 1 deletion(-)
 rename src/jace/util/{misc.py => definitions.py} (100%)

diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 1d67340..63029c7 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -9,6 +9,7 @@
 
 from __future__ import annotations
 
+from .definitions import FORBIDDEN_SDFG_VAR_NAMES, VALID_SDFG_OBJ_NAME, VALID_SDFG_VAR_NAME
 from .jax_helper import (
     JaCeVar,
     get_jax_var_dtype,
@@ -18,7 +19,6 @@
     propose_jax_name,
     translate_dtype,
 )
-from .misc import FORBIDDEN_SDFG_VAR_NAMES, VALID_SDFG_OBJ_NAME, VALID_SDFG_VAR_NAME
 from .traits import (
     is_array,
     is_drop_var,
diff --git a/src/jace/util/misc.py b/src/jace/util/definitions.py
similarity index 100%
rename from src/jace/util/misc.py
rename to src/jace/util/definitions.py

From 45fce564ef3bd9d993d2f368feb61afe3ea348b8 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 10 Jun 2024 10:05:07 +0200
Subject: [PATCH 336/458] Fixed an issue in the tests regarding the direct
 construction of the translation builder.

This commit essentially fixes commit `e46637d0`, that added the Jaxpr to the context, however, the commit did not updated the tests.
---
 .../test_jaxpr_translator_builder.py                 | 12 ++++++++----
 1 file changed, 8 insertions(+), 4 deletions(-)

diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 17253b5..813fbb8 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -52,7 +52,8 @@ def translation_builder() -> translator.JaxprTranslationBuilder:
     builder = translator.JaxprTranslationBuilder(
         primitive_translators=translator.get_registered_primitive_translators()
     )
-    builder._allocate_translation_ctx(name=name)
+    jaxpr = jax.make_jaxpr(lambda A: A)(1.0)  # dummy jaxpr, needed for construction.
+    builder._allocate_translation_ctx(name=name, jaxpr=jaxpr)
     return builder
 
 
@@ -66,7 +67,8 @@ def test_builder_alloc() -> None:
 
     # The reserved names will be tested in `test_builder_fork()`.
     sdfg_name = "qwertzuiopasdfghjkl"
-    builder._allocate_translation_ctx(name=sdfg_name)
+    jaxpr = jax.make_jaxpr(lambda A: A)(1.0)  # dummy jaxpr, needed for construction.
+    builder._allocate_translation_ctx(name=sdfg_name, jaxpr=jaxpr)
     assert len(builder._ctx_stack) == 1
     assert builder.is_root_translator()
 
@@ -202,7 +204,8 @@ def test_builder_nested(translation_builder: translator.JaxprTranslationBuilder)
     assert translation_builder.sdfg.number_of_edges() == 1
 
     # Now we go one subcontext deeper; note we do this manually which should not be done.
-    translation_builder._allocate_translation_ctx("builder")
+    jaxpr = jax.make_jaxpr(lambda A: A)(1.0)  # dummy jaxpr, needed for construction.
+    translation_builder._allocate_translation_ctx(name="builder", jaxpr=jaxpr)
     assert len(translation_builder._ctx_stack) == 2
     assert translation_builder.sdfg.name == "builder"
     assert translation_builder.sdfg.number_of_nodes() == 1
@@ -466,7 +469,8 @@ def test_builder_constants(translation_builder: translator.JaxprTranslationBuild
 
     # We have to manually allocate the builder context.
     #  You should not do that.
-    translation_builder._allocate_translation_ctx(name="Manual_test")
+    jaxpr = jax.make_jaxpr(lambda A: A)(1.0)  # dummy jaxpr, needed for construction.
+    translation_builder._allocate_translation_ctx(name="Manual_test", jaxpr=jaxpr)
 
     # No create the constants.
     translation_builder._create_constants(jaxpr)

From a2ee92d6cb6b66edba396cc6fcbd12af9689b129 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 10 Jun 2024 11:06:05 +0200
Subject: [PATCH 337/458] Added a layer to handle all outputs and inputs.

This should mostly finalize the work needed to enable the distinction between arrays and scalars inside the builder. While there is now this distinction inside the builder and also in the input layer, i.e. there is no silent
convertion from scalar to array, at least on CPU, on GPU we will have to do that, but we are not there yet, we still return arrays in any case. This is because
We do this, because it is a limitation in DaCe itself, and Jax itself only returns arrays.
---
 src/jace/stages.py                            |  16 +-
 .../translator/jaxpr_translator_builder.py    |  16 +-
 src/jace/translator/pre_post_translation.py   | 145 +++++++++++++++++-
 .../primitive_translators/slicing.py          |   4 +-
 src/jace/util/__init__.py                     |   2 +
 src/jace/util/dace_helper.py                  |  16 +-
 src/jace/util/traits.py                       |  30 +++-
 src/jace/util/translation_cache.py            |   2 +-
 8 files changed, 191 insertions(+), 40 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index 66d1e51..6ef47d9 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -138,12 +138,6 @@ def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
         if len(kwargs) != 0:
             raise NotImplementedError("Currently only positional arguments are supported.")
 
-        # TODO(phimuell): Currently the SDFG that we build only supports `C_CONTIGUOUS` memory
-        #  order. Since we support the paradigm that "everything passed to `lower()` should also
-        #  be accepted as argument to call the result", we forbid other memory orders here.
-        if not all((not util.is_array(arg)) or util.is_c_contiguous(arg) for arg in args):
-            raise NotImplementedError("Currently can not yet handle strides beside 'C_CONTIGUOUS'.")
-
         # In Jax `float32` is the main datatype, and they go to great lengths to avoid some
         #  aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
         #  However, in this case we will have problems when we call the SDFG, for some reasons
@@ -199,6 +193,11 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
         undefined behavior. Although `JaCeWrapped` is composable with Jax
         transformations `JaCeLowered` is not. A user should never create such
         an object, instead `JaCeWrapped.lower()` should be used.
+        The storage location and stride of an input (in addition to its shape
+        and data type) are hard coded into the SDFG. Thus, if a certain stride
+        was used for lowering a computation, that stride must also be used
+        when the SDFG is called. If the just in time compilation mode is used
+        JaCe will take care of this.
     """
 
     _translated_sdfg: translator.TranslatedJaxprSDFG
@@ -304,6 +303,10 @@ class JaCeCompiled:
     This is the last stage of the jit chain. A user should never create a
     `JaCeCompiled` instance, instead `JaCeLowered.compile()` should be used.
 
+    In order to execute the stored computation properly, an input's stride,
+    storage location, shape and datatype has to match the argument that was
+    used for lowering, i.e. was passed to the `lower()` function.
+
     Args:
         csdfg: The compiled SDFG object.
         inp_names: Names of the SDFG variables used as inputs.
@@ -314,6 +317,7 @@ class JaCeCompiled:
 
     Todo:
         - Handle pytrees.
+        - Automatic strides adaption.
     """
 
     _csdfg: dace_helper.CompiledSDFG
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 1dd1b5b..9ea37dc 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -29,14 +29,14 @@ class JaxprTranslationBuilder:
 
     The SDFG created by this class has a very particular form, which we call
     canonical. The main features of such an SDFG are:
-    - the SDFG is a list of states, ideally each state corresponds to single Jax primitive,
+    - the SDFG is a list of states, ideally each state corresponds to one Jax primitive,
     - it has a single source and sink state.
     - all variable names are derived from Jax names,
     - there are only transient variables inside the SDFG,
-    - It lacks the special `__return` variable,
+    - it lacks the special `__return` variable,
     - the `arg_names` parameter is not set,
-    - scalar variables that are used as return value are SDFG scalars, thus they
-        can not directly be used to return something.
+    - for all scalar values a ` Scalar` SDFG variable is used, thus they cannot
+        be used to return anything.
 
     For these reasons the SDFG is not directly usable, and further manipulations
     have to be performed. Especially, DaCe's validation function will fail and
@@ -110,7 +110,6 @@ def translate_jaxpr(
         Args:
             name: Use this name for the SDFG instead some generated one.
         """
-
         if len(jaxpr.effects) != 0:
             raise NotImplementedError("'Jaxpr' with side effects are not supported.")
 
@@ -267,8 +266,8 @@ def add_jax_name_mapping(
             jax_var: The Jax variable.
             sdfg_name: The name of the corresponding SDFG variable.
         """
-        assert sdfg_name
-
+        if not sdfg_name:
+            raise ValueError("Supplied 'sdfg_name' is empty.")
         if jax_var in self._jax_name_map:
             raise ValueError(
                 f"Cannot change the mapping of '{jax_var}' from"
@@ -305,7 +304,6 @@ def add_array(
             name_prefix: If given it will be used as prefix for the name.
             update_var_mapping: Update the internal variable mapping; by default `False`.
         """
-
         if isinstance(arg, jax_core.Literal):
             raise ValueError(f"Can not generate an SDFG variable for literal '{arg}'.")
 
@@ -436,7 +434,6 @@ def _create_initial_input(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         Notes:
             The function will populate the `inp_names` member of the current context.
         """
-        assert self.is_allocated(), "Builder is not allocated, can not create constants."
         assert self._ctx.inp_names is None
 
         # Handle the initial input arguments
@@ -458,7 +455,6 @@ def _create_constants(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         The function will create an SDFG variable and add them as constant to
         the SDFG. Their value is deepcopied.
         """
-        assert self.is_allocated(), "Builder is not allocated, can not create constants."
         if len(jaxpr.consts) == 0:
             return
 
diff --git a/src/jace/translator/pre_post_translation.py b/src/jace/translator/pre_post_translation.py
index 1e3f69f..be2c231 100644
--- a/src/jace/translator/pre_post_translation.py
+++ b/src/jace/translator/pre_post_translation.py
@@ -16,7 +16,9 @@
 import copy
 from typing import TYPE_CHECKING, Any
 
-from jace import translator
+import dace
+
+from jace import translator, util
 
 
 if TYPE_CHECKING:
@@ -26,7 +28,7 @@
 def postprocess_jaxpr_sdfg(
     trans_ctx: translator.TranslationContext,
     fun: Callable,  # noqa: ARG001  # Currently unused
-    call_args: Sequence[Any],  # noqa: ARG001  # Currently unused
+    call_args: Sequence[Any],  # Currently unused
     intree: None,  # noqa: ARG001  # Currently unused
 ) -> translator.TranslatedJaxprSDFG:
     """Perform the final post processing steps on the `TranslationContext` _in place_.
@@ -41,20 +43,149 @@ def postprocess_jaxpr_sdfg(
         intree: The pytree describing the inputs.
 
     Todo:
-        - Setting correct input names (layer that does not depend on JAX).
-        - Setting the correct strides & storage properties.
         - Fixing the scalar input problem on GPU.
+        - Fixing stride problem of the input.
     """
     # Currently we do nothing except finalizing.
     trans_ctx.validate()
 
-    #
-    # Assume some post processing here.
-    #
+    # Handle inputs
+    create_input_output_stages(trans_ctx=trans_ctx, call_args=call_args)
 
     return finalize_translation_context(trans_ctx, validate=True)
 
 
+def create_input_output_stages(
+    trans_ctx: translator.TranslationContext, call_args: Sequence[Any]
+) -> None:
+    """Creates an input and output state inside the SDFG in place.
+
+    Args:
+        trans_ctx: The translation context that should be modified.
+        call_args: the call arguments that should be used.
+    """
+    _create_input_state(trans_ctx, call_args)
+    _create_output_state(trans_ctx)
+
+
+def _create_output_state(trans_ctx: translator.TranslationContext) -> None:
+    """Creates the output processing stage for the SDFG in place.
+
+    The function will create a new terminal state, in which all outputs, denoted
+    in `trans_ctx.out_names` will be written in new SDFG variables. However,
+    instead of scalars the function will generate arrays of length one. This is
+    needed because DaCe can only return arrays at the moment, it is also
+    consistent with what Jax does.
+
+    Notes:
+        All output variables follow the pattern `__jace_output_{i}`, where `i`
+        is a zero based counter. Furthermore, all output variables are transients
+        since `TranslationContext` is supposed to hold canonical SDFGs only.
+    """
+    assert trans_ctx.inp_names is not None and trans_ctx.out_names is not None
+
+    if set(trans_ctx.inp_names).intersection(trans_ctx.out_names):
+        raise NotImplementedError("Shared input and output variables are not supported yet.")
+
+    output_pattern = "__jace_output_{}"
+    sdfg = trans_ctx.sdfg
+    new_output_state: dace.SDFGState = sdfg.add_state("output_processing_stage")
+    new_output_names: list[str] = []
+
+    for i, org_output_name in enumerate(trans_ctx.out_names):
+        new_output_name = output_pattern.format(i)
+        org_output_desc: dace.data.Data = sdfg.arrays[org_output_name]
+
+        if isinstance(org_output_desc, dace.data.Scalar):
+            _, new_output_desc = sdfg.add_array(
+                new_output_name,
+                dtype=org_output_desc.dtype,
+                shape=(1,),
+                transient=True,
+                strides=None,  # explicit C stride
+            )
+            memlet = dace.Memlet.simple(new_output_name, subset_str="0", other_subset_str="0")
+        else:
+            new_output_desc = org_output_desc.clone()
+            sdfg.add_datadesc(new_output_name, new_output_desc)
+            memlet = dace.Memlet.from_array(org_output_name, org_output_desc)
+
+        new_output_state.add_nedge(
+            new_output_state.add_read(org_output_name),
+            new_output_state.add_write(new_output_name),
+            memlet,
+        )
+        new_output_names.append(new_output_name)
+
+    sdfg.add_edge(trans_ctx.terminal_state, new_output_state, dace.InterstateEdge())
+    trans_ctx.terminal_state = new_output_state
+    trans_ctx.out_names = tuple(new_output_names)
+
+
+def _create_input_state(trans_ctx: translator.TranslationContext, call_args: Sequence[Any]) -> None:
+    """Creates the input processing state for the SDFG in place.
+
+    The function creates a new set of variables that are exposed as inputs, whose
+    names follows the pattern `__jace_input_{i}`, where `i` is a zero based
+    counter. These new variables will have the same strides as the input array.
+    Furthermore, they will have the correct storage locations and scalars in
+    GPU mode will be handled correctly.
+
+    Args:
+        trans_ctx: The translation context that should be modified.
+        call_args: the call arguments that should be used.
+
+    Todo:
+        Handle transfer of scalar input in GPU mode.
+    """
+    assert trans_ctx.inp_names is not None and trans_ctx.out_names is not None
+
+    if set(trans_ctx.inp_names).intersection(trans_ctx.out_names):
+        raise NotImplementedError("Shared input and output variables are not supported yet.")
+    if len(call_args) != len(trans_ctx.inp_names):
+        raise ValueError(f"Expected {len(trans_ctx.inp_names)}, but got {len(call_args)}.")
+
+    sdfg = trans_ctx.sdfg
+    new_input_state: dace.SDFGState = sdfg.add_state(f"{sdfg.name}__start_state")
+    new_input_names: list[str] = []
+    input_pattern = "__jace_input_{}"
+
+    for i, (org_input_name, call_arg) in enumerate(zip(trans_ctx.inp_names, call_args)):
+        org_input_desc: dace.data.Data = sdfg.arrays[org_input_name]
+        new_input_name = input_pattern.format(i)
+
+        if isinstance(org_input_desc, dace.data.Scalar):
+            # TODO(phimuell): In GPU mode: scalar -> GPU_ARRAY -> Old input name
+            new_input_desc: dace.data.Scalar = org_input_desc.clone()
+            sdfg.add_datadesc(new_input_name, new_input_desc)
+            memlet = dace.Memlet.simple(new_input_name, subset_str="0", other_subset_str="0")
+
+        else:
+            _, new_input_desc = sdfg.add_array(
+                name=new_input_name,
+                shape=org_input_desc.shape,
+                dtype=org_input_desc.dtype,
+                strides=util.get_strides_for_dace(call_arg),
+                transient=True,
+                storage=dace.StorageType.GPU_Global
+                if util.is_on_device(call_arg)
+                else dace.StorageType.CPU_Heap,
+            )
+            memlet = dace.Memlet.from_array(new_input_name, new_input_desc)
+
+        new_input_state.add_nedge(
+            new_input_state.add_read(new_input_name),
+            new_input_state.add_write(org_input_name),
+            memlet,
+        )
+        new_input_names.append(new_input_name)
+
+    sdfg.add_edge(new_input_state, trans_ctx.start_state, dace.InterstateEdge())
+    sdfg.start_block = sdfg.node_id(new_input_state)
+    trans_ctx.start_state = new_input_state
+    trans_ctx.inp_names = tuple(new_input_names)
+
+
 def finalize_translation_context(
     trans_ctx: translator.TranslationContext, validate: bool = True
 ) -> translator.TranslatedJaxprSDFG:
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index 5a04b3c..7a28dc0 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -97,10 +97,8 @@ def __call__(
         assert in_var_names[0]
         assert len(in_var_names) == len(util.get_jax_var_shape(eqn.invars[0])) + 1
 
-        raise NotImplementedError("This translator needs true scalars to correctly work.")
-
         # This is the sizes of the slice window.
-        window_sizes: Sequence[int] = eqn.params["slice_sizes"]  # type: ignore[unreachable]
+        window_sizes: Sequence[int] = eqn.params["slice_sizes"]
 
         # The first input to the primitive is the array we slice from, the others are the start
         #  indices of the slice window, each is a scalar, maybe literals.
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index bfff733..56fdd43 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -21,6 +21,7 @@
 )
 from .misc import FORBIDDEN_SDFG_VAR_NAMES, VALID_SDFG_OBJ_NAME, VALID_SDFG_VAR_NAME
 from .traits import (
+    get_strides_for_dace,
     is_array,
     is_c_contiguous,
     is_drop_var,
@@ -41,6 +42,7 @@
     "get_jax_var_dtype",
     "get_jax_var_name",
     "get_jax_var_shape",
+    "get_strides_for_dace",
     "is_array",
     "is_c_contiguous",
     "is_drop_var",
diff --git a/src/jace/util/dace_helper.py b/src/jace/util/dace_helper.py
index cbbb417..90db509 100644
--- a/src/jace/util/dace_helper.py
+++ b/src/jace/util/dace_helper.py
@@ -15,7 +15,6 @@
 from typing import TYPE_CHECKING, Any
 
 import dace
-import numpy as np
 from dace import data as dace_data
 
 # The compiled SDFG is not available in the dace namespace or anywhere else
@@ -38,7 +37,7 @@ def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> dace_helper.Compi
     """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object."""
     if any(  # We do not support the DaCe return mechanism
         array_name.startswith("__return")
-        for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
+        for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # We can not use `in` because we are not interested in `my_mangled_variable__return_zulu`!
     ):
         raise ValueError("Only support SDFGs without '__return' members.")
 
@@ -95,12 +94,7 @@ def run_jax_sdfg(
     Note:
         There is no pytree mechanism jet, thus the return values are returned
         inside a `tuple` or in case of one value, directly, in the order
-        determined by Jax. Furthermore, DaCe does not support scalar return
-        values, thus they are silently converted into arrays of length 1, the
-        same holds for inputs.
-
-    Todo:
-        - Implement non C strides.
+        determined by Jax. As Jax JaCe does not return scalars, but only arrays.
     """
     sdfg: dace.SDFG = csdfg.sdfg
 
@@ -116,10 +110,8 @@ def run_jax_sdfg(
     # Build the argument list that we will pass to the compiled object.
     sdfg_call_args: dict[str, Any] = {}
     for in_name, in_val in zip(inp_names, call_args, strict=True):
-        if util.is_scalar(in_val):
-            # Currently the translator makes scalar into arrays, this has to be reflected here
-            in_val = np.array([in_val])
-        elif util.is_jax_array(in_val):
+        # TODO(phimuell): Implement a stride matching process.
+        if util.is_jax_array(in_val):
             # TODO(phimuell): Add test for this.
             if not util.is_fully_addressable(in_val):
                 raise ValueError(f"Passed a not fully addressable Jax array as '{in_name}'")
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 18c975f..0fc6665 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -39,7 +39,7 @@ def is_jax_array(obj: Any) -> TypeGuard[jax.Array]:
     return isinstance(obj, jax.Array)
 
 
-def is_array(obj: Any) -> bool:
+def is_array(obj: Any) -> TypeGuard[jax.typing.ArrayLike]:
     """Identifies arrays, this also includes Jax arrays."""
     return dace.is_array(obj) or is_jax_array(obj)
 
@@ -74,6 +74,34 @@ def is_scalar(obj: Any) -> bool:
     return type(obj) in known_types
 
 
+def get_strides_for_dace(obj: Any) -> tuple[int, ...] | None:
+    """Get the strides of `obj` in a DaCe compatible format.
+
+    The function returns the strides in number of elements, as it is used inside
+    DaCe and not in bytes as it is inside NumPy. As in NumPy and DaCe the function
+    returns `None` to indicate standard C order.
+
+    Notes:
+        If `obj` is not array like an error is generated.
+    """
+    if not is_array(obj):
+        raise TypeError(f"Passed '{obj}' ({type(obj).__name__}) is not array like.")
+
+    if is_jax_array(obj):
+        if not is_fully_addressable(obj):
+            raise NotImplementedError("Sharded jax arrays are not supported.")
+        obj = obj.__array__()
+    assert hasattr(obj, "strides")
+
+    if obj.strides is None:
+        return None
+    if not hasattr(obj, "itemsize"):
+        # No `itemsize` member so we assume that it is already in elements.
+        return obj.strides
+
+    return tuple(stride // obj.itemsize for stride in obj.strides)
+
+
 def is_on_device(obj: Any) -> bool:
     """Tests if `obj` is on a device.
 
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 574541c..5476dea 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -156,7 +156,7 @@ def from_value(cls, value: Any) -> _AbstractCallArgument:
                 value = value.__array__()  # Passing `copy=False` leads to error in NumPy.
             shape = value.shape
             dtype = util.translate_dtype(value.dtype)
-            strides = getattr(value, "strides", None)
+            strides = util.get_strides_for_dace(value)
             # Is `CPU_Heap` always okay? There would also be `CPU_Pinned`.
             storage = (
                 dace.StorageType.GPU_Global

From b7fcc801e0861275b4b7e169c2d85c125f920402 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 10 Jun 2024 11:13:26 +0200
Subject: [PATCH 338/458] Updated the tests.

---
 .../test_primitive_reshape.py                 |  4 +--
 .../test_primitive_slicing.py                 |  9 -----
 .../test_jaxpr_translator_builder.py          | 36 +++++++++++--------
 .../test_primitive_translator_managing.py     |  6 +++-
 tests/unit_tests/test_caching.py              | 17 ++-------
 tests/util.py                                 | 22 +++++++-----
 6 files changed, 43 insertions(+), 51 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_reshape.py b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
index ac4ad50..be7d7ff 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_reshape.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
@@ -42,9 +42,7 @@ def testee(A: np.ndarray) -> jax.Array:
     assert np.all(res == ref)
 
 
-@pytest.fixture(
-    params=["C", pytest.param("F", marks=pytest.mark.skip("Non C order is not supported"))]
-)
+@pytest.fixture(params=["C", "F"])
 def mem_order(request) -> str:
     """Gets the memory order that we want."""
     return request.param
diff --git a/tests/integration_tests/primitive_translators/test_primitive_slicing.py b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
index 6c70c4e..b5cde93 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_slicing.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
@@ -69,9 +69,6 @@ def testee(A: np.ndarray) -> jax.Array:
     assert np.all(ref == res)
 
 
-@pytest.mark.skip(
-    "In unoptimized mode there is an error, that is caused because we have an array insteadof a scalar."
-)
 def test_dynamic_slice_full_dynamic(
     A_4x4x4x4: np.ndarray, full_dynamic_start_idx: tuple[int, int, int, int]
 ) -> None:
@@ -84,9 +81,6 @@ def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> jax.Array:
     assert np.all(ref == res)
 
 
-@pytest.mark.skip(
-    "In unoptimized mode there is an error, that is caused because we have an array insteadof a scalar."
-)
 def test_dynamic_slice_partially_dynamic(A_4x4x4x4: np.ndarray) -> None:
     def testee(A: np.ndarray, s1: int, s2: int) -> jax.Array:
         return jax.lax.dynamic_slice(A, (s1, 1, s2, 2), (2, 2, 2, 2))
@@ -97,9 +91,6 @@ def testee(A: np.ndarray, s1: int, s2: int) -> jax.Array:
     assert np.all(ref == res)
 
 
-@pytest.mark.skip(
-    "In unoptimized mode there is an error, that is caused because we have an array insteadof a scalar."
-)
 def test_dynamic_slice_full_literal(A_4x4x4x4: np.ndarray) -> None:
     def testee(A: np.ndarray) -> jax.Array:
         return jax.lax.dynamic_slice(A, (0, 1, 0, 2), (2, 2, 2, 2))
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 813fbb8..8afe6f2 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -19,7 +19,7 @@
 import jax
 import numpy as np
 import pytest
-from dace.data import Array
+from dace import data as dcdata
 from jax import numpy as jnp
 
 import jace
@@ -90,8 +90,11 @@ def test_builder_variable_alloc_auto_naming(
         sdfg_name = translation_builder.add_array(var, update_var_mapping=True)
         sdfg_var = translation_builder.get_array(sdfg_name)
         assert sdfg_name == chr(97 + i)
-        assert isinstance(sdfg_var, Array)  # Everything is now an array
-        assert sdfg_var.shape == ((1,) if var.shape == () else var.shape)
+        if var.shape == ():
+            assert isinstance(sdfg_var, dcdata.Scalar)
+        else:
+            assert isinstance(sdfg_var, dcdata.Array)
+            assert sdfg_var.shape == var.shape
         assert sdfg_var.dtype == var.dtype
 
 
@@ -110,8 +113,11 @@ def test_builder_variable_alloc_mixed_naming(
             assert sdfg_name == chr(97 + i)
         else:
             assert sdfg_name == var.name
-        assert isinstance(sdfg_var, Array)  # Everything is now an array
-        assert sdfg_var.shape == ((1,) if var.shape == () else var.shape)
+        if var.shape == ():
+            assert isinstance(sdfg_var, dcdata.Scalar)
+        else:
+            assert isinstance(sdfg_var, dcdata.Array)
+            assert sdfg_var.shape == var.shape
         assert sdfg_var.dtype == var.dtype
 
 
@@ -129,8 +135,11 @@ def test_builder_variable_alloc_mixed_naming2(
             letoff += 1
         else:
             assert sdfg_name == var.name
-        assert isinstance(sdfg_var, Array)  # Everything is now an array
-        assert sdfg_var.shape == ((1,) if var.shape == () else var.shape)
+        if var.shape == ():
+            assert isinstance(sdfg_var, dcdata.Scalar)
+        else:
+            assert isinstance(sdfg_var, dcdata.Array)
+            assert sdfg_var.shape == var.shape
         assert sdfg_var.dtype == var.dtype
 
 
@@ -469,7 +478,6 @@ def test_builder_constants(translation_builder: translator.JaxprTranslationBuild
 
     # We have to manually allocate the builder context.
     #  You should not do that.
-    jaxpr = jax.make_jaxpr(lambda A: A)(1.0)  # dummy jaxpr, needed for construction.
     translation_builder._allocate_translation_ctx(name="Manual_test", jaxpr=jaxpr)
 
     # No create the constants.
@@ -634,17 +642,15 @@ def test_builder_F_strides() -> None:
         See also `tests/test_caching.py::test_caching_strides`.
     """
 
-    @jace.jit
     def testee(A: np.ndarray) -> np.ndarray:
         return A + 10.0
 
-    F = np.full((4, 3), 10, dtype=np.float64, order="F")
+    A = testutil.mkarray((4, 3), order="F")
+    ref = testee(A)
+    res = jace.jit(testee)(A)
 
-    with pytest.raises(
-        expected_exception=NotImplementedError,
-        match=re.escape("Currently can not yet handle strides beside 'C_CONTIGUOUS'."),
-    ):
-        _ = testee(F)
+    assert ref.shape == res.shape
+    assert np.allclose(ref, res)
 
 
 def test_builder_drop_variables() -> None:
diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index 2c1f005..7d4fa8f 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -190,7 +190,11 @@ def foo(A: int) -> int:
         D = C + 1
         return D + 1
 
-    _ = foo.lower(1)
+    with pytest.warns(
+        UserWarning,
+        match='WARNING: Use of uninitialized transient "e" in state output_processing_stage',
+    ):
+        _ = foo.lower(1)
     assert trans_cnt[0] == 4
 
 
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index 29ec75e..ad16e15 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -11,11 +11,9 @@
 from __future__ import annotations
 
 import itertools as it
-import re
 
 import jax
 import numpy as np
-import pytest
 from jax import numpy as jnp
 
 import jace
@@ -200,7 +198,7 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     jaceLowered = jaceWrapped.lower(A, B)
 
     # Compiling it with and without optimizations enabled
-    optiCompiled = jaceLowered.compile()
+    optiCompiled = jaceLowered.compile(optimization.DEFAULT_OPTIMIZATIONS)
     unoptiCompiled = jaceLowered.compile(optimization.NO_OPTIMIZATIONS)
 
     # Because of the way how things work the optimized must have more than the unoptimized.
@@ -211,7 +209,6 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 
     # Now we check if they are still inside the cache.
     assert optiCompiled is jaceLowered.compile(optimization.DEFAULT_OPTIMIZATIONS)
-    assert optiCompiled is jaceLowered.compile({})
     assert unoptiCompiled is jaceLowered.compile(optimization.NO_OPTIMIZATIONS)
 
 
@@ -388,7 +385,6 @@ def testee(A: np.ndarray) -> np.ndarray:
     assert second_key not in cache
 
 
-@pytest.mark.skip("Non C order is not supported")
 def test_caching_strides() -> None:
     """Test if the cache detects a change in strides."""
 
@@ -400,21 +396,14 @@ def wrapped(A: np.ndarray) -> np.ndarray:
         return A + 10.0
 
     shape = (10, 100, 1000)
-    C = np.array((testutil.mkarray(shape) - 0.5) * 10, order="C", dtype=np.float64)
+    C = testutil.mkarray(shape, order="C")
     F = np.array(C, copy=True, order="F")
 
     # First we compile run it with C strides.
     C_lower = wrapped.lower(C)
     C_res = wrapped(C)
 
-    # Now we run it with FORTRAN strides.
-    #  However, this does not work because we do not support strides at all.
-    #  But the cache is aware of this, which helps catch some nasty bugs.
-    with pytest.raises(
-        expected_exception=NotImplementedError,
-        match=re.escape("Currently can not yet handle strides beside 'C_CONTIGUOUS'."),
-    ):
-        F_lower = wrapped.lower(F)
+    F_lower = wrapped.lower(F)
     F_res = F_lower.compile()(F)
 
     assert C_res is not F_res
diff --git a/tests/util.py b/tests/util.py
index f7e5d7a..6080a6f 100644
--- a/tests/util.py
+++ b/tests/util.py
@@ -21,11 +21,11 @@
 __all__ = ["mkarray"]
 
 
-def mkarray(shape: Sequence[int] | int, dtype: type = np.float64) -> np.ndarray:
+def mkarray(shape: Sequence[int] | int, dtype: type = np.float64, order: str = "C") -> np.ndarray:
     """Generates a NumPy ndarray with shape `shape`.
 
-    The function uses the generator that is managed by the `_reset_random_seed()` fixture.
-    Thus inside a function the value will be deterministic.
+    The function uses the generator that is managed by the `_reset_random_seed()`
+    fixture. Thus inside a function the value will be deterministic.
 
     Args:
         shape:      The shape to use.
@@ -41,10 +41,14 @@ def mkarray(shape: Sequence[int] | int, dtype: type = np.float64) -> np.ndarray:
         shape = (shape,)
 
     if dtype == np.bool_:
-        return np.random.random(shape) > 0.5  # noqa: NPY002
-    if np.issubdtype(dtype, np.integer):
+        res = np.random.random(shape) > 0.5  # noqa: NPY002
+    elif np.issubdtype(dtype, np.integer):
         iinfo: np.iinfo = np.iinfo(dtype)
-        return np.random.randint(low=iinfo.min, high=iinfo.max, size=shape, dtype=dtype)  # noqa: NPY002
-    if np.issubdtype(dtype, np.complexfloating):
-        return np.array(mkarray(shape, np.float64) + 1.0j * mkarray(shape, np.float64), dtype=dtype)
-    return np.array(np.random.random(shape), dtype=dtype)  # noqa: NPY002
+        res = np.random.randint(  # type: ignore[assignment]  # noqa: NPY002
+            low=iinfo.min, high=iinfo.max, size=shape, dtype=dtype
+        )
+    elif np.issubdtype(dtype, np.complexfloating):
+        res = mkarray(shape, np.float64) + 1.0j * mkarray(shape, np.float64)
+    else:
+        res = np.random.random(shape)  # type: ignore[assignment]  # noqa: NPY002
+    return np.array(res, order=order, dtype=dtype)  # type: ignore[call-overload]

From b47284dca2f475da0743bcf100ea3603be924865 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 10 Jun 2024 13:14:23 +0200
Subject: [PATCH 339/458] Some small changes.

---
 .../translator/jaxpr_translator_builder.py    |   8 +-
 .../primitive_translators/alu_translator.py   | 282 ------------------
 src/jace/util/dace_helper.py                  |  11 +-
 3 files changed, 8 insertions(+), 293 deletions(-)
 delete mode 100644 src/jace/translator/primitive_translators/alu_translator.py

diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 9ea37dc..107c58c 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -114,10 +114,10 @@ def translate_jaxpr(
             raise NotImplementedError("'Jaxpr' with side effects are not supported.")
 
         # NOTE: If `self` is already allocated, i.e. has an ongoing translation process,
-        #       the `_allocate_translation_ctx()` function will start a new context.
-        #       Thus the builder will start to translate a second (nested) SDFG.
-        #       Also note that there is no mechanism that forces the integration of the nested
-        #       SDFG/Jaxpr, this must be done manually.
+        #  the `_allocate_translation_ctx()` function will start a new context. Thus the
+        #  builder will start to translate a second (nested) SDFG. Also note that there
+        #  is no mechanism that forces the integration of the nested SDFG/Jaxpr,
+        #  this must be done manually.
         self._allocate_translation_ctx(name=name, jaxpr=jaxpr)
         self._create_constants(jaxpr=jaxpr)
         self._create_initial_input(jaxpr=jaxpr)
diff --git a/src/jace/translator/primitive_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
deleted file mode 100644
index 079139d..0000000
--- a/src/jace/translator/primitive_translators/alu_translator.py
+++ /dev/null
@@ -1,282 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""This module contains the `ALUTranslator` which translates all arithmetic and logic primitives."""
-
-from __future__ import annotations
-
-from typing import TYPE_CHECKING, Any, Final, cast
-
-import dace
-import numpy as np
-from jax import core as jax_core
-from typing_extensions import override
-
-from jace import translator, util
-
-
-if TYPE_CHECKING:
-    from collections.abc import Sequence
-
-
-class ALUTranslator(translator.PrimitiveTranslator):
-    """This translator handles all arithmetic and logical operations.
-
-    This translator will be reworked soon, it just exists that the initial PR can do anything at all!!
-    """
-
-    def __init__(self, prim_name: str, prim_tmpl: str) -> None:
-        """Initialize the `ALUTranslator`."""
-        self._prim_name = prim_name
-        self._prim_tmpl = prim_tmpl
-
-    @property
-    @override
-    def primitive(self) -> str:
-        return self._prim_name
-
-    @override
-    def __call__(
-        self,
-        builder: translator.JaxprTranslationBuilder,
-        in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
-        eqn: jax_core.JaxprEqn,
-        eqn_state: dace.SDFGState,
-    ) -> None:
-        """Perform the translation.
-
-        Deepening on the shapes of the input the function will either create a Tasklet or a mapped Tasklet.
-        The translator is able to handle broadcasting with NumPy rules.
-        The function will always perform the translation inside the provided state.
-
-        Args:
-            builder:         The builder object of the translation.
-            in_var_names:   List of the names of the arrays created inside the SDFG for the inpts or 'None' in case of a literal.
-            out_var_names:  List of the names of the arrays created inside the SDFG for the outputs.
-            eqn:            The Jax equation that is translated.
-            eqn_state:      State into which the primitive's SDFG representation is constructed.
-        """
-        assert self._prim_name == eqn.primitive.name
-
-        # Determine what kind of input we got and how we should proceed.
-        is_scalar = len(util.get_jax_var_shape(eqn.outvars[0])) == 0
-        inp_scalars = [len(util.get_jax_var_shape(Inp)) == 0 for i, Inp in enumerate(eqn.invars)]
-        has_scalars_as_inputs = any(inp_scalars)
-        has_some_literals = any(x is None for x in in_var_names)
-        inps_same_shape = all(
-            util.get_jax_var_shape(eqn.invars[0]) == util.get_jax_var_shape(eqn.invars[i])
-            for i in range(1, len(eqn.invars))
-        )
-
-        # We will now look which dimensions have to be broadcasted on which operator.
-        #  I.e. in the dimensions in the lists below there will be no map iteration index.
-        dims_to_bcastl: list[int] = []
-        dims_to_bcastr: list[int] = []
-
-        # Determine if and how we have to broadcast.
-        if inps_same_shape or is_scalar:
-            pass
-
-        elif has_some_literals or has_scalars_as_inputs:
-            # This is essentially an array plus a scalar, that is eitehr a literal or a variable.
-            assert (not has_some_literals) or all(
-                util.get_jax_var_shape(invar) == util.get_jax_var_shape(eqn.outvars[0])
-                for (invar, x) in zip(eqn.invars, in_var_names, strict=False)
-                if x is not None
-            )
-            assert (not has_scalars_as_inputs) or all(
-                util.get_jax_var_shape(invar) in {util.get_jax_var_shape(eqn.outvars[0]), ()}
-                for (invar, x) in zip(eqn.invars, in_var_names, strict=False)
-                if x is not None
-            )
-
-        else:
-            # This is the general broadcasting case
-            #  We assume that both inputs and the output have the same rank but different sizes in each dimension.
-            #  It seems that Jax ensures this.
-            #  We further assume that if the size in a dimension differs then one must have size 1.
-            #  This is the size we broadcast over, i.e. conceptually replicated.
-            out_shps = tuple(util.get_jax_var_shape(eqn.outvars[0]))  # Shape of the output
-            inp_shpl = tuple(util.get_jax_var_shape(eqn.invars[0]))  # Shape of the left/first input
-            inp_shpr = tuple(
-                util.get_jax_var_shape(eqn.invars[1])
-            )  # Shape of the right/second input
-
-            if not ((len(inp_shpl) == len(inp_shpr)) and (len(out_shps) == len(inp_shpr))):
-                raise NotImplementedError("Can not broadcast over different ranks.")
-
-            for dim, (shp_lft, shp_rgt, out_shp) in enumerate(zip(inp_shpl, inp_shpr, out_shps)):
-                if shp_lft == shp_rgt:
-                    assert out_shp == shp_lft
-                elif shp_lft == 1:
-                    assert shp_rgt == out_shp
-                    dims_to_bcastl.append(dim)
-                elif shp_rgt == 1:
-                    assert shp_lft == out_shp
-                    dims_to_bcastr.append(dim)
-                else:
-                    raise ValueError(f"Invalid shapes in dimension {dim} for broadcasting.")
-
-        # Now we create the Tasklet in which the calculation is performed.
-        tskl_code: str = self._write_tasklet_code(in_var_names, eqn)
-        tskl_name: str = eqn.primitive.name
-        tskl_map_ranges: list[tuple[str, str]] = [
-            (f"__i{dim}", f"0:{N}") for dim, N in enumerate(util.get_jax_var_shape(eqn.outvars[0]))
-        ]
-        tskl_output: tuple[str, dace.Memlet] = None  # type: ignore[assignment]
-        tskl_inputs: list[tuple[str, dace.Memlet] | tuple[None, None]] = []
-
-        # Generate the Memlets for the input.
-        for i, dims_to_bcast in zip(range(len(in_var_names)), [dims_to_bcastl, dims_to_bcastr]):
-            if in_var_names[i] is None:  # Literal: No input needed.
-                tskl_inputs.append((None, None))
-                continue
-            if inp_scalars[i]:  # Scalar
-                assert len(dims_to_bcast) == 0
-                i_memlet = dace.Memlet.simple(in_var_names[i], "0")
-            else:  # Array: We may have to broadcast
-                inputs_: list[str] = []
-                for dim, (map_var, _) in enumerate(tskl_map_ranges):
-                    if dim in dims_to_bcast:
-                        inputs_.append("0")
-                    else:
-                        inputs_.append(map_var)
-                i_memlet = dace.Memlet.simple(in_var_names[i], ", ".join(inputs_))
-                del inputs_
-            tskl_inputs.append((f"__in{i}", i_memlet))
-
-        # Now generate the Memlets for the output
-        if is_scalar:
-            tskl_output = ("__out0", dace.Memlet.simple(out_var_names[0], "0"))
-        else:
-            tskl_output = (
-                "__out0",
-                dace.Memlet.simple(out_var_names[0], ", ".join([X[0] for X in tskl_map_ranges])),
-            )
-
-        if is_scalar:
-            tskl_tasklet = eqn_state.add_tasklet(
-                tskl_name,
-                _list_to_dict(tskl_inputs).keys(),
-                _list_to_dict([tskl_output]).keys(),
-                tskl_code,
-            )
-            for in_var, (in_connector, in_memlet) in zip(in_var_names, tskl_inputs, strict=False):
-                if in_var is None:  # So access node for literal
-                    continue
-                eqn_state.add_edge(
-                    eqn_state.add_read(in_var), None, tskl_tasklet, in_connector, in_memlet
-                )
-            eqn_state.add_edge(
-                tskl_tasklet,
-                tskl_output[0],
-                eqn_state.add_write(out_var_names[0]),
-                None,
-                tskl_output[1],
-            )
-        else:
-            eqn_state.add_mapped_tasklet(
-                name=tskl_name,
-                map_ranges=_list_to_dict(tskl_map_ranges),
-                inputs=_list_to_dict(tskl_inputs),
-                code=tskl_code,
-                outputs=_list_to_dict([tskl_output]),
-                external_edges=True,
-            )
-
-        return eqn_state
-
-    def _write_tasklet_code(
-        self, in_var_names: Sequence[str | None], eqn: jax_core.JaxprEqn
-    ) -> str:
-        """This function generates the Tasklet code based on a primitive.
-
-        The function will also perform literal substitution and parameter handling.
-
-        Args:
-            in_var_names:   The list of SDFG variables used as input.
-        """
-
-        t_code = self._prim_tmpl
-
-        # Now we handle Literal substitution
-        for i, in_var_name in enumerate(in_var_names):
-            if in_var_name is not None:
-                continue
-
-            jax_in_var: jax_core.Literal = cast(jax_core.Literal, eqn.invars[i])
-            if util.get_jax_var_shape(jax_in_var) == ():
-                t_val = jax_in_var.val
-                if isinstance(t_val, np.ndarray):
-                    t_val = jax_in_var.val.max()  # I do not know a better way in that case
-                t_code = t_code.replace(f"__in{i}", str(t_val))
-            else:
-                raise ValueError(
-                    f"Can not handle the literal case of shape: {util.get_jax_var_shape(jax_in_var)}"
-                )
-
-        # Now replace the parameters
-        if len(eqn.params) != 0:
-            t_code = t_code.format(**eqn.params)
-
-        return t_code
-
-
-def _list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
-    """This method turns a `list` of pairs into a `dict` and applies a `None` filter.
-
-    The function will only include pairs whose key, i.e. first element is not `None`.
-    """
-    return {k: v for k, v in inp if k is not None}
-
-
-# Contains all the templates for ALU operations.
-_ALU_OPS_TASKLET_TEMPLATES: Final[dict[str, str]] = {
-    # Unary operations
-    "pos": "__out0 = +(__in0)",
-    "neg": "__out0 = -(__in0)",
-    "not": "__out0 = not (__in0)",
-    "floor": "__out0 = floor(__in0)",
-    "ceil": "__out0 = ceil(__in0)",
-    "round": "__out0 = round(__in0)",
-    "abs": "__out0 = abs(__in0)",
-    "sign": "__out0 = sign(__in0)",
-    "sqrt": "__out0 = sqrt(__in0)",
-    "log": "__out0 = log(__in0)",
-    "exp": "__out0 = exp(__in0)",
-    "integer_pow": "__out0 = (__in0)**({y})",  # 'y' is a parameter of the primitive
-    "sin": "__out0 = sin(__in0)",
-    "asin": "__out0 = asin(__in0)",
-    "cos": "__out0 = cos(__in0)",
-    "acos": "__out0 = acos(__in0)",
-    "tan": "__out0 = tan(__in0)",
-    "atan": "__out0 = atan(__in0)",
-    "tanh": "__out0 = tanh(__in0)",
-    # Binary operations
-    "add": "__out0 = (__in0)+(__in1)",
-    "add_any": "__out0 = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
-    "sub": "__out0 = (__in0)-(__in1)",
-    "mul": "__out0 = (__in0)*(__in1)",
-    "div": "__out0 = (__in0)/(__in1)",
-    "rem": "__out0 = (__in0)%(__in1)",
-    "and": "__out0 = (__in0) and (__in1)",
-    "or": "__out0 = (__in0) or  (__in1)",
-    "pow": "__out0 = (__in0)**(__in1)",
-    "ipow": "__out0 = (__in0)**(int(__in1))",
-    "min": "__out0 = min(__in0, __in1)",
-    "max": "__out0 = max(__in0, __in1)",
-    "eq": "__out0 = __in0 == __in1",
-    "ne": "__out0 = __in0 != __in1",
-    "ge": "__out0 = __in0 >= __in1",
-    "gt": "__out0 = __in0 > __in1",
-    "le": "__out0 = __in0 <= __in1",
-    "lt": "__out0 = __in0 < __in1",
-}
-
-for prim_name, prim_tmpl in _ALU_OPS_TASKLET_TEMPLATES.items():
-    translator.register_primitive_translator(ALUTranslator(prim_name, prim_tmpl))
diff --git a/src/jace/util/dace_helper.py b/src/jace/util/dace_helper.py
index 90db509..458ec9f 100644
--- a/src/jace/util/dace_helper.py
+++ b/src/jace/util/dace_helper.py
@@ -40,9 +40,11 @@ def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> dace_helper.Compi
         for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # We can not use `in` because we are not interested in `my_mangled_variable__return_zulu`!
     ):
         raise ValueError("Only support SDFGs without '__return' members.")
+    if tsdfg.sdfg.free_symbols:  # This is a simplification that makes our life simple.
+        raise NotImplementedError(f"No free symbols allowed, found: {tsdfg.sdfg.free_symbols}")
 
     # To ensure that the SDFG is compiled and to get rid of a warning we must modify
-    #  some settings of the SDFG. To fake an immutable SDFG, we will restore them later.
+    #  some settings of the SDFG. But we also have to fake an immutable SDFG
     sdfg = tsdfg.sdfg
     org_sdfg_name = sdfg.name
     org_recompile = sdfg._recompile
@@ -102,17 +104,12 @@ def run_jax_sdfg(
         raise NotImplementedError("No kwargs are supported yet.")
     if len(inp_names) != len(call_args):
         raise RuntimeError("Wrong number of arguments.")
-    if sdfg.free_symbols:  # This is a simplification that makes our life simple.
-        raise NotImplementedError(
-            f"No externally defined symbols are allowed, found: {sdfg.free_symbols}"
-        )
 
     # Build the argument list that we will pass to the compiled object.
     sdfg_call_args: dict[str, Any] = {}
     for in_name, in_val in zip(inp_names, call_args, strict=True):
         # TODO(phimuell): Implement a stride matching process.
         if util.is_jax_array(in_val):
-            # TODO(phimuell): Add test for this.
             if not util.is_fully_addressable(in_val):
                 raise ValueError(f"Passed a not fully addressable Jax array as '{in_name}'")
             in_val = in_val.__array__()
@@ -137,7 +134,7 @@ def run_jax_sdfg(
         dace.Config.set("compiler", "allow_view_arguments", value=True)
         csdfg(**sdfg_call_args)
 
-    # Handling the output (pytrees are missing)
+    # TODO(phimuell): Handle pytrees
     if not out_names:
         return None
     ret_val: tuple[Any] = tuple(sdfg_call_args[out_name] for out_name in out_names)

From 40f8574f4d707449130fb102b998dbab252433e7 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 10 Jun 2024 13:43:12 +0200
Subject: [PATCH 340/458] Added a configuration file in the `docs/` folder such
 that the trailing comma is applied there.

---
 docs/conf.py        | 27 ++++++++++++++++++++++-----
 docs/pyproject.toml |  2 ++
 pyproject.toml      |  1 +
 3 files changed, 25 insertions(+), 5 deletions(-)
 create mode 100644 docs/pyproject.toml

diff --git a/docs/conf.py b/docs/conf.py
index e902d98..01d2ca7 100644
--- a/docs/conf.py
+++ b/docs/conf.py
@@ -25,15 +25,32 @@
     "sphinx_copybutton",
 ]
 
-source_suffix = [".rst", ".md"]
-exclude_patterns = ["_build", "**.ipynb_checkpoints", "Thumbs.db", ".DS_Store", ".env", ".venv"]
+source_suffix = [
+    ".rst",
+    ".md",
+]
+exclude_patterns = [
+    "_build",
+    "**.ipynb_checkpoints",
+    "Thumbs.db",
+    ".DS_Store",
+    ".env",
+    ".venv",
+]
 
 html_theme = "furo"
 
-myst_enable_extensions = ["colon_fence"]
+myst_enable_extensions = [
+    "colon_fence",
+]
 
-intersphinx_mapping = {"python": ("https://docs.python.org/3", None)}
+intersphinx_mapping = {
+    "python": ("https://docs.python.org/3", None),
+}
 
-nitpick_ignore = [("py:class", "_io.StringIO"), ("py:class", "_io.BytesIO")]
+nitpick_ignore = [
+    ("py:class", "_io.StringIO"),
+    ("py:class", "_io.BytesIO"),
+]
 
 always_document_param_types = True
diff --git a/docs/pyproject.toml b/docs/pyproject.toml
new file mode 100644
index 0000000..b6658df
--- /dev/null
+++ b/docs/pyproject.toml
@@ -0,0 +1,2 @@
+[tool.ruff.format]
+skip-magic-trailing-comma = false
diff --git a/pyproject.toml b/pyproject.toml
index 1746b5a..33023fd 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -95,6 +95,7 @@ xfail_strict = true
 
 # -- ruff --
 [tool.ruff]
+extend-exclude = ["noxfile.py"]
 line-length = 100
 respect-gitignore = true
 show-fixes = true

From 4f52badeffff177026e8fa68a538af5908d00b4a Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 29 May 2024 12:58:15 +0200
Subject: [PATCH 341/458] WIP: requirements manager

---
 .pre-commit-config.yaml                     |   6 +-
 noxfile.py                                  |  21 +-
 pyproject.toml                              |  38 ++--
 requirements/base.in                        |   3 +
 requirements/base.txt                       |  91 +++++++++
 requirements/cuda12.in                      |   4 +
 requirements/cuda12.txt                     |  74 +++++++
 requirements/dev-cuda12.in                  |   2 +
 requirements/dev-cuda12.txt                 |  12 ++
 requirements-dev.txt => requirements/dev.in |  11 +-
 requirements/dev.txt                        |  95 +++++++++
 requirements/sync_tool.py                   | 209 ++++++++++++++++++++
 12 files changed, 534 insertions(+), 32 deletions(-)
 create mode 100644 requirements/base.in
 create mode 100644 requirements/base.txt
 create mode 100644 requirements/cuda12.in
 create mode 100644 requirements/cuda12.txt
 create mode 100644 requirements/dev-cuda12.in
 create mode 100644 requirements/dev-cuda12.txt
 rename requirements-dev.txt => requirements/dev.in (60%)
 create mode 100644 requirements/dev.txt
 create mode 100644 requirements/sync_tool.py

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 13841be..59402ca 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -48,11 +48,10 @@ repos:
   - id: mixed-line-ending
   - id: name-tests-test
     args: ["--pytest-test-first"]
-  - id: requirements-txt-fixer
   - id: trailing-whitespace
 
 - repo: https://github.com/astral-sh/ruff-pre-commit
-  rev: v0.4.6
+  rev: v0.4.8
   hooks:
   - id: ruff
     args: ["--fix", "--show-fixes", "--preview"]
@@ -68,7 +67,8 @@ repos:
     - dace==0.15.1
     - jax[cpu]==0.4.28
     - numpy==1.26.4
-    - pytest==8.2.1
+    - pytest==8.2.2
+    - typing-extensions==4.12.2
 - repo: https://github.com/codespell-project/codespell
   rev: "v2.2.6"
   hooks:
diff --git a/noxfile.py b/noxfile.py
index 3772f2d..19c45f4 100644
--- a/noxfile.py
+++ b/noxfile.py
@@ -10,7 +10,7 @@
 DIR = Path(__file__).parent.resolve()
 
 nox.needs_version = ">=2024.3.2"
-nox.options.sessions = ["lint", "pylint", "tests"]
+nox.options.sessions = ["lint", "tests"]
 nox.options.default_venv_backend = "uv|virtualenv"
 
 
@@ -101,3 +101,22 @@ def build(session: nox.Session) -> None:
 
     session.install("build")
     session.run("python", "-m", "build")
+
+
+@nox.session
+def requirements(session: nox.Session) -> None:
+    """
+    Freeze dependencies from input specs and synchronize across tools.
+    """
+    requirements_path = DIR / "requirements"
+    req_sync_tool = requirements_path / "sync_tool.py"
+
+    dependencies = ["pre-commit"] + nox.project.load_toml(req_sync_tool)["dependencies"]
+    session.install(*dependencies)
+    session.install("pip-compile-multi")
+
+    session.run("python", req_sync_tool, "pull")
+    session.run("pip-compile-multi", "-g", "--skip-constraints")
+    session.run("python", req_sync_tool, "push")
+
+    session.run("pre-commit", "run", "--files", ".pre-commit-config.yaml", success_codes=[0, 1])
diff --git a/pyproject.toml b/pyproject.toml
index 3556e8a..175a679 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -3,9 +3,7 @@ build-backend = "setuptools.build_meta"
 requires = ["setuptools>=61"]
 
 [project]
-authors = [
-  {name = "ETH Zurich", email = "gridtools@cscs.ch"}
-]
+authors = [{name = "ETH Zurich", email = "gridtools@cscs.ch"}]
 classifiers = [
   "Development Status :: 1 - Planning",
   "Intended Audience :: Science/Research",
@@ -21,11 +19,7 @@ classifiers = [
   "Topic :: Scientific/Engineering",
   "Typing :: Typed"
 ]
-dependencies = [
-  "dace>=0.15",
-  "jax[cpu]>=0.4.24",
-  "numpy>=1.26.0"
-]
+dependencies = ["dace>=0.15", "jax[cpu]>=0.4.24", "numpy>=1.26.0"]
 description = "JAX jit using DaCe (Data Centric Parallel Programming)"
 name = "JaCe"
 readme = "README.md"
@@ -34,11 +28,7 @@ version = "0.1.0"
 license.file = "LICENSE"
 
 [project.optional-dependencies]
-cuda12 = [
-  "cupy-cuda12x>=12.1.0",
-  "jax[cuda12]>=0.4.24",
-  "optuna>=3.4.0"
-]
+cuda12 = ["cupy-cuda12x>=12.1.0", "jax[cuda12]>=0.4.24", "optuna>=3.4.0"]
 
 [project.urls]
 "Bug Tracker" = "https://github.com/GridTools/JaCe/issues"
@@ -47,10 +37,7 @@ Discussions = "https://github.com/GridTools/JaCe/discussions"
 Homepage = "https://github.com/GridTools/JaCe"
 
 [tool.coverage]
-report.exclude_also = [
-  '\.\.\.',
-  'if typing.TYPE_CHECKING:'
-]
+report.exclude_also = ['\.\.\.', 'if typing.TYPE_CHECKING:']
 run.source = ["jace"]
 
 # -- mypy  --
@@ -83,14 +70,10 @@ module = ["tests.*", "dace.*", "jax.*", "jaxlib.*"]
 
 [tool.pytest.ini_options]
 addopts = ["-ra", "--showlocals", "--strict-markers", "--strict-config"]
-filterwarnings = [
-  "error"
-]
+filterwarnings = ["error"]
 log_cli_level = "INFO"
 minversion = "6.0"
-testpaths = [
-  "tests"
-]
+testpaths = ["tests"]
 xfail_strict = true
 
 # -- ruff --
@@ -109,7 +92,9 @@ extend-select = [
   "B",  # flake8-bugbear
   "I",  # isort
   "G",  # flake8-logging-format
+  "W",  # pycodestyle-warning
   "C4",  # flake8-comprehensions
+  "C90",  # mccabe
   "PT",  # flake8-pytest-style
   "UP",  # pyupgrade       # TODO: in evaluation
   "ARG",  # flake8-unused-arguments
@@ -129,6 +114,7 @@ extend-select = [
 ignore = [
   'B905',  # [zip-without-explicit-strict]
   'E501',  # [line-too-long]
+  'TCH003',  # [typing-only-standard-library-import]
   'UP038'  # [non-pep604-isinstance]
 ]
 # ignore-init-module-imports = true  # deprecated in preview mode
@@ -160,7 +146,13 @@ section-order = [
 [tool.ruff.lint.isort.sections]
 tests = ["tests", "unit_tests", "integration_tests"]
 
+[tool.ruff.lint.mccabe]
+max-complexity = 12
+
 [tool.ruff.lint.per-file-ignores]
 "!tests/**.py" = ["PT"]  # Ignore `flake8-pytest-style` everywhere except in `tests/`
 "noxfile.py" = ["T20"]  # Ignore `flake8-print`
 "tests/**" = ["T10", "T20"]  # Ignore `flake8-debugger` and `flake8-print`
+
+[tool.ruff.lint.pycodestyle]
+max-doc-length = 85
diff --git a/requirements/base.in b/requirements/base.in
new file mode 100644
index 0000000..b25ef34
--- /dev/null
+++ b/requirements/base.in
@@ -0,0 +1,3 @@
+dace>=0.15
+jax[cpu]>=0.4.24
+numpy>=1.26.0
\ No newline at end of file
diff --git a/requirements/base.txt b/requirements/base.txt
new file mode 100644
index 0000000..d388c2f
--- /dev/null
+++ b/requirements/base.txt
@@ -0,0 +1,91 @@
+# SHA1:190b0703818fae41383e79f02d34ca019cedca4d
+#
+# This file is autogenerated by pip-compile-multi
+# To update, run:
+#
+#    pip-compile-multi
+#
+aenum==3.1.15
+    # via dace
+astunparse==1.6.3
+    # via dace
+blinker==1.8.2
+    # via flask
+certifi==2024.6.2
+    # via requests
+charset-normalizer==3.3.2
+    # via requests
+click==8.1.7
+    # via flask
+dace==0.15.1
+    # via -r requirements/base.in
+dill==0.3.8
+    # via dace
+flask==3.0.3
+    # via dace
+fparser==0.1.4
+    # via dace
+idna==3.7
+    # via requests
+itsdangerous==2.2.0
+    # via flask
+jax[cpu]==0.4.28
+    # via -r requirements/base.in
+jaxlib==0.4.28
+    # via jax
+jinja2==3.1.4
+    # via flask
+markupsafe==2.1.5
+    # via
+    #   jinja2
+    #   werkzeug
+ml-dtypes==0.4.0
+    # via
+    #   jax
+    #   jaxlib
+mpmath==1.3.0
+    # via sympy
+networkx==3.3
+    # via dace
+numpy==1.26.4
+    # via
+    #   -r requirements/base.in
+    #   dace
+    #   jax
+    #   jaxlib
+    #   ml-dtypes
+    #   opt-einsum
+    #   scipy
+opt-einsum==3.3.0
+    # via jax
+packaging==24.1
+    # via setuptools-scm
+ply==3.11
+    # via dace
+pyyaml==6.0.1
+    # via dace
+requests==2.32.3
+    # via dace
+scipy==1.13.1
+    # via
+    #   jax
+    #   jaxlib
+setuptools-scm==8.1.0
+    # via fparser
+six==1.16.0
+    # via astunparse
+sympy==1.9
+    # via dace
+tomli==2.0.1
+    # via setuptools-scm
+urllib3==2.2.1
+    # via requests
+websockets==12.0
+    # via dace
+werkzeug==3.0.3
+    # via flask
+wheel==0.43.0
+    # via astunparse
+
+# The following packages are considered to be unsafe in a requirements file:
+# setuptools
diff --git a/requirements/cuda12.in b/requirements/cuda12.in
new file mode 100644
index 0000000..5c9b956
--- /dev/null
+++ b/requirements/cuda12.in
@@ -0,0 +1,4 @@
+-r base.in
+cupy-cuda12x>=12.1.0
+jax[cuda12]>=0.4.24
+optuna>=3.4.0
\ No newline at end of file
diff --git a/requirements/cuda12.txt b/requirements/cuda12.txt
new file mode 100644
index 0000000..098643e
--- /dev/null
+++ b/requirements/cuda12.txt
@@ -0,0 +1,74 @@
+# SHA1:035352ab483a9ee349c593a1ff7f359a88012cc9
+#
+# This file is autogenerated by pip-compile-multi
+# To update, run:
+#
+#    pip-compile-multi
+#
+-r base.txt
+alembic==1.13.1
+    # via optuna
+colorlog==6.8.2
+    # via optuna
+cupy-cuda12x==13.1.0
+    # via -r requirements/cuda12.in
+fastrlock==0.8.2
+    # via cupy-cuda12x
+greenlet==3.0.3
+    # via sqlalchemy
+jax[cpu,cuda12]==0.4.28
+    # via
+    #   -r requirements/base.in
+    #   -r requirements/cuda12.in
+jax-cuda12-pjrt==0.4.28
+    # via jax-cuda12-plugin
+jax-cuda12-plugin==0.4.28
+    # via jax
+mako==1.3.5
+    # via alembic
+nvidia-cublas-cu12==12.5.2.13
+    # via
+    #   jax
+    #   nvidia-cudnn-cu12
+    #   nvidia-cusolver-cu12
+nvidia-cuda-cupti-cu12==12.5.39
+    # via jax
+nvidia-cuda-nvcc-cu12==12.5.40
+    # via jax
+nvidia-cuda-nvrtc-cu12==12.5.40
+    # via nvidia-cudnn-cu12
+nvidia-cuda-runtime-cu12==12.5.39
+    # via jax
+nvidia-cudnn-cu12==8.9.7.29
+    # via jax
+nvidia-cufft-cu12==11.2.3.18
+    # via jax
+nvidia-cusolver-cu12==11.6.2.40
+    # via jax
+nvidia-cusparse-cu12==12.4.1.24
+    # via
+    #   jax
+    #   nvidia-cusolver-cu12
+nvidia-nccl-cu12==2.21.5
+    # via jax
+nvidia-nvjitlink-cu12==12.5.40
+    # via
+    #   jax
+    #   nvidia-cufft-cu12
+    #   nvidia-cusolver-cu12
+    #   nvidia-cusparse-cu12
+optuna==3.6.1
+    # via -r requirements/cuda12.in
+sqlalchemy==2.0.30
+    # via
+    #   alembic
+    #   optuna
+tqdm==4.66.4
+    # via optuna
+typing-extensions==4.12.2
+    # via
+    #   alembic
+    #   sqlalchemy
+
+# The following packages are considered to be unsafe in a requirements file:
+# setuptools
diff --git a/requirements/dev-cuda12.in b/requirements/dev-cuda12.in
new file mode 100644
index 0000000..aa00469
--- /dev/null
+++ b/requirements/dev-cuda12.in
@@ -0,0 +1,2 @@
+-r base.in
+-r dev.in
diff --git a/requirements/dev-cuda12.txt b/requirements/dev-cuda12.txt
new file mode 100644
index 0000000..7c894e8
--- /dev/null
+++ b/requirements/dev-cuda12.txt
@@ -0,0 +1,12 @@
+# SHA1:d9f19ac423500f255d32c3e29dd96fd3b5c649a8
+#
+# This file is autogenerated by pip-compile-multi
+# To update, run:
+#
+#    pip-compile-multi
+#
+-r base.txt
+-r dev.txt
+
+# The following packages are considered to be unsafe in a requirements file:
+# setuptools
diff --git a/requirements-dev.txt b/requirements/dev.in
similarity index 60%
rename from requirements-dev.txt
rename to requirements/dev.in
index a7a822e..b648f8a 100644
--- a/requirements-dev.txt
+++ b/requirements/dev.in
@@ -1,11 +1,12 @@
+-r base.in
 furo>=2023.08.17
-mypy >= 1.9.0
+mypy>=1.9.0
 myst_parser>=0.13
-pytest >=6
-pytest-cov >=3
-ruff >= 0.3.5
+pytest>=6
+pytest-cov>=3
+ruff>=0.3.5
 sphinx>=7.0
 sphinx_autodoc_typehints
 sphinx_copybutton
-types-all
+tomlkit>=0.12.4
 typing-extensions>=4.10.0
diff --git a/requirements/dev.txt b/requirements/dev.txt
new file mode 100644
index 0000000..176b9a2
--- /dev/null
+++ b/requirements/dev.txt
@@ -0,0 +1,95 @@
+# SHA1:a7338646990b5874d5aa51bb3e2bd37753c754eb
+#
+# This file is autogenerated by pip-compile-multi
+# To update, run:
+#
+#    pip-compile-multi
+#
+-r base.txt
+alabaster==0.7.16
+    # via sphinx
+babel==2.15.0
+    # via sphinx
+beautifulsoup4==4.12.3
+    # via furo
+coverage[toml]==7.5.3
+    # via pytest-cov
+docutils==0.21.2
+    # via
+    #   myst-parser
+    #   sphinx
+exceptiongroup==1.2.1
+    # via pytest
+furo==2024.5.6
+    # via -r requirements/dev.in
+imagesize==1.4.1
+    # via sphinx
+iniconfig==2.0.0
+    # via pytest
+markdown-it-py==3.0.0
+    # via
+    #   mdit-py-plugins
+    #   myst-parser
+mdit-py-plugins==0.4.1
+    # via myst-parser
+mdurl==0.1.2
+    # via markdown-it-py
+mypy==1.10.0
+    # via -r requirements/dev.in
+mypy-extensions==1.0.0
+    # via mypy
+myst-parser==3.0.1
+    # via -r requirements/dev.in
+pluggy==1.5.0
+    # via pytest
+pygments==2.18.0
+    # via
+    #   furo
+    #   sphinx
+pytest==8.2.2
+    # via
+    #   -r requirements/dev.in
+    #   pytest-cov
+pytest-cov==5.0.0
+    # via -r requirements/dev.in
+ruff==0.4.8
+    # via -r requirements/dev.in
+snowballstemmer==2.2.0
+    # via sphinx
+soupsieve==2.5
+    # via beautifulsoup4
+sphinx==7.3.7
+    # via
+    #   -r requirements/dev.in
+    #   furo
+    #   myst-parser
+    #   sphinx-autodoc-typehints
+    #   sphinx-basic-ng
+    #   sphinx-copybutton
+sphinx-autodoc-typehints==2.1.1
+    # via -r requirements/dev.in
+sphinx-basic-ng==1.0.0b2
+    # via furo
+sphinx-copybutton==0.5.2
+    # via -r requirements/dev.in
+sphinxcontrib-applehelp==1.0.8
+    # via sphinx
+sphinxcontrib-devhelp==1.0.6
+    # via sphinx
+sphinxcontrib-htmlhelp==2.0.5
+    # via sphinx
+sphinxcontrib-jsmath==1.0.1
+    # via sphinx
+sphinxcontrib-qthelp==1.0.7
+    # via sphinx
+sphinxcontrib-serializinghtml==1.1.10
+    # via sphinx
+tomlkit==0.12.5
+    # via -r requirements/dev.in
+typing-extensions==4.12.2
+    # via
+    #   -r requirements/dev.in
+    #   mypy
+
+# The following packages are considered to be unsafe in a requirements file:
+# setuptools
diff --git a/requirements/sync_tool.py b/requirements/sync_tool.py
new file mode 100644
index 0000000..1eabda6
--- /dev/null
+++ b/requirements/sync_tool.py
@@ -0,0 +1,209 @@
+#! /usr/bin/env python3
+
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+# /// script
+# requires-python = ">=3.10"
+# dependencies = [
+#   "packaging>=24.0",
+#   "tomlkit>=0.12.4",
+#   "typer-slim>=0.12.3",
+#   "yamlpath>=3.8.2"
+# ]
+# ///
+
+from __future__ import annotations
+
+import pathlib
+import re
+import types
+from collections.abc import Iterable, Mapping
+from typing import NamedTuple, TypeAlias
+
+import tomlkit
+import typer
+import yamlpath
+from packaging import (
+    markers as pkg_markers,
+    requirements as pkg_requirements,
+    specifiers as pkg_specifiers,
+)
+
+
+# -- Classes --
+class RequirementSpec(NamedTuple):
+    package: pkg_requirements.Requirement
+    specifiers: pkg_specifiers.SpecifierSet | None = None
+    marker: pkg_markers.Marker | None = None
+
+    @classmethod
+    def from_text(cls, req_text: str) -> RequirementSpec:
+        req_text = req_text.strip()
+        assert req_text, "Requirement string cannot be empty"
+
+        m = re.match(r"^([^><=~]*)\s*([^;]*)\s*;?\s*(.*)$", req_text)
+        return RequirementSpec(
+            pkg_requirements.Requirement(m[1]),
+            pkg_specifiers.Specifier(m[2]) if m[2] else None,
+            pkg_markers.Marker(m[3]) if m[3] else None,
+        )
+
+    def as_text(self) -> str:
+        return f"{self.package!s}{(self.specifiers or '')!s}{(self.marker or '')!s}".strip()
+
+
+class Requirement(NamedTuple):
+    text: str
+    spec: RequirementSpec
+
+    @classmethod
+    def from_text(cls, req_text: str) -> Requirement:
+        return Requirement(req_text, RequirementSpec.from_text(req_text))
+
+    @classmethod
+    def from_spec(cls, req: RequirementSpec) -> Requirement:
+        return Requirement(req.as_text(), req)
+
+    def dump(self, *, template: str | None = None) -> str:
+        template = template or "{req.text}"
+        return template.format(req=self)
+
+
+class RequirementDumpSpec(NamedTuple):
+    value: Requirement | Iterable[Requirement]
+    template: str | None = None
+
+
+DumpSpec: TypeAlias = (
+    RequirementDumpSpec | tuple[Requirement | Iterable[Requirement], str | None] | str
+)
+
+
+# -- Functions --
+def make_requirements_map(
+    requirements: Iterable[Requirement],
+) -> dict[str, Requirement]:
+    return {req.spec.package.name: req for req in requirements}
+
+
+def load_from_requirements(filename: str) -> list[Requirement]:
+    requirements = []
+    with pathlib.Path(filename).open() as f:
+        for line in f:
+            if (end := line.find("#")) != -1:
+                line = line[:end]
+            line = line.strip()
+            if line and not line.startswith("-"):
+                requirements.append(Requirement.from_text(line))
+
+    return requirements
+
+
+def load_from_toml(filename: str, key: str) -> list[Requirement]:
+    with pathlib.Path(filename).open() as f:
+        toml_data = tomlkit.loads(f.read())
+
+    section = toml_data
+    for part in key.split("."):
+        section = section[part]
+
+    return [Requirement.from_text(req) for req in section]
+
+
+def dump(requirements: Iterable[Requirement], *, template: str | None = None) -> None:
+    return [req.dump(template=template) for req in requirements]
+
+
+def dump_to_requirements(
+    requirements: Iterable[Requirement],
+    filename: str,
+    *,
+    template: str | None = None,
+    header: str | None = None,
+    footer: str | None = None,
+) -> None:
+    with pathlib.Path(filename).open("w") as f:
+        if header:
+            f.write(f"{header}\n")
+        f.write("\n".join(dump(requirements, template=template)))
+        if footer:
+            f.write(f"{footer}\n")
+
+
+def dump_to_yaml(requirements_map: Mapping[str, DumpSpec], filename: str) -> None:
+    file_path = pathlib.Path(filename)
+    logging_args = types.SimpleNamespace(quiet=False, verbose=False, debug=False)
+    console_log = yamlpath.wrappers.ConsolePrinter(logging_args)
+    yaml = yamlpath.common.Parsers.get_yaml_editor()
+    (yaml_data, doc_loaded) = yamlpath.common.Parsers.get_yaml_data(yaml, console_log, file_path)
+    assert doc_loaded
+    processor = yamlpath.Processor(console_log, yaml_data)
+
+    for key_path, (value, template) in requirements_map.items():
+        match value:
+            case str():
+                processor.set_value(yamlpath.YAMLPath(key_path), value)
+            case Requirement():
+                processor.set_value(yamlpath.YAMLPath(key_path), value.dump(template=template))
+            case Iterable():
+                for _ in processor.delete_nodes(yamlpath.YAMLPath(key_path)):
+                    pass
+                for i, req in enumerate(dump(value, template=template)):
+                    item_path = yamlpath.YAMLPath(f"{key_path}[{i}]")
+                    processor.set_value(item_path, req)
+
+    with file_path.open("w") as f:
+        yaml.dump(yaml_data, f)
+
+
+# -- CLI --
+app = typer.Typer()
+
+
+@app.command()
+def pull():
+    base = load_from_toml("pyproject.toml", "project.dependencies")
+    dump_to_requirements(base, "requirements/base.in")
+    cuda12 = load_from_toml("pyproject.toml", "project.optional-dependencies.cuda12")
+    dump_to_requirements(cuda12, "requirements/cuda12.in", header="-r base.in")
+
+
+@app.command()
+def push():
+    base_names = {r.spec.package for r in load_from_toml("pyproject.toml", "project.dependencies")}
+    base_versions = [
+        r for r in load_from_requirements("requirements/base.txt") if r.spec.package in base_names
+    ]
+    dev_versions_map = make_requirements_map(load_from_requirements("requirements/dev.txt"))
+    mypy_req_versions = sorted(
+        base_versions + [dev_versions_map[r] for r in ("pytest", "typing-extensions")],
+        key=lambda r: str(r.spec.package),
+    )
+    dump_to_yaml(
+        {
+            # ruff
+            "repos[.repo%https://github.com/astral-sh/ruff-pre-commit].rev": (
+                dev_versions_map["ruff"],
+                "v{req.spec.specifiers.version}",
+            ),
+            # mypy
+            "repos[.repo%https://github.com/pre-commit/mirrors-mypy].rev": (
+                dev_versions_map["mypy"],
+                "v{req.spec.specifiers.version}",
+            ),
+            "repos[.repo%https://github.com/pre-commit/mirrors-mypy].hooks[.id%mypy].additional_dependencies": (
+                mypy_req_versions,
+                None,
+            ),
+        },
+        ".pre-commit-config.yaml",
+    )
+
+
+if __name__ == "__main__":
+    app()

From 9af8a4ebbc3fc7845a5ef4a4a89fc8132c3187c0 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 10 Jun 2024 16:15:10 +0200
Subject: [PATCH 342/458] Small changes to the documentation of the
 translators.

---
 .../arithmetic_logical_translators.py         |  3 +-
 .../broadcast_in_dim_translator.py            |  2 +-
 .../convert_element_type_translator.py        | 16 ++-----
 .../primitive_translators/copy_translator.py  | 12 ++---
 .../primitive_translators/iota_translator.py  |  2 +-
 .../reshape_translator.py                     |  9 ++--
 .../select_n_translator.py                    | 12 ++---
 .../primitive_translators/slicing.py          | 47 +++++++++----------
 .../squeeze_translator.py                     | 11 +++--
 tests/util.py                                 |  2 +-
 10 files changed, 53 insertions(+), 63 deletions(-)

diff --git a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
index dfafa7b..2dda2f4 100644
--- a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
+++ b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
@@ -184,11 +184,10 @@ def write_tasklet_code(
 }
 
 
-
 # Create the arithmetic translators
 for pname, ptmpl in _ARITMETIC_OPERATION_TEMPLATES.items():
     translator.register_primitive_translator(ArithmeticOperationTranslator(pname, ptmpl))
 
-# create the logical translators.
+# Create the logical translators.
 for pname, (itmpl, btmpl) in _LOGICAL_OPERATION_TEMPLATES.items():
     translator.register_primitive_translator(LogicalOperationTranslator(pname, itmpl, btmpl))
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
index bd5e587..12852e5 100644
--- a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -25,7 +25,7 @@
 
 
 class BroadcastInDimTranslator(mapped_base.MappedOperationTranslatorBase):
-    """This handles the `broadcast_in_dim` primitives."""
+    """Implements the `broadcast_in_dim` primitive."""
 
     def __init__(self) -> None:
         super().__init__(primitive_name="broadcast_in_dim")
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index 6dd7576..75877b3 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -30,13 +30,8 @@ class ConvertElementTypeTranslator(mapped_base.MappedOperationTranslatorBase):
     Copies the input to the output and performs type conversion.
 
     Notes:
-        This translator ignores the `new_dtype` and `weak_type` parameter the
-        equation and only performs the casting.
-
-    Todo:
-        Occasionally Jax generates a cast that is not needed, because the types
-        are the same. Currently this is handled, by generating an explicit copy,
-        however, it should be handled by a Memlet.
+        This translator ignores the `new_dtype` and `weak_type` parameters of
+        the equation and only performs the casting based on the type of the fields.
     """
 
     def __init__(self) -> None:
@@ -63,15 +58,14 @@ def write_tasklet_code(
         conv_code = "__in0"
 
         if in_dtype == out_dtype:
-            # For some reason Jax sometimes adds conversions where no are needed. I think
-            #  that the reason for this is the special type system that Jax made. In these cases
-            #  we do not add a cast, because such a Tasklet is not trivial and DaCe can not remove it.
+            # For some reason Jax sometimes adds conversions where no are needed. In these cases
+            #  we explicitly create a copy Tasklet, which is trivial and can be removed by DaCe.
+            # TODO(phimuell): Create a Memlet instead.
             return f"__out = {conv_code}"
 
         if in_dtype_s.startswith("bool"):
             # Interestingly `__out = int(__in0)` will not work, see commit `f5aabc` of the prototype.
             conv_code = f"(1 if {conv_code} else 0)"
-
         if out_dtype_s.startswith("bool"):
             conv_code = f"dace.bool_({conv_code})"
         elif hasattr(dace.dtypes, out_dtype_s):
diff --git a/src/jace/translator/primitive_translators/copy_translator.py b/src/jace/translator/primitive_translators/copy_translator.py
index c1afb34..d31e4cf 100644
--- a/src/jace/translator/primitive_translators/copy_translator.py
+++ b/src/jace/translator/primitive_translators/copy_translator.py
@@ -44,16 +44,14 @@ def write_tasklet_code(
 
 
 class DevicePutTranslator(mapped_base.MappedOperationTranslatorBase):
-    """The `device_put` primitive is used to transfer data between host and device.
+    """Implements the `device_put` primitive.
 
-    The current implementation only supports the copying where the data already
-    is. Currently DaCe only knows about the Host and the GPU. Furthermore,
-    currently JaCe works in such a way that everything is either put on the host
-    or the device. Because of this, the `DevicePutTranslator` is, currently,
-    just a simple copy operation that should be removed, by the optimization.
+    In Jax this primitive is used to copy data between the host and the device.
+    Because of the way how JaCe and the optimization pipeline works, either
+    everything is on the host or the device.
 
     Todo:
-        Make into a Memlet because only the Memlet can handle copying between devices.
+        Think about how to implement this correctly.
     """
 
     def __init__(self) -> None:
diff --git a/src/jace/translator/primitive_translators/iota_translator.py b/src/jace/translator/primitive_translators/iota_translator.py
index b664f53..d945845 100644
--- a/src/jace/translator/primitive_translators/iota_translator.py
+++ b/src/jace/translator/primitive_translators/iota_translator.py
@@ -25,7 +25,7 @@
 
 
 class IotaTranslator(mapped_base.MappedOperationTranslatorBase):
-    """This handles the `iota` primitives.
+    """Implements the `iota` primitive.
 
     Essentially a very general `jnp.arange()` function.
     """
diff --git a/src/jace/translator/primitive_translators/reshape_translator.py b/src/jace/translator/primitive_translators/reshape_translator.py
index 3de9f54..b6ab892 100644
--- a/src/jace/translator/primitive_translators/reshape_translator.py
+++ b/src/jace/translator/primitive_translators/reshape_translator.py
@@ -22,11 +22,12 @@
 
 
 class ReshapeTranslator(translator.PrimitiveTranslator):
-    """Reshapes an array.
+    """Implements the `reshape` primitive.
 
-    Todo:
-        - Handle `dimensions` parameter fully.
-        - Find a way to make it as a Map.
+    The current implementation uses a Memlet for this and essentially acts as
+    an optimization barrier. Furthermore the Jax primitive also has the optional
+    `dimensions` parameters which allows to permute the input, this is not
+    supported.
     """
 
     @property
diff --git a/src/jace/translator/primitive_translators/select_n_translator.py b/src/jace/translator/primitive_translators/select_n_translator.py
index 240375a..f6ce6f0 100644
--- a/src/jace/translator/primitive_translators/select_n_translator.py
+++ b/src/jace/translator/primitive_translators/select_n_translator.py
@@ -25,18 +25,19 @@
 
 
 class SelectNTranslator(mapped_base.MappedOperationTranslatorBase):
-    """Implements the `select_n` primitive, which is a generalization of `np.where`
-
-    While `numpy.where` only supports two cases, the Jax primitive supports an
-    arbitrary number of cases. In that sense it is essentially a `C` `switch`
-    statement, only that all cases have to materialize.
+    """Implements the `select_n` primitive.
 
+    The `select_n` primitive is a generalization of `np.where`, that can take an
+    arbitrary number of branches, which are selected by an integer predicate.
     The behaviour is undefined if the predicate is out of bound.
 
     Note:
         For a better understanding this function renames its input connectors.
         The first one, which is the predicate, is renamed to `__cond` and the
         others are renamed again to `__in{i}`, starting with zero.
+
+    Todo:
+        Implement the primitive as a nested SDFG.
     """
 
     def __init__(self) -> None:
@@ -49,7 +50,6 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        """Writes the selection code."""
         if len(in_var_names) == 3:
             # This order is correct, since `False` is interpreted as `0`, which means the first
             #  case. DaCe seems to have some problems with bools and integer casting around,
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index 7a28dc0..13659d1 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -25,10 +25,11 @@
 
 
 class SlicingTranslator(mapped_base.MappedOperationTranslatorBase):
-    """Implements the classical slicing operation.
+    """Implements the `slice` primitive.
 
-    It is basically a copy Tasklet that only copies parts of the input.
-    Note that there is also `dynamic_slice`.
+    This is the classical slicing operation which extracts a fixed sized window
+    from a fixed initial position. The `dynamic_slice` operation supports a
+    variable starting point.
     """
 
     def __init__(self) -> None:
@@ -68,17 +69,16 @@ def make_input_memlets(
 
 
 class DynamicSlicingTranslator(translator.PrimitiveTranslator):
-    """Implements the dynamic slicing translator.
+    """Implements the `dynamic_slice` primitive.
 
-    The [dynamic slicing](https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.dynamic_slice.html)
-    performs a slicing of a _fixed_ window, however, the starting indexes are
-    not fix, but are variables that can come from the outside. Thus, the
-    translator uses "Dynamic Map Ranges". Furthermore, Jax guarantees that if
-    the window overruns the start indexes are adjusted.
+    [Dynamic slicing](https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.dynamic_slice.html)
+    performs a slicing of a _fixed_ window, but the start of the window is
+    not fix, instead it is passed by variables. Furthermore, (as it is in Jax),
+    if the window would overrun the start indexes are adjusted.
 
-    Note:
-        Unlike the normal slicing primitive, it is not derived from
-        `MappedOperationTranslatorBase`.
+    Todo:
+        - Prevent that the modified start indexes are promoted to symbols,
+            to ensure mergability.
     """
 
     @property
@@ -105,21 +105,18 @@ def __call__(
         in_var_name: str = in_var_names[0]
         start_indices: list[str | None] = list(in_var_names[1:])
 
-        # For storing the adapted start index, we have to create access nodes, to store them.
-        #  To ensure a total order of execution we have to use the same access nodes that are
-        #  used to store the adjusted start index and to feed them into the map.
+        # Access nodes for the modified start indexes.
         in_access: dict[str, dace.nodes.AccessNode] = {}
 
-        # Jax will adjust the start indexes if the window will overrun.
-        #  The adjustment is based on the formula $min(s + w, N) - w$, where $s$ is the start
-        #  index, $w$ the window size and $N$ the length of a particular dimension.
-        #  To do it we will use Tasklets, because otherwise we can not merge the state.
+        # We will always adapt the start indexes and not check if it is needed.
         for dim, (start_index, dim_size, wsize) in enumerate(
             zip(start_indices, util.get_jax_var_shape(eqn.invars[0]), window_sizes)
         ):
             if start_index is None:
                 continue
 
+            # We use a Tasklet to perform the adjustment not a symbol, because this would
+            #  need an interstage edge serving as kind of an optimization barrier.
             tasklet = dace.nodes.Tasklet(
                 label=f"adjustment_of_slice_start_{start_index}_for_{out_var_names[0]}",
                 inputs={"unadjusted_start_idx": None},
@@ -127,13 +124,11 @@ def __call__(
                 code=f"adjusted_start_idx = min(unadjusted_start_idx + {wsize}, {dim_size}) - {wsize}",
             )
 
-            # Intermediate value to storing the adjusted start index.
             new_start_idx_var_name = builder.add_array(
                 eqn.invars[dim + 1], name_prefix="__jace_adapted_start_idx_"
             )
             new_start_idx_acc = eqn_state.add_access(new_start_idx_var_name)
 
-            # Create the connections to and from the Tasklet.
             eqn_state.add_edge(
                 eqn_state.add_read(start_index),
                 None,
@@ -148,6 +143,7 @@ def __call__(
                 None,
                 dace.Memlet.simple(new_start_idx_var_name, "0"),
             )
+            # Update the name of the start index
             start_indices[dim] = new_start_idx_var_name
             in_access[new_start_idx_var_name] = new_start_idx_acc
 
@@ -155,10 +151,9 @@ def __call__(
             (f"__i{dim}", f"0:{N}") for dim, N in enumerate(util.get_jax_var_shape(eqn.outvars[0]))
         ]
 
-        # We use dynamic map ranges, thus the map entry has input connectors, that does not start
-        #  with `IN_*`, instead the connector name defines a symbol within the map scope. This
-        #  `dict` maps the symbol name to the name of the input variable, that has the value of the
-        #  symbol. Literal substitution is done later.
+        # For copying the data, we use dynamic map ranges, which is basically an input connector
+        #  on the map entry whose name is not `IN_*`, this name can then be used as a symbol
+        #  inside the map scope; this symbol is then used as offset.
         dynamic_map_ranges: dict[str, str] = {}
         memlet_accesses: list[str] = []
 
@@ -178,7 +173,6 @@ def __call__(
         tskl_output = dace.Memlet.simple(
             out_var_names[0], ", ".join(name for name, _ in tskl_ranges)
         )
-
         _, map_entry, _ = eqn_state.add_mapped_tasklet(
             name=f"{self.primitive}_{out_var_names[0]}",
             map_ranges=tskl_ranges,
@@ -189,6 +183,7 @@ def __call__(
         )
 
         # Creating the inputs for the dynamic map ranges.
+        #  We have to use the same access nodes as above, to ensure a single order of computation.
         for symb_name, start_index in dynamic_map_ranges.items():
             eqn_state.add_edge(
                 in_access[start_index],
diff --git a/src/jace/translator/primitive_translators/squeeze_translator.py b/src/jace/translator/primitive_translators/squeeze_translator.py
index a5a44a6..f74f84c 100644
--- a/src/jace/translator/primitive_translators/squeeze_translator.py
+++ b/src/jace/translator/primitive_translators/squeeze_translator.py
@@ -24,9 +24,11 @@
 
 
 class SqueezeTranslator(mapped_base.MappedOperationTranslatorBase):
-    """Allows to remove dimensions with size one.
+    """Implements the `squeeze` primitive.
 
-    Essentially equivalent to `np.squeeze` and the inverse to `np.expand_dims()`.
+    The primitives allows to remove a dimension of size one. Essentially
+    equivalent to `np.squeeze` and the inverse to `np.expand_dims()`,
+    which is handled by the `broadcast_in_dim` primitive.
     """
 
     def __init__(self) -> None:
@@ -48,14 +50,15 @@ def make_input_memlets(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> dict[str, dace.Memlet]:
-        to_rem: Sequence[str] = eqn.params["dimensions"]
+        dims_to_delete: Sequence[str] = eqn.params["dimensions"]
         in_rank: int = len(util.get_jax_var_shape(eqn.invars[0]))
         cnt = itertools.count(0)
         return {
             "__in0": dace.Memlet.simple(
                 in_var_names[0],
                 ", ".join(
-                    "0" if dim in to_rem else tskl_ranges[next(cnt)][0] for dim in range(in_rank)
+                    "0" if dim in dims_to_delete else tskl_ranges[next(cnt)][0]
+                    for dim in range(in_rank)
                 ),
             )
         }
diff --git a/tests/util.py b/tests/util.py
index 6080a6f..bad76a0 100644
--- a/tests/util.py
+++ b/tests/util.py
@@ -44,7 +44,7 @@ def mkarray(shape: Sequence[int] | int, dtype: type = np.float64, order: str = "
         res = np.random.random(shape) > 0.5  # noqa: NPY002
     elif np.issubdtype(dtype, np.integer):
         iinfo: np.iinfo = np.iinfo(dtype)
-        res = np.random.randint(  # type: ignore[assignment]  # noqa: NPY002
+        res = np.random.randint(  # noqa: NPY002
             low=iinfo.min, high=iinfo.max, size=shape, dtype=dtype
         )
     elif np.issubdtype(dtype, np.complexfloating):

From 647c5f733a48137a980ae8f494c53ad1f55db10a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 11 Jun 2024 11:17:36 +0200
Subject: [PATCH 343/458] Implemented pytrees.

This enables pytrees everywhere, it is not that nice and needs some cleaning.
---
 src/jace/api.py                              |  6 ++
 src/jace/stages.py                           | 91 ++++++++++++--------
 src/jace/translator/pre_post_translation.py  | 77 ++++++++++++++---
 src/jace/translator/translated_jaxpr_sdfg.py |  7 ++
 src/jace/util/dace_helper.py                 | 42 ++++-----
 src/jace/util/translation_cache.py           | 19 ++--
 tests/unit_tests/test_jax_api.py             |  8 +-
 7 files changed, 165 insertions(+), 85 deletions(-)

diff --git a/src/jace/api.py b/src/jace/api.py
index 46e15b2..81dad1f 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -10,6 +10,7 @@
 from __future__ import annotations
 
 import functools
+import inspect
 from typing import TYPE_CHECKING, Any, Literal, overload
 
 from jax import grad, jacfwd, jacrev
@@ -69,6 +70,11 @@ def jit(
         )
 
     def wrapper(f: Callable) -> stages.JaCeWrapped:
+        if any(
+            param.default is not param.empty for param in inspect.signature(f).parameters.values()
+        ):
+            raise NotImplementedError("Default values are not yet supported.")
+
         # TODO: Improve typing, such that signature is attached to the `JaCeWrapped`.
         jace_wrapper = stages.JaCeWrapped(
             fun=f,
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 6ef47d9..e9488da 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -28,9 +28,10 @@
 from __future__ import annotations
 
 import copy
+import inspect
 from typing import TYPE_CHECKING, Any
 
-import jax as _jax
+from jax import tree_util as jax_tree
 
 from jace import optimization, translator, util
 from jace.optimization import CompilerOptions
@@ -79,7 +80,6 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
         jit_options: Options to influence the jit process.
 
     Todo:
-        - Support pytrees.
         - Support keyword arguments and default values of the wrapped function.
         - Support static arguments.
 
@@ -98,6 +98,9 @@ def __init__(
         primitive_translators: Mapping[str, translator.PrimitiveTranslator],
         jit_options: Mapping[str, Any],
     ) -> None:
+        assert all(
+            param.default is param.empty for param in inspect.signature(fun).parameters.values()
+        )
         super().__init__()
         # We have to shallow copy both the translator and the jit options.
         #  This prevents that any modifications affect `self`.
@@ -138,27 +141,21 @@ def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
         if len(kwargs) != 0:
             raise NotImplementedError("Currently only positional arguments are supported.")
 
-        # In Jax `float32` is the main datatype, and they go to great lengths to avoid some
-        #  aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
-        #  However, in this case we will have problems when we call the SDFG, for some reasons
-        #  `CompiledSDFG` does not work in that case correctly, thus we enable it for the tracing.
-        with _jax.experimental.enable_x64():
-            builder = translator.JaxprTranslationBuilder(
-                primitive_translators=self._primitive_translators
-            )
-            jaxpr = _jax.make_jaxpr(self._fun)(*args)
-            trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
-
-        # Perform the post processing and turn it into a `TranslatedJaxprSDFG` that can be
-        #  compiled and called later.
-        # NOTE: `tsdfg` was deepcopied as a side effect of post processing.
+        jaxpr, flat_in_vals, outtree = ptrans.trace_and_flatten_function(
+            fun=self._fun,
+            trace_call_args=args,
+            trace_call_kwargs=kwargs,
+            trace_options=self._jit_options,
+        )
+        builder = translator.JaxprTranslationBuilder(
+            primitive_translators=self._primitive_translators
+        )
+        trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
         tsdfg: translator.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
-            trans_ctx=trans_ctx,
-            fun=self.wrapped_fun,
-            call_args=args,  # Already linearised, since we only accept positional args.
-            intree=None,  # Not yet implemented.
+            trans_ctx=trans_ctx, fun=self.wrapped_fun, call_args=flat_in_vals, outtree=outtree
         )
 
+        # NOTE: `tsdfg` is deepcopied as a side effect of post processing.
         return JaCeLowered(tsdfg)
 
     @property
@@ -166,13 +163,17 @@ def wrapped_fun(self) -> Callable:
         """Returns the wrapped function."""
         return self._fun
 
-    def _make_call_description(self, *args: Any) -> tcache.StageTransformationSpec:
+    def _make_call_description(
+        self, args_tree: jax_tree.PyTreeDef, flat_args: Sequence[Any]
+    ) -> tcache.StageTransformationSpec:
         """This function computes the key for the `JaCeWrapped.lower()` call inside the cache.
 
         The function will compute a full abstract description on its argument.
         """
-        call_args = tuple(tcache._AbstractCallArgument.from_value(x) for x in args)
-        return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
+        call_args = tuple(tcache._AbstractCallArgument.from_value(x) for x in flat_args)
+        return tcache.StageTransformationSpec(
+            stage_id=id(self), call_args=tuple(call_args), args_tree=args_tree
+        )
 
 
 class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
@@ -230,6 +231,7 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
             csdfg=dace_helper.compile_jax_sdfg(tsdfg),
             inp_names=tsdfg.inp_names,
             out_names=tsdfg.out_names,
+            outtree=tsdfg.outtree,
         )
 
     def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
@@ -257,22 +259,30 @@ def as_sdfg(self) -> dace.SDFG:
         return self.compiler_ir().sdfg
 
     def _make_call_description(
-        self, compiler_options: CompilerOptions | None = None
+        self, args_tree: jax_tree.PyTreeDef, flat_args: Sequence[Any]
     ) -> tcache.StageTransformationSpec:
         """This function computes the key for the `self.compile()` call inside the cache.
 
-        The key that is computed by this function is based on the concrete
-        values of the passed compiler options.
+        Contrary to the `JaCeWrapped.lower()` function the call description
+        depends on the concrete values of the arguments and takes the global
+        compile options into consideration.
         """
-        options = self._make_compiler_options(compiler_options)
-        call_args = tuple(sorted(options.items(), key=lambda x: x[0]))
-        return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
+        unflatted_args, unflatted_kwargs = jax_tree.tree_unflatten(args_tree, flat_args)
+        assert (not len(unflatted_kwargs)) and (len(unflatted_args) == 1)
+        options = self._make_compiler_options(unflatted_args[0])
+
+        # The values are stored inside `call_args` and `args_tree` stores the key.
+        call_args, args_tree = jax_tree.tree_flatten(options)
+        return tcache.StageTransformationSpec(
+            stage_id=id(self), call_args=tuple(call_args), args_tree=args_tree
+        )
 
     def _make_compiler_options(self, compiler_options: CompilerOptions | None) -> CompilerOptions:
         """Return the compilation options that should be used for compilation.
 
         See `JaCeLowered.compile()` to see how to influence them.
         """
+        assert isinstance(compiler_options, dict)
         return get_active_compiler_options() | (compiler_options or {})
 
 
@@ -311,30 +321,33 @@ class JaCeCompiled:
         csdfg: The compiled SDFG object.
         inp_names: Names of the SDFG variables used as inputs.
         out_names: Names of the SDFG variables used as outputs.
+        outtree: A pytree describing how to unflatten the output.
 
     Note:
         The class assumes ownership of its input arguments.
 
     Todo:
-        - Handle pytrees.
         - Automatic strides adaption.
     """
 
     _csdfg: dace_helper.CompiledSDFG
     _inp_names: tuple[str, ...]
     _out_names: tuple[str, ...]
+    _outtree: jax_tree.PyTreeDef
 
     def __init__(
-        self, csdfg: dace_helper.CompiledSDFG, inp_names: Sequence[str], out_names: Sequence[str]
+        self,
+        csdfg: dace_helper.CompiledSDFG,
+        inp_names: Sequence[str],
+        out_names: Sequence[str],
+        outtree: jax_tree.PyTreeDef,
     ) -> None:
-        # NOTE: We only check that we have output, we do not care about the input, since the
-        #  function `def foo(): return 1.0` is still a pure function, but we require that we have
-        #  output.
-        if not out_names:
-            raise ValueError("A jited function needs at least one output.")
+        if not (out_names or inp_names):
+            raise ValueError("No input nor output.")
         self._csdfg = csdfg
         self._inp_names = tuple(inp_names)
         self._out_names = tuple(out_names)
+        self._outtree = outtree
 
     def __call__(self, *args: Any, **kwargs: Any) -> Any:
         """Calls the embedded computation.
@@ -342,7 +355,11 @@ def __call__(self, *args: Any, **kwargs: Any) -> Any:
         The arguments must be the same as for the wrapped function, but with
         all static arguments removed.
         """
-        return dace_helper.run_jax_sdfg(self._csdfg, self._inp_names, self._out_names, args, kwargs)
+        flat_in_vals = jax_tree.tree_leaves((args, kwargs))
+        assert len(flat_in_vals) == len(self._inp_names), "Static arguments."
+        return dace_helper.run_jax_sdfg(
+            self._csdfg, self._inp_names, self._out_names, flat_in_vals, self._outtree
+        )
 
 
 #: Known compilation stages in JaCe.
diff --git a/src/jace/translator/pre_post_translation.py b/src/jace/translator/pre_post_translation.py
index be2c231..f4361ee 100644
--- a/src/jace/translator/pre_post_translation.py
+++ b/src/jace/translator/pre_post_translation.py
@@ -14,22 +14,25 @@
 from __future__ import annotations
 
 import copy
+import inspect
 from typing import TYPE_CHECKING, Any
 
 import dace
+import jax
+from jax import tree_util as jax_tree
 
 from jace import translator, util
 
 
 if TYPE_CHECKING:
-    from collections.abc import Callable, Sequence
+    from collections.abc import Callable, Mapping, Sequence
 
 
 def postprocess_jaxpr_sdfg(
     trans_ctx: translator.TranslationContext,
     fun: Callable,  # noqa: ARG001  # Currently unused
-    call_args: Sequence[Any],  # Currently unused
-    intree: None,  # noqa: ARG001  # Currently unused
+    call_args: Sequence[Any],
+    outtree: jax_tree.PyTreeDef,
 ) -> translator.TranslatedJaxprSDFG:
     """Perform the final post processing steps on the `TranslationContext` _in place_.
 
@@ -39,8 +42,8 @@ def postprocess_jaxpr_sdfg(
     Args:
         trans_ctx: The `TranslationContext` obtained from the `translate_jaxpr()` function.
         fun: The original function that was translated.
-        call_args: The linearized input arguments.
-        intree: The pytree describing the inputs.
+        call_args: The flattened input arguments.
+        outtree: A pytree describing how to unflatten the output.
 
     Todo:
         - Fixing the scalar input problem on GPU.
@@ -52,7 +55,7 @@ def postprocess_jaxpr_sdfg(
     # Handle inputs
     create_input_output_stages(trans_ctx=trans_ctx, call_args=call_args)
 
-    return finalize_translation_context(trans_ctx, validate=True)
+    return finalize_translation_context(trans_ctx, outtree=outtree, validate=True)
 
 
 def create_input_output_stages(
@@ -187,7 +190,7 @@ def _create_input_state(trans_ctx: translator.TranslationContext, call_args: Seq
 
 
 def finalize_translation_context(
-    trans_ctx: translator.TranslationContext, validate: bool = True
+    trans_ctx: translator.TranslationContext, outtree: jax_tree.PyTreeDef, validate: bool = True
 ) -> translator.TranslatedJaxprSDFG:
     """Finalizes the supplied translation context `trans_ctx`.
 
@@ -202,6 +205,7 @@ def finalize_translation_context(
 
     Args:
         trans_ctx: The context that should be finalized.
+        outtree: A pytree describing how to restore the output.
         validate: Call the validate function after the finalizing.
     """
     trans_ctx.validate()
@@ -215,15 +219,16 @@ def finalize_translation_context(
         sdfg=copy.deepcopy(trans_ctx.sdfg),
         inp_names=trans_ctx.inp_names,
         out_names=trans_ctx.out_names,
+        outtree=outtree,
     )
 
     # Make inputs and outputs to globals.
     sdfg_arg_names: list[str] = []
-    for glob_name in tsdfg.inp_names + tsdfg.out_names:
-        if glob_name in sdfg_arg_names:
+    for arg_name in tsdfg.inp_names + tsdfg.out_names:
+        if arg_name in sdfg_arg_names:
             continue
-        tsdfg.sdfg.arrays[glob_name].transient = False
-        sdfg_arg_names.append(glob_name)
+        tsdfg.sdfg.arrays[arg_name].transient = False
+        sdfg_arg_names.append(arg_name)
 
     # This forces the signature of the SDFG to include all arguments in order they appear.
     #  If an argument is used as input and output then it is only listed as input.
@@ -233,3 +238,53 @@ def finalize_translation_context(
         tsdfg.validate()
 
     return tsdfg
+
+
+def trace_and_flatten_function(
+    fun: Callable,
+    trace_call_args: Sequence[Any],
+    trace_call_kwargs: Mapping[str, Any],
+    trace_options: Mapping[str, Any],
+) -> tuple[jax.core.ClosedJaxpr, list[Any], jax_tree.PyTreeDef]:
+    """Traces `fun` and generates the Jaxpr as well as the input and output tree.
+
+    The function will perform the tracing using `trace_options`, which are the
+    same as supported by `jace.jit`. Furthermore the tracing is done with
+    x64 enabled.
+
+    Returns:
+        The function will return a tuple of length three.
+        1) The Jaxpr that was generated by tracing using the supplied arguments
+            and options.
+        2) The flattened input values.
+        3) A pytree describing the output structure.
+
+    Todo:
+        - Handle default arguments of `fun`.
+        - Handle static arguments.
+    """
+    if trace_options:
+        raise NotImplementedError(
+            f"Not supported tracing options: {', '.join(f'{k}' for k in trace_options)}"
+        )
+    assert all(param.default is param.empty for param in inspect.signature(fun).parameters.values())
+
+    # In Jax `float32` is the main datatype, and they go to great lengths to avoid some
+    #  aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
+    #  However, in this case we will have problems when we call the SDFG, for some reasons
+    #  `CompiledSDFG` does not work in that case correctly, thus we enable it for the tracing.
+    with jax.experimental.enable_x64():
+        # TODO(phimuell): copy the implementation of the real tracing, and not the debug one.
+        jaxpr, outshapes = jax.make_jaxpr(fun, return_shape=True)(
+            *trace_call_args, **trace_call_kwargs
+        )
+
+    # Regardless what the documentation of `make_jaxpr` claims, it does not output a pytree.
+    #  instead an abstract description of the shape, that we will transform into a pytree.
+    outtree = jax_tree.tree_structure(outshapes)
+
+    # Make the input tree
+    flat_in_vals = jax_tree.tree_leaves((trace_call_args, trace_call_kwargs))
+    assert len(jaxpr.in_avals) == len(flat_in_vals), "Static arguments not implemented."
+
+    return jaxpr, flat_in_vals, outtree
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 811cce9..524c1a2 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -8,10 +8,15 @@
 from __future__ import annotations
 
 import dataclasses
+from typing import TYPE_CHECKING
 
 import dace
 
 
+if TYPE_CHECKING:
+    from jax import tree_util as jax_tree
+
+
 @dataclasses.dataclass(kw_only=True, frozen=True)
 class TranslatedJaxprSDFG:
     """Encapsulates the translated SDFG together with the metadata that is needed to run it.
@@ -38,11 +43,13 @@ class TranslatedJaxprSDFG:
         sdfg: The encapsulated SDFG object.
         inp_names: A list of the SDFG variables that are used as input
         out_names: A list of the SDFG variables that are used as output.
+        outtree: A pytree describing how to unflatten the output.
     """
 
     sdfg: dace.SDFG
     inp_names: tuple[str, ...]
     out_names: tuple[str, ...]
+    outtree: jax_tree.PyTreeDef
 
     def validate(self) -> bool:
         """Validate the underlying SDFG."""
diff --git a/src/jace/util/dace_helper.py b/src/jace/util/dace_helper.py
index 458ec9f..a85b909 100644
--- a/src/jace/util/dace_helper.py
+++ b/src/jace/util/dace_helper.py
@@ -16,16 +16,14 @@
 
 import dace
 from dace import data as dace_data
-
-# The compiled SDFG is not available in the dace namespace or anywhere else
-#  Thus we import it here directly
 from dace.codegen.compiled_sdfg import CompiledSDFG
+from jax import tree_util as jax_tree
 
 from jace import util
 
 
 if TYPE_CHECKING:
-    from collections.abc import Mapping, Sequence
+    from collections.abc import Sequence
 
     from jace import translator
     from jace.util import dace_helper
@@ -76,8 +74,8 @@ def run_jax_sdfg(
     csdfg: dace_helper.CompiledSDFG,
     inp_names: Sequence[str],
     out_names: Sequence[str],
-    call_args: Sequence[Any],
-    call_kwargs: Mapping[str, Any],
+    flat_call_args: Sequence[Any],
+    outtree: jax_tree.PyTreeDef,
 ) -> tuple[Any, ...] | Any:
     """Run the compiled SDFG.
 
@@ -90,24 +88,18 @@ def run_jax_sdfg(
         csdfg: The `CompiledSDFG` object.
         inp_names: List of names of the input arguments.
         out_names: List of names of the output arguments.
-        call_args: All positional arguments of the call.
-        call_kwargs: All keyword arguments of the call.
+        flat_call_args: Flattened input arguments.
+        outtree: A pytree describing how to unflatten the output.
 
-    Note:
-        There is no pytree mechanism jet, thus the return values are returned
-        inside a `tuple` or in case of one value, directly, in the order
-        determined by Jax. As Jax JaCe does not return scalars, but only arrays.
+    Notes:
+        Currently the strides of the input arguments must match the ones that
+        were used for lowering.
     """
-    sdfg: dace.SDFG = csdfg.sdfg
-
-    if len(call_kwargs) != 0:
-        raise NotImplementedError("No kwargs are supported yet.")
-    if len(inp_names) != len(call_args):
+    if len(inp_names) != len(flat_call_args):
         raise RuntimeError("Wrong number of arguments.")
 
-    # Build the argument list that we will pass to the compiled object.
     sdfg_call_args: dict[str, Any] = {}
-    for in_name, in_val in zip(inp_names, call_args, strict=True):
+    for in_name, in_val in zip(inp_names, flat_call_args, strict=True):
         # TODO(phimuell): Implement a stride matching process.
         if util.is_jax_array(in_val):
             if not util.is_fully_addressable(in_val):
@@ -115,17 +107,17 @@ def run_jax_sdfg(
             in_val = in_val.__array__()
         sdfg_call_args[in_name] = in_val
 
-    for out_name, sdfg_array in ((out_name, sdfg.arrays[out_name]) for out_name in out_names):
+    arrays = csdfg.sdfg.arrays
+    for out_name, sdfg_array in ((out_name, arrays[out_name]) for out_name in out_names):
         if out_name in sdfg_call_args:
             if util.is_jax_array(sdfg_call_args[out_name]):
-                # Jax arrays are immutable, so they can not be return values too.
-                raise ValueError("Passed a Jax array as output.")
+                raise ValueError("Passed an immutable Jax array as output.")
         else:
             sdfg_call_args[out_name] = dace_data.make_array_from_descriptor(sdfg_array)
 
     assert len(sdfg_call_args) == len(csdfg.argnames), (
         "Failed to construct the call arguments,"
-        f" expected {len(csdfg.argnames)} but got {len(call_args)}."
+        f" expected {len(csdfg.argnames)} but got {len(flat_call_args)}."
         f"\nExpected: {csdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
     )
 
@@ -134,8 +126,6 @@ def run_jax_sdfg(
         dace.Config.set("compiler", "allow_view_arguments", value=True)
         csdfg(**sdfg_call_args)
 
-    # TODO(phimuell): Handle pytrees
     if not out_names:
         return None
-    ret_val: tuple[Any] = tuple(sdfg_call_args[out_name] for out_name in out_names)
-    return ret_val[0] if len(out_names) == 1 else ret_val
+    return jax_tree.tree_unflatten(outtree, (sdfg_call_args[out_name] for out_name in out_names))
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 5476dea..6664a36 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -20,11 +20,11 @@
 import collections
 import dataclasses
 import functools
-from collections.abc import Callable, Hashable
+from collections.abc import Callable, Hashable, Sequence
 from typing import TYPE_CHECKING, Any, Concatenate, Generic, ParamSpec, TypeAlias, TypeVar, cast
 
 import dace
-from jax import core as jax_core
+from jax import core as jax_core, tree_util as jax_tree
 
 from jace import util
 
@@ -68,7 +68,7 @@ def __init__(self) -> None:
 
     @abc.abstractmethod
     def _make_call_description(
-        self: CachingStage, *args: Any, **kwargs: Any
+        self: CachingStage, args_tree: jax_tree.PyTreeDef, flat_args: Sequence[Any]
     ) -> StageTransformationSpec:
         """Generates the key that is used to store/locate the call in the cache."""
         ...
@@ -95,7 +95,8 @@ def cached_transition(
 
     @functools.wraps(transition)
     def transition_wrapper(self: CachingStageType, *args: P.args, **kwargs: P.kwargs) -> NextStage:
-        key: StageTransformationSpec = self._make_call_description(*args, **kwargs)
+        flat_args, args_tree = jax_tree.tree_flatten((args, kwargs))
+        key = self._make_call_description(flat_args=flat_args, args_tree=args_tree)
         if key in self._cache:
             return self._cache[key]
         next_stage = transition(self, *args, **kwargs)
@@ -192,22 +193,26 @@ class StageTransformationSpec:
     State transition functions are annotated with `@cached_transition` and their
     result may be cached. They key to locate them inside the cache is represented
     by this class and computed by the `CachingStage._make_call_description()`
-    function. The actual key is consists of two parts, `stage_id` and `call_args`.
+    function. The actual key is consists of three parts, `stage_id`, `call_args`
+    and `args_tree`.
 
     Args:
         stage_id: Origin of the call, for which the id of the stage object should
             be used.
-        call_args: Description of the arguments of the call. There are two ways
-            to describe the arguments:
+        call_args: Flat representation of the arguments of the call. Each element
+            describes a single argument. To describe an argument there are two ways:
             - Abstract description: In this way, the actual value of the argument
                 is irrelevant, only the structure of them are important, similar
                 to the tracers used in Jax.
             - Concrete description: Here one caches on the actual value of the
                 argument. The only requirement is that they can be hashed.
+        args_tree: A pytree structure that describes how the input was flatten.
+                In Jax the hash of a pytree, takes its structure into account.
     """
 
     stage_id: int
     call_args: CallArgsSpec
+    args_tree: jax_tree.PyTreeDef
 
 
 # Denotes the stage that is stored inside the cache.
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index 7d06a2d..dee19bd 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -193,16 +193,16 @@ def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
     with disable_x64():
         jaxpr = jax.make_jaxpr(testee)(A, B)
 
+    _, flat_in_vals, outtree = ptrans.trace_and_flatten_function(
+        fun=testee, trace_call_args=(A, B), trace_call_kwargs={}, trace_options={}
+    )
     builder = translator.JaxprTranslationBuilder(
         primitive_translators=translator.get_registered_primitive_translators()
     )
     trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
 
     tsdfg: translator.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
-        trans_ctx=trans_ctx,
-        fun=testee,
-        call_args=(A, B),  # Already linearised, since we only accept positional args.
-        intree=None,  # Not yet implemented.
+        trans_ctx=trans_ctx, fun=testee, call_args=flat_in_vals, outtree=outtree
     )
 
     # Because x64 is disabled Jax traces the input as float32, even if we have passed

From c8c612cd042f5c3662b9a446001bf53be2fcb2d7 Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 12 Jun 2024 01:04:24 +0200
Subject: [PATCH 344/458] Update tooling configs.

---
 .github/dependabot.yml   |   8 +--
 .github/workflows/ci.yml |   4 +-
 .pre-commit-config.yaml  |  40 +++++++-------
 .readthedocs.yaml        |   2 +-
 CHANGELOG.md             |   2 +-
 CODING_GUIDELINES.md     |  45 +++++++++------
 CONTRIBUTING.md          |   2 +-
 README.md                |  23 ++++----
 ROADMAP.md               |  30 +++++-----
 noxfile.py               |  23 ++------
 pyproject.toml           | 115 +++++++++++++++++++++++++++------------
 src/jace/__init__.py     |   4 +-
 12 files changed, 169 insertions(+), 129 deletions(-)

diff --git a/.github/dependabot.yml b/.github/dependabot.yml
index 60f5aca..6fbe4e9 100644
--- a/.github/dependabot.yml
+++ b/.github/dependabot.yml
@@ -1,11 +1,11 @@
 version: 2
 updates:
   # Maintain dependencies for GitHub Actions
-- package-ecosystem: "github-actions"
-  directory: "/"
+- package-ecosystem: github-actions
+  directory: /
   schedule:
-    interval: "weekly"
+    interval: weekly
   groups:
     actions:
       patterns:
-      - "*"
+      - '*'
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 86a32f3..b065ed7 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -24,7 +24,7 @@ jobs:
         fetch-depth: 0
     - uses: actions/setup-python@v5
       with:
-        python-version: "3.x"
+        python-version: 3.x
     - uses: pre-commit/action@v3.0.1
       with:
         extra_args: --hook-stage manual --all-files
@@ -36,7 +36,7 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        python-version: ["3.10", "3.12"]
+        python-version: ['3.10', '3.12']
         runs-on: [ubuntu-latest, macos-latest, windows-latest]
 
     steps:
diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 13841be..9ff228d 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -2,30 +2,32 @@ default_language_version:
   python: python3.10
 
 ci:
-  autoupdate_commit_msg: "chore: update pre-commit hooks"
-  autofix_commit_msg: "style: pre-commit fixes"
+  autoupdate_commit_msg: 'chore: update pre-commit hooks'
+  autofix_commit_msg: 'style: pre-commit fixes'
 
 repos:
 - repo: https://github.com/macisamuele/language-formatters-pre-commit-hooks
-  rev: v2.6.0
+  rev: v2.13.0
   hooks:
   - id: pretty-format-ini
     args: [--autofix]
   - id: pretty-format-toml
-    args: [--autofix]
+    args: [--autofix, --indent, '2', --trailing-commas]
     additional_dependencies:
     - setuptools>=69.2.0
   - id: pretty-format-yaml
-    args: [--autofix, --preserve-quotes, --indent, "2"]
+    args: [--autofix, --indent, '2', --line-width, '100']
     additional_dependencies:
     - setuptools>=69.2.0
 
-- repo: https://github.com/pre-commit/mirrors-prettier
-  rev: "v3.1.0"
+- repo: https://github.com/executablebooks/mdformat
+  rev: 0.7.17
   hooks:
-  - id: prettier
-    types_or: [markdown, html, css, scss, javascript, json]
-    args: [--prose-wrap=preserve]
+  - id: mdformat
+    args: [--number]
+    additional_dependencies:
+    - mdformat-gfm
+    - mdformat-black
 
 - repo: https://github.com/Lucas-C/pre-commit-hooks
   rev: v1.1.9
@@ -33,10 +35,10 @@ repos:
   - id: insert-license
     exclude: ^\..*$
     types: [python]
-    args: [--comment-style, "|#|", --license-filepath, ./LICENSE_HEADER.txt]
+    args: [--comment-style, '|#|', --license-filepath, ./LICENSE_HEADER.txt]
 
 - repo: https://github.com/pre-commit/pre-commit-hooks
-  rev: "v4.6.0"
+  rev: v4.6.0
   hooks:
   - id: check-added-large-files
   - id: check-case-conflict
@@ -47,7 +49,7 @@ repos:
   - id: end-of-file-fixer
   - id: mixed-line-ending
   - id: name-tests-test
-    args: ["--pytest-test-first"]
+    args: [--pytest-test-first]
   - id: requirements-txt-fixer
   - id: trailing-whitespace
 
@@ -55,7 +57,7 @@ repos:
   rev: v0.4.6
   hooks:
   - id: ruff
-    args: ["--fix", "--show-fixes", "--preview"]
+    args: [--fix, --show-fixes, --preview]
   - id: ruff-format
 
 - repo: https://github.com/pre-commit/mirrors-mypy
@@ -70,12 +72,12 @@ repos:
     - numpy==1.26.4
     - pytest==8.2.1
 - repo: https://github.com/codespell-project/codespell
-  rev: "v2.2.6"
+  rev: v2.2.6
   hooks:
   - id: codespell
 
 - repo: https://github.com/shellcheck-py/shellcheck-py
-  rev: "v0.10.0.1"
+  rev: v0.10.0.1
   hooks:
   - id: shellcheck
 
@@ -88,13 +90,13 @@ repos:
     exclude: .pre-commit-config.yaml
 
 - repo: https://github.com/abravalheri/validate-pyproject
-  rev: "v0.16"
+  rev: v0.16
   hooks:
   - id: validate-pyproject
-    additional_dependencies: ["validate-pyproject-schema-store[all]"]
+    additional_dependencies: ['validate-pyproject-schema-store[all]']
 
 - repo: https://github.com/python-jsonschema/check-jsonschema
-  rev: "0.28.1"
+  rev: 0.28.1
   hooks:
   - id: check-dependabot
   - id: check-github-workflows
diff --git a/.readthedocs.yaml b/.readthedocs.yaml
index c27af52..c67fcdc 100644
--- a/.readthedocs.yaml
+++ b/.readthedocs.yaml
@@ -6,7 +6,7 @@ version: 2
 build:
   os: ubuntu-22.04
   tools:
-    python: "3.11"
+    python: '3.11'
 sphinx:
   configuration: docs/conf.py
 
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 5967d06..358cc1c 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -5,7 +5,7 @@ All notable changes to this project will be documented in this file.
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
 
-## [Unreleased] - 2024-04-12
+## \[Unreleased\] - 2024-04-12
 
 ### Added
 
diff --git a/CODING_GUIDELINES.md b/CODING_GUIDELINES.md
index c7c5d3c..889cbfb 100644
--- a/CODING_GUIDELINES.md
+++ b/CODING_GUIDELINES.md
@@ -7,8 +7,11 @@ We follow the [Google Python Style Guide][google-style-guide] with a few minor c
 We deviate from the [Google Python Style Guide][google-style-guide] only in the following points:
 
 - We use [`ruff-linter`][ruff-linter] instead of [`pylint`][pylint].
+
 - We use [`ruff-formatter`][ruff-formatter] for source code and imports formatting, which may work differently than indicated by the guidelines in section [_3. Python Style Rules_](https://google.github.io/styleguide/pyguide.html#3-python-style-rules). For example, maximum line length is set to 100 instead of 79 (although docstring lines should still be limited to 79).
+
 - According to subsection [_2.19 Power Features_](https://google.github.io/styleguide/pyguide.html#219-power-features), direct use of _power features_ (e.g. custom metaclasses, import hacks, reflection) should be avoided, but standard library classes that internally use these power features are accepted. Following the same spirit, we allow the use of power features in infrastructure code with similar functionality and scope as the Python standard library.
+
 - For readability purposes, when a docstring contains more than the required summary line, we prefer indenting the first line at the same cursor position as the first opening quote, although this is not explicitly considered in the doctring conventions described in subsection [_3.8.1 Docstrings_](https://google.github.io/styleguide/pyguide.html#381-docstrings). Example:
 
   ```python
@@ -26,7 +29,7 @@ We deviate from the [Google Python Style Guide][google-style-guide] only in the
 
 - According to subsection [_3.19.12 Imports For Typing_](https://google.github.io/styleguide/pyguide.html#31912-imports-for-typing), symbols from `typing` and `collections.abc` modules used in type annotations _"can be imported directly to keep common annotations concise and match standard typing practices"_. Following the same spirit, we allow symbols to be imported directly from third-party or internal modules when they only contain a collection of frequently used typying definitions.
 
-### Common questions
+### Language usage recommendations
 
 - `pass` vs `...` (`Ellipsis`)
 
@@ -35,15 +38,15 @@ We deviate from the [Google Python Style Guide][google-style-guide] only in the
   ```python
   # Correct use of `...` as the empty body of an abstract method
   class AbstractFoo:
-     @abstractmethod
-     def bar(self) -> Bar:
-        ...
+      @abstractmethod
+      def bar(self) -> Bar: ...
+
 
   # Correct use of `pass` when mixed with other statements
   try:
-     resource.load(id=42)
+      resource.load(id=42)
   except ResourceException:
-     pass
+      pass
   ```
 
 ### Error messages
@@ -53,7 +56,9 @@ Error messages should be written as sentences, starting with a capital letter an
 Examples:
 
 ```python
-raise ValueError(f"Invalid argument 'dimension': should be of type 'Dimension', got '{dimension.type}'.")
+raise ValueError(
+    f"Invalid argument 'dimension': should be of type 'Dimension', got '{dimension.type}'."
+)
 ```
 
 Interpolated integer values do not need double quotes, if they are indicating an amount. Example:
@@ -65,19 +70,25 @@ raise ValueError(f"Invalid number of arguments: expected 3 arguments, got {len(a
 The double quotes can also be dropped when presenting a sequence of values. In this case the message should be rephrased so the sequence is separated from the text by a colon ':'.
 
 ```python
-raise ValueError(f"unexpected keyword arguments: {', '.join(set(kwarg_names) - set(expected_kwarg_names))}.")
+raise ValueError(
+    f"unexpected keyword arguments: {', '.join(set(kwarg_names) - set(expected_kwarg_names))}."
+)
 ```
 
 The message should be kept to one sentence if reasonably possible. Ideally the sentence should be kept short and avoid unnecessary words. Examples:
 
 ```python
 # too many sentences
-raise ValueError(f"Received an unexpected number of arguments. Should receive 5 arguments, but got {len(args)}. Please provide the correct number of arguments.")
+raise ValueError(
+    f"Received an unexpected number of arguments. Should receive 5 arguments, but got {len(args)}. Please provide the correct number of arguments."
+)
 # better
 raise ValueError(f"Wrong number of arguments: expected 5, got {len(args)}.")
 
 # less extreme
-raise TypeError(f"Wrong argument type. Can only accept 'int's, got '{type(arg)}' instead.")
+raise TypeError(
+    f"Wrong argument type. Can only accept 'int's, got '{type(arg)}' instead."
+)
 # but can still be improved
 raise TypeError(f"Wrong argument type: 'int' expected, got '{type(arg)}'")
 ```
@@ -88,14 +99,14 @@ The terseness vs. helpfulness tradeoff should be more in favor of terseness for
 
 TODO: update to `autodoc2`
 
-We generate the API documentation automatically from the docstrings using [Sphinx][sphinx] and some extensions such as [Sphinx-autodoc][sphinx-autodoc] and [Sphinx-napoleon][sphinx-napoleon]. These follow the Google Python Style Guide docstring conventions to automatically format the generated documentation. A complete overview can be found here: [Example Google Style Python Docstrings](https://sphinxcontrib-napoleon.readthedocs.io/en/latest/example_google.html#example-google).
+We generate the API documentation automatically from the docstrings using [Sphinx] and some extensions such as [Sphinx-autodoc] and [Sphinx-napoleon]. These follow the Google Python Style Guide docstring conventions to automatically format the generated documentation. A complete overview can be found here: [Example Google Style Python Docstrings](https://sphinxcontrib-napoleon.readthedocs.io/en/latest/example_google.html#example-google).
 
 Sphinx supports the [reStructuredText][sphinx-rest] (reST) markup language for defining additional formatting options in the generated documentation, however section [_3.8 Comments and Docstrings_](https://google.github.io/styleguide/pyguide.html#38-comments-and-docstrings) of the Google Python Style Guide does not specify how to use markups in docstrings. As a result, we decided to forbid reST markup in docstrings, except for the following cases:
 
 - Cross-referencing other objects using Sphinx text roles for the [Python domain](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#the-python-domain) (as explained [here](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#python-roles)).
-- Very basic formatting markup to improve _readability_ of the generated documentation without obscuring the source docstring (e.g. ` ``literal`` ` strings, bulleted lists).
+- Very basic formatting markup to improve _readability_ of the generated documentation without obscuring the source docstring (e.g. ``` ``literal`` ``` strings, bulleted lists).
 
-We highly encourage the [doctest][doctest] format for code examples in docstrings. In fact, doctest runs code examples and makes sure they are in sync with the codebase.
+We highly encourage the [doctest] format for code examples in docstrings. In fact, doctest runs code examples and makes sure they are in sync with the codebase.
 
 ### Module structure
 
@@ -126,14 +137,16 @@ Consider configuration files as another type of source code and apply the same c
 You may occasionally need to disable checks from _quality assurance_ (QA) tools (e.g. linters, type checkers, etc.) on specific lines as some tool might not be able to fully understand why a certain piece of code is needed. This is usually done with special comments, e.g. `# noqa: F401`, `# type: ignore`. However, you should **only** ignore QA errors when you fully understand their source and rewriting your code to pass QA checks would make it less readable. Additionally, you should add a short descriptive code if possible (check [ruff rules][ruff-rules] and [mypy error codes][mypy-error-codes] for reference):
 
 ```python
-f = lambda: 'empty'  # noqa: E731 [lambda-assignment]
+f = lambda: "empty"  # noqa: E731 [lambda-assignment]
 ```
 
 and, if needed, a brief comment for future reference:
 
 ```python
 ...
-return undeclared_symbol  # noqa: F821 [undefined-name] on purpose to trigger black-magic
+return (
+    undeclared_symbol  # noqa: F821 [undefined-name] on purpose to trigger black-magic
+)
 ```
 
 ## Testing
@@ -144,9 +157,7 @@ Testing components is a critical part of a software development project. We foll
 
 [doctest]: https://docs.python.org/3/library/doctest.html
 [google-style-guide]: https://google.github.io/styleguide/pyguide.html
-[mypy]: https://mypy.readthedocs.io/
 [mypy-error-codes]: https://mypy.readthedocs.io/en/stable/error_code_list.html
-[pre-commit]: https://pre-commit.com/
 [pylint]: https://pylint.pycqa.org/
 [ruff-formatter]: https://docs.astral.sh/ruff/formatter/
 [ruff-linter]: https://docs.astral.sh/ruff/linter/
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index e3dc26e..19d5adb 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -98,7 +98,7 @@ Before submitting a pull request, check that it meets the following criteria:
 3. The pull request should have a proper description of its intent and the main changes in the code. In general this description should be used as commit message if the pull request is approved (check point **5.** below).
 4. If the pull request contains code authored by first-time contributors, they should add their names to the [AUTHORS.md](AUTHORS.md) file.
 5. Pick one reviewer and try to contact them directly to let them know about the pull request. If there is no feedback in 24h/48h try to contact them again or pick another reviewer.
-6. Once the pull request has been approved, it should be squash-merged as soon as possible with a meaningful description of the changes. We use the [Conventional Commits][https://www.conventionalcommits.org/en/v1.0.0/#summary] specification for writing informative and automation-friendly commit messages. The following _commit types_ are accepted:
+6. Once the pull request has been approved, it should be squash-merged as soon as possible with a meaningful description of the changes. We use the [Conventional Commits](https://www.conventionalcommits.org/en/v1.0.0/#summary) specification for writing informative and automation-friendly commit messages. The following _commit types_ are accepted:
    - `build`: changes that affect the build system or external dependencies
    - `chore`: changes related to the development tools or process
    - `ci`: changes to our CI configuration files and scripts
diff --git a/README.md b/README.md
index f17b970..86e7f31 100644
--- a/README.md
+++ b/README.md
@@ -19,17 +19,14 @@ The DaCe project aims to build new representations for programs and algorithms,
 
 <!-- SPHINX-START -->
 
-<!-- prettier-ignore-start -->
-[actions-badge]:            https://github.com/GridTools/JaCe/workflows/CI/badge.svg
-[actions-link]:             https://github.com/GridTools/JaCe/actions
-[conda-badge]:              https://img.shields.io/conda/vn/conda-forge/JaCe
-[conda-link]:               https://github.com/conda-forge/JaCe-feedstock
+[actions-badge]: https://github.com/GridTools/JaCe/workflows/CI/badge.svg
+[actions-link]: https://github.com/GridTools/JaCe/actions
+[conda-badge]: https://img.shields.io/conda/vn/conda-forge/JaCe
+[conda-link]: https://github.com/conda-forge/JaCe-feedstock
 [github-discussions-badge]: https://img.shields.io/static/v1?label=Discussions&message=Ask&color=blue&logo=github
-[github-discussions-link]:  https://github.com/GridTools/JaCe/discussions
-[pypi-link]:                https://pypi.org/project/JaCe/
-[pypi-platforms]:           https://img.shields.io/pypi/pyversions/JaCe
-[pypi-version]:             https://img.shields.io/pypi/v/JaCe
-[rtd-badge]:                https://readthedocs.org/projects/JaCe/badge/?version=latest
-[rtd-link]:                 https://JaCe.readthedocs.io/en/latest/?badge=latest
-
-<!-- prettier-ignore-end -->
+[github-discussions-link]: https://github.com/GridTools/JaCe/discussions
+[pypi-link]: https://pypi.org/project/JaCe/
+[pypi-platforms]: https://img.shields.io/pypi/pyversions/JaCe
+[pypi-version]: https://img.shields.io/pypi/v/JaCe
+[rtd-badge]: https://readthedocs.org/projects/JaCe/badge/?version=latest
+[rtd-link]: https://JaCe.readthedocs.io/en/latest/?badge=latest
diff --git a/ROADMAP.md b/ROADMAP.md
index 2beaa39..ec14397 100644
--- a/ROADMAP.md
+++ b/ROADMAP.md
@@ -9,23 +9,23 @@ A kind of roadmap that gives a rough idea about how the project will be continue
   - [ ] Implementing the `stages` model that is supported by Jax.
   - [ ] Handling Jax arrays as native input (only on single host).
   - [ ] Cache the compilation and lowering results for later reuse.
-        In Jax these parts (together with the dispatch) are actually written in C++, thus in the beginning we will use a self made cache.
+    In Jax these parts (together with the dispatch) are actually written in C++, thus in the beginning we will use a self made cache.
 - [ ] Implementing some basic `PrimitiveTranslators`, that allows us to run some early tests, such as:
   - [ ] Backporting the ones from the prototype.
   - [ ] Implement the `scatter` primitive (needed for pyhpc).
   - [ ] Implement the `scan` primitive (needed for pyhpc).
 - [ ] _Initial_ optimization pipeline
-      In order to do benchmarks, we need to perform optimizations first.
-      However, the one offered by DaCe were not that well, so we should, for now, backport the ones from the prototype.
+  In order to do benchmarks, we need to perform optimizations first.
+  However, the one offered by DaCe were not that well, so we should, for now, backport the ones from the prototype.
 - [ ] Support GPU code (relatively simple, but needs some detection logic).
 - [ ] Initial benchmark:
-      In the beginning we will not have the same dispatching performance as Jax.
-      But passing these benchmarks could give us some better hint of how to proceed in this matter.
+  In the beginning we will not have the same dispatching performance as Jax.
+  But passing these benchmarks could give us some better hint of how to proceed in this matter.
   - [ ] Passing the [pyhpc-benchmark](https://github.com/dionhaefner/pyhpc-benchmarks)
   - [ ] Passing Felix' fluid project; possibility.
 - [ ] Support of static arguments.
 - [ ] Stop relying on `jax.make_jaxpr()`.
-      Look at the `jax._src.pjit.make_jit()` function for how to hijack the staging process.
+  Look at the `jax._src.pjit.make_jit()` function for how to hijack the staging process.
 - [ ] Implementing more advanced primitives:
   - [ ] Handling pytrees as arguments.
   - [ ] Implement random numbers.
@@ -44,15 +44,15 @@ These are more general topics that should be addressed at one point.
 - [ ] Integrating better with Jax
   - [ ] Support its array type (probably implement this in DaCe).
 - [ ] Increase the dispatching speed + Cache
-      Jax does this in C++, which is impossible to beat in Python, thus we have to go that root as well.
+  Jax does this in C++, which is impossible to beat in Python, thus we have to go that root as well.
 - [ ] Debugging information.
 - [ ] Dynamic shapes
-      This could be done by making the inputs fully dynamic, and then use the primitives to simplify.
-      For example in an addition the shape of the two inputs and the outputs are the same.
-      That is knowledge that is inherent to the primitives itself.
-      However, the compiled object must know how to extract the sizes itself.
+  This could be done by making the inputs fully dynamic, and then use the primitives to simplify.
+  For example in an addition the shape of the two inputs and the outputs are the same.
+  That is knowledge that is inherent to the primitives itself.
+  However, the compiled object must know how to extract the sizes itself.
 - [ ] Defining a Logo:
-      It should be green with a nice curly font.
+  It should be green with a nice curly font.
 
 # Optimization & Transformations
 
@@ -61,7 +61,7 @@ Our experiments with the prototype showed that the most important transformation
 
 - [ ] Modified state fusion; Because of the structure we have, this could make `Simplify` much more efficient.
 - [ ] Trivial Tasklet removal.
-      Since we will work a lot with Maps that are trivial (probably the best structure for fusing) we will end up with some of trivial Tasklets, i.e. `__out = __in`.
-      Thus, we should have a good way to get rid of them.
+  Since we will work a lot with Maps that are trivial (probably the best structure for fusing) we will end up with some of trivial Tasklets, i.e. `__out = __in`.
+  Thus, we should have a good way to get rid of them.
 - [ ] Modified Map fusion transformation.
-      We should still support parallel and serial fusion as the prototype did, but focusing on serial.
+  We should still support parallel and serial fusion as the prototype did, but focusing on serial.
diff --git a/noxfile.py b/noxfile.py
index 3772f2d..6c53e26 100644
--- a/noxfile.py
+++ b/noxfile.py
@@ -16,28 +16,21 @@
 
 @nox.session
 def lint(session: nox.Session) -> None:
-    """
-    Run the linter.
-    """
+    """Run the linter."""
     session.install("pre-commit")
     session.run("pre-commit", "run", "--all-files", "--show-diff-on-failure", *session.posargs)
 
 
 @nox.session
 def tests(session: nox.Session) -> None:
-    """
-    Run the unit and regular tests.
-    """
+    """Run the unit and regular tests."""
     session.install(".[test]")
     session.run("pytest", *session.posargs)
 
 
 @nox.session(reuse_venv=True)
 def docs(session: nox.Session) -> None:
-    """
-    Build the docs. Pass "--serve" to serve. Pass "-b linkcheck" to check links.
-    """
-
+    """Build the docs. Pass "--serve" to serve. Pass "-b linkcheck" to check links."""
     parser = argparse.ArgumentParser()
     parser.add_argument("--serve", action="store_true", help="Serve after building")
     parser.add_argument("-b", dest="builder", default="html", help="Build target (default: html)")
@@ -72,10 +65,7 @@ def docs(session: nox.Session) -> None:
 
 @nox.session
 def build_api_docs(session: nox.Session) -> None:
-    """
-    Build (regenerate) API docs.
-    """
-
+    """Build (regenerate) API docs."""
     session.install("sphinx")
     session.chdir("docs")
     session.run(
@@ -91,10 +81,7 @@ def build_api_docs(session: nox.Session) -> None:
 
 @nox.session
 def build(session: nox.Session) -> None:
-    """
-    Build an SDist and wheel.
-    """
-
+    """Build an SDist and wheel."""
     build_path = DIR.joinpath("build")
     if build_path.exists():
         shutil.rmtree(build_path)
diff --git a/pyproject.toml b/pyproject.toml
index 3556e8a..5026706 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,10 +1,12 @@
 [build-system]
 build-backend = "setuptools.build_meta"
-requires = ["setuptools>=61"]
+requires = [
+  "setuptools>=61",
+]
 
 [project]
 authors = [
-  {name = "ETH Zurich", email = "gridtools@cscs.ch"}
+  {name = "ETH Zurich", email = "gridtools@cscs.ch"},
 ]
 classifiers = [
   "Development Status :: 1 - Planning",
@@ -19,12 +21,12 @@ classifiers = [
   "Programming Language :: Python :: 3.11",
   "Programming Language :: Python :: 3.12",
   "Topic :: Scientific/Engineering",
-  "Typing :: Typed"
+  "Typing :: Typed",
 ]
 dependencies = [
   "dace>=0.15",
   "jax[cpu]>=0.4.24",
-  "numpy>=1.26.0"
+  "numpy>=1.26.0",
 ]
 description = "JAX jit using DaCe (Data Centric Parallel Programming)"
 name = "JaCe"
@@ -37,7 +39,7 @@ license.file = "LICENSE"
 cuda12 = [
   "cupy-cuda12x>=12.1.0",
   "jax[cuda12]>=0.4.24",
-  "optuna>=3.4.0"
+  "optuna>=3.4.0",
 ]
 
 [project.urls]
@@ -49,7 +51,7 @@ Homepage = "https://github.com/GridTools/JaCe"
 [tool.coverage]
 report.exclude_also = [
   '\.\.\.',
-  'if typing.TYPE_CHECKING:'
+  'if typing.TYPE_CHECKING:',
 ]
 run.source = ["jace"]
 
@@ -76,21 +78,22 @@ warn_unused_ignores = true
 disallow_incomplete_defs = false
 disallow_untyped_defs = false
 ignore_missing_imports = true
-module = ["tests.*", "dace.*", "jax.*", "jaxlib.*"]
+module = [
+  "tests.*",
+  "dace.*",
+  "jax.*",
+  "jaxlib.*",
+]
 
 # -- pytest  --
 [tool.pytest]
 
 [tool.pytest.ini_options]
 addopts = ["-ra", "--showlocals", "--strict-markers", "--strict-config"]
-filterwarnings = [
-  "error"
-]
+filterwarnings = ["error"]
 log_cli_level = "INFO"
 minversion = "6.0"
-testpaths = [
-  "tests"
-]
+testpaths = ["tests"]
 xfail_strict = true
 
 # -- ruff --
@@ -104,16 +107,24 @@ src = ["src"]
 docstring-code-format = true
 
 [tool.ruff.lint]
+extend-safe-fixes = ["D", "TCH"]
 extend-select = [
   "A",  # flake8-builtins
   "B",  # flake8-bugbear
   "I",  # isort
   "G",  # flake8-logging-format
+  "N",  # pep8-naming
+  "W",  # pycodestyle-warning
   "C4",  # flake8-comprehensions
+  "C90",  # mccabe
+  "D",  # pydocstyle
+  "D213",  # multi-line-summary-second-line (off by default in pydocstyle "google' convention)
   "PT",  # flake8-pytest-style
+  "TD",  # flake8-todo
   "UP",  # pyupgrade       # TODO: in evaluation
   "ARG",  # flake8-unused-arguments
   "ERA",  # eradicate
+  "FLY",  # flynt
   "ICN",  # flake8-import-conventions
   "PGH",  # pygrep-hooks
   "PIE",  # flake8-pie
@@ -121,46 +132,80 @@ extend-select = [
   "RET",  # flake8-return   # TODO: in evaluation
   "RUF",  # Ruff-specific
   "SIM",  # flake8-simplify # TODO: in evaluation
+  "SLOT",  # flake8-slots
   "T10",  # flake8-debugger
-  "T20",  # flake8-print    # TODO: in evaluation
+  "T20",  # flake8-print
   "TCH",  # flake8-type-checking  # TODO: in evaluation
-  "NPY"  # NumPy specific rules
+  "NPY",  # NumPy specific rules
 ]
 ignore = [
-  'B905',  # [zip-without-explicit-strict]
-  'E501',  # [line-too-long]
-  'UP038'  # [non-pep604-isinstance]
+  "B905",  # [zip-without-explicit-strict]
+  "D105",  # undocumented-magic-method
+  "D107",  # [undocumented-public-init]
+  "D212",  # [multi-line-summary-first-line]
+  "E501",  # [line-too-long]
+  "TCH003",  # [typing-only-standard-library-import]
+  "TD003",  # [missing-todo-link]
+  "UP038",  # [non-pep604-isinstance]
 ]
+task-tags = ["TODO"]
 # ignore-init-module-imports = true  # deprecated in preview mode
 unfixable = []
 
 [tool.ruff.lint.isort]
 combine-as-imports = true
-known-first-party = ['jace']
+known-first-party = ["jace"]
 known-third-party = [
-  'cupy',
-  'dace',
-  'jax',
-  'numpy',
-  'pytest',
-  'typing_extensions'
+  "cupy",
+  "dace",
+  "jax",
+  "numpy",
+  "pytest",
+  "typing_extensions",
 ]
 lines-after-imports = 2
 order-by-type = true
 required-imports = ["from __future__ import annotations"]
 section-order = [
-  'future',
-  'standard-library',
-  'third-party',
-  'first-party',
-  'tests',
-  'local-folder'
+  "future",
+  "standard-library",
+  "third-party",
+  "first-party",
+  "tests",
+  "local-folder",
 ]
 
 [tool.ruff.lint.isort.sections]
-tests = ["tests", "unit_tests", "integration_tests"]
+tests = [
+  "tests",
+  "unit_tests",
+  "integration_tests",
+]
+
+[tool.ruff.lint.mccabe]
+max-complexity = 12
 
 [tool.ruff.lint.per-file-ignores]
-"!tests/**.py" = ["PT"]  # Ignore `flake8-pytest-style` everywhere except in `tests/`
-"noxfile.py" = ["T20"]  # Ignore `flake8-print`
-"tests/**" = ["T10", "T20"]  # Ignore `flake8-debugger` and `flake8-print`
+"!tests/**.py" = ["PT"]  # Ignore `flake8-pytest-style` outside `tests/`
+"docs/**" = [
+  "D",  # pydocstyle
+  "T10",  # flake8-debugger
+  "T20",  # flake8-print
+]
+"noxfile.py" = [
+  "D",  # pydocstyle
+  "T20",  # flake8-print
+]
+"tests/**" = [
+  "D",  # pydocstyle
+  "T10",  # flake8-debugger
+  "T20",  # flake8-print
+]
+
+[tool.ruff.lint.pycodestyle]
+ignore-overlong-task-comments = true
+max-doc-length = 88
+
+[tool.ruff.lint.pydocstyle]
+convention = "google"
+ignore-decorators = ["typing.overload"]
diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 56f6505..ebc8a4f 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -5,9 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""
-JaCe: JAX jit using DaCe (Data Centric Parallel Programming)
-"""
+"""JaCe: JAX jit using DaCe (Data Centric Parallel Programming)."""
 
 from __future__ import annotations
 

From 478840598d88eb55d87114ccbf883c1a65e9858b Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 12 Jun 2024 10:57:15 +0200
Subject: [PATCH 345/458] Update hooks versions

---
 .pre-commit-config.yaml | 16 ++++++++++------
 1 file changed, 10 insertions(+), 6 deletions(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 9ff228d..10c71ef 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -30,10 +30,14 @@ repos:
     - mdformat-black
 
 - repo: https://github.com/Lucas-C/pre-commit-hooks
-  rev: v1.1.9
+  rev: v1.5.5
   hooks:
   - id: insert-license
-    exclude: ^\..*$
+    exclude: |
+      (?x)^(
+          ^\..*$ |
+          noxfile.py
+      )$
     types: [python]
     args: [--comment-style, '|#|', --license-filepath, ./LICENSE_HEADER.txt]
 
@@ -54,7 +58,7 @@ repos:
   - id: trailing-whitespace
 
 - repo: https://github.com/astral-sh/ruff-pre-commit
-  rev: v0.4.6
+  rev: v0.4.8
   hooks:
   - id: ruff
     args: [--fix, --show-fixes, --preview]
@@ -72,7 +76,7 @@ repos:
     - numpy==1.26.4
     - pytest==8.2.1
 - repo: https://github.com/codespell-project/codespell
-  rev: v2.2.6
+  rev: v2.3.0
   hooks:
   - id: codespell
 
@@ -90,13 +94,13 @@ repos:
     exclude: .pre-commit-config.yaml
 
 - repo: https://github.com/abravalheri/validate-pyproject
-  rev: v0.16
+  rev: v0.18
   hooks:
   - id: validate-pyproject
     additional_dependencies: ['validate-pyproject-schema-store[all]']
 
 - repo: https://github.com/python-jsonschema/check-jsonschema
-  rev: 0.28.1
+  rev: 0.28.5
   hooks:
   - id: check-dependabot
   - id: check-github-workflows

From 414c55f195efdbe38dce44d5d044af2ba0289e9e Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 12 Jun 2024 11:06:30 +0200
Subject: [PATCH 346/458] Fix code style in markdown file

---
 CODING_GUIDELINES.md | 4 +---
 1 file changed, 1 insertion(+), 3 deletions(-)

diff --git a/CODING_GUIDELINES.md b/CODING_GUIDELINES.md
index 889cbfb..5fd7e00 100644
--- a/CODING_GUIDELINES.md
+++ b/CODING_GUIDELINES.md
@@ -144,9 +144,7 @@ and, if needed, a brief comment for future reference:
 
 ```python
 ...
-return (
-    undeclared_symbol  # noqa: F821 [undefined-name] on purpose to trigger black-magic
-)
+return undeclared  # noqa: F821 [undefined-name] on purpose to trigger black-magic
 ```
 
 ## Testing

From 8cec4113172a4cad11a32343aa613f085944dd39 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 12 Jun 2024 11:07:54 +0200
Subject: [PATCH 347/458] Made some cleaning to the pytree implementation.

It also partially cleans the tracing stuff.
---
 src/jace/api.py                              |  11 +-
 src/jace/stages.py                           | 191 ++++++++++---------
 src/jace/translator/pre_post_translation.py  |  86 +++++----
 src/jace/translator/translated_jaxpr_sdfg.py |  13 +-
 src/jace/util/dace_helper.py                 |  43 +++--
 src/jace/util/translation_cache.py           | 102 +++++-----
 6 files changed, 250 insertions(+), 196 deletions(-)

diff --git a/src/jace/api.py b/src/jace/api.py
index 81dad1f..58a0a93 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -51,17 +51,18 @@ def jit(
 ) -> stages.JaCeWrapped | Callable[[Callable], stages.JaCeWrapped]:
     """JaCe's replacement for `jax.jit` (just-in-time) wrapper.
 
-    It works the same way as `jax.jit` does, but instead of using XLA the
-    computation is lowered to DaCe. In addition it accepts some JaCe specific
-    arguments.
+    It works the same way as `jax.jit` does, but instead of lowering the
+    computation to XLA, it is lowered to DaCe.
+    The function supports a subset of the arguments that are accepted by `jax.jit()`,
+    currently none, and some JaCe specific ones.
 
     Args:
         primitive_translators: Use these primitive translators for the lowering
             to SDFG. If not specified the translators in the global registry are
             used.
 
-    Notes:
-        After constructions any change to `primitive_translators` has no effect.
+    Note:
+        This function is the only valid way to obtain a JaCe computation.
     """
     if kwargs:
         # TODO(phimuell): Add proper name verification and exception type.
diff --git a/src/jace/stages.py b/src/jace/stages.py
index e9488da..359063b 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -7,29 +7,28 @@
 """Reimplementation of the `jax.stages` module.
 
 This module reimplements the public classes of that Jax module.
-However, they are a bit different, because JaCe uses DaCe as backend.
+However, because JaCe uses DaCe as backend they differ is some small aspects.
 
 As in Jax JaCe has different stages, the terminology is taken from
 [Jax' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
 - Stage out:
-    In this phase an executable Python function is translated to Jaxpr.
+    In this phase an executable Python function is translated to a Jaxpr.
 - Lower:
-    This will transform the Jaxpr into an SDFG equivalent. As a implementation
-    note, currently this and the previous step are handled as a single step.
+    This will transform the Jaxpr into its SDFG equivalent.
 - Compile:
-    This will turn the SDFG into an executable object, see `dace.codegen.CompiledSDFG`.
+    This will turn the SDFG into an executable object.
 - Execution:
     This is the actual running of the computation.
 
-As in Jax the `stages` module give access to the last three stages, but not
-the first one.
+As in Jax the in JaCe the user only has access to the last tree stages and
+staging out and lowering is handled as a single step.
 """
 
 from __future__ import annotations
 
 import copy
 import inspect
-from typing import TYPE_CHECKING, Any
+from typing import TYPE_CHECKING, Any, Union
 
 from jax import tree_util as jax_tree
 
@@ -57,10 +56,13 @@
 
 These options are used by `JaCeLowered.compile()` to determine which options
 are forwarded to the underlying `jace_optimize()` function. It is initialized
-to `jace.optimization.DEFAULT_OPTIMIZATIONS` and can be managed through
-`update_active_compiler_options()`.
+to `jace.optimization.DEFAULT_OPTIMIZATIONS` and can be managed through the
+`update_active_compiler_options()` function.
 """
 
+#: Known compilation stages in JaCe.
+Stage = Union["JaCeWrapped", "JaCeLowered", "JaCeCompiled"]
+
 
 class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
     """A function ready to be specialized, lowered, and compiled.
@@ -68,16 +70,19 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
     This class represents the output of functions such as `jace.jit()` and is
     the first stage in the translation/compilation chain of JaCe. A user should
     never create a `JaCeWrapped` object directly, instead `jace.jit` should be
-    used for that. While it supports just-in-time lowering and compilation, by
-    just calling it, these steps can also be performed explicitly. The lowering
-    performed by this stage is cached, thus if a `JaCeWrapped` object is lowered
-    later, with the same argument the result is taken from the cache.
+    used. While it supports just-in-time lowering and compilation, by just
+    calling it, these steps can also be performed explicitly.
+    The lowering, performed by this stage is cached, thus if a `JaCeWrapped`
+    object is later lowered with the same arguments the result might be taken
+    from the cache.
+
     Furthermore, a `JaCeWrapped` object is composable with all Jax transformations.
 
     Args:
         fun: The function that is wrapped.
-        primitive_translators: The list of primitive translators that that should be used.
-        jit_options: Options to influence the jit process.
+        primitive_translators: The list of primitive translators that should
+            be used for the lowering to SDFG.
+        jit_options: Options to control the lowering process.
 
     Todo:
         - Support keyword arguments and default values of the wrapped function.
@@ -111,37 +116,44 @@ def __init__(
         self._fun = fun
 
     def __call__(self, *args: Any, **kwargs: Any) -> Any:
-        """Executes the wrapped function, lowering and compiling as needed in one step.
+        """Executes the wrapped function.
+
+        This function will lower and compile in one go.
+        The function accepts the same arguments as the original computation.
 
-        The arguments passed to this function are the same as the wrapped function uses.
+        Note:
+            This function is also aware if a Jax tracing is going on. In this
+            case, it will not lower and compile but forward the call to the
+            wrapped Python function.
         """
-        # If we are inside a traced context, then we forward the call to the wrapped function.
-        #  This ensures that JaCe is composable with Jax.
         if util.is_tracing_ongoing(*args, **kwargs):
             return self._fun(*args, **kwargs)
 
         lowered = self.lower(*args, **kwargs)
         compiled = lowered.compile()
+        # TODO(phimuell): Filter out static arguments
         return compiled(*args, **kwargs)
 
     @tcache.cached_transition
     def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
-        """Lower this function explicitly for the given arguments.
+        """Lower the wrapped computation for the given arguments.
+
+        This function accepts the same arguments as the original computation does.
 
         Performs the first two steps of the AOT steps described above, i.e.
         trace the wrapped function with the given arguments and stage it out
-        to a Jaxpr. Then translate it to SDFG. The result is encapsulated
+        to a Jaxpr. Then translate it to an SDFG. The result is encapsulated
         inside a `JaCeLowered` object which can later be compiled.
 
+        It should be noted that the current lowering process will hard code
+        the strides and the storage location of the input inside the SDFG.
+        Thus if the SDFG is lowered with arrays in C order, calling the compiled
+        SDFG with FORTRAN order will result in an error.
+
         Note:
-            The call to the function is cached. As key an abstract description
-            of the call, similar to the tracers used by Jax, is used.
             The tracing is always done with activated `x64` mode.
         """
-        if len(kwargs) != 0:
-            raise NotImplementedError("Currently only positional arguments are supported.")
-
-        jaxpr, flat_in_vals, outtree = ptrans.trace_and_flatten_function(
+        jaxpr, flat_call_args, outtree = ptrans.trace_and_flatten_function(
             fun=self._fun,
             trace_call_args=args,
             trace_call_kwargs=kwargs,
@@ -152,7 +164,7 @@ def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
         )
         trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
         tsdfg: translator.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
-            trans_ctx=trans_ctx, fun=self.wrapped_fun, call_args=flat_in_vals, outtree=outtree
+            trans_ctx=trans_ctx, fun=self.wrapped_fun, call_args=flat_call_args, outtree=outtree
         )
 
         # NOTE: `tsdfg` is deepcopied as a side effect of post processing.
@@ -164,15 +176,22 @@ def wrapped_fun(self) -> Callable:
         return self._fun
 
     def _make_call_description(
-        self, args_tree: jax_tree.PyTreeDef, flat_args: Sequence[Any]
+        self, intree: jax_tree.PyTreeDef, flat_call_args: Sequence[Any]
     ) -> tcache.StageTransformationSpec:
-        """This function computes the key for the `JaCeWrapped.lower()` call inside the cache.
+        """Generates the key used to cache lowering calls.
+
+        For all non static arguments the function will generate an abstract
+        description of an argument and for all static arguments the concrete
+        value.
 
-        The function will compute a full abstract description on its argument.
+        Notes:
+            The abstract description also includes storage location, i.e. if
+            on CPU or on GPU, and the strides of the arrays.
         """
-        call_args = tuple(tcache._AbstractCallArgument.from_value(x) for x in flat_args)
+        # TODO(phimuell): Implement static arguments
+        flat_call_args = tuple(tcache._AbstractCallArgument.from_value(x) for x in flat_call_args)
         return tcache.StageTransformationSpec(
-            stage_id=id(self), call_args=tuple(call_args), args_tree=args_tree
+            stage_id=id(self), flat_call_args=tuple(flat_call_args), intree=intree
         )
 
 
@@ -181,24 +200,20 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
 
     This class is the output type of `JaCeWrapped.lower()` and represents the
     originally wrapped computation as an SDFG. This stage is followed by the
-    `JaCeCompiled` stage, by calling `self.compile()`.
+    `JaCeCompiled` stage, by calling `self.compile()`. A user should never
+    directly construct a `JaCeLowered` object directly, instead
+    `JaCeWrapped.lower()` should be used.
 
-    Before the SDFG is optimized the SDFG is optimized, see `JaCeLowered.compile()`
-    for more information on this topic.
+    Before the SDFG is compiled it is optimized, see `JaCeLowered.compile()` for
+    how to control the process.
 
     Args:
-        tsdfg:  The lowered SDFG with metadata. Must be finalized.
+        tsdfg:  The lowered SDFG with metadata.
 
     Note:
-        `self` will manage the passed `tsdfg` object. Modifying it results in
+        `self` will manage the passed `tsdfg` object. Modifying it results is
         undefined behavior. Although `JaCeWrapped` is composable with Jax
-        transformations `JaCeLowered` is not. A user should never create such
-        an object, instead `JaCeWrapped.lower()` should be used.
-        The storage location and stride of an input (in addition to its shape
-        and data type) are hard coded into the SDFG. Thus, if a certain stride
-        was used for lowering a computation, that stride must also be used
-        when the SDFG is called. If the just in time compilation mode is used
-        JaCe will take care of this.
+        transformations `JaCeLowered` is not.
     """
 
     _translated_sdfg: translator.TranslatedJaxprSDFG
@@ -211,16 +226,16 @@ def __init__(self, tsdfg: translator.TranslatedJaxprSDFG) -> None:
     def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled:
         """Optimize and compile the lowered SDFG and return a `JaCeCompiled` object.
 
-        This is the transition function of this stage. Before the SDFG is
-        compiled, it will be optimized using `jace_optimize()`. The options
-        used for this consists of two parts. First there is the (global) set of
-        currently active compiler options, which is then merged with the options
-        passed through `compiler_options`, which take precedence. Thus
-        `compiler_options` describes the delta from the current active set of options.
+        Before the SDFG is compiled, it will be optimized using `jace_optimize()`.
+        There are two different sources of these options. The first one is the
+        global set of currently active compiler options. The second one is the
+        options that are passed to this function, which takes precedence. Thus,
+        the `compiler_options` argument of this function describes the difference
+        from the currently active global options.
 
         See also:
             `get_active_compiler_options()` to inspect the set of currently active
-            options and `update_active_compiler_options()` to modify the set.
+            options and `update_active_compiler_options()` to modify them.
         """
         # We **must** deepcopy before we do any optimization, because all optimizations are in
         #  place, however, to properly cache stages, stages needs to be immutable.
@@ -238,17 +253,14 @@ def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprS
         """Returns the internal SDFG.
 
         The function returns a `TranslatedJaxprSDFG` object. Direct modification
-        of the returned object is forbidden and will cause undefined behaviour.
+        of the returned object is forbidden and results in undefined behaviour.
         """
         if (dialect is None) or (dialect.upper() == "SDFG"):
             return self._translated_sdfg
         raise ValueError(f"Unknown dialect '{dialect}'.")
 
     def view(self, filename: str | None = None) -> None:
-        """Runs the `view()` method of the underlying SDFG.
-
-        This will open a browser and display the SDFG.
-        """
+        """Runs the `view()` method of the underlying SDFG."""
         self.compiler_ir().sdfg.view(filename=filename, verbose=False)
 
     def as_sdfg(self) -> dace.SDFG:
@@ -259,29 +271,26 @@ def as_sdfg(self) -> dace.SDFG:
         return self.compiler_ir().sdfg
 
     def _make_call_description(
-        self, args_tree: jax_tree.PyTreeDef, flat_args: Sequence[Any]
+        self, intree: jax_tree.PyTreeDef, flat_call_args: Sequence[Any]
     ) -> tcache.StageTransformationSpec:
-        """This function computes the key for the `self.compile()` call inside the cache.
+        """Creates the key for the `self.compile()` transition function.
 
-        Contrary to the `JaCeWrapped.lower()` function the call description
-        depends on the concrete values of the arguments and takes the global
-        compile options into consideration.
+        The generated key will not only depend on the arguments that were
+        passed to the translation function, i.e. `compile(compiler_options)`,
+        in addition it will also take the set of currently active set of
+        global options. Furthermore, the key will depend on the concrete values.
         """
-        unflatted_args, unflatted_kwargs = jax_tree.tree_unflatten(args_tree, flat_args)
+        unflatted_args, unflatted_kwargs = jax_tree.tree_unflatten(intree, flat_call_args)
         assert (not len(unflatted_kwargs)) and (len(unflatted_args) == 1)
-        options = self._make_compiler_options(unflatted_args[0])
 
-        # The values are stored inside `call_args` and `args_tree` stores the key.
-        call_args, args_tree = jax_tree.tree_flatten(options)
+        options = self._make_compiler_options(unflatted_args[0])
+        flat_options, optiontree = jax_tree.tree_flatten(options)
         return tcache.StageTransformationSpec(
-            stage_id=id(self), call_args=tuple(call_args), args_tree=args_tree
+            stage_id=id(self), flat_call_args=tuple(flat_options), intree=optiontree
         )
 
     def _make_compiler_options(self, compiler_options: CompilerOptions | None) -> CompilerOptions:
-        """Return the compilation options that should be used for compilation.
-
-        See `JaCeLowered.compile()` to see how to influence them.
-        """
+        """Return the compilation options that should be used for compilation."""
         assert isinstance(compiler_options, dict)
         return get_active_compiler_options() | (compiler_options or {})
 
@@ -291,8 +300,13 @@ def update_active_compiler_options(new_active_options: CompilerOptions) -> Compi
 
     Merges the options passed as `new_active_options` with the currently active
     compiler options. This set is used by `JaCeLowered.compile()` to determine
-    which options should be used for optimization.
+    which options should be used.
     The function will return the set of options that was active before the call.
+
+    To obtain the set of currently active options use `get_active_compiler_options()`.
+
+    Todo:
+        Make a proper context manager.
     """
     previous_active_options = _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
     _JACELOWERED_ACTIVE_COMPILE_OPTIONS.update(new_active_options)
@@ -300,22 +314,19 @@ def update_active_compiler_options(new_active_options: CompilerOptions) -> Compi
 
 
 def get_active_compiler_options() -> CompilerOptions:
-    """Returns the set of currently active compiler options.
-
-    By default the set is initialized with `jace.optimization.DEFAULT_OPTIMIZATIONS`.
-    """
+    """Returns the set of currently active compiler options."""
     return _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
 
 
 class JaCeCompiled:
     """Compiled version of the SDFG.
 
-    This is the last stage of the jit chain. A user should never create a
+    This is the last stage of the JaCe's jit chain. A user should never create a
     `JaCeCompiled` instance, instead `JaCeLowered.compile()` should be used.
 
-    In order to execute the stored computation properly, an input's stride,
-    storage location, shape and datatype has to match the argument that was
-    used for lowering, i.e. was passed to the `lower()` function.
+    Since the strides and storage location of the arguments, that where used
+    to lower the computation are hard coded inside the SDFG, a `JaCeCompiled`
+    object can only be called with compatible arguments.
 
     Args:
         csdfg: The compiled SDFG object.
@@ -352,15 +363,17 @@ def __init__(
     def __call__(self, *args: Any, **kwargs: Any) -> Any:
         """Calls the embedded computation.
 
-        The arguments must be the same as for the wrapped function, but with
-        all static arguments removed.
+
+        Note:
+            Unlike the `lower()` function which takes the same arguments as the
+            original computation, to call this function you have to remove all
+            static arguments.
+            Furthermore, all arguments must have strides and storage locations
+            that is compatible with the ones that were used for lowering.
         """
         flat_in_vals = jax_tree.tree_leaves((args, kwargs))
         assert len(flat_in_vals) == len(self._inp_names), "Static arguments."
-        return dace_helper.run_jax_sdfg(
-            self._csdfg, self._inp_names, self._out_names, flat_in_vals, self._outtree
+        flat_output = dace_helper.run_jax_sdfg(
+            self._csdfg, self._inp_names, self._out_names, flat_in_vals
         )
-
-
-#: Known compilation stages in JaCe.
-Stage = JaCeWrapped | JaCeLowered | JaCeCompiled
+        return jax_tree.tree_unflatten(self._outtree, flat_output)
diff --git a/src/jace/translator/pre_post_translation.py b/src/jace/translator/pre_post_translation.py
index f4361ee..c7db385 100644
--- a/src/jace/translator/pre_post_translation.py
+++ b/src/jace/translator/pre_post_translation.py
@@ -34,10 +34,10 @@ def postprocess_jaxpr_sdfg(
     call_args: Sequence[Any],
     outtree: jax_tree.PyTreeDef,
 ) -> translator.TranslatedJaxprSDFG:
-    """Perform the final post processing steps on the `TranslationContext` _in place_.
+    """Perform the final post processing steps on the `TranslationContext` _in place_ and return a `TranslatedJaxprSDFG` object.
 
-    The function will perform post processing stages on the context in place.
-    However, the function will return a decoupled `TranslatedJaxprSDFG` object.
+    While the function performs the post processing on the context in place,
+    the returned `TranslatedJaxprSDFG` will be decoupled from the input.
 
     Args:
         trans_ctx: The `TranslationContext` obtained from the `translate_jaxpr()` function.
@@ -49,10 +49,7 @@ def postprocess_jaxpr_sdfg(
         - Fixing the scalar input problem on GPU.
         - Fixing stride problem of the input.
     """
-    # Currently we do nothing except finalizing.
     trans_ctx.validate()
-
-    # Handle inputs
     create_input_output_stages(trans_ctx=trans_ctx, call_args=call_args)
 
     return finalize_translation_context(trans_ctx, outtree=outtree, validate=True)
@@ -63,9 +60,14 @@ def create_input_output_stages(
 ) -> None:
     """Creates an input and output state inside the SDFG in place.
 
+    See `_create_input_state()` and `_create_output_state()` for more information.
+
     Args:
         trans_ctx: The translation context that should be modified.
-        call_args: the call arguments that should be used.
+        call_args: The flattened call arguments that should be used.
+
+    Note:
+        The output SDFG will still be canonical.
     """
     _create_input_state(trans_ctx, call_args)
     _create_output_state(trans_ctx)
@@ -75,15 +77,12 @@ def _create_output_state(trans_ctx: translator.TranslationContext) -> None:
     """Creates the output processing stage for the SDFG in place.
 
     The function will create a new terminal state, in which all outputs, denoted
-    in `trans_ctx.out_names` will be written in new SDFG variables. However,
-    instead of scalars the function will generate arrays of length one. This is
-    needed because DaCe can only return arrays at the moment, it is also
-    consistent with what Jax does.
+    in `trans_ctx.out_names`, will be written into new SDFG variables.
+    In case the output variable is a scalar, the output will be replaced by an
+    array of length one.
 
     Notes:
-        All output variables follow the pattern `__jace_output_{i}`, where `i`
-        is a zero based counter. Furthermore, all output variables are transients
-        since `TranslationContext` is supposed to hold canonical SDFGs only.
+        This is consistent with Jax' behaviour.
     """
     assert trans_ctx.inp_names is not None and trans_ctx.out_names is not None
 
@@ -98,16 +97,20 @@ def _create_output_state(trans_ctx: translator.TranslationContext) -> None:
     for i, org_output_name in enumerate(trans_ctx.out_names):
         new_output_name = output_pattern.format(i)
         org_output_desc: dace.data.Data = sdfg.arrays[org_output_name]
+        assert org_output_desc.transient
+        assert (
+            new_output_name not in sdfg.arrays
+        ), f"Final output variable '{new_output_name}' is already present."
 
         if isinstance(org_output_desc, dace.data.Scalar):
             _, new_output_desc = sdfg.add_array(
                 new_output_name,
                 dtype=org_output_desc.dtype,
                 shape=(1,),
-                transient=True,
-                strides=None,  # explicit C stride
+                transient=True,  # Needed for an canonical SDFG
             )
             memlet = dace.Memlet.simple(new_output_name, subset_str="0", other_subset_str="0")
+
         else:
             new_output_desc = org_output_desc.clone()
             sdfg.add_datadesc(new_output_name, new_output_desc)
@@ -128,15 +131,17 @@ def _create_output_state(trans_ctx: translator.TranslationContext) -> None:
 def _create_input_state(trans_ctx: translator.TranslationContext, call_args: Sequence[Any]) -> None:
     """Creates the input processing state for the SDFG in place.
 
-    The function creates a new set of variables that are exposed as inputs, whose
-    names follows the pattern `__jace_input_{i}`, where `i` is a zero based
-    counter. These new variables will have the same strides as the input array.
-    Furthermore, they will have the correct storage locations and scalars in
-    GPU mode will be handled correctly.
+    The function creates a new set of variables that are exposed as inputs.
+    If an input argument is an array, the new variable will have the same
+    strides and storage location the actual input value, that is passed
+    inside `call_args`.
+    If the input is a scalar and GPU mode is activated, the function will add
+    the necessary connections to transfer it to the device.
 
     Args:
         trans_ctx: The translation context that should be modified.
-        call_args: the call arguments that should be used.
+        call_args: The flattened call arguments for which the input
+            state should be specialized.
 
     Todo:
         Handle transfer of scalar input in GPU mode.
@@ -169,10 +174,12 @@ def _create_input_state(trans_ctx: translator.TranslationContext, call_args: Seq
                 shape=org_input_desc.shape,
                 dtype=org_input_desc.dtype,
                 strides=util.get_strides_for_dace(call_arg),
-                transient=True,
-                storage=dace.StorageType.GPU_Global
-                if util.is_on_device(call_arg)
-                else dace.StorageType.CPU_Heap,
+                transient=True,  # For canonical SDFG.
+                storage=(
+                    dace.StorageType.GPU_Global
+                    if util.is_on_device(call_arg)
+                    else dace.StorageType.CPU_Heap
+                ),
             )
             memlet = dace.Memlet.from_array(new_input_name, new_input_desc)
 
@@ -205,7 +212,7 @@ def finalize_translation_context(
 
     Args:
         trans_ctx: The context that should be finalized.
-        outtree: A pytree describing how to restore the output.
+        outtree: A pytree describing how to unflatten the output.
         validate: Call the validate function after the finalizing.
     """
     trans_ctx.validate()
@@ -213,6 +220,8 @@ def finalize_translation_context(
         raise ValueError("Input names are not specified.")
     if trans_ctx.out_names is None:
         raise ValueError("Output names are not specified.")
+    if not (trans_ctx.out_names or trans_ctx.inp_names):
+        raise ValueError("No input nor output.")
 
     # We guarantee decoupling
     tsdfg = translator.TranslatedJaxprSDFG(
@@ -236,7 +245,6 @@ def finalize_translation_context(
 
     if validate:
         tsdfg.validate()
-
     return tsdfg
 
 
@@ -246,22 +254,34 @@ def trace_and_flatten_function(
     trace_call_kwargs: Mapping[str, Any],
     trace_options: Mapping[str, Any],
 ) -> tuple[jax.core.ClosedJaxpr, list[Any], jax_tree.PyTreeDef]:
-    """Traces `fun` and generates the Jaxpr as well as the input and output tree.
+    """Traces `fun` and generates the Jaxpr and compute some related meta data.
 
-    The function will perform the tracing using `trace_options`, which are the
-    same as supported by `jace.jit`. Furthermore the tracing is done with
-    x64 enabled.
+    For tracing the computation `fun` the function uses the `trace_call_args`
+    and `trace_call_kwargs` arguments, both should not be flattened yet.
 
     Returns:
         The function will return a tuple of length three.
-        1) The Jaxpr that was generated by tracing using the supplied arguments
+        1) The Jaxpr that was generated by Jax using the supplied arguments
             and options.
         2) The flattened input values.
         3) A pytree describing the output structure.
 
+    Args:
+        fun: The original Python computation.
+        trace_call_args: The positional arguments that should be used for
+            tracing the computation.
+        trace_call_kwargs: The keyword arguments that should be for tracing
+            the computation.
+        trace_options: The options used for tracing, the same arguments that
+            are supported by `jace.jit`.
+
     Todo:
         - Handle default arguments of `fun`.
         - Handle static arguments.
+        - Turn `trace_options` into a `TypedDict` and sync with `jace.jit`.
+
+    Note:
+        - The tracing is done with x64 enabled.
     """
     if trace_options:
         raise NotImplementedError(
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 524c1a2..c19b488 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -21,14 +21,14 @@
 class TranslatedJaxprSDFG:
     """Encapsulates the translated SDFG together with the metadata that is needed to run it.
 
-    Contrary to the SDFG that is encapsulated inside the `TranslationContext`
+    Contrary to the SDFG that is encapsulated inside an `TranslationContext`
     object, `self` carries a proper SDFG, however:
     - It does not have `__return*` variables, instead all return arguments are
         passed by arguments.
     - All input arguments are passed through arguments mentioned in `inp_names`,
         while the outputs are passed through `out_names`.
     - Only variables listed as in/outputs are non transient.
-    - The order inside `inp_names` and `out_names` is the same as in the translated Jaxpr.
+    - The order inside `inp_names` and `out_names` is the same as in the original Jaxpr.
     - If inputs are also used as outputs they appear in both `inp_names` and `out_names`.
     - Its `arg_names` is set to  `inp_names + out_names`, but arguments that are
         input and outputs are only listed as inputs.
@@ -41,9 +41,14 @@ class TranslatedJaxprSDFG:
 
     Attributes:
         sdfg: The encapsulated SDFG object.
-        inp_names: A list of the SDFG variables that are used as input
-        out_names: A list of the SDFG variables that are used as output.
+        inp_names: Names of the SDFG variables used as inputs.
+        out_names: Names of the SDFG variables used as outputs.
         outtree: A pytree describing how to unflatten the output.
+
+    Todo:
+        After the SDFG is compiled a lot of code looks strange, because there is
+        no container to store the compiled SDFG and the metadata. This class
+        should be extended to address this need.
     """
 
     sdfg: dace.SDFG
diff --git a/src/jace/util/dace_helper.py b/src/jace/util/dace_helper.py
index a85b909..7fef0f2 100644
--- a/src/jace/util/dace_helper.py
+++ b/src/jace/util/dace_helper.py
@@ -17,7 +17,6 @@
 import dace
 from dace import data as dace_data
 from dace.codegen.compiled_sdfg import CompiledSDFG
-from jax import tree_util as jax_tree
 
 from jace import util
 
@@ -25,13 +24,14 @@
 if TYPE_CHECKING:
     from collections.abc import Sequence
 
+    import numpy as np
+
     from jace import translator
-    from jace.util import dace_helper
 
 __all__ = ["CompiledSDFG", "compile_jax_sdfg", "run_jax_sdfg"]
 
 
-def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> dace_helper.CompiledSDFG:
+def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> CompiledSDFG:
     """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object."""
     if any(  # We do not support the DaCe return mechanism
         array_name.startswith("__return")
@@ -60,7 +60,7 @@ def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> dace_helper.Compi
             dace.Config.set("default_build_folder", value=pathlib.Path(".jacecache").resolve())
             sdfg._recompile = True
             sdfg._regenerate_code = True
-            csdfg: dace_helper.CompiledSDFG = sdfg.compile()
+            csdfg: CompiledSDFG = sdfg.compile()
 
     finally:
         sdfg.name = org_sdfg_name
@@ -71,31 +71,42 @@ def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> dace_helper.Compi
 
 
 def run_jax_sdfg(
-    csdfg: dace_helper.CompiledSDFG,
+    csdfg: CompiledSDFG,
     inp_names: Sequence[str],
     out_names: Sequence[str],
     flat_call_args: Sequence[Any],
-    outtree: jax_tree.PyTreeDef,
-) -> tuple[Any, ...] | Any:
+) -> list[np.ndarray]:
     """Run the compiled SDFG.
 
     The function assumes that the SDFG was finalized and then compiled by
-    `compile_jax_sdfg()`. For running the SDFG you also have to pass the input
-    names (`inp_names`) and output names (`out_names`) that were inside the
-    `TranslatedJaxprSDFG` from which `csdfg` was compiled from.
+    `compile_jax_sdfg()`. All arguments except `csdfg` must come from the
+    `TranslatedJaxprSDFG` object that was used to compile SDFG.
+
+    Returns:
+        The function will return a flattened version of the output. To
+        reconstruct the actual return type/value of the original computation
+        the `outtree` that is stored inside the `TranslatedJaxprSDFG` object
+        that was used to compile the SDFG can be used.
 
     Args:
         csdfg: The `CompiledSDFG` object.
-        inp_names: List of names of the input arguments.
-        out_names: List of names of the output arguments.
+        inp_names: Names of the SDFG variables used as inputs.
+        out_names: Names of the SDFG variables used as outputs.
         flat_call_args: Flattened input arguments.
-        outtree: A pytree describing how to unflatten the output.
 
     Notes:
         Currently the strides of the input arguments must match the ones that
-        were used for lowering.
+        were used for lowering the SDFG.
+        In DaCe the return values are allocated on a per `CompiledSDFG` basis.
+        Thus every call to a compiled SDFG will override the value of the last
+        call, in JaCe the memory is allocated on every call. In addition
+        scalars are returned as arrays of length one.
+
+    Todo:
+        - Once we supported GPU change type annotation.
     """
     if len(inp_names) != len(flat_call_args):
+        # Either error or static arguments are not removed.
         raise RuntimeError("Wrong number of arguments.")
 
     sdfg_call_args: dict[str, Any] = {}
@@ -126,6 +137,4 @@ def run_jax_sdfg(
         dace.Config.set("compiler", "allow_view_arguments", value=True)
         csdfg(**sdfg_call_args)
 
-    if not out_names:
-        return None
-    return jax_tree.tree_unflatten(outtree, (sdfg_call_args[out_name] for out_name in out_names))
+    return [sdfg_call_args[out_name] for out_name in out_names]
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 6664a36..99801eb 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -38,24 +38,19 @@
 
 
 # Denotes the stage that follows the current one.
-#  Used by the `NextStage` Mixin.
+#  Used by the `CachingStage` mixin.
 NextStage = TypeVar("NextStage", bound="stages.Stage")
 
 
 class CachingStage(Generic[NextStage]):
     """Annotates a stage whose transition to the next stage is cacheable.
 
-    To make the transition of a stage cacheable, the stage must be derived from
-    this class, and its initialization must call `CachingStage.__init__()`.
-    Furthermore, its transition function must be annotated by the
-    `@cached_transition` decorator.
-
-    A class must implement the `_make_call_description()` to compute an abstract
-    description of the call. This is needed to operate the cache to store the
-    stage transitions.
-
-    Notes:
-        The `__init__()` function must explicitly be called to fully setup `self`.
+    To make a transition cacheable, a stage must:
+    - be derived from this class.
+    - its `__init__()` function must explicitly call `CachingStage.__init__()`.
+    - the transition function must be annotated by `@cached_transition`.
+    - it must implement the `_make_call_description()` to create the key.
+    - the stage object must be immutable.
 
     Todo:
         - Handle eviction from the cache due to collecting of unused predecessor stages.
@@ -68,9 +63,20 @@ def __init__(self) -> None:
 
     @abc.abstractmethod
     def _make_call_description(
-        self: CachingStage, args_tree: jax_tree.PyTreeDef, flat_args: Sequence[Any]
+        self: CachingStage, intree: jax_tree.PyTreeDef, flat_call_args: Sequence[Any]
     ) -> StageTransformationSpec:
-        """Generates the key that is used to store/locate the call in the cache."""
+        """Computes the key used to represent the call.
+
+        This function is used by the `@cached_transition` decorator to perform
+        the lookup inside the cache. It should return a description of the call
+        that is encapsulated inside a `StageTransformationSpec` object, see
+        there for more information.
+
+        Args:
+            intree: Pytree object describing how the input arguments were flattened.
+            flat_call_args: The flattened arguments that were passed to the
+                annotated function.
+        """
         ...
 
 
@@ -85,9 +91,11 @@ def cached_transition(
 ) -> Callable[Concatenate[CachingStage[NextStage], P], NextStage]:
     """Decorator for making the transition function of the stage cacheable.
 
-    In order to work, the stage must be derived from `CachingStage`. For computing
-    the key of a call the function will use the `_make_call_description()`
-    function of the cache.
+    See the description of `CachingStage` for the requirements.
+    The function will use `_make_call_description()` to decide if the call is
+    already known and if so it will return the cached object. If the call is
+    not known it will call the wrapped transition function and record its
+    return value inside the cache, before returning it.
 
     Todo:
         - Implement a way to temporary disable the cache.
@@ -95,13 +103,11 @@ def cached_transition(
 
     @functools.wraps(transition)
     def transition_wrapper(self: CachingStageType, *args: P.args, **kwargs: P.kwargs) -> NextStage:
-        flat_args, args_tree = jax_tree.tree_flatten((args, kwargs))
-        key = self._make_call_description(flat_args=flat_args, args_tree=args_tree)
-        if key in self._cache:
-            return self._cache[key]
-        next_stage = transition(self, *args, **kwargs)
-        self._cache[key] = next_stage
-        return next_stage
+        flat_call_args, intree = jax_tree.tree_flatten((args, kwargs))
+        key = self._make_call_description(flat_call_args=flat_call_args, intree=intree)
+        if key not in self._cache:
+            self._cache[key] = transition(self, *args, **kwargs)
+        return self._cache[key]
 
     return cast(TransitionFunction, transition_wrapper)
 
@@ -129,14 +135,15 @@ class _AbstractCallArgument:
     which is similar to tracers in Jax. This class represents the second way.
     To create an instance you should use `_AbstractCallArgument.from_value()`.
 
-    Its description is limited to scalars and arrays. To describe more complex
-    types, they should be processed by pytrees first.
-
     Attributes:
         shape: In case of an array its shape, in case of a scalar the empty tuple.
         dtype: The DaCe type of the argument.
         strides: The strides of the argument, or `None` if they are unknown or a scalar.
         storage: The storage type where the argument is stored.
+
+    Note:
+        This class is only able to describe scalars and arrays, thus it should
+        only be used after the arguments were flattened.
     """
 
     shape: tuple[int, ...]
@@ -158,7 +165,7 @@ def from_value(cls, value: Any) -> _AbstractCallArgument:
             shape = value.shape
             dtype = util.translate_dtype(value.dtype)
             strides = util.get_strides_for_dace(value)
-            # Is `CPU_Heap` always okay? There would also be `CPU_Pinned`.
+            # TODO(phimuell): `CPU_Heap` vs. `CPU_Pinned`.
             storage = (
                 dace.StorageType.GPU_Global
                 if util.is_on_device(value)
@@ -179,48 +186,47 @@ def from_value(cls, value: Any) -> _AbstractCallArgument:
         raise TypeError(f"Can not make 'an abstract description from '{type(value).__name__}'.")
 
 
-#: This type is the abstract description of a function call.
-#:  It is part of the key used in the cache.
-CallArgsSpec: TypeAlias = tuple[
-    _AbstractCallArgument | Hashable | tuple[str, _AbstractCallArgument | Hashable], ...
-]
+#: Type to describe a single argument either in an abstract or concrete way.
+CallArgsSpec: TypeAlias = tuple[_AbstractCallArgument | Hashable]
 
 
 @dataclasses.dataclass(frozen=True)
 class StageTransformationSpec:
-    """Represents the entire call to a state transformation function of a stage.
+    """Represents an entire call to a state transformation inside the cache.
 
     State transition functions are annotated with `@cached_transition` and their
-    result may be cached. They key to locate them inside the cache is represented
+    result is cached. They key to locate them inside the cache is represented
     by this class and computed by the `CachingStage._make_call_description()`
     function. The actual key is consists of three parts, `stage_id`, `call_args`
-    and `args_tree`.
+    and `intree`, see below for more.
 
     Args:
         stage_id: Origin of the call, for which the id of the stage object should
             be used.
-        call_args: Flat representation of the arguments of the call. Each element
+        flat_call_args: Flat representation of the arguments of the call. Each element
             describes a single argument. To describe an argument there are two ways:
             - Abstract description: In this way, the actual value of the argument
-                is irrelevant, only the structure of them are important, similar
-                to the tracers used in Jax.
-            - Concrete description: Here one caches on the actual value of the
-                argument. The only requirement is that they can be hashed.
-        args_tree: A pytree structure that describes how the input was flatten.
-                In Jax the hash of a pytree, takes its structure into account.
+                is irrelevant, its structure is important, similar to the tracers
+                used in Jax. To represent it, use `_AbstractCallArgument`.
+            - Concrete description: Here the actual value of the argument is
+                considered, this is similar to how static arguments in Jax works.
+                The only requirement is that they can be hashed.
+        intree: A pytree structure that describes how the input was flatten.
     """
 
     stage_id: int
-    call_args: CallArgsSpec
-    args_tree: jax_tree.PyTreeDef
+    flat_call_args: CallArgsSpec
+    intree: jax_tree.PyTreeDef
 
 
-# Denotes the stage that is stored inside the cache.
+#: Denotes the stage that is stored inside the cache.
 StageType = TypeVar("StageType", bound="stages.Stage")
 
 
 class StageCache(Generic[StageType]):
-    """Simple LRU cache to cache the results of the stage transition function.
+    """Simple LRU cache to store the results of the stage transition function.
+
+    There is one cache per stage (type) and not per instance.
 
     Args:
         capacity: The size of the cache, defaults to 256.
@@ -276,7 +282,7 @@ def capacity(self) -> int:
         return self._capacity
 
     def front(self) -> tuple[StageTransformationSpec, StageType]:
-        """Returns the front, i.e. newest entry in the cache."""
+        """Returns the front of the cache, i.e. its newest entry."""
         return next(reversed(self._memory.items()))
 
     def __repr__(self) -> str:

From 9b40b272d84ee2c80e87c76a777b859e03ef2395 Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 12 Jun 2024 11:42:56 +0200
Subject: [PATCH 348/458] Fine tune rule ignores

---
 pyproject.toml | 10 ++++++----
 1 file changed, 6 insertions(+), 4 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index 5026706..8a8f63d 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -121,7 +121,7 @@ extend-select = [
   "D213",  # multi-line-summary-second-line (off by default in pydocstyle "google' convention)
   "PT",  # flake8-pytest-style
   "TD",  # flake8-todo
-  "UP",  # pyupgrade       # TODO: in evaluation
+  "UP",  # pyupgrade       # TODO(egparedes): in evaluation
   "ARG",  # flake8-unused-arguments
   "ERA",  # eradicate
   "FLY",  # flynt
@@ -129,13 +129,13 @@ extend-select = [
   "PGH",  # pygrep-hooks
   "PIE",  # flake8-pie
   "PTH",  # flake8-use-pathlib
-  "RET",  # flake8-return   # TODO: in evaluation
+  "RET",  # flake8-return   # TODO(egparedes): in evaluation
   "RUF",  # Ruff-specific
-  "SIM",  # flake8-simplify # TODO: in evaluation
+  "SIM",  # flake8-simplify # TODO(egparedes): in evaluation
   "SLOT",  # flake8-slots
   "T10",  # flake8-debugger
   "T20",  # flake8-print
-  "TCH",  # flake8-type-checking  # TODO: in evaluation
+  "TCH",  # flake8-type-checking  # TODO(egparedes): in evaluation
   "NPY",  # NumPy specific rules
 ]
 ignore = [
@@ -143,6 +143,7 @@ ignore = [
   "D105",  # undocumented-magic-method
   "D107",  # [undocumented-public-init]
   "D212",  # [multi-line-summary-first-line]
+  "D402",  # [no-signature]
   "E501",  # [line-too-long]
   "TCH003",  # [typing-only-standard-library-import]
   "TD003",  # [missing-todo-link]
@@ -198,6 +199,7 @@ max-complexity = 12
 ]
 "tests/**" = [
   "D",  # pydocstyle
+  "N",  # TODO(egparedes): remove ignore as soon as all tests are properly named
   "T10",  # flake8-debugger
   "T20",  # flake8-print
 ]

From 894b10c81b9a968f33994ed150dbf8470e82523e Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 12 Jun 2024 12:01:38 +0200
Subject: [PATCH 349/458] More fixes and additions to ruff config

---
 pyproject.toml | 10 +++++++---
 1 file changed, 7 insertions(+), 3 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index 8a8f63d..35deb56 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -126,8 +126,11 @@ extend-select = [
   "ERA",  # eradicate
   "FLY",  # flynt
   "ICN",  # flake8-import-conventions
+  "NPY",  # NumPy specific rules
+  "PERF",  # Perflint
   "PGH",  # pygrep-hooks
   "PIE",  # flake8-pie
+  "PL",  # pylint
   "PTH",  # flake8-use-pathlib
   "RET",  # flake8-return   # TODO(egparedes): in evaluation
   "RUF",  # Ruff-specific
@@ -136,11 +139,11 @@ extend-select = [
   "T10",  # flake8-debugger
   "T20",  # flake8-print
   "TCH",  # flake8-type-checking  # TODO(egparedes): in evaluation
-  "NPY",  # NumPy specific rules
+  "TRY",  # tryceratops
 ]
 ignore = [
   "B905",  # [zip-without-explicit-strict]
-  "D105",  # undocumented-magic-method
+  "D105",  # [undocumented-magic-method]
   "D107",  # [undocumented-public-init]
   "D212",  # [multi-line-summary-first-line]
   "D402",  # [no-signature]
@@ -187,7 +190,7 @@ tests = [
 max-complexity = 12
 
 [tool.ruff.lint.per-file-ignores]
-"!tests/**.py" = ["PT"]  # Ignore `flake8-pytest-style` outside `tests/`
+"!tests/**.py" = ["PT"]  # Ignore flake8-pytest-style outside 'tests/'
 "docs/**" = [
   "D",  # pydocstyle
   "T10",  # flake8-debugger
@@ -200,6 +203,7 @@ max-complexity = 12
 "tests/**" = [
   "D",  # pydocstyle
   "N",  # TODO(egparedes): remove ignore as soon as all tests are properly named
+  "PLR2004",  # [magic-value-comparison]
   "T10",  # flake8-debugger
   "T20",  # flake8-print
 ]

From 1928b9598c11655b282795b41d41ece292b43514 Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 12 Jun 2024 12:10:44 +0200
Subject: [PATCH 350/458] Add coverage config from Philip

---
 pyproject.toml | 32 ++++++++++++++++++++++++++------
 1 file changed, 26 insertions(+), 6 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index 35deb56..477ef93 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -48,12 +48,32 @@ Changelog = "https://github.com/GridTools/JaCe/releases"
 Discussions = "https://github.com/GridTools/JaCe/discussions"
 Homepage = "https://github.com/GridTools/JaCe"
 
+# -- coverage --
 [tool.coverage]
-report.exclude_also = [
+
+[tool.coverage.html]
+show_contexts = true
+
+[tool.coverage.report]
+exclude_also = [
   '\.\.\.',
+  'if TYPE_CHECKING:',
   'if typing.TYPE_CHECKING:',
+  'def __repr__',
+  '@overload',
+  'raise AssertionError',
+  'raise NotImplementedError',
+  'if 0:',
+  'if __name__ == .__main__.:',
+  '@(abc\\.)?abstractmethod',
+  '@(abc\\.)?abstract',
+  'class .*\bProtocol\):',
 ]
-run.source = ["jace"]
+
+[tool.coverage.run]
+branch = true
+dynamic_context = "test_function"
+source = ["jace"]
 
 # -- mypy  --
 [tool.mypy]
@@ -121,7 +141,7 @@ extend-select = [
   "D213",  # multi-line-summary-second-line (off by default in pydocstyle "google' convention)
   "PT",  # flake8-pytest-style
   "TD",  # flake8-todo
-  "UP",  # pyupgrade       # TODO(egparedes): in evaluation
+  "UP",  # pyupgrade
   "ARG",  # flake8-unused-arguments
   "ERA",  # eradicate
   "FLY",  # flynt
@@ -132,13 +152,13 @@ extend-select = [
   "PIE",  # flake8-pie
   "PL",  # pylint
   "PTH",  # flake8-use-pathlib
-  "RET",  # flake8-return   # TODO(egparedes): in evaluation
+  "RET",  # flake8-return
   "RUF",  # Ruff-specific
-  "SIM",  # flake8-simplify # TODO(egparedes): in evaluation
+  "SIM",  # flake8-simplify
   "SLOT",  # flake8-slots
   "T10",  # flake8-debugger
   "T20",  # flake8-print
-  "TCH",  # flake8-type-checking  # TODO(egparedes): in evaluation
+  "TCH",  # flake8-type-checking
   "TRY",  # tryceratops
 ]
 ignore = [

From 9909f6dbeed5dad4482b898faaf02b16f15e0f43 Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 12 Jun 2024 13:31:43 +0200
Subject: [PATCH 351/458] More fine tuning of ruff and pre-commit

---
 .pre-commit-config.yaml | 2 --
 pyproject.toml          | 4 ++++
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 10c71ef..cd2eb8f 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -52,8 +52,6 @@ repos:
   - id: debug-statements
   - id: end-of-file-fixer
   - id: mixed-line-ending
-  - id: name-tests-test
-    args: [--pytest-test-first]
   - id: requirements-txt-fixer
   - id: trailing-whitespace
 
diff --git a/pyproject.toml b/pyproject.toml
index 477ef93..d0e62ab 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -170,6 +170,7 @@ ignore = [
   "E501",  # [line-too-long]
   "TCH003",  # [typing-only-standard-library-import]
   "TD003",  # [missing-todo-link]
+  "TRY003",  # [raise-vanilla-args]  # TODO(egparedes): reevaluate if it should be activated
   "UP038",  # [non-pep604-isinstance]
 ]
 task-tags = ["TODO"]
@@ -235,3 +236,6 @@ max-doc-length = 88
 [tool.ruff.lint.pydocstyle]
 convention = "google"
 ignore-decorators = ["typing.overload"]
+
+[tool.ruff.lint.pylint]
+max-positional-args = 6

From 5f24405bb2d5b20a11b2b00ff5783df19e138c84 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 12 Jun 2024 13:33:01 +0200
Subject: [PATCH 352/458] Removed a convenience function.

---
 src/jace/translator/__init__.py             |  2 --
 src/jace/translator/primitive_translator.py | 18 +---------
 tests/test_subtranslator_helper.py          | 38 ++++-----------------
 3 files changed, 8 insertions(+), 50 deletions(-)

diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 7c2a1c4..a045f0c 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -20,7 +20,6 @@
     get_registered_primitive_translators,
     make_primitive_translator,
     register_primitive_translator,
-    set_active_primitive_translators_to,
 )
 from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
@@ -34,5 +33,4 @@
     "get_registered_primitive_translators",
     "make_primitive_translator",
     "register_primitive_translator",
-    "set_active_primitive_translators_to",
 ]
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index ca2c2fe..842d6d6 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -17,7 +17,7 @@
 
 
 if TYPE_CHECKING:
-    from collections.abc import Callable, Mapping, MutableMapping, Sequence
+    from collections.abc import Callable, Sequence
 
     import dace
     from jax import core as jax_core
@@ -217,19 +217,3 @@ def get_registered_primitive_translators() -> dict[str, translator.PrimitiveTran
     object is decoupled from the registry.
     """
     return _PRIMITIVE_TRANSLATORS_REGISTRY.copy()
-
-
-def set_active_primitive_translators_to(
-    new_translators: Mapping[str, translator.PrimitiveTranslator],
-) -> MutableMapping[str, translator.PrimitiveTranslator]:
-    """Exchange the global translator registry state of JaCe with `new_translators`.
-
-    The function will return the state of the global translator registry prior
-    to this call. Any changes to `new_translators` after calling this function
-    will have no effect on the global translator registry and vice versa.
-    """
-    global _PRIMITIVE_TRANSLATORS_REGISTRY
-    assert all(getattr(trans, "primitive", prim) for prim, trans in new_translators.items())
-    previous_translators = _PRIMITIVE_TRANSLATORS_REGISTRY
-    _PRIMITIVE_TRANSLATORS_REGISTRY = dict(new_translators)
-    return previous_translators
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index c6dd33b..e94408e 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -21,24 +21,26 @@
     get_registered_primitive_translators,
     make_primitive_translator,
     register_primitive_translator,
-    set_active_primitive_translators_to,
 )
 
 
 @pytest.fixture(autouse=True)
 def _conserve_builtin_translators():
     """Restores the set of registered subtranslators after a test."""
-    initial_translators = get_registered_primitive_translators()
+    initial_translators = translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY.copy()
     yield
-    set_active_primitive_translators_to(initial_translators)
+    translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY.clear()
+    translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY.update(initial_translators)
 
 
 @pytest.fixture()
 def no_builtin_translators():  # noqa: PT004  # This is how you should do it: https://docs.pytest.org/en/7.1.x/how-to/fixtures.html#use-fixtures-in-classes-and-modules-with-usefixtures
     """This fixture can be used if the test does not want any builtin translators."""
-    initial_translators = translator.set_active_primitive_translators_to({})
+    initial_translators = translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY.copy()
+    translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY.clear()
     yield
-    translator.set_active_primitive_translators_to(initial_translators)
+    translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY.clear()
+    translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY.update(initial_translators)
 
 
 # These are definitions of some Subtranslators that can be used to test things.
@@ -117,32 +119,6 @@ def test_subtranslatior_managing_isolation():
     assert get_registered_primitive_translators()["add"] is org_add_prim
 
 
-def test_subtranslatior_managing_swap():
-    """Tests the `set_active_primitive_translators_to()` functionality."""
-
-    # Allows to compare the structure of dicts.
-    def same_structure(d1: dict, d2: dict) -> bool:
-        return d1.keys() == d2.keys() and all(id(d2[k]) == id(d1[k]) for k in d1)
-
-    initial_primitives = get_registered_primitive_translators()
-    assert "add" in initial_primitives
-
-    # Now mutate the dict a little bit, shallow copy it first.
-    mutated_primitives = initial_primitives.copy()
-    mutated_primitives["add"] = fake_add_translator
-    assert mutated_primitives.keys() == initial_primitives.keys()
-    assert same_structure(initial_primitives, get_registered_primitive_translators())
-    assert not same_structure(mutated_primitives, initial_primitives)
-    assert not same_structure(mutated_primitives, get_registered_primitive_translators())
-
-    # Now change the initial one with the mutated one.
-    #  The object is copied but should still have the same structure.
-    old_active = set_active_primitive_translators_to(mutated_primitives)
-    assert mutated_primitives is not translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
-    assert same_structure(old_active, initial_primitives)
-    assert same_structure(mutated_primitives, get_registered_primitive_translators())
-
-
 @pytest.mark.usefixtures("no_builtin_translators")
 def test_subtranslatior_managing_callable_annotation():
     """Test if `make_primitive_translator()` works."""

From cc7f6495b5d895c244da5c5d92d40fdf7fec6b4b Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 12 Jun 2024 13:43:58 +0200
Subject: [PATCH 353/458] Fix wrong place to add ruff configuration

---
 .pre-commit-config.yaml | 2 +-
 pyproject.toml          | 1 +
 2 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index cd2eb8f..586cb6f 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -59,7 +59,7 @@ repos:
   rev: v0.4.8
   hooks:
   - id: ruff
-    args: [--fix, --show-fixes, --preview]
+    args: [--fix, --show-fixes]
   - id: ruff-format
 
 - repo: https://github.com/pre-commit/mirrors-mypy
diff --git a/pyproject.toml b/pyproject.toml
index d0e62ab..d186132 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -119,6 +119,7 @@ xfail_strict = true
 # -- ruff --
 [tool.ruff]
 line-length = 100
+preview = true
 respect-gitignore = true
 show-fixes = true
 src = ["src"]

From 03d6d081ca814f56298170997ddef5063c8f4745 Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 12 Jun 2024 13:42:20 +0200
Subject: [PATCH 354/458] Updates from new config

---
 .pre-commit-config.yaml |  51 ++++++-------
 pyproject.toml          | 156 ++++++++++++++++++++++++++++++----------
 2 files changed, 147 insertions(+), 60 deletions(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 59402ca..59057f5 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -2,41 +2,47 @@ default_language_version:
   python: python3.10
 
 ci:
-  autoupdate_commit_msg: "chore: update pre-commit hooks"
-  autofix_commit_msg: "style: pre-commit fixes"
+  autoupdate_commit_msg: 'chore: update pre-commit hooks'
+  autofix_commit_msg: 'style: pre-commit fixes'
 
 repos:
 - repo: https://github.com/macisamuele/language-formatters-pre-commit-hooks
-  rev: v2.6.0
+  rev: v2.13.0
   hooks:
   - id: pretty-format-ini
     args: [--autofix]
   - id: pretty-format-toml
-    args: [--autofix]
+    args: [--autofix, --indent, '2', --trailing-commas]
     additional_dependencies:
     - setuptools>=69.2.0
   - id: pretty-format-yaml
-    args: [--autofix, --preserve-quotes, --indent, "2"]
+    args: [--autofix, --indent, '2', --line-width, '100']
     additional_dependencies:
     - setuptools>=69.2.0
 
-- repo: https://github.com/pre-commit/mirrors-prettier
-  rev: "v3.1.0"
+- repo: https://github.com/executablebooks/mdformat
+  rev: 0.7.17
   hooks:
-  - id: prettier
-    types_or: [markdown, html, css, scss, javascript, json]
-    args: [--prose-wrap=preserve]
+  - id: mdformat
+    args: [--number]
+    additional_dependencies:
+    - mdformat-gfm
+    - mdformat-black
 
 - repo: https://github.com/Lucas-C/pre-commit-hooks
-  rev: v1.1.9
+  rev: v1.5.5
   hooks:
   - id: insert-license
-    exclude: ^\..*$
+    exclude: |
+      (?x)^(
+          ^\..*$ |
+          noxfile.py
+      )$
     types: [python]
-    args: [--comment-style, "|#|", --license-filepath, ./LICENSE_HEADER.txt]
+    args: [--comment-style, '|#|', --license-filepath, ./LICENSE_HEADER.txt]
 
 - repo: https://github.com/pre-commit/pre-commit-hooks
-  rev: "v4.6.0"
+  rev: v4.6.0
   hooks:
   - id: check-added-large-files
   - id: check-case-conflict
@@ -46,15 +52,13 @@ repos:
   - id: debug-statements
   - id: end-of-file-fixer
   - id: mixed-line-ending
-  - id: name-tests-test
-    args: ["--pytest-test-first"]
   - id: trailing-whitespace
 
 - repo: https://github.com/astral-sh/ruff-pre-commit
   rev: v0.4.8
   hooks:
   - id: ruff
-    args: ["--fix", "--show-fixes", "--preview"]
+    args: [--fix, --show-fixes]
   - id: ruff-format
 
 - repo: https://github.com/pre-commit/mirrors-mypy
@@ -67,15 +71,14 @@ repos:
     - dace==0.15.1
     - jax[cpu]==0.4.28
     - numpy==1.26.4
-    - pytest==8.2.2
-    - typing-extensions==4.12.2
+    - pytest==8.2.1
 - repo: https://github.com/codespell-project/codespell
-  rev: "v2.2.6"
+  rev: v2.3.0
   hooks:
   - id: codespell
 
 - repo: https://github.com/shellcheck-py/shellcheck-py
-  rev: "v0.10.0.1"
+  rev: v0.10.0.1
   hooks:
   - id: shellcheck
 
@@ -88,13 +91,13 @@ repos:
     exclude: .pre-commit-config.yaml
 
 - repo: https://github.com/abravalheri/validate-pyproject
-  rev: "v0.16"
+  rev: v0.18
   hooks:
   - id: validate-pyproject
-    additional_dependencies: ["validate-pyproject-schema-store[all]"]
+    additional_dependencies: ['validate-pyproject-schema-store[all]']
 
 - repo: https://github.com/python-jsonschema/check-jsonschema
-  rev: "0.28.1"
+  rev: 0.28.5
   hooks:
   - id: check-dependabot
   - id: check-github-workflows
diff --git a/pyproject.toml b/pyproject.toml
index 175a679..d186132 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,9 +1,13 @@
 [build-system]
 build-backend = "setuptools.build_meta"
-requires = ["setuptools>=61"]
+requires = [
+  "setuptools>=61",
+]
 
 [project]
-authors = [{name = "ETH Zurich", email = "gridtools@cscs.ch"}]
+authors = [
+  {name = "ETH Zurich", email = "gridtools@cscs.ch"},
+]
 classifiers = [
   "Development Status :: 1 - Planning",
   "Intended Audience :: Science/Research",
@@ -17,9 +21,13 @@ classifiers = [
   "Programming Language :: Python :: 3.11",
   "Programming Language :: Python :: 3.12",
   "Topic :: Scientific/Engineering",
-  "Typing :: Typed"
+  "Typing :: Typed",
+]
+dependencies = [
+  "dace>=0.15",
+  "jax[cpu]>=0.4.24",
+  "numpy>=1.26.0",
 ]
-dependencies = ["dace>=0.15", "jax[cpu]>=0.4.24", "numpy>=1.26.0"]
 description = "JAX jit using DaCe (Data Centric Parallel Programming)"
 name = "JaCe"
 readme = "README.md"
@@ -28,7 +36,11 @@ version = "0.1.0"
 license.file = "LICENSE"
 
 [project.optional-dependencies]
-cuda12 = ["cupy-cuda12x>=12.1.0", "jax[cuda12]>=0.4.24", "optuna>=3.4.0"]
+cuda12 = [
+  "cupy-cuda12x>=12.1.0",
+  "jax[cuda12]>=0.4.24",
+  "optuna>=3.4.0",
+]
 
 [project.urls]
 "Bug Tracker" = "https://github.com/GridTools/JaCe/issues"
@@ -36,9 +48,32 @@ Changelog = "https://github.com/GridTools/JaCe/releases"
 Discussions = "https://github.com/GridTools/JaCe/discussions"
 Homepage = "https://github.com/GridTools/JaCe"
 
+# -- coverage --
 [tool.coverage]
-report.exclude_also = ['\.\.\.', 'if typing.TYPE_CHECKING:']
-run.source = ["jace"]
+
+[tool.coverage.html]
+show_contexts = true
+
+[tool.coverage.report]
+exclude_also = [
+  '\.\.\.',
+  'if TYPE_CHECKING:',
+  'if typing.TYPE_CHECKING:',
+  'def __repr__',
+  '@overload',
+  'raise AssertionError',
+  'raise NotImplementedError',
+  'if 0:',
+  'if __name__ == .__main__.:',
+  '@(abc\\.)?abstractmethod',
+  '@(abc\\.)?abstract',
+  'class .*\bProtocol\):',
+]
+
+[tool.coverage.run]
+branch = true
+dynamic_context = "test_function"
+source = ["jace"]
 
 # -- mypy  --
 [tool.mypy]
@@ -63,7 +98,12 @@ warn_unused_ignores = true
 disallow_incomplete_defs = false
 disallow_untyped_defs = false
 ignore_missing_imports = true
-module = ["tests.*", "dace.*", "jax.*", "jaxlib.*"]
+module = [
+  "tests.*",
+  "dace.*",
+  "jax.*",
+  "jaxlib.*",
+]
 
 # -- pytest  --
 [tool.pytest]
@@ -79,6 +119,7 @@ xfail_strict = true
 # -- ruff --
 [tool.ruff]
 line-length = 100
+preview = true
 respect-gitignore = true
 show-fixes = true
 src = ["src"]
@@ -87,72 +128,115 @@ src = ["src"]
 docstring-code-format = true
 
 [tool.ruff.lint]
+extend-safe-fixes = ["D", "TCH"]
 extend-select = [
   "A",  # flake8-builtins
   "B",  # flake8-bugbear
   "I",  # isort
   "G",  # flake8-logging-format
+  "N",  # pep8-naming
   "W",  # pycodestyle-warning
   "C4",  # flake8-comprehensions
   "C90",  # mccabe
+  "D",  # pydocstyle
+  "D213",  # multi-line-summary-second-line (off by default in pydocstyle "google' convention)
   "PT",  # flake8-pytest-style
-  "UP",  # pyupgrade       # TODO: in evaluation
+  "TD",  # flake8-todo
+  "UP",  # pyupgrade
   "ARG",  # flake8-unused-arguments
   "ERA",  # eradicate
+  "FLY",  # flynt
   "ICN",  # flake8-import-conventions
+  "NPY",  # NumPy specific rules
+  "PERF",  # Perflint
   "PGH",  # pygrep-hooks
   "PIE",  # flake8-pie
+  "PL",  # pylint
   "PTH",  # flake8-use-pathlib
-  "RET",  # flake8-return   # TODO: in evaluation
+  "RET",  # flake8-return
   "RUF",  # Ruff-specific
-  "SIM",  # flake8-simplify # TODO: in evaluation
+  "SIM",  # flake8-simplify
+  "SLOT",  # flake8-slots
   "T10",  # flake8-debugger
-  "T20",  # flake8-print    # TODO: in evaluation
-  "TCH",  # flake8-type-checking  # TODO: in evaluation
-  "NPY"  # NumPy specific rules
+  "T20",  # flake8-print
+  "TCH",  # flake8-type-checking
+  "TRY",  # tryceratops
 ]
 ignore = [
-  'B905',  # [zip-without-explicit-strict]
-  'E501',  # [line-too-long]
-  'TCH003',  # [typing-only-standard-library-import]
-  'UP038'  # [non-pep604-isinstance]
+  "B905",  # [zip-without-explicit-strict]
+  "D105",  # [undocumented-magic-method]
+  "D107",  # [undocumented-public-init]
+  "D212",  # [multi-line-summary-first-line]
+  "D402",  # [no-signature]
+  "E501",  # [line-too-long]
+  "TCH003",  # [typing-only-standard-library-import]
+  "TD003",  # [missing-todo-link]
+  "TRY003",  # [raise-vanilla-args]  # TODO(egparedes): reevaluate if it should be activated
+  "UP038",  # [non-pep604-isinstance]
 ]
+task-tags = ["TODO"]
 # ignore-init-module-imports = true  # deprecated in preview mode
 unfixable = []
 
 [tool.ruff.lint.isort]
 combine-as-imports = true
-known-first-party = ['jace']
+known-first-party = ["jace"]
 known-third-party = [
-  'cupy',
-  'dace',
-  'jax',
-  'numpy',
-  'pytest',
-  'typing_extensions'
+  "cupy",
+  "dace",
+  "jax",
+  "numpy",
+  "pytest",
+  "typing_extensions",
 ]
 lines-after-imports = 2
 order-by-type = true
 required-imports = ["from __future__ import annotations"]
 section-order = [
-  'future',
-  'standard-library',
-  'third-party',
-  'first-party',
-  'tests',
-  'local-folder'
+  "future",
+  "standard-library",
+  "third-party",
+  "first-party",
+  "tests",
+  "local-folder",
 ]
 
 [tool.ruff.lint.isort.sections]
-tests = ["tests", "unit_tests", "integration_tests"]
+tests = [
+  "tests",
+  "unit_tests",
+  "integration_tests",
+]
 
 [tool.ruff.lint.mccabe]
 max-complexity = 12
 
 [tool.ruff.lint.per-file-ignores]
-"!tests/**.py" = ["PT"]  # Ignore `flake8-pytest-style` everywhere except in `tests/`
-"noxfile.py" = ["T20"]  # Ignore `flake8-print`
-"tests/**" = ["T10", "T20"]  # Ignore `flake8-debugger` and `flake8-print`
+"!tests/**.py" = ["PT"]  # Ignore flake8-pytest-style outside 'tests/'
+"docs/**" = [
+  "D",  # pydocstyle
+  "T10",  # flake8-debugger
+  "T20",  # flake8-print
+]
+"noxfile.py" = [
+  "D",  # pydocstyle
+  "T20",  # flake8-print
+]
+"tests/**" = [
+  "D",  # pydocstyle
+  "N",  # TODO(egparedes): remove ignore as soon as all tests are properly named
+  "PLR2004",  # [magic-value-comparison]
+  "T10",  # flake8-debugger
+  "T20",  # flake8-print
+]
 
 [tool.ruff.lint.pycodestyle]
-max-doc-length = 85
+ignore-overlong-task-comments = true
+max-doc-length = 88
+
+[tool.ruff.lint.pydocstyle]
+convention = "google"
+ignore-decorators = ["typing.overload"]
+
+[tool.ruff.lint.pylint]
+max-positional-args = 6

From 0da47fa74751af54b736f987c73609e509e019be Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 12 Jun 2024 14:20:17 +0200
Subject: [PATCH 355/458] Fixes

---
 CODING_GUIDELINES.md | 2 +-
 pyproject.toml       | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/CODING_GUIDELINES.md b/CODING_GUIDELINES.md
index 5fd7e00..3e7fabb 100644
--- a/CODING_GUIDELINES.md
+++ b/CODING_GUIDELINES.md
@@ -29,7 +29,7 @@ We deviate from the [Google Python Style Guide][google-style-guide] only in the
 
 - According to subsection [_3.19.12 Imports For Typing_](https://google.github.io/styleguide/pyguide.html#31912-imports-for-typing), symbols from `typing` and `collections.abc` modules used in type annotations _"can be imported directly to keep common annotations concise and match standard typing practices"_. Following the same spirit, we allow symbols to be imported directly from third-party or internal modules when they only contain a collection of frequently used typying definitions.
 
-### Language usage recommendations
+### Python usage recommendations
 
 - `pass` vs `...` (`Ellipsis`)
 
diff --git a/pyproject.toml b/pyproject.toml
index d186132..0bcfa20 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -239,4 +239,4 @@ convention = "google"
 ignore-decorators = ["typing.overload"]
 
 [tool.ruff.lint.pylint]
-max-positional-args = 6
+max-args = 6
\ No newline at end of file

From b7a166f4a08ccf0b7e5ce1393912cf391bfe5db4 Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 12 Jun 2024 14:42:09 +0200
Subject: [PATCH 356/458] Back to defaults

---
 pyproject.toml | 1 -
 1 file changed, 1 deletion(-)

diff --git a/pyproject.toml b/pyproject.toml
index 0bcfa20..a12c642 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -174,7 +174,6 @@ ignore = [
   "TRY003",  # [raise-vanilla-args]  # TODO(egparedes): reevaluate if it should be activated
   "UP038",  # [non-pep604-isinstance]
 ]
-task-tags = ["TODO"]
 # ignore-init-module-imports = true  # deprecated in preview mode
 unfixable = []
 

From 367e7b6f4b96ddb75d459f2cdb7f65f1c9c6b3cf Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 12 Jun 2024 15:01:30 +0200
Subject: [PATCH 357/458] Fix format

---
 pyproject.toml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pyproject.toml b/pyproject.toml
index a12c642..37c0d3d 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -238,4 +238,4 @@ convention = "google"
 ignore-decorators = ["typing.overload"]
 
 [tool.ruff.lint.pylint]
-max-args = 6
\ No newline at end of file
+max-args = 6

From 1e825c3af4b928b240350086b234e461a301907a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 12 Jun 2024 15:07:35 +0200
Subject: [PATCH 358/458] Applied some of enriques new configuration.

---
 .github/dependabot.yml                        |   8 +-
 .github/workflows/ci.yml                      |   4 +-
 .pre-commit-config.yaml                       |  53 +++---
 .readthedocs.yaml                             |   2 +-
 CHANGELOG.md                                  |   2 +-
 CODING_GUIDELINES.md                          |  42 +++--
 CONTRIBUTING.md                               |   2 +-
 README.md                                     |  23 +--
 ROADMAP.md                                    |  30 ++--
 pyproject.toml                                | 160 +++++++++++++-----
 src/jace/api.py                               |  12 +-
 src/jace/optimization.py                      |  11 +-
 src/jace/stages.py                            |  73 ++++----
 src/jace/translator/__init__.py               |   3 +-
 .../translator/jaxpr_translator_builder.py    | 137 ++++++++-------
 src/jace/translator/post_translation.py       |  16 +-
 src/jace/translator/primitive_translator.py   |  23 +--
 .../primitive_translators/alu_translator.py   |  14 +-
 src/jace/translator/translated_jaxpr_sdfg.py  |   9 +-
 src/jace/util/__init__.py                     |   1 -
 src/jace/util/dace_helper.py                  |  22 +--
 src/jace/util/definitions.py                  |   6 +-
 src/jace/util/jax_helper.py                   |  31 ++--
 src/jace/util/traits.py                       |  11 +-
 src/jace/util/translation_cache.py            |  25 ++-
 tests/test_caching.py                         |  11 +-
 tests/test_decorator.py                       |   2 +-
 tests/test_jax_api.py                         |   5 +-
 tests/test_jaxpr_translator_builder.py        |  30 ++--
 tests/test_misc.py                            |   6 +-
 tests/test_subtranslator_helper.py            |   3 +-
 31 files changed, 466 insertions(+), 311 deletions(-)

diff --git a/.github/dependabot.yml b/.github/dependabot.yml
index 60f5aca..6fbe4e9 100644
--- a/.github/dependabot.yml
+++ b/.github/dependabot.yml
@@ -1,11 +1,11 @@
 version: 2
 updates:
   # Maintain dependencies for GitHub Actions
-- package-ecosystem: "github-actions"
-  directory: "/"
+- package-ecosystem: github-actions
+  directory: /
   schedule:
-    interval: "weekly"
+    interval: weekly
   groups:
     actions:
       patterns:
-      - "*"
+      - '*'
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 86a32f3..b065ed7 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -24,7 +24,7 @@ jobs:
         fetch-depth: 0
     - uses: actions/setup-python@v5
       with:
-        python-version: "3.x"
+        python-version: 3.x
     - uses: pre-commit/action@v3.0.1
       with:
         extra_args: --hook-stage manual --all-files
@@ -36,7 +36,7 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        python-version: ["3.10", "3.12"]
+        python-version: ['3.10', '3.12']
         runs-on: [ubuntu-latest, macos-latest, windows-latest]
 
     steps:
diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 6ae432a..586cb6f 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -1,39 +1,48 @@
+default_language_version:
+  python: python3.10
+
 ci:
-  autoupdate_commit_msg: "chore: update pre-commit hooks"
-  autofix_commit_msg: "style: pre-commit fixes"
+  autoupdate_commit_msg: 'chore: update pre-commit hooks'
+  autofix_commit_msg: 'style: pre-commit fixes'
 
 repos:
 - repo: https://github.com/macisamuele/language-formatters-pre-commit-hooks
-  rev: v2.6.0
+  rev: v2.13.0
   hooks:
   - id: pretty-format-ini
     args: [--autofix]
   - id: pretty-format-toml
-    args: [--autofix]
+    args: [--autofix, --indent, '2', --trailing-commas]
     additional_dependencies:
     - setuptools>=69.2.0
   - id: pretty-format-yaml
-    args: [--autofix, --preserve-quotes, --indent, "2"]
+    args: [--autofix, --indent, '2', --line-width, '100']
     additional_dependencies:
     - setuptools>=69.2.0
 
-- repo: https://github.com/pre-commit/mirrors-prettier
-  rev: "v3.1.0"
+- repo: https://github.com/executablebooks/mdformat
+  rev: 0.7.17
   hooks:
-  - id: prettier
-    types_or: [markdown, html, css, scss, javascript, json]
-    args: [--prose-wrap=preserve]
+  - id: mdformat
+    args: [--number]
+    additional_dependencies:
+    - mdformat-gfm
+    - mdformat-black
 
 - repo: https://github.com/Lucas-C/pre-commit-hooks
-  rev: v1.1.9
+  rev: v1.5.5
   hooks:
   - id: insert-license
-    exclude: ^\..*$
+    exclude: |
+      (?x)^(
+          ^\..*$ |
+          noxfile.py
+      )$
     types: [python]
-    args: [--comment-style, "|#|", --license-filepath, ./LICENSE_HEADER.txt]
+    args: [--comment-style, '|#|', --license-filepath, ./LICENSE_HEADER.txt]
 
 - repo: https://github.com/pre-commit/pre-commit-hooks
-  rev: "v4.6.0"
+  rev: v4.6.0
   hooks:
   - id: check-added-large-files
   - id: check-case-conflict
@@ -43,16 +52,14 @@ repos:
   - id: debug-statements
   - id: end-of-file-fixer
   - id: mixed-line-ending
-  - id: name-tests-test
-    args: ["--pytest-test-first"]
   - id: requirements-txt-fixer
   - id: trailing-whitespace
 
 - repo: https://github.com/astral-sh/ruff-pre-commit
-  rev: v0.4.6
+  rev: v0.4.8
   hooks:
   - id: ruff
-    args: ["--fix", "--show-fixes", "--preview"]
+    args: [--fix, --show-fixes]
   - id: ruff-format
 
 - repo: https://github.com/pre-commit/mirrors-mypy
@@ -67,12 +74,12 @@ repos:
     - numpy==1.26.4
     - pytest==8.2.1
 - repo: https://github.com/codespell-project/codespell
-  rev: "v2.2.6"
+  rev: v2.3.0
   hooks:
   - id: codespell
 
 - repo: https://github.com/shellcheck-py/shellcheck-py
-  rev: "v0.10.0.1"
+  rev: v0.10.0.1
   hooks:
   - id: shellcheck
 
@@ -85,13 +92,13 @@ repos:
     exclude: .pre-commit-config.yaml
 
 - repo: https://github.com/abravalheri/validate-pyproject
-  rev: "v0.16"
+  rev: v0.18
   hooks:
   - id: validate-pyproject
-    additional_dependencies: ["validate-pyproject-schema-store[all]"]
+    additional_dependencies: ['validate-pyproject-schema-store[all]']
 
 - repo: https://github.com/python-jsonschema/check-jsonschema
-  rev: "0.28.1"
+  rev: 0.28.5
   hooks:
   - id: check-dependabot
   - id: check-github-workflows
diff --git a/.readthedocs.yaml b/.readthedocs.yaml
index c27af52..c67fcdc 100644
--- a/.readthedocs.yaml
+++ b/.readthedocs.yaml
@@ -6,7 +6,7 @@ version: 2
 build:
   os: ubuntu-22.04
   tools:
-    python: "3.11"
+    python: '3.11'
 sphinx:
   configuration: docs/conf.py
 
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 5967d06..358cc1c 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -5,7 +5,7 @@ All notable changes to this project will be documented in this file.
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
 
-## [Unreleased] - 2024-04-12
+## \[Unreleased\] - 2024-04-12
 
 ### Added
 
diff --git a/CODING_GUIDELINES.md b/CODING_GUIDELINES.md
index 582ae00..7874f60 100644
--- a/CODING_GUIDELINES.md
+++ b/CODING_GUIDELINES.md
@@ -7,7 +7,9 @@ We follow the [Google Python Style Guide][google-style-guide] with a few minor c
 We deviate from the [Google Python Style Guide][google-style-guide] only in the following points:
 
 - We use [`ruff-linter`][ruff-linter] instead of [`pylint`][pylint].
+
 - We use [`ruff-formatter`][ruff-formatter] for source code and imports formatting, which may work differently than indicated by the guidelines in section [_3. Python Style Rules_](https://google.github.io/styleguide/pyguide.html#3-python-style-rules). For example, maximum line length is set to 100 instead of 79 (although docstring lines should still be limited to 79).
+
 - According to subsection [_2.19 Power Features_](https://google.github.io/styleguide/pyguide.html#219-power-features), direct use of _power features_ (e.g. custom metaclasses, import hacks, reflection) should be avoided, but standard library classes that internally use these power features are accepted. Following the same spirit, we allow the use of power features in infrastructure code with similar functionality and scope as the Python standard library.
 
   ```python
@@ -33,15 +35,15 @@ We deviate from the [Google Python Style Guide][google-style-guide] only in the
   ```python
   # Correct use of `...` as the empty body of an abstract method
   class AbstractFoo:
-     @abstractmethod
-     def bar(self) -> Bar:
-        ...
+      @abstractmethod
+      def bar(self) -> Bar: ...
+
 
   # Correct use of `pass` when mixed with other statements
   try:
-     resource.load(id=42)
+      resource.load(id=42)
   except ResourceException:
-     pass
+      pass
   ```
 
 ### Error messages
@@ -51,7 +53,9 @@ Error messages should be written as sentences, starting with a capital letter an
 Examples:
 
 ```python
-raise ValueError(f"Invalid argument 'dimension': should be of type 'Dimension', got '{dimension.type}'.")
+raise ValueError(
+    f"Invalid argument 'dimension': should be of type 'Dimension', got '{dimension.type}'."
+)
 ```
 
 Interpolated integer values do not need double quotes, if they are indicating an amount. Example:
@@ -63,19 +67,25 @@ raise ValueError(f"Invalid number of arguments: expected 3 arguments, got {len(a
 The double quotes can also be dropped when presenting a sequence of values. In this case the message should be rephrased so the sequence is separated from the text by a colon ':'.
 
 ```python
-raise ValueError(f"unexpected keyword arguments: {', '.join(set(kwarg_names) - set(expected_kwarg_names))}.")
+raise ValueError(
+    f"unexpected keyword arguments: {', '.join(set(kwarg_names) - set(expected_kwarg_names))}."
+)
 ```
 
 The message should be kept to one sentence if reasonably possible. Ideally the sentence should be kept short and avoid unnecessary words. Examples:
 
 ```python
 # too many sentences
-raise ValueError(f"Received an unexpected number of arguments. Should receive 5 arguments, but got {len(args)}. Please provide the correct number of arguments.")
+raise ValueError(
+    f"Received an unexpected number of arguments. Should receive 5 arguments, but got {len(args)}. Please provide the correct number of arguments."
+)
 # better
 raise ValueError(f"Wrong number of arguments: expected 5, got {len(args)}.")
 
 # less extreme
-raise TypeError(f"Wrong argument type. Can only accept 'int's, got '{type(arg)}' instead.")
+raise TypeError(
+    f"Wrong argument type. Can only accept 'int's, got '{type(arg)}' instead."
+)
 # but can still be improved
 raise TypeError(f"Wrong argument type: 'int' expected, got '{type(arg)}'")
 ```
@@ -86,14 +96,14 @@ The terseness vs. helpfulness tradeoff should be more in favor of terseness for
 
 TODO: update to `autodoc2`
 
-We generate the API documentation automatically from the docstrings using [Sphinx][sphinx] and some extensions such as [Sphinx-autodoc][sphinx-autodoc] and [Sphinx-napoleon][sphinx-napoleon]. These follow the Google Python Style Guide docstring conventions to automatically format the generated documentation. A complete overview can be found here: [Example Google Style Python Docstrings](https://sphinxcontrib-napoleon.readthedocs.io/en/latest/example_google.html#example-google).
+We generate the API documentation automatically from the docstrings using [Sphinx] and some extensions such as [Sphinx-autodoc] and [Sphinx-napoleon]. These follow the Google Python Style Guide docstring conventions to automatically format the generated documentation. A complete overview can be found here: [Example Google Style Python Docstrings](https://sphinxcontrib-napoleon.readthedocs.io/en/latest/example_google.html#example-google).
 
 Sphinx supports the [reStructuredText][sphinx-rest] (reST) markup language for defining additional formatting options in the generated documentation, however section [_3.8 Comments and Docstrings_](https://google.github.io/styleguide/pyguide.html#38-comments-and-docstrings) of the Google Python Style Guide does not specify how to use markups in docstrings. As a result, we decided to forbid reST markup in docstrings, except for the following cases:
 
 - Cross-referencing other objects using Sphinx text roles for the [Python domain](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#the-python-domain) (as explained [here](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#python-roles)).
-- Very basic formatting markup to improve _readability_ of the generated documentation without obscuring the source docstring (e.g. ` ``literal`` ` strings, bulleted lists).
+- Very basic formatting markup to improve _readability_ of the generated documentation without obscuring the source docstring (e.g. ``` ``literal`` ``` strings, bulleted lists).
 
-We highly encourage the [doctest][doctest] format for code examples in docstrings. In fact, doctest runs code examples and makes sure they are in sync with the codebase.
+We highly encourage the [doctest] format for code examples in docstrings. In fact, doctest runs code examples and makes sure they are in sync with the codebase.
 
 ### Module structure
 
@@ -124,14 +134,16 @@ Consider configuration files as another type of source code and apply the same c
 You may occasionally need to disable checks from _quality assurance_ (QA) tools (e.g. linters, type checkers, etc.) on specific lines as some tool might not be able to fully understand why a certain piece of code is needed. This is usually done with special comments, e.g. `# noqa: F401`, `# type: ignore`. However, you should **only** ignore QA errors when you fully understand their source and rewriting your code to pass QA checks would make it less readable. Additionally, you should add a short descriptive code if possible (check [ruff rules][ruff-rules] and [mypy error codes][mypy-error-codes] for reference):
 
 ```python
-f = lambda: 'empty'  # noqa: E731 [lambda-assignment]
+f = lambda: "empty"  # noqa: E731 [lambda-assignment]
 ```
 
 and, if needed, a brief comment for future reference:
 
 ```python
 ...
-return undeclared_symbol  # noqa: F821 [undefined-name] on purpose to trigger black-magic
+return (
+    undeclared_symbol  # noqa: F821 [undefined-name] on purpose to trigger black-magic
+)
 ```
 
 ## Testing
@@ -142,9 +154,7 @@ Testing components is a critical part of a software development project. We foll
 
 [doctest]: https://docs.python.org/3/library/doctest.html
 [google-style-guide]: https://google.github.io/styleguide/pyguide.html
-[mypy]: https://mypy.readthedocs.io/
 [mypy-error-codes]: https://mypy.readthedocs.io/en/stable/error_code_list.html
-[pre-commit]: https://pre-commit.com/
 [pylint]: https://pylint.pycqa.org/
 [ruff-formatter]: https://docs.astral.sh/ruff/formatter/
 [ruff-linter]: https://docs.astral.sh/ruff/linter/
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index e3dc26e..19d5adb 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -98,7 +98,7 @@ Before submitting a pull request, check that it meets the following criteria:
 3. The pull request should have a proper description of its intent and the main changes in the code. In general this description should be used as commit message if the pull request is approved (check point **5.** below).
 4. If the pull request contains code authored by first-time contributors, they should add their names to the [AUTHORS.md](AUTHORS.md) file.
 5. Pick one reviewer and try to contact them directly to let them know about the pull request. If there is no feedback in 24h/48h try to contact them again or pick another reviewer.
-6. Once the pull request has been approved, it should be squash-merged as soon as possible with a meaningful description of the changes. We use the [Conventional Commits][https://www.conventionalcommits.org/en/v1.0.0/#summary] specification for writing informative and automation-friendly commit messages. The following _commit types_ are accepted:
+6. Once the pull request has been approved, it should be squash-merged as soon as possible with a meaningful description of the changes. We use the [Conventional Commits](https://www.conventionalcommits.org/en/v1.0.0/#summary) specification for writing informative and automation-friendly commit messages. The following _commit types_ are accepted:
    - `build`: changes that affect the build system or external dependencies
    - `chore`: changes related to the development tools or process
    - `ci`: changes to our CI configuration files and scripts
diff --git a/README.md b/README.md
index f17b970..fe91ae6 100644
--- a/README.md
+++ b/README.md
@@ -20,16 +20,17 @@ The DaCe project aims to build new representations for programs and algorithms,
 <!-- SPHINX-START -->
 
 <!-- prettier-ignore-start -->
-[actions-badge]:            https://github.com/GridTools/JaCe/workflows/CI/badge.svg
-[actions-link]:             https://github.com/GridTools/JaCe/actions
-[conda-badge]:              https://img.shields.io/conda/vn/conda-forge/JaCe
-[conda-link]:               https://github.com/conda-forge/JaCe-feedstock
-[github-discussions-badge]: https://img.shields.io/static/v1?label=Discussions&message=Ask&color=blue&logo=github
-[github-discussions-link]:  https://github.com/GridTools/JaCe/discussions
-[pypi-link]:                https://pypi.org/project/JaCe/
-[pypi-platforms]:           https://img.shields.io/pypi/pyversions/JaCe
-[pypi-version]:             https://img.shields.io/pypi/v/JaCe
-[rtd-badge]:                https://readthedocs.org/projects/JaCe/badge/?version=latest
-[rtd-link]:                 https://JaCe.readthedocs.io/en/latest/?badge=latest
 
 <!-- prettier-ignore-end -->
+
+[actions-badge]: https://github.com/GridTools/JaCe/workflows/CI/badge.svg
+[actions-link]: https://github.com/GridTools/JaCe/actions
+[conda-badge]: https://img.shields.io/conda/vn/conda-forge/JaCe
+[conda-link]: https://github.com/conda-forge/JaCe-feedstock
+[github-discussions-badge]: https://img.shields.io/static/v1?label=Discussions&message=Ask&color=blue&logo=github
+[github-discussions-link]: https://github.com/GridTools/JaCe/discussions
+[pypi-link]: https://pypi.org/project/JaCe/
+[pypi-platforms]: https://img.shields.io/pypi/pyversions/JaCe
+[pypi-version]: https://img.shields.io/pypi/v/JaCe
+[rtd-badge]: https://readthedocs.org/projects/JaCe/badge/?version=latest
+[rtd-link]: https://JaCe.readthedocs.io/en/latest/?badge=latest
diff --git a/ROADMAP.md b/ROADMAP.md
index 2beaa39..ec14397 100644
--- a/ROADMAP.md
+++ b/ROADMAP.md
@@ -9,23 +9,23 @@ A kind of roadmap that gives a rough idea about how the project will be continue
   - [ ] Implementing the `stages` model that is supported by Jax.
   - [ ] Handling Jax arrays as native input (only on single host).
   - [ ] Cache the compilation and lowering results for later reuse.
-        In Jax these parts (together with the dispatch) are actually written in C++, thus in the beginning we will use a self made cache.
+    In Jax these parts (together with the dispatch) are actually written in C++, thus in the beginning we will use a self made cache.
 - [ ] Implementing some basic `PrimitiveTranslators`, that allows us to run some early tests, such as:
   - [ ] Backporting the ones from the prototype.
   - [ ] Implement the `scatter` primitive (needed for pyhpc).
   - [ ] Implement the `scan` primitive (needed for pyhpc).
 - [ ] _Initial_ optimization pipeline
-      In order to do benchmarks, we need to perform optimizations first.
-      However, the one offered by DaCe were not that well, so we should, for now, backport the ones from the prototype.
+  In order to do benchmarks, we need to perform optimizations first.
+  However, the one offered by DaCe were not that well, so we should, for now, backport the ones from the prototype.
 - [ ] Support GPU code (relatively simple, but needs some detection logic).
 - [ ] Initial benchmark:
-      In the beginning we will not have the same dispatching performance as Jax.
-      But passing these benchmarks could give us some better hint of how to proceed in this matter.
+  In the beginning we will not have the same dispatching performance as Jax.
+  But passing these benchmarks could give us some better hint of how to proceed in this matter.
   - [ ] Passing the [pyhpc-benchmark](https://github.com/dionhaefner/pyhpc-benchmarks)
   - [ ] Passing Felix' fluid project; possibility.
 - [ ] Support of static arguments.
 - [ ] Stop relying on `jax.make_jaxpr()`.
-      Look at the `jax._src.pjit.make_jit()` function for how to hijack the staging process.
+  Look at the `jax._src.pjit.make_jit()` function for how to hijack the staging process.
 - [ ] Implementing more advanced primitives:
   - [ ] Handling pytrees as arguments.
   - [ ] Implement random numbers.
@@ -44,15 +44,15 @@ These are more general topics that should be addressed at one point.
 - [ ] Integrating better with Jax
   - [ ] Support its array type (probably implement this in DaCe).
 - [ ] Increase the dispatching speed + Cache
-      Jax does this in C++, which is impossible to beat in Python, thus we have to go that root as well.
+  Jax does this in C++, which is impossible to beat in Python, thus we have to go that root as well.
 - [ ] Debugging information.
 - [ ] Dynamic shapes
-      This could be done by making the inputs fully dynamic, and then use the primitives to simplify.
-      For example in an addition the shape of the two inputs and the outputs are the same.
-      That is knowledge that is inherent to the primitives itself.
-      However, the compiled object must know how to extract the sizes itself.
+  This could be done by making the inputs fully dynamic, and then use the primitives to simplify.
+  For example in an addition the shape of the two inputs and the outputs are the same.
+  That is knowledge that is inherent to the primitives itself.
+  However, the compiled object must know how to extract the sizes itself.
 - [ ] Defining a Logo:
-      It should be green with a nice curly font.
+  It should be green with a nice curly font.
 
 # Optimization & Transformations
 
@@ -61,7 +61,7 @@ Our experiments with the prototype showed that the most important transformation
 
 - [ ] Modified state fusion; Because of the structure we have, this could make `Simplify` much more efficient.
 - [ ] Trivial Tasklet removal.
-      Since we will work a lot with Maps that are trivial (probably the best structure for fusing) we will end up with some of trivial Tasklets, i.e. `__out = __in`.
-      Thus, we should have a good way to get rid of them.
+  Since we will work a lot with Maps that are trivial (probably the best structure for fusing) we will end up with some of trivial Tasklets, i.e. `__out = __in`.
+  Thus, we should have a good way to get rid of them.
 - [ ] Modified Map fusion transformation.
-      We should still support parallel and serial fusion as the prototype did, but focusing on serial.
+  We should still support parallel and serial fusion as the prototype did, but focusing on serial.
diff --git a/pyproject.toml b/pyproject.toml
index 33023fd..e4f1d11 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,10 +1,12 @@
 [build-system]
 build-backend = "setuptools.build_meta"
-requires = ["setuptools>=61"]
+requires = [
+  "setuptools>=61",
+]
 
 [project]
 authors = [
-  {name = "ETH Zurich", email = "gridtools@cscs.ch"}
+  {name = "ETH Zurich", email = "gridtools@cscs.ch"},
 ]
 classifiers = [
   "Development Status :: 1 - Planning",
@@ -19,12 +21,12 @@ classifiers = [
   "Programming Language :: Python :: 3.11",
   "Programming Language :: Python :: 3.12",
   "Topic :: Scientific/Engineering",
-  "Typing :: Typed"
+  "Typing :: Typed",
 ]
 dependencies = [
   "dace>=0.15",
   "jax[cpu]>=0.4.24",
-  "numpy>=1.26.0"
+  "numpy>=1.26.0",
 ]
 description = "JAX jit using DaCe (Data Centric Parallel Programming)"
 name = "JaCe"
@@ -37,7 +39,7 @@ license.file = "LICENSE"
 cuda12 = [
   "cupy-cuda12x>=12.1.0",
   "jax[cuda12]>=0.4.24",
-  "optuna>=3.4.0"
+  "optuna>=3.4.0",
 ]
 
 [project.urls]
@@ -46,12 +48,32 @@ Changelog = "https://github.com/GridTools/JaCe/releases"
 Discussions = "https://github.com/GridTools/JaCe/discussions"
 Homepage = "https://github.com/GridTools/JaCe"
 
+# -- coverage --
 [tool.coverage]
-report.exclude_also = [
+
+[tool.coverage.html]
+show_contexts = true
+
+[tool.coverage.report]
+exclude_also = [
   '\.\.\.',
-  'if typing.TYPE_CHECKING:'
+  'if TYPE_CHECKING:',
+  'if typing.TYPE_CHECKING:',
+  'def __repr__',
+  '@overload',
+  'raise AssertionError',
+  'raise NotImplementedError',
+  'if 0:',
+  'if __name__ == .__main__.:',
+  '@(abc\\.)?abstractmethod',
+  '@(abc\\.)?abstract',
+  'class .*\bProtocol\):',
 ]
-run.source = ["jace"]
+
+[tool.coverage.run]
+branch = true
+dynamic_context = "test_function"
+source = ["jace"]
 
 # -- mypy  --
 [tool.mypy]
@@ -76,93 +98,145 @@ warn_unused_ignores = true
 disallow_incomplete_defs = false
 disallow_untyped_defs = false
 ignore_missing_imports = true
-module = ["tests.*", "dace.*", "jax.*", "jaxlib.*"]
+module = [
+  "tests.*",
+  "dace.*",
+  "jax.*",
+  "jaxlib.*",
+]
 
 # -- pytest  --
 [tool.pytest]
 
 [tool.pytest.ini_options]
 addopts = ["-ra", "--showlocals", "--strict-markers", "--strict-config"]
-filterwarnings = [
-  "error"
-]
+filterwarnings = ["error"]
 log_cli_level = "INFO"
 minversion = "6.0"
-testpaths = [
-  "tests"
-]
+testpaths = ["tests"]
 xfail_strict = true
 
 # -- ruff --
 [tool.ruff]
-extend-exclude = ["noxfile.py"]
 line-length = 100
+preview = true
 respect-gitignore = true
 show-fixes = true
 src = ["src"]
 
 [tool.ruff.format]
 docstring-code-format = true
-skip-magic-trailing-comma = true
 
 [tool.ruff.lint]
+extend-safe-fixes = ["D", "TCH"]
 extend-select = [
   "A",  # flake8-builtins
   "B",  # flake8-bugbear
   "I",  # isort
   "G",  # flake8-logging-format
+  "N",  # pep8-naming
+  "W",  # pycodestyle-warning
   "C4",  # flake8-comprehensions
+  "C90",  # mccabe
+  "D",  # pydocstyle
+  "D213",  # multi-line-summary-second-line (off by default in pydocstyle "google' convention)
   "PT",  # flake8-pytest-style
-  "UP",  # pyupgrade       # TODO: in evaluation
+  "TD",  # flake8-todo
+  "UP",  # pyupgrade
   "ARG",  # flake8-unused-arguments
   "ERA",  # eradicate
+  "FLY",  # flynt
   "ICN",  # flake8-import-conventions
+  "NPY",  # NumPy specific rules
+  "PERF",  # Perflint
   "PGH",  # pygrep-hooks
   "PIE",  # flake8-pie
+  "PL",  # pylint
   "PTH",  # flake8-use-pathlib
-  "RET",  # flake8-return   # TODO: in evaluation
+  "RET",  # flake8-return
   "RUF",  # Ruff-specific
-  "SIM",  # flake8-simplify # TODO: in evaluation
+  "SIM",  # flake8-simplify
+  "SLOT",  # flake8-slots
   "T10",  # flake8-debugger
-  "T20",  # flake8-print    # TODO: in evaluation
-  "TCH",  # flake8-type-checking  # TODO: in evaluation
-  "NPY"  # NumPy specific rules
+  "T20",  # flake8-print
+  "TCH",  # flake8-type-checking
+  "TRY",  # tryceratops
 ]
 ignore = [
-  'B905',  # [zip-without-explicit-strict]
-  'E501',  # [line-too-long]
-  'UP038'  # [non-pep604-isinstance]
+  "B905",  # [zip-without-explicit-strict]
+  "D105",  # [undocumented-magic-method]
+  "D107",  # [undocumented-public-init]
+  "D212",  # [multi-line-summary-first-line]
+  "D402",  # [no-signature]
+  "E501",  # [line-too-long]
+  "TCH003",  # [typing-only-standard-library-import]
+  "TD003",  # [missing-todo-link]
+  "TRY003",  # [raise-vanilla-args]  # TODO(egparedes): reevaluate if it should be activated
+  "UP038",  # [non-pep604-isinstance]
 ]
+task-tags = ["TODO"]
 # ignore-init-module-imports = true  # deprecated in preview mode
 unfixable = []
 
 [tool.ruff.lint.isort]
 combine-as-imports = true
-known-first-party = ['jace']
+known-first-party = ["jace"]
 known-third-party = [
-  'cupy',
-  'dace',
-  'jax',
-  'numpy',
-  'pytest',
-  'typing_extensions'
+  "cupy",
+  "dace",
+  "jax",
+  "numpy",
+  "pytest",
+  "typing_extensions",
 ]
 lines-after-imports = 2
 order-by-type = true
 required-imports = ["from __future__ import annotations"]
 section-order = [
-  'future',
-  'standard-library',
-  'third-party',
-  'first-party',
-  'tests',
-  'local-folder'
+  "future",
+  "standard-library",
+  "third-party",
+  "first-party",
+  "tests",
+  "local-folder",
 ]
 
 [tool.ruff.lint.isort.sections]
-tests = ["tests", "unit_tests", "integration_tests"]
+tests = [
+  "tests",
+  "unit_tests",
+  "integration_tests",
+]
+
+[tool.ruff.lint.mccabe]
+max-complexity = 12
 
 [tool.ruff.lint.per-file-ignores]
-"!tests/**.py" = ["PT"]  # Ignore `flake8-pytest-style` everywhere except in `tests/`
-"noxfile.py" = ["T20"]  # Ignore `flake8-print`
-"tests/**" = ["T10", "T20"]  # Ignore `flake8-debugger` and `flake8-print`
+"!tests/**.py" = ["PT"]  # Ignore flake8-pytest-style outside 'tests/'
+"docs/**" = [
+  "D",  # pydocstyle
+  "T10",  # flake8-debugger
+  "T20",  # flake8-print
+]
+"noxfile.py" = [
+  "D",  # pydocstyle
+  "T20",  # flake8-print
+]
+"tests/**" = [
+  "D",  # pydocstyle
+  "N",  # TODO(egparedes): remove ignore as soon as all tests are properly named
+  "PLR2004",  # [magic-value-comparison]
+  "T10",  # flake8-debugger
+  "T20",  # flake8-print
+]
+
+[tool.ruff.lint.pycodestyle]
+ignore-overlong-task-comments = true
+max-doc-length = 88
+
+[tool.ruff.lint.pydocstyle]
+convention = "google"
+ignore-decorators = ["typing.overload"]
+
+[tool.ruff.lint.pylint]
+max-args = 6
diff --git a/src/jace/api.py b/src/jace/api.py
index 46e15b2..8afc20a 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -48,16 +48,18 @@ def jit(
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
 ) -> stages.JaCeWrapped | Callable[[Callable], stages.JaCeWrapped]:
-    """JaCe's replacement for `jax.jit` (just-in-time) wrapper.
+    """
+    JaCe's replacement for `jax.jit` (just-in-time) wrapper.
 
     It works the same way as `jax.jit` does, but instead of using XLA the
     computation is lowered to DaCe. In addition it accepts some JaCe specific
     arguments.
 
     Args:
-        primitive_translators: Use these primitive translators for the lowering
-            to SDFG. If not specified the translators in the global registry are
-            used.
+        fun: Function to wrap.
+        primitive_translators: Use these primitive translators for the lowering to SDFG.
+            If not specified the translators in the global registry are used.
+        kwargs: Jit arguments.
 
     Notes:
         After constructions any change to `primitive_translators` has no effect.
@@ -69,7 +71,7 @@ def jit(
         )
 
     def wrapper(f: Callable) -> stages.JaCeWrapped:
-        # TODO: Improve typing, such that signature is attached to the `JaCeWrapped`.
+        # TODO(egparedes): Improve typing.
         jace_wrapper = stages.JaCeWrapped(
             fun=f,
             primitive_translators=(
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index 92b52e4..b5af4fa 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -5,7 +5,8 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""JaCe specific optimizations.
+"""
+JaCe specific optimizations.
 
 Currently just a dummy exists for the sake of providing a callable function.
 """
@@ -22,7 +23,8 @@
 
 
 class CompilerOptions(TypedDict, total=False):
-    """All known compiler options to `JaCeLowered.compile()`.
+    """
+    All known compiler options to `JaCeLowered.compile()`.
 
     See `jace_optimize()` for a description of the different options.
 
@@ -41,8 +43,9 @@ class CompilerOptions(TypedDict, total=False):
 NO_OPTIMIZATIONS: Final[CompilerOptions] = {"auto_optimize": False, "simplify": False}
 
 
-def jace_optimize(tsdfg: translator.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOptions]) -> None:
-    """Performs optimization of the translated SDFG _in place_.
+def jace_optimize(tsdfg: translator.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOptions]) -> None:  # noqa: D417  # Missing description for kwargs
+    """
+    Performs optimization of the translated SDFG _in place_.
 
     It is recommended to use the `CompilerOptions` `TypedDict` to pass options
     to the function. However, any option that is not specified will be
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 81ebe61..4639b11 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -4,7 +4,8 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
-"""Reimplementation of the `jax.stages` module.
+"""
+Reimplementation of the `jax.stages` module.
 
 This module reimplements the public classes of that Jax module.
 However, they are a bit different, because JaCe uses DaCe as backend.
@@ -53,7 +54,8 @@
 
 
 class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
-    """A function ready to be specialized, lowered, and compiled.
+    """
+    A function ready to be specialized, lowered, and compiled.
 
     This class represents the output of functions such as `jace.jit()` and is
     the first stage in the translation/compilation chain of JaCe. A user should
@@ -66,7 +68,7 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
 
     Args:
         fun: The function that is wrapped.
-        primitive_translators: The list of primitive translators that that should be used.
+        primitive_translators: Primitive translators that that should be used.
         jit_options: Options to influence the jit process.
 
     Todo:
@@ -99,13 +101,13 @@ def __init__(
         self._fun = fun
 
     def __call__(self, *args: Any, **kwargs: Any) -> Any:
-        """Executes the wrapped function, lowering and compiling as needed in one step.
+        """
+        Executes the wrapped function, lowering and compiling as needed in one step.
 
         The arguments passed to this function are the same as the wrapped function uses.
         """
-
-        # If we are inside a traced context, then we forward the call to the wrapped function.
-        #  This ensures that JaCe is composable with Jax.
+        # If we are inside a traced context, then we forward the call to the wrapped
+        #  function. This ensures that JaCe is composable with Jax.
         if util.is_tracing_ongoing(*args, **kwargs):
             return self._fun(*args, **kwargs)
 
@@ -115,7 +117,8 @@ def __call__(self, *args: Any, **kwargs: Any) -> Any:
 
     @tcache.cached_transition
     def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
-        """Lower this function explicitly for the given arguments.
+        """
+        Lower this function explicitly for the given arguments.
 
         Performs the first two steps of the AOT steps described above, i.e.
         trace the wrapped function with the given arguments and stage it out
@@ -130,16 +133,18 @@ def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
         if len(kwargs) != 0:
             raise NotImplementedError("Currently only positional arguments are supported.")
 
-        # TODO(phimuell): Currently the SDFG that we build only supports `C_CONTIGUOUS` memory
-        #  order. Since we support the paradigm that "everything passed to `lower()` should also
-        #  be accepted as argument to call the result", we forbid other memory orders here.
+        # TODO(phimuell): Currently the SDFG that we build only supports `C_CONTIGUOUS`
+        #  memory order. Since we support the paradigm that "everything passed to
+        #  `lower()` should also be accepted as argument to call the result", we forbid
+        #  other memory orders here.
         if not all((not util.is_array(arg)) or arg.flags["C_CONTIGUOUS"] for arg in args):
             raise NotImplementedError("Currently can not yet handle strides beside 'C_CONTIGUOUS'.")
 
-        # In Jax `float32` is the main datatype, and they go to great lengths to avoid some
-        #  aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
-        #  However, in this case we will have problems when we call the SDFG, for some reasons
-        #  `CompiledSDFG` does not work in that case correctly, thus we enable it for the tracing.
+        # In Jax `float32` is the main datatype, and they go to great lengths to avoid
+        #  some aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
+        #  However, in this case we will have problems when we call the SDFG, for some
+        #  reasons `CompiledSDFG` does not work in that case correctly, thus we enable
+        #  it for the tracing.
         with _jax.experimental.enable_x64():
             builder = translator.JaxprTranslationBuilder(
                 primitive_translators=self._primitive_translators
@@ -147,8 +152,8 @@ def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
             jaxpr = _jax.make_jaxpr(self._fun)(*args)
             trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
 
-        # Perform the post processing and turn it into a `TranslatedJaxprSDFG` that can be
-        #  compiled and called later.
+        # Perform the post processing and turn it into a `TranslatedJaxprSDFG` that can
+        #  be compiled and called later.
         # NOTE: `tsdfg` was deepcopied as a side effect of post processing.
         tsdfg: translator.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
             trans_ctx=trans_ctx,
@@ -165,7 +170,8 @@ def wrapped_fun(self) -> Callable:
         return self._fun
 
     def _make_call_description(self, *args: Any) -> tcache.StageTransformationSpec:
-        """This function computes the key for the `JaCeWrapped.lower()` call inside the cache.
+        """
+        Computes the key for the `JaCeWrapped.lower()` call inside the cache.
 
         The function will compute a full abstract description on its argument.
         """
@@ -174,7 +180,8 @@ def _make_call_description(self, *args: Any) -> tcache.StageTransformationSpec:
 
 
 class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
-    """Represents the original computation as an SDFG.
+    """
+    Represents the original computation as an SDFG.
 
     This class is the output type of `JaCeWrapped.lower()` and represents the
     originally wrapped computation as an SDFG. This stage is followed by the
@@ -198,7 +205,8 @@ def __init__(self, tsdfg: translator.TranslatedJaxprSDFG) -> None:
 
     @tcache.cached_transition
     def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled:
-        """Optimize and compile the lowered SDFG using `compiler_options`.
+        """
+        Optimize and compile the lowered SDFG using `compiler_options`.
 
         Returns an object that encapsulates a compiled SDFG object. To influence
         the various optimizations and compile options of JaCe you can use the
@@ -209,8 +217,8 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
             Before `compiler_options` is forwarded to `jace_optimize()` it
             will be merged with the default arguments.
         """
-        # We **must** deepcopy before we do any optimization, because all optimizations are in
-        #  place, however, to properly cache stages, stages needs to be immutable.
+        # We **must** deepcopy before we do any optimization, because all optimizations
+        #  are in place, to properly cache stages, stages needs to be immutable.
         tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
         optimization.jace_optimize(tsdfg=tsdfg, **self._make_compiler_options(compiler_options))
 
@@ -221,7 +229,8 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
         )
 
     def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
-        """Returns the internal SDFG.
+        """
+        Returns the internal SDFG.
 
         The function returns a `TranslatedJaxprSDFG` object. Direct modification
         of the returned object is forbidden and will cause undefined behaviour.
@@ -231,14 +240,16 @@ def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprS
         raise ValueError(f"Unknown dialect '{dialect}'.")
 
     def view(self, filename: str | None = None) -> None:
-        """Runs the `view()` method of the underlying SDFG.
+        """
+        Runs the `view()` method of the underlying SDFG.
 
         This will open a browser and display the SDFG.
         """
         self.compiler_ir().sdfg.view(filename=filename, verbose=False)
 
     def as_sdfg(self) -> dace.SDFG:
-        """Returns the encapsulated SDFG.
+        """
+        Returns the encapsulated SDFG.
 
         Modifying the returned SDFG in any way is undefined behavior.
         """
@@ -247,7 +258,8 @@ def as_sdfg(self) -> dace.SDFG:
     def _make_call_description(
         self, compiler_options: CompilerOptions | None = None
     ) -> tcache.StageTransformationSpec:
-        """This function computes the key for the `self.compile()` call inside the cache.
+        """
+        This function computes the key for the `self.compile()` call inside the cache.
 
         The key that is computed by this function is based on the concrete
         values of the passed compiler options.
@@ -256,12 +268,14 @@ def _make_call_description(
         call_args = tuple(sorted(options.items(), key=lambda x: x[0]))
         return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
 
-    def _make_compiler_options(self, compiler_options: CompilerOptions | None) -> CompilerOptions:
+    @staticmethod
+    def _make_compiler_options(compiler_options: CompilerOptions | None) -> CompilerOptions:
         return optimization.DEFAULT_OPTIMIZATIONS | (compiler_options or {})
 
 
 class JaCeCompiled:
-    """Compiled version of the SDFG.
+    """
+    Compiled version of the SDFG.
 
     This is the last stage of the jit chain. A user should never create a
     `JaCeCompiled` instance, instead `JaCeLowered.compile()` should be used.
@@ -292,7 +306,8 @@ def __init__(
         self._out_names = tuple(out_names)
 
     def __call__(self, *args: Any, **kwargs: Any) -> Any:
-        """Calls the embedded computation.
+        """
+        Calls the embedded computation.
 
         The arguments must be the same as for the wrapped function, but with
         all static arguments removed.
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index a045f0c..2f184a0 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -5,7 +5,8 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Subpackage containing all the code related to the Jaxpr to SDFG translation.
+"""
+Subpackage containing all the code related to the Jaxpr to SDFG translation.
 
 The concrete primitive translators that ships with JaCe are inside the
 `primitive_translators` subpackage.
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 6c9c488..da2e68f 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -4,7 +4,6 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
-
 """Contains the translator that actually builds an SDFG based on a Jaxpr description."""
 
 from __future__ import annotations
@@ -25,11 +24,12 @@
 
 
 class JaxprTranslationBuilder:
-    """Internal builder class for creating an SDFG equivalent of a `Jaxpr` instance.
+    """
+    Internal builder class for creating an SDFG equivalent of a `Jaxpr` instance.
 
     The SDFG created by this class has a very particular form, which we call
     canonical. The main features of such an SDFG are:
-    - the SDFG is a list of states, ideally each state corresponds to single Jax primitive,
+    - the SDFG is a list of states,
     - it has a single source and sink state.
     - all variable names are derived from Jax names,
     - there are only transient variables inside the SDFG,
@@ -81,9 +81,9 @@ def __init__(
         self._primitive_translators = {**primitive_translators}
 
         # Maps Jax variables to the name of its SDFG equivalent.
-        #  Shared between all translation contexts, to ensure consecutive variable naming as
-        #  seen as in a pretty printed Jaxpr.
-        #  Will be cleared by `_clear_translation_ctx()` at the end of the root translation.
+        #  Shared between all translation contexts, to ensure consecutive variable
+        #  naming as seen as in a pretty printed Jaxpr. Will be cleared by
+        #  `_clear_translation_ctx()` at the end of the root translation.
         self._jax_name_map = {}
 
         # Stack of all context, to handle nested Jaxpr instances.
@@ -93,7 +93,8 @@ def __init__(
     def translate_jaxpr(
         self, jaxpr: jax_core.ClosedJaxpr, *, name: str | None = None
     ) -> TranslationContext:
-        """Perform the translation of a Jaxpr into a SDFG.
+        """
+        Perform the translation of a Jaxpr into a SDFG.
 
         In case this function is called and `self` has an ongoing translation
         process, a new translation context will be created. This allows to
@@ -108,16 +109,16 @@ def translate_jaxpr(
 
         Args:
             name: Use this name for the SDFG instead some generated one.
+            jaxpr: The Jaxpr object that should be translated.
         """
-
         if len(jaxpr.effects) != 0:
             raise NotImplementedError("'Jaxpr' with side effects are not supported.")
 
-        # NOTE: If `self` is already allocated, i.e. has an ongoing translation process,
-        #       the `_allocate_translation_ctx()` function will start a new context.
-        #       Thus the builder will start to translate a second (nested) SDFG.
-        #       Also note that there is no mechanism that forces the integration of the nested
-        #       SDFG/Jaxpr, this must be done manually.
+        # NOTE: If `self` is already allocated, i.e. has an ongoing translation
+        #  process, the `_allocate_translation_ctx()` function will start a new
+        #  context. Thus the builder will start to translate a second (nested)
+        #  SDFG. Also note that there is no mechanism that forces the integration
+        #  of the nested SDFG/Jaxpr, this must be done manually.
         self._allocate_translation_ctx(name=name)
         self._create_constants(jaxpr=jaxpr)
         self._create_initial_input(jaxpr=jaxpr)
@@ -131,7 +132,8 @@ def append_new_state(
         assignments: Mapping[str, Any] | None = None,
         prev_state: dace.SDFGState | None = None,
     ) -> dace.SDFGState:
-        """Creates a new `SDFGState`, adds it to the SDFG and returns it.
+        """
+        Creates a new `SDFGState`, adds it to the SDFG and returns it.
 
         By default the new state is appended to the current terminal state.
         However, if `prev_state` is specified it will be appended to it. In
@@ -140,9 +142,9 @@ def append_new_state(
 
         Args:
             label: The name that should be given to the new `SDFGState`.
-            condition: The condition of the state transitions used on the `InterstateEdge`.
-            assignments: Symbol assignments that should be done during the transition.
-            prev_state: Alternative `SDFGState` at which we should append the new state.
+            condition: Condition on the `InterstateEdge`.
+            assignments: Symbol assignments on the `InterstateEdge`.
+            prev_state: Alternative state at which we append.
 
         Notes:
             It is potentially dangerous to not append to the current terminal
@@ -174,7 +176,8 @@ def append_new_state(
 
     @property
     def arrays(self) -> Mapping[str, ddata.Data]:
-        """Get all data descriptors that are currently known to the SDFG.
+        """
+        Get all data descriptors that are currently known to the SDFG.
 
         Notes:
             Essentially a shorthand and preferred way for `self.sdfg.arrays`.
@@ -183,7 +186,8 @@ def arrays(self) -> Mapping[str, ddata.Data]:
         return cast(Mapping[str, ddata.Data], self._ctx.sdfg.arrays)
 
     def get_array(self, name: str | jax_core.Atom | util.JaCeVar) -> ddata.Data:
-        """Returns the SDFG `Data` object `name` referees to.
+        """
+        Returns the SDFG `Data` object `name` referees to.
 
         `name` can either be a string, in which case it is interpreted as a
         verbatim SDFG name. If it is a Jax or JaCe variable, the function will
@@ -212,14 +216,15 @@ def map_jax_var_to_sdfg(
     def map_jax_var_to_sdfg(
         self, jax_var: jax_core.Atom | util.JaCeVar, allow_fail: bool = False
     ) -> str | None:
-        """Get the name of the SDFG variable to which `jax_var` is referring to.
+        """
+        Get the name of the SDFG variable to which `jax_var` is referring to.
 
         Args:
             jax_var: The Jax variable to look up.
-            allow_fail: If no mapping is known return `None` instead of raising `KeyError`.
+            allow_fail: Return `None` instead of raising a `KeyError`.
         """
         if isinstance(jax_var, jax_core.Literal):
-            raise RuntimeError(f"There is no SDFG variable for literal '{jax_var}'.")
+            raise TypeError(f"There is no SDFG variable for literal '{jax_var}'.")
         if jax_var in self._jax_name_map:
             sdfg_name = self._jax_name_map[jax_var]
         elif allow_fail:
@@ -239,14 +244,16 @@ def sdfg(self) -> dace.SDFG:
         return self._ctx.sdfg
 
     def is_allocated(self) -> bool:
-        """Tests if `self` has an allocated context.
+        """
+        Tests if `self` has an allocated context.
 
         If `self` is allocated then there is also an ongoing translation process.
         """
         return len(self._ctx_stack) != 0
 
     def is_root_translator(self) -> bool:
-        """Tests if `self` is the root translator.
+        """
+        Tests if `self` is the root translator.
 
         The root translator (context) is the very first translator process.
         """
@@ -257,7 +264,8 @@ def is_root_translator(self) -> bool:
     def add_jax_name_mapping(
         self, jax_var: jax_core.Var | util.JaCeVar, sdfg_name: str
     ) -> JaxprTranslationBuilder:
-        """Creates a new mapping between `jax_var` to `sdfg_name`.
+        """
+        Creates a new mapping between `jax_var` to `sdfg_name`.
 
         If the mapping already exists an error will be generated. This function
         is not able to delete a variable mapping that was established before.
@@ -288,7 +296,8 @@ def add_array(
         name_prefix: str | None = None,
         update_var_mapping: bool = False,
     ) -> str:
-        """Creates an SDFG variable for Jax variable `arg` and returns its SDFG name.
+        """
+        Creates an SDFG variable for Jax variable `arg` and returns its SDFG name.
 
         The SDFG object is always created as a transient. Furthermore, the
         function will not update the internal variable mapping, by default.
@@ -302,7 +311,7 @@ def add_array(
         Args:
             arg: The Jax object for which a SDFG equivalent should be created.
             name_prefix: If given it will be used as prefix for the name.
-            update_var_mapping: Update the internal variable mapping; by default `False`.
+            update_var_mapping: Update the internal variable mapping.
 
         Notes:
             As a temporary fix for handling scalar return values, the function
@@ -312,9 +321,8 @@ def add_array(
             parts that might explicitly want a scalar, it also might block
             certain compiler optimization.
         """
-
         if isinstance(arg, jax_core.Literal):
-            raise ValueError(f"Can not generate an SDFG variable for literal '{arg}'.")
+            raise TypeError(f"Can not generate an SDFG variable for literal '{arg}'.")
 
         shape: tuple[int | dace.symbol | str, ...] = util.get_jax_var_shape(arg)
         dtype: dace.typeclass = util.get_jax_var_dtype(arg)
@@ -387,7 +395,8 @@ def create_jax_var_list(  # type: ignore[misc]
         handle_literals: bool = False,
         **kwargs: Any,
     ) -> list[None | str]:
-        """Creates SDFG variables for the listed Jax variables and returns their SDFG names.
+        """
+        Create SDFG variables from the passed Jax variables.
 
         If a Jax variable already has a SDFG equivalent then the function will
         use this variable. If no corresponding SDFG variable is known the function
@@ -403,9 +412,9 @@ def create_jax_var_list(  # type: ignore[misc]
         to `True` literals will will be included in the output with the value `None`.
 
         Args:
-            jax_var_list: The list of Jax variables that should be transformed to SDFG names.
+            jax_var_list: The list of Jax variables that should be processed.
             prevent_creation: Never create a variable, all must already be known.
-            only_creation: Always create a variable, it is an error if one already exist.
+            only_creation: Always create a variable.
             handle_literals: Allow the processing of literals.
             kwargs: Will be forwarded to `self.add_array()` if a variable is created.
 
@@ -436,7 +445,8 @@ def create_jax_var_list(  # type: ignore[misc]
         return ret_list
 
     def _create_initial_input(self, jaxpr: jax_core.ClosedJaxpr) -> None:
-        """Creates the input variables of `jaxpr`.
+        """
+        Creates the input variables of `jaxpr`.
 
         Notes:
             The function will populate the `inp_names` member of the current context.
@@ -451,14 +461,14 @@ def _create_initial_input(self, jaxpr: jax_core.ClosedJaxpr) -> None:
             handle_literals=False,  # Initial arguments are never literals
             update_var_mapping=True,
         )
-        # This forces the code to only accept kwargs; it is also part of "what a canonical sdfg" is.
         self.sdfg.arg_names = []
 
         # The output list is populated by `self._translate_jaxpr_internal()`
         self._ctx.inp_names = tuple(init_in_var_names)
 
     def _create_constants(self, jaxpr: jax_core.ClosedJaxpr) -> None:
-        """Creates all constants requested by the `jaxpr`.
+        """
+        Creates all constants requested by the `jaxpr`.
 
         The function will create an SDFG variable and add them as constant to
         the SDFG. Their value is deepcopied.
@@ -480,7 +490,8 @@ def _create_constants(self, jaxpr: jax_core.ClosedJaxpr) -> None:
             )
 
     def _allocate_translation_ctx(self, name: str | None = None) -> JaxprTranslationBuilder:
-        """Allocate a new context and activate it.
+        """
+        Allocate a new context and activate it.
 
         Args:
             name: The name of the SDFG.
@@ -495,7 +506,8 @@ def _ctx(self) -> TranslationContext:
         return self._ctx_stack[-1]
 
     def _clear_translation_ctx(self) -> TranslationContext | None:
-        """Remove the currently active context from `self` and returns it.
+        """
+        Remove the currently active context from `self` and returns it.
 
         If `self` is not allocated it will return `None`.
         """
@@ -511,7 +523,8 @@ def _clear_translation_ctx(self) -> TranslationContext | None:
         return self._ctx_stack.pop()
 
     def _translate_single_eqn(self, eqn: jax_core.JaxprEqn) -> None:
-        """Translate `eqn` into its SDFG equivalent.
+        """
+        Translate `eqn` into its SDFG equivalent.
 
         To do this the function will perform the following steps:
         - Assemble the in and output variables.
@@ -567,7 +580,8 @@ def _translate_single_eqn(self, eqn: jax_core.JaxprEqn) -> None:
         self._ctx.terminal_state = new_sdfg_term_state
 
     def _translate_jaxpr_internal(self, jaxpr: jax_core.ClosedJaxpr) -> TranslationContext:
-        """Performs the actual translation of the Jaxpr into an SDFG.
+        """
+        Performs the actual translation of the Jaxpr into an SDFG.
 
         The function assumes that the context is allocated as well as the
         initial variables. The function removes and returns the currently
@@ -603,7 +617,8 @@ def _translate_jaxpr_internal(self, jaxpr: jax_core.ClosedJaxpr) -> TranslationC
         return cast(TranslationContext, self._clear_translation_ctx())
 
     def _handle_null_jaxpr(self, jaxpr: jax_core.ClosedJaxpr) -> list[str]:
-        """This function is called in case a `Jaxpr` with zero equations is encountered.
+        """
+        This function is called in case a `Jaxpr` with zero equations is encountered.
 
         A function with zero equation might still have output, in which case
         an input is copied to an output. This function will handle the copying
@@ -634,22 +649,23 @@ def _handle_null_jaxpr(self, jaxpr: jax_core.ClosedJaxpr) -> list[str]:
         out_var_names: list[str] = []
 
         # If we are here then we are dealing with a nested SDFG/Jaxpr, that has output.
-        #  Because an input also serves as output, the nested SDFG will have a connector for the
-        #  input and one for the output, but both with the same name. This will make node
-        #  validation fail. We have to work around this by introducing some fake copies, which
-        #  will be removed by DaCe later.
+        #  Because an input also serves as output, the nested SDFG will have a
+        #  connector for the input and one for the output, but both with the same name.
+        #  This will make node validation fail. We have to work around this by
+        #  introducing some fake copies, which will be removed by DaCe later.
         for jax_out_var in jaxpr.jaxpr.outvars:
-            # Since the output is also used as an input the variable mapping must be already known.
             sdfg_in_name: str = self.map_jax_var_to_sdfg(jax_out_var)
 
-            # Now we create a variable that serves as true output, however, since the Jax variable
-            #  is already known we can not update the variable mapping and must use another name.
+            # Now we create a variable that serves as true output, however, since the
+            #  Jax variable is already known we can not update the variable mapping and
+            #  must use another name.
             sdfg_out_name = self.add_array(
                 jax_out_var, name_prefix="_zero_equation_output_for_", update_var_mapping=False
             )
             out_var_names.append(sdfg_out_name)
 
-            # Now we perform the copy from the input variable in the newly created output variable.
+            # Now we perform the copy from the input variable in the newly created
+            #  output variable.
             inp_acc = self._start_state.add_read(sdfg_in_name)
             out_acc = self._start_state.add_write(sdfg_out_name)
             self._start_state.add_nedge(
@@ -658,11 +674,11 @@ def _handle_null_jaxpr(self, jaxpr: jax_core.ClosedJaxpr) -> list[str]:
                 data=dace.Memlet.from_array(sdfg_in_name, self.get_array(sdfg_in_name)),
             )
 
-            # `jax_out_var` now has, in some sense, two SDFG equivalents, the input, that
-            #  was previously created by `self._create_initial_input()` and the `sdfg_out_name`
-            #  we just created. But we can not add this to the mapping. Because it is the best,
-            #  as in the least worst thing we can do, we remove it from the mapping.
-            #  I am open for different approaches.
+            # `jax_out_var` now has, in some sense, two SDFG equivalents, the input,
+            #  that was previously created by `self._create_initial_input()` and the
+            #  `sdfg_out_name` we just created. But we can not add this to the mapping.
+            #  Because it is the best, as in the least worst thing we can do, we remove
+            #  it from the mapping. I am open for different approaches.
             self._jax_name_map.pop(jax_out_var)
 
         return out_var_names
@@ -678,7 +694,8 @@ def _terminal_sdfg_state(self) -> dace.SDFGState:
 
 
 class TranslationContext:
-    """Translation context used by the `JaxprTranslationBuilder`.
+    """
+    Translation context used by the `JaxprTranslationBuilder`.
 
     Internal representation of the builder of an SDFG under construction together
     with the needed metadata. Essentially it is an extended version of the
@@ -696,10 +713,11 @@ class TranslationContext:
         terminal_state: The (currently) last state in the state machine.
 
     Args:
-        name: The name of the SDFG, will be forwarded to the encapsulated `TranslatedJaxprSDFG`.
+        name: The name of the SDFG.
 
     Note:
-        Access of any attribute of this class by an outside user is considered undefined behaviour.
+        Access of any attribute of this class by an outside user is considered
+        undefined behaviour.
     """
 
     sdfg: dace.SDFG
@@ -719,10 +737,11 @@ def __init__(self, name: str | None = None) -> None:
         self.terminal_state = self.start_state
 
     def validate(self) -> bool:
-        """Validate internal state of `self`.
+        """
+        Validate internal state of `self`.
 
-        Since the SDFG is under construction it will not be validated, instead the meta data
-        will be validated.
+        Since the SDFG is under construction it will not be validated, instead the
+        meta data will be validated.
         """
         if self.start_state is not self.sdfg.start_block:
             raise dace.sdfg.InvalidSDFGError(
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index 1e3f69f..ec445e9 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -5,7 +5,8 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""This module contains all functions that are related to post processing the SDFG.
+"""
+This module contains all functions that are related to post processing the SDFG.
 
 Most of them operate on `TranslatedJaxprSDFG` objects.
 Currently they mostly exist for the sake of existing.
@@ -29,13 +30,14 @@ def postprocess_jaxpr_sdfg(
     call_args: Sequence[Any],  # noqa: ARG001  # Currently unused
     intree: None,  # noqa: ARG001  # Currently unused
 ) -> translator.TranslatedJaxprSDFG:
-    """Perform the final post processing steps on the `TranslationContext` _in place_.
+    """
+    Perform the final post processing steps on the `TranslationContext` _in place_.
 
     The function will perform post processing stages on the context in place.
     However, the function will return a decoupled `TranslatedJaxprSDFG` object.
 
     Args:
-        trans_ctx: The `TranslationContext` obtained from the `translate_jaxpr()` function.
+        trans_ctx: The `TranslationContext` obtained from a `translate_jaxpr()` call.
         fun: The original function that was translated.
         call_args: The linearized input arguments.
         intree: The pytree describing the inputs.
@@ -58,7 +60,8 @@ def postprocess_jaxpr_sdfg(
 def finalize_translation_context(
     trans_ctx: translator.TranslationContext, validate: bool = True
 ) -> translator.TranslatedJaxprSDFG:
-    """Finalizes the supplied translation context `trans_ctx`.
+    """
+    Finalizes the supplied translation context `trans_ctx`.
 
     The function will process the SDFG that is encapsulated inside the context,
     i.e. a canonical one, into a proper SDFG, as it is described in
@@ -94,8 +97,9 @@ def finalize_translation_context(
         tsdfg.sdfg.arrays[glob_name].transient = False
         sdfg_arg_names.append(glob_name)
 
-    # This forces the signature of the SDFG to include all arguments in order they appear.
-    #  If an argument is used as input and output then it is only listed as input.
+    # This forces the signature of the SDFG to include all arguments in order they
+    #  appear. If an argument is used as input and output then it is only listed as
+    #  input.
     tsdfg.sdfg.arg_names = sdfg_arg_names
 
     if validate:
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index 842d6d6..dc3bd74 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -4,7 +4,8 @@
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
-"""Interface for all primitive translators and managing of the global translator registry.
+"""
+Interface for all primitive translators and managing of the global translator registry.
 
 Todo:
     Implement proper context manager for working with the registry.
@@ -30,10 +31,7 @@
 
 
 class PrimitiveTranslatorCallable(Protocol):
-    """Callable version of the primitive translators.
-
-    Used for type annotation purposes, the proper public interface is `PrimitiveTranslator`.
-    """
+    """Callable version of the primitive translators."""
 
     @abc.abstractmethod
     def __call__(
@@ -44,7 +42,8 @@ def __call__(
         eqn: jax_core.JaxprEqn,
         eqn_state: dace.SDFGState,
     ) -> dace.SDFGState | None:
-        """Translates the Jax primitive into its SDFG equivalent.
+        """
+        Translates the Jax primitive into its SDFG equivalent.
 
         Before the builder calls this function it will perform the following
         preparatory tasks:
@@ -92,7 +91,8 @@ def __call__(
 
 @runtime_checkable
 class PrimitiveTranslator(PrimitiveTranslatorCallable, Protocol):
-    """Interface for all Jax primitive translators.
+    """
+    Interface for all Jax primitive translators.
 
     A translator for a primitive translates a single equation of a Jaxpr into
     its SDFG equivalent. For satisfying this interface a concrete implementation
@@ -133,7 +133,8 @@ def make_primitive_translator(
     Callable[[translator.PrimitiveTranslatorCallable], translator.PrimitiveTranslator]
     | translator.PrimitiveTranslator
 ):
-    """Turn `primitive_translator` into a `PrimitiveTranslator` for primitive `primitive`.
+    """
+    Turn `primitive_translator` into a `PrimitiveTranslator` for primitive `primitive`.
 
     Essentially, this function adds the `primitive` property to a callable, such
     that it satisfy the `PrimitiveTranslator` protocol. However, it does not add
@@ -175,7 +176,8 @@ def register_primitive_translator(
     translator.PrimitiveTranslator
     | Callable[[translator.PrimitiveTranslator], translator.PrimitiveTranslator]
 ):
-    """Adds a primitive translator to JaCe's global registry.
+    """
+    Adds a primitive translator to JaCe's global registry.
 
     The default set of primitives that are used if nothing is specified to to
     `jace.jit` are stored inside a global registry. To add a translator to this
@@ -210,7 +212,8 @@ def wrapper(
 
 
 def get_registered_primitive_translators() -> dict[str, translator.PrimitiveTranslator]:
-    """Returns a copy of the current state of JaCe's global primitive registry.
+    """
+    Returns a copy of the current state of JaCe's global primitive registry.
 
     The state returned by this function is compatible to what `jace.jit`'s
     `primitive_translators` argument expects. It is important the the returned
diff --git a/src/jace/translator/primitive_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
index 079139d..d865ee8 100644
--- a/src/jace/translator/primitive_translators/alu_translator.py
+++ b/src/jace/translator/primitive_translators/alu_translator.py
@@ -6,6 +6,7 @@
 # SPDX-License-Identifier: BSD-3-Clause
 
 """This module contains the `ALUTranslator` which translates all arithmetic and logic primitives."""
+# ruff: noqa: W505 PLR0912 C901 PLR0914 PLR0915 D417
 
 from __future__ import annotations
 
@@ -24,7 +25,8 @@
 
 
 class ALUTranslator(translator.PrimitiveTranslator):
-    """This translator handles all arithmetic and logical operations.
+    """
+    This translator handles all arithmetic and logical operations.
 
     This translator will be reworked soon, it just exists that the initial PR can do anything at all!!
     """
@@ -48,7 +50,8 @@ def __call__(
         eqn: jax_core.JaxprEqn,
         eqn_state: dace.SDFGState,
     ) -> None:
-        """Perform the translation.
+        """
+        Perform the translation.
 
         Deepening on the shapes of the input the function will either create a Tasklet or a mapped Tasklet.
         The translator is able to handle broadcasting with NumPy rules.
@@ -194,14 +197,14 @@ def __call__(
     def _write_tasklet_code(
         self, in_var_names: Sequence[str | None], eqn: jax_core.JaxprEqn
     ) -> str:
-        """This function generates the Tasklet code based on a primitive.
+        """
+        This function generates the Tasklet code based on a primitive.
 
         The function will also perform literal substitution and parameter handling.
 
         Args:
             in_var_names:   The list of SDFG variables used as input.
         """
-
         t_code = self._prim_tmpl
 
         # Now we handle Literal substitution
@@ -228,7 +231,8 @@ def _write_tasklet_code(
 
 
 def _list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
-    """This method turns a `list` of pairs into a `dict` and applies a `None` filter.
+    """
+    This method turns a `list` of pairs into a `dict` and applies a `None` filter.
 
     The function will only include pairs whose key, i.e. first element is not `None`.
     """
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
index 811cce9..afa91ff 100644
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ b/src/jace/translator/translated_jaxpr_sdfg.py
@@ -5,6 +5,8 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
+"""Container for storing a translated SDFG."""
+
 from __future__ import annotations
 
 import dataclasses
@@ -14,7 +16,8 @@
 
 @dataclasses.dataclass(kw_only=True, frozen=True)
 class TranslatedJaxprSDFG:
-    """Encapsulates the translated SDFG together with the metadata that is needed to run it.
+    """
+    Encapsulates a translated SDFG with additional the metadata.
 
     Contrary to the SDFG that is encapsulated inside the `TranslationContext`
     object, `self` carries a proper SDFG, however:
@@ -23,8 +26,8 @@ class TranslatedJaxprSDFG:
     - All input arguments are passed through arguments mentioned in `inp_names`,
         while the outputs are passed through `out_names`.
     - Only variables listed as in/outputs are non transient.
-    - The order inside `inp_names` and `out_names` is the same as in the translated Jaxpr.
-    - If inputs are also used as outputs they appear in both `inp_names` and `out_names`.
+    - The order inside `inp_names` and `out_names` is the same as in the original Jaxpr.
+    - If an input is used as outputs it appears in both `inp_names` and `out_names`.
     - Its `arg_names` is set to  `inp_names + out_names`, but arguments that are
         input and outputs are only listed as inputs.
 
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index 63029c7..ab73e4e 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -34,7 +34,6 @@
     "VALID_SDFG_OBJ_NAME",
     "VALID_SDFG_VAR_NAME",
     "JaCeVar",
-    "dataclass_with_default_init",
     "get_jax_var_dtype",
     "get_jax_var_name",
     "get_jax_var_shape",
diff --git a/src/jace/util/dace_helper.py b/src/jace/util/dace_helper.py
index 5ce559b..1828fac 100644
--- a/src/jace/util/dace_helper.py
+++ b/src/jace/util/dace_helper.py
@@ -27,13 +27,12 @@
     from collections.abc import Mapping, Sequence
 
     from jace import translator
-    from jace.util import dace_helper
 
 __all__ = ["CompiledSDFG", "compile_jax_sdfg", "run_jax_sdfg"]
 
 
-def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> dace_helper.CompiledSDFG:
-    """Compiles the SDFG embedded in `tsdfg` and return the resulting `CompiledSDFG` object."""
+def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> CompiledSDFG:
+    """Compiles the embedded SDFG and return the resulting `CompiledSDFG` object."""
     if any(  # We do not support the DaCe return mechanism
         array_name.startswith("__return")
         for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
@@ -48,15 +47,16 @@ def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> dace_helper.Compi
     org_regenerate_code = sdfg._regenerate_code
 
     try:
-        # We need to give the SDFG another name, this is needed to prevent a DaCe error/warning.
-        #  This happens if we compile the same lowered SDFG multiple times with different options.
+        # We need to give the SDFG another name, this is needed to prevent a DaCe
+        #  error/warning. This happens if we compile the same lowered SDFG multiple
+        #  times with different options.
         sdfg.name = f"{sdfg.name}__comp_{int(time.time() * 1000)}"
 
         with dace.config.temporary_config():
             sdfg._recompile = True
             sdfg._regenerate_code = True
             dace.Config.set("compiler", "use_cache", value=False)
-            csdfg: dace_helper.CompiledSDFG = sdfg.compile()
+            csdfg: CompiledSDFG = sdfg.compile()
 
     finally:
         sdfg.name = org_sdfg_name
@@ -67,13 +67,14 @@ def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> dace_helper.Compi
 
 
 def run_jax_sdfg(
-    csdfg: dace_helper.CompiledSDFG,
+    csdfg: CompiledSDFG,
     inp_names: Sequence[str],
     out_names: Sequence[str],
     call_args: Sequence[Any],
     call_kwargs: Mapping[str, Any],
 ) -> tuple[Any, ...] | Any:
-    """Run the compiled SDFG.
+    """
+    Run the compiled SDFG.
 
     The function assumes that the SDFG was finalized and then compiled by
     `compile_jax_sdfg()`. For running the SDFG you also have to pass the input
@@ -112,8 +113,9 @@ def run_jax_sdfg(
     sdfg_call_args: dict[str, Any] = {}
     for in_name, in_val in zip(inp_names, call_args, strict=True):
         if util.is_scalar(in_val):
-            # Currently the translator makes scalar into arrays, this has to be reflected here
-            in_val = np.array([in_val])
+            # Currently the translator makes scalar into arrays, this has to be
+            #  reflected here
+            in_val = np.array([in_val])  # noqa: PLW2901  # Loop variable is intentionally modified.
         sdfg_call_args[in_name] = in_val
 
     for out_name, sdfg_array in ((out_name, sdfg.arrays[out_name]) for out_name in out_names):
diff --git a/src/jace/util/definitions.py b/src/jace/util/definitions.py
index d593c70..13daf7a 100644
--- a/src/jace/util/definitions.py
+++ b/src/jace/util/definitions.py
@@ -5,6 +5,8 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
+"""Definitions of patterns for valid names."""
+
 from __future__ import annotations
 
 import re
@@ -21,8 +23,8 @@
 # fmt: off
 #: This is a set of all names that are invalid SDFG names.
 FORBIDDEN_SDFG_VAR_NAMES: Final[set[str]] = {
-    # These should be most of the C++ keywords, it is more important to have the short ones.
-    #  Taken from 'https://learn.microsoft.com/en-us/cpp/cpp/keywords-cpp?view=msvc-170'
+    # These should be most of the C++ keywords, it is more important to have the short
+    #  ones. Taken from 'https://learn.microsoft.com/en-us/cpp/cpp/keywords-cpp?view=msvc-170'
     "alignas", "alignof", "and", "asm", "auto", "bitand", "bitor", "bool", "break", "case",
     "catch", "char", "class", "compl", "concept", "const", "consteval", "constexpr",
     "constinit", "continue", "decltype", "default", "delete", "directive", "do", "double",
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index a4cd8fa..175671f 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -5,7 +5,8 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements all utility functions that are related to Jax.
+"""
+Implements all utility functions that are related to Jax.
 
 Most of the functions defined here allow an unified access to Jax' internal in
 a consistent and stable way.
@@ -21,7 +22,7 @@
 import jax.core as jax_core
 import numpy as np
 
-import jace.util as util
+from jace import util
 
 
 if TYPE_CHECKING:
@@ -30,7 +31,8 @@
 
 @dataclasses.dataclass(repr=True, frozen=True, eq=False)
 class JaCeVar:
-    """Replacement for the `jax.Var` class.
+    """
+    Replacement for the `jax.Var` class.
 
     This class can be seen as some kind of substitute `jax.core.Var`. The main
     intention of this class is as an internal representation of values, as they
@@ -103,8 +105,7 @@ def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symb
     """Returns the shape of `jax_var`."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
-            # AbstractValue, does not have a `shape` attribute, but in all cases we care, it will.
-            assert hasattr(jax_var.aval, "shape")
+            assert hasattr(jax_var.aval, "shape")  # To silences mypy.
             return jax_var.aval.shape
         case JaCeVar():
             return jax_var.shape
@@ -116,8 +117,7 @@ def get_jax_var_dtype(jax_var: jax_core.Atom | JaCeVar) -> dace.typeclass:
     """Returns the DaCe equivalent of `jax_var`s datatype."""
     match jax_var:
         case jax_core.Var() | jax_core.Literal():
-            # AbstractValue, does not have a `dtype` attribute, but in all cases we care, it will.
-            assert hasattr(jax_var.aval, "dtype")
+            assert hasattr(jax_var.aval, "dtype")  # To silences mypy.
             return translate_dtype(jax_var.aval.dtype)
         case JaCeVar():
             return jax_var.dtype
@@ -126,7 +126,8 @@ def get_jax_var_dtype(jax_var: jax_core.Atom | JaCeVar) -> dace.typeclass:
 
 
 def is_tracing_ongoing(*args: Any, **kwargs: Any) -> bool:
-    """Test if tracing is ongoing.
+    """
+    Test if tracing is ongoing.
 
     While a return value `True` guarantees that a translation is ongoing, a
     value of `False` does not guarantees that no tracing is ongoing.
@@ -154,7 +155,8 @@ def propose_jax_name(
     jax_var: jax_core.Atom | JaCeVar,
     jax_name_map: Mapping[jax_core.Var | JaCeVar, str] | None = None,
 ) -> str:
-    """Proposes a variable name for `jax_var`.
+    """
+    Proposes a variable name for `jax_var`.
 
     If `jax_name_map` is `None` the function will fallback to
     `get_jax_var_name(jax_var)`. If `jax_name_map` is supplied the function
@@ -183,15 +185,15 @@ def propose_jax_name(
     if isinstance(jax_var, JaCeVar) and (jax_var.name is not None):
         return jax_var.name
 
-    # This code is taken from Jax so it will generate similar ways, the difference is that
-    #  we do the counting differently.
+    # This code is taken from Jax so it will generate similar ways, the difference is
+    #  that we do the counting differently.
     #  Note that `z` is followed by `ba` and not `aa` as it is in Excel.
     c = len(jax_name_map)
     jax_name = ""
     while len(jax_name) == 0 or c != 0:
         c, i = c // 26, c % 26
         jax_name = chr(97 + i) + jax_name
-    jax_name = jax_name + getattr(jax_var, "suffix", "")
+    jax_name += getattr(jax_var, "suffix", "")
 
     if jax_name in util.FORBIDDEN_SDFG_VAR_NAMES:
         jax_name = f"__jace_forbidden_{jax_name}"
@@ -199,12 +201,13 @@ def propose_jax_name(
 
 
 def get_jax_literal_value(lit: jax_core.Atom) -> bool | float | int | np.generic:
-    """Returns the value a literal is wrapping.
+    """
+    Returns the value a literal is wrapping.
 
     The function guarantees to return a scalar value.
     """
     if not isinstance(lit, jax_core.Literal):
-        raise ValueError(f"Can only extract literals not '{type(lit)}'.")
+        raise TypeError(f"Can only extract literals not '{type(lit)}'.")
     val = lit.val
     if isinstance(val, np.ndarray):
         assert val.shape == ()
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index ef918c3..a8e6bc8 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -16,12 +16,11 @@
 import numpy as np
 from jax import core as jax_core
 
-import jace.util as util
+from jace import util
 
 
 def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.DropVar]:
-    """Tests if `jax_var` is a drop variable, i.e. a variable that is not read from in a Jaxpr."""
-
+    """Tests if `jax_var` is a drop variable."""
     if isinstance(jax_var, jax_core.DropVar):
         return True
     if isinstance(jax_var, util.JaCeVar):
@@ -30,7 +29,8 @@ def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.Dro
 
 
 def is_jax_array(obj: Any) -> TypeGuard[jax.Array]:
-    """Tests if `obj` is a Jax array.
+    """
+    Tests if `obj` is a Jax array.
 
     Note:
      Jax arrays are special as they can not be mutated. Furthermore, they always
@@ -75,7 +75,8 @@ def is_scalar(obj: Any) -> bool:
 
 
 def is_on_device(obj: Any) -> bool:
-    """Tests if `obj` is on a device.
+    """
+    Tests if `obj` is on a device.
 
     Jax arrays are always on the CPU and GPU (if there is one). Thus for Jax
     arrays this function is more of a test, if there is a GPU at all.
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 2320d46..f6366bd 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -5,7 +5,8 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""This module contains the functionality related to the compilation cache of the stages.
+"""
+This module contains the functionality related to the compilation cache of the stages.
 
 The cache currently caches the lowering, i.e. the result of `JaCeWrapped.lower()`
 and the compilation, i.e. `JaCeLowered.compile()`. The caches are on a per stage
@@ -43,7 +44,8 @@
 
 
 class CachingStage(Generic[NextStage]):
-    """Annotates a stage whose transition to the next stage is cacheable.
+    """
+    Annotates a stage whose transition to the next stage is cacheable.
 
     To make the transition of a stage cacheable, the stage must be derived from
     this class, and its initialization must call `CachingStage.__init__()`.
@@ -83,7 +85,8 @@ def _make_call_description(
 def cached_transition(
     transition: Callable[Concatenate[CachingStageType, P], NextStage],
 ) -> Callable[Concatenate[CachingStage[NextStage], P], NextStage]:
-    """Decorator for making the transition function of the stage cacheable.
+    """
+    Decorator for making the transition function of the stage cacheable.
 
     In order to work, the stage must be derived from `CachingStage`. For computing
     the key of a call the function will use the `_make_call_description()`
@@ -121,7 +124,8 @@ def get_cache(stage: CachingStage) -> StageCache:
 
 @dataclasses.dataclass(frozen=True)
 class _AbstractCallArgument:
-    """Class to represent a single argument to the transition function in an abstract way.
+    """
+    Class to represent a single argument to the transition function in an abstract way.
 
     As noted in `StageTransformationSpec` there are two ways to describe an
     argument, either by using its concrete value or an abstract description,
@@ -187,7 +191,8 @@ def from_value(cls, value: Any) -> _AbstractCallArgument:
 
 @dataclasses.dataclass(frozen=True)
 class StageTransformationSpec:
-    """Represents the entire call to a state transformation function of a stage.
+    """
+    Represents the entire call to a state transformation function of a stage.
 
     State transition functions are annotated with `@cached_transition` and their
     result may be cached. They key to locate them inside the cache is represented
@@ -215,7 +220,8 @@ class StageTransformationSpec:
 
 
 class StageCache(Generic[StageType]):
-    """Simple LRU cache to cache the results of the stage transition function.
+    """
+    Simple LRU cache to cache the results of the stage transition function.
 
     Args:
         size: The size of the cache, defaults to 256.
@@ -248,7 +254,8 @@ def __setitem__(self, key: StageTransformationSpec, res: StageType) -> None:
             self._memory[key] = res
 
     def popitem(self, key: StageTransformationSpec | None) -> None:
-        """Evict `key` from `self`.
+        """
+        Evict `key` from `self`.
 
         If `key` is `None` the oldest entry is evicted.
         """
@@ -260,8 +267,8 @@ def popitem(self, key: StageTransformationSpec | None) -> None:
             self._memory.move_to_end(key, last=False)
             self._memory.popitem(last=False)
 
-    def clear(self) -> None:
+    def clear(self) -> None:  # noqa: D102  # Missing description.
         self._memory.clear()
 
     def __repr__(self) -> str:
-        return f"StageCache({len(self._memory)} / {self._size} || {', '.join( '[' + repr(k) + ']' for k in self._memory)})"
+        return f"StageCache({len(self._memory)} / {self._size} || {', '.join('[' + repr(k) + ']' for k in self._memory)})"
diff --git a/tests/test_caching.py b/tests/test_caching.py
index 38b6f72..bc0e44c 100644
--- a/tests/test_caching.py
+++ b/tests/test_caching.py
@@ -26,9 +26,6 @@ def _clear_translation_cache():
     """Decorator that clears the translation cache.
 
     Ensures that a function finds an empty cache and clears up afterwards.
-
-    Todo:
-        Ask Enrique how I can make that fixture apply everywhere not just in the file but the whole test suite.
     """
     tcache.clear_translation_cache()
     yield
@@ -55,7 +52,7 @@ def wrapped(A, B):
     A = np.arange(12, dtype=np.float64).reshape((4, 3))
     B = np.full((4, 3), 10, dtype=np.float64)
 
-    # The second batch of argument, it is the same size (structurally) but different values.
+    # The second batch of argument, same structure but different values.
     AA = A + 1.0362
     BB = B + 0.638956
 
@@ -164,7 +161,7 @@ def wrapped(A, B):
 
 
 def test_caching_compilation() -> None:
-    """Tests the compilation cache, this is just very simple, since it uses the same code paths as lowering."""
+    """Tests the compilation cache, this is just very simple."""
 
     @jace.jit
     def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
@@ -192,8 +189,8 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     # Now we disable all optimizations
     unoptiCompiled = jaceLowered.compile(optimization.NO_OPTIMIZATIONS)
 
-    # Because of the way how things work the optimized must have more than the unoptimized.
-    #  If there is sharing, then this would not be the case.
+    # Because of the way how things work the optimized must have more than the
+    #  unoptimized. If there is sharing, then this would not be the case.
     assert unoptiCompiled is not optiCompiled
     assert optiCompiled._csdfg.sdfg.number_of_nodes() == 1
     assert optiCompiled._csdfg.sdfg.number_of_nodes() < unoptiCompiled._csdfg.sdfg.number_of_nodes()
diff --git a/tests/test_decorator.py b/tests/test_decorator.py
index 812ba60..7971b29 100644
--- a/tests/test_decorator.py
+++ b/tests/test_decorator.py
@@ -16,6 +16,7 @@
 import pytest
 
 import jace
+from jace.util import translation_cache as tcache
 
 
 @pytest.fixture(autouse=True)
@@ -27,7 +28,6 @@ def _clear_translation_cache():
     Todo:
         Should be used _everywhere_.
     """
-    from jace.util import translation_cache as tcache
 
     tcache.clear_translation_cache()
     yield
diff --git a/tests/test_jax_api.py b/tests/test_jax_api.py
index 80eff4a..0c1905d 100644
--- a/tests/test_jax_api.py
+++ b/tests/test_jax_api.py
@@ -174,11 +174,10 @@ def df(x):
 
 @pytest.mark.skip(reason="Running JaCe with disabled 'x64' support does not work.")
 def test_disabled_x64():
-    """Tests the behaviour of the tool chain if we explicitly disable x64 support in Jax.
+    """Tests the behaviour of the tool chain if x64 is disabled.
 
     If you want to test, if this restriction still applies, you can enable the test.
     """
-    from jax.experimental import disable_x64
 
     def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
         return A + B
@@ -187,7 +186,7 @@ def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
     B = np.float64(10.0)
 
     # Run them with disabled x64 support
-    with disable_x64():
+    with jax.experimental.disable_x64():
         # JaCe
         jace_testee = jace.jit(testee)
         jace_lowered = jace_testee.lower(A, B)
diff --git a/tests/test_jaxpr_translator_builder.py b/tests/test_jaxpr_translator_builder.py
index a2337f6..efc6657 100644
--- a/tests/test_jaxpr_translator_builder.py
+++ b/tests/test_jaxpr_translator_builder.py
@@ -12,9 +12,11 @@
 import re
 
 import dace
+import jax
 import numpy as np
 import pytest
 from dace.data import Array
+from jax import core as jax_core
 
 import jace
 from jace import translator, util
@@ -93,7 +95,8 @@ def test_builder_variable_alloc_mixed_naming(
 ) -> None:
     """Tests the naming in a mixed setting.
 
-    If `update_var_mapping=True` is given, then the naming will skip variables, see also `test_builder_variable_alloc_mixed_naming2()`.
+    If `update_var_mapping=True` is given, then the naming will skip variables,
+    see also `test_builder_variable_alloc_mixed_naming2()`.
     """
     #                        *       b       c       d      *      f      g
     for i, var in enumerate([narray, array1, array2, scal1, nscal, scal2, scal3]):
@@ -113,8 +116,9 @@ def test_builder_variable_alloc_mixed_naming2(
 ) -> None:
     """Tests the naming in a mixed setting.
 
-    This time we do not use `update_var_mapping=True`, instead it now depends on the name.
-    This means that automatic naming will now again include all, letters, but not in a linear order.
+    This time we do not use `update_var_mapping=True`, instead it now depends on the
+    name. This means that automatic naming will now again include all, letters, but not
+    in a linear order.
     """
     letoff = 0
     #             *      a        b       c      *      d     e
@@ -198,7 +202,7 @@ def test_builder_nested(translation_builder: translator.JaxprTranslationBuilder)
     assert translation_builder.sdfg.number_of_nodes() == 2
     assert translation_builder.sdfg.number_of_edges() == 1
 
-    # Now we go one subcontext deeper; note we do this manually which should not be done.
+    # Now we go one subcontext deeper
     translation_builder._allocate_translation_ctx("builder")
     assert len(translation_builder._ctx_stack) == 2
     assert translation_builder.sdfg.name == "builder"
@@ -240,7 +244,8 @@ def test_builder_nested(translation_builder: translator.JaxprTranslationBuilder)
     assert translation_builder.sdfg.number_of_edges() == 1
 
     # Again the variable that was declared in the last stack is now no longer present.
-    #  Note if the nested SDFG was integrated into the parent SDFG it would be accessible
+    #  Note if the nested SDFG was integrated into the parent SDFG it would be
+    #  accessible
     with pytest.raises(
         expected_exception=KeyError,
         match=re.escape(
@@ -270,7 +275,8 @@ def test_builder_append_state(translation_builder: translator.JaxprTranslationBu
     assert next(iter(sdfg.edges())).src is sdfg.start_block
     assert next(iter(sdfg.edges())).dst is terminal_state_1
 
-    # Specifying an explicit append state that is the terminal should also update the terminal state of the builder.
+    # Specifying an explicit append state that is the terminal should also update the
+    #  terminal state of the builder.
     terminal_state_2: dace.SDFGState = translation_builder.append_new_state(
         "terminal_state_2", prev_state=terminal_state_1
     )
@@ -295,7 +301,7 @@ def test_builder_append_state(translation_builder: translator.JaxprTranslationBu
 def test_builder_variable_multiple_variables(
     translation_builder: translator.JaxprTranslationBuilder,
 ) -> None:
-    """A simple test in which we try to add a variable that are known, but with a different name."""
+    """Add an already known variable, but with a different name."""
     # Now we will add `array1` and then different ways of updating it.
     narray1: str = translation_builder.add_array(array1, update_var_mapping=True)
 
@@ -371,7 +377,6 @@ def test_builder_variable_alloc_list_cleaning(
     ):
         _ = translation_builder.create_jax_var_list(var_list)
 
-    # This currently fails, because the `create_jax_var_list()` function does not clean up.
     assert len(translation_builder.arrays) == 0
 
 
@@ -429,13 +434,10 @@ def test_builder_variable_alloc_list_handle_literal(
 
     It will test the `handle_literals` flag.
     """
-    # First we have to build a jax literal.
-    import numpy as np
-    from jax import core as jcore
 
     val = np.array(1)
-    aval = jcore.get_aval(val)
-    lit = jcore.Literal(val, aval)
+    aval = jax_core.get_aval(val)
+    lit = jax_core.Literal(val, aval)
     var_list = [lit]
 
     with pytest.raises(
@@ -455,8 +457,6 @@ def test_builder_constants(translation_builder: translator.JaxprTranslationBuild
 
     See also the `test_subtranslators_alu.py::test_add3` test.
     """
-    import jax
-
     # Create the Jaxpr that we need.
     constant = [[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]]
     jaxpr = jax.make_jaxpr(lambda A: A + jax.numpy.array(constant))(1.0)
diff --git a/tests/test_misc.py b/tests/test_misc.py
index 8870674..80abefd 100644
--- a/tests/test_misc.py
+++ b/tests/test_misc.py
@@ -19,9 +19,9 @@
 def test_mismatch_in_datatyte_calling():
     """Tests compilation and calling with different types.
 
-    Note that this more or less tests the calling implementation of the `CompiledSDFG` class in DaCe.
-    As I understand the `CompiledSDFG::_construct_args()` function this should be detected.
-    However, as evidently it does not do this.
+    Note that this more or less tests the calling implementation of the `CompiledSDFG`
+    class in DaCe. As I understand the `CompiledSDFG::_construct_args()` function this
+    should be detected. However, as evidently it does not do this.
     """
 
     @jace.jit
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index e94408e..56b30fb 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -103,7 +103,7 @@ def test_subtranslatior_managing():
 
 
 def test_subtranslatior_managing_isolation():
-    """Tests if `get_registered_primitive_translators()` protects the internal registry."""
+    """Tests if `get_registered_primitive_translators()` decouples."""
     assert (
         get_registered_primitive_translators()
         is not translator.primitive_translator._PRIMITIVE_TRANSLATORS_REGISTRY
@@ -169,7 +169,6 @@ def test_subtranslatior_managing_overwriting_2():
     @make_primitive_translator("add")
     def still_useless_but_a_bit_less(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
         trans_cnt[0] += 1
-        return
 
     @jace.jit
     def foo(A):

From d1231665c120474f088d3633ac6e88b1eabe8bde Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 12 Jun 2024 16:07:19 +0200
Subject: [PATCH 359/458] Final cleanups and fixes

---
 .pre-commit-config.yaml   |  5 +++--
 noxfile.py                | 11 +++++------
 pyproject.toml            |  8 +++++++-
 requirements/base.in      |  2 +-
 requirements/base.txt     |  4 ++--
 requirements/cuda12.in    |  2 +-
 requirements/cuda12.txt   | 10 ++++------
 requirements/sync_tool.py | 25 +++++++++++++++----------
 8 files changed, 38 insertions(+), 29 deletions(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 59057f5..255e6ed 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -69,9 +69,10 @@ repos:
     args: [--no-install-types]
     additional_dependencies:
     - dace==0.15.1
-    - jax[cpu]==0.4.28
+    - jax[cpu]==0.4.29
     - numpy==1.26.4
-    - pytest==8.2.1
+    - pytest==8.2.2
+    - typing-extensions==4.12.2
 - repo: https://github.com/codespell-project/codespell
   rev: v2.3.0
   hooks:
diff --git a/noxfile.py b/noxfile.py
index 9aba077..4b9ba40 100644
--- a/noxfile.py
+++ b/noxfile.py
@@ -1,3 +1,5 @@
+"""Nox session definitions."""
+
 from __future__ import annotations
 
 import argparse
@@ -24,7 +26,7 @@ def lint(session: nox.Session) -> None:
 @nox.session
 def tests(session: nox.Session) -> None:
     """Run the unit and regular tests."""
-    session.install(".[test]")
+    session.install("-e", ".", "-r", "requirements/dev.txt")
     session.run("pytest", *session.posargs)
 
 
@@ -40,8 +42,7 @@ def docs(session: nox.Session) -> None:
         session.error("Must not specify non-HTML builder with --serve")
 
     extra_installs = ["sphinx-autobuild"] if args.serve else []
-
-    session.install("-e.[docs]", *extra_installs)
+    session.install("-e", ".", "-r", "requirements/dev.txt", *extra_installs)
     session.chdir("docs")
 
     if args.builder == "linkcheck":
@@ -92,9 +93,7 @@ def build(session: nox.Session) -> None:
 
 @nox.session
 def requirements(session: nox.Session) -> None:
-    """
-    Freeze dependencies from input specs and synchronize across tools.
-    """
+    """Freeze dependencies from input specs and synchronize across tools."""
     requirements_path = DIR / "requirements"
     req_sync_tool = requirements_path / "sync_tool.py"
 
diff --git a/pyproject.toml b/pyproject.toml
index 37c0d3d..73eebf9 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -211,7 +211,7 @@ tests = [
 max-complexity = 12
 
 [tool.ruff.lint.per-file-ignores]
-"!tests/**.py" = ["PT"]  # Ignore flake8-pytest-style outside 'tests/'
+"!tests/**" = ["PT"]  # Ignore flake8-pytest-style outside 'tests/'
 "docs/**" = [
   "D",  # pydocstyle
   "T10",  # flake8-debugger
@@ -219,6 +219,12 @@ max-complexity = 12
 ]
 "noxfile.py" = [
   "D",  # pydocstyle
+  "T10",  # flake8-debugger
+  "T20",  # flake8-print
+]
+"requirements/**" = [
+  "D",  # pydocstyle
+  "T10",  # flake8-debugger
   "T20",  # flake8-print
 ]
 "tests/**" = [
diff --git a/requirements/base.in b/requirements/base.in
index b25ef34..c077dae 100644
--- a/requirements/base.in
+++ b/requirements/base.in
@@ -1,3 +1,3 @@
 dace>=0.15
 jax[cpu]>=0.4.24
-numpy>=1.26.0
\ No newline at end of file
+numpy>=1.26.0
diff --git a/requirements/base.txt b/requirements/base.txt
index d388c2f..1aae055 100644
--- a/requirements/base.txt
+++ b/requirements/base.txt
@@ -29,9 +29,9 @@ idna==3.7
     # via requests
 itsdangerous==2.2.0
     # via flask
-jax[cpu]==0.4.28
+jax[cpu]==0.4.29
     # via -r requirements/base.in
-jaxlib==0.4.28
+jaxlib==0.4.29
     # via jax
 jinja2==3.1.4
     # via flask
diff --git a/requirements/cuda12.in b/requirements/cuda12.in
index 5c9b956..d603a3b 100644
--- a/requirements/cuda12.in
+++ b/requirements/cuda12.in
@@ -1,4 +1,4 @@
 -r base.in
 cupy-cuda12x>=12.1.0
 jax[cuda12]>=0.4.24
-optuna>=3.4.0
\ No newline at end of file
+optuna>=3.4.0
diff --git a/requirements/cuda12.txt b/requirements/cuda12.txt
index 098643e..078edf2 100644
--- a/requirements/cuda12.txt
+++ b/requirements/cuda12.txt
@@ -16,13 +16,13 @@ fastrlock==0.8.2
     # via cupy-cuda12x
 greenlet==3.0.3
     # via sqlalchemy
-jax[cpu,cuda12]==0.4.28
+jax[cpu,cuda12]==0.4.29
     # via
     #   -r requirements/base.in
     #   -r requirements/cuda12.in
-jax-cuda12-pjrt==0.4.28
+jax-cuda12-pjrt==0.4.29
     # via jax-cuda12-plugin
-jax-cuda12-plugin==0.4.28
+jax-cuda12-plugin==0.4.29
     # via jax
 mako==1.3.5
     # via alembic
@@ -35,11 +35,9 @@ nvidia-cuda-cupti-cu12==12.5.39
     # via jax
 nvidia-cuda-nvcc-cu12==12.5.40
     # via jax
-nvidia-cuda-nvrtc-cu12==12.5.40
-    # via nvidia-cudnn-cu12
 nvidia-cuda-runtime-cu12==12.5.39
     # via jax
-nvidia-cudnn-cu12==8.9.7.29
+nvidia-cudnn-cu12==9.1.1.17
     # via jax
 nvidia-cufft-cu12==11.2.3.18
     # via jax
diff --git a/requirements/sync_tool.py b/requirements/sync_tool.py
index 1eabda6..6755092 100644
--- a/requirements/sync_tool.py
+++ b/requirements/sync_tool.py
@@ -17,6 +17,8 @@
 # ]
 # ///
 
+"""Script to synchronize requirements across tools."""
+
 from __future__ import annotations
 
 import pathlib
@@ -37,6 +39,8 @@
 
 # -- Classes --
 class RequirementSpec(NamedTuple):
+    """A parsed requirement specification."""
+
     package: pkg_requirements.Requirement
     specifiers: pkg_specifiers.SpecifierSet | None = None
     marker: pkg_markers.Marker | None = None
@@ -58,6 +62,8 @@ def as_text(self) -> str:
 
 
 class Requirement(NamedTuple):
+    """An item in a list of requirements and its parsed specification."""
+
     text: str
     spec: RequirementSpec
 
@@ -85,19 +91,17 @@ class RequirementDumpSpec(NamedTuple):
 
 
 # -- Functions --
-def make_requirements_map(
-    requirements: Iterable[Requirement],
-) -> dict[str, Requirement]:
+def make_requirements_map(requirements: Iterable[Requirement]) -> dict[str, Requirement]:
     return {req.spec.package.name: req for req in requirements}
 
 
 def load_from_requirements(filename: str) -> list[Requirement]:
     requirements = []
-    with pathlib.Path(filename).open() as f:
-        for line in f:
-            if (end := line.find("#")) != -1:
-                line = line[:end]
-            line = line.strip()
+    with pathlib.Path(filename).open(encoding="locale") as f:
+        for raw_line in f:
+            if (end := raw_line.find("#")) != -1:
+                raw_line = raw_line[:end]  # noqa: PLW2901 [redefined-loop-name]
+            line = raw_line.strip()
             if line and not line.startswith("-"):
                 requirements.append(Requirement.from_text(line))
 
@@ -105,7 +109,7 @@ def load_from_requirements(filename: str) -> list[Requirement]:
 
 
 def load_from_toml(filename: str, key: str) -> list[Requirement]:
-    with pathlib.Path(filename).open() as f:
+    with pathlib.Path(filename).open(encoding="locale") as f:
         toml_data = tomlkit.loads(f.read())
 
     section = toml_data
@@ -127,12 +131,13 @@ def dump_to_requirements(
     header: str | None = None,
     footer: str | None = None,
 ) -> None:
-    with pathlib.Path(filename).open("w") as f:
+    with pathlib.Path(filename).open("w", encoding="locale") as f:
         if header:
             f.write(f"{header}\n")
         f.write("\n".join(dump(requirements, template=template)))
         if footer:
             f.write(f"{footer}\n")
+        f.write("\n")
 
 
 def dump_to_yaml(requirements_map: Mapping[str, DumpSpec], filename: str) -> None:

From 39dd108e36ead70348c5996abbc417b6dcd03cac Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Wed, 12 Jun 2024 16:12:25 +0200
Subject: [PATCH 360/458] Clean up sync script

---
 requirements/sync_tool.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/requirements/sync_tool.py b/requirements/sync_tool.py
index 6755092..846cb0e 100644
--- a/requirements/sync_tool.py
+++ b/requirements/sync_tool.py
@@ -75,7 +75,7 @@ def from_text(cls, req_text: str) -> Requirement:
     def from_spec(cls, req: RequirementSpec) -> Requirement:
         return Requirement(req.as_text(), req)
 
-    def dump(self, *, template: str | None = None) -> str:
+    def as_text(self, *, template: str | None = None) -> str:
         template = template or "{req.text}"
         return template.format(req=self)
 
@@ -120,7 +120,7 @@ def load_from_toml(filename: str, key: str) -> list[Requirement]:
 
 
 def dump(requirements: Iterable[Requirement], *, template: str | None = None) -> None:
-    return [req.dump(template=template) for req in requirements]
+    return [req.as_text(template=template) for req in requirements]
 
 
 def dump_to_requirements(
@@ -154,7 +154,7 @@ def dump_to_yaml(requirements_map: Mapping[str, DumpSpec], filename: str) -> Non
             case str():
                 processor.set_value(yamlpath.YAMLPath(key_path), value)
             case Requirement():
-                processor.set_value(yamlpath.YAMLPath(key_path), value.dump(template=template))
+                processor.set_value(yamlpath.YAMLPath(key_path), value.as_text(template=template))
             case Iterable():
                 for _ in processor.delete_nodes(yamlpath.YAMLPath(key_path)):
                     pass

From c1074c4e7642736b8b41513b15ef9b3d2afec823 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 13 Jun 2024 07:41:00 +0200
Subject: [PATCH 361/458] Fixed an issue with the optimization options.

The function to finalize the options, i.e. get the ones that should be used is now a free function.
---
 src/jace/stages.py | 118 +++++++++++++++++++++++++--------------------
 1 file changed, 67 insertions(+), 51 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index 7a21f31..6c3be8a 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -50,17 +50,11 @@
     "JaCeLowered",
     "JaCeWrapped",
     "Stage",
+    "finalize_compilation_options",
+    "get_active_compiler_options",
+    "update_active_compiler_options",
 ]
 
-_JACELOWERED_ACTIVE_COMPILE_OPTIONS: CompilerOptions = optimization.DEFAULT_OPTIMIZATIONS.copy()
-"""Global set of currently active compilation/optimization options.
-
-These options are used by `JaCeLowered.compile()` to determine which options
-are forwarded to the underlying `jace_optimize()` function. It is initialized
-to `jace.optimization.DEFAULT_OPTIMIZATIONS` and can be managed through the
-`update_active_compiler_options()` function.
-"""
-
 #: Known compilation stages in JaCe.
 Stage = Union["JaCeWrapped", "JaCeLowered", "JaCeCompiled"]
 
@@ -230,21 +224,17 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
         """
         Optimize and compile the lowered SDFG using `compiler_options`.
 
-        Before the SDFG is compiled, it will be optimized using `jace_optimize()`.
-        There are two different sources of these options. The first one is the
-        global set of currently active compiler options. The second one is the
-        options that are passed to this function, which takes precedence. Thus,
-        the `compiler_options` argument of this function describes the difference
-        from the currently active global options.
+        To perform the optimizations `jace_optimize()` is used. The options that are
+        passed to it it are obtained by passing `compiler_options` to
+        `finalize_compilation_options()` first, see there for more information.
 
-        See Also:
-            `get_active_compiler_options()` to inspect the set of currently active
-            options and `update_active_compiler_options()` to modify them.
+        Args:
+            compiler_options: The optimization options to use.
         """
         # We **must** deepcopy before we do any optimization, because all optimizations
         #  are in place, to properly cache stages, stages needs to be immutable.
         tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
-        optimization.jace_optimize(tsdfg=tsdfg, **self._make_compiler_options(compiler_options))
+        optimization.jace_optimize(tsdfg=tsdfg, **finalize_compilation_options(compiler_options))
 
         return JaCeCompiled(
             csdfg=dace_helper.compile_jax_sdfg(tsdfg),
@@ -292,44 +282,14 @@ def _make_call_description(
         global options. Furthermore, the key will depend on the concrete values.
         """
         unflatted_args, unflatted_kwargs = jax_tree.tree_unflatten(intree, flat_call_args)
-        assert (not len(unflatted_kwargs)) and (len(unflatted_args) == 1)
+        assert (not len(unflatted_kwargs)) and (len(unflatted_args) <= 1)
 
-        options = self._make_compiler_options(unflatted_args[0])
+        options = finalize_compilation_options(unflatted_args[0] if unflatted_args else {})
         flat_options, optiontree = jax_tree.tree_flatten(options)
         return tcache.StageTransformationSpec(
             stage_id=id(self), flat_call_args=tuple(flat_options), intree=optiontree
         )
 
-    @staticmethod
-    def _make_compiler_options(compiler_options: CompilerOptions | None) -> CompilerOptions:
-        """Return the compilation options that should be used for compilation."""
-        assert isinstance(compiler_options, dict)
-        return get_active_compiler_options() | (compiler_options or {})
-
-
-def update_active_compiler_options(new_active_options: CompilerOptions) -> CompilerOptions:
-    """
-    Updates the set of active compiler options.
-
-    Merges the options passed as `new_active_options` with the currently active
-    compiler options. This set is used by `JaCeLowered.compile()` to determine
-    which options should be used.
-    The function will return the set of options that was active before the call.
-
-    To obtain the set of currently active options use `get_active_compiler_options()`.
-
-    Todo:
-        Make a proper context manager.
-    """
-    previous_active_options = _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
-    _JACELOWERED_ACTIVE_COMPILE_OPTIONS.update(new_active_options)
-    return previous_active_options
-
-
-def get_active_compiler_options() -> CompilerOptions:
-    """Returns the set of currently active compiler options."""
-    return _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
-
 
 class JaCeCompiled:
     """
@@ -391,3 +351,59 @@ def __call__(self, *args: Any, **kwargs: Any) -> Any:
             self._csdfg, self._inp_names, self._out_names, flat_in_vals
         )
         return jax_tree.tree_unflatten(self._outtree, flat_output)
+
+
+# <--------------------------- Compilation/Optimization options management
+
+_JACELOWERED_ACTIVE_COMPILE_OPTIONS: CompilerOptions = optimization.DEFAULT_OPTIMIZATIONS.copy()
+"""Global set of currently active compilation/optimization options.
+
+These options are used by `JaCeLowered.compile()` to determine which options are
+forwarded to the underlying `jace_optimize()` function. It is initialized to
+`jace.optimization.DEFAULT_OPTIMIZATIONS` and can be managed through the
+`update_active_compiler_options()` function. For obtaining the options that should
+finally be used the `finalize_compilation_options()` function can be used.
+"""
+
+
+def update_active_compiler_options(new_active_options: CompilerOptions) -> CompilerOptions:
+    """
+    Updates the set of active compiler options.
+
+    Merges the options passed as `new_active_options` with the currently active
+    compiler options. This set is used by `JaCeLowered.compile()` to determine
+    which options should be used.
+    The function will return the set of options that was active before the call.
+
+    To obtain the set of currently active options use `get_active_compiler_options()`.
+
+    Todo:
+        Make a proper context manager.
+    """
+    previous_active_options = _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
+    _JACELOWERED_ACTIVE_COMPILE_OPTIONS.update(new_active_options)
+    return previous_active_options
+
+
+def get_active_compiler_options() -> CompilerOptions:
+    """Returns the set of currently active compiler options."""
+    return _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
+
+
+def finalize_compilation_options(compiler_options: CompilerOptions | None) -> CompilerOptions:
+    """
+    Returns the final compilation options.
+
+    There are two different sources of these options. The first one is the global set
+    of currently active compiler options. The second one is the options that are passed
+    to this function, which takes precedence. Thus, the `compiler_options` argument of
+    this function describes the difference from the currently active global options.
+
+    Args:
+        compiler_options: The local compilation options.
+
+    See Also:
+        `get_active_compiler_options()` to inspect the set of currently active options
+        and `update_active_compiler_options()` to modify them.
+    """
+    return get_active_compiler_options() | (compiler_options or {})

From 9ac17bded6e770eb349d2752e789b040cde5f847 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 13 Jun 2024 08:42:04 +0200
Subject: [PATCH 362/458] Implemented a `CompiledJaxprSDFG` object.

It was annyong before, the non compiled version was nicely combined in a single container, but the compiled was not.
In addition I removed the outtree from it, this is now the job of the stage to do that.
---
 src/jace/__init__.py                          |   4 +
 src/jace/optimization.py                      |   4 +-
 src/jace/stages.py                            |  55 +++--
 src/jace/translated_jaxpr_sdfg.py             | 229 ++++++++++++++++++
 src/jace/translator/__init__.py               |   2 -
 src/jace/translator/pre_post_translation.py   |  25 +-
 src/jace/translator/translated_jaxpr_sdfg.py  |  83 -------
 src/jace/util/dace_helper.py                  | 142 -----------
 tests/integration_tests/test_empty_jaxpr.py   |   2 +-
 .../test_jaxpr_translator_builder.py          |   6 +-
 tests/unit_tests/test_jax_api.py              |   6 +-
 11 files changed, 282 insertions(+), 276 deletions(-)
 create mode 100644 src/jace/translated_jaxpr_sdfg.py
 delete mode 100644 src/jace/translator/translated_jaxpr_sdfg.py
 delete mode 100644 src/jace/util/dace_helper.py

diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 11c5d2a..91c41b3 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -13,14 +13,18 @@
 
 from .__about__ import __author__, __copyright__, __license__, __version__, __version_info__
 from .api import grad, jacfwd, jacrev, jit
+from .translated_jaxpr_sdfg import CompiledJaxprSDFG, TranslatedJaxprSDFG, compile_jaxpr_sdfg
 
 
 __all__ = [
+    "CompiledJaxprSDFG",
+    "TranslatedJaxprSDFG",
     "__author__",
     "__copyright__",
     "__license__",
     "__version__",
     "__version_info__",
+    "compile_jaxpr_sdfg",
     "grad",
     "jacfwd",
     "jacrev",
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index 261d0ab..1346186 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -15,7 +15,7 @@
 
 
 if TYPE_CHECKING:
-    from jace import translator
+    import jace
 
 
 class CompilerOptions(TypedDict, total=False):
@@ -48,7 +48,7 @@ class CompilerOptions(TypedDict, total=False):
 }
 
 
-def jace_optimize(tsdfg: translator.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOptions]) -> None:  # noqa: D417  # Missing description for kwargs
+def jace_optimize(tsdfg: jace.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOptions]) -> None:  # noqa: D417  # Missing description for kwargs
     """
     Performs optimization of the translated SDFG _in place_.
 
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 6c3be8a..a5c6049 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -33,10 +33,11 @@
 
 from jax import tree_util as jax_tree
 
+import jace
 from jace import optimization, translator, util
 from jace.optimization import CompilerOptions
 from jace.translator import pre_post_translation as ptrans
-from jace.util import dace_helper, translation_cache as tcache
+from jace.util import translation_cache as tcache
 
 
 if TYPE_CHECKING:
@@ -158,12 +159,14 @@ def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
             primitive_translators=self._primitive_translators
         )
         trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
-        tsdfg: translator.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
-            trans_ctx=trans_ctx, fun=self.wrapped_fun, call_args=flat_call_args, outtree=outtree
+        tsdfg: jace.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
+            trans_ctx=trans_ctx,
+            fun=self.wrapped_fun,
+            call_args=flat_call_args,
         )
 
         # NOTE: `tsdfg` is deepcopied as a side effect of post processing.
-        return JaCeLowered(tsdfg)
+        return JaCeLowered(tsdfg, outtree)
 
     @property
     def wrapped_fun(self) -> Callable:
@@ -205,7 +208,8 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
     how to control the process.
 
     Args:
-        tsdfg:  The lowered SDFG with metadata.
+        tsdfg: The lowered SDFG with metadata.
+        outtree: The pytree describing how to unflatten the output.
 
     Note:
         `self` will manage the passed `tsdfg` object. Modifying it results is
@@ -213,11 +217,17 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
         transformations `JaCeLowered` is not.
     """
 
-    _translated_sdfg: translator.TranslatedJaxprSDFG
+    _translated_sdfg: jace.TranslatedJaxprSDFG
+    _outtree: jax_tree.PyTreeDef
 
-    def __init__(self, tsdfg: translator.TranslatedJaxprSDFG) -> None:
+    def __init__(
+        self,
+        tsdfg: jace.TranslatedJaxprSDFG,
+        outtree: jax_tree.PyTreeDef,
+    ) -> None:
         super().__init__()
         self._translated_sdfg = tsdfg
+        self._outtree = outtree
 
     @tcache.cached_transition
     def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled:
@@ -233,17 +243,15 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
         """
         # We **must** deepcopy before we do any optimization, because all optimizations
         #  are in place, to properly cache stages, stages needs to be immutable.
-        tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
+        tsdfg: jace.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
         optimization.jace_optimize(tsdfg=tsdfg, **finalize_compilation_options(compiler_options))
 
         return JaCeCompiled(
-            csdfg=dace_helper.compile_jax_sdfg(tsdfg),
-            inp_names=tsdfg.inp_names,
-            out_names=tsdfg.out_names,
-            outtree=tsdfg.outtree,
+            csdfg=jace.compile_jaxpr_sdfg(tsdfg),
+            outtree=self._outtree,
         )
 
-    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
+    def compiler_ir(self, dialect: str | None = None) -> jace.TranslatedJaxprSDFG:
         """
         Returns the internal SDFG.
 
@@ -315,23 +323,15 @@ class JaCeCompiled:
         - Automatic strides adaption.
     """
 
-    _csdfg: dace_helper.CompiledSDFG
-    _inp_names: tuple[str, ...]
-    _out_names: tuple[str, ...]
+    _csdfg: jace.CompiledJaxprSDFG
     _outtree: jax_tree.PyTreeDef
 
     def __init__(
         self,
-        csdfg: dace_helper.CompiledSDFG,
-        inp_names: Sequence[str],
-        out_names: Sequence[str],
+        csdfg: jace.CompiledJaxprSDFG,
         outtree: jax_tree.PyTreeDef,
     ) -> None:
-        if not (out_names or inp_names):
-            raise ValueError("No input nor output.")
         self._csdfg = csdfg
-        self._inp_names = tuple(inp_names)
-        self._out_names = tuple(out_names)
         self._outtree = outtree
 
     def __call__(self, *args: Any, **kwargs: Any) -> Any:
@@ -345,11 +345,10 @@ def __call__(self, *args: Any, **kwargs: Any) -> Any:
             Furthermore, all arguments must have strides and storage locations
             that is compatible with the ones that were used for lowering.
         """
-        flat_in_vals = jax_tree.tree_leaves((args, kwargs))
-        assert len(flat_in_vals) == len(self._inp_names), "Static arguments."
-        flat_output = dace_helper.run_jax_sdfg(
-            self._csdfg, self._inp_names, self._out_names, flat_in_vals
-        )
+        flat_call_args = jax_tree.tree_leaves((args, kwargs))
+        flat_output = self._csdfg(flat_call_args)
+        if flat_output is None:
+            return None
         return jax_tree.tree_unflatten(self._outtree, flat_output)
 
 
diff --git a/src/jace/translated_jaxpr_sdfg.py b/src/jace/translated_jaxpr_sdfg.py
new file mode 100644
index 0000000..bbab2be
--- /dev/null
+++ b/src/jace/translated_jaxpr_sdfg.py
@@ -0,0 +1,229 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Extended versions of `SDFG` and `CompiledSDFG` with additional metadata."""
+
+from __future__ import annotations
+
+import dataclasses
+import os
+import pathlib
+import time
+from typing import TYPE_CHECKING, Any
+
+import dace
+from dace import data as dace_data
+
+from jace import util
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    import numpy as np
+    from dace.codegen import compiled_sdfg
+    from dace.codegen.compiled_sdfg import CompiledSDFG
+
+
+@dataclasses.dataclass(frozen=True, kw_only=True)
+class TranslatedJaxprSDFG:
+    """
+    Encapsulates a translated SDFG with additional the metadata.
+
+    Contrary to the SDFG that is encapsulated inside an `TranslationContext`
+    object, `self` carries a proper SDFG, however:
+    - It does not have `__return*` variables, instead all return arguments are
+        passed by arguments.
+    - All input arguments are passed through arguments mentioned in `inp_names`,
+        while the outputs are passed through `out_names`.
+    - Only variables listed as in/outputs are non transient.
+    - The order inside `inp_names` and `out_names` is the same as in the original Jaxpr.
+    - If an input is used as outputs it appears in both `inp_names` and `out_names`.
+    - Its `arg_names` is set to  `inp_names + out_names`, but arguments that are
+        input and outputs are only listed as inputs.
+
+    The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a
+    `TranslationContext`, that was in turn constructed by
+    `JaxprTranslationBuilder.translate_jaxpr()`, to the
+    `finalize_translation_context()` or preferably to the `postprocess_jaxpr_sdfg()`
+    function.
+
+    Attributes:
+        sdfg: The encapsulated SDFG object.
+        inp_names: SDFG variables used as inputs.
+        out_names: SDFG variables used as outputs.
+
+    Todo:
+        After the SDFG is compiled a lot of code looks strange, because there is
+        no container to store the compiled SDFG and the metadata. This class
+        should be extended to address this need.
+    """
+
+    sdfg: dace.SDFG
+    inp_names: tuple[str, ...]
+    out_names: tuple[str, ...]
+
+    def validate(self) -> bool:
+        """Validate the underlying SDFG."""
+        if any(self.sdfg.arrays[inp].transient for inp in self.inp_names):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Found transient inputs: {(inp for inp in self.inp_names if self.sdfg.arrays[inp].transient)}",
+                self.sdfg,
+                self.sdfg.node_id(self.sdfg.start_state),
+            )
+        if any(self.sdfg.arrays[out].transient for out in self.out_names):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Found transient outputs: {(out for out in self.out_names if self.sdfg.arrays[out].transient)}",
+                self.sdfg,
+                self.sdfg.node_id(self.sdfg.start_state),
+            )
+        if self.sdfg.free_symbols:  # This is a simplification that makes our life simple.
+            raise dace.sdfg.InvalidSDFGError(
+                f"Found free symbols: {self.sdfg.free_symbols}",
+                self.sdfg,
+                self.sdfg.node_id(self.sdfg.start_state),
+            )
+        self.sdfg.validate()
+        return True
+
+
+class CompiledJaxprSDFG:
+    """
+    Compiled version of a `TranslatedJaxprSDFG` instance.
+
+    Essentially this class is a wrapper around DaCe's `CompiledSDFG` object, that
+    supports the calling convention used inside JaCe, as in `DaCe` it is callable.
+    The only valid way to obtain a `CompiledJaxprSDFG` instance is through
+    `compile_jaxpr_sdfg()`.
+
+    Args:
+        csdfg: The `CompiledSDFG` object.
+        inp_names: Names of the SDFG variables used as inputs.
+        out_names: Names of the SDFG variables used as outputs.
+
+    Attributes:
+        csdfg: The `CompiledSDFG` object.
+        sdfg: The encapsulated SDFG object.
+        inp_names: Names of the SDFG variables used as inputs.
+        out_names: Names of the SDFG variables used as outputs.
+
+    Notes:
+        Currently the strides of the input arguments must match the ones that were used
+        for lowering the SDFG.
+        In DaCe the return values are allocated on a per `CompiledSDFG` basis. Thus
+        every call to a compiled SDFG will override the value of the last call, in JaCe
+        the memory is allocated on every call. In addition scalars are returned as
+        arrays of length one.
+    """
+
+    csdfg: compiled_sdfg.CompiledSDFG
+    sdfg: dace.SDFG
+    inp_names: tuple[str, ...]
+    out_names: tuple[str, ...]
+
+    def __init__(
+        self,
+        csdfg: compiled_sdfg.CompiledSDFG,
+        inp_names: tuple[str, ...],
+        out_names: tuple[str, ...],
+    ) -> None:
+        self.csdfg = csdfg
+        self.sdfg = self.csdfg.sdfg
+        self.inp_names = inp_names
+        self.out_names = out_names
+
+    def __call__(
+        self,
+        flat_call_args: Sequence[Any],
+    ) -> list[np.ndarray] | None:
+        """
+        Run the compiled SDFG using the flattened input.
+
+        The function will not perform flattening of its input nor unflattening of
+        the output.
+
+        Args:
+            csdfg: The compiled SDFG to call.
+            flat_call_args: Flattened input arguments.
+        """
+        if len(self.inp_names) != len(flat_call_args):
+            # Either error or static arguments are not removed.
+            raise RuntimeError("Wrong number of arguments.")
+
+        sdfg_call_args: dict[str, Any] = {}
+        for in_name, in_val in zip(self.inp_names, flat_call_args):
+            # TODO(phimuell): Implement a stride matching process.
+            if util.is_jax_array(in_val):
+                if not util.is_fully_addressable(in_val):
+                    raise ValueError(f"Passed a not fully addressable Jax array as '{in_name}'")
+                in_val = in_val.__array__()  # noqa: PLW2901  # Jax arrays do not expose the __array_interface__.
+            sdfg_call_args[in_name] = in_val
+
+        arrays = self.sdfg.arrays
+        for out_name, sdfg_array in ((out_name, arrays[out_name]) for out_name in self.out_names):
+            if out_name in sdfg_call_args:
+                if util.is_jax_array(sdfg_call_args[out_name]):
+                    raise ValueError("Passed an immutable Jax array as output.")
+            else:
+                sdfg_call_args[out_name] = dace_data.make_array_from_descriptor(sdfg_array)
+
+        assert len(sdfg_call_args) == len(self.csdfg.argnames), (
+            "Failed to construct the call arguments,"
+            f" expected {len(self.csdfg.argnames)} but got {len(flat_call_args)}."
+            f"\nExpected: {self.csdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
+        )
+
+        # Calling the SDFG
+        with dace.config.temporary_config():
+            dace.Config.set("compiler", "allow_view_arguments", value=True)
+            self.csdfg(**sdfg_call_args)
+
+        if self.out_names:
+            return [sdfg_call_args[out_name] for out_name in self.out_names]
+        return None
+
+
+def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> CompiledJaxprSDFG:
+    """Compile `tsdfg` and return a `CompiledJaxprSDFG` object with the result."""
+    if any(  # We do not support the DaCe return mechanism
+        array_name.startswith("__return")
+        for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # We can not use `in` because we are not interested in `my_mangled_variable__return_zulu`!
+    ):
+        raise ValueError("Only support SDFGs without '__return' members.")
+    if tsdfg.sdfg.free_symbols:  # This is a simplification that makes our life simple.
+        raise NotImplementedError(f"No free symbols allowed, found: {tsdfg.sdfg.free_symbols}")
+    if not (tsdfg.out_names or tsdfg.inp_names):
+        raise ValueError("No input nor output.")
+
+    # To ensure that the SDFG is compiled and to get rid of a warning we must modify
+    #  some settings of the SDFG. But we also have to fake an immutable SDFG
+    sdfg = tsdfg.sdfg
+    org_sdfg_name = sdfg.name
+    org_recompile = sdfg._recompile
+    org_regenerate_code = sdfg._regenerate_code
+
+    try:
+        # We need to give the SDFG another name, this is needed to prevent a DaCe
+        #  error/warning. This happens if we compile the same lowered SDFG multiple
+        #  times with different options.
+        sdfg.name = f"{sdfg.name}__comp_{int(time.time() * 1000)}_{os.getpid()}"
+        assert len(sdfg.name) < 255  # noqa: PLR2004  # Not a magic number.
+
+        with dace.config.temporary_config():
+            dace.Config.set("compiler", "use_cache", value=False)
+            dace.Config.set("cache", value="name")
+            dace.Config.set("default_build_folder", value=pathlib.Path(".jacecache").resolve())
+            sdfg._recompile = True
+            sdfg._regenerate_code = True
+            csdfg: CompiledSDFG = sdfg.compile()
+
+    finally:
+        sdfg.name = org_sdfg_name
+        sdfg._recompile = org_recompile
+        sdfg._regenerate_code = org_regenerate_code
+
+    return CompiledJaxprSDFG(csdfg=csdfg, inp_names=tsdfg.inp_names, out_names=tsdfg.out_names)
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 2f184a0..9cd3dfd 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -22,14 +22,12 @@
     make_primitive_translator,
     register_primitive_translator,
 )
-from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
 
 __all__ = [
     "JaxprTranslationBuilder",
     "PrimitiveTranslator",
     "PrimitiveTranslatorCallable",
-    "TranslatedJaxprSDFG",
     "TranslationContext",
     "get_registered_primitive_translators",
     "make_primitive_translator",
diff --git a/src/jace/translator/pre_post_translation.py b/src/jace/translator/pre_post_translation.py
index 2299d1b..a32ade6 100644
--- a/src/jace/translator/pre_post_translation.py
+++ b/src/jace/translator/pre_post_translation.py
@@ -22,19 +22,22 @@
 import jax
 from jax import tree_util as jax_tree
 
-from jace import translator, util
+import jace
+from jace import util
 
 
 if TYPE_CHECKING:
     from collections.abc import Callable, Mapping, Sequence
 
+    from jace import translator
+
 
 def postprocess_jaxpr_sdfg(
     trans_ctx: translator.TranslationContext,
     fun: Callable,  # noqa: ARG001  # Currently unused
     call_args: Sequence[Any],
-    outtree: jax_tree.PyTreeDef,
-) -> translator.TranslatedJaxprSDFG:
+    validate: bool = True,
+) -> jace.TranslatedJaxprSDFG:
     """
     Final post processing steps on the `TranslationContext`.
 
@@ -45,16 +48,15 @@ def postprocess_jaxpr_sdfg(
         trans_ctx: The `TranslationContext` obtained from a `translate_jaxpr()` call.
         fun: The original function that was translated.
         call_args: The flattened input arguments.
-        outtree: A pytree describing how to unflatten the output.
+        validate: Perform validation.
 
     Todo:
         - Fixing the scalar input problem on GPU.
         - Fixing stride problem of the input.
     """
-    trans_ctx.validate()
+    trans_ctx.validate()  # Always validate, it is cheap.
     create_input_output_stages(trans_ctx=trans_ctx, call_args=call_args)
-
-    return finalize_translation_context(trans_ctx, outtree=outtree, validate=True)
+    return finalize_translation_context(trans_ctx, validate=validate)
 
 
 def create_input_output_stages(
@@ -202,8 +204,9 @@ def _create_input_state(trans_ctx: translator.TranslationContext, call_args: Seq
 
 
 def finalize_translation_context(
-    trans_ctx: translator.TranslationContext, outtree: jax_tree.PyTreeDef, validate: bool = True
-) -> translator.TranslatedJaxprSDFG:
+    trans_ctx: translator.TranslationContext,
+    validate: bool = True,
+) -> jace.TranslatedJaxprSDFG:
     """
     Finalizes the supplied translation context `trans_ctx`.
 
@@ -218,7 +221,6 @@ def finalize_translation_context(
 
     Args:
         trans_ctx: The context that should be finalized.
-        outtree: A pytree describing how to unflatten the output.
         validate: Call the validate function after the finalizing.
     """
     trans_ctx.validate()
@@ -230,11 +232,10 @@ def finalize_translation_context(
         raise ValueError("No input nor output.")
 
     # We guarantee decoupling
-    tsdfg = translator.TranslatedJaxprSDFG(
+    tsdfg = jace.TranslatedJaxprSDFG(
         sdfg=copy.deepcopy(trans_ctx.sdfg),
         inp_names=trans_ctx.inp_names,
         out_names=trans_ctx.out_names,
-        outtree=outtree,
     )
 
     # Make inputs and outputs to globals.
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
deleted file mode 100644
index 7b05f3b..0000000
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ /dev/null
@@ -1,83 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Container for storing a translated SDFG."""
-
-from __future__ import annotations
-
-import dataclasses
-from typing import TYPE_CHECKING
-
-import dace
-
-
-if TYPE_CHECKING:
-    from jax import tree_util as jax_tree
-
-
-@dataclasses.dataclass(kw_only=True, frozen=True)
-class TranslatedJaxprSDFG:
-    """
-    Encapsulates a translated SDFG with additional the metadata.
-
-    Contrary to the SDFG that is encapsulated inside an `TranslationContext`
-    object, `self` carries a proper SDFG, however:
-    - It does not have `__return*` variables, instead all return arguments are
-        passed by arguments.
-    - All input arguments are passed through arguments mentioned in `inp_names`,
-        while the outputs are passed through `out_names`.
-    - Only variables listed as in/outputs are non transient.
-    - The order inside `inp_names` and `out_names` is the same as in the original Jaxpr.
-    - If an input is used as outputs it appears in both `inp_names` and `out_names`.
-    - Its `arg_names` is set to  `inp_names + out_names`, but arguments that are
-        input and outputs are only listed as inputs.
-
-    The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a
-    `TranslationContext`, that was in turn constructed by
-    `JaxprTranslationBuilder.translate_jaxpr()`, to the
-    `finalize_translation_context()` or preferably to the `postprocess_jaxpr_sdfg()`
-    function.
-
-    Attributes:
-        sdfg: The encapsulated SDFG object.
-        inp_names: Names of the SDFG variables used as inputs.
-        out_names: Names of the SDFG variables used as outputs.
-        outtree: A pytree describing how to unflatten the output.
-
-    Todo:
-        After the SDFG is compiled a lot of code looks strange, because there is
-        no container to store the compiled SDFG and the metadata. This class
-        should be extended to address this need.
-    """
-
-    sdfg: dace.SDFG
-    inp_names: tuple[str, ...]
-    out_names: tuple[str, ...]
-    outtree: jax_tree.PyTreeDef
-
-    def validate(self) -> bool:
-        """Validate the underlying SDFG."""
-        if any(self.sdfg.arrays[inp].transient for inp in self.inp_names):
-            raise dace.sdfg.InvalidSDFGError(
-                f"Found transient inputs: {(inp for inp in self.inp_names if self.sdfg.arrays[inp].transient)}",
-                self.sdfg,
-                self.sdfg.node_id(self.sdfg.start_state),
-            )
-        if any(self.sdfg.arrays[out].transient for out in self.out_names):
-            raise dace.sdfg.InvalidSDFGError(
-                f"Found transient outputs: {(out for out in self.out_names if self.sdfg.arrays[out].transient)}",
-                self.sdfg,
-                self.sdfg.node_id(self.sdfg.start_state),
-            )
-        if self.sdfg.free_symbols:  # This is a simplification that makes our life simple.
-            raise dace.sdfg.InvalidSDFGError(
-                f"Found free symbols: {self.sdfg.free_symbols}",
-                self.sdfg,
-                self.sdfg.node_id(self.sdfg.start_state),
-            )
-        self.sdfg.validate()
-        return True
diff --git a/src/jace/util/dace_helper.py b/src/jace/util/dace_helper.py
deleted file mode 100644
index adec44e..0000000
--- a/src/jace/util/dace_helper.py
+++ /dev/null
@@ -1,142 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Implements all utility functions that are related to DaCe."""
-
-from __future__ import annotations
-
-import os
-import pathlib
-import time
-from typing import TYPE_CHECKING, Any
-
-import dace
-from dace import data as dace_data
-from dace.codegen.compiled_sdfg import CompiledSDFG
-
-from jace import util
-
-
-if TYPE_CHECKING:
-    from collections.abc import Sequence
-
-    import numpy as np
-
-    from jace import translator
-
-__all__ = ["CompiledSDFG", "compile_jax_sdfg", "run_jax_sdfg"]
-
-
-def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> CompiledSDFG:
-    """Compiles the embedded SDFG and return the resulting `CompiledSDFG` object."""
-    if any(  # We do not support the DaCe return mechanism
-        array_name.startswith("__return")
-        for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # We can not use `in` because we are not interested in `my_mangled_variable__return_zulu`!
-    ):
-        raise ValueError("Only support SDFGs without '__return' members.")
-    if tsdfg.sdfg.free_symbols:  # This is a simplification that makes our life simple.
-        raise NotImplementedError(f"No free symbols allowed, found: {tsdfg.sdfg.free_symbols}")
-
-    # To ensure that the SDFG is compiled and to get rid of a warning we must modify
-    #  some settings of the SDFG. But we also have to fake an immutable SDFG
-    sdfg = tsdfg.sdfg
-    org_sdfg_name = sdfg.name
-    org_recompile = sdfg._recompile
-    org_regenerate_code = sdfg._regenerate_code
-
-    try:
-        # We need to give the SDFG another name, this is needed to prevent a DaCe
-        #  error/warning. This happens if we compile the same lowered SDFG multiple
-        #  times with different options.
-        sdfg.name = f"{sdfg.name}__comp_{int(time.time() * 1000)}_{os.getpid()}"
-        assert len(sdfg.name) < 255  # noqa: PLR2004  # Not a magic number.
-
-        with dace.config.temporary_config():
-            dace.Config.set("compiler", "use_cache", value=False)
-            dace.Config.set("cache", value="name")
-            dace.Config.set("default_build_folder", value=pathlib.Path(".jacecache").resolve())
-            sdfg._recompile = True
-            sdfg._regenerate_code = True
-            csdfg: CompiledSDFG = sdfg.compile()
-
-    finally:
-        sdfg.name = org_sdfg_name
-        sdfg._recompile = org_recompile
-        sdfg._regenerate_code = org_regenerate_code
-
-    return csdfg
-
-
-def run_jax_sdfg(
-    csdfg: CompiledSDFG,
-    inp_names: Sequence[str],
-    out_names: Sequence[str],
-    flat_call_args: Sequence[Any],
-) -> list[np.ndarray]:
-    """
-    Run the compiled SDFG.
-
-    The function assumes that the SDFG was finalized and then compiled by
-    `compile_jax_sdfg()`. All arguments except `csdfg` must come from the
-    `TranslatedJaxprSDFG` object that was used to compile SDFG.
-
-    Returns:
-        The function will return a flattened version of the output. To
-        reconstruct the actual return type/value of the original computation
-        the `outtree` that is stored inside the `TranslatedJaxprSDFG` object
-        that was used to compile the SDFG can be used.
-
-    Args:
-        csdfg: The `CompiledSDFG` object.
-        inp_names: Names of the SDFG variables used as inputs.
-        out_names: Names of the SDFG variables used as outputs.
-        flat_call_args: Flattened input arguments.
-
-    Notes:
-        Currently the strides of the input arguments must match the ones that
-        were used for lowering the SDFG.
-        In DaCe the return values are allocated on a per `CompiledSDFG` basis.
-        Thus every call to a compiled SDFG will override the value of the last
-        call, in JaCe the memory is allocated on every call. In addition
-        scalars are returned as arrays of length one.
-
-    Todo:
-        - Once we supported GPU change type annotation.
-    """
-    if len(inp_names) != len(flat_call_args):
-        # Either error or static arguments are not removed.
-        raise RuntimeError("Wrong number of arguments.")
-
-    sdfg_call_args: dict[str, Any] = {}
-    for in_name, in_val in zip(inp_names, flat_call_args, strict=True):
-        # TODO(phimuell): Implement a stride matching process.
-        if util.is_jax_array(in_val):
-            if not util.is_fully_addressable(in_val):
-                raise ValueError(f"Passed a not fully addressable Jax array as '{in_name}'")
-            in_val = in_val.__array__()  # noqa: PLW2901  # Jax arrays do not expose the __array_interface__.
-        sdfg_call_args[in_name] = in_val
-
-    arrays = csdfg.sdfg.arrays
-    for out_name, sdfg_array in ((out_name, arrays[out_name]) for out_name in out_names):
-        if out_name in sdfg_call_args:
-            if util.is_jax_array(sdfg_call_args[out_name]):
-                raise ValueError("Passed an immutable Jax array as output.")
-        else:
-            sdfg_call_args[out_name] = dace_data.make_array_from_descriptor(sdfg_array)
-
-    assert len(sdfg_call_args) == len(csdfg.argnames), (
-        "Failed to construct the call arguments,"
-        f" expected {len(csdfg.argnames)} but got {len(flat_call_args)}."
-        f"\nExpected: {csdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
-    )
-
-    # Calling the SDFG
-    with dace.config.temporary_config():
-        dace.Config.set("compiler", "allow_view_arguments", value=True)
-        csdfg(**sdfg_call_args)
-
-    return [sdfg_call_args[out_name] for out_name in out_names]
diff --git a/tests/integration_tests/test_empty_jaxpr.py b/tests/integration_tests/test_empty_jaxpr.py
index b877471..8bcf195 100644
--- a/tests/integration_tests/test_empty_jaxpr.py
+++ b/tests/integration_tests/test_empty_jaxpr.py
@@ -60,7 +60,7 @@ def wrapped(A: np.ndarray, B: np.float64) -> np.ndarray:  # noqa: ARG001  # Expl
     res = compiled(A, B)
 
     assert len(lowered._translated_sdfg.inp_names) == 2
-    assert len(compiled._inp_names) == 2
+    assert len(compiled._csdfg.inp_names) == 2
     assert isinstance(res, np.ndarray)
     assert np.all(res == A)
     assert res.__array_interface__["data"][0] != A.__array_interface__["data"][0]
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 9375b4c..5647d43 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -547,9 +547,9 @@ def wrapped(A: np.ndarray, B: np.ndarray) -> tuple[np.ndarray, np.ndarray]:
     res = compiled(A, B)
 
     assert len(lowered._translated_sdfg.inp_names) == 2
-    assert len(compiled._inp_names) == 2
+    assert len(compiled._csdfg.inp_names) == 2
     assert len(lowered._translated_sdfg.out_names) == 2
-    assert len(compiled._out_names) == 2
+    assert len(compiled._csdfg.out_names) == 2
     assert isinstance(res, tuple), f"Expected 'tuple', but got '{type(res).__name__}'."
     assert len(res) == 2
     assert np.allclose(ref, res)
@@ -621,7 +621,7 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:  # noqa: ARG001  # Expli
     res2 = compiled(A, C)  # wrong call to show that nothing is affected.
 
     assert len(lowered._translated_sdfg.inp_names) == 2
-    assert len(compiled._inp_names) == 2
+    assert len(compiled._csdfg.inp_names) == 2
     assert np.all(res1 == res2)
     assert np.allclose(ref, res1)
 
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index fe99161..d61d360 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -192,7 +192,7 @@ def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
     with jax.experimental.disable_x64():
         jaxpr = jax.make_jaxpr(testee)(A, B)
 
-    _, flat_in_vals, outtree = ptrans.trace_and_flatten_function(
+    _, flat_in_vals, _ = ptrans.trace_and_flatten_function(
         fun=testee, trace_call_args=(A, B), trace_call_kwargs={}, trace_options={}
     )
     builder = translator.JaxprTranslationBuilder(
@@ -200,8 +200,8 @@ def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
     )
     trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
 
-    tsdfg: translator.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
-        trans_ctx=trans_ctx, fun=testee, call_args=flat_in_vals, outtree=outtree
+    tsdfg: jace.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
+        trans_ctx=trans_ctx, fun=testee, call_args=flat_in_vals
     )
 
     # Because x64 is disabled Jax traces the input as float32, even if we have passed

From 6a8e2b5fbfcbf1f86bf830f1eb5d828c28d641d2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 13 Jun 2024 09:23:41 +0200
Subject: [PATCH 363/458] Made some cleaning.

---
 src/jace/stages.py                          | 134 +++++++++-----------
 src/jace/translator/pre_post_translation.py |  67 +++++-----
 2 files changed, 89 insertions(+), 112 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index a5c6049..8806787 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -73,7 +73,8 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
     object is later lowered with the same arguments the result might be taken
     from the cache.
 
-    Furthermore, a `JaCeWrapped` object is composable with all Jax transformations.
+    Furthermore, a `JaCeWrapped` object is composable with all Jax transformations,
+    all other stages are not.
 
     Args:
         fun: The function that is wrapped.
@@ -81,12 +82,12 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
         jit_options: Options to influence the jit process.
 
     Todo:
-        - Support keyword arguments and default values of the wrapped function.
+        - Support default values of the wrapped function.
         - Support static arguments.
 
     Note:
         The tracing of function will always happen with enabled `x64` mode,
-        which is implicitly and temporary activated while tracing.
+        which is implicitly and temporary activated during tracing.
     """
 
     _fun: Callable
@@ -103,11 +104,7 @@ def __init__(
             param.default is param.empty for param in inspect.signature(fun).parameters.values()
         )
         super().__init__()
-        # We have to shallow copy both the translator and the jit options.
-        #  This prevents that any modifications affect `self`.
-        #  Shallow is enough since the translators themselves are immutable.
         self._primitive_translators = {**primitive_translators}
-        # TODO(phimuell): Do we need to deepcopy the options?
         self._jit_options = {**jit_options}
         self._fun = fun
 
@@ -115,13 +112,13 @@ def __call__(self, *args: Any, **kwargs: Any) -> Any:
         """
         Executes the wrapped function, lowering and compiling as needed in one step.
 
-        This function will lower and compile in one go.
-        The function accepts the same arguments as the original computation.
+        This function will lower and compile in one go. The function accepts the same
+        arguments as the original computation and the return value is unflattened.
 
         Note:
             This function is also aware if a Jax tracing is going on. In this
-            case, it will not lower and compile but forward the call to the
-            wrapped Python function.
+            case, it will forward the computation.
+            Currently, this function ignores the value of `jax.disable_jit()`.
         """
         if util.is_tracing_ongoing(*args, **kwargs):
             return self._fun(*args, **kwargs)
@@ -136,15 +133,15 @@ def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
         """
         Lower the wrapped computation for the given arguments.
 
-        Performs the first two steps of the AOT steps described above, i.e.
-        trace the wrapped function with the given arguments and stage it out
-        to a Jaxpr. Then translate it to an SDFG. The result is encapsulated
-        inside a `JaCeLowered` object which can later be compiled.
+        Performs the first two steps of the AOT steps described above, i.e. trace the
+        wrapped function with the given arguments and stage it out to a Jaxpr. Then
+        translate it to an SDFG. The result is encapsulated inside a `JaCeLowered`
+        object that can later be compiled.
 
-        It should be noted that the current lowering process will hard code
-        the strides and the storage location of the input inside the SDFG.
-        Thus if the SDFG is lowered with arrays in C order, calling the compiled
-        SDFG with FORTRAN order will result in an error.
+        It should be noted that the current lowering process will hard code the strides
+        and the storage location of the input inside the SDFG. Thus if the SDFG is
+        lowered with arrays in C order, calling the compiled SDFG with FORTRAN order
+        will result in an error.
 
         Note:
             The tracing is always done with activated `x64` mode.
@@ -169,8 +166,7 @@ def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
         return JaCeLowered(tsdfg, outtree)
 
     @property
-    def wrapped_fun(self) -> Callable:
-        """Returns the wrapped function."""
+    def wrapped_fun(self) -> Callable:  # noqa: D102  # No docstring.
         return self._fun
 
     def _make_call_description(
@@ -179,13 +175,12 @@ def _make_call_description(
         """
         Computes the key for the `JaCeWrapped.lower()` call inside the cache.
 
-        For all non static arguments the function will generate an abstract
-        description of an argument and for all static arguments the concrete
-        value.
+        For all non static arguments the function will generate an abstract description
+        of an argument and for all static arguments the concrete value.
 
         Notes:
-            The abstract description also includes storage location, i.e. if
-            on CPU or on GPU, and the strides of the arrays.
+            The abstract description also includes storage location, i.e. if on CPU or
+            on GPU, and the strides of the arrays.
         """
         # TODO(phimuell): Implement static arguments
         flat_call_args = tuple(tcache._AbstractCallArgument.from_value(x) for x in flat_call_args)
@@ -198,23 +193,22 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
     """
     Represents the original computation as an SDFG.
 
-    This class is the output type of `JaCeWrapped.lower()` and represents the
-    originally wrapped computation as an SDFG. This stage is followed by the
-    `JaCeCompiled` stage, by calling `self.compile()`. A user should never
-    directly construct a `JaCeLowered` object directly, instead
-    `JaCeWrapped.lower()` should be used.
+    This class is the output type of `JaCeWrapped.lower()` and represents the original
+    computation as an SDFG. This stage is followed by the `JaCeCompiled` stage, by
+    calling `self.compile()`. A user should never directly construct a `JaCeLowered`
+    object directly, instead `JaCeWrapped.lower()` should be used.
 
-    Before the SDFG is compiled it is optimized, see `JaCeLowered.compile()` for
-    how to control the process.
+    Before the SDFG is compiled it is optimized, see `JaCeLowered.compile()` for how to
+    control the process.
 
     Args:
         tsdfg: The lowered SDFG with metadata.
         outtree: The pytree describing how to unflatten the output.
 
     Note:
-        `self` will manage the passed `tsdfg` object. Modifying it results is
-        undefined behavior. Although `JaCeWrapped` is composable with Jax
-        transformations `JaCeLowered` is not.
+        `self` will manage the passed `tsdfg` object. Modifying it results is undefined
+        behavior. Although `JaCeWrapped` is composable with Jax transformations
+        `JaCeLowered` is not.
     """
 
     _translated_sdfg: jace.TranslatedJaxprSDFG
@@ -234,9 +228,9 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
         """
         Optimize and compile the lowered SDFG using `compiler_options`.
 
-        To perform the optimizations `jace_optimize()` is used. The options that are
-        passed to it it are obtained by passing `compiler_options` to
-        `finalize_compilation_options()` first, see there for more information.
+        To perform the optimizations `jace_optimize()` is used. The actual options that
+        are forwarded to it are obtained by passing `compiler_options` to
+        `finalize_compilation_options()`.
 
         Args:
             compiler_options: The optimization options to use.
@@ -255,21 +249,13 @@ def compiler_ir(self, dialect: str | None = None) -> jace.TranslatedJaxprSDFG:
         """
         Returns the internal SDFG.
 
-        The function returns a `TranslatedJaxprSDFG` object. Direct modification
-        of the returned object is forbidden and results in undefined behaviour.
+        The function returns a `TranslatedJaxprSDFG` object. Direct modification of the
+        returned object is forbidden and results in undefined behaviour.
         """
         if (dialect is None) or (dialect.upper() == "SDFG"):
             return self._translated_sdfg
         raise ValueError(f"Unknown dialect '{dialect}'.")
 
-    def view(self, filename: str | None = None) -> None:
-        """
-        Runs the `view()` method of the underlying SDFG.
-
-        This will open a browser and display the SDFG.
-        """
-        self.compiler_ir().sdfg.view(filename=filename, verbose=False)
-
     def as_sdfg(self) -> dace.SDFG:
         """
         Returns the encapsulated SDFG.
@@ -284,13 +270,11 @@ def _make_call_description(
         """
         Creates the key for the `self.compile()` transition function.
 
-        The generated key will not only depend on the arguments that were
-        passed to the translation function, i.e. `compile(compiler_options)`,
-        in addition it will also take the set of currently active set of
-        global options. Furthermore, the key will depend on the concrete values.
+        The key will depend on the final values that were used for optimization, i.e.
+        they it will also include the global set of optimization options.
         """
         unflatted_args, unflatted_kwargs = jax_tree.tree_unflatten(intree, flat_call_args)
-        assert (not len(unflatted_kwargs)) and (len(unflatted_args) <= 1)
+        assert (not unflatted_kwargs) and (len(unflatted_args) <= 1)
 
         options = finalize_compilation_options(unflatted_args[0] if unflatted_args else {})
         flat_options, optiontree = jax_tree.tree_flatten(options)
@@ -306,15 +290,15 @@ class JaCeCompiled:
     This is the last stage of the JaCe's jit chain. A user should never create a
     `JaCeCompiled` instance, instead `JaCeLowered.compile()` should be used.
 
-    Since the strides and storage location of the arguments, that where used
-    to lower the computation are hard coded inside the SDFG, a `JaCeCompiled`
-    object can only be called with compatible arguments.
+    Since the strides and storage location of the arguments, that where used to lower
+    the computation are hard coded inside the SDFG, a `JaCeCompiled` object can only be
+    called with compatible arguments.
 
     Args:
         csdfg: The compiled SDFG object.
-        inp_names: Names of the SDFG variables used as inputs.
-        out_names: Names of the SDFG variables used as outputs.
-        outtree: A pytree describing how to unflatten the output.
+        inp_names: SDFG variables used as inputs.
+        out_names: SDFG variables used as outputs.
+        outtree: Pytree describing how to unflatten the output.
 
     Note:
         The class assumes ownership of its input arguments.
@@ -339,11 +323,10 @@ def __call__(self, *args: Any, **kwargs: Any) -> Any:
         Calls the embedded computation.
 
         Note:
-            Unlike the `lower()` function which takes the same arguments as the
-            original computation, to call this function you have to remove all
-            static arguments.
-            Furthermore, all arguments must have strides and storage locations
-            that is compatible with the ones that were used for lowering.
+            Unlike the `lower()` function which takes the same arguments as the original
+            computation, to call this function you have to remove all static arguments.
+            Furthermore, all arguments must have strides and storage locations that is
+            compatible with the ones that were used for lowering.
         """
         flat_call_args = jax_tree.tree_leaves((args, kwargs))
         flat_output = self._csdfg(flat_call_args)
@@ -357,11 +340,11 @@ def __call__(self, *args: Any, **kwargs: Any) -> Any:
 _JACELOWERED_ACTIVE_COMPILE_OPTIONS: CompilerOptions = optimization.DEFAULT_OPTIMIZATIONS.copy()
 """Global set of currently active compilation/optimization options.
 
-These options are used by `JaCeLowered.compile()` to determine which options are
-forwarded to the underlying `jace_optimize()` function. It is initialized to
-`jace.optimization.DEFAULT_OPTIMIZATIONS` and can be managed through the
-`update_active_compiler_options()` function. For obtaining the options that should
-finally be used the `finalize_compilation_options()` function can be used.
+The global set is initialized with `jace.optimization.DEFAULT_OPTIMIZATIONS`. It can be
+managed through `update_active_compiler_options()` and accessed through
+`get_active_compiler_options()`, however, it is advised that a user should use
+`finalize_compilation_options()` for getting the final options that should be used
+for optimization.
 """
 
 
@@ -393,10 +376,13 @@ def finalize_compilation_options(compiler_options: CompilerOptions | None) -> Co
     """
     Returns the final compilation options.
 
-    There are two different sources of these options. The first one is the global set
-    of currently active compiler options. The second one is the options that are passed
-    to this function, which takes precedence. Thus, the `compiler_options` argument of
-    this function describes the difference from the currently active global options.
+    There are two different sources of optimization options. The first one is the global
+    set of currently active compiler options. The second one is the options that are
+    passed to this function, which takes precedence. Thus, the `compiler_options`
+    argument describes the difference from the currently active global options.
+
+    This function is used by `JaCeLowered` if it has to determine which options to use
+    for optimization, either for compiling the lowered SDFG or for computing the key.
 
     Args:
         compiler_options: The local compilation options.
diff --git a/src/jace/translator/pre_post_translation.py b/src/jace/translator/pre_post_translation.py
index a32ade6..5fef3af 100644
--- a/src/jace/translator/pre_post_translation.py
+++ b/src/jace/translator/pre_post_translation.py
@@ -5,12 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""
-This module contains all functions that are related to post processing the SDFG.
-
-Most of them operate on `TranslatedJaxprSDFG` objects.
-Currently they mostly exist for the sake of existing.
-"""
+"""Functions for the pre and post processing during the translation."""
 
 from __future__ import annotations
 
@@ -41,8 +36,8 @@ def postprocess_jaxpr_sdfg(
     """
     Final post processing steps on the `TranslationContext`.
 
-    While the function performs the post processing on the context in place,
-    the returned `TranslatedJaxprSDFG` will be decoupled from the input.
+    While the function performs the post processing on the context in place, the
+    returned `TranslatedJaxprSDFG` will be decoupled from the input.
 
     Args:
         trans_ctx: The `TranslationContext` obtained from a `translate_jaxpr()` call.
@@ -72,7 +67,7 @@ def create_input_output_stages(
         call_args: The flattened call arguments that should be used.
 
     Note:
-        The output SDFG will still be canonical.
+        The processed SDFG will remain canonical.
     """
     _create_input_state(trans_ctx, call_args)
     _create_output_state(trans_ctx)
@@ -83,12 +78,12 @@ def _create_output_state(trans_ctx: translator.TranslationContext) -> None:
     Creates the output processing stage for the SDFG in place.
 
     The function will create a new terminal state, in which all outputs, denoted
-    in `trans_ctx.out_names`, will be written into new SDFG variables.
-    In case the output variable is a scalar, the output will be replaced by an
-    array of length one.
+    in `trans_ctx.out_names`, will be written into new SDFG variables. In case the
+    output variable is a scalar, the output will be replaced by an array of length one.
+    This behaviour is consistent with Jax.
 
-    Notes:
-        This is consistent with Jax' behaviour.
+    Args:
+        trans_ctx: The translation context to process.
     """
     assert trans_ctx.inp_names is not None and trans_ctx.out_names is not None
 
@@ -138,12 +133,11 @@ def _create_input_state(trans_ctx: translator.TranslationContext, call_args: Seq
     """
     Creates the input processing state for the SDFG in place.
 
-    The function creates a new set of variables that are exposed as inputs.
-    If an input argument is an array, the new variable will have the same
-    strides and storage location the actual input value, that is passed
-    inside `call_args`.
-    If the input is a scalar and GPU mode is activated, the function will add
-    the necessary connections to transfer it to the device.
+    The function will create a new set of variables that are exposed as inputs. If an
+    input argument is an array, the new variable will have the same strides and storage
+    location the actual input value, that is passed inside `call_args`. If the input is
+    a scalar and GPU mode is activated, the function will add the necessary connections
+    to transfer it to the device.
 
     Args:
         trans_ctx: The translation context that should be modified.
@@ -210,14 +204,14 @@ def finalize_translation_context(
     """
     Finalizes the supplied translation context `trans_ctx`.
 
-    The function will process the SDFG that is encapsulated inside the context,
-    i.e. a canonical one, into a proper SDFG, as it is described in
-    `TranslatedJaxprSDFG`. It is important to realize that this function does
-    not perform any optimization of the underlying SDFG itself, instead it
-    prepares an SDFG such that it can be passed to the optimization pipeline.
+    The function will process the SDFG that is encapsulated inside the context, i.e. a
+    canonical one, into a proper SDFG, as it is described in `TranslatedJaxprSDFG`. It
+    is important to realize that this function does not perform any optimization of the
+    underlying SDFG itself, instead it prepares an SDFG such that it can be passed to
+    the optimization pipeline.
 
-    The function will not mutate the passed translation context and the output
-    is always decoupled from its output.
+    The returned object is fully decoupled from its input and `trans_ctx` is not
+    modified.
 
     Args:
         trans_ctx: The context that should be finalized.
@@ -259,24 +253,24 @@ def trace_and_flatten_function(
     trace_options: Mapping[str, Any],
 ) -> tuple[jax.core.ClosedJaxpr, list[Any], jax_tree.PyTreeDef]:
     """
-    Traces `fun` and generates the Jaxpr and compute some related meta data.
+    Traces `fun` and generates the Jaxpr and some related meta data.
 
     For tracing the computation `fun` the function uses the `trace_call_args`
-    and `trace_call_kwargs` arguments, both should not be flattened yet.
+    and `trace_call_kwargs` arguments, both should not be flattened. Furthermore,
+    the tracing is done in enabled x64 mode.
 
     Returns:
         The function will return a tuple of length three.
-        1) The Jaxpr that was generated by Jax using the supplied arguments
-            and options.
-        2) The flattened input values.
-        3) A pytree describing the output structure.
+        1) The Jaxpr that was generated by Jax using the supplied arguments and options.
+        2) The flattened input.
+        3) A pytree describing the output.
 
     Args:
         fun: The original Python computation.
         trace_call_args: The positional arguments that should be used for
             tracing the computation.
-        trace_call_kwargs: The keyword arguments that should be for tracing
-            the computation.
+        trace_call_kwargs: The keyword arguments that should be used for
+            tracing the computation.
         trace_options: The options used for tracing, the same arguments that
             are supported by `jace.jit`.
 
@@ -284,9 +278,6 @@ def trace_and_flatten_function(
         - Handle default arguments of `fun`.
         - Handle static arguments.
         - Turn `trace_options` into a `TypedDict` and sync with `jace.jit`.
-
-    Note:
-        - The tracing is done with x64 enabled.
     """
     if trace_options:
         raise NotImplementedError(

From c05ee3ce6bafd5a782af4d679712bff9cf789360 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 13 Jun 2024 09:33:49 +0200
Subject: [PATCH 364/458] Added a test for the pytree support in JaCe.

---
 tests/unit_tests/test_jax_api.py | 17 +++++++++++++++++
 1 file changed, 17 insertions(+)

diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index d61d360..8014826 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -267,3 +267,20 @@ def testee(A: jax.Array) -> jax.Array:
     assert res.shape == ref.shape
     assert res.dtype == ref.dtype
     assert np.allclose(res, ref)
+
+
+def test_jax_pytree() -> None:
+    """Perform if pytrees are handled correctly."""
+
+    def testee(A: dict[str, np.ndarray]) -> dict[str, jax.Array]:
+        mod_a = {k: jnp.sin(v) for k, v in A.items()}
+        mod_a["__additional"] = jnp.asin(A["a1"])
+        return mod_a
+
+    A = {f"a{i}": testutil.mkarray((10, 10)) for i in range(4)}
+    ref = testee(A)
+    res = jace.jit(testee)(A)
+
+    assert len(res) == len(ref)
+    assert type(res) == type(ref)
+    assert (np.allclose(res[k], ref[k]) for k in ref)

From ce4c64304df7520609dec8ec6daba01557ac0a15 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 13 Jun 2024 09:36:46 +0200
Subject: [PATCH 365/458] Enabled the optimization mode in the tests again.

---
 tests/integration_tests/primitive_translators/conftest.py | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/conftest.py b/tests/integration_tests/primitive_translators/conftest.py
index 3c79e98..f51af06 100644
--- a/tests/integration_tests/primitive_translators/conftest.py
+++ b/tests/integration_tests/primitive_translators/conftest.py
@@ -23,9 +23,8 @@
 @pytest.fixture(
     autouse=True,
     params=[
-        optimization.NO_OPTIMIZATIONS
-        # TODO(phimuell): find a way to conditionally enable.
-        # optimization.DEFAULT_OPTIMIZATIONS,
+        optimization.NO_OPTIMIZATIONS,
+        optimization.DEFAULT_OPTIMIZATIONS,
     ],
 )
 def _set_compile_options(request) -> Generator[None, None, None]:

From 1743374c087c8406b80295dbde22d441467bf2b2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 13 Jun 2024 10:47:44 +0200
Subject: [PATCH 366/458] Disabled the elementconversion stuff, since it takes
 too long.

---
 .../test_primitive_convert_element_type.py                   | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
index fe86b4b..a5bbcdb 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
@@ -25,8 +25,11 @@
 from tests import util as testutil
 
 
+pytest.skip("Takes too long", allow_module_level=True)
+
+
 # fmt: off
-_DACE_REAL_TYPES: Final[list[type]] = [
+_DACE_REAL_TYPES: Final[list[type]] = [ # type: ignore[unreachable]
         np.int_, np.int8, np.int16, np.int32, np.int64,
         np.uint, np.uint8, np.uint16, np.uint32, np.uint64,
         np.float64, np.float32, np.float64,

From efc27e0eb6ff0028d9d1b1130637221f94557a27 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 13 Jun 2024 13:52:23 +0200
Subject: [PATCH 367/458] Disabled the optimized unit tests, since there is a
 simplification bug in DaCe.

See https://github.com/spcl/dace/issues/1595 for more information.
---
 tests/integration_tests/primitive_translators/conftest.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/tests/integration_tests/primitive_translators/conftest.py b/tests/integration_tests/primitive_translators/conftest.py
index f51af06..1c4008b 100644
--- a/tests/integration_tests/primitive_translators/conftest.py
+++ b/tests/integration_tests/primitive_translators/conftest.py
@@ -24,7 +24,10 @@
     autouse=True,
     params=[
         optimization.NO_OPTIMIZATIONS,
-        optimization.DEFAULT_OPTIMIZATIONS,
+        pytest.param(
+            optimization.DEFAULT_OPTIMIZATIONS,
+            marks=pytest.mark.skip("Simplify bug 'https://github.com/spcl/dace/issues/1595'"),
+        ),
     ],
 )
 def _set_compile_options(request) -> Generator[None, None, None]:

From 0221d7bef2bb0717e845e02f8852d7b29d19236c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 13 Jun 2024 13:53:08 +0200
Subject: [PATCH 368/458] Updated the tests a little bit.

---
 tests/integration_tests/test_jaxpr_translator_builder.py | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 5647d43..3233b2d 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -513,9 +513,8 @@ def wrapped(A: float) -> float:
     assert lower_cnt[0] == 1
 
 
-@pytest.mark.skip(reason="Currently 'scalar' return values, are actually shape '(1,)' arrays.")
 def test_builder_scalar_return_type() -> None:
-    """Tests if the type is the same, in case of scalar return."""
+    """As Jax we always return an array, even for a scalar."""
 
     @jace.jit
     def wrapped(A: np.float64) -> np.float64:
@@ -523,8 +522,9 @@ def wrapped(A: np.float64) -> np.float64:
 
     A = np.float64(1.0)
     res = wrapped(A)
-    assert type(res) is np.float64, f"Expected type 'np.float64', but got '{type(res).__name__}'."
-    assert res == np.float64(0.0)
+    assert res.shape == (1,)
+    assert res.dtype == np.float64
+    assert res[0] == np.float64(1.0)
 
 
 def test_builder_multiple_return_values() -> None:

From fd9fb8eeab109b2a90b229cc52c209cfcd12c314 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 13 Jun 2024 15:16:13 +0200
Subject: [PATCH 369/458] This should solve some cache issue.

---
 .../test_primitive_iota.py                     | 18 +++++++++---------
 1 file changed, 9 insertions(+), 9 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_iota.py b/tests/integration_tests/primitive_translators/test_primitive_iota.py
index 10ba671..1fd548a 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_iota.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_iota.py
@@ -9,6 +9,7 @@
 
 import jax
 import numpy as np
+import pytest
 from jax import numpy as jnp
 
 import jace
@@ -23,16 +24,15 @@ def testee(A: int) -> jax.Array:
     assert np.all(ref == res)
 
 
-def test_iota_broadcast() -> None:
+@pytest.mark.parametrize("d", [0, 1, 2, 3])
+def test_iota_broadcast(d) -> None:
     shape = (2, 2, 2, 2)
 
-    for d in range(len(shape)):
-        # Must be inside the loop to bypass caching.
-        def testee(A: np.int32) -> jax.Array:
-            return jax.lax.broadcasted_iota("int32", shape, d) + A  # noqa: B023  # Variable capturing.
+    def testee(A: np.int32) -> jax.Array:
+        return jax.lax.broadcasted_iota("int32", shape, d) + A
 
-        ref = testee(np.int32(0))
-        res = jace.jit(testee)(np.int32(0))
+    ref = testee(np.int32(0))
+    res = jace.jit(testee)(np.int32(0))
 
-        assert res.shape == shape
-        assert np.all(ref == res), f"Expected: {ref.tolist()}; Got: {res.tolist()}"
+    assert res.shape == shape
+    assert np.all(ref == res), f"Expected: {ref.tolist()}; Got: {res.tolist()}"

From e43dd5339b37b92fbc3a3c618c34362cb5dca79b Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 13 Jun 2024 15:19:40 +0200
Subject: [PATCH 370/458] Renamed the `mkarray()` function to `make_array()`.

---
 ...primitive_arithmetic_logical_operations.py | 24 +++++++-------
 .../test_primitive_broadcast_in_dim.py        |  2 +-
 .../test_primitive_convert_element_type.py    |  2 +-
 .../test_primitive_copy.py                    |  2 +-
 .../test_primitive_reshape.py                 |  2 +-
 .../test_primitive_select_n.py                | 10 +++---
 .../test_primitive_slicing.py                 |  4 +--
 .../test_primitive_squeeze_expand_dims.py     |  2 +-
 .../test_jaxpr_translator_builder.py          | 20 ++++++------
 tests/unit_tests/test_caching.py              | 32 +++++++++----------
 tests/unit_tests/test_decorator.py            |  8 ++---
 tests/unit_tests/test_jax_api.py              | 16 +++++-----
 tests/unit_tests/test_misc.py                 |  4 +--
 tests/util.py                                 | 10 +++---
 14 files changed, 70 insertions(+), 68 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index cd49feb..c5dbea0 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -86,7 +86,7 @@ def logical_ops(request) -> tuple[Callable, tuple[np.ndarray, ...]]:
     """Returns a logical operation function and inputs."""
     return (
         request.param[0],
-        tuple(testutil.mkarray((2, 2), request.param[2]) for _ in range(request.param[1])),
+        tuple(testutil.make_array((2, 2), request.param[2]) for _ in range(request.param[1])),
     )
 
 
@@ -130,7 +130,7 @@ def alt_unary_ops(request, dtype: type) -> tuple[Callable, np.ndarray]:
     Some of the unary operations are combined to ensure that they will succeed.
     An example is `asin()` which only takes values in the range `[-1, 1]`.
     """
-    return (request.param, testutil.mkarray((2, 2), dtype))
+    return (request.param, testutil.make_array((2, 2), dtype))
 
 
 @pytest.fixture(
@@ -150,7 +150,7 @@ def alt_binary_ops_float(request) -> tuple[Callable, tuple[np.ndarray, np.ndarra
     # Getting 0 in the division test is unlikely.
     return (  # type: ignore[return-value]  # Type confusion.
         request.param,
-        tuple(testutil.mkarray((2, 2), np.float64) for _ in range(2)),
+        tuple(testutil.make_array((2, 2), np.float64) for _ in range(2)),
     )
 
 
@@ -168,7 +168,7 @@ def alt_binary_compare_ops(request) -> tuple[Callable, tuple[np.ndarray, np.ndar
     """Comparison operations, operates on integers."""
     return (
         request.param,
-        tuple(np.abs(testutil.mkarray((20, 20), np.int32)) % 30 for _ in range(2)),
+        tuple(np.abs(testutil.make_array((20, 20), np.int32)) % 30 for _ in range(2)),
     )
 
 
@@ -181,7 +181,7 @@ def alt_binary_compare_ops(request) -> tuple[Callable, tuple[np.ndarray, np.ndar
 )
 def broadcast_input(request) -> tuple[np.ndarray, np.ndarray]:
     """Inputs to be used for the broadcast test."""
-    return tuple(testutil.mkarray(shape) for shape in request.param)  # type: ignore[return-value] # can not deduce that it is only size 2.
+    return tuple(testutil.make_array(shape) for shape in request.param)  # type: ignore[return-value] # can not deduce that it is only size 2.
 
 
 def _perform_alt_test(testee: Callable, *args: Any) -> None:
@@ -216,7 +216,7 @@ def test_mapped_unary_array() -> None:
     def testee(A: np.ndarray) -> jax.Array:
         return jnp.sin(A)
 
-    A = testutil.mkarray((100, 10, 3))
+    A = testutil.make_array((100, 10, 3))
 
     _perform_alt_test(testee, A)
 
@@ -253,8 +253,8 @@ def test_mapped_binary_array() -> None:
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
-    A = testutil.mkarray((100, 10, 3))
-    B = testutil.mkarray((100, 10, 3))
+    A = testutil.make_array((100, 10, 3))
+    B = testutil.make_array((100, 10, 3))
     _perform_alt_test(testee, A, B)
 
 
@@ -262,7 +262,7 @@ def test_mapped_binary_array_scalar() -> None:
     def testee(A: np.ndarray | np.float64, B: np.float64 | np.ndarray) -> np.ndarray:
         return A + B  # type: ignore[return-value]  # It is always an array.
 
-    A = testutil.mkarray((100, 22))
+    A = testutil.make_array((100, 22))
     B = np.float64(1.34)
     _perform_alt_test(testee, A, B)
     _perform_alt_test(testee, B, A)
@@ -275,7 +275,7 @@ def testeeR(A: np.ndarray) -> np.ndarray:
     def testeeL(A: np.ndarray) -> np.ndarray:
         return 1.52 + A
 
-    A = testutil.mkarray((100, 22))
+    A = testutil.make_array((100, 22))
     _perform_alt_test(testeeR, A)
     _perform_alt_test(testeeL, A)
 
@@ -284,7 +284,7 @@ def test_mapped_binary_array_constants() -> None:
     def testee(A: np.ndarray) -> np.ndarray:
         return A + jnp.array([[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]])
 
-    A = testutil.mkarray((3, 3))
+    A = testutil.make_array((3, 3))
     _perform_alt_test(testee, A)
 
 
@@ -357,5 +357,5 @@ def test_alt_unary_integer_power() -> None:
     def testee(A: np.ndarray) -> np.ndarray:
         return A**3
 
-    A = testutil.mkarray((10, 2, 3))
+    A = testutil.make_array((10, 2, 3))
     _perform_alt_test(testee, A)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
index 8342b6c..f99ce26 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
@@ -75,7 +75,7 @@ def test_bid_vector(vector_shape: Sequence[int]) -> None:
     def testee(A: np.ndarray) -> jax.Array:
         return jnp.broadcast_to(A, (10, 10))
 
-    A = testutil.mkarray(vector_shape)
+    A = testutil.make_array(vector_shape)
     ref = testee(A)
     res = jace.jit(testee)(A)
     assert res.shape == ref.shape
diff --git a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
index a5bbcdb..58e7d5d 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
@@ -59,7 +59,7 @@ def dst_type(request) -> type:
 def _convert_element_type_impl(input_type: type, output_type: type) -> None:
     """Implementation of the tests of the convert element types primitive."""
     lowering_cnt = [0]
-    A: np.ndarray = testutil.mkarray((10, 10), input_type)
+    A: np.ndarray = testutil.make_array((10, 10), input_type)
     ref: np.ndarray = np.array(A, copy=True, dtype=output_type)
 
     @jace.jit
diff --git a/tests/integration_tests/primitive_translators/test_primitive_copy.py b/tests/integration_tests/primitive_translators/test_primitive_copy.py
index c4a3d62..16e4ec0 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_copy.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_copy.py
@@ -21,7 +21,7 @@ def test_copy() -> None:
     def testee(A: np.ndarray) -> jax.Array:
         return jnp.copy(A)
 
-    A = testutil.mkarray((10, 10, 10))
+    A = testutil.make_array((10, 10, 10))
     res = testee(A)
     assert A.dtype == res.dtype
     assert A.shape == res.shape
diff --git a/tests/integration_tests/primitive_translators/test_primitive_reshape.py b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
index be7d7ff..376cc9a 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_reshape.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
@@ -29,7 +29,7 @@ def _test_impl_reshaping(
     src_shape: Sequence[int], dst_shape: Sequence[int], order: str = "C"
 ) -> None:
     """Performs a reshaping from `src_shape` to `dst_shape`."""
-    A = testutil.mkarray(src_shape)
+    A = testutil.make_array(src_shape)
     A = np.array(A, order=order)  # type: ignore[call-overload]  # MyPy wants a literal as order.
 
     def testee(A: np.ndarray) -> jax.Array:
diff --git a/tests/integration_tests/primitive_translators/test_primitive_select_n.py b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
index a5faa44..dd773a4 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_select_n.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
@@ -35,9 +35,9 @@ def testee(P: np.ndarray, T: np.ndarray, F: np.ndarray) -> jax.Array:
         return jnp.where(P, T, F)
 
     shape = (10, 10)
-    pred = testutil.mkarray(shape, np.bool_)
-    tbranch = testutil.mkarray(shape)
-    fbranch = testutil.mkarray(shape)
+    pred = testutil.make_array(shape, np.bool_)
+    tbranch = testutil.make_array(shape)
+    fbranch = testutil.make_array(shape)
     _perform_test(testee, pred, tbranch, fbranch)
 
 
@@ -52,8 +52,8 @@ def testee3(P: np.ndarray) -> jax.Array:
         return jnp.where(P, 8, 9)
 
     shape = ()
-    pred = testutil.mkarray(shape, np.bool_)
-    tbranch = testutil.mkarray(shape, np.int_)
+    pred = testutil.make_array(shape, np.bool_)
+    tbranch = testutil.make_array(shape, np.int_)
     fbranch = tbranch + 1
 
     _perform_test(testee1, pred, fbranch)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_slicing.py b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
index b5cde93..9b6f9e1 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_slicing.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
@@ -20,12 +20,12 @@
 
 @pytest.fixture()
 def A_20x20x20() -> np.ndarray:
-    return testutil.mkarray((20, 20, 20))
+    return testutil.make_array((20, 20, 20))
 
 
 @pytest.fixture()
 def A_4x4x4x4() -> np.ndarray:
-    return testutil.mkarray((4, 4, 4, 4))
+    return testutil.make_array((4, 4, 4, 4))
 
 
 @pytest.fixture(
diff --git a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
index c82e4bb..d732667 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
@@ -39,7 +39,7 @@ def _roundtrip_implementation(shape: Sequence[int], axis: int | Sequence[int]) -
         shape:  Shape of the input array.
         axes:   A series of axis that should be tried.
     """
-    A = testutil.mkarray(shape)
+    A = testutil.make_array(shape)
     A_org = A.copy()
 
     for ops in [jnp.expand_dims, jnp.squeeze]:
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 3233b2d..8d24d25 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -505,7 +505,7 @@ def wrapped(A: float) -> float:
         lower_cnt[0] += 1
         return scalar_ops(A)
 
-    vals = testutil.mkarray(100)
+    vals = testutil.make_array(100)
     for i in range(vals.size):
         res = wrapped(vals[i])
         ref = scalar_ops(vals[i])
@@ -537,8 +537,8 @@ def test_builder_multiple_return_values() -> None:
     def wrapped(A: np.ndarray, B: np.ndarray) -> tuple[np.ndarray, np.ndarray]:
         return A + B, A - B
 
-    A = testutil.mkarray((2, 2))
-    B = testutil.mkarray((2, 2))
+    A = testutil.make_array((2, 2))
+    B = testutil.make_array((2, 2))
 
     lowered = wrapped.lower(A, B)
     compiled = lowered.compile()
@@ -570,8 +570,8 @@ def test_builder_direct_return() -> None:
     def wrapped(A: np.ndarray, B: np.ndarray) -> tuple[np.ndarray, np.ndarray, np.ndarray]:
         return A + B, B, A
 
-    A = testutil.mkarray((2, 2))
-    B = testutil.mkarray((2, 2))
+    A = testutil.make_array((2, 2))
+    B = testutil.make_array((2, 2))
 
     ref0 = A + B
     res = wrapped(A, B)
@@ -592,7 +592,7 @@ def test_builder_literal_return_value() -> None:
     def testee(A: np.ndarray) -> tuple[np.ndarray, np.float64, np.ndarray]:
         return (A + 1.0, np.float64(1.0), A - 1.0)
 
-    A = testutil.mkarray((2, 2))
+    A = testutil.make_array((2, 2))
     ref = testee(A)
     res = jace.jit(testee)(A)
 
@@ -608,9 +608,9 @@ def test_builder_unused_arg() -> None:
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:  # noqa: ARG001  # Explicitly unused.
         return A + 3.0
 
-    A = testutil.mkarray((10, 10))
-    B = testutil.mkarray((11, 11))
-    C = testutil.mkarray((20, 20))
+    A = testutil.make_array((10, 10))
+    B = testutil.make_array((11, 11))
+    C = testutil.make_array((20, 20))
 
     wrapped = jace.jit(testee)
     lowered = wrapped.lower(A, B)
@@ -646,7 +646,7 @@ def test_builder_F_strides() -> None:
     def testee(A: np.ndarray) -> np.ndarray:
         return A + 10.0
 
-    A = testutil.mkarray((4, 3), order="F")
+    A = testutil.make_array((4, 3), order="F")
     ref = testee(A)
     res = jace.jit(testee)(A)
 
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index f074df8..8818747 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -33,7 +33,7 @@ def wrapped(A: np.ndarray) -> jax.Array:
         lowering_cnt[0] += 1
         return jnp.sin(A)
 
-    A = testutil.mkarray((10, 10))
+    A = testutil.make_array((10, 10))
     ref = np.sin(A)
     res_ids: set[int] = set()
     # We have to store the array, because numpy does reuse the memory.
@@ -67,8 +67,8 @@ def wrapped(A, B):
         return testee(A, B)
 
     # First batch of arguments.
-    A = testutil.mkarray((4, 3))
-    B = testutil.mkarray((4, 3))
+    A = testutil.make_array((4, 3))
+    B = testutil.make_array((4, 3))
 
     # The second batch of argument, same structure, but different values.
     AA = A + 1.0362
@@ -106,12 +106,12 @@ def wrapped(A, B):
         return A * B
 
     # First size of arguments
-    A = testutil.mkarray((4, 3))
-    B = testutil.mkarray((4, 3))
+    A = testutil.make_array((4, 3))
+    B = testutil.make_array((4, 3))
 
     # Second size of arguments
-    C = testutil.mkarray((4, 4))
-    D = testutil.mkarray((4, 4))
+    C = testutil.make_array((4, 4))
+    D = testutil.make_array((4, 4))
 
     # Now lower the function once for each.
     lowered1 = wrapped.lower(A, B)
@@ -141,10 +141,10 @@ def wrapped(A, B):
         lowering_cnt[0] += 1
         return A * 4.0, B + 2.0
 
-    A = testutil.mkarray((4, 30), dtype=np.float64)
-    B = testutil.mkarray((4, 3), dtype=np.float64)
-    C = testutil.mkarray((4, 3), dtype=np.int64)
-    D = testutil.mkarray((6, 3), dtype=np.int64)
+    A = testutil.make_array((4, 30), dtype=np.float64)
+    B = testutil.make_array((4, 3), dtype=np.float64)
+    C = testutil.make_array((4, 3), dtype=np.int64)
+    D = testutil.make_array((6, 3), dtype=np.int64)
 
     # These are the known lowered instances.
     lowerings: dict[tuple[int, int], stages.JaCeLowered] = {}
@@ -188,8 +188,8 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B + C + D + E
 
     # These are the argument
-    A = testutil.mkarray((4, 3))
-    B = testutil.mkarray((4, 3))
+    A = testutil.make_array((4, 3))
+    B = testutil.make_array((4, 3))
 
     # Now we lower it.
     jaceLowered = jaceWrapped.lower(A, B)
@@ -266,7 +266,7 @@ def testee(A: np.ndarray) -> np.ndarray:
     shape = (10, 10)
 
     for i, dtype in enumerate(dtypes):
-        A = testutil.mkarray(shape, dtype=dtype)
+        A = testutil.make_array(shape, dtype=dtype)
 
         # First lowering
         assert lowering_cnt[0] == i
@@ -393,7 +393,7 @@ def wrapped(A: np.ndarray) -> np.ndarray:
         return A + 10.0
 
     shape = (10, 100, 1000)
-    C = testutil.mkarray(shape, order="C")
+    C = testutil.make_array(shape, order="C")
     F = np.array(C, copy=True, order="F")
 
     # First we compile run it with C strides.
@@ -431,7 +431,7 @@ def wrapped(A: np.ndarray | jax.Array) -> np.ndarray | jax.Array:
         _ = wrapped(for_calling)
         assert lowering_cnt[0] == 1, "Expected no further lowering."
 
-    A_numpy = testutil.mkarray((10, 10))
+    A_numpy = testutil.make_array((10, 10))
     A_jax = jnp.array(A_numpy, copy=True)
     assert A_numpy.dtype == A_jax.dtype
 
diff --git a/tests/unit_tests/test_decorator.py b/tests/unit_tests/test_decorator.py
index ca6a0de..a23ca6d 100644
--- a/tests/unit_tests/test_decorator.py
+++ b/tests/unit_tests/test_decorator.py
@@ -32,8 +32,8 @@ def testee(A, B):
         lowering_cnt[0] += 1
         return testee_(A, B)
 
-    A = testutil.mkarray((4, 3))
-    B = testutil.mkarray((4, 3))
+    A = testutil.make_array((4, 3))
+    B = testutil.make_array((4, 3))
 
     lowered = testee.lower(A, B)
     compiled = lowered.compile()
@@ -58,8 +58,8 @@ def testee(A, B):
         lowering_cnt[0] += 1
         return testee_(A, B)
 
-    A = testutil.mkarray((4, 3))
-    B = testutil.mkarray((4, 3))
+    A = testutil.make_array((4, 3))
+    B = testutil.make_array((4, 3))
 
     ref = testee_(A, B)
     res = testee(A, B)
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index 8014826..ad21947 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -27,8 +27,8 @@ def test_jit() -> None:
     def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
         return A + B
 
-    A = testutil.mkarray((4, 3))
-    B = testutil.mkarray((4, 3))
+    A = testutil.make_array((4, 3))
+    B = testutil.make_array((4, 3))
 
     jax_testee = jax.jit(testee)
     jace_testee = jace.jit(testee)
@@ -90,7 +90,7 @@ def jace_fun(A, B, C):
     def jax_fun(A, B, C):
         return jace.jit(base_fun)(A, B, C)
 
-    A, B, C = (testutil.mkarray((10, 3, 50)) for _ in range(3))
+    A, B, C = (testutil.make_array((10, 3, 50)) for _ in range(3))
 
     assert np.allclose(jace_fun(A, B, C), jax_fun(A, B, C))
 
@@ -115,7 +115,7 @@ def f3_jax(A, B, C, D):
     def f3_jace(A, B, C, D):
         return f3_jax(A, B, C, D)
 
-    A, B, C, D = (testutil.mkarray((10, 3, 50)) for _ in range(4))
+    A, B, C, D = (testutil.make_array((10, 3, 50)) for _ in range(4))
 
     ref = ((A + B) - C) * D
     res_jax = f3_jax(A, B, C, D)
@@ -140,7 +140,7 @@ def jace_ddf(x):
         return jace.grad(jace.grad(f))(x)
 
     # These are the random numbers where we test
-    Xs = (testutil.mkarray(10) - 0.5) * 10
+    Xs = (testutil.make_array(10) - 0.5) * 10
 
     for i in range(Xs.shape[0]):
         x = Xs[i]
@@ -183,7 +183,7 @@ def test_disabled_x64() -> None:
     def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
         return A + B
 
-    A = testutil.mkarray((4, 3))
+    A = testutil.make_array((4, 3))
     B = np.float64(10.0)
 
     # Run them with disabled x64 support
@@ -259,7 +259,7 @@ def test_jax_array_as_input() -> None:
     def testee(A: jax.Array) -> jax.Array:
         return jnp.sin(A + 1.0)
 
-    A = jnp.array(testutil.mkarray((10, 19)))
+    A = jnp.array(testutil.make_array((10, 19)))
 
     ref = testee(A)
     res = jace.jit(testee)(A)
@@ -277,7 +277,7 @@ def testee(A: dict[str, np.ndarray]) -> dict[str, jax.Array]:
         mod_a["__additional"] = jnp.asin(A["a1"])
         return mod_a
 
-    A = {f"a{i}": testutil.mkarray((10, 10)) for i in range(4)}
+    A = {f"a{i}": testutil.make_array((10, 10)) for i in range(4)}
     ref = testee(A)
     res = jace.jit(testee)(A)
 
diff --git a/tests/unit_tests/test_misc.py b/tests/unit_tests/test_misc.py
index 3a1fcf6..a2ca5de 100644
--- a/tests/unit_tests/test_misc.py
+++ b/tests/unit_tests/test_misc.py
@@ -31,8 +31,8 @@ def testee(A: np.ndarray) -> np.ndarray:
         return -A
 
     # Different types.
-    A1 = testutil.mkarray((4, 3), dtype=np.float32)
-    A2 = testutil.mkarray((4, 3), dtype=np.int64)
+    A1 = testutil.make_array((4, 3), dtype=np.float32)
+    A2 = testutil.make_array((4, 3), dtype=np.int64)
 
     # Lower and compilation for first type
     callee = testee.lower(A1).compile()
diff --git a/tests/util.py b/tests/util.py
index 558fe3e..45af5aa 100644
--- a/tests/util.py
+++ b/tests/util.py
@@ -20,10 +20,12 @@
     from collections.abc import Mapping, Sequence
 
 
-__all__ = ["mkarray"]
+__all__ = ["make_array"]
 
 
-def mkarray(shape: Sequence[int] | int, dtype: type = np.float64, order: str = "C") -> np.ndarray:
+def make_array(
+    shape: Sequence[int] | int, dtype: type = np.float64, order: str = "C"
+) -> np.ndarray:
     """Generates a NumPy ndarray with shape `shape`.
 
     The function uses the generator that is managed by the `_reset_random_seed()`
@@ -38,7 +40,7 @@ def mkarray(shape: Sequence[int] | int, dtype: type = np.float64, order: str = "
     """
 
     if shape == ():
-        return mkarray((1,), dtype)[0]
+        return make_array((1,), dtype)[0]
     if isinstance(shape, int):
         shape = (shape,)
 
@@ -50,7 +52,7 @@ def mkarray(shape: Sequence[int] | int, dtype: type = np.float64, order: str = "
             low=iinfo.min, high=iinfo.max, size=shape, dtype=dtype
         )
     elif np.issubdtype(dtype, np.complexfloating):
-        res = mkarray(shape, np.float64) + 1.0j * mkarray(shape, np.float64)
+        res = make_array(shape, np.float64) + 1.0j * make_array(shape, np.float64)
     else:
         res = np.random.random(shape)  # type: ignore[assignment]  # noqa: NPY002
     return np.array(res, order=order, dtype=dtype)  # type: ignore[call-overload]

From 744c2b28d8cea6c2ab7a1ba8e43fee688490054d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 13 Jun 2024 15:40:35 +0200
Subject: [PATCH 371/458] Should cover most of the pep whatever naming.

---
 ...primitive_arithmetic_logical_operations.py | 117 +++++++-------
 .../test_primitive_broadcast_in_dim.py        |  20 +--
 .../test_primitive_convert_element_type.py    |  10 +-
 .../test_primitive_copy.py                    |  15 +-
 .../test_primitive_iota.py                    |   8 +-
 .../test_primitive_reshape.py                 |  12 +-
 .../test_primitive_select_n.py                |  16 +-
 .../test_primitive_slicing.py                 |  58 +++----
 .../test_primitive_squeeze_expand_dims.py     |  16 +-
 tests/integration_tests/test_empty_jaxpr.py   |  66 ++++----
 .../test_jaxpr_translator_builder.py          | 104 ++++++-------
 .../test_primitive_translator_managing.py     |  32 ++--
 tests/unit_tests/test_caching.py              | 146 +++++++++---------
 tests/unit_tests/test_decorator.py            |  38 ++---
 tests/unit_tests/test_jax_api.py              |  86 +++++------
 tests/unit_tests/test_misc.py                 |  12 +-
 16 files changed, 377 insertions(+), 379 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index c5dbea0..2764830 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -191,10 +191,7 @@ def _perform_alt_test(testee: Callable, *args: Any) -> None:
     ref = testee(*args)
     res = wrapped(*args)
 
-    if jace.util.is_scalar(ref):
-        # Builder hack, only arrays are generated.
-        assert res.shape == (1,)
-    elif ref.shape == ():
+    if jace.util.is_scalar(ref) or ref.shape == ():
         assert res.shape == (1,)
     else:
         assert ref.shape == res.shape
@@ -206,119 +203,119 @@ def _perform_alt_test(testee: Callable, *args: Any) -> None:
 
 
 def test_mapped_unary_scalar() -> None:
-    def testee(A: np.float64) -> np.float64 | jax.Array:
-        return jnp.cos(A)
+    def testee(a: np.float64) -> np.float64 | jax.Array:
+        return jnp.cos(a)
 
     _perform_alt_test(testee, np.float64(1.0))
 
 
 def test_mapped_unary_array() -> None:
-    def testee(A: np.ndarray) -> jax.Array:
-        return jnp.sin(A)
+    def testee(a: np.ndarray) -> jax.Array:
+        return jnp.sin(a)
 
-    A = testutil.make_array((100, 10, 3))
+    a = testutil.make_array((100, 10, 3))
 
-    _perform_alt_test(testee, A)
+    _perform_alt_test(testee, a)
 
 
 def test_mapped_unary_scalar_literal() -> None:
-    def testee(A: float) -> float | jax.Array:
-        return jnp.sin(1.98) + A
+    def testee(a: float) -> float | jax.Array:
+        return jnp.sin(1.98) + a
 
     _perform_alt_test(testee, 10.0)
 
 
 def test_mapped_binary_scalar() -> None:
-    def testee(A: np.float64, B: np.float64) -> np.float64:
-        return A * B
+    def testee(a: np.float64, B: np.float64) -> np.float64:
+        return a * B
 
     _perform_alt_test(testee, np.float64(1.0), np.float64(2.0))
 
 
 def test_mapped_binary_scalar_partial_literal() -> None:
-    def testeeR(A: np.float64) -> np.float64:
-        return A * 2.03
+    def testeeR(a: np.float64) -> np.float64:
+        return a * 2.03
 
-    def testeeL(A: np.float64) -> np.float64:
-        return 2.03 * A
+    def testeeL(a: np.float64) -> np.float64:
+        return 2.03 * a
 
-    A = np.float64(7.0)
-    _perform_alt_test(testeeR, A)
-    _perform_alt_test(testeeL, A)
+    a = np.float64(7.0)
+    _perform_alt_test(testeeR, a)
+    _perform_alt_test(testeeL, a)
 
 
 def test_mapped_binary_array() -> None:
     """Test binary of arrays, with same size."""
 
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A + B
+    def testee(a: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return a + B
 
-    A = testutil.make_array((100, 10, 3))
+    a = testutil.make_array((100, 10, 3))
     B = testutil.make_array((100, 10, 3))
-    _perform_alt_test(testee, A, B)
+    _perform_alt_test(testee, a, B)
 
 
 def test_mapped_binary_array_scalar() -> None:
-    def testee(A: np.ndarray | np.float64, B: np.float64 | np.ndarray) -> np.ndarray:
-        return A + B  # type: ignore[return-value]  # It is always an array.
+    def testee(a: np.ndarray | np.float64, B: np.float64 | np.ndarray) -> np.ndarray:
+        return a + B  # type: ignore[return-value]  # It is always an array.
 
-    A = testutil.make_array((100, 22))
+    a = testutil.make_array((100, 22))
     B = np.float64(1.34)
-    _perform_alt_test(testee, A, B)
-    _perform_alt_test(testee, B, A)
+    _perform_alt_test(testee, a, B)
+    _perform_alt_test(testee, B, a)
 
 
 def test_mapped_binary_array_partial_literal() -> None:
-    def testeeR(A: np.ndarray) -> np.ndarray:
-        return A + 1.52
+    def testeeR(a: np.ndarray) -> np.ndarray:
+        return a + 1.52
 
-    def testeeL(A: np.ndarray) -> np.ndarray:
-        return 1.52 + A
+    def testeeL(a: np.ndarray) -> np.ndarray:
+        return 1.52 + a
 
-    A = testutil.make_array((100, 22))
-    _perform_alt_test(testeeR, A)
-    _perform_alt_test(testeeL, A)
+    a = testutil.make_array((100, 22))
+    _perform_alt_test(testeeR, a)
+    _perform_alt_test(testeeL, a)
 
 
 def test_mapped_binary_array_constants() -> None:
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A + jnp.array([[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]])
+    def testee(a: np.ndarray) -> np.ndarray:
+        return a + jnp.array([[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]])
 
-    A = testutil.make_array((3, 3))
-    _perform_alt_test(testee, A)
+    a = testutil.make_array((3, 3))
+    _perform_alt_test(testee, a)
 
 
 def test_mapped_broadcast(broadcast_input: tuple[np.ndarray, np.ndarray]) -> None:
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A + B
+    def testee(a: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return a + B
 
-    A = broadcast_input[0]
+    a = broadcast_input[0]
     B = broadcast_input[1]
-    _perform_alt_test(testee, A, B)
-    _perform_alt_test(testee, B, A)
+    _perform_alt_test(testee, a, B)
+    _perform_alt_test(testee, B, a)
 
 
 # <------------ Tests for arithmetic and logical translators/operations
 
 
 def test_alt_general_unary(alt_unary_ops: tuple[Callable, np.ndarray]) -> None:
-    def testee(A: np.ndarray) -> np.ndarray:
-        return alt_unary_ops[0](A)
+    def testee(a: np.ndarray) -> np.ndarray:
+        return alt_unary_ops[0](a)
 
     _perform_alt_test(testee, alt_unary_ops[1])
 
 
 def test_alt_unary_isfinite() -> None:
-    def testee(A: np.ndarray) -> jax.Array:
-        return jnp.isfinite(A)
+    def testee(a: np.ndarray) -> jax.Array:
+        return jnp.isfinite(a)
 
-    A = np.array([np.inf, +np.inf, -np.inf, np.nan, -np.nan, 1.0])
+    a = np.array([np.inf, +np.inf, -np.inf, np.nan, -np.nan, 1.0])
 
     args = dace.Config.get("compiler", "cpu", "args")
     try:
         new_args = args.replace("-ffast-math", "-fno-finite-math-only")
         dace.Config.set("compiler", "cpu", "args", value=new_args)
-        _perform_alt_test(testee, A)
+        _perform_alt_test(testee, a)
 
     finally:
         dace.Config.set("compiler", "cpu", "args", value=args)
@@ -327,8 +324,8 @@ def testee(A: np.ndarray) -> jax.Array:
 def test_alt_general_binary_float(
     alt_binary_ops_float: tuple[Callable, tuple[np.ndarray, np.ndarray]],
 ) -> None:
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return alt_binary_ops_float[0](A, B)
+    def testee(a: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return alt_binary_ops_float[0](a, B)
 
     _perform_alt_test(testee, *alt_binary_ops_float[1])
 
@@ -336,8 +333,8 @@ def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
 def test_alt_compare_operation(
     alt_binary_compare_ops: tuple[Callable, tuple[np.ndarray, np.ndarray]],
 ) -> None:
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return alt_binary_compare_ops[0](A, B)
+    def testee(a: np.ndarray, B: np.ndarray) -> np.ndarray:
+        return alt_binary_compare_ops[0](a, B)
 
     _perform_alt_test(testee, *alt_binary_compare_ops[1])
 
@@ -354,8 +351,8 @@ def testee(*args: np.ndarray) -> np.ndarray:
 
 
 def test_alt_unary_integer_power() -> None:
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A**3
+    def testee(a: np.ndarray) -> np.ndarray:
+        return a**3
 
-    A = testutil.make_array((10, 2, 3))
-    _perform_alt_test(testee, A)
+    a = testutil.make_array((10, 2, 3))
+    _perform_alt_test(testee, a)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
index f99ce26..7d434fd 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_broadcast_in_dim.py
@@ -44,12 +44,12 @@ def vector_shape(request) -> tuple[int, ...]:
 def test_bid_scalar() -> None:
     """Broadcast a scalar to a matrix."""
 
-    def testee(A: float) -> jax.Array:
-        return jnp.broadcast_to(A, (2, 2))
+    def testee(a: float) -> jax.Array:
+        return jnp.broadcast_to(a, (2, 2))
 
-    A = 1.032
-    ref = testee(A)
-    res = jace.jit(testee)(A)
+    a = 1.032
+    ref = testee(a)
+    res = jace.jit(testee)(a)
 
     assert res.shape == ref.shape
     assert res.dtype == ref.dtype
@@ -72,12 +72,12 @@ def testee(a: float) -> jax.Array:
 def test_bid_vector(vector_shape: Sequence[int]) -> None:
     """Broadcast a vector to a tensor."""
 
-    def testee(A: np.ndarray) -> jax.Array:
-        return jnp.broadcast_to(A, (10, 10))
+    def testee(a: np.ndarray) -> jax.Array:
+        return jnp.broadcast_to(a, (10, 10))
 
-    A = testutil.make_array(vector_shape)
-    ref = testee(A)
-    res = jace.jit(testee)(A)
+    a = testutil.make_array(vector_shape)
+    ref = testee(a)
+    res = jace.jit(testee)(a)
     assert res.shape == ref.shape
     assert res.dtype == ref.dtype
     assert np.all(res == ref)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
index 58e7d5d..2e3664d 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_convert_element_type.py
@@ -59,15 +59,15 @@ def dst_type(request) -> type:
 def _convert_element_type_impl(input_type: type, output_type: type) -> None:
     """Implementation of the tests of the convert element types primitive."""
     lowering_cnt = [0]
-    A: np.ndarray = testutil.make_array((10, 10), input_type)
-    ref: np.ndarray = np.array(A, copy=True, dtype=output_type)
+    a: np.ndarray = testutil.make_array((10, 10), input_type)
+    ref: np.ndarray = np.array(a, copy=True, dtype=output_type)
 
     @jace.jit
-    def converter(A: np.ndarray) -> jax.Array:
+    def converter(a: np.ndarray) -> jax.Array:
         lowering_cnt[0] += 1
-        return jnp.array(A, copy=False, dtype=output_type)
+        return jnp.array(a, copy=False, dtype=output_type)
 
-    res = converter(A)
+    res = converter(a)
     assert lowering_cnt[0] == 1
     assert (
         res.dtype == output_type
diff --git a/tests/integration_tests/primitive_translators/test_primitive_copy.py b/tests/integration_tests/primitive_translators/test_primitive_copy.py
index 16e4ec0..0d3b566 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_copy.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_copy.py
@@ -18,11 +18,12 @@
 
 def test_copy() -> None:
     @jace.jit
-    def testee(A: np.ndarray) -> jax.Array:
-        return jnp.copy(A)
+    def testee(a: np.ndarray) -> jax.Array:
+        return jnp.copy(a)
 
-    A = testutil.make_array((10, 10, 10))
-    res = testee(A)
-    assert A.dtype == res.dtype
-    assert A.shape == res.shape
-    assert np.all(res == A)
+    a = testutil.make_array((10, 10, 10))
+    res = testee(a)
+    assert a.dtype == res.dtype
+    assert a.shape == res.shape
+    assert a.__array_interface__["data"][0] != res.__array_interface__["data"][0]
+    assert np.all(res == a)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_iota.py b/tests/integration_tests/primitive_translators/test_primitive_iota.py
index 1fd548a..14e4ac0 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_iota.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_iota.py
@@ -16,8 +16,8 @@
 
 
 def test_iota_arange() -> None:
-    def testee(A: int) -> jax.Array:
-        return jnp.arange(18, dtype=int) + A
+    def testee(a: int) -> jax.Array:
+        return jnp.arange(18, dtype=int) + a
 
     ref = testee(0)
     res = jace.jit(testee)(0)
@@ -28,8 +28,8 @@ def testee(A: int) -> jax.Array:
 def test_iota_broadcast(d) -> None:
     shape = (2, 2, 2, 2)
 
-    def testee(A: np.int32) -> jax.Array:
-        return jax.lax.broadcasted_iota("int32", shape, d) + A
+    def testee(a: np.int32) -> jax.Array:
+        return jax.lax.broadcasted_iota("int32", shape, d) + a
 
     ref = testee(np.int32(0))
     res = jace.jit(testee)(np.int32(0))
diff --git a/tests/integration_tests/primitive_translators/test_primitive_reshape.py b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
index 376cc9a..9d3948f 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_reshape.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
@@ -29,14 +29,14 @@ def _test_impl_reshaping(
     src_shape: Sequence[int], dst_shape: Sequence[int], order: str = "C"
 ) -> None:
     """Performs a reshaping from `src_shape` to `dst_shape`."""
-    A = testutil.make_array(src_shape)
-    A = np.array(A, order=order)  # type: ignore[call-overload]  # MyPy wants a literal as order.
+    a = testutil.make_array(src_shape)
+    a = np.array(a, order=order)  # type: ignore[call-overload]  # MyPy wants a literal as order.
 
-    def testee(A: np.ndarray) -> jax.Array:
-        return jnp.reshape(A, dst_shape)
+    def testee(a: np.ndarray) -> jax.Array:
+        return jnp.reshape(a, dst_shape)
 
-    ref = testee(A)
-    res = jace.jit(testee)(A)
+    ref = testee(a)
+    res = jace.jit(testee)(a)
 
     assert res.shape == dst_shape
     assert np.all(res == ref)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_select_n.py b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
index dd773a4..0981c97 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_select_n.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
@@ -31,8 +31,8 @@ def _perform_test(testee: Callable, *args: Any) -> None:
 
 
 def test_select_n_where() -> None:
-    def testee(P: np.ndarray, T: np.ndarray, F: np.ndarray) -> jax.Array:
-        return jnp.where(P, T, F)
+    def testee(pred: np.ndarray, tbranch: np.ndarray, fbranch: np.ndarray) -> jax.Array:
+        return jnp.where(pred, tbranch, fbranch)
 
     shape = (10, 10)
     pred = testutil.make_array(shape, np.bool_)
@@ -42,14 +42,14 @@ def testee(P: np.ndarray, T: np.ndarray, F: np.ndarray) -> jax.Array:
 
 
 def test_select_n_where_literal() -> None:
-    def testee1(P: np.ndarray, F: np.ndarray) -> jax.Array:
-        return jnp.where(P, 2, F)
+    def testee1(pred: np.ndarray, fbranch: np.ndarray) -> jax.Array:
+        return jnp.where(pred, 2, fbranch)
 
-    def testee2(P: np.ndarray, T: np.ndarray) -> jax.Array:
-        return jnp.where(P, T, 3)
+    def testee2(pred: np.ndarray, tbranch: np.ndarray) -> jax.Array:
+        return jnp.where(pred, tbranch, 3)
 
-    def testee3(P: np.ndarray) -> jax.Array:
-        return jnp.where(P, 8, 9)
+    def testee3(pred: np.ndarray) -> jax.Array:
+        return jnp.where(pred, 8, 9)
 
     shape = ()
     pred = testutil.make_array(shape, np.bool_)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_slicing.py b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
index 9b6f9e1..1615dd0 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_slicing.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
@@ -19,12 +19,12 @@
 
 
 @pytest.fixture()
-def A_20x20x20() -> np.ndarray:
+def a_20x20x20() -> np.ndarray:
     return testutil.make_array((20, 20, 20))
 
 
 @pytest.fixture()
-def A_4x4x4x4() -> np.ndarray:
+def a_4x4x4x4() -> np.ndarray:
     return testutil.make_array((4, 4, 4, 4))
 
 
@@ -41,61 +41,61 @@ def full_dynamic_start_idx(request) -> tuple[int, int, int, int]:
     return request.param
 
 
-def test_slice_no_strides(A_20x20x20: np.ndarray) -> None:
+def test_slice_no_strides(a_20x20x20: np.ndarray) -> None:
     """Test without strides."""
 
-    def testee(A: np.ndarray) -> jax.Array:
-        # Read as: A[2:18, 3:19, 4:17]
-        return jax.lax.slice(A, (2, 3, 4), (18, 19, 17), None)
+    def testee(a: np.ndarray) -> jax.Array:
+        # Read as: a[2:18, 3:19, 4:17]
+        return jax.lax.slice(a, (2, 3, 4), (18, 19, 17), None)
 
-    ref = testee(A_20x20x20)
-    res = jace.jit(testee)(A_20x20x20)
+    ref = testee(a_20x20x20)
+    res = jace.jit(testee)(a_20x20x20)
 
     assert ref.shape == res.shape
     assert np.all(ref == res)
 
 
-def test_slice_strides(A_20x20x20: np.ndarray) -> None:
+def test_slice_strides(a_20x20x20: np.ndarray) -> None:
     """Test with strides."""
 
-    def testee(A: np.ndarray) -> jax.Array:
-        # Read as: A[2:18:1, 3:19:2, 4:17:3]
-        return jax.lax.slice(A, (2, 3, 4), (18, 19, 17), (1, 2, 3))
+    def testee(a: np.ndarray) -> jax.Array:
+        # Read as: a[2:18:1, 3:19:2, 4:17:3]
+        return jax.lax.slice(a, (2, 3, 4), (18, 19, 17), (1, 2, 3))
 
-    ref = testee(A_20x20x20)
-    res = jace.jit(testee)(A_20x20x20)
+    ref = testee(a_20x20x20)
+    res = jace.jit(testee)(a_20x20x20)
 
     assert ref.shape == res.shape
     assert np.all(ref == res)
 
 
 def test_dynamic_slice_full_dynamic(
-    A_4x4x4x4: np.ndarray, full_dynamic_start_idx: tuple[int, int, int, int]
+    a_4x4x4x4: np.ndarray, full_dynamic_start_idx: tuple[int, int, int, int]
 ) -> None:
-    def testee(A: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> jax.Array:
-        return jax.lax.dynamic_slice(A, (s1, s2, s3, s4), (2, 2, 2, 2))
+    def testee(a: np.ndarray, s1: int, s2: int, s3: int, s4: int) -> jax.Array:
+        return jax.lax.dynamic_slice(a, (s1, s2, s3, s4), (2, 2, 2, 2))
 
-    res = jace.jit(testee)(A_4x4x4x4, *full_dynamic_start_idx)
-    ref = testee(A_4x4x4x4, *full_dynamic_start_idx)
+    res = jace.jit(testee)(a_4x4x4x4, *full_dynamic_start_idx)
+    ref = testee(a_4x4x4x4, *full_dynamic_start_idx)
 
     assert np.all(ref == res)
 
 
-def test_dynamic_slice_partially_dynamic(A_4x4x4x4: np.ndarray) -> None:
-    def testee(A: np.ndarray, s1: int, s2: int) -> jax.Array:
-        return jax.lax.dynamic_slice(A, (s1, 1, s2, 2), (2, 2, 2, 2))
+def test_dynamic_slice_partially_dynamic(a_4x4x4x4: np.ndarray) -> None:
+    def testee(a: np.ndarray, s1: int, s2: int) -> jax.Array:
+        return jax.lax.dynamic_slice(a, (s1, 1, s2, 2), (2, 2, 2, 2))
 
-    res = jace.jit(testee)(A_4x4x4x4, 1, 2)
-    ref = testee(A_4x4x4x4, 1, 2)
+    res = jace.jit(testee)(a_4x4x4x4, 1, 2)
+    ref = testee(a_4x4x4x4, 1, 2)
 
     assert np.all(ref == res)
 
 
-def test_dynamic_slice_full_literal(A_4x4x4x4: np.ndarray) -> None:
-    def testee(A: np.ndarray) -> jax.Array:
-        return jax.lax.dynamic_slice(A, (0, 1, 0, 2), (2, 2, 2, 2))
+def test_dynamic_slice_full_literal(a_4x4x4x4: np.ndarray) -> None:
+    def testee(a: np.ndarray) -> jax.Array:
+        return jax.lax.dynamic_slice(a, (0, 1, 0, 2), (2, 2, 2, 2))
 
-    res = jace.jit(testee)(A_4x4x4x4)
-    ref = testee(A_4x4x4x4)
+    res = jace.jit(testee)(a_4x4x4x4)
+    ref = testee(a_4x4x4x4)
 
     assert np.all(ref == res)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
index d732667..5ff6a49 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
@@ -39,20 +39,20 @@ def _roundtrip_implementation(shape: Sequence[int], axis: int | Sequence[int]) -
         shape:  Shape of the input array.
         axes:   A series of axis that should be tried.
     """
-    A = testutil.make_array(shape)
-    A_org = A.copy()
+    a = testutil.make_array(shape)
+    a_org = a.copy()
 
     for ops in [jnp.expand_dims, jnp.squeeze]:
         with jax.experimental.enable_x64():
-            ref = ops(A, axis)  # type: ignore[operator]  # Function of unknown type.
-            res = jace.jit(lambda A: ops(A, axis))(A)  # type: ignore[operator]  # noqa: B023
+            ref = ops(a, axis)  # type: ignore[operator]  # Function of unknown type.
+            res = jace.jit(lambda a: ops(a, axis))(a)  # type: ignore[operator]  # noqa: B023
 
-        assert ref.shape == res.shape, f"A.shape = {shape}; Expected: {ref.shape}; Got: {res.shape}"
+        assert ref.shape == res.shape, f"a.shape = {shape}; Expected: {ref.shape}; Got: {res.shape}"
         assert ref.dtype == res.dtype
         assert np.all(ref == res), f"Value error for shape '{shape}' and axis={axis}"
-        A = np.array(ref, copy=True)  # It is a Jax array, and we have to reverse this.
-    assert A_org.shape == res.shape
-    assert np.all(A_org == res)
+        a = np.array(ref, copy=True)  # It is a Jax array, and we have to reverse this.
+    assert a_org.shape == res.shape
+    assert np.all(a_org == res)
 
 
 @pytest.fixture(params=[0, -1, 1])
diff --git a/tests/integration_tests/test_empty_jaxpr.py b/tests/integration_tests/test_empty_jaxpr.py
index 8bcf195..24d8420 100644
--- a/tests/integration_tests/test_empty_jaxpr.py
+++ b/tests/integration_tests/test_empty_jaxpr.py
@@ -22,69 +22,69 @@
 
 def test_empty_single_return() -> None:
     @jace.jit
-    def wrapped(A: np.ndarray) -> np.ndarray:
-        return A
+    def wrapped(a: np.ndarray) -> np.ndarray:
+        return a
 
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    res = wrapped(A)
+    a = np.arange(12, dtype=np.float64).reshape((4, 3))
+    res = wrapped(a)
 
-    assert np.all(res == A)
-    assert res.__array_interface__["data"][0] != A.__array_interface__["data"][0]
+    assert np.all(res == a)
+    assert res.__array_interface__["data"][0] != a.__array_interface__["data"][0]
 
 
 def test_empty_multiple_return() -> None:
     @jace.jit
-    def wrapped(A: np.ndarray, B: np.float64) -> tuple[np.ndarray, np.float64]:
-        return A, B
+    def wrapped(a: np.ndarray, b: np.float64) -> tuple[np.ndarray, np.float64]:
+        return a, b
 
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.float64(30.0)
-    res = wrapped(A, B)
+    a = np.arange(12, dtype=np.float64).reshape((4, 3))
+    b = np.float64(30.0)
+    res = wrapped(a, b)
 
-    assert np.all(res[0] == A)
-    assert res[1] == B
-    assert res[0].__array_interface__["data"][0] != A.__array_interface__["data"][0]
+    assert np.all(res[0] == a)
+    assert res[1] == b
+    assert res[0].__array_interface__["data"][0] != a.__array_interface__["data"][0]
 
 
 def test_empty_unused_argument() -> None:
     """Empty body and an unused input argument."""
 
     @jace.jit
-    def wrapped(A: np.ndarray, B: np.float64) -> np.ndarray:  # noqa: ARG001  # Explicitly unused.
-        return A
+    def wrapped(a: np.ndarray, b: np.float64) -> np.ndarray:  # noqa: ARG001  # Explicitly unused.
+        return a
 
-    A = np.arange(12, dtype=np.float64).reshape((4, 3))
-    B = np.float64(30.0)
-    lowered = wrapped.lower(A, B)
+    a = np.arange(12, dtype=np.float64).reshape((4, 3))
+    b = np.float64(30.0)
+    lowered = wrapped.lower(a, b)
     compiled = lowered.compile()
-    res = compiled(A, B)
+    res = compiled(a, b)
 
     assert len(lowered._translated_sdfg.inp_names) == 2
     assert len(compiled._csdfg.inp_names) == 2
     assert isinstance(res, np.ndarray)
-    assert np.all(res == A)
-    assert res.__array_interface__["data"][0] != A.__array_interface__["data"][0]
+    assert np.all(res == a)
+    assert res.__array_interface__["data"][0] != a.__array_interface__["data"][0]
 
 
 def test_empty_scalar() -> None:
     @jace.jit
-    def wrapped(A: np.float64) -> np.float64:
-        return A
+    def wrapped(a: np.float64) -> np.float64:
+        return a
 
-    A = np.pi
+    a = np.pi
 
-    assert np.all(wrapped(A) == A)
+    assert np.all(wrapped(a) == a)
 
 
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_empty_nested() -> None:
     @jace.jit
-    def wrapped(A: np.float64) -> np.float64:
-        return jax.jit(lambda A: A)(A)
+    def wrapped(a: np.float64) -> np.float64:
+        return jax.jit(lambda a: a)(a)
 
-    A = np.pi
+    a = np.pi
 
-    assert np.all(wrapped(A) == A)
+    assert np.all(wrapped(a) == a)
 
 
 @pytest.mark.skip(reason="Literal return value is not implemented.")
@@ -112,8 +112,8 @@ def test_empty_with_drop_vars() -> None:
     def testee(a: np.float64, b: np.float64) -> np.float64:
         return a + b
 
-    A = np.e
-    ref = testee(A)
-    res = jace.jit(testee)(A)
+    a = np.e
+    ref = testee(a)
+    res = jace.jit(testee)(a)
 
     assert np.all(ref == res)
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 8d24d25..28c7b86 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -67,7 +67,7 @@ def test_builder_alloc() -> None:
 
     # The reserved names will be tested in `test_builder_fork()`.
     sdfg_name = "qwertzuiopasdfghjkl"
-    jaxpr = jax.make_jaxpr(lambda A: A)(1.0)  # dummy jaxpr, needed for construction.
+    jaxpr = jax.make_jaxpr(lambda x: x)(1.0)  # dummy jaxpr, needed for construction.
     builder._allocate_translation_ctx(name=sdfg_name, jaxpr=jaxpr)
     assert len(builder._ctx_stack) == 1
     assert builder.is_root_translator()
@@ -218,7 +218,7 @@ def test_builder_nested(translation_builder: translator.JaxprTranslationBuilder)
     assert translation_builder.sdfg.number_of_edges() == 1
 
     # Now we go one subcontext deeper.
-    jaxpr = jax.make_jaxpr(lambda A: A)(1.0)  # dummy jaxpr, needed for construction.
+    jaxpr = jax.make_jaxpr(lambda x: x)(1.0)  # dummy jaxpr, needed for construction.
     translation_builder._allocate_translation_ctx(name="builder", jaxpr=jaxpr)
     assert len(translation_builder._ctx_stack) == 2
     assert translation_builder.sdfg.name == "builder"
@@ -475,7 +475,7 @@ def test_builder_constants(translation_builder: translator.JaxprTranslationBuild
     """
     # Create the Jaxpr that we need.
     constant = [[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]]
-    jaxpr = jax.make_jaxpr(lambda A: A + jax.numpy.array(constant))(1.0)
+    jaxpr = jax.make_jaxpr(lambda x: x + jax.numpy.array(constant))(1.0)
 
     # We have to manually allocate the builder context.
     #  You should not do that.
@@ -495,15 +495,15 @@ def test_builder_constants(translation_builder: translator.JaxprTranslationBuild
 def test_builder_scalar_return_value() -> None:
     """Tests if scalars can be returned directly."""
 
-    def scalar_ops(A: float) -> float:
-        return A + A - A * A
+    def scalar_ops(a: float) -> float:
+        return a + a - a * a
 
     lower_cnt = [0]
 
     @jace.jit
-    def wrapped(A: float) -> float:
+    def wrapped(a: float) -> float:
         lower_cnt[0] += 1
-        return scalar_ops(A)
+        return scalar_ops(a)
 
     vals = testutil.make_array(100)
     for i in range(vals.size):
@@ -517,11 +517,11 @@ def test_builder_scalar_return_type() -> None:
     """As Jax we always return an array, even for a scalar."""
 
     @jace.jit
-    def wrapped(A: np.float64) -> np.float64:
-        return A + A - A * A
+    def wrapped(a: np.float64) -> np.float64:
+        return a + a - a * a
 
-    A = np.float64(1.0)
-    res = wrapped(A)
+    a = np.float64(1.0)
+    res = wrapped(a)
     assert res.shape == (1,)
     assert res.dtype == np.float64
     assert res[0] == np.float64(1.0)
@@ -534,17 +534,17 @@ def test_builder_multiple_return_values() -> None:
     """
 
     @jace.jit
-    def wrapped(A: np.ndarray, B: np.ndarray) -> tuple[np.ndarray, np.ndarray]:
-        return A + B, A - B
+    def wrapped(a: np.ndarray, b: np.ndarray) -> tuple[np.ndarray, np.ndarray]:
+        return a + b, a - b
 
-    A = testutil.make_array((2, 2))
-    B = testutil.make_array((2, 2))
+    a = testutil.make_array((2, 2))
+    b = testutil.make_array((2, 2))
 
-    lowered = wrapped.lower(A, B)
+    lowered = wrapped.lower(a, b)
     compiled = lowered.compile()
 
-    ref = (A + B, A - B)
-    res = compiled(A, B)
+    ref = (a + b, a - b)
+    res = compiled(a, b)
 
     assert len(lowered._translated_sdfg.inp_names) == 2
     assert len(compiled._csdfg.inp_names) == 2
@@ -567,34 +567,34 @@ def test_builder_direct_return() -> None:
     """
 
     @jace.jit
-    def wrapped(A: np.ndarray, B: np.ndarray) -> tuple[np.ndarray, np.ndarray, np.ndarray]:
-        return A + B, B, A
+    def wrapped(a: np.ndarray, b: np.ndarray) -> tuple[np.ndarray, np.ndarray, np.ndarray]:
+        return a + b, b, a
 
-    A = testutil.make_array((2, 2))
-    B = testutil.make_array((2, 2))
+    a = testutil.make_array((2, 2))
+    b = testutil.make_array((2, 2))
 
-    ref0 = A + B
-    res = wrapped(A, B)
+    ref0 = a + b
+    res = wrapped(a, b)
 
     assert isinstance(res, tuple)
     assert len(res) == 3
     assert np.allclose(ref0, res[0])
-    assert np.all(res[2] == A)
-    assert res[2].__array_interface__["data"][0] != A.__array_interface__["data"][0]
-    assert np.all(res[1] == B)
-    assert res[1].__array_interface__["data"][0] != B.__array_interface__["data"][0]
+    assert np.all(res[2] == a)
+    assert res[2].__array_interface__["data"][0] != a.__array_interface__["data"][0]
+    assert np.all(res[1] == b)
+    assert res[1].__array_interface__["data"][0] != b.__array_interface__["data"][0]
 
 
 @pytest.mark.skip(reason="Literal return values are not supported.")
 def test_builder_literal_return_value() -> None:
     """Tests if there can be literals in the return values."""
 
-    def testee(A: np.ndarray) -> tuple[np.ndarray, np.float64, np.ndarray]:
-        return (A + 1.0, np.float64(1.0), A - 1.0)
+    def testee(a: np.ndarray) -> tuple[np.ndarray, np.float64, np.ndarray]:
+        return (a + 1.0, np.float64(1.0), a - 1.0)
 
-    A = testutil.make_array((2, 2))
-    ref = testee(A)
-    res = jace.jit(testee)(A)
+    a = testutil.make_array((2, 2))
+    ref = testee(a)
+    res = jace.jit(testee)(a)
 
     assert isinstance(res, tuple)
     assert len(res) == 3
@@ -605,20 +605,20 @@ def testee(A: np.ndarray) -> tuple[np.ndarray, np.float64, np.ndarray]:
 def test_builder_unused_arg() -> None:
     """Tests if there is an unused argument."""
 
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:  # noqa: ARG001  # Explicitly unused.
-        return A + 3.0
+    def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:  # noqa: ARG001  # Explicitly unused.
+        return a + 3.0
 
-    A = testutil.make_array((10, 10))
-    B = testutil.make_array((11, 11))
-    C = testutil.make_array((20, 20))
+    a = testutil.make_array((10, 10))
+    b = testutil.make_array((11, 11))
+    c = testutil.make_array((20, 20))
 
     wrapped = jace.jit(testee)
-    lowered = wrapped.lower(A, B)
+    lowered = wrapped.lower(a, b)
     compiled = lowered.compile()
 
-    ref = testee(A, B)
-    res1 = compiled(A, B)  # Correct call
-    res2 = compiled(A, C)  # wrong call to show that nothing is affected.
+    ref = testee(a, b)
+    res1 = compiled(a, b)  # Correct call
+    res2 = compiled(a, c)  # wrong call to show that nothing is affected.
 
     assert len(lowered._translated_sdfg.inp_names) == 2
     assert len(compiled._csdfg.inp_names) == 2
@@ -643,12 +643,12 @@ def test_builder_F_strides() -> None:
         See also `tests/test_caching.py::test_caching_strides`.
     """
 
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A + 10.0
+    def testee(a: np.ndarray) -> np.ndarray:
+        return a + 10.0
 
-    A = testutil.make_array((4, 3), order="F")
-    ref = testee(A)
-    res = jace.jit(testee)(A)
+    a = testutil.make_array((4, 3), order="F")
+    ref = testee(a)
+    res = jace.jit(testee)(a)
 
     assert ref.shape == res.shape
     assert np.allclose(ref, res)
@@ -658,11 +658,11 @@ def test_builder_drop_variables() -> None:
     """Tests if the builder can handle drop variables."""
 
     @jace.grad
-    def testee(A: np.float64) -> jax.Array:
-        return jnp.exp(jnp.sin(jnp.tan(A**3))) ** 2
+    def testee(a: np.float64) -> jax.Array:
+        return jnp.exp(jnp.sin(jnp.tan(a**3))) ** 2
 
-    A = np.e
-    ref = testee(A)
-    res = jace.jit(testee)(A)
+    a = np.e
+    ref = testee(a)
+    res = jace.jit(testee)(a)
 
     assert np.allclose(ref, res)
diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index 89daded..f4efe3c 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -168,11 +168,11 @@ def still_useless_but_a_bit_less(*args: Any, **kwargs: Any) -> None:  # noqa: AR
         trans_cnt[0] += 1
 
     @jace.jit
-    def foo(A: int) -> int:
-        B = A + 1
-        C = B + 1
-        D = C + 1
-        return D + 1
+    def foo(a: int) -> int:
+        b = a + 1
+        c = b + 1
+        d = c + 1
+        return d + 1
 
     with pytest.warns(
         UserWarning,
@@ -190,27 +190,27 @@ def test_subtranslatior_managing_decoupling() -> None:
 
     # This will use the translators that are currently installed.
     @jace.jit
-    def foo(A: int) -> int:
-        B = A + 1
-        C = B + 1
-        D = C + 1
-        return D + 1
+    def foo(a: int) -> int:
+        b = a + 1
+        c = b + 1
+        d = c + 1
+        return d + 1
 
     # Now register the add translator.
     translator.register_primitive_translator(fake_add_translator, overwrite=True)
 
     # Since `foo` was already constructed, a new registering can not change anything.
-    A = np.zeros((10, 10))
-    assert np.all(foo(A) == 4)
+    a = np.zeros((10, 10))
+    assert np.all(foo(a) == 4)
 
     # But if we now annotate a new function, then we will get fake translator
     @jace.jit
-    def foo_fail(A):
-        B = A + 1
-        return B + 1
+    def foo_fail(a):
+        b = a + 1
+        return b + 1
 
     with pytest.raises(
         expected_exception=NotImplementedError,
         match=re.escape("'fake_add_translator()' was called."),
     ):
-        _ = foo_fail.lower(A)
+        _ = foo_fail.lower(a)
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index 8818747..5a196eb 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -29,18 +29,18 @@ def test_caching_working() -> None:
     lowering_cnt = [0]
 
     @jace.jit
-    def wrapped(A: np.ndarray) -> jax.Array:
+    def wrapped(a: np.ndarray) -> jax.Array:
         lowering_cnt[0] += 1
-        return jnp.sin(A)
+        return jnp.sin(a)
 
-    A = testutil.make_array((10, 10))
-    ref = np.sin(A)
+    a = testutil.make_array((10, 10))
+    ref = np.sin(a)
     res_ids: set[int] = set()
     # We have to store the array, because numpy does reuse the memory.
     res_set: list[np.ndarray] = []
 
     for _ in range(10):
-        res = wrapped(A)
+        res = wrapped(a)
         res_id = res.__array_interface__["data"][0]
 
         assert np.allclose(res, ref)
@@ -57,39 +57,39 @@ def test_caching_same_sizes() -> None:
     lowering_cnt = [0]
 
     # This is the pure Python function.
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A * B
+    def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:
+        return a * b
 
     # this is the wrapped function.
     @jace.jit
-    def wrapped(A, B):
+    def wrapped(a, b):
         lowering_cnt[0] += 1
-        return testee(A, B)
+        return testee(a, b)
 
     # First batch of arguments.
-    A = testutil.make_array((4, 3))
-    B = testutil.make_array((4, 3))
+    a = testutil.make_array((4, 3))
+    b = testutil.make_array((4, 3))
 
     # The second batch of argument, same structure, but different values.
-    AA = A + 1.0362
-    BB = B + 0.638956
+    AA = a + 1.0362
+    BB = b + 0.638956
 
     # Now let's lower it once directly and call it.
-    lowered: stages.JaCeLowered = wrapped.lower(A, B)
+    lowered: stages.JaCeLowered = wrapped.lower(a, b)
     compiled: stages.JaCeCompiled = lowered.compile()
     assert lowering_cnt[0] == 1
-    assert np.allclose(testee(A, B), compiled(A, B))
+    assert np.allclose(testee(a, b), compiled(a, b))
 
     # Now lets call the wrapped object directly, since we already did the lowering
     #  no lowering (and compiling) is needed.
-    assert np.allclose(testee(A, B), wrapped(A, B))
+    assert np.allclose(testee(a, b), wrapped(a, b))
     assert lowering_cnt[0] == 1
 
     # Now lets call it with different objects, that have the same structure.
     #  Again no lowering should happen.
     assert np.allclose(testee(AA, BB), wrapped(AA, BB))
     assert wrapped.lower(AA, BB) is lowered
-    assert wrapped.lower(A, B) is lowered
+    assert wrapped.lower(a, b) is lowered
     assert lowering_cnt[0] == 1
 
 
@@ -101,21 +101,21 @@ def test_caching_different_sizes() -> None:
 
     # This is the wrapped function.
     @jace.jit
-    def wrapped(A, B):
+    def wrapped(a, b):
         lowering_cnt[0] += 1
-        return A * B
+        return a * b
 
     # First size of arguments
-    A = testutil.make_array((4, 3))
-    B = testutil.make_array((4, 3))
+    a = testutil.make_array((4, 3))
+    b = testutil.make_array((4, 3))
 
     # Second size of arguments
-    C = testutil.make_array((4, 4))
-    D = testutil.make_array((4, 4))
+    c = testutil.make_array((4, 4))
+    d = testutil.make_array((4, 4))
 
     # Now lower the function once for each.
-    lowered1 = wrapped.lower(A, B)
-    lowered2 = wrapped.lower(C, D)
+    lowered1 = wrapped.lower(a, b)
+    lowered2 = wrapped.lower(c, d)
     assert lowering_cnt[0] == 2
     assert lowered1 is not lowered2
 
@@ -137,14 +137,14 @@ def test_caching_different_structure() -> None:
     lowering_cnt = [0]
 
     @jace.jit
-    def wrapped(A, B):
+    def wrapped(a, b):
         lowering_cnt[0] += 1
-        return A * 4.0, B + 2.0
+        return a * 4.0, b + 2.0
 
-    A = testutil.make_array((4, 30), dtype=np.float64)
-    B = testutil.make_array((4, 3), dtype=np.float64)
-    C = testutil.make_array((4, 3), dtype=np.int64)
-    D = testutil.make_array((6, 3), dtype=np.int64)
+    a = testutil.make_array((4, 30), dtype=np.float64)
+    b = testutil.make_array((4, 3), dtype=np.float64)
+    c = testutil.make_array((4, 3), dtype=np.int64)
+    d = testutil.make_array((6, 3), dtype=np.int64)
 
     # These are the known lowered instances.
     lowerings: dict[tuple[int, int], stages.JaCeLowered] = {}
@@ -154,7 +154,7 @@ def wrapped(A, B):
     compiled_ids: set[int] = set()
 
     # Generating the lowerings
-    for arg1, arg2 in it.permutations([A, B, C, D], 2):
+    for arg1, arg2 in it.permutations([a, b, c, d], 2):
         lower = wrapped.lower(arg1, arg2)
         compiled = lower.compile()
         assert id(lower) not in lowering_ids
@@ -165,7 +165,7 @@ def wrapped(A, B):
         compiled_ids.add(id(compiled))
 
     # Now check if they are still cached.
-    for arg1, arg2 in it.permutations([A, B, C, D], 2):
+    for arg1, arg2 in it.permutations([a, b, c, d], 2):
         lower = wrapped.lower(arg1, arg2)
         clower = lowerings[id(arg1), id(arg2)]
         assert clower is lower
@@ -181,18 +181,18 @@ def test_caching_compilation() -> None:
     """Tests the compilation cache."""
 
     @jace.jit
-    def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        C = A * B
-        D = C + A
-        E = D + B  # Just enough state.
-        return A + B + C + D + E
+    def jaceWrapped(a: np.ndarray, b: np.ndarray) -> np.ndarray:
+        c = a * b
+        d = c + a
+        e = d + b  # Just enough state.
+        return a + b + c + d + e
 
     # These are the argument
-    A = testutil.make_array((4, 3))
-    B = testutil.make_array((4, 3))
+    a = testutil.make_array((4, 3))
+    b = testutil.make_array((4, 3))
 
     # Now we lower it.
-    jaceLowered = jaceWrapped.lower(A, B)
+    jaceLowered = jaceWrapped.lower(a, b)
 
     # Compiling it with and without optimizations enabled
     optiCompiled = jaceLowered.compile(optimization.DEFAULT_OPTIMIZATIONS)
@@ -216,9 +216,9 @@ def test_caching_compilation_options() -> None:
         lowering_cnt = [0]
 
         @jace.jit
-        def wrapped(A: float) -> float:
+        def wrapped(a: float) -> float:
             lowering_cnt[0] += 1
-            return A + 1.0
+            return a + 1.0
 
         lower_cache = wrapped._cache
         lowered = wrapped.lower(1.0)
@@ -258,23 +258,23 @@ def test_caching_dtype() -> None:
     lowering_cnt = [0]
 
     @jace.jit
-    def testee(A: np.ndarray) -> np.ndarray:
+    def testee(a: np.ndarray) -> np.ndarray:
         lowering_cnt[0] += 1
-        return A + A
+        return a + a
 
     dtypes = [np.float64, np.float32, np.int32, np.int64]
     shape = (10, 10)
 
     for i, dtype in enumerate(dtypes):
-        A = testutil.make_array(shape, dtype=dtype)
+        a = testutil.make_array(shape, dtype=dtype)
 
         # First lowering
         assert lowering_cnt[0] == i
-        _ = testee(A)
+        _ = testee(a)
         assert lowering_cnt[0] == i + 1
 
         # Second, implicit, lowering, which must be cached.
-        assert np.allclose(testee(A), 2 * A)
+        assert np.allclose(testee(a), 2 * a)
         assert lowering_cnt[0] == i + 1
 
 
@@ -282,8 +282,8 @@ def test_caching_eviction_simple() -> None:
     """Simple tests for cache eviction."""
 
     @jace.jit
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A + 1.0
+    def testee(a: np.ndarray) -> np.ndarray:
+        return a + 1.0
 
     cache: tcache.StageCache = testee._cache
     assert len(cache) == 0
@@ -339,8 +339,8 @@ def test_caching_eviction_complex() -> None:
     """Tests if the stuff is properly evicted if the cache is full."""
 
     @jace.jit
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A + 1.0
+    def testee(a: np.ndarray) -> np.ndarray:
+        return a + 1.0
 
     cache: tcache.StageCache = testee._cache
     capacity = cache.capacity
@@ -348,8 +348,8 @@ def testee(A: np.ndarray) -> np.ndarray:
 
     # Lets fill the cache to the brim.
     for i in range(capacity):
-        A = np.ones(i + 10)
-        lowered = testee.lower(A)
+        a = np.ones(i + 10)
+        lowered = testee.lower(a)
         assert len(cache) == i + 1
 
         if i == 0:
@@ -388,24 +388,24 @@ def test_caching_strides() -> None:
     lower_cnt = [0]
 
     @jace.jit
-    def wrapped(A: np.ndarray) -> np.ndarray:
+    def wrapped(a: np.ndarray) -> np.ndarray:
         lower_cnt[0] += 1
-        return A + 10.0
+        return a + 10.0
 
     shape = (10, 100, 1000)
-    C = testutil.make_array(shape, order="C")
-    F = np.array(C, copy=True, order="F")
+    array_c = testutil.make_array(shape, order="c")
+    array_f = np.array(array_c, copy=True, order="F")
 
-    # First we compile run it with C strides.
-    C_lower = wrapped.lower(C)
-    C_res = wrapped(C)
+    # First we compile run it with c strides.
+    lower_c = wrapped.lower(array_c)
+    res_c = wrapped(array_c)
 
-    F_lower = wrapped.lower(F)
-    F_res = F_lower.compile()(F)
+    lower_f = wrapped.lower(array_f)
+    res_f = lower_f.compile()(array_f)
 
-    assert C_res is not F_res
-    assert np.allclose(F_res, C_res)
-    assert F_lower is not C_lower
+    assert res_c is not res_f
+    assert np.allclose(res_f, res_c)
+    assert lower_f is not lower_c
     assert lower_cnt[0] == 2
 
 
@@ -419,9 +419,9 @@ def _test_impl(
         lowering_cnt = [0]
 
         @jace.jit
-        def wrapped(A: np.ndarray | jax.Array) -> np.ndarray | jax.Array:
+        def wrapped(a: np.ndarray | jax.Array) -> np.ndarray | jax.Array:
             lowering_cnt[0] += 1
-            return A + 1.0
+            return a + 1.0
 
         # Explicit lowering.
         _ = wrapped(for_lowering)
@@ -431,9 +431,9 @@ def wrapped(A: np.ndarray | jax.Array) -> np.ndarray | jax.Array:
         _ = wrapped(for_calling)
         assert lowering_cnt[0] == 1, "Expected no further lowering."
 
-    A_numpy = testutil.make_array((10, 10))
-    A_jax = jnp.array(A_numpy, copy=True)
-    assert A_numpy.dtype == A_jax.dtype
+    a_numpy = testutil.make_array((10, 10))
+    a_jax = jnp.array(a_numpy, copy=True)
+    assert a_numpy.dtype == a_jax.dtype
 
-    _test_impl(A_numpy, A_jax)
-    _test_impl(A_jax, A_numpy)
+    _test_impl(a_numpy, a_jax)
+    _test_impl(a_jax, a_numpy)
diff --git a/tests/unit_tests/test_decorator.py b/tests/unit_tests/test_decorator.py
index a23ca6d..7460491 100644
--- a/tests/unit_tests/test_decorator.py
+++ b/tests/unit_tests/test_decorator.py
@@ -22,24 +22,24 @@
 def test_decorator_individually() -> None:
     """Tests the compilation steps individually."""
 
-    def testee_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A + B
+    def testee_(a: np.ndarray, b: np.ndarray) -> np.ndarray:
+        return a + b
 
     lowering_cnt = [0]
 
     @jace.jit
-    def testee(A, B):
+    def testee(a, b):
         lowering_cnt[0] += 1
-        return testee_(A, B)
+        return testee_(a, b)
 
-    A = testutil.make_array((4, 3))
-    B = testutil.make_array((4, 3))
+    a = testutil.make_array((4, 3))
+    b = testutil.make_array((4, 3))
 
-    lowered = testee.lower(A, B)
+    lowered = testee.lower(a, b)
     compiled = lowered.compile()
 
-    ref = testee_(A, B)
-    res = compiled(A, B)
+    ref = testee_(a, b)
+    res = compiled(a, b)
 
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
     assert lowering_cnt[0] == 1
@@ -48,21 +48,21 @@ def testee(A, B):
 def test_decorator_one_go() -> None:
     """Tests the compilation steps in one go."""
 
-    def testee_(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A + B
+    def testee_(a: np.ndarray, b: np.ndarray) -> np.ndarray:
+        return a + b
 
     lowering_cnt = [0]
 
     @jace.jit
-    def testee(A, B):
+    def testee(a, b):
         lowering_cnt[0] += 1
-        return testee_(A, B)
+        return testee_(a, b)
 
-    A = testutil.make_array((4, 3))
-    B = testutil.make_array((4, 3))
+    a = testutil.make_array((4, 3))
+    b = testutil.make_array((4, 3))
 
-    ref = testee_(A, B)
-    res = testee(A, B)
+    ref = testee_(a, b)
+    res = testee(a, b)
 
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
     assert lowering_cnt[0] == 1
@@ -71,8 +71,8 @@ def testee(A, B):
 def test_decorator_wrapped() -> None:
     """Tests if some properties are set correctly."""
 
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A * B
+    def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:
+        return a * b
 
     wrapped = jace.jit(testee)
 
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index ad21947..e308489 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -24,17 +24,17 @@
 def test_jit() -> None:
     """Simple add function."""
 
-    def testee(A: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return A + B
+    def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:
+        return a + b
 
-    A = testutil.make_array((4, 3))
-    B = testutil.make_array((4, 3))
+    a = testutil.make_array((4, 3))
+    b = testutil.make_array((4, 3))
 
     jax_testee = jax.jit(testee)
     jace_testee = jace.jit(testee)
 
-    ref = jax_testee(A, B)
-    res = jace_testee(A, B)
+    ref = jax_testee(a, b)
+    res = jace_testee(a, b)
 
     assert np.allclose(ref, res), f"Expected '{ref}' got '{res}'."
 
@@ -80,19 +80,19 @@ def ddf(x):
 def test_composition_with_jax() -> None:
     """Tests if JaCe can interact with Jax and vice versa."""
 
-    def base_fun(A, B, C):
-        return A + B * jnp.sin(C) - A * B
+    def base_fun(a, b, C):
+        return a + b * jnp.sin(C) - a * b
 
     @jace.jit
-    def jace_fun(A, B, C):
-        return jax.jit(base_fun)(A, B, C)
+    def jace_fun(a, b, C):
+        return jax.jit(base_fun)(a, b, C)
 
-    def jax_fun(A, B, C):
-        return jace.jit(base_fun)(A, B, C)
+    def jax_fun(a, b, C):
+        return jace.jit(base_fun)(a, b, C)
 
-    A, B, C = (testutil.make_array((10, 3, 50)) for _ in range(3))
+    a, b, C = (testutil.make_array((10, 3, 50)) for _ in range(3))
 
-    assert np.allclose(jace_fun(A, B, C), jax_fun(A, B, C))
+    assert np.allclose(jace_fun(a, b, C), jax_fun(a, b, C))
 
 
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
@@ -100,26 +100,26 @@ def test_composition_with_jax_2() -> None:
     """Second test if JaCe can interact with Jax and vice versa."""
 
     @jax.jit
-    def f1_jax(A, B):
-        return A + B
+    def f1_jax(a, b):
+        return a + b
 
     @jace.jit
-    def f2_jace(A, B, C):
-        return f1_jax(A, B) - C
+    def f2_jace(a, b, C):
+        return f1_jax(a, b) - C
 
     @jax.jit
-    def f3_jax(A, B, C, D):
-        return f2_jace(A, B, C) * D
+    def f3_jax(a, b, C, D):
+        return f2_jace(a, b, C) * D
 
     @jace.jit
-    def f3_jace(A, B, C, D):
-        return f3_jax(A, B, C, D)
+    def f3_jace(a, b, C, D):
+        return f3_jax(a, b, C, D)
 
-    A, B, C, D = (testutil.make_array((10, 3, 50)) for _ in range(4))
+    a, b, C, D = (testutil.make_array((10, 3, 50)) for _ in range(4))
 
-    ref = ((A + B) - C) * D
-    res_jax = f3_jax(A, B, C, D)
-    res_jace = f3_jace(A, B, C, D)
+    ref = ((a + b) - C) * D
+    res_jax = f3_jax(a, b, C, D)
+    res_jace = f3_jace(a, b, C, D)
 
     assert np.allclose(ref, res_jax), "Jax failed."
     assert np.allclose(ref, res_jace), "JaCe Failed."
@@ -180,20 +180,20 @@ def test_disabled_x64() -> None:
         Once the x64 issue is resolved make this test a bit more useful.
     """
 
-    def testee(A: np.ndarray, B: np.float64) -> np.ndarray:
-        return A + B
+    def testee(a: np.ndarray, b: np.float64) -> np.ndarray:
+        return a + b
 
-    A = testutil.make_array((4, 3))
-    B = np.float64(10.0)
+    a = testutil.make_array((4, 3))
+    b = np.float64(10.0)
 
     # Run them with disabled x64 support
     #  This is basically a reimplementation of the `JaCeWrapped.lower()` function.
     #  but we have to do it this way to disable the x64 mode in translation.
     with jax.experimental.disable_x64():
-        jaxpr = jax.make_jaxpr(testee)(A, B)
+        jaxpr = jax.make_jaxpr(testee)(a, b)
 
     _, flat_in_vals, _ = ptrans.trace_and_flatten_function(
-        fun=testee, trace_call_args=(A, B), trace_call_kwargs={}, trace_options={}
+        fun=testee, trace_call_args=(a, b), trace_call_kwargs={}, trace_options={}
     )
     builder = translator.JaxprTranslationBuilder(
         primitive_translators=translator.get_registered_primitive_translators()
@@ -256,13 +256,13 @@ def ones10x10() -> jax.Array:
 def test_jax_array_as_input() -> None:
     """This function tests if we use Jax arrays as inputs."""
 
-    def testee(A: jax.Array) -> jax.Array:
-        return jnp.sin(A + 1.0)
+    def testee(a: jax.Array) -> jax.Array:
+        return jnp.sin(a + 1.0)
 
-    A = jnp.array(testutil.make_array((10, 19)))
+    a = jnp.array(testutil.make_array((10, 19)))
 
-    ref = testee(A)
-    res = jace.jit(testee)(A)
+    ref = testee(a)
+    res = jace.jit(testee)(a)
 
     assert res.shape == ref.shape
     assert res.dtype == ref.dtype
@@ -272,14 +272,14 @@ def testee(A: jax.Array) -> jax.Array:
 def test_jax_pytree() -> None:
     """Perform if pytrees are handled correctly."""
 
-    def testee(A: dict[str, np.ndarray]) -> dict[str, jax.Array]:
-        mod_a = {k: jnp.sin(v) for k, v in A.items()}
-        mod_a["__additional"] = jnp.asin(A["a1"])
+    def testee(a: dict[str, np.ndarray]) -> dict[str, jax.Array]:
+        mod_a = {k: jnp.sin(v) for k, v in a.items()}
+        mod_a["__additional"] = jnp.asin(a["a1"])
         return mod_a
 
-    A = {f"a{i}": testutil.make_array((10, 10)) for i in range(4)}
-    ref = testee(A)
-    res = jace.jit(testee)(A)
+    a = {f"a{i}": testutil.make_array((10, 10)) for i in range(4)}
+    ref = testee(a)
+    res = jace.jit(testee)(a)
 
     assert len(res) == len(ref)
     assert type(res) == type(ref)
diff --git a/tests/unit_tests/test_misc.py b/tests/unit_tests/test_misc.py
index a2ca5de..fa235f8 100644
--- a/tests/unit_tests/test_misc.py
+++ b/tests/unit_tests/test_misc.py
@@ -27,16 +27,16 @@ class in DaCe. As I understand the `CompiledSDFG::_construct_args()` function th
     """
 
     @jace.jit
-    def testee(A: np.ndarray) -> np.ndarray:
-        return -A
+    def testee(a: np.ndarray) -> np.ndarray:
+        return -a
 
     # Different types.
-    A1 = testutil.make_array((4, 3), dtype=np.float32)
-    A2 = testutil.make_array((4, 3), dtype=np.int64)
+    a1 = testutil.make_array((4, 3), dtype=np.float32)
+    a2 = testutil.make_array((4, 3), dtype=np.int64)
 
     # Lower and compilation for first type
-    callee = testee.lower(A1).compile()
+    callee = testee.lower(a1).compile()
 
     # But calling with the second type
     with pytest.raises(Exception):  # noqa: B017, PT011 # Unknown exception.
-        _ = callee(A2)
+        _ = callee(a2)

From 9cd0e0128283db379b0da129105fb7893a3149f4 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 14 Jun 2024 07:48:41 +0200
Subject: [PATCH 372/458] This should fix the problems in the CI.

---
 .github/workflows/ci.yml | 2 +-
 CONTRIBUTING.md          | 4 ++--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index b065ed7..0bb29c7 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -50,7 +50,7 @@ jobs:
         allow-prereleases: true
 
     - name: Install requirementes
-      run: python -m pip install -r requirements-dev.txt
+      run: python -m pip install -r requirements/dev.txt
 
     - name: Install package
       run: python -m pip install .
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index 19d5adb..8810f89 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -25,7 +25,7 @@ You can set up a development environment by running:
 python3 -m venv .venv
 source ./.venv/bin/activate
 pip install --upgrade pip setuptools wheel
-pip install -r requirements-dev.txt
+pip install -r requirements/dev.txt
 pip install -v -e .
 ```
 
@@ -34,7 +34,7 @@ If you have the [Python Launcher for Unix](https://github.com/brettcannon/python
 ```bash
 py -m venv .venv
 py -m pip install --upgrade pip setuptools wheel
-py -m pip install -r requirements-dev.txt
+py -m pip install -r requirements/dev.txt
 py -m pip install -v -e .
 ```
 

From 3377f412a81df108a317c4c8758a1d684b32f33d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 14 Jun 2024 10:12:20 +0200
Subject: [PATCH 373/458] Now allowed direct return values even in non empty
 Jaxpr.

---
 src/jace/stages.py                            |  2 +-
 src/jace/translator/pre_post_translation.py   | 48 +++++++++++--------
 .../test_jaxpr_translator_builder.py          |  1 -
 tests/unit_tests/test_jax_api.py              |  2 +-
 4 files changed, 30 insertions(+), 23 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index 8806787..a84cf4a 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -159,7 +159,7 @@ def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
         tsdfg: jace.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
             trans_ctx=trans_ctx,
             fun=self.wrapped_fun,
-            call_args=flat_call_args,
+            flat_call_args=flat_call_args,
         )
 
         # NOTE: `tsdfg` is deepcopied as a side effect of post processing.
diff --git a/src/jace/translator/pre_post_translation.py b/src/jace/translator/pre_post_translation.py
index 5fef3af..9432e01 100644
--- a/src/jace/translator/pre_post_translation.py
+++ b/src/jace/translator/pre_post_translation.py
@@ -30,7 +30,7 @@
 def postprocess_jaxpr_sdfg(
     trans_ctx: translator.TranslationContext,
     fun: Callable,  # noqa: ARG001  # Currently unused
-    call_args: Sequence[Any],
+    flat_call_args: Sequence[Any],
     validate: bool = True,
 ) -> jace.TranslatedJaxprSDFG:
     """
@@ -42,7 +42,7 @@ def postprocess_jaxpr_sdfg(
     Args:
         trans_ctx: The `TranslationContext` obtained from a `translate_jaxpr()` call.
         fun: The original function that was translated.
-        call_args: The flattened input arguments.
+        flat_call_args: The flattened input arguments.
         validate: Perform validation.
 
     Todo:
@@ -50,12 +50,12 @@ def postprocess_jaxpr_sdfg(
         - Fixing stride problem of the input.
     """
     trans_ctx.validate()  # Always validate, it is cheap.
-    create_input_output_stages(trans_ctx=trans_ctx, call_args=call_args)
+    create_input_output_stages(trans_ctx=trans_ctx, flat_call_args=flat_call_args)
     return finalize_translation_context(trans_ctx, validate=validate)
 
 
 def create_input_output_stages(
-    trans_ctx: translator.TranslationContext, call_args: Sequence[Any]
+    trans_ctx: translator.TranslationContext, flat_call_args: Sequence[Any]
 ) -> None:
     """
     Creates an input and output state inside the SDFG in place.
@@ -64,12 +64,12 @@ def create_input_output_stages(
 
     Args:
         trans_ctx: The translation context that should be modified.
-        call_args: The flattened call arguments that should be used.
+        flat_call_args: The flattened call arguments that should be used.
 
     Note:
         The processed SDFG will remain canonical.
     """
-    _create_input_state(trans_ctx, call_args)
+    _create_input_state(trans_ctx, flat_call_args)
     _create_output_state(trans_ctx)
 
 
@@ -87,8 +87,13 @@ def _create_output_state(trans_ctx: translator.TranslationContext) -> None:
     """
     assert trans_ctx.inp_names is not None and trans_ctx.out_names is not None
 
-    if set(trans_ctx.inp_names).intersection(trans_ctx.out_names):
-        raise NotImplementedError("Shared input and output variables are not supported yet.")
+    # NOTE: Currently we do not support to write back into an input argument, as Jax.
+    #  However, this is a requirement for handling ICON stencils, that we will support
+    #  eventually. If we get a translation context that lists a variable name in the
+    #  inputs and outputs, this means that it was returned unmodified. In Jax this
+    #  will lead to a copy and we also do it. This is implemented by just naïvely
+    #  creating a separate output variable for every output we have, irrespectively
+    #  of its name inside the Jaxpr.
 
     output_pattern = "__jace_output_{}"
     sdfg = trans_ctx.sdfg
@@ -129,19 +134,20 @@ def _create_output_state(trans_ctx: translator.TranslationContext) -> None:
     trans_ctx.out_names = tuple(new_output_names)
 
 
-def _create_input_state(trans_ctx: translator.TranslationContext, call_args: Sequence[Any]) -> None:
+def _create_input_state(
+    trans_ctx: translator.TranslationContext, flat_call_args: Sequence[Any]
+) -> None:
     """
     Creates the input processing state for the SDFG in place.
 
-    The function will create a new set of variables that are exposed as inputs. If an
-    input argument is an array, the new variable will have the same strides and storage
-    location the actual input value, that is passed inside `call_args`. If the input is
-    a scalar and GPU mode is activated, the function will add the necessary connections
-    to transfer it to the device.
+    The function will create a new set of variables that are exposed as inputs. This
+    variables are based on the example input arguments passed through `flat_call_args`.
+    This process will hard code the memory location and strides into the SDFG.
+    The assignment is performed inside a new state, which is put at the beginning.
 
     Args:
         trans_ctx: The translation context that should be modified.
-        call_args: The flattened call arguments for which the input
+        flat_call_args: The flattened call arguments for which the input
             state should be specialized.
 
     Todo:
@@ -149,17 +155,19 @@ def _create_input_state(trans_ctx: translator.TranslationContext, call_args: Seq
     """
     assert trans_ctx.inp_names is not None and trans_ctx.out_names is not None
 
-    if set(trans_ctx.inp_names).intersection(trans_ctx.out_names):
-        raise NotImplementedError("Shared input and output variables are not supported yet.")
-    if len(call_args) != len(trans_ctx.inp_names):
-        raise ValueError(f"Expected {len(trans_ctx.inp_names)}, but got {len(call_args)}.")
+    # NOTE: This function will create a distinct variable for every input. Once we
+    #  allow write back arguments they will be handled in the `_create_output_state()`
+    #  function anyway, also see the comment in that function.
+
+    if len(flat_call_args) != len(trans_ctx.inp_names):
+        raise ValueError(f"Expected {len(trans_ctx.inp_names)}, but got {len(flat_call_args)}.")
 
     sdfg = trans_ctx.sdfg
     new_input_state: dace.SDFGState = sdfg.add_state(f"{sdfg.name}__start_state")
     new_input_names: list[str] = []
     input_pattern = "__jace_input_{}"
 
-    for i, (org_input_name, call_arg) in enumerate(zip(trans_ctx.inp_names, call_args)):
+    for i, (org_input_name, call_arg) in enumerate(zip(trans_ctx.inp_names, flat_call_args)):
         org_input_desc: dace.data.Data = sdfg.arrays[org_input_name]
         new_input_name = input_pattern.format(i)
 
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 28c7b86..da941a3 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -555,7 +555,6 @@ def wrapped(a: np.ndarray, b: np.ndarray) -> tuple[np.ndarray, np.ndarray]:
     assert np.allclose(ref, res)
 
 
-@pytest.mark.skip(reason="Direct returns, in a non empty context does not work yet.")
 def test_builder_direct_return() -> None:
     """Tests the case, when an input value is returned as output.
 
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index e308489..47ce672 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -201,7 +201,7 @@ def testee(a: np.ndarray, b: np.float64) -> np.ndarray:
     trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
 
     tsdfg: jace.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
-        trans_ctx=trans_ctx, fun=testee, call_args=flat_in_vals
+        trans_ctx=trans_ctx, fun=testee, flat_call_args=flat_in_vals
     )
 
     # Because x64 is disabled Jax traces the input as float32, even if we have passed

From 272dd007a3a4d8b3e56749213d09bac216a4ab37 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 14 Jun 2024 10:33:44 +0200
Subject: [PATCH 374/458] Bump version.

---
 .pre-commit-config.yaml |  2 +-
 requirements/base.txt   | 30 ++++--------------------------
 requirements/cuda12.txt |  2 +-
 requirements/dev.txt    | 10 ++++++++++
 4 files changed, 16 insertions(+), 28 deletions(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 255e6ed..4e4b514 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -68,7 +68,7 @@ repos:
     files: src|tests
     args: [--no-install-types]
     additional_dependencies:
-    - dace==0.15.1
+    - dace==0.16
     - jax[cpu]==0.4.29
     - numpy==1.26.4
     - pytest==8.2.2
diff --git a/requirements/base.txt b/requirements/base.txt
index 1aae055..70bc827 100644
--- a/requirements/base.txt
+++ b/requirements/base.txt
@@ -9,36 +9,20 @@ aenum==3.1.15
     # via dace
 astunparse==1.6.3
     # via dace
-blinker==1.8.2
-    # via flask
-certifi==2024.6.2
-    # via requests
-charset-normalizer==3.3.2
-    # via requests
-click==8.1.7
-    # via flask
-dace==0.15.1
+dace==0.16
     # via -r requirements/base.in
 dill==0.3.8
     # via dace
-flask==3.0.3
-    # via dace
 fparser==0.1.4
     # via dace
-idna==3.7
-    # via requests
-itsdangerous==2.2.0
-    # via flask
 jax[cpu]==0.4.29
     # via -r requirements/base.in
 jaxlib==0.4.29
     # via jax
 jinja2==3.1.4
-    # via flask
+    # via dace
 markupsafe==2.1.5
-    # via
-    #   jinja2
-    #   werkzeug
+    # via jinja2
 ml-dtypes==0.4.0
     # via
     #   jax
@@ -64,8 +48,6 @@ ply==3.11
     # via dace
 pyyaml==6.0.1
     # via dace
-requests==2.32.3
-    # via dace
 scipy==1.13.1
     # via
     #   jax
@@ -74,16 +56,12 @@ setuptools-scm==8.1.0
     # via fparser
 six==1.16.0
     # via astunparse
-sympy==1.9
+sympy==1.12.1
     # via dace
 tomli==2.0.1
     # via setuptools-scm
-urllib3==2.2.1
-    # via requests
 websockets==12.0
     # via dace
-werkzeug==3.0.3
-    # via flask
 wheel==0.43.0
     # via astunparse
 
diff --git a/requirements/cuda12.txt b/requirements/cuda12.txt
index 078edf2..ebeb3aa 100644
--- a/requirements/cuda12.txt
+++ b/requirements/cuda12.txt
@@ -10,7 +10,7 @@ alembic==1.13.1
     # via optuna
 colorlog==6.8.2
     # via optuna
-cupy-cuda12x==13.1.0
+cupy-cuda12x==13.2.0
     # via -r requirements/cuda12.in
 fastrlock==0.8.2
     # via cupy-cuda12x
diff --git a/requirements/dev.txt b/requirements/dev.txt
index 176b9a2..a112135 100644
--- a/requirements/dev.txt
+++ b/requirements/dev.txt
@@ -12,6 +12,10 @@ babel==2.15.0
     # via sphinx
 beautifulsoup4==4.12.3
     # via furo
+certifi==2024.6.2
+    # via requests
+charset-normalizer==3.3.2
+    # via requests
 coverage[toml]==7.5.3
     # via pytest-cov
 docutils==0.21.2
@@ -22,6 +26,8 @@ exceptiongroup==1.2.1
     # via pytest
 furo==2024.5.6
     # via -r requirements/dev.in
+idna==3.7
+    # via requests
 imagesize==1.4.1
     # via sphinx
 iniconfig==2.0.0
@@ -52,6 +58,8 @@ pytest==8.2.2
     #   pytest-cov
 pytest-cov==5.0.0
     # via -r requirements/dev.in
+requests==2.32.3
+    # via sphinx
 ruff==0.4.8
     # via -r requirements/dev.in
 snowballstemmer==2.2.0
@@ -90,6 +98,8 @@ typing-extensions==4.12.2
     # via
     #   -r requirements/dev.in
     #   mypy
+urllib3==2.2.1
+    # via requests
 
 # The following packages are considered to be unsafe in a requirements file:
 # setuptools

From 3e5408baee174c11ab0f04263cf09f851164f8b2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 14 Jun 2024 13:46:32 +0200
Subject: [PATCH 375/458] Bump version.

---
 .pre-commit-config.yaml | 2 +-
 pyproject.toml          | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 586cb6f..451bc29 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -69,7 +69,7 @@ repos:
     files: src|tests
     args: [--no-install-types]
     additional_dependencies:
-    - dace==0.15.1
+    - dace==0.16
     - jax[cpu]==0.4.28
     - numpy==1.26.4
     - pytest==8.2.1
diff --git a/pyproject.toml b/pyproject.toml
index e4f1d11..17955c7 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -24,7 +24,7 @@ classifiers = [
   "Typing :: Typed",
 ]
 dependencies = [
-  "dace>=0.15",
+  "dace>=0.16",
   "jax[cpu]>=0.4.24",
   "numpy>=1.26.0",
 ]

From 3f1d2ad111d0127160ee201f86289e7d988cb72f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 14 Jun 2024 13:49:41 +0200
Subject: [PATCH 376/458] Updated the ignore file to also include some JaCe
 stuff.

---
 .gitignore | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/.gitignore b/.gitignore
index 15604f3..e49382d 100644
--- a/.gitignore
+++ b/.gitignore
@@ -155,6 +155,10 @@ Thumbs.db
 
 # DaCe
 .dacecache/
+_dacegraphs
+
+# JaCe
+.jacecache/
 
 # Common editor files
 *~

From e6730d121905b0e994f3b6447132815949a61adc Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 14 Jun 2024 14:11:09 +0200
Subject: [PATCH 377/458] Moved tracing to its own top level module.

It is used by the translator but it does not belong into `translator`.
---
 src/jace/stages.py                          |  4 +-
 src/jace/tracing.py                         | 88 +++++++++++++++++++++
 src/jace/translator/pre_post_translation.py | 67 +---------------
 tests/unit_tests/test_jax_api.py            |  4 +-
 4 files changed, 93 insertions(+), 70 deletions(-)
 create mode 100644 src/jace/tracing.py

diff --git a/src/jace/stages.py b/src/jace/stages.py
index a84cf4a..6cb960c 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -34,7 +34,7 @@
 from jax import tree_util as jax_tree
 
 import jace
-from jace import optimization, translator, util
+from jace import optimization, tracing, translator, util
 from jace.optimization import CompilerOptions
 from jace.translator import pre_post_translation as ptrans
 from jace.util import translation_cache as tcache
@@ -146,7 +146,7 @@ def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
         Note:
             The tracing is always done with activated `x64` mode.
         """
-        jaxpr, flat_call_args, outtree = ptrans.trace_and_flatten_function(
+        jaxpr, flat_call_args, outtree = tracing.trace_and_flatten_function(
             fun=self._fun,
             trace_call_args=args,
             trace_call_kwargs=kwargs,
diff --git a/src/jace/tracing.py b/src/jace/tracing.py
new file mode 100644
index 0000000..b755756
--- /dev/null
+++ b/src/jace/tracing.py
@@ -0,0 +1,88 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""
+Implements the tracing machinery that is used to build the Jaxpr.
+
+Essentially, Jax provides `jax.make_jaxpr()` which is essentially a debug utility. Jax
+does not provide any public way to get a Jaxpr. This module provides the necessary
+functionality for use in JaCe.
+"""
+
+from __future__ import annotations
+
+import inspect
+from typing import TYPE_CHECKING, Any
+
+import jax
+from jax import tree_util as jax_tree
+
+
+if TYPE_CHECKING:
+    from collections.abc import Callable, Mapping, Sequence
+
+
+def trace_and_flatten_function(
+    fun: Callable,
+    trace_call_args: Sequence[Any],
+    trace_call_kwargs: Mapping[str, Any],
+    trace_options: Mapping[str, Any],
+) -> tuple[jax.core.ClosedJaxpr, list[Any], jax_tree.PyTreeDef]:
+    """
+    Traces `fun` and generates the Jaxpr and some related meta data.
+
+    For tracing the computation `fun` the function uses the `trace_call_args`
+    and `trace_call_kwargs` arguments, both should not be flattened. Furthermore,
+    the tracing is done in enabled x64 mode.
+
+    Returns:
+        The function will return a tuple of length three.
+        1) The Jaxpr that was generated by Jax using the supplied arguments and options.
+        2) The flattened input.
+        3) A pytree describing the output.
+
+    Args:
+        fun: The original Python computation.
+        trace_call_args: The positional arguments that should be used for
+            tracing the computation.
+        trace_call_kwargs: The keyword arguments that should be used for
+            tracing the computation.
+        trace_options: The options used for tracing, the same arguments that
+            are supported by `jace.jit`.
+
+    Todo:
+        - Handle default arguments of `fun`.
+        - Handle static arguments.
+        - Turn `trace_options` into a `TypedDict` and sync with `jace.jit`.
+    """
+    if trace_options:
+        raise NotImplementedError(
+            f"Not supported tracing options: {', '.join(f'{k}' for k in trace_options)}"
+        )
+    assert all(param.default is param.empty for param in inspect.signature(fun).parameters.values())
+
+    # In Jax `float32` is the main datatype, and they go to great lengths to avoid some
+    #  aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
+    #  However, in this case we will have problems when we call the SDFG, for some
+    #  reasons `CompiledSDFG` does not work in that case correctly, thus we enable it
+    #  for the tracing.
+    with jax.experimental.enable_x64():
+        # TODO(phimuell): copy the implementation of the real tracing
+        jaxpr, outshapes = jax.make_jaxpr(fun, return_shape=True)(
+            *trace_call_args, **trace_call_kwargs
+        )
+
+    # Regardless what the documentation of `make_jaxpr` claims, it does not output a
+    #  pytree instead an abstract description of the shape, that we will transform into
+    #  a pytree.
+    outtree = jax_tree.tree_structure(outshapes)
+
+    # Make the input tree
+    flat_in_vals = jax_tree.tree_leaves((trace_call_args, trace_call_kwargs))
+    assert len(jaxpr.in_avals) == len(flat_in_vals), "Static arguments not implemented."
+
+    return jaxpr, flat_in_vals, outtree
diff --git a/src/jace/translator/pre_post_translation.py b/src/jace/translator/pre_post_translation.py
index 9432e01..c2a79cb 100644
--- a/src/jace/translator/pre_post_translation.py
+++ b/src/jace/translator/pre_post_translation.py
@@ -10,19 +10,16 @@
 from __future__ import annotations
 
 import copy
-import inspect
 from typing import TYPE_CHECKING, Any
 
 import dace
-import jax
-from jax import tree_util as jax_tree
 
 import jace
 from jace import util
 
 
 if TYPE_CHECKING:
-    from collections.abc import Callable, Mapping, Sequence
+    from collections.abc import Callable, Sequence
 
     from jace import translator
 
@@ -252,65 +249,3 @@ def finalize_translation_context(
     if validate:
         tsdfg.validate()
     return tsdfg
-
-
-def trace_and_flatten_function(
-    fun: Callable,
-    trace_call_args: Sequence[Any],
-    trace_call_kwargs: Mapping[str, Any],
-    trace_options: Mapping[str, Any],
-) -> tuple[jax.core.ClosedJaxpr, list[Any], jax_tree.PyTreeDef]:
-    """
-    Traces `fun` and generates the Jaxpr and some related meta data.
-
-    For tracing the computation `fun` the function uses the `trace_call_args`
-    and `trace_call_kwargs` arguments, both should not be flattened. Furthermore,
-    the tracing is done in enabled x64 mode.
-
-    Returns:
-        The function will return a tuple of length three.
-        1) The Jaxpr that was generated by Jax using the supplied arguments and options.
-        2) The flattened input.
-        3) A pytree describing the output.
-
-    Args:
-        fun: The original Python computation.
-        trace_call_args: The positional arguments that should be used for
-            tracing the computation.
-        trace_call_kwargs: The keyword arguments that should be used for
-            tracing the computation.
-        trace_options: The options used for tracing, the same arguments that
-            are supported by `jace.jit`.
-
-    Todo:
-        - Handle default arguments of `fun`.
-        - Handle static arguments.
-        - Turn `trace_options` into a `TypedDict` and sync with `jace.jit`.
-    """
-    if trace_options:
-        raise NotImplementedError(
-            f"Not supported tracing options: {', '.join(f'{k}' for k in trace_options)}"
-        )
-    assert all(param.default is param.empty for param in inspect.signature(fun).parameters.values())
-
-    # In Jax `float32` is the main datatype, and they go to great lengths to avoid some
-    #  aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
-    #  However, in this case we will have problems when we call the SDFG, for some
-    #  reasons `CompiledSDFG` does not work in that case correctly, thus we enable it
-    #  for the tracing.
-    with jax.experimental.enable_x64():
-        # TODO(phimuell): copy the implementation of the real tracing
-        jaxpr, outshapes = jax.make_jaxpr(fun, return_shape=True)(
-            *trace_call_args, **trace_call_kwargs
-        )
-
-    # Regardless what the documentation of `make_jaxpr` claims, it does not output a
-    #  pytree instead an abstract description of the shape, that we will transform into
-    #  a pytree.
-    outtree = jax_tree.tree_structure(outshapes)
-
-    # Make the input tree
-    flat_in_vals = jax_tree.tree_leaves((trace_call_args, trace_call_kwargs))
-    assert len(jaxpr.in_avals) == len(flat_in_vals), "Static arguments not implemented."
-
-    return jaxpr, flat_in_vals, outtree
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index 47ce672..b3d44b0 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -15,7 +15,7 @@
 from jax import numpy as jnp
 
 import jace
-from jace import translator, util
+from jace import tracing, translator, util
 from jace.translator import pre_post_translation as ptrans
 
 from tests import util as testutil
@@ -192,7 +192,7 @@ def testee(a: np.ndarray, b: np.float64) -> np.ndarray:
     with jax.experimental.disable_x64():
         jaxpr = jax.make_jaxpr(testee)(a, b)
 
-    _, flat_in_vals, _ = ptrans.trace_and_flatten_function(
+    _, flat_in_vals, _ = tracing.trace_and_flatten_function(
         fun=testee, trace_call_args=(a, b), trace_call_kwargs={}, trace_options={}
     )
     builder = translator.JaxprTranslationBuilder(

From 82cf898960668fb0da812d30dbb202554ec37aac Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 14 Jun 2024 14:19:31 +0200
Subject: [PATCH 378/458] Updated the ROADMAP.

---
 ROADMAP.md | 11 ++++++-----
 1 file changed, 6 insertions(+), 5 deletions(-)

diff --git a/ROADMAP.md b/ROADMAP.md
index ec14397..2633585 100644
--- a/ROADMAP.md
+++ b/ROADMAP.md
@@ -4,11 +4,11 @@ A kind of roadmap that gives a rough idea about how the project will be continue
 
 - [x] Being able to perform _some_ translations [PR#3](https://github.com/GridTools/jace/pull/3).
 - [ ] Basic functionalities:
-  - [ ] Annotation `@jace.jit`.
-  - [ ] Composable with Jax, i.e. take the Jax derivative of a JaCe annotated function.
-  - [ ] Implementing the `stages` model that is supported by Jax.
-  - [ ] Handling Jax arrays as native input (only on single host).
-  - [ ] Cache the compilation and lowering results for later reuse.
+  - [x] Annotation `@jace.jit`.
+  - [x] Composable with Jax, i.e. take the Jax derivative of a JaCe annotated function.
+  - [x] Implementing the `stages` model that is supported by Jax.
+  - [x] Handling Jax arrays as native input (only on single host).
+  - [x] Cache the compilation and lowering results for later reuse.
     In Jax these parts (together with the dispatch) are actually written in C++, thus in the beginning we will use a self made cache.
 - [ ] Implementing some basic `PrimitiveTranslators`, that allows us to run some early tests, such as:
   - [ ] Backporting the ones from the prototype.
@@ -23,6 +23,7 @@ A kind of roadmap that gives a rough idea about how the project will be continue
   But passing these benchmarks could give us some better hint of how to proceed in this matter.
   - [ ] Passing the [pyhpc-benchmark](https://github.com/dionhaefner/pyhpc-benchmarks)
   - [ ] Passing Felix' fluid project; possibility.
+  - [ ] Flash-Attention, there is a DaCe implementation.
 - [ ] Support of static arguments.
 - [ ] Stop relying on `jax.make_jaxpr()`.
   Look at the `jax._src.pjit.make_jit()` function for how to hijack the staging process.

From da57db9132719296b1d2efed12e92d445e602f0b Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Fri, 14 Jun 2024 15:08:33 +0200
Subject: [PATCH 379/458] Improve developer documentation and add devenv
 session setup to nox

---
 .github/workflows/ci.yml    |   2 +-
 .pre-commit-config.yaml     |   2 +-
 CONTRIBUTING.md             |   9 ++-
 noxfile.py                  | 152 ++++++++++++++++++++++++++----------
 requirements/base.txt       |  30 +------
 requirements/cuda12.txt     |   2 +-
 requirements/dev-cuda12.in  |   2 +-
 requirements/dev-cuda12.txt |   4 +-
 requirements/dev.in         |   6 +-
 requirements/dev.txt        |  45 ++++++++++-
 10 files changed, 174 insertions(+), 80 deletions(-)

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index b065ed7..0bb29c7 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -50,7 +50,7 @@ jobs:
         allow-prereleases: true
 
     - name: Install requirementes
-      run: python -m pip install -r requirements-dev.txt
+      run: python -m pip install -r requirements/dev.txt
 
     - name: Install package
       run: python -m pip install .
diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 255e6ed..4e4b514 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -68,7 +68,7 @@ repos:
     files: src|tests
     args: [--no-install-types]
     additional_dependencies:
-    - dace==0.15.1
+    - dace==0.16
     - jax[cpu]==0.4.29
     - numpy==1.26.4
     - pytest==8.2.2
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index 19d5adb..1b060b1 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -9,6 +9,7 @@ The fastest way to start with development is to use nox. If you don't have nox,
 To use, run `nox`. This will lint and test using every installed version of Python on your system, skipping ones that are not installed. You can also run specific jobs:
 
 ```console
+$ nox -s venv-3.10  # (or venv-3.11, or venv-3.12) Setup a fully working development envinroment
 $ nox -s lint  # Lint only
 $ nox -s tests  # Python tests
 $ nox -s docs -- --serve  # Build and serve the docs
@@ -25,16 +26,16 @@ You can set up a development environment by running:
 python3 -m venv .venv
 source ./.venv/bin/activate
 pip install --upgrade pip setuptools wheel
-pip install -r requirements-dev.txt
+pip install -r requirements/dev.txt
 pip install -v -e .
 ```
 
-If you have the [Python Launcher for Unix](https://github.com/brettcannon/python-launcher), you can instead do:
+Or, if you have the [Python Launcher for Unix](https://github.com/brettcannon/python-launcher), you could do:
 
 ```bash
 py -m venv .venv
 py -m pip install --upgrade pip setuptools wheel
-py -m pip install -r requirements-dev.txt
+py -m pip install -r requirements/dev.txt
 py -m pip install -v -e .
 ```
 
@@ -43,7 +44,7 @@ py -m pip install -v -e .
 You should prepare pre-commit, which will help you by checking that commits pass required checks:
 
 ```bash
-pip install pre-commit # or brew install pre-commit on macOS
+pipx install pre-commit # or brew install pre-commit on macOS
 pre-commit install # Will install a pre-commit hook into the git repo
 ```
 
diff --git a/noxfile.py b/noxfile.py
index 4b9ba40..e55b13f 100644
--- a/noxfile.py
+++ b/noxfile.py
@@ -3,22 +3,43 @@
 from __future__ import annotations
 
 import argparse
+import pathlib
+import re
 import shutil
-from pathlib import Path
 
 import nox
 
 
-DIR = Path(__file__).parent.resolve()
-
 nox.needs_version = ">=2024.3.2"
 nox.options.sessions = ["lint", "tests"]
 nox.options.default_venv_backend = "uv|virtualenv"
 
 
+ROOT_DIR = pathlib.Path(__file__).parent.resolve()
+DEFAULT_DEV_VENV_PATH = ROOT_DIR / ".venv"
+
+
+def load_from_frozen_requirements(filename: str) -> dict[str, str]:
+    requirements = {}
+    with pathlib.Path(filename).open(encoding="locale") as f:
+        for raw_line in f:
+            if (end := raw_line.find("#")) != -1:
+                raw_line = raw_line[:end]  # noqa: PLW2901 [redefined-loop-name]
+            line = raw_line.strip()
+            if line and not line.startswith("-"):
+                m = re.match(r"^([^=]*)\s*([^;]*)\s*;?\s*(.*)$", line)
+                if m:
+                    requirements[m[1]] = m[2]
+
+    return requirements
+
+
+REQUIREMENTS = load_from_frozen_requirements(ROOT_DIR / "requirements" / "dev.txt")
+
+
 @nox.session
 def lint(session: nox.Session) -> None:
-    """Run the linter."""
+    """Run the linter (pre-commit)."""
     session.install("pre-commit")
     session.run("pre-commit", "run", "--all-files", "--show-diff-on-failure", *session.posargs)
 
@@ -30,9 +51,93 @@ def tests(session: nox.Session) -> None:
     session.run("pytest", *session.posargs)
 
 
+@nox.session(python=["3.10", "3.11", "3.12"])
+def venv(session: nox.Session) -> None:
+    """
+    Sets up a Python development environment. Use as: `nox -s venv -- [dest_path] [req_preset]
+
+    This session will:
+    - Create a python virtualenv for the session
+    - Install the `virtualenv` cli tool into this environment
+    - Use `virtualenv` to create a project virtual environment
+    - Invoke the python interpreter from the created project environment
+      to install the project and all it's development dependencies.
+    """  # noqa: W505 [doc-line-too-long]
+    venv_path = f"{DEFAULT_DEV_VENV_PATH}-{session.python}"
+    req_preset = "dev"
+    virtualenv_args = []
+    if session.posargs:
+        venv_path, *more_pos_args = session.posargs
+        if more_pos_args:
+            req_preset, _ = more_pos_args
+    venv_path = pathlib.Path(venv_path).resolve()
+
+    if not venv_path.exists():
+        print(f"Creating virtualenv at '{venv_path}' (options: {virtualenv_args})...")
+        session.install("virtualenv")
+        session.run("virtualenv", venv_path, silent=True)
+
+    python_path = venv_path / "bin" / "python"
+    requirements_file = f"requirements/{req_preset}.txt"
+
+    # Use the venv's interpreter to install the project along with
+    # all it's dev dependencies, this ensures it's installed in the right way
+    print(f"Setting up development environment from '{requirements_file}'...")
+    session.run(
+        python_path,
+        "-m",
+        "pip",
+        "install",
+        "-r",
+        requirements_file,
+        "-e.",
+        external=True,
+    )
+
+
+@nox.session
+def requirements(session: nox.Session) -> None:
+    """Freeze requirements files from project specification and synchronize versions across tools."""  # noqa: W505 [doc-line-too-long]
+    requirements_path = ROOT_DIR / "requirements"
+    req_sync_tool = requirements_path / "sync_tool.py"
+
+    dependencies = ["pre-commit"] + nox.project.load_toml(req_sync_tool)["dependencies"]
+    session.install(*dependencies)
+    session.install("pip-compile-multi")
+
+    session.run("python", req_sync_tool, "pull")
+    session.run("pip-compile-multi", "-g", "--skip-constraints")
+    session.run("python", req_sync_tool, "push")
+
+    session.run("pre-commit", "run", "--files", ".pre-commit-config.yaml", success_codes=[0, 1])
+
+
 @nox.session(reuse_venv=True)
 def docs(session: nox.Session) -> None:
-    """Build the docs. Pass "--serve" to serve. Pass "-b linkcheck" to check links."""
+    """Regenerate and build all API and user docs."""
+    session.notify("api_docs")
+    session.notify("user_docs", posargs=session.posargs)
+
+
+@nox.session(reuse_venv=True)
+def api_docs(session: nox.Session) -> None:
+    """Build (regenerate) API docs."""
+    session.install(f"sphinx=={REQUIREMENTS['sphinx']}")
+    session.chdir("docs")
+    session.run(
+        "sphinx-apidoc",
+        "-o",
+        "api/",
+        "--module-first",
+        "--no-toc",
+        "--force",
+        "../src/jace",
+    )
+
+
+@nox.session(reuse_venv=True)
+def user_docs(session: nox.Session) -> None:
+    """Build the user docs. Pass "--serve" to serve. Pass "-b linkcheck" to check links."""  # noqa: W505 [doc-line-too-long]
     parser = argparse.ArgumentParser()
     parser.add_argument("--serve", action="store_true", help="Serve after building")
     parser.add_argument("-b", dest="builder", default="html", help="Build target (default: html)")
@@ -64,45 +169,12 @@ def docs(session: nox.Session) -> None:
         session.run("sphinx-build", "--keep-going", *shared_args)
 
 
-@nox.session
-def build_api_docs(session: nox.Session) -> None:
-    """Build (regenerate) API docs."""
-    session.install("sphinx")
-    session.chdir("docs")
-    session.run(
-        "sphinx-apidoc",
-        "-o",
-        "api/",
-        "--module-first",
-        "--no-toc",
-        "--force",
-        "../src/jace",
-    )
-
-
 @nox.session
 def build(session: nox.Session) -> None:
     """Build an SDist and wheel."""
-    build_path = DIR.joinpath("build")
+    build_path = ROOT_DIR / "build"
     if build_path.exists():
         shutil.rmtree(build_path)
 
-    session.install("build")
+    session.install(f"build=={REQUIREMENTS['build']}")
     session.run("python", "-m", "build")
-
-
-@nox.session
-def requirements(session: nox.Session) -> None:
-    """Freeze dependencies from input specs and synchronize across tools."""
-    requirements_path = DIR / "requirements"
-    req_sync_tool = requirements_path / "sync_tool.py"
-
-    dependencies = ["pre-commit"] + nox.project.load_toml(req_sync_tool)["dependencies"]
-    session.install(*dependencies)
-    session.install("pip-compile-multi")
-
-    session.run("python", req_sync_tool, "pull")
-    session.run("pip-compile-multi", "-g", "--skip-constraints")
-    session.run("python", req_sync_tool, "push")
-
-    session.run("pre-commit", "run", "--files", ".pre-commit-config.yaml", success_codes=[0, 1])
diff --git a/requirements/base.txt b/requirements/base.txt
index 1aae055..70bc827 100644
--- a/requirements/base.txt
+++ b/requirements/base.txt
@@ -9,36 +9,20 @@ aenum==3.1.15
     # via dace
 astunparse==1.6.3
     # via dace
-blinker==1.8.2
-    # via flask
-certifi==2024.6.2
-    # via requests
-charset-normalizer==3.3.2
-    # via requests
-click==8.1.7
-    # via flask
-dace==0.15.1
+dace==0.16
     # via -r requirements/base.in
 dill==0.3.8
     # via dace
-flask==3.0.3
-    # via dace
 fparser==0.1.4
     # via dace
-idna==3.7
-    # via requests
-itsdangerous==2.2.0
-    # via flask
 jax[cpu]==0.4.29
     # via -r requirements/base.in
 jaxlib==0.4.29
     # via jax
 jinja2==3.1.4
-    # via flask
+    # via dace
 markupsafe==2.1.5
-    # via
-    #   jinja2
-    #   werkzeug
+    # via jinja2
 ml-dtypes==0.4.0
     # via
     #   jax
@@ -64,8 +48,6 @@ ply==3.11
     # via dace
 pyyaml==6.0.1
     # via dace
-requests==2.32.3
-    # via dace
 scipy==1.13.1
     # via
     #   jax
@@ -74,16 +56,12 @@ setuptools-scm==8.1.0
     # via fparser
 six==1.16.0
     # via astunparse
-sympy==1.9
+sympy==1.12.1
     # via dace
 tomli==2.0.1
     # via setuptools-scm
-urllib3==2.2.1
-    # via requests
 websockets==12.0
     # via dace
-werkzeug==3.0.3
-    # via flask
 wheel==0.43.0
     # via astunparse
 
diff --git a/requirements/cuda12.txt b/requirements/cuda12.txt
index 078edf2..ebeb3aa 100644
--- a/requirements/cuda12.txt
+++ b/requirements/cuda12.txt
@@ -10,7 +10,7 @@ alembic==1.13.1
     # via optuna
 colorlog==6.8.2
     # via optuna
-cupy-cuda12x==13.1.0
+cupy-cuda12x==13.2.0
     # via -r requirements/cuda12.in
 fastrlock==0.8.2
     # via cupy-cuda12x
diff --git a/requirements/dev-cuda12.in b/requirements/dev-cuda12.in
index aa00469..496e623 100644
--- a/requirements/dev-cuda12.in
+++ b/requirements/dev-cuda12.in
@@ -1,2 +1,2 @@
--r base.in
+-r cuda12.in
 -r dev.in
diff --git a/requirements/dev-cuda12.txt b/requirements/dev-cuda12.txt
index 7c894e8..0dca1e7 100644
--- a/requirements/dev-cuda12.txt
+++ b/requirements/dev-cuda12.txt
@@ -1,11 +1,11 @@
-# SHA1:d9f19ac423500f255d32c3e29dd96fd3b5c649a8
+# SHA1:bdbfa7e1d9b9ca837d092c4efc6792c2b58238be
 #
 # This file is autogenerated by pip-compile-multi
 # To update, run:
 #
 #    pip-compile-multi
 #
--r base.txt
+-r cuda12.txt
 -r dev.txt
 
 # The following packages are considered to be unsafe in a requirements file:
diff --git a/requirements/dev.in b/requirements/dev.in
index b648f8a..4421d27 100644
--- a/requirements/dev.in
+++ b/requirements/dev.in
@@ -1,4 +1,5 @@
 -r base.in
+build>=1.2
 furo>=2023.08.17
 mypy>=1.9.0
 myst_parser>=0.13
@@ -6,7 +7,8 @@ pytest>=6
 pytest-cov>=3
 ruff>=0.3.5
 sphinx>=7.0
-sphinx_autodoc_typehints
-sphinx_copybutton
+sphinx-autobuild>=2021.3.14
+sphinx_autodoc_typehints>=2.1
+sphinx_copybutton>=0.5
 tomlkit>=0.12.4
 typing-extensions>=4.10.0
diff --git a/requirements/dev.txt b/requirements/dev.txt
index 176b9a2..4b45b5e 100644
--- a/requirements/dev.txt
+++ b/requirements/dev.txt
@@ -1,4 +1,4 @@
-# SHA1:a7338646990b5874d5aa51bb3e2bd37753c754eb
+# SHA1:60e060370596513d7e06534a0655974dcc750dcd
 #
 # This file is autogenerated by pip-compile-multi
 # To update, run:
@@ -8,10 +8,24 @@
 -r base.txt
 alabaster==0.7.16
     # via sphinx
+anyio==4.4.0
+    # via
+    #   starlette
+    #   watchfiles
 babel==2.15.0
     # via sphinx
 beautifulsoup4==4.12.3
     # via furo
+build==1.2.1
+    # via -r requirements/dev.in
+certifi==2024.6.2
+    # via requests
+charset-normalizer==3.3.2
+    # via requests
+click==8.1.7
+    # via uvicorn
+colorama==0.4.6
+    # via sphinx-autobuild
 coverage[toml]==7.5.3
     # via pytest-cov
 docutils==0.21.2
@@ -19,9 +33,17 @@ docutils==0.21.2
     #   myst-parser
     #   sphinx
 exceptiongroup==1.2.1
-    # via pytest
+    # via
+    #   anyio
+    #   pytest
 furo==2024.5.6
     # via -r requirements/dev.in
+h11==0.14.0
+    # via uvicorn
+idna==3.7
+    # via
+    #   anyio
+    #   requests
 imagesize==1.4.1
     # via sphinx
 iniconfig==2.0.0
@@ -46,14 +68,20 @@ pygments==2.18.0
     # via
     #   furo
     #   sphinx
+pyproject-hooks==1.1.0
+    # via build
 pytest==8.2.2
     # via
     #   -r requirements/dev.in
     #   pytest-cov
 pytest-cov==5.0.0
     # via -r requirements/dev.in
+requests==2.32.3
+    # via sphinx
 ruff==0.4.8
     # via -r requirements/dev.in
+sniffio==1.3.1
+    # via anyio
 snowballstemmer==2.2.0
     # via sphinx
 soupsieve==2.5
@@ -63,9 +91,12 @@ sphinx==7.3.7
     #   -r requirements/dev.in
     #   furo
     #   myst-parser
+    #   sphinx-autobuild
     #   sphinx-autodoc-typehints
     #   sphinx-basic-ng
     #   sphinx-copybutton
+sphinx-autobuild==2024.4.16
+    # via -r requirements/dev.in
 sphinx-autodoc-typehints==2.1.1
     # via -r requirements/dev.in
 sphinx-basic-ng==1.0.0b2
@@ -84,12 +115,22 @@ sphinxcontrib-qthelp==1.0.7
     # via sphinx
 sphinxcontrib-serializinghtml==1.1.10
     # via sphinx
+starlette==0.37.2
+    # via sphinx-autobuild
 tomlkit==0.12.5
     # via -r requirements/dev.in
 typing-extensions==4.12.2
     # via
     #   -r requirements/dev.in
+    #   anyio
     #   mypy
+    #   uvicorn
+urllib3==2.2.1
+    # via requests
+uvicorn==0.30.1
+    # via sphinx-autobuild
+watchfiles==0.22.0
+    # via sphinx-autobuild
 
 # The following packages are considered to be unsafe in a requirements file:
 # setuptools

From 6eef078c00f4f4ced6ec0a4a7bce770f8fc4b9d0 Mon Sep 17 00:00:00 2001
From: Enrique Gonzalez Paredes <enriqueg@cscs.ch>
Date: Fri, 14 Jun 2024 15:13:13 +0200
Subject: [PATCH 380/458] Add information message

---
 noxfile.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/noxfile.py b/noxfile.py
index e55b13f..27f9404 100644
--- a/noxfile.py
+++ b/noxfile.py
@@ -76,6 +76,8 @@ def venv(session: nox.Session) -> None:
         print(f"Creating virtualenv at '{venv_path}' (options: {virtualenv_args})...")
         session.install("virtualenv")
         session.run("virtualenv", venv_path, silent=True)
+    else:
+        print(f"'{venv_path}' path already exists. Skipping virtualenv creation...")
 
     python_path = venv_path / "bin" / "python"
     requirements_file = f"requirements/{req_preset}.txt"

From 63699087df229e7aae821b7650f9269ecbe57827 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 17 Jun 2024 10:31:27 +0200
Subject: [PATCH 381/458] pytest now ignores deprication warnings from numpy,
 this is needed because DaCe uses some of these internals.

---
 pyproject.toml | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/pyproject.toml b/pyproject.toml
index b9d9992..393ce01 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -110,7 +110,10 @@ module = [
 
 [tool.pytest.ini_options]
 addopts = ["-ra", "--showlocals", "--strict-markers", "--strict-config"]
-filterwarnings = ["error"]
+filterwarnings = [
+  "error",
+  "ignore:numpy\\..*:DeprecationWarning",  # DaCe is not NumPy v2.0 ready so ignore the usage of deprecated features.
+]
 log_cli_level = "INFO"
 minversion = "6.0"
 testpaths = ["tests"]

From 0aa1726cfa67fc930e28dbc988d7b39ede6d5bb6 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 17 Jun 2024 10:47:03 +0200
Subject: [PATCH 382/458] Changed the names inside the test to make them
 conforming to an (in the end) arbitrary rule.

---
 pyproject.toml                                |  1 -
 ...primitive_arithmetic_logical_operations.py | 56 +++++++++----------
 .../test_jaxpr_translator_builder.py          |  4 +-
 .../test_primitive_translator_managing.py     |  4 +-
 tests/unit_tests/test_caching.py              | 29 +++++-----
 tests/unit_tests/test_jax_api.py              | 42 +++++++-------
 6 files changed, 69 insertions(+), 67 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index c86c4fe..edb44b9 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -232,7 +232,6 @@ max-complexity = 12
 ]
 "tests/**" = [
   "D",  # pydocstyle
-  "N",  # TODO(egparedes): remove ignore as soon as all tests are properly named
   "PLR2004",  # [magic-value-comparison]
   "T10",  # flake8-debugger
   "T20",  # flake8-print
diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index 2764830..fc15ecf 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -226,55 +226,55 @@ def testee(a: float) -> float | jax.Array:
 
 
 def test_mapped_binary_scalar() -> None:
-    def testee(a: np.float64, B: np.float64) -> np.float64:
-        return a * B
+    def testee(a: np.float64, b: np.float64) -> np.float64:
+        return a * b
 
     _perform_alt_test(testee, np.float64(1.0), np.float64(2.0))
 
 
 def test_mapped_binary_scalar_partial_literal() -> None:
-    def testeeR(a: np.float64) -> np.float64:
+    def testee_r(a: np.float64) -> np.float64:
         return a * 2.03
 
-    def testeeL(a: np.float64) -> np.float64:
+    def testee_l(a: np.float64) -> np.float64:
         return 2.03 * a
 
     a = np.float64(7.0)
-    _perform_alt_test(testeeR, a)
-    _perform_alt_test(testeeL, a)
+    _perform_alt_test(testee_r, a)
+    _perform_alt_test(testee_l, a)
 
 
 def test_mapped_binary_array() -> None:
     """Test binary of arrays, with same size."""
 
-    def testee(a: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return a + B
+    def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:
+        return a + b
 
     a = testutil.make_array((100, 10, 3))
-    B = testutil.make_array((100, 10, 3))
-    _perform_alt_test(testee, a, B)
+    b = testutil.make_array((100, 10, 3))
+    _perform_alt_test(testee, a, b)
 
 
 def test_mapped_binary_array_scalar() -> None:
-    def testee(a: np.ndarray | np.float64, B: np.float64 | np.ndarray) -> np.ndarray:
-        return a + B  # type: ignore[return-value]  # It is always an array.
+    def testee(a: np.ndarray | np.float64, b: np.float64 | np.ndarray) -> np.ndarray:
+        return a + b  # type: ignore[return-value]  # It is always an array.
 
     a = testutil.make_array((100, 22))
-    B = np.float64(1.34)
-    _perform_alt_test(testee, a, B)
-    _perform_alt_test(testee, B, a)
+    b = np.float64(1.34)
+    _perform_alt_test(testee, a, b)
+    _perform_alt_test(testee, b, a)
 
 
 def test_mapped_binary_array_partial_literal() -> None:
-    def testeeR(a: np.ndarray) -> np.ndarray:
+    def testee_r(a: np.ndarray) -> np.ndarray:
         return a + 1.52
 
-    def testeeL(a: np.ndarray) -> np.ndarray:
+    def testee_l(a: np.ndarray) -> np.ndarray:
         return 1.52 + a
 
     a = testutil.make_array((100, 22))
-    _perform_alt_test(testeeR, a)
-    _perform_alt_test(testeeL, a)
+    _perform_alt_test(testee_r, a)
+    _perform_alt_test(testee_l, a)
 
 
 def test_mapped_binary_array_constants() -> None:
@@ -286,13 +286,13 @@ def testee(a: np.ndarray) -> np.ndarray:
 
 
 def test_mapped_broadcast(broadcast_input: tuple[np.ndarray, np.ndarray]) -> None:
-    def testee(a: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return a + B
+    def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:
+        return a + b
 
     a = broadcast_input[0]
-    B = broadcast_input[1]
-    _perform_alt_test(testee, a, B)
-    _perform_alt_test(testee, B, a)
+    b = broadcast_input[1]
+    _perform_alt_test(testee, a, b)
+    _perform_alt_test(testee, b, a)
 
 
 # <------------ Tests for arithmetic and logical translators/operations
@@ -324,8 +324,8 @@ def testee(a: np.ndarray) -> jax.Array:
 def test_alt_general_binary_float(
     alt_binary_ops_float: tuple[Callable, tuple[np.ndarray, np.ndarray]],
 ) -> None:
-    def testee(a: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return alt_binary_ops_float[0](a, B)
+    def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:
+        return alt_binary_ops_float[0](a, b)
 
     _perform_alt_test(testee, *alt_binary_ops_float[1])
 
@@ -333,8 +333,8 @@ def testee(a: np.ndarray, B: np.ndarray) -> np.ndarray:
 def test_alt_compare_operation(
     alt_binary_compare_ops: tuple[Callable, tuple[np.ndarray, np.ndarray]],
 ) -> None:
-    def testee(a: np.ndarray, B: np.ndarray) -> np.ndarray:
-        return alt_binary_compare_ops[0](a, B)
+    def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:
+        return alt_binary_compare_ops[0](a, b)
 
     _perform_alt_test(testee, *alt_binary_compare_ops[1])
 
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index da941a3..60f791a 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -52,7 +52,7 @@ def translation_builder() -> translator.JaxprTranslationBuilder:
     builder = translator.JaxprTranslationBuilder(
         primitive_translators=translator.get_registered_primitive_translators()
     )
-    jaxpr = jax.make_jaxpr(lambda A: A)(1.0)  # dummy jaxpr, needed for construction.
+    jaxpr = jax.make_jaxpr(lambda a: a)(1.0)  # dummy jaxpr, needed for construction.
     builder._allocate_translation_ctx(name=name, jaxpr=jaxpr)
     return builder
 
@@ -634,7 +634,7 @@ def test_builder_jace_var() -> None:
             _ = JaCeVar((), dace.int8, name=iname)
 
 
-def test_builder_F_strides() -> None:
+def test_builder_FORTRAN_strides() -> None:  # noqa: N802  # Function name
     """Tests if we can lower without a standard stride.
 
     Notes:
diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index f4efe3c..c72b9bf 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -63,7 +63,7 @@ def __call__(self) -> None:  # type: ignore[override]  # Arguments
 
 
 @translator.make_primitive_translator("non_existing_callable_primitive3")
-def SubTrans3_Callable(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
+def primitive_translator_3_callable(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
     raise NotImplementedError
 
 
@@ -83,7 +83,7 @@ def test_subtranslatior_managing() -> None:
     sub2 = SubTrans2()
 
     # These are all primitive translators
-    prim_translators = [sub1, sub2, SubTrans3_Callable]
+    prim_translators = [sub1, sub2, primitive_translator_3_callable]
 
     # Add the instances.
     for sub in prim_translators:
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index 5a196eb..3b0b7a4 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -71,8 +71,8 @@ def wrapped(a, b):
     b = testutil.make_array((4, 3))
 
     # The second batch of argument, same structure, but different values.
-    AA = a + 1.0362
-    BB = b + 0.638956
+    aa = a + 1.0362
+    bb = b + 0.638956
 
     # Now let's lower it once directly and call it.
     lowered: stages.JaCeLowered = wrapped.lower(a, b)
@@ -87,8 +87,8 @@ def wrapped(a, b):
 
     # Now lets call it with different objects, that have the same structure.
     #  Again no lowering should happen.
-    assert np.allclose(testee(AA, BB), wrapped(AA, BB))
-    assert wrapped.lower(AA, BB) is lowered
+    assert np.allclose(testee(aa, bb), wrapped(aa, bb))
+    assert wrapped.lower(aa, bb) is lowered
     assert wrapped.lower(a, b) is lowered
     assert lowering_cnt[0] == 1
 
@@ -181,7 +181,7 @@ def test_caching_compilation() -> None:
     """Tests the compilation cache."""
 
     @jace.jit
-    def jaceWrapped(a: np.ndarray, b: np.ndarray) -> np.ndarray:
+    def jace_wrapped(a: np.ndarray, b: np.ndarray) -> np.ndarray:
         c = a * b
         d = c + a
         e = d + b  # Just enough state.
@@ -192,21 +192,24 @@ def jaceWrapped(a: np.ndarray, b: np.ndarray) -> np.ndarray:
     b = testutil.make_array((4, 3))
 
     # Now we lower it.
-    jaceLowered = jaceWrapped.lower(a, b)
+    jace_lowered = jace_wrapped.lower(a, b)
 
     # Compiling it with and without optimizations enabled
-    optiCompiled = jaceLowered.compile(optimization.DEFAULT_OPTIMIZATIONS)
-    unoptiCompiled = jaceLowered.compile(optimization.NO_OPTIMIZATIONS)
+    optized_compiled = jace_lowered.compile(optimization.DEFAULT_OPTIMIZATIONS)
+    unoptized_compiled = jace_lowered.compile(optimization.NO_OPTIMIZATIONS)
 
     # Because of the way how things work the optimized must have more than the
     #  unoptimized. If there is sharing, then this would not be the case.
-    assert unoptiCompiled is not optiCompiled
-    assert optiCompiled._csdfg.sdfg.number_of_nodes() == 1
-    assert optiCompiled._csdfg.sdfg.number_of_nodes() < unoptiCompiled._csdfg.sdfg.number_of_nodes()
+    assert unoptized_compiled is not optized_compiled
+    assert optized_compiled._csdfg.sdfg.number_of_nodes() == 1
+    assert (
+        optized_compiled._csdfg.sdfg.number_of_nodes()
+        < unoptized_compiled._csdfg.sdfg.number_of_nodes()
+    )
 
     # Now we check if they are still inside the cache.
-    assert optiCompiled is jaceLowered.compile(optimization.DEFAULT_OPTIMIZATIONS)
-    assert unoptiCompiled is jaceLowered.compile(optimization.NO_OPTIMIZATIONS)
+    assert optized_compiled is jace_lowered.compile(optimization.DEFAULT_OPTIMIZATIONS)
+    assert unoptized_compiled is jace_lowered.compile(optimization.NO_OPTIMIZATIONS)
 
 
 def test_caching_compilation_options() -> None:
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index b3d44b0..866f53b 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -80,19 +80,19 @@ def ddf(x):
 def test_composition_with_jax() -> None:
     """Tests if JaCe can interact with Jax and vice versa."""
 
-    def base_fun(a, b, C):
-        return a + b * jnp.sin(C) - a * b
+    def base_fun(a, b, c):
+        return a + b * jnp.sin(c) - a * b
 
     @jace.jit
-    def jace_fun(a, b, C):
-        return jax.jit(base_fun)(a, b, C)
+    def jace_fun(a, b, c):
+        return jax.jit(base_fun)(a, b, c)
 
-    def jax_fun(a, b, C):
-        return jace.jit(base_fun)(a, b, C)
+    def jax_fun(a, b, c):
+        return jace.jit(base_fun)(a, b, c)
 
-    a, b, C = (testutil.make_array((10, 3, 50)) for _ in range(3))
+    a, b, c = (testutil.make_array((10, 3, 50)) for _ in range(3))
 
-    assert np.allclose(jace_fun(a, b, C), jax_fun(a, b, C))
+    assert np.allclose(jace_fun(a, b, c), jax_fun(a, b, c))
 
 
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
@@ -104,22 +104,22 @@ def f1_jax(a, b):
         return a + b
 
     @jace.jit
-    def f2_jace(a, b, C):
-        return f1_jax(a, b) - C
+    def f2_jace(a, b, c):
+        return f1_jax(a, b) - c
 
     @jax.jit
-    def f3_jax(a, b, C, D):
-        return f2_jace(a, b, C) * D
+    def f3_jax(a, b, c, d):
+        return f2_jace(a, b, c) * d
 
     @jace.jit
-    def f3_jace(a, b, C, D):
-        return f3_jax(a, b, C, D)
+    def f3_jace(a, b, c, d):
+        return f3_jax(a, b, c, d)
 
-    a, b, C, D = (testutil.make_array((10, 3, 50)) for _ in range(4))
+    a, b, c, d = (testutil.make_array((10, 3, 50)) for _ in range(4))
 
-    ref = ((a + b) - C) * D
-    res_jax = f3_jax(a, b, C, D)
-    res_jace = f3_jace(a, b, C, D)
+    ref = ((a + b) - c) * d
+    res_jax = f3_jax(a, b, c, d)
+    res_jace = f3_jace(a, b, c, d)
 
     assert np.allclose(ref, res_jax), "Jax failed."
     assert np.allclose(ref, res_jace), "JaCe Failed."
@@ -140,10 +140,10 @@ def jace_ddf(x):
         return jace.grad(jace.grad(f))(x)
 
     # These are the random numbers where we test
-    Xs = (testutil.make_array(10) - 0.5) * 10
+    xs = (testutil.make_array(10) - 0.5) * 10
 
-    for i in range(Xs.shape[0]):
-        x = Xs[i]
+    for i in range(xs.shape[0]):
+        x = xs[i]
         res = jace_ddf(x)
         ref = jax_ddf(x)
         assert np.allclose(res, ref)

From 3424a59796fc5ab87167f75fa9b5f96af0958250 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 17 Jun 2024 11:36:04 +0200
Subject: [PATCH 383/458] Updated the tracing function.

It is now more like jax.
---
 src/jace/stages.py               |   8 ++-
 src/jace/tracing.py              | 114 ++++++++++++++++++++-----------
 tests/unit_tests/test_jax_api.py |  10 ++-
 3 files changed, 83 insertions(+), 49 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index 6cb960c..0477c72 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -146,16 +146,18 @@ def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
         Note:
             The tracing is always done with activated `x64` mode.
         """
-        jaxpr, flat_call_args, outtree = tracing.trace_and_flatten_function(
+        jaxpr_maker = tracing.make_jaxpr(
             fun=self._fun,
-            trace_call_args=args,
-            trace_call_kwargs=kwargs,
             trace_options=self._jit_options,
+            return_outtree=True,
         )
+        jaxpr, outtree = jaxpr_maker(*args, **kwargs)
         builder = translator.JaxprTranslationBuilder(
             primitive_translators=self._primitive_translators
         )
         trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
+
+        flat_call_args = jax_tree.tree_leaves((args, kwargs))
         tsdfg: jace.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
             trans_ctx=trans_ctx,
             fun=self.wrapped_fun,
diff --git a/src/jace/tracing.py b/src/jace/tracing.py
index b755756..f07fb94 100644
--- a/src/jace/tracing.py
+++ b/src/jace/tracing.py
@@ -16,43 +16,67 @@
 from __future__ import annotations
 
 import inspect
-from typing import TYPE_CHECKING, Any
+from typing import TYPE_CHECKING, Any, Concatenate, Literal, ParamSpec, overload
 
 import jax
 from jax import tree_util as jax_tree
 
 
 if TYPE_CHECKING:
-    from collections.abc import Callable, Mapping, Sequence
+    from collections.abc import Callable, Mapping
 
+_P = ParamSpec("_P")
 
-def trace_and_flatten_function(
-    fun: Callable,
-    trace_call_args: Sequence[Any],
-    trace_call_kwargs: Mapping[str, Any],
+
+@overload
+def make_jaxpr(
+    fun: Callable[Concatenate[_P], Any],
+    trace_options: Mapping[str, Any],
+    return_outtree: Literal[True],
+) -> Callable[Concatenate[_P], tuple[jax.core.ClosedJaxpr, jax_tree.PyTreeDef]]: ...
+
+
+@overload
+def make_jaxpr(
+    fun: Callable[Concatenate[_P], Any],
+    trace_options: Mapping[str, Any],
+    return_outtree: Literal[False] = False,
+) -> Callable[Concatenate[_P], jax.core.ClosedJaxpr]: ...
+
+
+def make_jaxpr(
+    fun: Callable[Concatenate[_P], Any],
     trace_options: Mapping[str, Any],
-) -> tuple[jax.core.ClosedJaxpr, list[Any], jax_tree.PyTreeDef]:
+    return_outtree: bool = False,
+) -> (
+    Callable[_P, tuple[jax.core.ClosedJaxpr, jax_tree.PyTreeDef]]
+    | Callable[_P, jax.core.ClosedJaxpr]
+):
     """
-    Traces `fun` and generates the Jaxpr and some related meta data.
+    JaCe's replacement for `jax.make_jaxpr()`.
+
+    Returns a callable object that produces as Jaxpr and optionally a pytree defining
+    the output. By default the callable will only return the Jaxpr, however, by setting
+    `return_outtree` the function will also return the output tree, this is different
+    from the `return_shape` of `jax.make_jaxpr()`.
+    Furthermore, this function accepts all tracing parameters, passed through the
+    `trace_options` map that `@jace.jit` supports.
 
-    For tracing the computation `fun` the function uses the `trace_call_args`
-    and `trace_call_kwargs` arguments, both should not be flattened. Furthermore,
-    the tracing is done in enabled x64 mode.
+    Currently the tracing is always performed with an enabled `x64` mode.
 
     Returns:
-        The function will return a tuple of length three.
-        1) The Jaxpr that was generated by Jax using the supplied arguments and options.
-        2) The flattened input.
-        3) A pytree describing the output.
+        The function returns a callable, that if passed arguments will performs the
+        tracing on them, this section will describe the return value of that function.
+        If `return_outtree` is `False` the function will simply return the generated
+        Jaxpr. If `return_outtree` is `True` the function will return a pair.
+        The first element is the Jaxpr and the second element is a pytree object
+        that describes the output.
 
     Args:
         fun: The original Python computation.
-        trace_call_args: The positional arguments that should be used for
-            tracing the computation.
-        trace_call_kwargs: The keyword arguments that should be used for
-            tracing the computation.
         trace_options: The options used for tracing, the same arguments that
             are supported by `jace.jit`.
+        return_outtree: Also return the pytree of the output.
 
     Todo:
         - Handle default arguments of `fun`.
@@ -65,24 +89,34 @@ def trace_and_flatten_function(
         )
     assert all(param.default is param.empty for param in inspect.signature(fun).parameters.values())
 
-    # In Jax `float32` is the main datatype, and they go to great lengths to avoid some
-    #  aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
-    #  However, in this case we will have problems when we call the SDFG, for some
-    #  reasons `CompiledSDFG` does not work in that case correctly, thus we enable it
-    #  for the tracing.
-    with jax.experimental.enable_x64():
-        # TODO(phimuell): copy the implementation of the real tracing
-        jaxpr, outshapes = jax.make_jaxpr(fun, return_shape=True)(
-            *trace_call_args, **trace_call_kwargs
-        )
-
-    # Regardless what the documentation of `make_jaxpr` claims, it does not output a
-    #  pytree instead an abstract description of the shape, that we will transform into
-    #  a pytree.
-    outtree = jax_tree.tree_structure(outshapes)
-
-    # Make the input tree
-    flat_in_vals = jax_tree.tree_leaves((trace_call_args, trace_call_kwargs))
-    assert len(jaxpr.in_avals) == len(flat_in_vals), "Static arguments not implemented."
-
-    return jaxpr, flat_in_vals, outtree
+    def tracer_impl(
+        *args: _P.args,
+        **kwargs: _P.kwargs,
+    ) -> tuple[jax.core.ClosedJaxpr, jax_tree.PyTreeDef] | jax.core.ClosedJaxpr:
+        # In Jax `float32` is the main datatype, and they go to great lengths to avoid
+        #  some aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
+        #  However, in this case we will have problems when we call the SDFG, for some
+        #  reasons `CompiledSDFG` does not work in that case correctly, thus we enable
+        #  it for the tracing.
+        with jax.experimental.enable_x64():
+            # TODO(phimuell): copy the implementation of the real tracing
+            jaxpr_maker = jax.make_jaxpr(
+                fun,
+                **trace_options,
+                return_shape=True,
+            )
+            jaxpr, outshapes = jaxpr_maker(
+                *args,
+                **kwargs,
+            )
+
+        if not return_outtree:
+            return jaxpr
+
+        # Regardless what the documentation of `make_jaxpr` claims, it does not output
+        #  a pytree instead an abstract description of the shape, that we will
+        #  transform into a pytree.
+        outtree = jax_tree.tree_structure(outshapes)
+        return jaxpr, outtree
+
+    return tracer_impl  # type: ignore[return-value]  # Type confusion
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index 866f53b..2ddc79d 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -12,10 +12,10 @@
 import jax
 import numpy as np
 import pytest
-from jax import numpy as jnp
+from jax import numpy as jnp, tree_util as jax_tree
 
 import jace
-from jace import tracing, translator, util
+from jace import translator, util
 from jace.translator import pre_post_translation as ptrans
 
 from tests import util as testutil
@@ -192,16 +192,14 @@ def testee(a: np.ndarray, b: np.float64) -> np.ndarray:
     with jax.experimental.disable_x64():
         jaxpr = jax.make_jaxpr(testee)(a, b)
 
-    _, flat_in_vals, _ = tracing.trace_and_flatten_function(
-        fun=testee, trace_call_args=(a, b), trace_call_kwargs={}, trace_options={}
-    )
+    flat_call_args = jax_tree.tree_leaves(((a, b), {}))
     builder = translator.JaxprTranslationBuilder(
         primitive_translators=translator.get_registered_primitive_translators()
     )
     trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
 
     tsdfg: jace.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
-        trans_ctx=trans_ctx, fun=testee, flat_call_args=flat_in_vals
+        trans_ctx=trans_ctx, fun=testee, flat_call_args=flat_call_args
     )
 
     # Because x64 is disabled Jax traces the input as float32, even if we have passed

From d8603d5fd39f9bdf807f838ec58236e39ee9777c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 18 Jun 2024 08:09:58 +0200
Subject: [PATCH 384/458] Now the arguments of the wrapped functions are type
 chakable.

However the return type is not, because JaCe changes a scalar to an array.
---
 src/jace/api.py                               | 17 +++++++++--------
 src/jace/stages.py                            | 19 +++++++++++++------
 tests/integration_tests/test_empty_jaxpr.py   |  4 ++--
 .../test_primitive_translator_managing.py     | 18 +++++++++---------
 4 files changed, 33 insertions(+), 25 deletions(-)

diff --git a/src/jace/api.py b/src/jace/api.py
index ea397b9..c344c40 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -11,7 +11,7 @@
 
 import functools
 import inspect
-from typing import TYPE_CHECKING, Any, Literal, overload
+from typing import TYPE_CHECKING, Any, Literal, ParamSpec, overload
 
 from jax import grad, jacfwd, jacrev
 
@@ -24,6 +24,8 @@
 
 __all__ = ["grad", "jacfwd", "jacrev", "jit"]
 
+_P = ParamSpec("_P")
+
 
 @overload
 def jit(
@@ -31,24 +33,24 @@ def jit(
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> Callable[[Callable], stages.JaCeWrapped]: ...
+) -> Callable[[Callable[_P, Any]], stages.JaCeWrapped[_P]]: ...
 
 
 @overload
 def jit(
-    fun: Callable,
+    fun: Callable[_P, Any],
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> stages.JaCeWrapped: ...
+) -> stages.JaCeWrapped[_P]: ...
 
 
 def jit(
-    fun: Callable | None = None,
+    fun: Callable[_P, Any] | None = None,
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> stages.JaCeWrapped | Callable[[Callable], stages.JaCeWrapped]:
+) -> Callable[[Callable[_P, Any]], stages.JaCeWrapped[_P]] | stages.JaCeWrapped[_P]:
     """
     JaCe's replacement for `jax.jit` (just-in-time) wrapper.
 
@@ -72,13 +74,12 @@ def jit(
             f"The following arguments to 'jace.jit' are not yet supported: {', '.join(kwargs)}."
         )
 
-    def wrapper(f: Callable) -> stages.JaCeWrapped:
+    def wrapper(f: Callable[_P, Any]) -> stages.JaCeWrapped[_P]:
         if any(
             param.default is not param.empty for param in inspect.signature(f).parameters.values()
         ):
             raise NotImplementedError("Default values are not yet supported.")
 
-        # TODO(egparedes): Improve typing.
         jace_wrapper = stages.JaCeWrapped(
             fun=f,
             primitive_translators=(
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 0477c72..381e8df 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -29,7 +29,7 @@
 
 import copy
 import inspect
-from typing import TYPE_CHECKING, Any, Union
+from typing import TYPE_CHECKING, Any, Generic, ParamSpec, Union
 
 from jax import tree_util as jax_tree
 
@@ -59,8 +59,15 @@
 #: Known compilation stages in JaCe.
 Stage = Union["JaCeWrapped", "JaCeLowered", "JaCeCompiled"]
 
+# Used for type annotation of the `Stages`, it is important that the return type can
+#  not be annotated, because JaCe will modify it, in case it is a scalar. Thus the
+#  return type is not annotated. Furthermore, because static arguments change the
+#  signature (in a runtime dependent manor) `JaCeCompiled.__call__()` can not be
+#  annotated as well. For that reason only the arguments are annotated.
+_P = ParamSpec("_P")
 
-class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
+
+class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P]):
     """
     A function ready to be specialized, lowered, and compiled.
 
@@ -90,13 +97,13 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
         which is implicitly and temporary activated during tracing.
     """
 
-    _fun: Callable
+    _fun: Callable[_P, Any]
     _primitive_translators: dict[str, translator.PrimitiveTranslator]
     _jit_options: dict[str, Any]
 
     def __init__(
         self,
-        fun: Callable,
+        fun: Callable[_P, Any],
         primitive_translators: Mapping[str, translator.PrimitiveTranslator],
         jit_options: Mapping[str, Any],
     ) -> None:
@@ -108,7 +115,7 @@ def __init__(
         self._jit_options = {**jit_options}
         self._fun = fun
 
-    def __call__(self, *args: Any, **kwargs: Any) -> Any:
+    def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> Any:
         """
         Executes the wrapped function, lowering and compiling as needed in one step.
 
@@ -129,7 +136,7 @@ def __call__(self, *args: Any, **kwargs: Any) -> Any:
         return compiled(*args, **kwargs)
 
     @tcache.cached_transition
-    def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
+    def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered:
         """
         Lower the wrapped computation for the given arguments.
 
diff --git a/tests/integration_tests/test_empty_jaxpr.py b/tests/integration_tests/test_empty_jaxpr.py
index 24d8420..58f8f65 100644
--- a/tests/integration_tests/test_empty_jaxpr.py
+++ b/tests/integration_tests/test_empty_jaxpr.py
@@ -71,7 +71,7 @@ def test_empty_scalar() -> None:
     def wrapped(a: np.float64) -> np.float64:
         return a
 
-    a = np.pi
+    a = np.float64(np.pi)
 
     assert np.all(wrapped(a) == a)
 
@@ -82,7 +82,7 @@ def test_empty_nested() -> None:
     def wrapped(a: np.float64) -> np.float64:
         return jax.jit(lambda a: a)(a)
 
-    a = np.pi
+    a = np.float64(np.pi)
 
     assert np.all(wrapped(a) == a)
 
diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index c72b9bf..7cab00b 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -190,24 +190,24 @@ def test_subtranslatior_managing_decoupling() -> None:
 
     # This will use the translators that are currently installed.
     @jace.jit
-    def foo(a: int) -> int:
-        b = a + 1
-        c = b + 1
-        d = c + 1
-        return d + 1
+    def foo(a: np.ndarray) -> np.ndarray:
+        b = a + np.int32(1)
+        c = b + np.int32(1)
+        d = c + np.int32(1)
+        return d + np.int32(1)
 
     # Now register the add translator.
     translator.register_primitive_translator(fake_add_translator, overwrite=True)
 
     # Since `foo` was already constructed, a new registering can not change anything.
-    a = np.zeros((10, 10))
+    a = np.zeros((10, 10), dtype=np.int32)
     assert np.all(foo(a) == 4)
 
     # But if we now annotate a new function, then we will get fake translator
     @jace.jit
-    def foo_fail(a):
-        b = a + 1
-        return b + 1
+    def foo_fail(a: np.ndarray) -> np.ndarray:
+        b = a + np.int32(1)
+        return b + np.int32(1)
 
     with pytest.raises(
         expected_exception=NotImplementedError,

From 54374d3544e24f84dc4cb79859b6e4a77b648906 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 18 Jun 2024 08:43:12 +0200
Subject: [PATCH 385/458] Added partial support for return value typing in the
 stages.

See the big note in the beginning of `jace.stages` to learn more.
Essentially this is the correct maximum.
---
 src/jace/api.py                               | 19 ++++++----
 src/jace/stages.py                            | 37 +++++++++++--------
 .../test_primitive_copy.py                    |  2 +-
 .../test_jaxpr_translator_builder.py          |  2 +-
 tests/unit_tests/test_caching.py              |  6 +--
 5 files changed, 38 insertions(+), 28 deletions(-)

diff --git a/src/jace/api.py b/src/jace/api.py
index c344c40..ebd97cc 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -11,7 +11,7 @@
 
 import functools
 import inspect
-from typing import TYPE_CHECKING, Any, Literal, ParamSpec, overload
+from typing import TYPE_CHECKING, Any, Literal, ParamSpec, TypeVar, overload
 
 from jax import grad, jacfwd, jacrev
 
@@ -24,7 +24,9 @@
 
 __all__ = ["grad", "jacfwd", "jacrev", "jit"]
 
+# Used for type annotation, see the notes in `jace.stages` for more.
 _P = ParamSpec("_P")
+_RetrunType = TypeVar("_RetrunType")
 
 
 @overload
@@ -33,24 +35,27 @@ def jit(
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> Callable[[Callable[_P, Any]], stages.JaCeWrapped[_P]]: ...
+) -> Callable[[Callable[_P, _RetrunType]], stages.JaCeWrapped[_P, _RetrunType]]: ...
 
 
 @overload
 def jit(
-    fun: Callable[_P, Any],
+    fun: Callable[_P, _RetrunType],
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> stages.JaCeWrapped[_P]: ...
+) -> stages.JaCeWrapped[_P, _RetrunType]: ...
 
 
 def jit(
-    fun: Callable[_P, Any] | None = None,
+    fun: Callable[_P, _RetrunType] | None = None,
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Any,
-) -> Callable[[Callable[_P, Any]], stages.JaCeWrapped[_P]] | stages.JaCeWrapped[_P]:
+) -> (
+    Callable[[Callable[_P, _RetrunType]], stages.JaCeWrapped[_P, _RetrunType]]
+    | stages.JaCeWrapped[_P, _RetrunType]
+):
     """
     JaCe's replacement for `jax.jit` (just-in-time) wrapper.
 
@@ -74,7 +79,7 @@ def jit(
             f"The following arguments to 'jace.jit' are not yet supported: {', '.join(kwargs)}."
         )
 
-    def wrapper(f: Callable[_P, Any]) -> stages.JaCeWrapped[_P]:
+    def wrapper(f: Callable[_P, _RetrunType]) -> stages.JaCeWrapped[_P, _RetrunType]:
         if any(
             param.default is not param.empty for param in inspect.signature(f).parameters.values()
         ):
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 381e8df..7df7a2e 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -29,7 +29,7 @@
 
 import copy
 import inspect
-from typing import TYPE_CHECKING, Any, Generic, ParamSpec, Union
+from typing import TYPE_CHECKING, Any, Generic, ParamSpec, TypeVar, Union
 
 from jax import tree_util as jax_tree
 
@@ -59,15 +59,20 @@
 #: Known compilation stages in JaCe.
 Stage = Union["JaCeWrapped", "JaCeLowered", "JaCeCompiled"]
 
-# Used for type annotation of the `Stages`, it is important that the return type can
-#  not be annotated, because JaCe will modify it, in case it is a scalar. Thus the
-#  return type is not annotated. Furthermore, because static arguments change the
-#  signature (in a runtime dependent manor) `JaCeCompiled.__call__()` can not be
-#  annotated as well. For that reason only the arguments are annotated.
+# These are used to annotated the `Stages`, however, there are some limitations.
+#  First, the only stage that is fully annotated is `JaCeWrapped`. Second, since
+#  static arguments modify the type signature of `JaCeCompiled.__call__()`, see
+#  [Jax](https://jax.readthedocs.io/en/latest/aot.html#lowering-with-static-arguments)
+#  for more, its argument can not be annotated, only its return type can.
+#  However, in case of scalar return values, the return type is wrong anyway, since
+#  JaCe and Jax for that matter, transforms scalars to arrays. Since there is no way of
+#  changing that, but from a semantic point they behave the same so it should not
+#  matter too much.
 _P = ParamSpec("_P")
+_RetrunType = TypeVar("_RetrunType")
 
 
-class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P]):
+class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P, _RetrunType]):
     """
     A function ready to be specialized, lowered, and compiled.
 
@@ -97,13 +102,13 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P]):
         which is implicitly and temporary activated during tracing.
     """
 
-    _fun: Callable[_P, Any]
+    _fun: Callable[_P, _RetrunType]
     _primitive_translators: dict[str, translator.PrimitiveTranslator]
     _jit_options: dict[str, Any]
 
     def __init__(
         self,
-        fun: Callable[_P, Any],
+        fun: Callable[_P, _RetrunType],
         primitive_translators: Mapping[str, translator.PrimitiveTranslator],
         jit_options: Mapping[str, Any],
     ) -> None:
@@ -115,7 +120,7 @@ def __init__(
         self._jit_options = {**jit_options}
         self._fun = fun
 
-    def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> Any:
+    def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> _RetrunType:
         """
         Executes the wrapped function, lowering and compiling as needed in one step.
 
@@ -136,7 +141,7 @@ def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> Any:
         return compiled(*args, **kwargs)
 
     @tcache.cached_transition
-    def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered:
+    def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered[_RetrunType]:
         """
         Lower the wrapped computation for the given arguments.
 
@@ -198,7 +203,7 @@ def _make_call_description(
         )
 
 
-class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
+class JaCeLowered(tcache.CachingStage["JaCeCompiled"], Generic[_RetrunType]):
     """
     Represents the original computation as an SDFG.
 
@@ -233,7 +238,7 @@ def __init__(
         self._outtree = outtree
 
     @tcache.cached_transition
-    def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled:
+    def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled[_RetrunType]:
         """
         Optimize and compile the lowered SDFG using `compiler_options`.
 
@@ -292,7 +297,7 @@ def _make_call_description(
         )
 
 
-class JaCeCompiled:
+class JaCeCompiled(Generic[_RetrunType]):
     """
     Compiled version of the SDFG.
 
@@ -327,7 +332,7 @@ def __init__(
         self._csdfg = csdfg
         self._outtree = outtree
 
-    def __call__(self, *args: Any, **kwargs: Any) -> Any:
+    def __call__(self, *args: Any, **kwargs: Any) -> _RetrunType:
         """
         Calls the embedded computation.
 
@@ -340,7 +345,7 @@ def __call__(self, *args: Any, **kwargs: Any) -> Any:
         flat_call_args = jax_tree.tree_leaves((args, kwargs))
         flat_output = self._csdfg(flat_call_args)
         if flat_output is None:
-            return None
+            return None  # type: ignore[return-value]  # Type confusion.
         return jax_tree.tree_unflatten(self._outtree, flat_output)
 
 
diff --git a/tests/integration_tests/primitive_translators/test_primitive_copy.py b/tests/integration_tests/primitive_translators/test_primitive_copy.py
index 0d3b566..11fefc9 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_copy.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_copy.py
@@ -25,5 +25,5 @@ def testee(a: np.ndarray) -> jax.Array:
     res = testee(a)
     assert a.dtype == res.dtype
     assert a.shape == res.shape
-    assert a.__array_interface__["data"][0] != res.__array_interface__["data"][0]
+    assert a.__array_interface__["data"][0] != res.__array_interface__["data"][0]  # type: ignore[attr-defined]
     assert np.all(res == a)
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index 60f791a..ebbc075 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -524,7 +524,7 @@ def wrapped(a: np.float64) -> np.float64:
     res = wrapped(a)
     assert res.shape == (1,)
     assert res.dtype == np.float64
-    assert res[0] == np.float64(1.0)
+    assert np.all(res == np.float64(1.0))
 
 
 def test_builder_multiple_return_values() -> None:
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index 3b0b7a4..a6fa29b 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -37,11 +37,11 @@ def wrapped(a: np.ndarray) -> jax.Array:
     ref = np.sin(a)
     res_ids: set[int] = set()
     # We have to store the array, because numpy does reuse the memory.
-    res_set: list[np.ndarray] = []
+    res_set: list[jax.Array] = []
 
     for _ in range(10):
         res = wrapped(a)
-        res_id = res.__array_interface__["data"][0]
+        res_id = res.__array_interface__["data"][0]  # type: ignore[attr-defined]
 
         assert np.allclose(res, ref)
         assert lowering_cnt[0] == 1
@@ -62,7 +62,7 @@ def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:
 
     # this is the wrapped function.
     @jace.jit
-    def wrapped(a, b):
+    def wrapped(a: np.ndarray, b: np.ndarray) -> np.ndarray:
         lowering_cnt[0] += 1
         return testee(a, b)
 

From 261d90254c42510d6cc80913aefa2d7c2134eac3 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 18 Jun 2024 08:48:14 +0200
Subject: [PATCH 386/458] Imporved typing in the tracing signature.

---
 src/jace/tracing.py | 13 +++++++------
 1 file changed, 7 insertions(+), 6 deletions(-)

diff --git a/src/jace/tracing.py b/src/jace/tracing.py
index f07fb94..a9a98d0 100644
--- a/src/jace/tracing.py
+++ b/src/jace/tracing.py
@@ -16,7 +16,7 @@
 from __future__ import annotations
 
 import inspect
-from typing import TYPE_CHECKING, Any, Concatenate, Literal, ParamSpec, overload
+from typing import TYPE_CHECKING, Any, Literal, ParamSpec, TypeVar, overload
 
 import jax
 from jax import tree_util as jax_tree
@@ -26,26 +26,27 @@
     from collections.abc import Callable, Mapping
 
 _P = ParamSpec("_P")
+_RetrunType = TypeVar("_RetrunType")
 
 
 @overload
 def make_jaxpr(
-    fun: Callable[Concatenate[_P], Any],
+    fun: Callable[_P, _RetrunType],
     trace_options: Mapping[str, Any],
     return_outtree: Literal[True],
-) -> Callable[Concatenate[_P], tuple[jax.core.ClosedJaxpr, jax_tree.PyTreeDef]]: ...
+) -> Callable[_P, tuple[jax.core.ClosedJaxpr, jax_tree.PyTreeDef]]: ...
 
 
 @overload
 def make_jaxpr(
-    fun: Callable[Concatenate[_P], Any],
+    fun: Callable[_P, _RetrunType],
     trace_options: Mapping[str, Any],
     return_outtree: Literal[False] = False,
-) -> Callable[Concatenate[_P], jax.core.ClosedJaxpr]: ...
+) -> Callable[_P, jax.core.ClosedJaxpr]: ...
 
 
 def make_jaxpr(
-    fun: Callable[Concatenate[_P], Any],
+    fun: Callable[_P, Any],
     trace_options: Mapping[str, Any],
     return_outtree: bool = False,
 ) -> (

From 027ae355f38ed6b0b9f69b723436e768dd559bf9 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 18 Jun 2024 09:11:34 +0200
Subject: [PATCH 387/458] The options for Jit are now represented as a
 `TypedDict`.

---
 src/jace/api.py     | 22 +++++++++++++++++-----
 src/jace/stages.py  |  6 +++---
 src/jace/tracing.py | 12 ++++++------
 3 files changed, 26 insertions(+), 14 deletions(-)

diff --git a/src/jace/api.py b/src/jace/api.py
index ebd97cc..da42139 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -11,9 +11,10 @@
 
 import functools
 import inspect
-from typing import TYPE_CHECKING, Any, Literal, ParamSpec, TypeVar, overload
+from typing import TYPE_CHECKING, Literal, ParamSpec, TypedDict, TypeVar, overload
 
 from jax import grad, jacfwd, jacrev
+from typing_extensions import Unpack
 
 from jace import stages, translator
 
@@ -22,19 +23,30 @@
     from collections.abc import Callable, Mapping
 
 
-__all__ = ["grad", "jacfwd", "jacrev", "jit"]
+__all__ = ["JitOptions", "grad", "jacfwd", "jacrev", "jit"]
 
 # Used for type annotation, see the notes in `jace.stages` for more.
 _P = ParamSpec("_P")
 _RetrunType = TypeVar("_RetrunType")
 
 
+class JitOptions(TypedDict, total=False):
+    """
+    All known options to `jace.jit` that influence tracing.
+
+    Notes:
+        Currently there are no known options, but essentially it is a subset of some
+        of the options that are supported by `jax.jit` together with some additional
+        JaCe specific ones.
+    """
+
+
 @overload
 def jit(
     fun: Literal[None] = None,
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
-    **kwargs: Any,
+    **kwargs: Unpack[JitOptions],
 ) -> Callable[[Callable[_P, _RetrunType]], stages.JaCeWrapped[_P, _RetrunType]]: ...
 
 
@@ -43,7 +55,7 @@ def jit(
     fun: Callable[_P, _RetrunType],
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
-    **kwargs: Any,
+    **kwargs: Unpack[JitOptions],
 ) -> stages.JaCeWrapped[_P, _RetrunType]: ...
 
 
@@ -51,7 +63,7 @@ def jit(
     fun: Callable[_P, _RetrunType] | None = None,
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
-    **kwargs: Any,
+    **kwargs: Unpack[JitOptions],
 ) -> (
     Callable[[Callable[_P, _RetrunType]], stages.JaCeWrapped[_P, _RetrunType]]
     | stages.JaCeWrapped[_P, _RetrunType]
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 7df7a2e..d49e150 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -34,7 +34,7 @@
 from jax import tree_util as jax_tree
 
 import jace
-from jace import optimization, tracing, translator, util
+from jace import api, optimization, tracing, translator, util
 from jace.optimization import CompilerOptions
 from jace.translator import pre_post_translation as ptrans
 from jace.util import translation_cache as tcache
@@ -104,13 +104,13 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P, _RetrunType]):
 
     _fun: Callable[_P, _RetrunType]
     _primitive_translators: dict[str, translator.PrimitiveTranslator]
-    _jit_options: dict[str, Any]
+    _jit_options: api.JitOptions
 
     def __init__(
         self,
         fun: Callable[_P, _RetrunType],
         primitive_translators: Mapping[str, translator.PrimitiveTranslator],
-        jit_options: Mapping[str, Any],
+        jit_options: api.JitOptions,
     ) -> None:
         assert all(
             param.default is param.empty for param in inspect.signature(fun).parameters.values()
diff --git a/src/jace/tracing.py b/src/jace/tracing.py
index a9a98d0..29b7eda 100644
--- a/src/jace/tracing.py
+++ b/src/jace/tracing.py
@@ -23,7 +23,9 @@
 
 
 if TYPE_CHECKING:
-    from collections.abc import Callable, Mapping
+    from collections.abc import Callable
+
+    from jace import api
 
 _P = ParamSpec("_P")
 _RetrunType = TypeVar("_RetrunType")
@@ -32,7 +34,7 @@
 @overload
 def make_jaxpr(
     fun: Callable[_P, _RetrunType],
-    trace_options: Mapping[str, Any],
+    trace_options: api.JitOptions,
     return_outtree: Literal[True],
 ) -> Callable[_P, tuple[jax.core.ClosedJaxpr, jax_tree.PyTreeDef]]: ...
 
@@ -40,14 +42,14 @@ def make_jaxpr(
 @overload
 def make_jaxpr(
     fun: Callable[_P, _RetrunType],
-    trace_options: Mapping[str, Any],
+    trace_options: api.JitOptions,
     return_outtree: Literal[False] = False,
 ) -> Callable[_P, jax.core.ClosedJaxpr]: ...
 
 
 def make_jaxpr(
     fun: Callable[_P, Any],
-    trace_options: Mapping[str, Any],
+    trace_options: api.JitOptions,
     return_outtree: bool = False,
 ) -> (
     Callable[_P, tuple[jax.core.ClosedJaxpr, jax_tree.PyTreeDef]]
@@ -60,8 +62,6 @@ def make_jaxpr(
     the output. By default the callable will only return the Jaxpr, however, by setting
     `return_outtree` the function will also return the output tree, this is different
     from the `return_shape` of `jax.make_jaxpr()`.
-    Furthermore, this function accepts all tracing parameters, passed through the
-    `trace_options` map that `@jace.jit` supports.
 
     Currently the tracing is always performed with an enabled `x64` mode.
 

From 7cdb5f5add86e2266b25cadac1bb12fab03e86f2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 18 Jun 2024 09:55:02 +0200
Subject: [PATCH 388/458] Integrated part of teh development branch into the
 new PR branch.

Essentially it is a partially copy of `src/jace` from the development branch (027ae355f38ed) to this branch.
However, the translators were not copied, thus they are still WIP mode.
Furthermore, all changes to the test were made such that they pass, i.e. they are in WIP mode.
---
 src/jace/__init__.py                          |   3 +
 src/jace/api.py                               |  59 +-
 src/jace/optimization.py                      |  26 +-
 src/jace/stages.py                            | 371 +++++++-----
 src/jace/tracing.py                           | 123 ++++
 src/jace/translated_jaxpr_sdfg.py             | 229 ++++++++
 src/jace/translator/__init__.py               |   2 -
 .../translator/jaxpr_translator_builder.py    |  83 +--
 src/jace/translator/post_translation.py       | 108 ----
 src/jace/translator/pre_post_translation.py   | 251 ++++++++
 src/jace/translator/primitive_translator.py   |   6 +-
 src/jace/translator/translated_jaxpr_sdfg.py  |  71 ---
 src/jace/util/__init__.py                     |   6 +
 src/jace/util/dace_helper.py                  | 144 -----
 src/jace/util/jax_helper.py                   |  18 +-
 src/jace/util/traits.py                       |  40 +-
 src/jace/util/translation_cache.py            | 123 ++--
 tests/test_caching.py                         |  11 +-
 tests/test_jaxpr_translator_builder.py        | 539 ------------------
 tests/test_subtranslator_helper.py            |   6 +-
 20 files changed, 1087 insertions(+), 1132 deletions(-)
 create mode 100644 src/jace/tracing.py
 create mode 100644 src/jace/translated_jaxpr_sdfg.py
 delete mode 100644 src/jace/translator/post_translation.py
 create mode 100644 src/jace/translator/pre_post_translation.py
 delete mode 100644 src/jace/translator/translated_jaxpr_sdfg.py
 delete mode 100644 src/jace/util/dace_helper.py
 delete mode 100644 tests/test_jaxpr_translator_builder.py

diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 11c5d2a..7d2536c 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -13,9 +13,12 @@
 
 from .__about__ import __author__, __copyright__, __license__, __version__, __version_info__
 from .api import grad, jacfwd, jacrev, jit
+from .translated_jaxpr_sdfg import CompiledJaxprSDFG, TranslatedJaxprSDFG
 
 
 __all__ = [
+    "CompiledJaxprSDFG",
+    "TranslatedJaxprSDFG",
     "__author__",
     "__copyright__",
     "__license__",
diff --git a/src/jace/api.py b/src/jace/api.py
index 8afc20a..da42139 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -10,9 +10,11 @@
 from __future__ import annotations
 
 import functools
-from typing import TYPE_CHECKING, Any, Literal, overload
+import inspect
+from typing import TYPE_CHECKING, Literal, ParamSpec, TypedDict, TypeVar, overload
 
 from jax import grad, jacfwd, jacrev
+from typing_extensions import Unpack
 
 from jace import stages, translator
 
@@ -21,7 +23,22 @@
     from collections.abc import Callable, Mapping
 
 
-__all__ = ["grad", "jacfwd", "jacrev", "jit"]
+__all__ = ["JitOptions", "grad", "jacfwd", "jacrev", "jit"]
+
+# Used for type annotation, see the notes in `jace.stages` for more.
+_P = ParamSpec("_P")
+_RetrunType = TypeVar("_RetrunType")
+
+
+class JitOptions(TypedDict, total=False):
+    """
+    All known options to `jace.jit` that influence tracing.
+
+    Notes:
+        Currently there are no known options, but essentially it is a subset of some
+        of the options that are supported by `jax.jit` together with some additional
+        JaCe specific ones.
+    """
 
 
 @overload
@@ -29,31 +46,35 @@ def jit(
     fun: Literal[None] = None,
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
-    **kwargs: Any,
-) -> Callable[[Callable], stages.JaCeWrapped]: ...
+    **kwargs: Unpack[JitOptions],
+) -> Callable[[Callable[_P, _RetrunType]], stages.JaCeWrapped[_P, _RetrunType]]: ...
 
 
 @overload
 def jit(
-    fun: Callable,
+    fun: Callable[_P, _RetrunType],
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
-    **kwargs: Any,
-) -> stages.JaCeWrapped: ...
+    **kwargs: Unpack[JitOptions],
+) -> stages.JaCeWrapped[_P, _RetrunType]: ...
 
 
 def jit(
-    fun: Callable | None = None,
+    fun: Callable[_P, _RetrunType] | None = None,
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
-    **kwargs: Any,
-) -> stages.JaCeWrapped | Callable[[Callable], stages.JaCeWrapped]:
+    **kwargs: Unpack[JitOptions],
+) -> (
+    Callable[[Callable[_P, _RetrunType]], stages.JaCeWrapped[_P, _RetrunType]]
+    | stages.JaCeWrapped[_P, _RetrunType]
+):
     """
     JaCe's replacement for `jax.jit` (just-in-time) wrapper.
 
-    It works the same way as `jax.jit` does, but instead of using XLA the
-    computation is lowered to DaCe. In addition it accepts some JaCe specific
-    arguments.
+    It works the same way as `jax.jit` does, but instead of lowering the
+    computation to XLA, it is lowered to DaCe.
+    The function supports a subset of the arguments that are accepted by `jax.jit()`,
+    currently none, and some JaCe specific ones.
 
     Args:
         fun: Function to wrap.
@@ -61,8 +82,8 @@ def jit(
             If not specified the translators in the global registry are used.
         kwargs: Jit arguments.
 
-    Notes:
-        After constructions any change to `primitive_translators` has no effect.
+    Note:
+        This function is the only valid way to obtain a JaCe computation.
     """
     if kwargs:
         # TODO(phimuell): Add proper name verification and exception type.
@@ -70,8 +91,12 @@ def jit(
             f"The following arguments to 'jace.jit' are not yet supported: {', '.join(kwargs)}."
         )
 
-    def wrapper(f: Callable) -> stages.JaCeWrapped:
-        # TODO(egparedes): Improve typing.
+    def wrapper(f: Callable[_P, _RetrunType]) -> stages.JaCeWrapped[_P, _RetrunType]:
+        if any(
+            param.default is not param.empty for param in inspect.signature(f).parameters.values()
+        ):
+            raise NotImplementedError("Default values are not yet supported.")
+
         jace_wrapper = stages.JaCeWrapped(
             fun=f,
             primitive_translators=(
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index b5af4fa..1346186 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -5,11 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""
-JaCe specific optimizations.
-
-Currently just a dummy exists for the sake of providing a callable function.
-"""
+"""JaCe specific optimizations."""
 
 from __future__ import annotations
 
@@ -19,7 +15,7 @@
 
 
 if TYPE_CHECKING:
-    from jace import translator
+    import jace
 
 
 class CompilerOptions(TypedDict, total=False):
@@ -35,15 +31,24 @@ class CompilerOptions(TypedDict, total=False):
 
     auto_optimize: bool
     simplify: bool
+    persistent: bool
 
 
 # TODO(phimuell): Add a context manager to modify the default.
-DEFAULT_OPTIMIZATIONS: Final[CompilerOptions] = {"auto_optimize": True, "simplify": True}
+DEFAULT_OPTIMIZATIONS: Final[CompilerOptions] = {
+    "auto_optimize": True,
+    "simplify": True,
+    "persistent": True,
+}
 
-NO_OPTIMIZATIONS: Final[CompilerOptions] = {"auto_optimize": False, "simplify": False}
+NO_OPTIMIZATIONS: Final[CompilerOptions] = {
+    "auto_optimize": False,
+    "simplify": False,
+    "persistent": False,
+}
 
 
-def jace_optimize(tsdfg: translator.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOptions]) -> None:  # noqa: D417  # Missing description for kwargs
+def jace_optimize(tsdfg: jace.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOptions]) -> None:  # noqa: D417  # Missing description for kwargs
     """
     Performs optimization of the translated SDFG _in place_.
 
@@ -55,6 +60,9 @@ def jace_optimize(tsdfg: translator.TranslatedJaxprSDFG, **kwargs: Unpack[Compil
         tsdfg: The translated SDFG that should be optimized.
         simplify: Run the simplification pipeline.
         auto_optimize: Run the auto optimization pipeline (currently does nothing)
+        persistent:  Make the memory allocation persistent, i.e. allocate the
+            transients only once at the beginning and then reuse the memory across
+            the lifetime of the SDFG.
     """
     # Currently this function exists primarily for the same of existing.
 
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 4639b11..8b6bb5e 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -8,35 +8,36 @@
 Reimplementation of the `jax.stages` module.
 
 This module reimplements the public classes of that Jax module.
-However, they are a bit different, because JaCe uses DaCe as backend.
+However, because JaCe uses DaCe as backend they differ is some small aspects.
 
 As in Jax JaCe has different stages, the terminology is taken from
 [Jax' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
 - Stage out:
-    In this phase an executable Python function is translated to Jaxpr.
+    In this phase an executable Python function is translated to a Jaxpr.
 - Lower:
-    This will transform the Jaxpr into an SDFG equivalent. As a implementation
-    note, currently this and the previous step are handled as a single step.
+    This will transform the Jaxpr into its SDFG equivalent.
 - Compile:
-    This will turn the SDFG into an executable object, see `dace.codegen.CompiledSDFG`.
+    This will turn the SDFG into an executable object.
 - Execution:
     This is the actual running of the computation.
 
-As in Jax the `stages` module give access to the last three stages, but not
-the first one.
+As in Jax the in JaCe the user only has access to the last tree stages and
+staging out and lowering is handled as a single step.
 """
 
 from __future__ import annotations
 
 import copy
-from typing import TYPE_CHECKING, Any
+import inspect
+from typing import TYPE_CHECKING, Any, Generic, ParamSpec, TypeVar, Union
 
-import jax as _jax
+from jax import tree_util as jax_tree
 
-from jace import optimization, translator, util
+import jace
+from jace import api, optimization, tracing, translated_jaxpr_sdfg, translator, util
 from jace.optimization import CompilerOptions
-from jace.translator import post_translation as ptrans
-from jace.util import dace_helper, translation_cache as tcache
+from jace.translator import pre_post_translation as ptrans
+from jace.util import translation_cache as tcache
 
 
 if TYPE_CHECKING:
@@ -50,21 +51,42 @@
     "JaCeLowered",
     "JaCeWrapped",
     "Stage",
+    "finalize_compilation_options",
+    "get_active_compiler_options",
+    "update_active_compiler_options",
 ]
 
-
-class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
+#: Known compilation stages in JaCe.
+Stage = Union["JaCeWrapped", "JaCeLowered", "JaCeCompiled"]
+
+# These are used to annotated the `Stages`, however, there are some limitations.
+#  First, the only stage that is fully annotated is `JaCeWrapped`. Second, since
+#  static arguments modify the type signature of `JaCeCompiled.__call__()`, see
+#  [Jax](https://jax.readthedocs.io/en/latest/aot.html#lowering-with-static-arguments)
+#  for more, its argument can not be annotated, only its return type can.
+#  However, in case of scalar return values, the return type is wrong anyway, since
+#  JaCe and Jax for that matter, transforms scalars to arrays. Since there is no way of
+#  changing that, but from a semantic point they behave the same so it should not
+#  matter too much.
+_P = ParamSpec("_P")
+_RetrunType = TypeVar("_RetrunType")
+
+
+class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P, _RetrunType]):
     """
     A function ready to be specialized, lowered, and compiled.
 
     This class represents the output of functions such as `jace.jit()` and is
     the first stage in the translation/compilation chain of JaCe. A user should
     never create a `JaCeWrapped` object directly, instead `jace.jit` should be
-    used for that. While it supports just-in-time lowering and compilation, by
-    just calling it, these steps can also be performed explicitly. The lowering
-    performed by this stage is cached, thus if a `JaCeWrapped` object is lowered
-    later, with the same argument the result is taken from the cache.
-    Furthermore, a `JaCeWrapped` object is composable with all Jax transformations.
+    used. While it supports just-in-time lowering and compilation, by just
+    calling it, these steps can also be performed explicitly.
+    The lowering, performed by this stage is cached, thus if a `JaCeWrapped`
+    object is later lowered with the same arguments the result might be taken
+    from the cache.
+
+    Furthermore, a `JaCeWrapped` object is composable with all Jax transformations,
+    all other stages are not.
 
     Args:
         fun: The function that is wrapped.
@@ -72,181 +94,182 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"]):
         jit_options: Options to influence the jit process.
 
     Todo:
-        - Support pytrees.
-        - Support keyword arguments and default values of the wrapped function.
+        - Support default values of the wrapped function.
         - Support static arguments.
 
     Note:
         The tracing of function will always happen with enabled `x64` mode,
-        which is implicitly and temporary activated while tracing.
+        which is implicitly and temporary activated during tracing.
     """
 
-    _fun: Callable
+    _fun: Callable[_P, _RetrunType]
     _primitive_translators: dict[str, translator.PrimitiveTranslator]
-    _jit_options: dict[str, Any]
+    _jit_options: api.JitOptions
 
     def __init__(
         self,
-        fun: Callable,
+        fun: Callable[_P, _RetrunType],
         primitive_translators: Mapping[str, translator.PrimitiveTranslator],
-        jit_options: Mapping[str, Any],
+        jit_options: api.JitOptions,
     ) -> None:
+        assert all(
+            param.default is param.empty for param in inspect.signature(fun).parameters.values()
+        )
         super().__init__()
-        # We have to shallow copy both the translator and the jit options.
-        #  This prevents that any modifications affect `self`.
-        #  Shallow is enough since the translators themselves are immutable.
         self._primitive_translators = {**primitive_translators}
-        # TODO(phimuell): Do we need to deepcopy the options?
         self._jit_options = {**jit_options}
         self._fun = fun
 
-    def __call__(self, *args: Any, **kwargs: Any) -> Any:
+    def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> _RetrunType:
         """
         Executes the wrapped function, lowering and compiling as needed in one step.
 
-        The arguments passed to this function are the same as the wrapped function uses.
+        This function will lower and compile in one go. The function accepts the same
+        arguments as the original computation and the return value is unflattened.
+
+        Note:
+            This function is also aware if a Jax tracing is going on. In this
+            case, it will forward the computation.
+            Currently, this function ignores the value of `jax.disable_jit()`.
         """
-        # If we are inside a traced context, then we forward the call to the wrapped
-        #  function. This ensures that JaCe is composable with Jax.
         if util.is_tracing_ongoing(*args, **kwargs):
             return self._fun(*args, **kwargs)
 
         lowered = self.lower(*args, **kwargs)
         compiled = lowered.compile()
+        # TODO(phimuell): Filter out static arguments
         return compiled(*args, **kwargs)
 
     @tcache.cached_transition
-    def lower(self, *args: Any, **kwargs: Any) -> JaCeLowered:
+    def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered[_RetrunType]:
         """
-        Lower this function explicitly for the given arguments.
+        Lower the wrapped computation for the given arguments.
+
+        Performs the first two steps of the AOT steps described above, i.e. trace the
+        wrapped function with the given arguments and stage it out to a Jaxpr. Then
+        translate it to an SDFG. The result is encapsulated inside a `JaCeLowered`
+        object that can later be compiled.
 
-        Performs the first two steps of the AOT steps described above, i.e.
-        trace the wrapped function with the given arguments and stage it out
-        to a Jaxpr. Then translate it to SDFG. The result is encapsulated
-        inside a `JaCeLowered` object which can later be compiled.
+        It should be noted that the current lowering process will hard code the strides
+        and the storage location of the input inside the SDFG. Thus if the SDFG is
+        lowered with arrays in C order, calling the compiled SDFG with FORTRAN order
+        will result in an error.
 
         Note:
-            The call to the function is cached. As key an abstract description
-            of the call, similar to the tracers used by Jax, is used.
             The tracing is always done with activated `x64` mode.
         """
-        if len(kwargs) != 0:
-            raise NotImplementedError("Currently only positional arguments are supported.")
-
-        # TODO(phimuell): Currently the SDFG that we build only supports `C_CONTIGUOUS`
-        #  memory order. Since we support the paradigm that "everything passed to
-        #  `lower()` should also be accepted as argument to call the result", we forbid
-        #  other memory orders here.
-        if not all((not util.is_array(arg)) or arg.flags["C_CONTIGUOUS"] for arg in args):
-            raise NotImplementedError("Currently can not yet handle strides beside 'C_CONTIGUOUS'.")
-
-        # In Jax `float32` is the main datatype, and they go to great lengths to avoid
-        #  some aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
-        #  However, in this case we will have problems when we call the SDFG, for some
-        #  reasons `CompiledSDFG` does not work in that case correctly, thus we enable
-        #  it for the tracing.
-        with _jax.experimental.enable_x64():
-            builder = translator.JaxprTranslationBuilder(
-                primitive_translators=self._primitive_translators
-            )
-            jaxpr = _jax.make_jaxpr(self._fun)(*args)
-            trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
-
-        # Perform the post processing and turn it into a `TranslatedJaxprSDFG` that can
-        #  be compiled and called later.
-        # NOTE: `tsdfg` was deepcopied as a side effect of post processing.
-        tsdfg: translator.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
+        jaxpr_maker = tracing.make_jaxpr(
+            fun=self._fun,
+            trace_options=self._jit_options,
+            return_outtree=True,
+        )
+        jaxpr, outtree = jaxpr_maker(*args, **kwargs)
+        builder = translator.JaxprTranslationBuilder(
+            primitive_translators=self._primitive_translators
+        )
+        trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
+
+        flat_call_args = jax_tree.tree_leaves((args, kwargs))
+        tsdfg: jace.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
             trans_ctx=trans_ctx,
             fun=self.wrapped_fun,
-            call_args=args,  # Already linearised, since we only accept positional args.
-            intree=None,  # Not yet implemented.
+            flat_call_args=flat_call_args,
         )
 
-        return JaCeLowered(tsdfg)
+        # NOTE: `tsdfg` is deepcopied as a side effect of post processing.
+        return JaCeLowered(tsdfg, outtree)
 
     @property
-    def wrapped_fun(self) -> Callable:
-        """Returns the wrapped function."""
+    def wrapped_fun(self) -> Callable:  # noqa: D102  # No docstring.
         return self._fun
 
-    def _make_call_description(self, *args: Any) -> tcache.StageTransformationSpec:
+    def _make_call_description(
+        self, intree: jax_tree.PyTreeDef, flat_call_args: Sequence[Any]
+    ) -> tcache.StageTransformationSpec:
         """
         Computes the key for the `JaCeWrapped.lower()` call inside the cache.
 
-        The function will compute a full abstract description on its argument.
+        For all non static arguments the function will generate an abstract description
+        of an argument and for all static arguments the concrete value.
+
+        Notes:
+            The abstract description also includes storage location, i.e. if on CPU or
+            on GPU, and the strides of the arrays.
         """
-        call_args = tuple(tcache._AbstractCallArgument.from_value(x) for x in args)
-        return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
+        # TODO(phimuell): Implement static arguments
+        flat_call_args = tuple(tcache._AbstractCallArgument.from_value(x) for x in flat_call_args)
+        return tcache.StageTransformationSpec(
+            stage_id=id(self), flat_call_args=tuple(flat_call_args), intree=intree
+        )
 
 
-class JaCeLowered(tcache.CachingStage["JaCeCompiled"]):
+class JaCeLowered(tcache.CachingStage["JaCeCompiled"], Generic[_RetrunType]):
     """
     Represents the original computation as an SDFG.
 
-    This class is the output type of `JaCeWrapped.lower()` and represents the
-    originally wrapped computation as an SDFG. This stage is followed by the
-    `JaCeCompiled` stage.
+    This class is the output type of `JaCeWrapped.lower()` and represents the original
+    computation as an SDFG. This stage is followed by the `JaCeCompiled` stage, by
+    calling `self.compile()`. A user should never directly construct a `JaCeLowered`
+    object directly, instead `JaCeWrapped.lower()` should be used.
+
+    Before the SDFG is compiled it is optimized, see `JaCeLowered.compile()` for how to
+    control the process.
 
     Args:
-        tsdfg: The translated SDFG object representing the computation.
+        tsdfg: The lowered SDFG with metadata.
+        outtree: The pytree describing how to unflatten the output.
 
     Note:
-        `self` will manage the passed `tsdfg` object. Modifying it results in
-        undefined behavior. Although `JaCeWrapped` is composable with Jax
-        transformations `JaCeLowered` is not. A user should never create such
-        an object, instead `JaCeWrapped.lower()` should be used.
+        `self` will manage the passed `tsdfg` object. Modifying it results is undefined
+        behavior. Although `JaCeWrapped` is composable with Jax transformations
+        `JaCeLowered` is not.
     """
 
-    _translated_sdfg: translator.TranslatedJaxprSDFG
+    _translated_sdfg: jace.TranslatedJaxprSDFG
+    _outtree: jax_tree.PyTreeDef
 
-    def __init__(self, tsdfg: translator.TranslatedJaxprSDFG) -> None:
+    def __init__(
+        self,
+        tsdfg: jace.TranslatedJaxprSDFG,
+        outtree: jax_tree.PyTreeDef,
+    ) -> None:
         super().__init__()
         self._translated_sdfg = tsdfg
+        self._outtree = outtree
 
     @tcache.cached_transition
-    def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled:
+    def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled[_RetrunType]:
         """
         Optimize and compile the lowered SDFG using `compiler_options`.
 
-        Returns an object that encapsulates a compiled SDFG object. To influence
-        the various optimizations and compile options of JaCe you can use the
-        `compiler_options` argument. If nothing is specified
-        `jace.optimization.DEFAULT_OPTIMIZATIONS` will be used.
+        To perform the optimizations `jace_optimize()` is used. The actual options that
+        are forwarded to it are obtained by passing `compiler_options` to
+        `finalize_compilation_options()`.
 
-        Note:
-            Before `compiler_options` is forwarded to `jace_optimize()` it
-            will be merged with the default arguments.
+        Args:
+            compiler_options: The optimization options to use.
         """
         # We **must** deepcopy before we do any optimization, because all optimizations
         #  are in place, to properly cache stages, stages needs to be immutable.
-        tsdfg: translator.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
-        optimization.jace_optimize(tsdfg=tsdfg, **self._make_compiler_options(compiler_options))
+        tsdfg: jace.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
+        optimization.jace_optimize(tsdfg=tsdfg, **finalize_compilation_options(compiler_options))
 
         return JaCeCompiled(
-            csdfg=dace_helper.compile_jax_sdfg(tsdfg),
-            inp_names=tsdfg.inp_names,
-            out_names=tsdfg.out_names,
+            csdfg=translated_jaxpr_sdfg.compile_jaxpr_sdfg(tsdfg),
+            outtree=self._outtree,
         )
 
-    def compiler_ir(self, dialect: str | None = None) -> translator.TranslatedJaxprSDFG:
+    def compiler_ir(self, dialect: str | None = None) -> jace.TranslatedJaxprSDFG:
         """
         Returns the internal SDFG.
 
-        The function returns a `TranslatedJaxprSDFG` object. Direct modification
-        of the returned object is forbidden and will cause undefined behaviour.
+        The function returns a `TranslatedJaxprSDFG` object. Direct modification of the
+        returned object is forbidden and results in undefined behaviour.
         """
         if (dialect is None) or (dialect.upper() == "SDFG"):
             return self._translated_sdfg
         raise ValueError(f"Unknown dialect '{dialect}'.")
 
-    def view(self, filename: str | None = None) -> None:
-        """
-        Runs the `view()` method of the underlying SDFG.
-
-        This will open a browser and display the SDFG.
-        """
-        self.compiler_ir().sdfg.view(filename=filename, verbose=False)
-
     def as_sdfg(self) -> dace.SDFG:
         """
         Returns the encapsulated SDFG.
@@ -256,64 +279,130 @@ def as_sdfg(self) -> dace.SDFG:
         return self.compiler_ir().sdfg
 
     def _make_call_description(
-        self, compiler_options: CompilerOptions | None = None
+        self, intree: jax_tree.PyTreeDef, flat_call_args: Sequence[Any]
     ) -> tcache.StageTransformationSpec:
         """
-        This function computes the key for the `self.compile()` call inside the cache.
+        Creates the key for the `self.compile()` transition function.
 
-        The key that is computed by this function is based on the concrete
-        values of the passed compiler options.
+        The key will depend on the final values that were used for optimization, i.e.
+        they it will also include the global set of optimization options.
         """
-        options = self._make_compiler_options(compiler_options)
-        call_args = tuple(sorted(options.items(), key=lambda x: x[0]))
-        return tcache.StageTransformationSpec(stage_id=id(self), call_args=call_args)
+        unflatted_args, unflatted_kwargs = jax_tree.tree_unflatten(intree, flat_call_args)
+        assert (not unflatted_kwargs) and (len(unflatted_args) <= 1)
 
-    @staticmethod
-    def _make_compiler_options(compiler_options: CompilerOptions | None) -> CompilerOptions:
-        return optimization.DEFAULT_OPTIMIZATIONS | (compiler_options or {})
+        options = finalize_compilation_options(unflatted_args[0] if unflatted_args else {})
+        flat_options, optiontree = jax_tree.tree_flatten(options)
+        return tcache.StageTransformationSpec(
+            stage_id=id(self), flat_call_args=tuple(flat_options), intree=optiontree
+        )
 
 
-class JaCeCompiled:
+class JaCeCompiled(Generic[_RetrunType]):
     """
     Compiled version of the SDFG.
 
-    This is the last stage of the jit chain. A user should never create a
+    This is the last stage of the JaCe's jit chain. A user should never create a
     `JaCeCompiled` instance, instead `JaCeLowered.compile()` should be used.
 
+    Since the strides and storage location of the arguments, that where used to lower
+    the computation are hard coded inside the SDFG, a `JaCeCompiled` object can only be
+    called with compatible arguments.
+
     Args:
         csdfg: The compiled SDFG object.
-        inp_names: Names of the SDFG variables used as inputs.
-        out_names: Names of the SDFG variables used as outputs.
+        inp_names: SDFG variables used as inputs.
+        out_names: SDFG variables used as outputs.
+        outtree: Pytree describing how to unflatten the output.
 
     Note:
         The class assumes ownership of its input arguments.
 
     Todo:
-        - Handle pytrees.
+        - Automatic strides adaption.
     """
 
-    _csdfg: dace_helper.CompiledSDFG
-    _inp_names: tuple[str, ...]
-    _out_names: tuple[str, ...]
+    _csdfg: jace.CompiledJaxprSDFG
+    _outtree: jax_tree.PyTreeDef
 
     def __init__(
-        self, csdfg: dace_helper.CompiledSDFG, inp_names: Sequence[str], out_names: Sequence[str]
+        self,
+        csdfg: jace.CompiledJaxprSDFG,
+        outtree: jax_tree.PyTreeDef,
     ) -> None:
-        if (not inp_names) or (not out_names):
-            raise ValueError("Input and output can not be empty.")
         self._csdfg = csdfg
-        self._inp_names = tuple(inp_names)
-        self._out_names = tuple(out_names)
+        self._outtree = outtree
 
-    def __call__(self, *args: Any, **kwargs: Any) -> Any:
+    def __call__(self, *args: Any, **kwargs: Any) -> _RetrunType:
         """
         Calls the embedded computation.
 
-        The arguments must be the same as for the wrapped function, but with
-        all static arguments removed.
+        Note:
+            Unlike the `lower()` function which takes the same arguments as the original
+            computation, to call this function you have to remove all static arguments.
+            Furthermore, all arguments must have strides and storage locations that is
+            compatible with the ones that were used for lowering.
         """
-        return dace_helper.run_jax_sdfg(self._csdfg, self._inp_names, self._out_names, args, kwargs)
+        flat_call_args = jax_tree.tree_leaves((args, kwargs))
+        flat_output = self._csdfg(flat_call_args)
+        if flat_output is None:
+            return None  # type: ignore[return-value]  # Type confusion.
+        return jax_tree.tree_unflatten(self._outtree, flat_output)
 
 
-#: Known compilation stages in JaCe.
-Stage = JaCeWrapped | JaCeLowered | JaCeCompiled
+# <--------------------------- Compilation/Optimization options management
+
+_JACELOWERED_ACTIVE_COMPILE_OPTIONS: CompilerOptions = optimization.DEFAULT_OPTIMIZATIONS.copy()
+"""Global set of currently active compilation/optimization options.
+
+The global set is initialized with `jace.optimization.DEFAULT_OPTIMIZATIONS`. It can be
+managed through `update_active_compiler_options()` and accessed through
+`get_active_compiler_options()`, however, it is advised that a user should use
+`finalize_compilation_options()` for getting the final options that should be used
+for optimization.
+"""
+
+
+def update_active_compiler_options(new_active_options: CompilerOptions) -> CompilerOptions:
+    """
+    Updates the set of active compiler options.
+
+    Merges the options passed as `new_active_options` with the currently active
+    compiler options. This set is used by `JaCeLowered.compile()` to determine
+    which options should be used.
+    The function will return the set of options that was active before the call.
+
+    To obtain the set of currently active options use `get_active_compiler_options()`.
+
+    Todo:
+        Make a proper context manager.
+    """
+    previous_active_options = _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
+    _JACELOWERED_ACTIVE_COMPILE_OPTIONS.update(new_active_options)
+    return previous_active_options
+
+
+def get_active_compiler_options() -> CompilerOptions:
+    """Returns the set of currently active compiler options."""
+    return _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
+
+
+def finalize_compilation_options(compiler_options: CompilerOptions | None) -> CompilerOptions:
+    """
+    Returns the final compilation options.
+
+    There are two different sources of optimization options. The first one is the global
+    set of currently active compiler options. The second one is the options that are
+    passed to this function, which takes precedence. Thus, the `compiler_options`
+    argument describes the difference from the currently active global options.
+
+    This function is used by `JaCeLowered` if it has to determine which options to use
+    for optimization, either for compiling the lowered SDFG or for computing the key.
+
+    Args:
+        compiler_options: The local compilation options.
+
+    See Also:
+        `get_active_compiler_options()` to inspect the set of currently active options
+        and `update_active_compiler_options()` to modify them.
+    """
+    return get_active_compiler_options() | (compiler_options or {})
diff --git a/src/jace/tracing.py b/src/jace/tracing.py
new file mode 100644
index 0000000..29b7eda
--- /dev/null
+++ b/src/jace/tracing.py
@@ -0,0 +1,123 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""
+Implements the tracing machinery that is used to build the Jaxpr.
+
+Essentially, Jax provides `jax.make_jaxpr()` which is essentially a debug utility. Jax
+does not provide any public way to get a Jaxpr. This module provides the necessary
+functionality for use in JaCe.
+"""
+
+from __future__ import annotations
+
+import inspect
+from typing import TYPE_CHECKING, Any, Literal, ParamSpec, TypeVar, overload
+
+import jax
+from jax import tree_util as jax_tree
+
+
+if TYPE_CHECKING:
+    from collections.abc import Callable
+
+    from jace import api
+
+_P = ParamSpec("_P")
+_RetrunType = TypeVar("_RetrunType")
+
+
+@overload
+def make_jaxpr(
+    fun: Callable[_P, _RetrunType],
+    trace_options: api.JitOptions,
+    return_outtree: Literal[True],
+) -> Callable[_P, tuple[jax.core.ClosedJaxpr, jax_tree.PyTreeDef]]: ...
+
+
+@overload
+def make_jaxpr(
+    fun: Callable[_P, _RetrunType],
+    trace_options: api.JitOptions,
+    return_outtree: Literal[False] = False,
+) -> Callable[_P, jax.core.ClosedJaxpr]: ...
+
+
+def make_jaxpr(
+    fun: Callable[_P, Any],
+    trace_options: api.JitOptions,
+    return_outtree: bool = False,
+) -> (
+    Callable[_P, tuple[jax.core.ClosedJaxpr, jax_tree.PyTreeDef]]
+    | Callable[_P, jax.core.ClosedJaxpr]
+):
+    """
+    JaCe's replacement for `jax.make_jaxpr()`.
+
+    Returns a callable object that produces as Jaxpr and optionally a pytree defining
+    the output. By default the callable will only return the Jaxpr, however, by setting
+    `return_outtree` the function will also return the output tree, this is different
+    from the `return_shape` of `jax.make_jaxpr()`.
+
+    Currently the tracing is always performed with an enabled `x64` mode.
+
+    Returns:
+        The function returns a callable, that if passed arguments will performs the
+        tracing on them, this section will describe the return value of that function.
+        If `return_outtree` is `False` the function will simply return the generated
+        Jaxpr. If `return_outtree` is `True` the function will return a pair.
+        The first element is the Jaxpr and the second element is a pytree object
+        that describes the output.
+
+    Args:
+        fun: The original Python computation.
+        trace_options: The options used for tracing, the same arguments that
+            are supported by `jace.jit`.
+        return_outtree: Also return the pytree of the output.
+
+    Todo:
+        - Handle default arguments of `fun`.
+        - Handle static arguments.
+        - Turn `trace_options` into a `TypedDict` and sync with `jace.jit`.
+    """
+    if trace_options:
+        raise NotImplementedError(
+            f"Not supported tracing options: {', '.join(f'{k}' for k in trace_options)}"
+        )
+    assert all(param.default is param.empty for param in inspect.signature(fun).parameters.values())
+
+    def tracer_impl(
+        *args: _P.args,
+        **kwargs: _P.kwargs,
+    ) -> tuple[jax.core.ClosedJaxpr, jax_tree.PyTreeDef] | jax.core.ClosedJaxpr:
+        # In Jax `float32` is the main datatype, and they go to great lengths to avoid
+        #  some aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
+        #  However, in this case we will have problems when we call the SDFG, for some
+        #  reasons `CompiledSDFG` does not work in that case correctly, thus we enable
+        #  it for the tracing.
+        with jax.experimental.enable_x64():
+            # TODO(phimuell): copy the implementation of the real tracing
+            jaxpr_maker = jax.make_jaxpr(
+                fun,
+                **trace_options,
+                return_shape=True,
+            )
+            jaxpr, outshapes = jaxpr_maker(
+                *args,
+                **kwargs,
+            )
+
+        if not return_outtree:
+            return jaxpr
+
+        # Regardless what the documentation of `make_jaxpr` claims, it does not output
+        #  a pytree instead an abstract description of the shape, that we will
+        #  transform into a pytree.
+        outtree = jax_tree.tree_structure(outshapes)
+        return jaxpr, outtree
+
+    return tracer_impl  # type: ignore[return-value]  # Type confusion
diff --git a/src/jace/translated_jaxpr_sdfg.py b/src/jace/translated_jaxpr_sdfg.py
new file mode 100644
index 0000000..bbab2be
--- /dev/null
+++ b/src/jace/translated_jaxpr_sdfg.py
@@ -0,0 +1,229 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Extended versions of `SDFG` and `CompiledSDFG` with additional metadata."""
+
+from __future__ import annotations
+
+import dataclasses
+import os
+import pathlib
+import time
+from typing import TYPE_CHECKING, Any
+
+import dace
+from dace import data as dace_data
+
+from jace import util
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    import numpy as np
+    from dace.codegen import compiled_sdfg
+    from dace.codegen.compiled_sdfg import CompiledSDFG
+
+
+@dataclasses.dataclass(frozen=True, kw_only=True)
+class TranslatedJaxprSDFG:
+    """
+    Encapsulates a translated SDFG with additional the metadata.
+
+    Contrary to the SDFG that is encapsulated inside an `TranslationContext`
+    object, `self` carries a proper SDFG, however:
+    - It does not have `__return*` variables, instead all return arguments are
+        passed by arguments.
+    - All input arguments are passed through arguments mentioned in `inp_names`,
+        while the outputs are passed through `out_names`.
+    - Only variables listed as in/outputs are non transient.
+    - The order inside `inp_names` and `out_names` is the same as in the original Jaxpr.
+    - If an input is used as outputs it appears in both `inp_names` and `out_names`.
+    - Its `arg_names` is set to  `inp_names + out_names`, but arguments that are
+        input and outputs are only listed as inputs.
+
+    The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a
+    `TranslationContext`, that was in turn constructed by
+    `JaxprTranslationBuilder.translate_jaxpr()`, to the
+    `finalize_translation_context()` or preferably to the `postprocess_jaxpr_sdfg()`
+    function.
+
+    Attributes:
+        sdfg: The encapsulated SDFG object.
+        inp_names: SDFG variables used as inputs.
+        out_names: SDFG variables used as outputs.
+
+    Todo:
+        After the SDFG is compiled a lot of code looks strange, because there is
+        no container to store the compiled SDFG and the metadata. This class
+        should be extended to address this need.
+    """
+
+    sdfg: dace.SDFG
+    inp_names: tuple[str, ...]
+    out_names: tuple[str, ...]
+
+    def validate(self) -> bool:
+        """Validate the underlying SDFG."""
+        if any(self.sdfg.arrays[inp].transient for inp in self.inp_names):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Found transient inputs: {(inp for inp in self.inp_names if self.sdfg.arrays[inp].transient)}",
+                self.sdfg,
+                self.sdfg.node_id(self.sdfg.start_state),
+            )
+        if any(self.sdfg.arrays[out].transient for out in self.out_names):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Found transient outputs: {(out for out in self.out_names if self.sdfg.arrays[out].transient)}",
+                self.sdfg,
+                self.sdfg.node_id(self.sdfg.start_state),
+            )
+        if self.sdfg.free_symbols:  # This is a simplification that makes our life simple.
+            raise dace.sdfg.InvalidSDFGError(
+                f"Found free symbols: {self.sdfg.free_symbols}",
+                self.sdfg,
+                self.sdfg.node_id(self.sdfg.start_state),
+            )
+        self.sdfg.validate()
+        return True
+
+
+class CompiledJaxprSDFG:
+    """
+    Compiled version of a `TranslatedJaxprSDFG` instance.
+
+    Essentially this class is a wrapper around DaCe's `CompiledSDFG` object, that
+    supports the calling convention used inside JaCe, as in `DaCe` it is callable.
+    The only valid way to obtain a `CompiledJaxprSDFG` instance is through
+    `compile_jaxpr_sdfg()`.
+
+    Args:
+        csdfg: The `CompiledSDFG` object.
+        inp_names: Names of the SDFG variables used as inputs.
+        out_names: Names of the SDFG variables used as outputs.
+
+    Attributes:
+        csdfg: The `CompiledSDFG` object.
+        sdfg: The encapsulated SDFG object.
+        inp_names: Names of the SDFG variables used as inputs.
+        out_names: Names of the SDFG variables used as outputs.
+
+    Notes:
+        Currently the strides of the input arguments must match the ones that were used
+        for lowering the SDFG.
+        In DaCe the return values are allocated on a per `CompiledSDFG` basis. Thus
+        every call to a compiled SDFG will override the value of the last call, in JaCe
+        the memory is allocated on every call. In addition scalars are returned as
+        arrays of length one.
+    """
+
+    csdfg: compiled_sdfg.CompiledSDFG
+    sdfg: dace.SDFG
+    inp_names: tuple[str, ...]
+    out_names: tuple[str, ...]
+
+    def __init__(
+        self,
+        csdfg: compiled_sdfg.CompiledSDFG,
+        inp_names: tuple[str, ...],
+        out_names: tuple[str, ...],
+    ) -> None:
+        self.csdfg = csdfg
+        self.sdfg = self.csdfg.sdfg
+        self.inp_names = inp_names
+        self.out_names = out_names
+
+    def __call__(
+        self,
+        flat_call_args: Sequence[Any],
+    ) -> list[np.ndarray] | None:
+        """
+        Run the compiled SDFG using the flattened input.
+
+        The function will not perform flattening of its input nor unflattening of
+        the output.
+
+        Args:
+            csdfg: The compiled SDFG to call.
+            flat_call_args: Flattened input arguments.
+        """
+        if len(self.inp_names) != len(flat_call_args):
+            # Either error or static arguments are not removed.
+            raise RuntimeError("Wrong number of arguments.")
+
+        sdfg_call_args: dict[str, Any] = {}
+        for in_name, in_val in zip(self.inp_names, flat_call_args):
+            # TODO(phimuell): Implement a stride matching process.
+            if util.is_jax_array(in_val):
+                if not util.is_fully_addressable(in_val):
+                    raise ValueError(f"Passed a not fully addressable Jax array as '{in_name}'")
+                in_val = in_val.__array__()  # noqa: PLW2901  # Jax arrays do not expose the __array_interface__.
+            sdfg_call_args[in_name] = in_val
+
+        arrays = self.sdfg.arrays
+        for out_name, sdfg_array in ((out_name, arrays[out_name]) for out_name in self.out_names):
+            if out_name in sdfg_call_args:
+                if util.is_jax_array(sdfg_call_args[out_name]):
+                    raise ValueError("Passed an immutable Jax array as output.")
+            else:
+                sdfg_call_args[out_name] = dace_data.make_array_from_descriptor(sdfg_array)
+
+        assert len(sdfg_call_args) == len(self.csdfg.argnames), (
+            "Failed to construct the call arguments,"
+            f" expected {len(self.csdfg.argnames)} but got {len(flat_call_args)}."
+            f"\nExpected: {self.csdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
+        )
+
+        # Calling the SDFG
+        with dace.config.temporary_config():
+            dace.Config.set("compiler", "allow_view_arguments", value=True)
+            self.csdfg(**sdfg_call_args)
+
+        if self.out_names:
+            return [sdfg_call_args[out_name] for out_name in self.out_names]
+        return None
+
+
+def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> CompiledJaxprSDFG:
+    """Compile `tsdfg` and return a `CompiledJaxprSDFG` object with the result."""
+    if any(  # We do not support the DaCe return mechanism
+        array_name.startswith("__return")
+        for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # We can not use `in` because we are not interested in `my_mangled_variable__return_zulu`!
+    ):
+        raise ValueError("Only support SDFGs without '__return' members.")
+    if tsdfg.sdfg.free_symbols:  # This is a simplification that makes our life simple.
+        raise NotImplementedError(f"No free symbols allowed, found: {tsdfg.sdfg.free_symbols}")
+    if not (tsdfg.out_names or tsdfg.inp_names):
+        raise ValueError("No input nor output.")
+
+    # To ensure that the SDFG is compiled and to get rid of a warning we must modify
+    #  some settings of the SDFG. But we also have to fake an immutable SDFG
+    sdfg = tsdfg.sdfg
+    org_sdfg_name = sdfg.name
+    org_recompile = sdfg._recompile
+    org_regenerate_code = sdfg._regenerate_code
+
+    try:
+        # We need to give the SDFG another name, this is needed to prevent a DaCe
+        #  error/warning. This happens if we compile the same lowered SDFG multiple
+        #  times with different options.
+        sdfg.name = f"{sdfg.name}__comp_{int(time.time() * 1000)}_{os.getpid()}"
+        assert len(sdfg.name) < 255  # noqa: PLR2004  # Not a magic number.
+
+        with dace.config.temporary_config():
+            dace.Config.set("compiler", "use_cache", value=False)
+            dace.Config.set("cache", value="name")
+            dace.Config.set("default_build_folder", value=pathlib.Path(".jacecache").resolve())
+            sdfg._recompile = True
+            sdfg._regenerate_code = True
+            csdfg: CompiledSDFG = sdfg.compile()
+
+    finally:
+        sdfg.name = org_sdfg_name
+        sdfg._recompile = org_recompile
+        sdfg._regenerate_code = org_regenerate_code
+
+    return CompiledJaxprSDFG(csdfg=csdfg, inp_names=tsdfg.inp_names, out_names=tsdfg.out_names)
diff --git a/src/jace/translator/__init__.py b/src/jace/translator/__init__.py
index 2f184a0..9cd3dfd 100644
--- a/src/jace/translator/__init__.py
+++ b/src/jace/translator/__init__.py
@@ -22,14 +22,12 @@
     make_primitive_translator,
     register_primitive_translator,
 )
-from .translated_jaxpr_sdfg import TranslatedJaxprSDFG
 
 
 __all__ = [
     "JaxprTranslationBuilder",
     "PrimitiveTranslator",
     "PrimitiveTranslatorCallable",
-    "TranslatedJaxprSDFG",
     "TranslationContext",
     "get_registered_primitive_translators",
     "make_primitive_translator",
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index da2e68f..deba4fe 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -33,8 +33,10 @@ class JaxprTranslationBuilder:
     - it has a single source and sink state.
     - all variable names are derived from Jax names,
     - there are only transient variables inside the SDFG,
-    - It lacks the special `__return` variable,
-    - the `arg_names` parameter is not set.
+    - it lacks the special `__return` variable,
+    - the `arg_names` parameter is not set,
+    - for all scalar values a ` Scalar` SDFG variable is used, thus they cannot
+        be used to return anything.
 
     For these reasons the SDFG is not directly usable, and further manipulations
     have to be performed. Especially, DaCe's validation function will fail and
@@ -66,8 +68,7 @@ class JaxprTranslationBuilder:
 
     Notes:
         After a translation has been performed the translator object can be used
-        again. Currently the builder will generate only Array as SDFG variables,
-        however, this is a temporary solution, see `add_array()`.
+        again.
     """
 
     _primitive_translators: Mapping[str, translator.PrimitiveTranslatorCallable]
@@ -119,7 +120,7 @@ def translate_jaxpr(
         #  context. Thus the builder will start to translate a second (nested)
         #  SDFG. Also note that there is no mechanism that forces the integration
         #  of the nested SDFG/Jaxpr, this must be done manually.
-        self._allocate_translation_ctx(name=name)
+        self._allocate_translation_ctx(name=name, jaxpr=jaxpr)
         self._create_constants(jaxpr=jaxpr)
         self._create_initial_input(jaxpr=jaxpr)
 
@@ -274,8 +275,8 @@ def add_jax_name_mapping(
             jax_var: The Jax variable.
             sdfg_name: The name of the corresponding SDFG variable.
         """
-        assert sdfg_name
-
+        if not sdfg_name:
+            raise ValueError("Supplied 'sdfg_name' is empty.")
         if jax_var in self._jax_name_map:
             raise ValueError(
                 f"Cannot change the mapping of '{jax_var}' from"
@@ -312,14 +313,6 @@ def add_array(
             arg: The Jax object for which a SDFG equivalent should be created.
             name_prefix: If given it will be used as prefix for the name.
             update_var_mapping: Update the internal variable mapping.
-
-        Notes:
-            As a temporary fix for handling scalar return values, the function
-            will always generate arrays, even if `arg` is a scalar. According to
-            the DaCe developer, the majority of the backend, i.e. optimization
-            pipeline, should be able to handle it. But there are some special
-            parts that might explicitly want a scalar, it also might block
-            certain compiler optimization.
         """
         if isinstance(arg, jax_core.Literal):
             raise TypeError(f"Can not generate an SDFG variable for literal '{arg}'.")
@@ -331,9 +324,6 @@ def add_array(
         as_transient = True
         strides = None
 
-        # Temporary fix for handling DaCe scalars, see above for more.
-        shape = shape or (1,)
-
         # Propose a name and if needed extend it.
         arg_name = util.propose_jax_name(arg, self._jax_name_map)
         if name_prefix:
@@ -347,15 +337,20 @@ def add_array(
         if arg_name in util.FORBIDDEN_SDFG_VAR_NAMES:
             raise ValueError(f"add_array({arg}): The proposed name '{arg_name}', is forbidden.")
 
-        self._ctx.sdfg.add_array(
-            name=arg_name,
-            shape=shape,
-            strides=strides,
-            offset=offset,
-            storage=storage,
-            dtype=dtype,
-            transient=as_transient,
-        )
+        if shape == ():
+            self._ctx.sdfg.add_scalar(
+                name=arg_name, storage=storage, dtype=dtype, transient=as_transient
+            )
+        else:
+            self._ctx.sdfg.add_array(
+                name=arg_name,
+                shape=shape,
+                strides=strides,
+                offset=offset,
+                storage=storage,
+                dtype=dtype,
+                transient=as_transient,
+            )
 
         if update_var_mapping:
             try:
@@ -451,7 +446,6 @@ def _create_initial_input(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         Notes:
             The function will populate the `inp_names` member of the current context.
         """
-        assert self.is_allocated(), "Builder is not allocated, can not create constants."
         assert self._ctx.inp_names is None
 
         # Handle the initial input arguments
@@ -473,7 +467,6 @@ def _create_constants(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         The function will create an SDFG variable and add them as constant to
         the SDFG. Their value is deepcopied.
         """
-        assert self.is_allocated(), "Builder is not allocated, can not create constants."
         if len(jaxpr.consts) == 0:
             return
 
@@ -489,14 +482,17 @@ def _create_constants(self, jaxpr: jax_core.ClosedJaxpr) -> None:
                 sdfg_name, copy.deepcopy(const_value), self._ctx.sdfg.arrays[sdfg_name]
             )
 
-    def _allocate_translation_ctx(self, name: str | None = None) -> JaxprTranslationBuilder:
+    def _allocate_translation_ctx(
+        self, name: str | None, jaxpr: jax_core.ClosedJaxpr
+    ) -> JaxprTranslationBuilder:
         """
         Allocate a new context and activate it.
 
         Args:
             name: The name of the SDFG.
+            jaxpr: The Jaxpr that should be translated.
         """
-        self._ctx_stack.append(TranslationContext(name=name))
+        self._ctx_stack.append(TranslationContext(name=name, jaxpr=jaxpr))
         return self
 
     @property
@@ -638,7 +634,7 @@ def _handle_null_jaxpr(self, jaxpr: jax_core.ClosedJaxpr) -> list[str]:
             The function will _not_ update the `out_names` field of the current context.
         """
         assert self._ctx.terminal_state is self._ctx.start_state
-        assert self._ctx.inp_names
+        assert isinstance(self._ctx.inp_names, tuple)
         assert self._ctx.out_names is None
 
         # There is not output so we do not have to copy anything around.
@@ -711,6 +707,7 @@ class TranslationContext:
         out_names: A list of the SDFG variables that are used as output.
         start_state: The first state in the SDFG state machine.
         terminal_state: The (currently) last state in the state machine.
+        jaxpr: The Jaxpr that was used to translate.
 
     Args:
         name: The name of the SDFG.
@@ -725,8 +722,9 @@ class TranslationContext:
     out_names: tuple[str, ...] | None
     start_state: dace.SDFGState
     terminal_state: dace.SDFGState
+    jaxpr: jax_core.ClosedJaxpr
 
-    def __init__(self, name: str | None = None) -> None:
+    def __init__(self, name: str | None, jaxpr: jax_core.ClosedJaxpr) -> None:
         if isinstance(name, str) and not util.VALID_SDFG_OBJ_NAME.fullmatch(name):
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
@@ -735,6 +733,7 @@ def __init__(self, name: str | None = None) -> None:
         self.out_names = None
         self.start_state = self.sdfg.add_state(label="initial_state", is_start_block=True)
         self.terminal_state = self.start_state
+        self.jaxpr = jaxpr
 
     def validate(self) -> bool:
         """
@@ -757,4 +756,22 @@ def validate(self) -> bool:
                 self.sdfg,
                 self.sdfg.node_id(self.terminal_state),
             )
+        if not (
+            self.inp_names is None
+            or all(inp_name in self.sdfg.arrays for inp_name in self.inp_names)
+        ):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Missing input arguments: {(inp_name for inp_name in self.inp_names if inp_name not in self.sdfg.arrays)}",
+                self.sdfg,
+                self.sdfg.node_id(self.terminal_state),
+            )
+        if not (
+            self.out_names is None
+            or all(out_name in self.sdfg.arrays for out_name in self.out_names)
+        ):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Missing output arguments: {(out_name for out_name in self.out_names if out_name not in self.sdfg.arrays)}",
+                self.sdfg,
+                self.sdfg.node_id(self.terminal_state),
+            )
         return True
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
deleted file mode 100644
index ec445e9..0000000
--- a/src/jace/translator/post_translation.py
+++ /dev/null
@@ -1,108 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""
-This module contains all functions that are related to post processing the SDFG.
-
-Most of them operate on `TranslatedJaxprSDFG` objects.
-Currently they mostly exist for the sake of existing.
-"""
-
-from __future__ import annotations
-
-import copy
-from typing import TYPE_CHECKING, Any
-
-from jace import translator
-
-
-if TYPE_CHECKING:
-    from collections.abc import Callable, Sequence
-
-
-def postprocess_jaxpr_sdfg(
-    trans_ctx: translator.TranslationContext,
-    fun: Callable,  # noqa: ARG001  # Currently unused
-    call_args: Sequence[Any],  # noqa: ARG001  # Currently unused
-    intree: None,  # noqa: ARG001  # Currently unused
-) -> translator.TranslatedJaxprSDFG:
-    """
-    Perform the final post processing steps on the `TranslationContext` _in place_.
-
-    The function will perform post processing stages on the context in place.
-    However, the function will return a decoupled `TranslatedJaxprSDFG` object.
-
-    Args:
-        trans_ctx: The `TranslationContext` obtained from a `translate_jaxpr()` call.
-        fun: The original function that was translated.
-        call_args: The linearized input arguments.
-        intree: The pytree describing the inputs.
-
-    Todo:
-        - Setting correct input names (layer that does not depend on JAX).
-        - Setting the correct strides & storage properties.
-        - Fixing the scalar input problem on GPU.
-    """
-    # Currently we do nothing except finalizing.
-    trans_ctx.validate()
-
-    #
-    # Assume some post processing here.
-    #
-
-    return finalize_translation_context(trans_ctx, validate=True)
-
-
-def finalize_translation_context(
-    trans_ctx: translator.TranslationContext, validate: bool = True
-) -> translator.TranslatedJaxprSDFG:
-    """
-    Finalizes the supplied translation context `trans_ctx`.
-
-    The function will process the SDFG that is encapsulated inside the context,
-    i.e. a canonical one, into a proper SDFG, as it is described in
-    `TranslatedJaxprSDFG`. It is important to realize that this function does
-    not perform any optimization of the underlying SDFG itself, instead it
-    prepares an SDFG such that it can be passed to the optimization pipeline.
-
-    The function will not mutate the passed translation context and the output
-    is always decoupled from its output.
-
-    Args:
-        trans_ctx: The context that should be finalized.
-        validate: Call the validate function after the finalizing.
-    """
-    trans_ctx.validate()
-    if trans_ctx.inp_names is None:
-        raise ValueError("Input names are not specified.")
-    if trans_ctx.out_names is None:
-        raise ValueError("Output names are not specified.")
-
-    # We guarantee decoupling
-    tsdfg = translator.TranslatedJaxprSDFG(
-        sdfg=copy.deepcopy(trans_ctx.sdfg),
-        inp_names=trans_ctx.inp_names,
-        out_names=trans_ctx.out_names,
-    )
-
-    # Make inputs and outputs to globals.
-    sdfg_arg_names: list[str] = []
-    for glob_name in tsdfg.inp_names + tsdfg.out_names:
-        if glob_name in sdfg_arg_names:
-            continue
-        tsdfg.sdfg.arrays[glob_name].transient = False
-        sdfg_arg_names.append(glob_name)
-
-    # This forces the signature of the SDFG to include all arguments in order they
-    #  appear. If an argument is used as input and output then it is only listed as
-    #  input.
-    tsdfg.sdfg.arg_names = sdfg_arg_names
-
-    if validate:
-        tsdfg.validate()
-
-    return tsdfg
diff --git a/src/jace/translator/pre_post_translation.py b/src/jace/translator/pre_post_translation.py
new file mode 100644
index 0000000..c2a79cb
--- /dev/null
+++ b/src/jace/translator/pre_post_translation.py
@@ -0,0 +1,251 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Functions for the pre and post processing during the translation."""
+
+from __future__ import annotations
+
+import copy
+from typing import TYPE_CHECKING, Any
+
+import dace
+
+import jace
+from jace import util
+
+
+if TYPE_CHECKING:
+    from collections.abc import Callable, Sequence
+
+    from jace import translator
+
+
+def postprocess_jaxpr_sdfg(
+    trans_ctx: translator.TranslationContext,
+    fun: Callable,  # noqa: ARG001  # Currently unused
+    flat_call_args: Sequence[Any],
+    validate: bool = True,
+) -> jace.TranslatedJaxprSDFG:
+    """
+    Final post processing steps on the `TranslationContext`.
+
+    While the function performs the post processing on the context in place, the
+    returned `TranslatedJaxprSDFG` will be decoupled from the input.
+
+    Args:
+        trans_ctx: The `TranslationContext` obtained from a `translate_jaxpr()` call.
+        fun: The original function that was translated.
+        flat_call_args: The flattened input arguments.
+        validate: Perform validation.
+
+    Todo:
+        - Fixing the scalar input problem on GPU.
+        - Fixing stride problem of the input.
+    """
+    trans_ctx.validate()  # Always validate, it is cheap.
+    create_input_output_stages(trans_ctx=trans_ctx, flat_call_args=flat_call_args)
+    return finalize_translation_context(trans_ctx, validate=validate)
+
+
+def create_input_output_stages(
+    trans_ctx: translator.TranslationContext, flat_call_args: Sequence[Any]
+) -> None:
+    """
+    Creates an input and output state inside the SDFG in place.
+
+    See `_create_input_state()` and `_create_output_state()` for more information.
+
+    Args:
+        trans_ctx: The translation context that should be modified.
+        flat_call_args: The flattened call arguments that should be used.
+
+    Note:
+        The processed SDFG will remain canonical.
+    """
+    _create_input_state(trans_ctx, flat_call_args)
+    _create_output_state(trans_ctx)
+
+
+def _create_output_state(trans_ctx: translator.TranslationContext) -> None:
+    """
+    Creates the output processing stage for the SDFG in place.
+
+    The function will create a new terminal state, in which all outputs, denoted
+    in `trans_ctx.out_names`, will be written into new SDFG variables. In case the
+    output variable is a scalar, the output will be replaced by an array of length one.
+    This behaviour is consistent with Jax.
+
+    Args:
+        trans_ctx: The translation context to process.
+    """
+    assert trans_ctx.inp_names is not None and trans_ctx.out_names is not None
+
+    # NOTE: Currently we do not support to write back into an input argument, as Jax.
+    #  However, this is a requirement for handling ICON stencils, that we will support
+    #  eventually. If we get a translation context that lists a variable name in the
+    #  inputs and outputs, this means that it was returned unmodified. In Jax this
+    #  will lead to a copy and we also do it. This is implemented by just naïvely
+    #  creating a separate output variable for every output we have, irrespectively
+    #  of its name inside the Jaxpr.
+
+    output_pattern = "__jace_output_{}"
+    sdfg = trans_ctx.sdfg
+    new_output_state: dace.SDFGState = sdfg.add_state("output_processing_stage")
+    new_output_names: list[str] = []
+
+    for i, org_output_name in enumerate(trans_ctx.out_names):
+        new_output_name = output_pattern.format(i)
+        org_output_desc: dace.data.Data = sdfg.arrays[org_output_name]
+        assert org_output_desc.transient
+        assert (
+            new_output_name not in sdfg.arrays
+        ), f"Final output variable '{new_output_name}' is already present."
+
+        if isinstance(org_output_desc, dace.data.Scalar):
+            _, new_output_desc = sdfg.add_array(
+                new_output_name,
+                dtype=org_output_desc.dtype,
+                shape=(1,),
+                transient=True,  # Needed for an canonical SDFG
+            )
+            memlet = dace.Memlet.simple(new_output_name, subset_str="0", other_subset_str="0")
+
+        else:
+            new_output_desc = org_output_desc.clone()
+            sdfg.add_datadesc(new_output_name, new_output_desc)
+            memlet = dace.Memlet.from_array(org_output_name, org_output_desc)
+
+        new_output_state.add_nedge(
+            new_output_state.add_read(org_output_name),
+            new_output_state.add_write(new_output_name),
+            memlet,
+        )
+        new_output_names.append(new_output_name)
+
+    sdfg.add_edge(trans_ctx.terminal_state, new_output_state, dace.InterstateEdge())
+    trans_ctx.terminal_state = new_output_state
+    trans_ctx.out_names = tuple(new_output_names)
+
+
+def _create_input_state(
+    trans_ctx: translator.TranslationContext, flat_call_args: Sequence[Any]
+) -> None:
+    """
+    Creates the input processing state for the SDFG in place.
+
+    The function will create a new set of variables that are exposed as inputs. This
+    variables are based on the example input arguments passed through `flat_call_args`.
+    This process will hard code the memory location and strides into the SDFG.
+    The assignment is performed inside a new state, which is put at the beginning.
+
+    Args:
+        trans_ctx: The translation context that should be modified.
+        flat_call_args: The flattened call arguments for which the input
+            state should be specialized.
+
+    Todo:
+        Handle transfer of scalar input in GPU mode.
+    """
+    assert trans_ctx.inp_names is not None and trans_ctx.out_names is not None
+
+    # NOTE: This function will create a distinct variable for every input. Once we
+    #  allow write back arguments they will be handled in the `_create_output_state()`
+    #  function anyway, also see the comment in that function.
+
+    if len(flat_call_args) != len(trans_ctx.inp_names):
+        raise ValueError(f"Expected {len(trans_ctx.inp_names)}, but got {len(flat_call_args)}.")
+
+    sdfg = trans_ctx.sdfg
+    new_input_state: dace.SDFGState = sdfg.add_state(f"{sdfg.name}__start_state")
+    new_input_names: list[str] = []
+    input_pattern = "__jace_input_{}"
+
+    for i, (org_input_name, call_arg) in enumerate(zip(trans_ctx.inp_names, flat_call_args)):
+        org_input_desc: dace.data.Data = sdfg.arrays[org_input_name]
+        new_input_name = input_pattern.format(i)
+
+        if isinstance(org_input_desc, dace.data.Scalar):
+            # TODO(phimuell): In GPU mode: scalar -> GPU_ARRAY -> Old input name
+            new_input_desc: dace.data.Scalar = org_input_desc.clone()
+            sdfg.add_datadesc(new_input_name, new_input_desc)
+            memlet = dace.Memlet.simple(new_input_name, subset_str="0", other_subset_str="0")
+
+        else:
+            _, new_input_desc = sdfg.add_array(
+                name=new_input_name,
+                shape=org_input_desc.shape,
+                dtype=org_input_desc.dtype,
+                strides=util.get_strides_for_dace(call_arg),
+                transient=True,  # For canonical SDFG.
+                storage=(
+                    dace.StorageType.GPU_Global
+                    if util.is_on_device(call_arg)
+                    else dace.StorageType.CPU_Heap
+                ),
+            )
+            memlet = dace.Memlet.from_array(new_input_name, new_input_desc)
+
+        new_input_state.add_nedge(
+            new_input_state.add_read(new_input_name),
+            new_input_state.add_write(org_input_name),
+            memlet,
+        )
+        new_input_names.append(new_input_name)
+
+    sdfg.add_edge(new_input_state, trans_ctx.start_state, dace.InterstateEdge())
+    sdfg.start_block = sdfg.node_id(new_input_state)
+    trans_ctx.start_state = new_input_state
+    trans_ctx.inp_names = tuple(new_input_names)
+
+
+def finalize_translation_context(
+    trans_ctx: translator.TranslationContext,
+    validate: bool = True,
+) -> jace.TranslatedJaxprSDFG:
+    """
+    Finalizes the supplied translation context `trans_ctx`.
+
+    The function will process the SDFG that is encapsulated inside the context, i.e. a
+    canonical one, into a proper SDFG, as it is described in `TranslatedJaxprSDFG`. It
+    is important to realize that this function does not perform any optimization of the
+    underlying SDFG itself, instead it prepares an SDFG such that it can be passed to
+    the optimization pipeline.
+
+    The returned object is fully decoupled from its input and `trans_ctx` is not
+    modified.
+
+    Args:
+        trans_ctx: The context that should be finalized.
+        validate: Call the validate function after the finalizing.
+    """
+    trans_ctx.validate()
+    if trans_ctx.inp_names is None:
+        raise ValueError("Input names are not specified.")
+    if trans_ctx.out_names is None:
+        raise ValueError("Output names are not specified.")
+    if not (trans_ctx.out_names or trans_ctx.inp_names):
+        raise ValueError("No input nor output.")
+
+    # We guarantee decoupling
+    tsdfg = jace.TranslatedJaxprSDFG(
+        sdfg=copy.deepcopy(trans_ctx.sdfg),
+        inp_names=trans_ctx.inp_names,
+        out_names=trans_ctx.out_names,
+    )
+
+    # Make inputs and outputs to globals.
+    sdfg_arg_names: list[str] = []
+    for arg_name in tsdfg.inp_names + tsdfg.out_names:
+        if arg_name in sdfg_arg_names:
+            continue
+        tsdfg.sdfg.arrays[arg_name].transient = False
+        sdfg_arg_names.append(arg_name)
+    tsdfg.sdfg.arg_names = sdfg_arg_names
+
+    if validate:
+        tsdfg.validate()
+    return tsdfg
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index dc3bd74..dffe2f6 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -192,9 +192,9 @@ def register_primitive_translator(
         overwrite: Replace the current primitive translator with `primitive_translator`.
 
     Note:
-        To add a `primitive` property use the `@make_primitive_translator` decorator.
-        This function returns `primitive_translator` unmodified, which allows it to be
-        used as decorator.
+        To add a `primitive` property use the `@make_primitive_translator`
+        decorator. This function returns `primitive_translator` unmodified,
+        which allows it to be used as decorator.
     """
 
     def wrapper(
diff --git a/src/jace/translator/translated_jaxpr_sdfg.py b/src/jace/translator/translated_jaxpr_sdfg.py
deleted file mode 100644
index afa91ff..0000000
--- a/src/jace/translator/translated_jaxpr_sdfg.py
+++ /dev/null
@@ -1,71 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Container for storing a translated SDFG."""
-
-from __future__ import annotations
-
-import dataclasses
-
-import dace
-
-
-@dataclasses.dataclass(kw_only=True, frozen=True)
-class TranslatedJaxprSDFG:
-    """
-    Encapsulates a translated SDFG with additional the metadata.
-
-    Contrary to the SDFG that is encapsulated inside the `TranslationContext`
-    object, `self` carries a proper SDFG, however:
-    - It does not have `__return*` variables, instead all return arguments are
-        passed by arguments.
-    - All input arguments are passed through arguments mentioned in `inp_names`,
-        while the outputs are passed through `out_names`.
-    - Only variables listed as in/outputs are non transient.
-    - The order inside `inp_names` and `out_names` is the same as in the original Jaxpr.
-    - If an input is used as outputs it appears in both `inp_names` and `out_names`.
-    - Its `arg_names` is set to  `inp_names + out_names`, but arguments that are
-        input and outputs are only listed as inputs.
-
-    The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a
-    `TranslationContext`, that was in turn constructed by
-    `JaxprTranslationBuilder.translate_jaxpr()`, to the
-    `finalize_translation_context()` or preferably to the `postprocess_jaxpr_sdfg()`
-    function.
-
-    Attributes:
-        sdfg: The encapsulated SDFG object.
-        inp_names: A list of the SDFG variables that are used as input
-        out_names: A list of the SDFG variables that are used as output.
-    """
-
-    sdfg: dace.SDFG
-    inp_names: tuple[str, ...]
-    out_names: tuple[str, ...]
-
-    def validate(self) -> bool:
-        """Validate the underlying SDFG."""
-        if any(self.sdfg.arrays[inp].transient for inp in self.inp_names):
-            raise dace.sdfg.InvalidSDFGError(
-                f"Found transient inputs: {(inp for inp in self.inp_names if self.sdfg.arrays[inp].transient)}",
-                self.sdfg,
-                self.sdfg.node_id(self.sdfg.start_state),
-            )
-        if any(self.sdfg.arrays[out].transient for out in self.out_names):
-            raise dace.sdfg.InvalidSDFGError(
-                f"Found transient outputs: {(out for out in self.out_names if self.sdfg.arrays[out].transient)}",
-                self.sdfg,
-                self.sdfg.node_id(self.sdfg.start_state),
-            )
-        if self.sdfg.free_symbols:  # This is a simplification that makes our life simple.
-            raise dace.sdfg.InvalidSDFGError(
-                f"Found free symbols: {self.sdfg.free_symbols}",
-                self.sdfg,
-                self.sdfg.node_id(self.sdfg.start_state),
-            )
-        self.sdfg.validate()
-        return True
diff --git a/src/jace/util/__init__.py b/src/jace/util/__init__.py
index ab73e4e..9532454 100644
--- a/src/jace/util/__init__.py
+++ b/src/jace/util/__init__.py
@@ -12,6 +12,7 @@
 from .definitions import FORBIDDEN_SDFG_VAR_NAMES, VALID_SDFG_OBJ_NAME, VALID_SDFG_VAR_NAME
 from .jax_helper import (
     JaCeVar,
+    get_jax_literal_value,
     get_jax_var_dtype,
     get_jax_var_name,
     get_jax_var_shape,
@@ -20,7 +21,9 @@
     translate_dtype,
 )
 from .traits import (
+    get_strides_for_dace,
     is_array,
+    is_c_contiguous,
     is_drop_var,
     is_fully_addressable,
     is_jax_array,
@@ -34,10 +37,13 @@
     "VALID_SDFG_OBJ_NAME",
     "VALID_SDFG_VAR_NAME",
     "JaCeVar",
+    "get_jax_literal_value",
     "get_jax_var_dtype",
     "get_jax_var_name",
     "get_jax_var_shape",
+    "get_strides_for_dace",
     "is_array",
+    "is_c_contiguous",
     "is_drop_var",
     "is_fully_addressable",
     "is_jax_array",
diff --git a/src/jace/util/dace_helper.py b/src/jace/util/dace_helper.py
deleted file mode 100644
index 1828fac..0000000
--- a/src/jace/util/dace_helper.py
+++ /dev/null
@@ -1,144 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Implements all utility functions that are related to DaCe."""
-
-from __future__ import annotations
-
-import time
-from typing import TYPE_CHECKING, Any
-
-import dace
-import numpy as np
-from dace import data as dace_data
-
-# The compiled SDFG is not available in the dace namespace or anywhere else
-#  Thus we import it here directly
-from dace.codegen.compiled_sdfg import CompiledSDFG
-
-from jace import util
-
-
-if TYPE_CHECKING:
-    from collections.abc import Mapping, Sequence
-
-    from jace import translator
-
-__all__ = ["CompiledSDFG", "compile_jax_sdfg", "run_jax_sdfg"]
-
-
-def compile_jax_sdfg(tsdfg: translator.TranslatedJaxprSDFG) -> CompiledSDFG:
-    """Compiles the embedded SDFG and return the resulting `CompiledSDFG` object."""
-    if any(  # We do not support the DaCe return mechanism
-        array_name.startswith("__return")
-        for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # we can not use `in` because we are also interested in `__return_`!
-    ):
-        raise ValueError("Only support SDFGs without '__return' members.")
-
-    # To ensure that the SDFG is compiled and to get rid of a warning we must modify
-    #  some settings of the SDFG. To fake an immutable SDFG, we will restore them later.
-    sdfg = tsdfg.sdfg
-    org_sdfg_name = sdfg.name
-    org_recompile = sdfg._recompile
-    org_regenerate_code = sdfg._regenerate_code
-
-    try:
-        # We need to give the SDFG another name, this is needed to prevent a DaCe
-        #  error/warning. This happens if we compile the same lowered SDFG multiple
-        #  times with different options.
-        sdfg.name = f"{sdfg.name}__comp_{int(time.time() * 1000)}"
-
-        with dace.config.temporary_config():
-            sdfg._recompile = True
-            sdfg._regenerate_code = True
-            dace.Config.set("compiler", "use_cache", value=False)
-            csdfg: CompiledSDFG = sdfg.compile()
-
-    finally:
-        sdfg.name = org_sdfg_name
-        sdfg._recompile = org_recompile
-        sdfg._regenerate_code = org_regenerate_code
-
-    return csdfg
-
-
-def run_jax_sdfg(
-    csdfg: CompiledSDFG,
-    inp_names: Sequence[str],
-    out_names: Sequence[str],
-    call_args: Sequence[Any],
-    call_kwargs: Mapping[str, Any],
-) -> tuple[Any, ...] | Any:
-    """
-    Run the compiled SDFG.
-
-    The function assumes that the SDFG was finalized and then compiled by
-    `compile_jax_sdfg()`. For running the SDFG you also have to pass the input
-    names (`inp_names`) and output names (`out_names`) that were inside the
-    `TranslatedJaxprSDFG` from which `csdfg` was compiled from.
-
-    Args:
-        csdfg: The `CompiledSDFG` object.
-        inp_names: List of names of the input arguments.
-        out_names: List of names of the output arguments.
-        call_args: All positional arguments of the call.
-        call_kwargs: All keyword arguments of the call.
-
-    Note:
-        There is no pytree mechanism jet, thus the return values are returned
-        inside a `tuple` or in case of one value, directly, in the order
-        determined by Jax. Furthermore, DaCe does not support scalar return
-        values, thus they are silently converted into arrays of length 1, the
-        same holds for inputs.
-
-    Todo:
-        - Implement non C strides.
-    """
-    sdfg: dace.SDFG = csdfg.sdfg
-
-    if len(call_kwargs) != 0:
-        raise NotImplementedError("No kwargs are supported yet.")
-    if len(inp_names) != len(call_args):
-        raise RuntimeError("Wrong number of arguments.")
-    if sdfg.free_symbols:  # This is a simplification that makes our life simple.
-        raise NotImplementedError(
-            f"No externally defined symbols are allowed, found: {sdfg.free_symbols}"
-        )
-
-    # Build the argument list that we will pass to the compiled object.
-    sdfg_call_args: dict[str, Any] = {}
-    for in_name, in_val in zip(inp_names, call_args, strict=True):
-        if util.is_scalar(in_val):
-            # Currently the translator makes scalar into arrays, this has to be
-            #  reflected here
-            in_val = np.array([in_val])  # noqa: PLW2901  # Loop variable is intentionally modified.
-        sdfg_call_args[in_name] = in_val
-
-    for out_name, sdfg_array in ((out_name, sdfg.arrays[out_name]) for out_name in out_names):
-        if out_name in sdfg_call_args:
-            if util.is_jax_array(sdfg_call_args[out_name]):
-                # Jax arrays are immutable, so they can not be return values too.
-                raise ValueError("Passed a Jax array as output.")
-        else:
-            sdfg_call_args[out_name] = dace_data.make_array_from_descriptor(sdfg_array)
-
-    assert len(sdfg_call_args) == len(csdfg.argnames), (
-        "Failed to construct the call arguments,"
-        f" expected {len(csdfg.argnames)} but got {len(call_args)}."
-        f"\nExpected: {csdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
-    )
-
-    # Calling the SDFG
-    with dace.config.temporary_config():
-        dace.Config.set("compiler", "allow_view_arguments", value=True)
-        csdfg(**sdfg_call_args)
-
-    # Handling the output (pytrees are missing)
-    if not out_names:
-        return None
-    ret_val: tuple[Any] = tuple(sdfg_call_args[out_name] for out_name in out_names)
-    return ret_val[0] if len(out_names) == 1 else ret_val
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 175671f..c0997ba 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -19,6 +19,7 @@
 from typing import TYPE_CHECKING, Any
 
 import dace
+import jax
 import jax.core as jax_core
 import numpy as np
 
@@ -132,10 +133,19 @@ def is_tracing_ongoing(*args: Any, **kwargs: Any) -> bool:
     While a return value `True` guarantees that a translation is ongoing, a
     value of `False` does not guarantees that no tracing is ongoing.
     """
-    # The current implementation only checks the arguments if it contains tracers.
-    if (len(args) == 0) and (len(kwargs) == 0):
-        raise RuntimeError("Failed to determine if tracing is ongoing.")
-    return any(isinstance(x, jax_core.Tracer) for x in itertools.chain(args, kwargs.values()))
+    # To detect if there is tracing ongoing, we check the internal tracing stack of Jax.
+    #  Note that this is highly internal and depends on the precise implementation of
+    #  Jax. For that reason we first look at all arguments and check if they are
+    #  tracers. Furthermore, it seems that Jax always have a bottom interpreter on the
+    #  stack, thus it is empty if `len(...) == 1`!
+    #  See also: https://github.com/google/jax/pull/3370
+    if any(isinstance(x, jax_core.Tracer) for x in itertools.chain(args, kwargs.values())):
+        return True
+    if len(jax._src.core.thread_local_state.trace_state.trace_stack.stack) == 1:
+        return False
+    if len(jax._src.core.thread_local_state.trace_state.trace_stack.stack) > 1:
+        return True
+    raise RuntimeError("Failed to determine if tracing is ongoing.")
 
 
 def translate_dtype(dtype: Any) -> dace.typeclass:
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index a8e6bc8..f99d013 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -39,7 +39,7 @@ def is_jax_array(obj: Any) -> TypeGuard[jax.Array]:
     return isinstance(obj, jax.Array)
 
 
-def is_array(obj: Any) -> bool:
+def is_array(obj: Any) -> TypeGuard[jax.typing.ArrayLike]:
     """Identifies arrays, this also includes Jax arrays."""
     return dace.is_array(obj) or is_jax_array(obj)
 
@@ -74,6 +74,35 @@ def is_scalar(obj: Any) -> bool:
     return type(obj) in known_types
 
 
+def get_strides_for_dace(obj: Any) -> tuple[int, ...] | None:
+    """
+    Get the strides of `obj` in a DaCe compatible format.
+
+    The function returns the strides in number of elements, as it is used inside
+    DaCe and not in bytes as it is inside NumPy. As in NumPy and DaCe the function
+    returns `None` to indicate standard C order.
+
+    Notes:
+        If `obj` is not array like an error is generated.
+    """
+    if not is_array(obj):
+        raise TypeError(f"Passed '{obj}' ({type(obj).__name__}) is not array like.")
+
+    if is_jax_array(obj):
+        if not is_fully_addressable(obj):
+            raise NotImplementedError("Sharded jax arrays are not supported.")
+        obj = obj.__array__()
+    assert hasattr(obj, "strides")
+
+    if obj.strides is None:
+        return None
+    if not hasattr(obj, "itemsize"):
+        # No `itemsize` member so we assume that it is already in elements.
+        return obj.strides
+
+    return tuple(stride // obj.itemsize for stride in obj.strides)
+
+
 def is_on_device(obj: Any) -> bool:
     """
     Tests if `obj` is on a device.
@@ -91,3 +120,12 @@ def is_fully_addressable(obj: Any) -> bool:
     if is_jax_array(obj):
         return obj.is_fully_addressable
     return True
+
+
+def is_c_contiguous(obj: Any) -> bool:
+    """Tests if `obj` is in C order."""
+    if not is_array(obj):
+        return False
+    if is_jax_array(obj):
+        obj = obj.__array__()
+    return obj.flags["C_CONTIGUOUS"]
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index f6366bd..9361733 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -21,11 +21,11 @@
 import collections
 import dataclasses
 import functools
-from collections.abc import Callable, Hashable
+from collections.abc import Callable, Hashable, Sequence
 from typing import TYPE_CHECKING, Any, Concatenate, Generic, ParamSpec, TypeAlias, TypeVar, cast
 
 import dace
-from jax import core as jax_core
+from jax import core as jax_core, tree_util as jax_tree
 
 from jace import util
 
@@ -39,7 +39,7 @@
 
 
 # Denotes the stage that follows the current one.
-#  Used by the `NextStage` Mixin.
+#  Used by the `CachingStage` mixin.
 NextStage = TypeVar("NextStage", bound="stages.Stage")
 
 
@@ -47,17 +47,12 @@ class CachingStage(Generic[NextStage]):
     """
     Annotates a stage whose transition to the next stage is cacheable.
 
-    To make the transition of a stage cacheable, the stage must be derived from
-    this class, and its initialization must call `CachingStage.__init__()`.
-    Furthermore, its transition function must be annotated by the
-    `@cached_transition` decorator.
-
-    A class must implement the `_make_call_description()` to compute an abstract
-    description of the call. This is needed to operate the cache to store the
-    stage transitions.
-
-    Notes:
-        The `__init__()` function must explicitly be called to fully setup `self`.
+    To make a transition cacheable, a stage must:
+    - be derived from this class.
+    - its `__init__()` function must explicitly call `CachingStage.__init__()`.
+    - the transition function must be annotated by `@cached_transition`.
+    - it must implement the `_make_call_description()` to create the key.
+    - the stage object must be immutable.
 
     Todo:
         - Handle eviction from the cache due to collecting of unused predecessor stages.
@@ -70,9 +65,21 @@ def __init__(self) -> None:
 
     @abc.abstractmethod
     def _make_call_description(
-        self: CachingStage, *args: Any, **kwargs: Any
+        self: CachingStage, intree: jax_tree.PyTreeDef, flat_call_args: Sequence[Any]
     ) -> StageTransformationSpec:
-        """Generates the key that is used to store/locate the call in the cache."""
+        """
+        Computes the key used to represent the call.
+
+        This function is used by the `@cached_transition` decorator to perform
+        the lookup inside the cache. It should return a description of the call
+        that is encapsulated inside a `StageTransformationSpec` object, see
+        there for more information.
+
+        Args:
+            intree: Pytree object describing how the input arguments were flattened.
+            flat_call_args: The flattened arguments that were passed to the
+                annotated function.
+        """
         ...
 
 
@@ -88,9 +95,11 @@ def cached_transition(
     """
     Decorator for making the transition function of the stage cacheable.
 
-    In order to work, the stage must be derived from `CachingStage`. For computing
-    the key of a call the function will use the `_make_call_description()`
-    function of the cache.
+    See the description of `CachingStage` for the requirements.
+    The function will use `_make_call_description()` to decide if the call is
+    already known and if so it will return the cached object. If the call is
+    not known it will call the wrapped transition function and record its
+    return value inside the cache, before returning it.
 
     Todo:
         - Implement a way to temporary disable the cache.
@@ -98,12 +107,11 @@ def cached_transition(
 
     @functools.wraps(transition)
     def transition_wrapper(self: CachingStageType, *args: P.args, **kwargs: P.kwargs) -> NextStage:
-        key: StageTransformationSpec = self._make_call_description(*args, **kwargs)
-        if key in self._cache:
-            return self._cache[key]
-        next_stage = transition(self, *args, **kwargs)
-        self._cache[key] = next_stage
-        return next_stage
+        flat_call_args, intree = jax_tree.tree_flatten((args, kwargs))
+        key = self._make_call_description(flat_call_args=flat_call_args, intree=intree)
+        if key not in self._cache:
+            self._cache[key] = transition(self, *args, **kwargs)
+        return self._cache[key]
 
     return cast(TransitionFunction, transition_wrapper)
 
@@ -132,14 +140,15 @@ class _AbstractCallArgument:
     which is similar to tracers in Jax. This class represents the second way.
     To create an instance you should use `_AbstractCallArgument.from_value()`.
 
-    Its description is limited to scalars and arrays. To describe more complex
-    types, they should be processed by pytrees first.
-
     Attributes:
         shape: In case of an array its shape, in case of a scalar the empty tuple.
         dtype: The DaCe type of the argument.
         strides: The strides of the argument, or `None` if they are unknown or a scalar.
         storage: The storage type where the argument is stored.
+
+    Note:
+        This class is only able to describe scalars and arrays, thus it should
+        only be used after the arguments were flattened.
     """
 
     shape: tuple[int, ...]
@@ -160,8 +169,8 @@ def from_value(cls, value: Any) -> _AbstractCallArgument:
                 value = value.__array__()  # Passing `copy=False` leads to error in NumPy.
             shape = value.shape
             dtype = util.translate_dtype(value.dtype)
-            strides = getattr(value, "strides", None)
-            # Is `CPU_Heap` always okay? There would also be `CPU_Pinned`.
+            strides = util.get_strides_for_dace(value)
+            # TODO(phimuell): `CPU_Heap` vs. `CPU_Pinned`.
             storage = (
                 dace.StorageType.GPU_Global
                 if util.is_on_device(value)
@@ -182,11 +191,8 @@ def from_value(cls, value: Any) -> _AbstractCallArgument:
         raise TypeError(f"Can not make 'an abstract description from '{type(value).__name__}'.")
 
 
-#: This type is the abstract description of a function call.
-#:  It is part of the key used in the cache.
-CallArgsSpec: TypeAlias = tuple[
-    _AbstractCallArgument | Hashable | tuple[str, _AbstractCallArgument | Hashable], ...
-]
+#: Type to describe a single argument either in an abstract or concrete way.
+CallArgsSpec: TypeAlias = tuple[_AbstractCallArgument | Hashable]
 
 
 @dataclasses.dataclass(frozen=True)
@@ -195,27 +201,31 @@ class StageTransformationSpec:
     Represents the entire call to a state transformation function of a stage.
 
     State transition functions are annotated with `@cached_transition` and their
-    result may be cached. They key to locate them inside the cache is represented
+    result is cached. They key to locate them inside the cache is represented
     by this class and computed by the `CachingStage._make_call_description()`
-    function. The actual key is consists of two parts, `stage_id` and `call_args`.
+    function. The actual key is consists of three parts, `stage_id`, `call_args`
+    and `intree`, see below for more.
 
     Args:
         stage_id: Origin of the call, for which the id of the stage object should
             be used.
-        call_args: Description of the arguments of the call. There are two ways
-            to describe the arguments:
+        flat_call_args: Flat representation of the arguments of the call. Each element
+            describes a single argument. To describe an argument there are two ways:
             - Abstract description: In this way, the actual value of the argument
-                is irrelevant, only the structure of them are important, similar
-                to the tracers used in Jax.
-            - Concrete description: Here one caches on the actual value of the
-                argument. The only requirement is that they can be hashed.
+                is irrelevant, its structure is important, similar to the tracers
+                used in Jax. To represent it, use `_AbstractCallArgument`.
+            - Concrete description: Here the actual value of the argument is
+                considered, this is similar to how static arguments in Jax works.
+                The only requirement is that they can be hashed.
+        intree: A pytree structure that describes how the input was flatten.
     """
 
     stage_id: int
-    call_args: CallArgsSpec
+    flat_call_args: CallArgsSpec
+    intree: jax_tree.PyTreeDef
 
 
-# Denotes the stage that is stored inside the cache.
+#: Denotes the stage that is stored inside the cache.
 StageType = TypeVar("StageType", bound="stages.Stage")
 
 
@@ -224,16 +234,16 @@ class StageCache(Generic[StageType]):
     Simple LRU cache to cache the results of the stage transition function.
 
     Args:
-        size: The size of the cache, defaults to 256.
+        capacity: The size of the cache, defaults to 256.
     """
 
     # The most recently used entry is at the end of the `OrderedDict`.
     _memory: collections.OrderedDict[StageTransformationSpec, StageType]
-    _size: int
+    _capacity: int
 
-    def __init__(self, size: int = 256) -> None:
+    def __init__(self, capachity: int = 256) -> None:
         self._memory = collections.OrderedDict()
-        self._size = size
+        self._capacity = capachity
 
     def __contains__(self, key: StageTransformationSpec) -> bool:
         return key in self._memory
@@ -249,7 +259,7 @@ def __setitem__(self, key: StageTransformationSpec, res: StageType) -> None:
             self._memory.move_to_end(key, last=True)
             self._memory[key] = res
         else:
-            if len(self._memory) == self._size:
+            if len(self._memory) == self._capacity:
                 self.popitem(None)
             self._memory[key] = res
 
@@ -270,5 +280,16 @@ def popitem(self, key: StageTransformationSpec | None) -> None:
     def clear(self) -> None:  # noqa: D102  # Missing description.
         self._memory.clear()
 
+    def __len__(self) -> int:
+        return len(self._memory)
+
+    @property
+    def capacity(self) -> int:  # noqa: D102  # No docstring needed.
+        return self._capacity
+
+    def front(self) -> tuple[StageTransformationSpec, StageType]:
+        """Returns the front of the cache, i.e. its newest entry."""
+        return next(reversed(self._memory.items()))
+
     def __repr__(self) -> str:
-        return f"StageCache({len(self._memory)} / {self._size} || {', '.join('[' + repr(k) + ']' for k in self._memory)})"
+        return f"StageCache({len(self._memory)} / {self._capacity} || {', '.join('[' + repr(k) + ']' for k in self._memory)})"
diff --git a/tests/test_caching.py b/tests/test_caching.py
index bc0e44c..0cf1526 100644
--- a/tests/test_caching.py
+++ b/tests/test_caching.py
@@ -11,7 +11,6 @@
 from __future__ import annotations
 
 import itertools as it
-import re
 
 import numpy as np
 import pytest
@@ -244,13 +243,9 @@ def wrapped(A: np.ndarray) -> np.ndarray:
     #  But the cache is aware of this, which helps catch some nasty bugs.
     F_lower = None  # Remove later
     F_res = C_res.copy()  # Remove later
-    with pytest.raises(  # noqa: PT012 # Multiple calls
-        expected_exception=NotImplementedError,
-        match=re.escape("Currently can not yet handle strides beside 'C_CONTIGUOUS'."),
-    ):
-        F_lower = wrapped.lower(F)
-        F_res = wrapped(F)
-    assert F_lower is None  # Remove later.
+    F_lower = wrapped.lower(F)
+    F_res = wrapped(F)
+    assert F_lower is not C_lower
     assert C_res is not F_res
     assert np.allclose(F_res, C_res)
     assert F_lower is not C_lower
diff --git a/tests/test_jaxpr_translator_builder.py b/tests/test_jaxpr_translator_builder.py
deleted file mode 100644
index efc6657..0000000
--- a/tests/test_jaxpr_translator_builder.py
+++ /dev/null
@@ -1,539 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""Implements some tests of the subtranslator builder."""
-
-from __future__ import annotations
-
-import re
-
-import dace
-import jax
-import numpy as np
-import pytest
-from dace.data import Array
-from jax import core as jax_core
-
-import jace
-from jace import translator, util
-from jace.util import JaCeVar
-
-
-# These are some JaCe variables that we use inside the tests
-#  Unnamed arrays
-array1 = JaCeVar((10, 12), dace.float64)
-array2 = JaCeVar((10, 13), dace.float32)
-array3 = JaCeVar((11, 16), dace.int64)
-
-#  Unnamed scalars
-scal1 = JaCeVar((), dace.float16)
-scal2 = JaCeVar((), dace.float32)
-scal3 = JaCeVar((), dace.int64)
-
-# Named variables
-narray = JaCeVar((10,), dace.float16, "narr")
-nscal = JaCeVar((), dace.int32, "nscal")
-
-
-@pytest.fixture()
-def translation_builder():
-    """Returns an allocated builder instance."""
-    name = "fixture_builder"
-    builder = translator.JaxprTranslationBuilder(
-        primitive_translators=translator.get_registered_primitive_translators()
-    )
-    builder._allocate_translation_ctx(name=name)
-    return builder
-
-
-def test_builder_alloc() -> None:
-    """Tests the state right after allocation.
-
-    Does not use the fixture because it does it on its own.
-    """
-    builder = translator.JaxprTranslationBuilder(
-        primitive_translators=translator.get_registered_primitive_translators()
-    )
-    assert not builder.is_allocated(), "Builder was created allocated."
-    assert len(builder._ctx_stack) == 0
-
-    # The reserved names will be tested in `test_builder_fork()`.
-    sdfg_name = "qwertzuiopasdfghjkl"
-    builder._allocate_translation_ctx(name=sdfg_name)
-    assert len(builder._ctx_stack) == 1
-    assert builder.is_root_translator()
-
-    sdfg: dace.SDFG = builder.sdfg
-
-    assert builder._ctx.sdfg is sdfg
-    assert builder.sdfg.name == sdfg_name
-    assert sdfg.number_of_nodes() == 1
-    assert sdfg.number_of_edges() == 0
-    assert sdfg.start_block is builder._ctx.start_state
-    assert builder._terminal_sdfg_state is builder._ctx.start_state
-
-
-def test_builder_variable_alloc_auto_naming(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
-    """Tests simple variable allocation."""
-    for i, var in enumerate([array1, array2, scal1, array3, scal2, scal3]):
-        sdfg_name = translation_builder.add_array(var, update_var_mapping=True)
-        sdfg_var = translation_builder.get_array(sdfg_name)
-        assert sdfg_name == chr(97 + i)
-        assert isinstance(sdfg_var, Array)  # Everything is now an array
-        assert sdfg_var.shape == ((1,) if var.shape == () else var.shape)
-        assert sdfg_var.dtype == var.dtype
-
-
-def test_builder_variable_alloc_mixed_naming(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
-    """Tests the naming in a mixed setting.
-
-    If `update_var_mapping=True` is given, then the naming will skip variables,
-    see also `test_builder_variable_alloc_mixed_naming2()`.
-    """
-    #                        *       b       c       d      *      f      g
-    for i, var in enumerate([narray, array1, array2, scal1, nscal, scal2, scal3]):
-        sdfg_name = translation_builder.add_array(var, update_var_mapping=True)
-        sdfg_var = translation_builder.get_array(sdfg_name)
-        if var.name is None:
-            assert sdfg_name == chr(97 + i)
-        else:
-            assert sdfg_name == var.name
-        assert isinstance(sdfg_var, Array)  # Everything is now an array
-        assert sdfg_var.shape == ((1,) if var.shape == () else var.shape)
-        assert sdfg_var.dtype == var.dtype
-
-
-def test_builder_variable_alloc_mixed_naming2(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
-    """Tests the naming in a mixed setting.
-
-    This time we do not use `update_var_mapping=True`, instead it now depends on the
-    name. This means that automatic naming will now again include all, letters, but not
-    in a linear order.
-    """
-    letoff = 0
-    #             *      a        b       c      *      d     e
-    for var in [narray, array1, array2, scal1, nscal, scal2, scal3]:
-        sdfg_name = translation_builder.add_array(var, update_var_mapping=var.name is None)
-        sdfg_var = translation_builder.get_array(sdfg_name)
-        if var.name is None:
-            assert sdfg_name == chr(97 + letoff)
-            letoff += 1
-        else:
-            assert sdfg_name == var.name
-        assert isinstance(sdfg_var, Array)  # Everything is now an array
-        assert sdfg_var.shape == ((1,) if var.shape == () else var.shape)
-        assert sdfg_var.dtype == var.dtype
-
-
-def test_builder_variable_alloc_prefix_naming(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
-    """Using the prefix to name variables."""
-    prefix_1 = "__my_special_prefix"
-    exp_name_1 = prefix_1 + "a"
-    sdfg_name_1 = translation_builder.add_array(
-        array1, name_prefix=prefix_1, update_var_mapping=False
-    )
-    assert exp_name_1 == sdfg_name_1
-
-    # Because `update_var_mapping` is `False` above, 'a' will be reused.
-    prefix_2 = "__my_special_prefix_second_"
-    exp_name_2 = prefix_2 + "a"
-    sdfg_name_2 = translation_builder.add_array(
-        array1, name_prefix=prefix_2, update_var_mapping=False
-    )
-    assert exp_name_2 == sdfg_name_2
-
-    # Now we use a named variables, which are also affected.
-    prefix_3 = "__my_special_prefix_third_named_"
-    exp_name_3 = prefix_3 + nscal.name  # type: ignore[operator]  # `.name` is not `None`.
-    sdfg_name_3 = translation_builder.add_array(
-        nscal, name_prefix=prefix_3, update_var_mapping=False
-    )
-    assert exp_name_3 == sdfg_name_3
-
-
-def test_builder_variable_alloc_auto_naming_wrapped(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
-    """Tests the variable naming if we have more than 26 variables."""
-    single_letters = [chr(x) for x in range(97, 123)]
-    i = 0
-    for let1 in ["", *single_letters[1:]]:  # Note `z` is followed by `ba` and not by `aa`.
-        for let2 in single_letters:
-            i += 1
-            # Create a variable and enter it into the variable naming.
-            var = JaCeVar(shape=(19, 19), dtype=dace.float64)
-            sdfg_name = translation_builder.add_array(arg=var, update_var_mapping=True)
-            mapped_name = translation_builder.map_jax_var_to_sdfg(var)
-            assert (
-                sdfg_name == mapped_name
-            ), f"Mapping for '{var}' failed, expected '{sdfg_name}' got '{mapped_name}'."
-
-            # Get the name that we really expect, we must also handle some situations.
-            exp_name = let1 + let2
-            if exp_name in util.FORBIDDEN_SDFG_VAR_NAMES:
-                exp_name = "__jace_forbidden_" + exp_name
-            assert (
-                exp_name == sdfg_name
-            ), f"Automated naming failed, expected '{exp_name}' but got '{sdfg_name}'."
-
-
-def test_builder_nested(translation_builder: translator.JaxprTranslationBuilder) -> None:
-    """Tests the ability of the nesting of the builder."""
-
-    # Now add a variable to the current subtext.
-    name_1 = translation_builder.add_array(array1, update_var_mapping=True)
-    assert name_1 == "a"
-    assert translation_builder.map_jax_var_to_sdfg(array1) == name_1
-
-    # For the sake of doing it add a new state to the SDFG.
-    translation_builder.append_new_state("sake_state")
-    assert translation_builder.sdfg.number_of_nodes() == 2
-    assert translation_builder.sdfg.number_of_edges() == 1
-
-    # Now we go one subcontext deeper
-    translation_builder._allocate_translation_ctx("builder")
-    assert len(translation_builder._ctx_stack) == 2
-    assert translation_builder.sdfg.name == "builder"
-    assert translation_builder.sdfg.number_of_nodes() == 1
-    assert translation_builder.sdfg.number_of_edges() == 0
-    assert not translation_builder.is_root_translator()
-
-    # Because we have a new SDFG the mapping to previous SDFG does not work,
-    #  regardless the fact that it still exists.
-    with pytest.raises(
-        expected_exception=KeyError,
-        match=re.escape(
-            f"Jax variable '{array1}' was supposed to map to '{name_1}', but no such SDFG variable is known."
-        ),
-    ):
-        _ = translation_builder.map_jax_var_to_sdfg(array1)
-
-    # Because the SDFGs are distinct it is possible to add `array1` to the nested one.
-    #  However, it is not able to update the mapping.
-    with pytest.raises(
-        expected_exception=ValueError,
-        match=re.escape(f"Cannot change the mapping of '{array1}' from '{name_1}' to '{name_1}'."),
-    ):
-        _ = translation_builder.add_array(array1, update_var_mapping=True)
-    assert name_1 not in translation_builder.sdfg.arrays
-
-    # Without updating the mapping it is possible create the variable.
-    assert name_1 == translation_builder.add_array(array1, update_var_mapping=False)
-
-    # Now add a new variable, the map is shared, so a new name will be generated.
-    name_2 = translation_builder.add_array(array2, update_var_mapping=True)
-    assert name_2 == "b"
-    assert name_2 == translation_builder.map_jax_var_to_sdfg(array2)
-
-    # Now we go one stack level back.
-    translation_builder._clear_translation_ctx()
-    assert len(translation_builder._ctx_stack) == 1
-    assert translation_builder.sdfg.number_of_nodes() == 2
-    assert translation_builder.sdfg.number_of_edges() == 1
-
-    # Again the variable that was declared in the last stack is now no longer present.
-    #  Note if the nested SDFG was integrated into the parent SDFG it would be
-    #  accessible
-    with pytest.raises(
-        expected_exception=KeyError,
-        match=re.escape(
-            f"Jax variable '{array2}' was supposed to map to '{name_2}', but no such SDFG variable is known."
-        ),
-    ):
-        _ = translation_builder.map_jax_var_to_sdfg(array2)
-    assert name_2 == translation_builder._jax_name_map[array2]
-
-    # Now add a new variable, since the map is shared, we will now get the next name.
-    name_3 = translation_builder.add_array(array3, update_var_mapping=True)
-    assert name_3 == "c"
-    assert name_3 == translation_builder.map_jax_var_to_sdfg(array3)
-
-
-def test_builder_append_state(translation_builder: translator.JaxprTranslationBuilder) -> None:
-    """Tests the functionality of appending states."""
-    sdfg: dace.SDFG = translation_builder.sdfg
-
-    terminal_state_1: dace.SDFGState = translation_builder.append_new_state("terminal_state_1")
-    assert sdfg.number_of_nodes() == 2
-    assert sdfg.number_of_edges() == 1
-    assert terminal_state_1 is translation_builder._terminal_sdfg_state
-    assert translation_builder._terminal_sdfg_state is translation_builder._ctx.terminal_state
-    assert translation_builder._ctx.start_state is sdfg.start_block
-    assert translation_builder._ctx.start_state is not terminal_state_1
-    assert next(iter(sdfg.edges())).src is sdfg.start_block
-    assert next(iter(sdfg.edges())).dst is terminal_state_1
-
-    # Specifying an explicit append state that is the terminal should also update the
-    #  terminal state of the builder.
-    terminal_state_2: dace.SDFGState = translation_builder.append_new_state(
-        "terminal_state_2", prev_state=terminal_state_1
-    )
-    assert sdfg.number_of_nodes() == 3
-    assert sdfg.number_of_edges() == 2
-    assert terminal_state_2 is translation_builder._terminal_sdfg_state
-    assert sdfg.out_degree(terminal_state_1) == 1
-    assert sdfg.out_degree(terminal_state_2) == 0
-    assert sdfg.in_degree(terminal_state_2) == 1
-    assert next(iter(sdfg.in_edges(terminal_state_2))).src is terminal_state_1
-
-    # Specifying a previous node that is not the terminal state should not do anything.
-    non_terminal_state: dace.SDFGState = translation_builder.append_new_state(
-        "non_terminal_state", prev_state=terminal_state_1
-    )
-    assert translation_builder._terminal_sdfg_state is not non_terminal_state
-    assert sdfg.in_degree(non_terminal_state) == 1
-    assert sdfg.out_degree(non_terminal_state) == 0
-    assert next(iter(sdfg.in_edges(non_terminal_state))).src is terminal_state_1
-
-
-def test_builder_variable_multiple_variables(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
-    """Add an already known variable, but with a different name."""
-    # Now we will add `array1` and then different ways of updating it.
-    narray1: str = translation_builder.add_array(array1, update_var_mapping=True)
-
-    # It will fail if we use the prefix, because we also want to update.
-    prefix = "__jace_prefix"
-    prefix_expected_name = prefix + narray1
-    with pytest.raises(
-        expected_exception=ValueError,
-        match=re.escape(
-            f"Cannot change the mapping of '{array1}' from '{translation_builder.map_jax_var_to_sdfg(array1)}' to '{prefix_expected_name}'."
-        ),
-    ):
-        _ = translation_builder.add_array(array1, update_var_mapping=True, name_prefix=prefix)
-    assert prefix_expected_name not in translation_builder.sdfg.arrays
-
-    # But if we do not want to update it then it works.
-    prefix_sdfg_name = translation_builder.add_array(
-        array1, update_var_mapping=False, name_prefix=prefix
-    )
-    assert prefix_expected_name == prefix_sdfg_name
-    assert prefix_expected_name in translation_builder.sdfg.arrays
-    assert narray1 == translation_builder.map_jax_var_to_sdfg(array1)
-
-
-def test_builder_variable_invalid_prefix(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
-    """Use invalid prefix."""
-    # It will fail if we use the prefix, because we also want to update.
-    for iprefix in ["0_", "_ja ", "_!"]:
-        with pytest.raises(
-            expected_exception=ValueError,
-            match=re.escape(f"add_array({array1}): The proposed name '{iprefix}a', is invalid."),
-        ):
-            _ = translation_builder.add_array(array1, update_var_mapping=False, name_prefix=iprefix)
-        assert len(translation_builder.sdfg.arrays) == 0
-
-
-def test_builder_variable_alloc_list(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
-    """Tests part of the `JaxprTranslationBuilder.create_jax_var_list()` api."""
-    var_list_1 = [array1, nscal, scal2]
-    exp_names_1 = ["a", nscal.name, "c"]
-
-    res_names_1 = translation_builder.create_jax_var_list(var_list_1, update_var_mapping=True)
-    assert len(translation_builder.arrays) == 3
-    assert res_names_1 == exp_names_1
-
-    # Now a mixture of the collection and creation.
-    var_list_2 = [array2, nscal, scal1]
-    exp_names_2 = ["d", nscal.name, "e"]
-
-    res_names_2 = translation_builder.create_jax_var_list(var_list_2, update_var_mapping=True)
-    assert res_names_2 == exp_names_2
-    assert len(translation_builder.arrays) == 5
-
-
-@pytest.mark.skip(reason="'create_jax_var_list()' does not clean up in case of an error.")
-def test_builder_variable_alloc_list_cleaning(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
-    """Tests part of the `JaxprTranslationBuilder.create_jax_var_list()` api.
-
-    It will fail because `update_var_mapping=False` thus the third variable will
-    cause an error because it is proposed to `a`, which is already used.
-    """
-    var_list = [array1, nscal, scal2]
-
-    with pytest.raises(
-        expected_exception=ValueError,
-        match=re.escape(f"add_array({scal2}): The proposed name 'a', is used."),
-    ):
-        _ = translation_builder.create_jax_var_list(var_list)
-
-    assert len(translation_builder.arrays) == 0
-
-
-def test_builder_variable_alloc_list_prevent_creation(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
-    """Tests part of the `JaxprTranslationBuilder.create_jax_var_list()` api.
-
-    It will test the `prevent_creation` flag.
-    """
-    # First create a variable.
-    translation_builder.add_array(array1, update_var_mapping=True)
-    assert len(translation_builder.arrays) == 1
-
-    # Now create the variables
-    var_list = [array1, array2]
-
-    with pytest.raises(
-        expected_exception=ValueError,
-        match=re.escape(f"'prevent_creation' given but have to create '{array2}'."),
-    ):
-        translation_builder.create_jax_var_list(var_list, prevent_creation=True)
-    assert len(translation_builder.arrays) == 1
-    assert translation_builder.map_jax_var_to_sdfg(array1) == "a"
-
-
-@pytest.mark.skip(reason="'create_jax_var_list()' does not clean up in case of an error.")
-def test_builder_variable_alloc_list_only_creation(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
-    """Tests part of the `JaxprTranslationBuilder.create_jax_var_list()` api.
-
-    It will test the `only_creation` flag.
-    """
-    # First create a variable.
-    translation_builder.add_array(array1, update_var_mapping=True)
-    assert len(translation_builder.arrays) == 1
-
-    # Now create the variables
-    var_list = [array2, array1]
-
-    with pytest.raises(
-        expected_exception=ValueError,
-        match=re.escape(f"'only_creation' given '{array1}' already exists."),
-    ):
-        translation_builder.create_jax_var_list(var_list, only_creation=True)
-    assert len(translation_builder.arrays) == 1
-    assert translation_builder.map_jax_var_to_sdfg(array1) == "a"
-
-
-def test_builder_variable_alloc_list_handle_literal(
-    translation_builder: translator.JaxprTranslationBuilder,
-) -> None:
-    """Tests part of the `JaxprTranslationBuilder.create_jax_var_list()` api.
-
-    It will test the `handle_literals` flag.
-    """
-
-    val = np.array(1)
-    aval = jax_core.get_aval(val)
-    lit = jax_core.Literal(val, aval)
-    var_list = [lit]
-
-    with pytest.raises(
-        expected_exception=ValueError,
-        match=re.escape("Encountered a literal but `handle_literals` was `False`."),
-    ):
-        translation_builder.create_jax_var_list(var_list, handle_literals=False)
-    assert len(translation_builder.arrays) == 0
-
-    name_list = translation_builder.create_jax_var_list(var_list, handle_literals=True)
-    assert len(translation_builder.arrays) == 0
-    assert name_list == [None]
-
-
-def test_builder_constants(translation_builder: translator.JaxprTranslationBuilder) -> None:
-    """Tests part of the `JaxprTranslationBuilder._create_constants()` api.
-
-    See also the `test_subtranslators_alu.py::test_add3` test.
-    """
-    # Create the Jaxpr that we need.
-    constant = [[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]]
-    jaxpr = jax.make_jaxpr(lambda A: A + jax.numpy.array(constant))(1.0)
-
-    # We have to manually allocate the builder context.
-    #  You should not do that.
-    translation_builder._allocate_translation_ctx(name="Manual_test")
-
-    # No create the constants.
-    translation_builder._create_constants(jaxpr)
-
-    # Test if it was created with the correct value.
-    assert len(translation_builder.arrays) == 1
-    assert len(translation_builder._jax_name_map) == 1
-    assert next(iter(translation_builder._jax_name_map.values())) == "__const_a"
-    assert len(translation_builder.sdfg.constants) == 1
-    assert np.all(translation_builder.sdfg.constants["__const_a"] == constant)
-
-
-def test_builder_scalar_return_value() -> None:
-    """Tests if scalars can be returned directly."""
-
-    def scalar_ops(A: float) -> float:
-        return A + A - A * A
-
-    lower_cnt = [0]
-
-    @jace.jit
-    def wrapped(A: float) -> float:
-        lower_cnt[0] += 1
-        return scalar_ops(A)
-
-    vals = np.random.random(100)  # noqa: NPY002
-    for i in range(vals.size):
-        res = wrapped(vals[i])
-        ref = scalar_ops(vals[i])
-        assert np.allclose(res, ref)
-    assert lower_cnt[0] == 1
-
-
-@pytest.mark.skip(reason="Currently 'scalar' return values, are actually shape '(1,)' arrays.")
-def test_builder_scalar_return_type() -> None:
-    """Tests if the type is the same, in case of scalar return."""
-
-    @jace.jit
-    def wrapped(A: np.float64) -> np.float64:
-        return A + A - A * A
-
-    A = np.float64(1.0)
-    assert type(A) is np.float64, f"Expected type 'np.float64', but got '{type(A).__name__}'."
-
-
-def test_builder_jace_var() -> None:
-    """Simple tests about the `JaCeVar` objects."""
-    for iname in ["do", "", "_ _", "9al", "_!"]:
-        with pytest.raises(
-            expected_exception=ValueError, match=re.escape(f"Supplied the invalid name '{iname}'.")
-        ):
-            _ = JaCeVar((), dace.int8, name=iname)
-
-
-def test_builder_F_strides() -> None:
-    """Tests if we can lower without a standard stride.
-
-    Notes:
-        This tests if the restriction is currently in place.
-        See also `tests/test_caching.py::test_caching_strides`.
-    """
-
-    @jace.jit
-    def testee(A: np.ndarray) -> np.ndarray:
-        return A + 10.0
-
-    F = np.full((4, 3), 10, dtype=np.float64, order="F")
-
-    with pytest.raises(
-        expected_exception=NotImplementedError,
-        match=re.escape("Currently can not yet handle strides beside 'C_CONTIGUOUS'."),
-    ):
-        _ = testee(F)
diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index 56b30fb..a4c4ad9 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -177,7 +177,11 @@ def foo(A):
         D = C + 1
         return D + 1
 
-    _ = foo.lower(1)
+    with pytest.warns(
+        UserWarning,
+        match=re.escape('Use of uninitialized transient "e" in state output_processing_stage'),
+    ):
+        _ = foo.lower(1)
     assert trans_cnt[0] == 4
 
 
From 9fe9e2dd8292f4ab2e30b9e5dc880d51db8f4a59 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 19 Jun 2024 15:27:04 +0200
Subject: [PATCH 389/458] Updated the translators a little bit.

Especially the slicing translator that now also do window start index adaptions for literals.
---
 .../arithmetic_logical_translators.py         | 19 +++--
 .../broadcast_in_dim_translator.py            |  8 +-
 .../convert_element_type_translator.py        |  5 +-
 .../primitive_translators/copy_translator.py  | 70 +++++++++-------
 .../primitive_translators/iota_translator.py  |  2 +-
 .../select_n_translator.py                    |  6 +-
 .../primitive_translators/slicing.py          | 84 +++++++++----------
 .../squeeze_translator.py                     |  5 +-
 src/jace/util/jax_helper.py                   | 10 ++-
 .../test_primitive_slicing.py                 |  2 +-
 10 files changed, 121 insertions(+), 90 deletions(-)

diff --git a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
index b54bd1f..d901682 100644
--- a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
+++ b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
@@ -33,8 +33,8 @@ class ArithmeticOperationTranslator(mapped_base.MappedOperationTranslatorBase):
     """
     Translator for all arithmetic operations.
 
-    The class makes use of the `MappedOperationTranslatorBase`. It only implements
-    the `write_tasklet_code()` to generate the code for a Tasklet from a template.
+    The class is derived from `MappedOperationTranslatorBase` and overwrites the
+    `write_tasklet_code()` function for the Tasklet code.
 
     Args:
         prim_name:      The name of the primitive that should be handled.
@@ -43,6 +43,7 @@ class ArithmeticOperationTranslator(mapped_base.MappedOperationTranslatorBase):
     Note:
         - It does not implement the logical operations, they are implemented by
             the `LogicalOperationTranslator` class.
+        - Despite its name this class also provides the comparison operators.
         - It does not implement `mod` nor `fmod` as they are translated to some
             nested `pjit` implementation by Jax for unknown reasons.
     """
@@ -70,17 +71,16 @@ class LogicalOperationTranslator(mapped_base.MappedOperationTranslatorBase):
     Translator for all logical operations.
 
     The reason why the logical operations are separated from the arithmetic
-    operation is quite complicated, and in fact the whole thing is harder than
+    operations is quite complicated and in fact the whole thing is harder than
     it should be. NumPy has two kinds of these operations, i.e.
     `logical_{and, or, xor, not}()` and `bitwise_{and, or, xor, not}()`, but Jax
-    has only a single kind of logical operations, that operate in bitwise mode.
+    has only a single kind of logical operation, that operate in bitwise mode.
     The first idea would be to use `ArithmeticOperationTranslator` with a template
     such as `__out = __in0 & __in1` or `__out = ~__in0`. Since DaCe eventually
     generates C++ code and C++ has a native bool type, and `true` is guaranteed
     to be `1` and `false` equals `0`, this works for all operations except `not`,
-    as `~true` in C++ is again `true`. Thus the `not` primitive must be handled
-    separately, however, it does not make sense to split the logical operations,
-    thus all of them are handled by this class.
+    as `~true` in C++ is essentially `~1`, which is again `true`!
+    Thus the `not` primitive must be handled separately.
 
     The solution to the problem is, to introduce two templates, one used for the
     bool context and one used in the integer context. This works because depending
@@ -93,8 +93,9 @@ class LogicalOperationTranslator(mapped_base.MappedOperationTranslatorBase):
         bool_tmpl:      The template used for the bool case.
 
     Notes:
-        This class does not do parameter substitution as the
-        `ArithmeticOperationTranslator` does.
+        Since it does not make sense to single out `not` and keep the other
+        logical operations in `ArithmeticOperationTranslator` all of them are
+        handled by this class.
     """
 
     def __init__(self, prim_name: str, int_tmpl: str, bool_tmpl: str) -> None:
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
index 12852e5..7f24160 100644
--- a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -25,7 +25,13 @@
 
 
 class BroadcastInDimTranslator(mapped_base.MappedOperationTranslatorBase):
-    """Implements the `broadcast_in_dim` primitive."""
+    """
+    Implements the `broadcast_in_dim` primitive.
+
+    The primitive is implemented through the `MappedOperationTranslatorBase` base.
+    Essentially it creates a copy, but also creates special Memlets that replicate
+    the content of the input.
+    """
 
     def __init__(self) -> None:
         super().__init__(primitive_name="broadcast_in_dim")
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index e9caab5..28838e5 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -28,7 +28,10 @@ class ConvertElementTypeTranslator(mapped_base.MappedOperationTranslatorBase):
     """
     Implements the `convert_element_type` primitive.
 
-    Copies the input to the output and performs type conversion.
+    The primitive will expand to a "copy Map", however, the Tasklet will not
+    simply copy the input to the output, but also perform type conversion.
+    However, in cases where the input type is the same as the output type,
+    the Tasklet will just be a copy Tasklet, that can then be removed by DaCe.
 
     Notes:
         This translator ignores the `new_dtype` and `weak_type` parameters of
diff --git a/src/jace/translator/primitive_translators/copy_translator.py b/src/jace/translator/primitive_translators/copy_translator.py
index 5752e0d..650b483 100644
--- a/src/jace/translator/primitive_translators/copy_translator.py
+++ b/src/jace/translator/primitive_translators/copy_translator.py
@@ -11,10 +11,10 @@
 
 from typing import TYPE_CHECKING
 
+import dace
 from typing_extensions import override
 
 from jace import translator
-from jace.translator import mapped_operation_base_translator as mapped_base
 
 
 if TYPE_CHECKING:
@@ -23,55 +23,69 @@
     from jax import core as jax_core
 
 
-class CopyTranslator(mapped_base.MappedOperationTranslatorBase):
+class CopyTranslator:
     """
     Implements the `copy` primitive.
 
-    Copy operations are implemented as a map to ensure that they can be fused
-    with other maps
-    .
+    The translator is implemented by using a Memlet.
     """
 
-    def __init__(self) -> None:
-        super().__init__(primitive_name="copy")
+    @property
+    def primitive(self) -> str:  # noqa: D102  # No docstring needed.
+        return "copy"
 
-    @override
-    def write_tasklet_code(
+    def __call__(  # noqa: D102  # No docstring
         self,
-        tskl_ranges: Sequence[tuple[str, str]],
+        builder: translator.JaxprTranslationBuilder,
         in_var_names: Sequence[str | None],
-        eqn: jax_core.JaxprEqn,
-    ) -> str:
-        return "__out = __in0"
-
-
-class DevicePutTranslator(mapped_base.MappedOperationTranslatorBase):
+        out_var_names: Sequence[str],
+        eqn: jax_core.JaxprEqn,  # noqa: ARG002
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        eqn_state.add_nedge(
+            eqn_state.add_read(in_var_names[0]),
+            eqn_state.add_write(out_var_names[0]),
+            dace.Memlet.from_array(
+                in_var_names[0],
+                builder.arrays[in_var_names[0]],  # type: ignore[index]  # Guaranteed to be a string
+            ),
+        )
+
+
+class DevicePutTranslator(CopyTranslator):
     """
     Implements the `device_put` primitive.
 
-    In Jax this primitive is used to copy data between the host and the device.
-    Because of the way how JaCe and the optimization pipeline works, either
-    everything is on the host or the device.
-
-    Todo:
-        Think about how to implement this correctly.
+    In Jax this primitive is used to copy data between the host and the device,
+    in DaCe Memlets can do this. However, because of the way JaCe operates, at
+    least in the beginning a computation is either fully on the host or on the
+    device this copy will essentially perform a copying.
     """
 
-    def __init__(self) -> None:
-        super().__init__(primitive_name="device_put")
+    @property
+    def primitive(self) -> str:  # noqa: D102  # No docstring
+        return "device_put"
 
     @override
-    def write_tasklet_code(
+    def __call__(  # No docstring
         self,
-        tskl_ranges: Sequence[tuple[str, str]],
+        builder: translator.JaxprTranslationBuilder,
         in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
         eqn: jax_core.JaxprEqn,
-    ) -> str:
+        eqn_state: dace.SDFGState,
+    ) -> None:
         if not (eqn.params["device"] is None and eqn.params["src"] is None):
             raise NotImplementedError(
                 f"Can only copy on the host, but not from {eqn.params['src']} to {eqn.params['device']}."
             )
-        return "__out = __in0"
+        return super().__call__(
+            builder=builder,
+            in_var_names=in_var_names,
+            out_var_names=out_var_names,
+            eqn=eqn,
+            eqn_state=eqn_state,
+        )
 
 
 _ = translator.register_primitive_translator(CopyTranslator())
diff --git a/src/jace/translator/primitive_translators/iota_translator.py b/src/jace/translator/primitive_translators/iota_translator.py
index 54da87a..ce0d99f 100644
--- a/src/jace/translator/primitive_translators/iota_translator.py
+++ b/src/jace/translator/primitive_translators/iota_translator.py
@@ -28,7 +28,7 @@ class IotaTranslator(mapped_base.MappedOperationTranslatorBase):
     """
     Implements the `iota` primitive.
 
-    Essentially a very general `jnp.arange()` function.
+    Essentially, a very general `jnp.arange()` function.
     """
 
     def __init__(self) -> None:
diff --git a/src/jace/translator/primitive_translators/select_n_translator.py b/src/jace/translator/primitive_translators/select_n_translator.py
index 80d63f4..51b27b3 100644
--- a/src/jace/translator/primitive_translators/select_n_translator.py
+++ b/src/jace/translator/primitive_translators/select_n_translator.py
@@ -70,7 +70,6 @@ def make_input_memlets(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> dict[str, dace.Memlet]:
-        """We have to add the offsets to the Memlet accesses."""
         return {
             f"__in{i - 1}" if i else "__cond": dace.Memlet.simple(
                 in_var_name, ", ".join(f"{it_idx}" for it_idx, _ in tskl_ranges)
@@ -79,10 +78,11 @@ def make_input_memlets(
             if in_var_name
         }
 
-    def literal_substitution(  # noqa: PLR6301
+    @override
+    def literal_substitution(
         self, tskl_code: str, in_var_names: Sequence[str | None], eqn: jax_core.JaxprEqn
     ) -> str:
-        """Can not be done by the base because of the renaming."""
+        assert in_var_names[0]  # Condition can never be a literal.
         for i, in_var_name in enumerate(in_var_names[1:]):
             if in_var_name is not None:
                 continue
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index 2fb1a2f..3000377 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -29,8 +29,11 @@ class SlicingTranslator(mapped_base.MappedOperationTranslatorBase):
     Implements the `slice` primitive.
 
     This is the classical slicing operation which extracts a fixed sized window
-    from a fixed initial position. The `dynamic_slice` operation supports a
-    variable starting point.
+    from a fixed initial position. The slicing is implemented using a partial copy.
+
+    Notes:
+        Slices are essentially optimization barriers as they can not be fused
+        with Maps before them.
     """
 
     def __init__(self) -> None:
@@ -101,41 +104,47 @@ def __call__(
         # This is the sizes of the slice window.
         window_sizes: Sequence[int] = eqn.params["slice_sizes"]
 
-        # The first input to the primitive is the array we slice from, the others are
-        #  the start indices of the slice window, each is a scalar, maybe literals.
-        in_var_name: str = in_var_names[0]
-        start_indices: list[str | None] = list(in_var_names[1:])
-
-        # Access nodes for the modified start indexes.
+        # Maps the variable name, that stores the start index of the window in one
+        #  dimensions to the access node, that holds the value. The variable name
+        #  is also used as dynamic range offset.
+        #  Only present if the index is not a literal.
         in_access: dict[str, dace.nodes.AccessNode] = {}
 
+        # Name of the variable from where we get the start index of the window
+        #  or the value itself, if it is a literal; in the order of the dimension.
+        #  If the value is `None` then the literal was not yet processed.
+        window_start_indices: list[str | None] = list(in_var_names[1:])
+
         # We will always adapt the start indexes and not check if it is needed.
-        for dim, (start_index, dim_size, wsize) in enumerate(
-            zip(start_indices, util.get_jax_var_shape(eqn.invars[0]), window_sizes)
+        for dim, (window_start_index, dim_size, window_size) in enumerate(
+            zip(window_start_indices, util.get_jax_var_shape(eqn.invars[0]), window_sizes)
         ):
-            if start_index is None:
+            if window_start_index is None:
+                # Jax does not adjust the literals on its own
+                raw_window_start = int(util.get_jax_literal_value(eqn.invars[dim + 1]))  # type: ignore[arg-type]  # type confusion
+                adjusted_window_start = min(dim_size, raw_window_start + window_size) - window_size
+                window_start_indices[dim] = str(adjusted_window_start)
                 continue
 
-            # We use a Tasklet to perform the adjustment not a symbol, because this
-            # would need an interstage edge serving as kind of an optimization barrier.
+            # We do not use a symbol for the start of the window but a Tasklet, as
+            #  a symbol would need an interstage edge, which is an optimization barrier.
             tasklet = dace.nodes.Tasklet(
-                label=f"adjustment_of_slice_start_{start_index}_for_{out_var_names[0]}",
+                label=f"adjustment_of_slice_start_{window_start_index}_for_{out_var_names[0]}",
                 inputs={"unadjusted_start_idx": None},
                 outputs={"adjusted_start_idx": None},
-                code=f"adjusted_start_idx = min(unadjusted_start_idx + {wsize}, {dim_size}) - {wsize}",
+                code=f"adjusted_start_idx = min(unadjusted_start_idx + {window_size}, {dim_size}) - {window_size}",
             )
-
             new_start_idx_var_name = builder.add_array(
                 eqn.invars[dim + 1], name_prefix="__jace_adapted_start_idx_"
             )
             new_start_idx_acc = eqn_state.add_access(new_start_idx_var_name)
 
             eqn_state.add_edge(
-                eqn_state.add_read(start_index),
+                eqn_state.add_read(window_start_index),
                 None,
                 tasklet,
                 "unadjusted_start_idx",
-                dace.Memlet.simple(start_index, "0"),
+                dace.Memlet.simple(window_start_index, "0"),
             )
             eqn_state.add_edge(
                 tasklet,
@@ -144,33 +153,22 @@ def __call__(
                 None,
                 dace.Memlet.simple(new_start_idx_var_name, "0"),
             )
-            # Update the name of the start index
-            start_indices[dim] = new_start_idx_var_name
+            # Update the name of the start index, and store the access
+            #  node for later use.
+            window_start_indices[dim] = new_start_idx_var_name
             in_access[new_start_idx_var_name] = new_start_idx_acc
 
         tskl_ranges: list[tuple[str, str]] = [
             (f"__i{dim}", f"0:{N}") for dim, N in enumerate(util.get_jax_var_shape(eqn.outvars[0]))
         ]
 
-        # For copying the data, we use dynamic map ranges, which is basically an input
-        #  connector on the map entry whose name is not `IN_*`, this name can then be
-        #  used as a symbol inside the map scope; this symbol is then used as offset.
-        dynamic_map_ranges: dict[str, str] = {}
         memlet_accesses: list[str] = []
 
-        for i, ((it_var, _), start_index) in enumerate(zip(tskl_ranges, start_indices), 1):
-            if start_index is None:
-                offset = str(util.get_jax_literal_value(eqn.invars[i]))
-            else:
-                # Because of [issue 1579](https://github.com/spcl/dace/issues/1579) we
-                #  have to use the same name as the data container for the symbol and
-                #  can not mangle it.
-                # TODO(phimuell): Activate mangling when the issue is resolved.
-                offset = start_index
-                dynamic_map_ranges[offset] = start_index
-            memlet_accesses.append(f"{it_var} + {offset}")
-
-        tskl_input = dace.Memlet.simple(in_var_name, ", ".join(memlet_accesses))
+        for (it_var, _), offset_symbol_name in zip(tskl_ranges, window_start_indices):
+            assert offset_symbol_name is not None
+            memlet_accesses.append(f"{it_var} + {offset_symbol_name}")
+
+        tskl_input = dace.Memlet.simple(in_var_names[0], ", ".join(memlet_accesses))
         tskl_output = dace.Memlet.simple(
             out_var_names[0], ", ".join(name for name, _ in tskl_ranges)
         )
@@ -185,15 +183,17 @@ def __call__(
 
         # Creating the inputs for the dynamic map ranges. We have to use the same
         #  access nodes as above, to ensure a single order of computation.
-        for symb_name, start_index in dynamic_map_ranges.items():
+        for window_start_index_name, windows_start_access_node in in_access.items():
             eqn_state.add_edge(
-                in_access[start_index],
+                windows_start_access_node,
                 None,
                 map_entry,
-                symb_name,
-                dace.Memlet.simple(start_index, "0"),
+                window_start_index_name,
+                dace.Memlet.simple(window_start_index_name, "0"),
             )
-            map_entry.add_in_connector(symb_name)
+            map_entry.add_in_connector(window_start_index_name)
+
+        builder.sdfg.view()
 
 
 translator.register_primitive_translator(SlicingTranslator())
diff --git a/src/jace/translator/primitive_translators/squeeze_translator.py b/src/jace/translator/primitive_translators/squeeze_translator.py
index 6d04d29..de6f1f4 100644
--- a/src/jace/translator/primitive_translators/squeeze_translator.py
+++ b/src/jace/translator/primitive_translators/squeeze_translator.py
@@ -29,9 +29,8 @@ class SqueezeTranslator(mapped_base.MappedOperationTranslatorBase):
     """
     Implements the `squeeze` primitive.
 
-    The primitives allows to remove a dimension of size one. Essentially
-    equivalent to `np.squeeze` and the inverse to `np.expand_dims()`,
-    which is handled by the `broadcast_in_dim` primitive.
+    The primitives allows to remove dimensions of size one. Essentially
+    equivalent to `np.squeeze` and the inverse to `np.expand_dims()`.
     """
 
     def __init__(self) -> None:
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index c0997ba..d1e1364 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -16,7 +16,7 @@
 
 import dataclasses
 import itertools
-from typing import TYPE_CHECKING, Any
+from typing import TYPE_CHECKING, Any, overload
 
 import dace
 import jax
@@ -102,6 +102,14 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
             )
 
 
+@overload
+def get_jax_var_shape(jax_var: jax_core.Atom) -> tuple[int, ...]: ...
+
+
+@overload
+def get_jax_var_shape(jax_var: JaCeVar) -> tuple[int | dace.symbol | str, ...]: ...
+
+
 def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symbol | str, ...]:
     """Returns the shape of `jax_var`."""
     match jax_var:
diff --git a/tests/integration_tests/primitive_translators/test_primitive_slicing.py b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
index 1615dd0..6df48e8 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_slicing.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_slicing.py
@@ -93,7 +93,7 @@ def testee(a: np.ndarray, s1: int, s2: int) -> jax.Array:
 
 def test_dynamic_slice_full_literal(a_4x4x4x4: np.ndarray) -> None:
     def testee(a: np.ndarray) -> jax.Array:
-        return jax.lax.dynamic_slice(a, (0, 1, 0, 2), (2, 2, 2, 2))
+        return jax.lax.dynamic_slice(a, (0, 1, 0, 3), (2, 2, 2, 2))
 
     res = jace.jit(testee)(a_4x4x4x4)
     ref = testee(a_4x4x4x4)

From 2ecb7ee3f55f7f6b5013eea0d83546995da35033 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 19 Jun 2024 16:23:43 +0200
Subject: [PATCH 390/458] Added teh concatenation translator.

---
 .../primitive_translators/__init__.py         |  2 +
 .../primitive_translators/concatenate.py      | 85 +++++++++++++++++++
 .../test_primitive_concatenate.py             | 80 +++++++++++++++++
 3 files changed, 167 insertions(+)
 create mode 100644 src/jace/translator/primitive_translators/concatenate.py
 create mode 100644 tests/integration_tests/primitive_translators/test_primitive_concatenate.py

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index f06a67a..cf3e866 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -13,6 +13,7 @@
     LogicalOperationTranslator,
 )
 from .broadcast_in_dim_translator import BroadcastInDimTranslator
+from .concatenate import ConcatenateTranslator
 from .convert_element_type_translator import ConvertElementTypeTranslator
 from .copy_translator import CopyTranslator, DevicePutTranslator
 from .iota_translator import IotaTranslator
@@ -25,6 +26,7 @@
 __all__ = [
     "ArithmeticOperationTranslator",
     "BroadcastInDimTranslator",
+    "ConcatenateTranslator",
     "ConvertElementTypeTranslator",
     "CopyTranslator",
     "DevicePutTranslator",
diff --git a/src/jace/translator/primitive_translators/concatenate.py b/src/jace/translator/primitive_translators/concatenate.py
new file mode 100644
index 0000000..916d507
--- /dev/null
+++ b/src/jace/translator/primitive_translators/concatenate.py
@@ -0,0 +1,85 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements the concatenation primitive."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import dace
+
+from jace import translator, util
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
+class ConcatenateTranslator:
+    """
+    Implements the `concatenate` primitive.
+
+    It is implemented by a series of map that writes to the same access node.
+    It is probably the largest stretch of "written once" in the entire core.
+    """
+
+    @property
+    def primitive(self) -> str:  # noqa: D102  # No docstring needed.
+        return "concatenate"
+
+    def __call__(  # noqa: D102  # No docstring
+        self,
+        builder: translator.JaxprTranslationBuilder,  # noqa: ARG002  # Unused.
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        if any(in_var_name is None for in_var_name in in_var_names):
+            raise NotImplementedError("Concatenate: No literal inputs supported.")
+
+        # Dimension along we concatenate.
+        cat_dim = eqn.params["dimension"]
+
+        # Offset counter for write back.
+        already_copied = 0
+
+        # This is the access node we use for the output
+        #  Is inside a dict for input to `add_mapped_tasklet()`.
+        output_nodes = {out_var_names[0]: eqn_state.add_write(out_var_names[0])}
+
+        # Now going over each input and copying the input in the correct location
+        #  of the output array.
+        for i, in_var_name in enumerate(in_var_names):
+            input_shape = util.get_jax_var_shape(eqn.invars[i])
+
+            tskl_range = [(f"__dim{d}", f"0:{dim_size}") for d, dim_size in enumerate(input_shape)]
+            tskl_input_access = [it_var for it_var, _ in tskl_range]
+
+            tskl_output_access = tskl_input_access.copy()
+            tskl_output_access[cat_dim] = f"{tskl_output_access[cat_dim]} + {already_copied}"
+
+            eqn_state.add_mapped_tasklet(
+                f"_concatenate_{out_var_names[0]}_{in_var_name}",
+                map_ranges=tskl_range,
+                inputs={"__in": dace.Memlet.simple(in_var_name, ", ".join(tskl_input_access))},
+                code="__out = __in",
+                outputs={
+                    "__out": dace.Memlet.simple(out_var_names[0], ",".join(tskl_output_access))
+                },
+                output_nodes=output_nodes,
+                external_edges=True,
+            )
+
+            # Update the counter that we have copied
+            already_copied += input_shape[cat_dim]
+
+
+_ = translator.register_primitive_translator(ConcatenateTranslator())
diff --git a/tests/integration_tests/primitive_translators/test_primitive_concatenate.py b/tests/integration_tests/primitive_translators/test_primitive_concatenate.py
new file mode 100644
index 0000000..29f44a8
--- /dev/null
+++ b/tests/integration_tests/primitive_translators/test_primitive_concatenate.py
@@ -0,0 +1,80 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+from __future__ import annotations
+
+import jax
+import numpy as np
+import pytest
+from jax import numpy as jnp
+
+import jace
+from jace.util import translation_cache as tcache
+
+from tests import util as testutil
+
+
+def test_cat_1d_arrays() -> None:
+    """Concatenate two 1d arrays."""
+
+    a1 = testutil.make_array(10)
+    a2 = testutil.make_array(10)
+
+    def testee(a1: np.ndarray, a2: np.ndarray) -> jax.Array:
+        return jax.lax.concatenate((a1, a2), 0)
+
+    ref = testee(a1, a2)
+    res = jace.jit(testee)(a1, a2)
+
+    assert res.shape == ref.shape
+    assert np.all(ref == res)
+
+
+def test_cat_nd() -> None:
+    """Concatenate arrays of higher dimensions."""
+    nb_arrays = 4
+    std_shape: list[int] = [2, 3, 4, 5, 3]
+
+    for cat_dim in range(len(std_shape)):
+        tcache.clear_translation_cache()
+
+        # Create the input that we ware using.
+        input_arrays: list[np.ndarray] = []
+        for _ in range(nb_arrays):
+            shape = std_shape.copy()
+            shape[cat_dim] = (testutil.make_array((), dtype=np.int32) % 10) + 1  # type: ignore[call-overload]  # type confusion
+            input_arrays.append(testutil.make_array(shape))
+
+        def testee(inputs: list[np.ndarray]) -> np.ndarray | jax.Array:
+            return jax.lax.concatenate(inputs, cat_dim)  # noqa: B023  # Iteration variable capture.
+
+        ref = testee(input_arrays)
+        res = jace.jit(testee)(input_arrays)
+
+        assert res.shape == ref.shape
+        assert np.all(ref == res)
+
+
+@pytest.mark.skip(reason="Jax does not support scalars as inputs.")
+def test_cat_1d_array_scalars():
+    """Concatenate an 1d array with scalars.
+
+    This does not work, it is to observe Jax.
+    """
+
+    a1 = testutil.make_array(10)
+    s1 = testutil.make_array(())
+    s2 = testutil.make_array(())
+
+    def testee(a1: np.ndarray, s1: np.float64, s2: np.float64) -> np.ndarray | jax.Array:
+        return jnp.concatenate((s1, a1, s2), 0)
+
+    ref = testee(a1, s1, s2)
+    res = jace.jit(testee)(a1, s1, s2)
+
+    assert res.shape == ref.shape
+    assert np.all(ref == res)

From 0b52d4bd9e868055e092cc25262bd8027ac0a00d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 21 Jun 2024 10:52:05 +0200
Subject: [PATCH 391/458] First batch of the first review.

---
 src/jace/__init__.py                          |   5 +-
 src/jace/api.py                               |  32 +++--
 src/jace/optimization.py                      |  17 ++-
 src/jace/stages.py                            | 110 +++++++++---------
 src/jace/tracing.py                           |  67 +++++------
 src/jace/translated_jaxpr_sdfg.py             |  57 +++++----
 .../translator/jaxpr_translator_builder.py    |  36 +++---
 src/jace/translator/pre_post_translation.py   |  17 ++-
 src/jace/translator/primitive_translator.py   |   8 +-
 .../primitive_translators/alu_translator.py   |   4 +-
 src/jace/util/jax_helper.py                   |  31 ++---
 src/jace/util/traits.py                       |   8 +-
 src/jace/util/translation_cache.py            |  26 ++---
 13 files changed, 200 insertions(+), 218 deletions(-)

diff --git a/src/jace/__init__.py b/src/jace/__init__.py
index 7d2536c..ca7e0f5 100644
--- a/src/jace/__init__.py
+++ b/src/jace/__init__.py
@@ -9,16 +9,13 @@
 
 from __future__ import annotations
 
-import jace.translator.primitive_translators as _  # noqa: F401  # Populate the internal registry.
+import jace.translator.primitive_translators as _  # noqa: F401 [unused-import]  # Needed to populate the internal translator registry.
 
 from .__about__ import __author__, __copyright__, __license__, __version__, __version_info__
 from .api import grad, jacfwd, jacrev, jit
-from .translated_jaxpr_sdfg import CompiledJaxprSDFG, TranslatedJaxprSDFG
 
 
 __all__ = [
-    "CompiledJaxprSDFG",
-    "TranslatedJaxprSDFG",
     "__author__",
     "__copyright__",
     "__license__",
diff --git a/src/jace/api.py b/src/jace/api.py
index da42139..3d6facd 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -10,7 +10,6 @@
 from __future__ import annotations
 
 import functools
-import inspect
 from typing import TYPE_CHECKING, Literal, ParamSpec, TypedDict, TypeVar, overload
 
 from jax import grad, jacfwd, jacrev
@@ -23,14 +22,14 @@
     from collections.abc import Callable, Mapping
 
 
-__all__ = ["JitOptions", "grad", "jacfwd", "jacrev", "jit"]
+__all__ = ["JITOptions", "grad", "jacfwd", "jacrev", "jit"]
 
 # Used for type annotation, see the notes in `jace.stages` for more.
 _P = ParamSpec("_P")
-_RetrunType = TypeVar("_RetrunType")
+_ReturnType = TypeVar("_ReturnType")
 
 
-class JitOptions(TypedDict, total=False):
+class JITOptions(TypedDict, total=False):
     """
     All known options to `jace.jit` that influence tracing.
 
@@ -46,27 +45,27 @@ def jit(
     fun: Literal[None] = None,
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
-    **kwargs: Unpack[JitOptions],
-) -> Callable[[Callable[_P, _RetrunType]], stages.JaCeWrapped[_P, _RetrunType]]: ...
+    **kwargs: Unpack[JITOptions],
+) -> Callable[[Callable[_P, _ReturnType]], stages.JaCeWrapped[_P, _ReturnType]]: ...
 
 
 @overload
 def jit(
-    fun: Callable[_P, _RetrunType],
+    fun: Callable[_P, _ReturnType],
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
-    **kwargs: Unpack[JitOptions],
-) -> stages.JaCeWrapped[_P, _RetrunType]: ...
+    **kwargs: Unpack[JITOptions],
+) -> stages.JaCeWrapped[_P, _ReturnType]: ...
 
 
 def jit(
-    fun: Callable[_P, _RetrunType] | None = None,
+    fun: Callable[_P, _ReturnType] | None = None,
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
-    **kwargs: Unpack[JitOptions],
+    **kwargs: Unpack[JITOptions],
 ) -> (
-    Callable[[Callable[_P, _RetrunType]], stages.JaCeWrapped[_P, _RetrunType]]
-    | stages.JaCeWrapped[_P, _RetrunType]
+    Callable[[Callable[_P, _ReturnType]], stages.JaCeWrapped[_P, _ReturnType]]
+    | stages.JaCeWrapped[_P, _ReturnType]
 ):
     """
     JaCe's replacement for `jax.jit` (just-in-time) wrapper.
@@ -91,12 +90,7 @@ def jit(
             f"The following arguments to 'jace.jit' are not yet supported: {', '.join(kwargs)}."
         )
 
-    def wrapper(f: Callable[_P, _RetrunType]) -> stages.JaCeWrapped[_P, _RetrunType]:
-        if any(
-            param.default is not param.empty for param in inspect.signature(f).parameters.values()
-        ):
-            raise NotImplementedError("Default values are not yet supported.")
-
+    def wrapper(f: Callable[_P, _ReturnType]) -> stages.JaCeWrapped[_P, _ReturnType]:
         jace_wrapper = stages.JaCeWrapped(
             fun=f,
             primitive_translators=(
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index 1346186..33a94b8 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -15,7 +15,7 @@
 
 
 if TYPE_CHECKING:
-    import jace
+    from jace import translated_jaxpr_sdfg as tjsdfg
 
 
 class CompilerOptions(TypedDict, total=False):
@@ -31,24 +31,23 @@ class CompilerOptions(TypedDict, total=False):
 
     auto_optimize: bool
     simplify: bool
-    persistent: bool
+    persistent_transients: bool
 
 
-# TODO(phimuell): Add a context manager to modify the default.
 DEFAULT_OPTIMIZATIONS: Final[CompilerOptions] = {
     "auto_optimize": True,
     "simplify": True,
-    "persistent": True,
+    "persistent_transients": True,
 }
 
 NO_OPTIMIZATIONS: Final[CompilerOptions] = {
     "auto_optimize": False,
     "simplify": False,
-    "persistent": False,
+    "persistent_transients": False,
 }
 
 
-def jace_optimize(tsdfg: jace.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOptions]) -> None:  # noqa: D417  # Missing description for kwargs
+def jace_optimize(tsdfg: tjsdfg.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOptions]) -> None:  # noqa: D417 [undocumented-param]
     """
     Performs optimization of the translated SDFG _in place_.
 
@@ -60,9 +59,9 @@ def jace_optimize(tsdfg: jace.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOpti
         tsdfg: The translated SDFG that should be optimized.
         simplify: Run the simplification pipeline.
         auto_optimize: Run the auto optimization pipeline (currently does nothing)
-        persistent:  Make the memory allocation persistent, i.e. allocate the
-            transients only once at the beginning and then reuse the memory across
-            the lifetime of the SDFG.
+        persistent_transients: Set the allocation lifetime of (non register) transients
+            in the SDFG to `AllocationLifetime.Persistent`, i.e. keep them allocated
+            between different invocations.
     """
     # Currently this function exists primarily for the same of existing.
 
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 8b6bb5e..e527dd8 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -7,11 +7,11 @@
 """
 Reimplementation of the `jax.stages` module.
 
-This module reimplements the public classes of that Jax module.
+This module reimplements the public classes of that JAX module.
 However, because JaCe uses DaCe as backend they differ is some small aspects.
 
-As in Jax JaCe has different stages, the terminology is taken from
-[Jax' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
+As in JAX JaCe has different stages, the terminology is taken from
+[JAX' AOT-Tutorial](https://jax.readthedocs.io/en/latest/aot.html).
 - Stage out:
     In this phase an executable Python function is translated to a Jaxpr.
 - Lower:
@@ -21,7 +21,7 @@
 - Execution:
     This is the actual running of the computation.
 
-As in Jax the in JaCe the user only has access to the last tree stages and
+As in JAX the in JaCe the user only has access to the last tree stages and
 staging out and lowering is handled as a single step.
 """
 
@@ -33,10 +33,9 @@
 
 from jax import tree_util as jax_tree
 
-import jace
-from jace import api, optimization, tracing, translated_jaxpr_sdfg, translator, util
+from jace import api, optimization, tracing, translated_jaxpr_sdfg as tjsdfg, translator, util
 from jace.optimization import CompilerOptions
-from jace.translator import pre_post_translation as ptrans
+from jace.translator import pre_post_translation as pptrans
 from jace.util import translation_cache as tcache
 
 
@@ -46,7 +45,7 @@
     import dace
 
 __all__ = [
-    "CompilerOptions",  # export for compatibility with Jax.
+    "CompilerOptions",  # export for compatibility with JAX.
     "JaCeCompiled",
     "JaCeLowered",
     "JaCeWrapped",
@@ -62,17 +61,17 @@
 # These are used to annotated the `Stages`, however, there are some limitations.
 #  First, the only stage that is fully annotated is `JaCeWrapped`. Second, since
 #  static arguments modify the type signature of `JaCeCompiled.__call__()`, see
-#  [Jax](https://jax.readthedocs.io/en/latest/aot.html#lowering-with-static-arguments)
+#  [JAX](https://jax.readthedocs.io/en/latest/aot.html#lowering-with-static-arguments)
 #  for more, its argument can not be annotated, only its return type can.
 #  However, in case of scalar return values, the return type is wrong anyway, since
-#  JaCe and Jax for that matter, transforms scalars to arrays. Since there is no way of
+#  JaCe and JAX for that matter, transforms scalars to arrays. Since there is no way of
 #  changing that, but from a semantic point they behave the same so it should not
 #  matter too much.
 _P = ParamSpec("_P")
-_RetrunType = TypeVar("_RetrunType")
+_ReturnType = TypeVar("_ReturnType")
 
 
-class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P, _RetrunType]):
+class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P, _ReturnType]):
     """
     A function ready to be specialized, lowered, and compiled.
 
@@ -85,7 +84,7 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P, _RetrunType]):
     object is later lowered with the same arguments the result might be taken
     from the cache.
 
-    Furthermore, a `JaCeWrapped` object is composable with all Jax transformations,
+    Furthermore, a `JaCeWrapped` object is composable with all JAX transformations,
     all other stages are not.
 
     Args:
@@ -102,15 +101,15 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P, _RetrunType]):
         which is implicitly and temporary activated during tracing.
     """
 
-    _fun: Callable[_P, _RetrunType]
+    _fun: Callable[_P, _ReturnType]
     _primitive_translators: dict[str, translator.PrimitiveTranslator]
-    _jit_options: api.JitOptions
+    _jit_options: api.JITOptions
 
     def __init__(
         self,
-        fun: Callable[_P, _RetrunType],
+        fun: Callable[_P, _ReturnType],
         primitive_translators: Mapping[str, translator.PrimitiveTranslator],
-        jit_options: api.JitOptions,
+        jit_options: api.JITOptions,
     ) -> None:
         assert all(
             param.default is param.empty for param in inspect.signature(fun).parameters.values()
@@ -120,7 +119,7 @@ def __init__(
         self._jit_options = {**jit_options}
         self._fun = fun
 
-    def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> _RetrunType:
+    def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> _ReturnType:
         """
         Executes the wrapped function, lowering and compiling as needed in one step.
 
@@ -128,7 +127,7 @@ def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> _RetrunType:
         arguments as the original computation and the return value is unflattened.
 
         Note:
-            This function is also aware if a Jax tracing is going on. In this
+            This function is also aware if a JAX tracing is going on. In this
             case, it will forward the computation.
             Currently, this function ignores the value of `jax.disable_jit()`.
         """
@@ -141,7 +140,7 @@ def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> _RetrunType:
         return compiled(*args, **kwargs)
 
     @tcache.cached_transition
-    def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered[_RetrunType]:
+    def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered[_ReturnType]:
         """
         Lower the wrapped computation for the given arguments.
 
@@ -161,30 +160,31 @@ def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered[_RetrunType]
         jaxpr_maker = tracing.make_jaxpr(
             fun=self._fun,
             trace_options=self._jit_options,
-            return_outtree=True,
+            return_out_tree=True,
         )
-        jaxpr, outtree = jaxpr_maker(*args, **kwargs)
+        jaxpr, out_tree = jaxpr_maker(*args, **kwargs)
         builder = translator.JaxprTranslationBuilder(
             primitive_translators=self._primitive_translators
         )
         trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
 
         flat_call_args = jax_tree.tree_leaves((args, kwargs))
-        tsdfg: jace.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
+        tsdfg: tjsdfg.TranslatedJaxprSDFG = pptrans.postprocess_jaxpr_sdfg(
             trans_ctx=trans_ctx,
             fun=self.wrapped_fun,
             flat_call_args=flat_call_args,
         )
 
         # NOTE: `tsdfg` is deepcopied as a side effect of post processing.
-        return JaCeLowered(tsdfg, outtree)
+        return JaCeLowered(tsdfg, out_tree)
 
     @property
-    def wrapped_fun(self) -> Callable:  # noqa: D102  # No docstring.
+    def wrapped_fun(self) -> Callable:
+        """Return the underlying Python function."""
         return self._fun
 
     def _make_call_description(
-        self, intree: jax_tree.PyTreeDef, flat_call_args: Sequence[Any]
+        self, in_tree: jax_tree.PyTreeDef, flat_call_args: Sequence[Any]
     ) -> tcache.StageTransformationSpec:
         """
         Computes the key for the `JaCeWrapped.lower()` call inside the cache.
@@ -199,11 +199,11 @@ def _make_call_description(
         # TODO(phimuell): Implement static arguments
         flat_call_args = tuple(tcache._AbstractCallArgument.from_value(x) for x in flat_call_args)
         return tcache.StageTransformationSpec(
-            stage_id=id(self), flat_call_args=tuple(flat_call_args), intree=intree
+            stage_id=id(self), flat_call_args=tuple(flat_call_args), in_tree=in_tree
         )
 
 
-class JaCeLowered(tcache.CachingStage["JaCeCompiled"], Generic[_RetrunType]):
+class JaCeLowered(tcache.CachingStage["JaCeCompiled"], Generic[_ReturnType]):
     """
     Represents the original computation as an SDFG.
 
@@ -212,33 +212,33 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"], Generic[_RetrunType]):
     calling `self.compile()`. A user should never directly construct a `JaCeLowered`
     object directly, instead `JaCeWrapped.lower()` should be used.
 
-    Before the SDFG is compiled it is optimized, see `JaCeLowered.compile()` for how to
+    The SDFG is optimized before the compilation, see `JaCeLowered.compile()` for how to
     control the process.
 
     Args:
         tsdfg: The lowered SDFG with metadata.
-        outtree: The pytree describing how to unflatten the output.
+        out_tree: The pytree describing how to unflatten the output.
 
     Note:
         `self` will manage the passed `tsdfg` object. Modifying it results is undefined
-        behavior. Although `JaCeWrapped` is composable with Jax transformations
+        behavior. Although `JaCeWrapped` is composable with JAX transformations
         `JaCeLowered` is not.
     """
 
-    _translated_sdfg: jace.TranslatedJaxprSDFG
-    _outtree: jax_tree.PyTreeDef
+    _translated_sdfg: tjsdfg.TranslatedJaxprSDFG
+    _out_tree: jax_tree.PyTreeDef
 
     def __init__(
         self,
-        tsdfg: jace.TranslatedJaxprSDFG,
-        outtree: jax_tree.PyTreeDef,
+        tsdfg: tjsdfg.TranslatedJaxprSDFG,
+        out_tree: jax_tree.PyTreeDef,
     ) -> None:
         super().__init__()
         self._translated_sdfg = tsdfg
-        self._outtree = outtree
+        self._out_tree = out_tree
 
     @tcache.cached_transition
-    def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled[_RetrunType]:
+    def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled[_ReturnType]:
         """
         Optimize and compile the lowered SDFG using `compiler_options`.
 
@@ -251,15 +251,15 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
         """
         # We **must** deepcopy before we do any optimization, because all optimizations
         #  are in place, to properly cache stages, stages needs to be immutable.
-        tsdfg: jace.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
+        tsdfg: tjsdfg.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
         optimization.jace_optimize(tsdfg=tsdfg, **finalize_compilation_options(compiler_options))
 
         return JaCeCompiled(
-            csdfg=translated_jaxpr_sdfg.compile_jaxpr_sdfg(tsdfg),
-            outtree=self._outtree,
+            csdfg=tjsdfg.compile_jaxpr_sdfg(tsdfg),
+            out_tree=self._out_tree,
         )
 
-    def compiler_ir(self, dialect: str | None = None) -> jace.TranslatedJaxprSDFG:
+    def compiler_ir(self, dialect: str | None = None) -> tjsdfg.TranslatedJaxprSDFG:
         """
         Returns the internal SDFG.
 
@@ -279,7 +279,7 @@ def as_sdfg(self) -> dace.SDFG:
         return self.compiler_ir().sdfg
 
     def _make_call_description(
-        self, intree: jax_tree.PyTreeDef, flat_call_args: Sequence[Any]
+        self, in_tree: jax_tree.PyTreeDef, flat_call_args: Sequence[Any]
     ) -> tcache.StageTransformationSpec:
         """
         Creates the key for the `self.compile()` transition function.
@@ -287,17 +287,17 @@ def _make_call_description(
         The key will depend on the final values that were used for optimization, i.e.
         they it will also include the global set of optimization options.
         """
-        unflatted_args, unflatted_kwargs = jax_tree.tree_unflatten(intree, flat_call_args)
+        unflatted_args, unflatted_kwargs = jax_tree.tree_unflatten(in_tree, flat_call_args)
         assert (not unflatted_kwargs) and (len(unflatted_args) <= 1)
 
         options = finalize_compilation_options(unflatted_args[0] if unflatted_args else {})
-        flat_options, optiontree = jax_tree.tree_flatten(options)
+        flat_options, option_tree = jax_tree.tree_flatten(options)
         return tcache.StageTransformationSpec(
-            stage_id=id(self), flat_call_args=tuple(flat_options), intree=optiontree
+            stage_id=id(self), flat_call_args=tuple(flat_options), in_tree=option_tree
         )
 
 
-class JaCeCompiled(Generic[_RetrunType]):
+class JaCeCompiled(Generic[_ReturnType]):
     """
     Compiled version of the SDFG.
 
@@ -312,27 +312,27 @@ class JaCeCompiled(Generic[_RetrunType]):
         csdfg: The compiled SDFG object.
         inp_names: SDFG variables used as inputs.
         out_names: SDFG variables used as outputs.
-        outtree: Pytree describing how to unflatten the output.
+        out_tree: Pytree describing how to unflatten the output.
 
     Note:
         The class assumes ownership of its input arguments.
 
     Todo:
-        - Automatic strides adaption.
+        - Automatic strides adaptation.
     """
 
-    _csdfg: jace.CompiledJaxprSDFG
-    _outtree: jax_tree.PyTreeDef
+    _csdfg: tjsdfg.CompiledJaxprSDFG
+    _out_tree: jax_tree.PyTreeDef
 
     def __init__(
         self,
-        csdfg: jace.CompiledJaxprSDFG,
-        outtree: jax_tree.PyTreeDef,
+        csdfg: tjsdfg.CompiledJaxprSDFG,
+        out_tree: jax_tree.PyTreeDef,
     ) -> None:
         self._csdfg = csdfg
-        self._outtree = outtree
+        self._out_tree = out_tree
 
-    def __call__(self, *args: Any, **kwargs: Any) -> _RetrunType:
+    def __call__(self, *args: Any, **kwargs: Any) -> _ReturnType:
         """
         Calls the embedded computation.
 
@@ -346,7 +346,7 @@ def __call__(self, *args: Any, **kwargs: Any) -> _RetrunType:
         flat_output = self._csdfg(flat_call_args)
         if flat_output is None:
             return None  # type: ignore[return-value]  # Type confusion.
-        return jax_tree.tree_unflatten(self._outtree, flat_output)
+        return jax_tree.tree_unflatten(self._out_tree, flat_output)
 
 
 # <--------------------------- Compilation/Optimization options management
diff --git a/src/jace/tracing.py b/src/jace/tracing.py
index 29b7eda..71932e9 100644
--- a/src/jace/tracing.py
+++ b/src/jace/tracing.py
@@ -8,9 +8,9 @@
 """
 Implements the tracing machinery that is used to build the Jaxpr.
 
-Essentially, Jax provides `jax.make_jaxpr()` which is essentially a debug utility. Jax
-does not provide any public way to get a Jaxpr. This module provides the necessary
-functionality for use in JaCe.
+JAX provides `jax.make_jaxpr()`, which is essentially a debug utility, but it does not
+provide any other public way to get a Jaxpr. This module provides the necessary
+functionality for this in JaCe.
 """
 
 from __future__ import annotations
@@ -19,7 +19,7 @@
 from typing import TYPE_CHECKING, Any, Literal, ParamSpec, TypeVar, overload
 
 import jax
-from jax import tree_util as jax_tree
+from jax import core as jax_core, tree_util as jax_tree
 
 
 if TYPE_CHECKING:
@@ -28,56 +28,51 @@
     from jace import api
 
 _P = ParamSpec("_P")
-_RetrunType = TypeVar("_RetrunType")
+_ReturnType = TypeVar("_ReturnType")
 
 
 @overload
 def make_jaxpr(
-    fun: Callable[_P, _RetrunType],
-    trace_options: api.JitOptions,
-    return_outtree: Literal[True],
-) -> Callable[_P, tuple[jax.core.ClosedJaxpr, jax_tree.PyTreeDef]]: ...
+    fun: Callable[_P, _ReturnType],
+    trace_options: api.JITOptions,
+    return_out_tree: Literal[True],
+) -> Callable[_P, tuple[jax_core.ClosedJaxpr, jax_tree.PyTreeDef]]: ...
 
 
 @overload
 def make_jaxpr(
-    fun: Callable[_P, _RetrunType],
-    trace_options: api.JitOptions,
-    return_outtree: Literal[False] = False,
-) -> Callable[_P, jax.core.ClosedJaxpr]: ...
+    fun: Callable[_P, _ReturnType],
+    trace_options: api.JITOptions,
+    return_out_tree: Literal[False] = False,
+) -> Callable[_P, jax_core.ClosedJaxpr]: ...
 
 
 def make_jaxpr(
     fun: Callable[_P, Any],
-    trace_options: api.JitOptions,
-    return_outtree: bool = False,
-) -> (
-    Callable[_P, tuple[jax.core.ClosedJaxpr, jax_tree.PyTreeDef]]
-    | Callable[_P, jax.core.ClosedJaxpr]
-):
+    trace_options: api.JITOptions,
+    return_out_tree: bool = False,
+) -> Callable[_P, tuple[jax_core.ClosedJaxpr, jax_tree.PyTreeDef] | jax_core.ClosedJaxpr]:
     """
     JaCe's replacement for `jax.make_jaxpr()`.
 
-    Returns a callable object that produces as Jaxpr and optionally a pytree defining
+    Returns a callable object that produces a Jaxpr and optionally a pytree defining
     the output. By default the callable will only return the Jaxpr, however, by setting
-    `return_outtree` the function will also return the output tree, this is different
+    `return_out_tree` the function will also return the output tree, this is different
     from the `return_shape` of `jax.make_jaxpr()`.
 
     Currently the tracing is always performed with an enabled `x64` mode.
 
     Returns:
-        The function returns a callable, that if passed arguments will performs the
-        tracing on them, this section will describe the return value of that function.
-        If `return_outtree` is `False` the function will simply return the generated
-        Jaxpr. If `return_outtree` is `True` the function will return a pair.
-        The first element is the Jaxpr and the second element is a pytree object
-        that describes the output.
+        The function returns a callable that will perform the tracing on the passed
+        arguments. If `return_out_tree` is `False` that callable will simply return the
+        generated Jaxpr. If `return_out_tree` is `True` the function will return a tuple
+        with the Jaxpr and a pytree object describing the structure of the output.
 
     Args:
         fun: The original Python computation.
         trace_options: The options used for tracing, the same arguments that
             are supported by `jace.jit`.
-        return_outtree: Also return the pytree of the output.
+        return_out_tree: Also return the pytree of the output.
 
     Todo:
         - Handle default arguments of `fun`.
@@ -93,8 +88,8 @@ def make_jaxpr(
     def tracer_impl(
         *args: _P.args,
         **kwargs: _P.kwargs,
-    ) -> tuple[jax.core.ClosedJaxpr, jax_tree.PyTreeDef] | jax.core.ClosedJaxpr:
-        # In Jax `float32` is the main datatype, and they go to great lengths to avoid
+    ) -> tuple[jax_core.ClosedJaxpr, jax_tree.PyTreeDef] | jax_core.ClosedJaxpr:
+        # In JAX `float32` is the main datatype, and they go to great lengths to avoid
         #  some aggressive [type promotion](https://jax.readthedocs.io/en/latest/type_promotion.html).
         #  However, in this case we will have problems when we call the SDFG, for some
         #  reasons `CompiledSDFG` does not work in that case correctly, thus we enable
@@ -106,18 +101,18 @@ def tracer_impl(
                 **trace_options,
                 return_shape=True,
             )
-            jaxpr, outshapes = jaxpr_maker(
+            jaxpr, out_shapes = jaxpr_maker(
                 *args,
                 **kwargs,
             )
 
-        if not return_outtree:
+        if not return_out_tree:
             return jaxpr
 
         # Regardless what the documentation of `make_jaxpr` claims, it does not output
-        #  a pytree instead an abstract description of the shape, that we will
+        #  a pytree but an abstract description of the shape, that we will
         #  transform into a pytree.
-        outtree = jax_tree.tree_structure(outshapes)
-        return jaxpr, outtree
+        out_tree = jax_tree.tree_structure(out_shapes)
+        return jaxpr, out_tree
 
-    return tracer_impl  # type: ignore[return-value]  # Type confusion
+    return tracer_impl
diff --git a/src/jace/translated_jaxpr_sdfg.py b/src/jace/translated_jaxpr_sdfg.py
index bbab2be..46fc558 100644
--- a/src/jace/translated_jaxpr_sdfg.py
+++ b/src/jace/translated_jaxpr_sdfg.py
@@ -10,9 +10,8 @@
 from __future__ import annotations
 
 import dataclasses
-import os
 import pathlib
-import time
+import uuid
 from typing import TYPE_CHECKING, Any
 
 import dace
@@ -32,10 +31,10 @@
 @dataclasses.dataclass(frozen=True, kw_only=True)
 class TranslatedJaxprSDFG:
     """
-    Encapsulates a translated SDFG with additional the metadata.
+    Encapsulates the SDFG generated from a Jaxpr and additional metadata.
 
     Contrary to the SDFG that is encapsulated inside an `TranslationContext`
-    object, `self` carries a proper SDFG, however:
+    object, `self` carries a proper SDFG with the following structure:
     - It does not have `__return*` variables, instead all return arguments are
         passed by arguments.
     - All input arguments are passed through arguments mentioned in `inp_names`,
@@ -43,7 +42,7 @@ class TranslatedJaxprSDFG:
     - Only variables listed as in/outputs are non transient.
     - The order inside `inp_names` and `out_names` is the same as in the original Jaxpr.
     - If an input is used as outputs it appears in both `inp_names` and `out_names`.
-    - Its `arg_names` is set to  `inp_names + out_names`, but arguments that are
+    - Its `arg_names` is set to `inp_names + out_names`, but arguments that are
         input and outputs are only listed as inputs.
 
     The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a
@@ -91,6 +90,7 @@ def validate(self) -> bool:
         return True
 
 
+@dataclasses.dataclass(frozen=True, kw_only=True)
 class CompiledJaxprSDFG:
     """
     Compiled version of a `TranslatedJaxprSDFG` instance.
@@ -121,20 +121,12 @@ class CompiledJaxprSDFG:
     """
 
     csdfg: compiled_sdfg.CompiledSDFG
-    sdfg: dace.SDFG
     inp_names: tuple[str, ...]
     out_names: tuple[str, ...]
 
-    def __init__(
-        self,
-        csdfg: compiled_sdfg.CompiledSDFG,
-        inp_names: tuple[str, ...],
-        out_names: tuple[str, ...],
-    ) -> None:
-        self.csdfg = csdfg
-        self.sdfg = self.csdfg.sdfg
-        self.inp_names = inp_names
-        self.out_names = out_names
+    @property
+    def sdfg(self) -> dace.SDFG:  # noqa: D102 [undocumented-public-method]
+        return self.csdfg.sdfg
 
     def __call__(
         self,
@@ -151,23 +143,25 @@ def __call__(
             flat_call_args: Flattened input arguments.
         """
         if len(self.inp_names) != len(flat_call_args):
-            # Either error or static arguments are not removed.
-            raise RuntimeError("Wrong number of arguments.")
+            raise RuntimeError(
+                f"Expected {len(self.inp_names)} flattened arguments, but got {len(flat_call_args)}."
+            )
 
         sdfg_call_args: dict[str, Any] = {}
         for in_name, in_val in zip(self.inp_names, flat_call_args):
             # TODO(phimuell): Implement a stride matching process.
             if util.is_jax_array(in_val):
                 if not util.is_fully_addressable(in_val):
-                    raise ValueError(f"Passed a not fully addressable Jax array as '{in_name}'")
-                in_val = in_val.__array__()  # noqa: PLW2901  # Jax arrays do not expose the __array_interface__.
+                    raise ValueError(f"Passed a not fully addressable JAX array as '{in_name}'")
+                in_val = in_val.__array__()  # noqa: PLW2901 [redefined-loop-name]  # JAX arrays do not expose the __array_interface__.
             sdfg_call_args[in_name] = in_val
 
         arrays = self.sdfg.arrays
-        for out_name, sdfg_array in ((out_name, arrays[out_name]) for out_name in self.out_names):
+        for out_name in self.out_names:
+            sdfg_array = arrays[out_name]
             if out_name in sdfg_call_args:
                 if util.is_jax_array(sdfg_call_args[out_name]):
-                    raise ValueError("Passed an immutable Jax array as output.")
+                    raise ValueError("Passed an immutable JAX array as output.")
             else:
                 sdfg_call_args[out_name] = dace_data.make_array_from_descriptor(sdfg_array)
 
@@ -191,7 +185,7 @@ def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> CompiledJaxprSDFG:
     """Compile `tsdfg` and return a `CompiledJaxprSDFG` object with the result."""
     if any(  # We do not support the DaCe return mechanism
         array_name.startswith("__return")
-        for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118  # We can not use `in` because we are not interested in `my_mangled_variable__return_zulu`!
+        for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118 [in-dict-keys]  # We can not use `in` because we are not interested in `my_mangled_variable__return_zulu`!
     ):
         raise ValueError("Only support SDFGs without '__return' members.")
     if tsdfg.sdfg.free_symbols:  # This is a simplification that makes our life simple.
@@ -202,19 +196,20 @@ def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> CompiledJaxprSDFG:
     # To ensure that the SDFG is compiled and to get rid of a warning we must modify
     #  some settings of the SDFG. But we also have to fake an immutable SDFG
     sdfg = tsdfg.sdfg
-    org_sdfg_name = sdfg.name
-    org_recompile = sdfg._recompile
-    org_regenerate_code = sdfg._regenerate_code
+    original_sdfg_name = sdfg.name
+    original_recompile = sdfg._recompile
+    original_regenerate_code = sdfg._regenerate_code
 
     try:
         # We need to give the SDFG another name, this is needed to prevent a DaCe
         #  error/warning. This happens if we compile the same lowered SDFG multiple
         #  times with different options.
-        sdfg.name = f"{sdfg.name}__comp_{int(time.time() * 1000)}_{os.getpid()}"
-        assert len(sdfg.name) < 255  # noqa: PLR2004  # Not a magic number.
+        sdfg.name = f"{sdfg.name}__{uuid.uuid1()}"
+        assert len(sdfg.name) < 255  # noqa: PLR2004 magic-value-comparison  # 255 maximal file name size on UNIX.
 
         with dace.config.temporary_config():
             dace.Config.set("compiler", "use_cache", value=False)
+            # TODO(egparedes/phimuell): Add a configuration option.
             dace.Config.set("cache", value="name")
             dace.Config.set("default_build_folder", value=pathlib.Path(".jacecache").resolve())
             sdfg._recompile = True
@@ -222,8 +217,8 @@ def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> CompiledJaxprSDFG:
             csdfg: CompiledSDFG = sdfg.compile()
 
     finally:
-        sdfg.name = org_sdfg_name
-        sdfg._recompile = org_recompile
-        sdfg._regenerate_code = org_regenerate_code
+        sdfg.name = original_sdfg_name
+        sdfg._recompile = original_recompile
+        sdfg._regenerate_code = original_regenerate_code
 
     return CompiledJaxprSDFG(csdfg=csdfg, inp_names=tsdfg.inp_names, out_names=tsdfg.out_names)
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index deba4fe..73202b2 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -13,7 +13,7 @@
 from typing import TYPE_CHECKING, Any, Literal, cast, overload
 
 import dace
-from dace import data as ddata, properties as dprop
+from dace import data as dace_data, properties as dace_properties
 from jax import core as jax_core
 
 from jace import util
@@ -31,7 +31,7 @@ class JaxprTranslationBuilder:
     canonical. The main features of such an SDFG are:
     - the SDFG is a list of states,
     - it has a single source and sink state.
-    - all variable names are derived from Jax names,
+    - all variable names are derived from JAX names,
     - there are only transient variables inside the SDFG,
     - it lacks the special `__return` variable,
     - the `arg_names` parameter is not set,
@@ -81,7 +81,7 @@ def __init__(
         # Maps name of primitives to the associated translator.
         self._primitive_translators = {**primitive_translators}
 
-        # Maps Jax variables to the name of its SDFG equivalent.
+        # Maps JAX variables to the name of its SDFG equivalent.
         #  Shared between all translation contexts, to ensure consecutive variable
         #  naming as seen as in a pretty printed Jaxpr. Will be cleared by
         #  `_clear_translation_ctx()` at the end of the root translation.
@@ -129,7 +129,7 @@ def translate_jaxpr(
     def append_new_state(
         self,
         label: str | None = None,
-        condition: dprop.CodeBlock | None = None,
+        condition: dace_properties.CodeBlock | None = None,
         assignments: Mapping[str, Any] | None = None,
         prev_state: dace.SDFGState | None = None,
     ) -> dace.SDFGState:
@@ -176,7 +176,7 @@ def append_new_state(
         return new_state
 
     @property
-    def arrays(self) -> Mapping[str, ddata.Data]:
+    def arrays(self) -> Mapping[str, dace_data.Data]:
         """
         Get all data descriptors that are currently known to the SDFG.
 
@@ -184,14 +184,14 @@ def arrays(self) -> Mapping[str, ddata.Data]:
             Essentially a shorthand and preferred way for `self.sdfg.arrays`.
             For getting a specific data descriptor use `self.get_array()`.
         """
-        return cast(Mapping[str, ddata.Data], self._ctx.sdfg.arrays)
+        return cast(Mapping[str, dace_data.Data], self._ctx.sdfg.arrays)
 
-    def get_array(self, name: str | jax_core.Atom | util.JaCeVar) -> ddata.Data:
+    def get_array(self, name: str | jax_core.Atom | util.JaCeVar) -> dace_data.Data:
         """
         Returns the SDFG `Data` object `name` referees to.
 
         `name` can either be a string, in which case it is interpreted as a
-        verbatim SDFG name. If it is a Jax or JaCe variable, the function will
+        verbatim SDFG name. If it is a JAX or JaCe variable, the function will
         first perform a lookup using `self.map_jax_var_to_sdfg(name)`.
         """
         if isinstance(name, (jax_core.Var, util.JaCeVar)):
@@ -221,7 +221,7 @@ def map_jax_var_to_sdfg(
         Get the name of the SDFG variable to which `jax_var` is referring to.
 
         Args:
-            jax_var: The Jax variable to look up.
+            jax_var: The JAX variable to look up.
             allow_fail: Return `None` instead of raising a `KeyError`.
         """
         if isinstance(jax_var, jax_core.Literal):
@@ -231,10 +231,10 @@ def map_jax_var_to_sdfg(
         elif allow_fail:
             return None
         else:
-            raise KeyError(f"The Jax variable '{jax_var}' was never registered.")
+            raise KeyError(f"The JAX variable '{jax_var}' was never registered.")
         if sdfg_name not in self._ctx.sdfg.arrays:
             raise KeyError(
-                f"Jax variable '{jax_var}' was supposed to map to '{sdfg_name}',"
+                f"JAX variable '{jax_var}' was supposed to map to '{sdfg_name}',"
                 " but no such SDFG variable is known."
             )
         return sdfg_name
@@ -272,7 +272,7 @@ def add_jax_name_mapping(
         is not able to delete a variable mapping that was established before.
 
         Args:
-            jax_var: The Jax variable.
+            jax_var: The JAX variable.
             sdfg_name: The name of the corresponding SDFG variable.
         """
         if not sdfg_name:
@@ -298,7 +298,7 @@ def add_array(
         update_var_mapping: bool = False,
     ) -> str:
         """
-        Creates an SDFG variable for Jax variable `arg` and returns its SDFG name.
+        Creates an SDFG variable for JAX variable `arg` and returns its SDFG name.
 
         The SDFG object is always created as a transient. Furthermore, the
         function will not update the internal variable mapping, by default.
@@ -310,7 +310,7 @@ def add_array(
         should be used.
 
         Args:
-            arg: The Jax object for which a SDFG equivalent should be created.
+            arg: The JAX object for which a SDFG equivalent should be created.
             name_prefix: If given it will be used as prefix for the name.
             update_var_mapping: Update the internal variable mapping.
         """
@@ -391,9 +391,9 @@ def create_jax_var_list(  # type: ignore[misc]
         **kwargs: Any,
     ) -> list[None | str]:
         """
-        Create SDFG variables from the passed Jax variables.
+        Create SDFG variables from the passed JAX variables.
 
-        If a Jax variable already has a SDFG equivalent then the function will
+        If a JAX variable already has a SDFG equivalent then the function will
         use this variable. If no corresponding SDFG variable is known the function
         will create one using `add_array()`.
 
@@ -407,7 +407,7 @@ def create_jax_var_list(  # type: ignore[misc]
         to `True` literals will will be included in the output with the value `None`.
 
         Args:
-            jax_var_list: The list of Jax variables that should be processed.
+            jax_var_list: The list of JAX variables that should be processed.
             prevent_creation: Never create a variable, all must already be known.
             only_creation: Always create a variable.
             handle_literals: Allow the processing of literals.
@@ -653,7 +653,7 @@ def _handle_null_jaxpr(self, jaxpr: jax_core.ClosedJaxpr) -> list[str]:
             sdfg_in_name: str = self.map_jax_var_to_sdfg(jax_out_var)
 
             # Now we create a variable that serves as true output, however, since the
-            #  Jax variable is already known we can not update the variable mapping and
+            #  JAX variable is already known we can not update the variable mapping and
             #  must use another name.
             sdfg_out_name = self.add_array(
                 jax_out_var, name_prefix="_zero_equation_output_for_", update_var_mapping=False
diff --git a/src/jace/translator/pre_post_translation.py b/src/jace/translator/pre_post_translation.py
index c2a79cb..c5cc204 100644
--- a/src/jace/translator/pre_post_translation.py
+++ b/src/jace/translator/pre_post_translation.py
@@ -14,8 +14,7 @@
 
 import dace
 
-import jace
-from jace import util
+from jace import translated_jaxpr_sdfg as tjsdfg, util
 
 
 if TYPE_CHECKING:
@@ -26,10 +25,10 @@
 
 def postprocess_jaxpr_sdfg(
     trans_ctx: translator.TranslationContext,
-    fun: Callable,  # noqa: ARG001  # Currently unused
+    fun: Callable,  # noqa: ARG001 [unused-function-argument]  # Currently unused.
     flat_call_args: Sequence[Any],
     validate: bool = True,
-) -> jace.TranslatedJaxprSDFG:
+) -> tjsdfg.TranslatedJaxprSDFG:
     """
     Final post processing steps on the `TranslationContext`.
 
@@ -77,17 +76,17 @@ def _create_output_state(trans_ctx: translator.TranslationContext) -> None:
     The function will create a new terminal state, in which all outputs, denoted
     in `trans_ctx.out_names`, will be written into new SDFG variables. In case the
     output variable is a scalar, the output will be replaced by an array of length one.
-    This behaviour is consistent with Jax.
+    This behaviour is consistent with JAX.
 
     Args:
         trans_ctx: The translation context to process.
     """
     assert trans_ctx.inp_names is not None and trans_ctx.out_names is not None
 
-    # NOTE: Currently we do not support to write back into an input argument, as Jax.
+    # NOTE: Currently we do not support to write back into an input argument, as JAX.
     #  However, this is a requirement for handling ICON stencils, that we will support
     #  eventually. If we get a translation context that lists a variable name in the
-    #  inputs and outputs, this means that it was returned unmodified. In Jax this
+    #  inputs and outputs, this means that it was returned unmodified. In JAX this
     #  will lead to a copy and we also do it. This is implemented by just naïvely
     #  creating a separate output variable for every output we have, irrespectively
     #  of its name inside the Jaxpr.
@@ -205,7 +204,7 @@ def _create_input_state(
 def finalize_translation_context(
     trans_ctx: translator.TranslationContext,
     validate: bool = True,
-) -> jace.TranslatedJaxprSDFG:
+) -> tjsdfg.TranslatedJaxprSDFG:
     """
     Finalizes the supplied translation context `trans_ctx`.
 
@@ -231,7 +230,7 @@ def finalize_translation_context(
         raise ValueError("No input nor output.")
 
     # We guarantee decoupling
-    tsdfg = jace.TranslatedJaxprSDFG(
+    tsdfg = tjsdfg.TranslatedJaxprSDFG(
         sdfg=copy.deepcopy(trans_ctx.sdfg),
         inp_names=trans_ctx.inp_names,
         out_names=trans_ctx.out_names,
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index dffe2f6..5fa5e6c 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -43,7 +43,7 @@ def __call__(
         eqn_state: dace.SDFGState,
     ) -> dace.SDFGState | None:
         """
-        Translates the Jax primitive into its SDFG equivalent.
+        Translates the JAX primitive into its SDFG equivalent.
 
         Before the builder calls this function it will perform the following
         preparatory tasks:
@@ -82,7 +82,7 @@ def __call__(
                 SDFG for the inpts or `None` in case of a literal.
             out_var_names: List of the names of the arrays created inside the
                 SDFG for the outputs.
-            eqn: The Jax primitive that should be translated.
+            eqn: The JAX primitive that should be translated.
             eqn_state: State into which the primitive`s SDFG representation
                 should be constructed.
         """
@@ -92,7 +92,7 @@ def __call__(
 @runtime_checkable
 class PrimitiveTranslator(PrimitiveTranslatorCallable, Protocol):
     """
-    Interface for all Jax primitive translators.
+    Interface for all JAX primitive translators.
 
     A translator for a primitive translates a single equation of a Jaxpr into
     its SDFG equivalent. For satisfying this interface a concrete implementation
@@ -111,7 +111,7 @@ class PrimitiveTranslator(PrimitiveTranslatorCallable, Protocol):
     @property
     @abc.abstractmethod
     def primitive(self) -> str:
-        """Returns the name of the Jax primitive that `self` is able to handle."""
+        """Returns the name of the JAX primitive that `self` is able to handle."""
         ...
 
 
diff --git a/src/jace/translator/primitive_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
index d865ee8..436cebd 100644
--- a/src/jace/translator/primitive_translators/alu_translator.py
+++ b/src/jace/translator/primitive_translators/alu_translator.py
@@ -61,7 +61,7 @@ def __call__(
             builder:         The builder object of the translation.
             in_var_names:   List of the names of the arrays created inside the SDFG for the inpts or 'None' in case of a literal.
             out_var_names:  List of the names of the arrays created inside the SDFG for the outputs.
-            eqn:            The Jax equation that is translated.
+            eqn:            The JAX equation that is translated.
             eqn_state:      State into which the primitive's SDFG representation is constructed.
         """
         assert self._prim_name == eqn.primitive.name
@@ -101,7 +101,7 @@ def __call__(
         else:
             # This is the general broadcasting case
             #  We assume that both inputs and the output have the same rank but different sizes in each dimension.
-            #  It seems that Jax ensures this.
+            #  It seems that JAX ensures this.
             #  We further assume that if the size in a dimension differs then one must have size 1.
             #  This is the size we broadcast over, i.e. conceptually replicated.
             out_shps = tuple(util.get_jax_var_shape(eqn.outvars[0]))  # Shape of the output
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index c0997ba..c462798 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -6,9 +6,9 @@
 # SPDX-License-Identifier: BSD-3-Clause
 
 """
-Implements all utility functions that are related to Jax.
+Implements all utility functions that are related to JAX.
 
-Most of the functions defined here allow an unified access to Jax' internal in
+Most of the functions defined here allow an unified access to JAX' internal in
 a consistent and stable way.
 """
 
@@ -37,12 +37,12 @@ class JaCeVar:
 
     This class can be seen as some kind of substitute `jax.core.Var`. The main
     intention of this class is as an internal representation of values, as they
-    are used in Jax, but without the Jax machinery. As abstract values in Jax
+    are used in JAX, but without the JAX machinery. As abstract values in JAX
     this class has a datatype, which is a `dace.typeclass` instance and a shape.
     In addition it has an optional name, which allows to create variables with
     a certain name using `JaxprTranslationBuilder.add_array()`.
 
-    If it is expected that code must handle both Jax variables and `JaCeVar`
+    If it is expected that code must handle both JAX variables and `JaCeVar`
     then the `get_jax_var_*()` functions should be used.
 
     Args:
@@ -52,7 +52,7 @@ class JaCeVar:
 
     Note:
         If the name of a `JaCeVar` is '_' it is considered a drop variable. The
-        definitions of `__hash__` and `__eq__` are in accordance with how Jax
+        definitions of `__hash__` and `__eq__` are in accordance with how JAX
         variable works.
 
     Todo:
@@ -94,7 +94,7 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
             #  but leads to stable and valid names.
             return f"jax{jax_var.count}{jax_var.suffix}"
         case jax_core.Literal():
-            raise TypeError("Can not derive a name from a Jax Literal.")
+            raise TypeError("Can not derive a name from a JAX Literal.")
         case _:
             raise TypeError(
                 f"Does not know how to transform '{jax_var}' (type: '{type(jax_var).__name__}') "
@@ -133,23 +133,26 @@ def is_tracing_ongoing(*args: Any, **kwargs: Any) -> bool:
     While a return value `True` guarantees that a translation is ongoing, a
     value of `False` does not guarantees that no tracing is ongoing.
     """
-    # To detect if there is tracing ongoing, we check the internal tracing stack of Jax.
+    # To detect if there is tracing ongoing, we check the internal tracing stack of JAX.
     #  Note that this is highly internal and depends on the precise implementation of
-    #  Jax. For that reason we first look at all arguments and check if they are
-    #  tracers. Furthermore, it seems that Jax always have a bottom interpreter on the
+    #  JAX. For that reason we first look at all arguments and check if they are
+    #  tracers. Furthermore, it seems that JAX always have a bottom interpreter on the
     #  stack, thus it is empty if `len(...) == 1`!
     #  See also: https://github.com/google/jax/pull/3370
     if any(isinstance(x, jax_core.Tracer) for x in itertools.chain(args, kwargs.values())):
         return True
-    if len(jax._src.core.thread_local_state.trace_state.trace_stack.stack) == 1:
+    if (
+        trace_stack_length := (len(jax._src.core.thread_local_state.trace_state.trace_stack.stack))
+        == 1
+    ):
         return False
-    if len(jax._src.core.thread_local_state.trace_state.trace_stack.stack) > 1:
+    if trace_stack_length > 1:
         return True
     raise RuntimeError("Failed to determine if tracing is ongoing.")
 
 
 def translate_dtype(dtype: Any) -> dace.typeclass:
-    """Turns a Jax datatype into a DaCe datatype."""
+    """Turns a JAX datatype into a DaCe datatype."""
     if dtype is None:
         raise NotImplementedError  # Handling a special case in DaCe.
     if isinstance(dtype, dace.typeclass):
@@ -179,7 +182,7 @@ def propose_jax_name(
 
     Args:
         jax_var: The variable for which a name to propose.
-        jax_name_map: A mapping of all Jax variables that were already named.
+        jax_name_map: A mapping of all JAX variables that were already named.
 
     Note:
         The function guarantees that the returned name passes `VALID_SDFG_VAR_NAME`
@@ -195,7 +198,7 @@ def propose_jax_name(
     if isinstance(jax_var, JaCeVar) and (jax_var.name is not None):
         return jax_var.name
 
-    # This code is taken from Jax so it will generate similar ways, the difference is
+    # This code is taken from JAX so it will generate similar ways, the difference is
     #  that we do the counting differently.
     #  Note that `z` is followed by `ba` and not `aa` as it is in Excel.
     c = len(jax_name_map)
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index f99d013..07cec9a 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -30,17 +30,17 @@ def is_drop_var(jax_var: jax_core.Atom | util.JaCeVar) -> TypeGuard[jax_core.Dro
 
 def is_jax_array(obj: Any) -> TypeGuard[jax.Array]:
     """
-    Tests if `obj` is a Jax array.
+    Tests if `obj` is a JAX array.
 
     Note:
-     Jax arrays are special as they can not be mutated. Furthermore, they always
+     JAX arrays are special as they can not be mutated. Furthermore, they always
      allocate on the CPU _and_ on the GPU, if present.
     """
     return isinstance(obj, jax.Array)
 
 
 def is_array(obj: Any) -> TypeGuard[jax.typing.ArrayLike]:
-    """Identifies arrays, this also includes Jax arrays."""
+    """Identifies arrays, this also includes JAX arrays."""
     return dace.is_array(obj) or is_jax_array(obj)
 
 
@@ -107,7 +107,7 @@ def is_on_device(obj: Any) -> bool:
     """
     Tests if `obj` is on a device.
 
-    Jax arrays are always on the CPU and GPU (if there is one). Thus for Jax
+    JAX arrays are always on the CPU and GPU (if there is one). Thus for JAX
     arrays this function is more of a test, if there is a GPU at all.
     """
     if is_jax_array(obj):
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 9361733..264097e 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -65,7 +65,7 @@ def __init__(self) -> None:
 
     @abc.abstractmethod
     def _make_call_description(
-        self: CachingStage, intree: jax_tree.PyTreeDef, flat_call_args: Sequence[Any]
+        self: CachingStage, in_tree: jax_tree.PyTreeDef, flat_call_args: Sequence[Any]
     ) -> StageTransformationSpec:
         """
         Computes the key used to represent the call.
@@ -76,7 +76,7 @@ def _make_call_description(
         there for more information.
 
         Args:
-            intree: Pytree object describing how the input arguments were flattened.
+            in_tree: Pytree object describing how the input arguments were flattened.
             flat_call_args: The flattened arguments that were passed to the
                 annotated function.
         """
@@ -107,8 +107,8 @@ def cached_transition(
 
     @functools.wraps(transition)
     def transition_wrapper(self: CachingStageType, *args: P.args, **kwargs: P.kwargs) -> NextStage:
-        flat_call_args, intree = jax_tree.tree_flatten((args, kwargs))
-        key = self._make_call_description(flat_call_args=flat_call_args, intree=intree)
+        flat_call_args, in_tree = jax_tree.tree_flatten((args, kwargs))
+        key = self._make_call_description(flat_call_args=flat_call_args, in_tree=in_tree)
         if key not in self._cache:
             self._cache[key] = transition(self, *args, **kwargs)
         return self._cache[key]
@@ -137,7 +137,7 @@ class _AbstractCallArgument:
 
     As noted in `StageTransformationSpec` there are two ways to describe an
     argument, either by using its concrete value or an abstract description,
-    which is similar to tracers in Jax. This class represents the second way.
+    which is similar to tracers in JAX. This class represents the second way.
     To create an instance you should use `_AbstractCallArgument.from_value()`.
 
     Attributes:
@@ -162,7 +162,7 @@ def from_value(cls, value: Any) -> _AbstractCallArgument:
         if not util.is_fully_addressable(value):
             raise NotImplementedError("Distributed arrays are not addressed yet.")
         if isinstance(value, jax_core.Literal):
-            raise TypeError("Jax Literals are not supported as cache keys.")
+            raise TypeError("JAX Literals are not supported as cache keys.")
 
         if util.is_array(value):
             if util.is_jax_array(value):
@@ -204,7 +204,7 @@ class StageTransformationSpec:
     result is cached. They key to locate them inside the cache is represented
     by this class and computed by the `CachingStage._make_call_description()`
     function. The actual key is consists of three parts, `stage_id`, `call_args`
-    and `intree`, see below for more.
+    and `in_tree`, see below for more.
 
     Args:
         stage_id: Origin of the call, for which the id of the stage object should
@@ -213,16 +213,16 @@ class StageTransformationSpec:
             describes a single argument. To describe an argument there are two ways:
             - Abstract description: In this way, the actual value of the argument
                 is irrelevant, its structure is important, similar to the tracers
-                used in Jax. To represent it, use `_AbstractCallArgument`.
+                used in JAX. To represent it, use `_AbstractCallArgument`.
             - Concrete description: Here the actual value of the argument is
-                considered, this is similar to how static arguments in Jax works.
+                considered, this is similar to how static arguments in JAX works.
                 The only requirement is that they can be hashed.
-        intree: A pytree structure that describes how the input was flatten.
+        in_tree: A pytree structure that describes how the input was flatten.
     """
 
     stage_id: int
     flat_call_args: CallArgsSpec
-    intree: jax_tree.PyTreeDef
+    in_tree: jax_tree.PyTreeDef
 
 
 #: Denotes the stage that is stored inside the cache.
@@ -277,14 +277,14 @@ def popitem(self, key: StageTransformationSpec | None) -> None:
             self._memory.move_to_end(key, last=False)
             self._memory.popitem(last=False)
 
-    def clear(self) -> None:  # noqa: D102  # Missing description.
+    def clear(self) -> None:  # noqa: D102 [undocumented-public-method]
         self._memory.clear()
 
     def __len__(self) -> int:
         return len(self._memory)
 
     @property
-    def capacity(self) -> int:  # noqa: D102  # No docstring needed.
+    def capacity(self) -> int:  # noqa: D102 [undocumented-public-method]
         return self._capacity
 
     def front(self) -> tuple[StageTransformationSpec, StageType]:

From 4eb806fa68049c04cc42debfc62bd3ce66bcd43a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 21 Jun 2024 16:58:53 +0200
Subject: [PATCH 392/458] second batch of first review round.

---
 src/jace/api.py                               |  7 +--
 src/jace/optimization.py                      | 33 +++++-----
 src/jace/stages.py                            | 23 +++----
 src/jace/tracing.py                           |  3 +-
 src/jace/translated_jaxpr_sdfg.py             | 63 +++++++++----------
 .../translator/jaxpr_translator_builder.py    | 24 +++----
 ...ost_translation.py => post_translation.py} | 23 ++++---
 src/jace/translator/primitive_translator.py   | 18 ++++--
 .../primitive_translators/alu_translator.py   | 25 ++++----
 src/jace/util/jax_helper.py                   |  7 +--
 src/jace/util/translation_cache.py            | 32 +++++-----
 tests/test_caching.py                         |  7 ++-
 12 files changed, 134 insertions(+), 131 deletions(-)
 rename src/jace/translator/{pre_post_translation.py => post_translation.py} (93%)

diff --git a/src/jace/api.py b/src/jace/api.py
index 3d6facd..18a81e6 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -10,7 +10,8 @@
 from __future__ import annotations
 
 import functools
-from typing import TYPE_CHECKING, Literal, ParamSpec, TypedDict, TypeVar, overload
+from collections.abc import Callable, Mapping
+from typing import Literal, ParamSpec, TypedDict, TypeVar, overload
 
 from jax import grad, jacfwd, jacrev
 from typing_extensions import Unpack
@@ -18,10 +19,6 @@
 from jace import stages, translator
 
 
-if TYPE_CHECKING:
-    from collections.abc import Callable, Mapping
-
-
 __all__ = ["JITOptions", "grad", "jacfwd", "jacrev", "jit"]
 
 # Used for type annotation, see the notes in `jace.stages` for more.
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index 33a94b8..65e97b4 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -5,7 +5,12 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""JaCe specific optimizations."""
+"""
+JaCe specific optimizations.
+
+Todo:
+    Organize this module once it is a package.
+"""
 
 from __future__ import annotations
 
@@ -18,6 +23,19 @@
     from jace import translated_jaxpr_sdfg as tjsdfg
 
 
+DEFAULT_OPTIMIZATIONS: Final[CompilerOptions] = {
+    "auto_optimize": True,
+    "simplify": True,
+    "persistent_transients": True,
+}
+
+NO_OPTIMIZATIONS: Final[CompilerOptions] = {
+    "auto_optimize": False,
+    "simplify": False,
+    "persistent_transients": False,
+}
+
+
 class CompilerOptions(TypedDict, total=False):
     """
     All known compiler options to `JaCeLowered.compile()`.
@@ -34,19 +52,6 @@ class CompilerOptions(TypedDict, total=False):
     persistent_transients: bool
 
 
-DEFAULT_OPTIMIZATIONS: Final[CompilerOptions] = {
-    "auto_optimize": True,
-    "simplify": True,
-    "persistent_transients": True,
-}
-
-NO_OPTIMIZATIONS: Final[CompilerOptions] = {
-    "auto_optimize": False,
-    "simplify": False,
-    "persistent_transients": False,
-}
-
-
 def jace_optimize(tsdfg: tjsdfg.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOptions]) -> None:  # noqa: D417 [undocumented-param]
     """
     Performs optimization of the translated SDFG _in place_.
diff --git a/src/jace/stages.py b/src/jace/stages.py
index e527dd8..327017c 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -29,19 +29,18 @@
 
 import copy
 import inspect
+from collections.abc import Callable, Mapping, Sequence
 from typing import TYPE_CHECKING, Any, Generic, ParamSpec, TypeVar, Union
 
 from jax import tree_util as jax_tree
 
 from jace import api, optimization, tracing, translated_jaxpr_sdfg as tjsdfg, translator, util
 from jace.optimization import CompilerOptions
-from jace.translator import pre_post_translation as pptrans
+from jace.translator import post_translation as ptrans
 from jace.util import translation_cache as tcache
 
 
 if TYPE_CHECKING:
-    from collections.abc import Callable, Mapping, Sequence
-
     import dace
 
 __all__ = [
@@ -169,7 +168,7 @@ def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered[_ReturnType]
         trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
 
         flat_call_args = jax_tree.tree_leaves((args, kwargs))
-        tsdfg: tjsdfg.TranslatedJaxprSDFG = pptrans.postprocess_jaxpr_sdfg(
+        tsdfg: tjsdfg.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
             trans_ctx=trans_ctx,
             fun=self.wrapped_fun,
             flat_call_args=flat_call_args,
@@ -255,7 +254,7 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
         optimization.jace_optimize(tsdfg=tsdfg, **finalize_compilation_options(compiler_options))
 
         return JaCeCompiled(
-            csdfg=tjsdfg.compile_jaxpr_sdfg(tsdfg),
+            compiled_sdfg=tjsdfg.compile_jaxpr_sdfg(tsdfg),
             out_tree=self._out_tree,
         )
 
@@ -309,8 +308,8 @@ class JaCeCompiled(Generic[_ReturnType]):
     called with compatible arguments.
 
     Args:
-        csdfg: The compiled SDFG object.
-        inp_names: SDFG variables used as inputs.
+        compiled_sdfg: The compiled SDFG object.
+        input_names: SDFG variables used as inputs.
         out_names: SDFG variables used as outputs.
         out_tree: Pytree describing how to unflatten the output.
 
@@ -321,15 +320,15 @@ class JaCeCompiled(Generic[_ReturnType]):
         - Automatic strides adaptation.
     """
 
-    _csdfg: tjsdfg.CompiledJaxprSDFG
+    _compiled_sdfg: tjsdfg.CompiledJaxprSDFG
     _out_tree: jax_tree.PyTreeDef
 
     def __init__(
         self,
-        csdfg: tjsdfg.CompiledJaxprSDFG,
+        compiled_sdfg: tjsdfg.CompiledJaxprSDFG,
         out_tree: jax_tree.PyTreeDef,
     ) -> None:
-        self._csdfg = csdfg
+        self._compiled_sdfg = compiled_sdfg
         self._out_tree = out_tree
 
     def __call__(self, *args: Any, **kwargs: Any) -> _ReturnType:
@@ -343,9 +342,7 @@ def __call__(self, *args: Any, **kwargs: Any) -> _ReturnType:
             compatible with the ones that were used for lowering.
         """
         flat_call_args = jax_tree.tree_leaves((args, kwargs))
-        flat_output = self._csdfg(flat_call_args)
-        if flat_output is None:
-            return None  # type: ignore[return-value]  # Type confusion.
+        flat_output = self._compiled_sdfg(flat_call_args)
         return jax_tree.tree_unflatten(self._out_tree, flat_output)
 
 
diff --git a/src/jace/tracing.py b/src/jace/tracing.py
index 71932e9..c28101d 100644
--- a/src/jace/tracing.py
+++ b/src/jace/tracing.py
@@ -16,6 +16,7 @@
 from __future__ import annotations
 
 import inspect
+from collections.abc import Callable
 from typing import TYPE_CHECKING, Any, Literal, ParamSpec, TypeVar, overload
 
 import jax
@@ -23,8 +24,6 @@
 
 
 if TYPE_CHECKING:
-    from collections.abc import Callable
-
     from jace import api
 
 _P = ParamSpec("_P")
diff --git a/src/jace/translated_jaxpr_sdfg.py b/src/jace/translated_jaxpr_sdfg.py
index 46fc558..5ad00c6 100644
--- a/src/jace/translated_jaxpr_sdfg.py
+++ b/src/jace/translated_jaxpr_sdfg.py
@@ -12,6 +12,7 @@
 import dataclasses
 import pathlib
 import uuid
+from collections.abc import Sequence
 from typing import TYPE_CHECKING, Any
 
 import dace
@@ -21,8 +22,6 @@
 
 
 if TYPE_CHECKING:
-    from collections.abc import Sequence
-
     import numpy as np
     from dace.codegen import compiled_sdfg
     from dace.codegen.compiled_sdfg import CompiledSDFG
@@ -37,12 +36,12 @@ class TranslatedJaxprSDFG:
     object, `self` carries a proper SDFG with the following structure:
     - It does not have `__return*` variables, instead all return arguments are
         passed by arguments.
-    - All input arguments are passed through arguments mentioned in `inp_names`,
+    - All input arguments are passed through arguments mentioned in `input_names`,
         while the outputs are passed through `out_names`.
     - Only variables listed as in/outputs are non transient.
-    - The order inside `inp_names` and `out_names` is the same as in the original Jaxpr.
-    - If an input is used as outputs it appears in both `inp_names` and `out_names`.
-    - Its `arg_names` is set to `inp_names + out_names`, but arguments that are
+    - The order of `input_names` and `out_names` is the same as in the original Jaxpr.
+    - If an input is used as outputs it appears in both `input_names` and `out_names`.
+    - Its `arg_names` is set to `input_names + out_names`, but arguments that are
         input and outputs are only listed as inputs.
 
     The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a
@@ -53,7 +52,7 @@ class TranslatedJaxprSDFG:
 
     Attributes:
         sdfg: The encapsulated SDFG object.
-        inp_names: SDFG variables used as inputs.
+        input_names: SDFG variables used as inputs.
         out_names: SDFG variables used as outputs.
 
     Todo:
@@ -63,14 +62,14 @@ class TranslatedJaxprSDFG:
     """
 
     sdfg: dace.SDFG
-    inp_names: tuple[str, ...]
+    input_names: tuple[str, ...]
     out_names: tuple[str, ...]
 
     def validate(self) -> bool:
         """Validate the underlying SDFG."""
-        if any(self.sdfg.arrays[inp].transient for inp in self.inp_names):
+        if any(self.sdfg.arrays[inp].transient for inp in self.input_names):
             raise dace.sdfg.InvalidSDFGError(
-                f"Found transient inputs: {(inp for inp in self.inp_names if self.sdfg.arrays[inp].transient)}",
+                f"Found transient inputs: {(inp for inp in self.input_names if self.sdfg.arrays[inp].transient)}",
                 self.sdfg,
                 self.sdfg.node_id(self.sdfg.start_state),
             )
@@ -101,14 +100,14 @@ class CompiledJaxprSDFG:
     `compile_jaxpr_sdfg()`.
 
     Args:
-        csdfg: The `CompiledSDFG` object.
-        inp_names: Names of the SDFG variables used as inputs.
+        compiled_sdfg: The `CompiledSDFG` object.
+        input_names: Names of the SDFG variables used as inputs.
         out_names: Names of the SDFG variables used as outputs.
 
     Attributes:
-        csdfg: The `CompiledSDFG` object.
+        compiled_sdfg: The `CompiledSDFG` object.
         sdfg: The encapsulated SDFG object.
-        inp_names: Names of the SDFG variables used as inputs.
+        input_names: Names of the SDFG variables used as inputs.
         out_names: Names of the SDFG variables used as outputs.
 
     Notes:
@@ -120,18 +119,18 @@ class CompiledJaxprSDFG:
         arrays of length one.
     """
 
-    csdfg: compiled_sdfg.CompiledSDFG
-    inp_names: tuple[str, ...]
+    compiled_sdfg: compiled_sdfg.CompiledSDFG
+    input_names: tuple[str, ...]
     out_names: tuple[str, ...]
 
     @property
     def sdfg(self) -> dace.SDFG:  # noqa: D102 [undocumented-public-method]
-        return self.csdfg.sdfg
+        return self.compiled_sdfg.sdfg
 
     def __call__(
         self,
         flat_call_args: Sequence[Any],
-    ) -> list[np.ndarray] | None:
+    ) -> list[np.ndarray]:
         """
         Run the compiled SDFG using the flattened input.
 
@@ -139,16 +138,16 @@ def __call__(
         the output.
 
         Args:
-            csdfg: The compiled SDFG to call.
+            compiled_sdfg: The compiled SDFG to call.
             flat_call_args: Flattened input arguments.
         """
-        if len(self.inp_names) != len(flat_call_args):
+        if len(self.input_names) != len(flat_call_args):
             raise RuntimeError(
-                f"Expected {len(self.inp_names)} flattened arguments, but got {len(flat_call_args)}."
+                f"Expected {len(self.input_names)} flattened arguments, but got {len(flat_call_args)}."
             )
 
         sdfg_call_args: dict[str, Any] = {}
-        for in_name, in_val in zip(self.inp_names, flat_call_args):
+        for in_name, in_val in zip(self.input_names, flat_call_args):
             # TODO(phimuell): Implement a stride matching process.
             if util.is_jax_array(in_val):
                 if not util.is_fully_addressable(in_val):
@@ -165,20 +164,18 @@ def __call__(
             else:
                 sdfg_call_args[out_name] = dace_data.make_array_from_descriptor(sdfg_array)
 
-        assert len(sdfg_call_args) == len(self.csdfg.argnames), (
+        assert len(sdfg_call_args) == len(self.compiled_sdfg.argnames), (
             "Failed to construct the call arguments,"
-            f" expected {len(self.csdfg.argnames)} but got {len(flat_call_args)}."
-            f"\nExpected: {self.csdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
+            f" expected {len(self.compiled_sdfg.argnames)} but got {len(flat_call_args)}."
+            f"\nExpected: {self.compiled_sdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
         )
 
         # Calling the SDFG
         with dace.config.temporary_config():
             dace.Config.set("compiler", "allow_view_arguments", value=True)
-            self.csdfg(**sdfg_call_args)
+            self.compiled_sdfg(**sdfg_call_args)
 
-        if self.out_names:
-            return [sdfg_call_args[out_name] for out_name in self.out_names]
-        return None
+        return [sdfg_call_args[out_name] for out_name in self.out_names]
 
 
 def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> CompiledJaxprSDFG:
@@ -190,7 +187,7 @@ def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> CompiledJaxprSDFG:
         raise ValueError("Only support SDFGs without '__return' members.")
     if tsdfg.sdfg.free_symbols:  # This is a simplification that makes our life simple.
         raise NotImplementedError(f"No free symbols allowed, found: {tsdfg.sdfg.free_symbols}")
-    if not (tsdfg.out_names or tsdfg.inp_names):
+    if not (tsdfg.out_names or tsdfg.input_names):
         raise ValueError("No input nor output.")
 
     # To ensure that the SDFG is compiled and to get rid of a warning we must modify
@@ -214,11 +211,13 @@ def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> CompiledJaxprSDFG:
             dace.Config.set("default_build_folder", value=pathlib.Path(".jacecache").resolve())
             sdfg._recompile = True
             sdfg._regenerate_code = True
-            csdfg: CompiledSDFG = sdfg.compile()
+            compiled_sdfg: CompiledSDFG = sdfg.compile()
 
     finally:
         sdfg.name = original_sdfg_name
         sdfg._recompile = original_recompile
         sdfg._regenerate_code = original_regenerate_code
 
-    return CompiledJaxprSDFG(csdfg=csdfg, inp_names=tsdfg.inp_names, out_names=tsdfg.out_names)
+    return CompiledJaxprSDFG(
+        compiled_sdfg=compiled_sdfg, input_names=tsdfg.input_names, out_names=tsdfg.out_names
+    )
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 73202b2..7ef6d06 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -444,9 +444,9 @@ def _create_initial_input(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         Creates the input variables of `jaxpr`.
 
         Notes:
-            The function will populate the `inp_names` member of the current context.
+            The function will populate the `input_names` member of the current context.
         """
-        assert self._ctx.inp_names is None
+        assert self._ctx.input_names is None
 
         # Handle the initial input arguments
         init_in_var_names: Sequence[str] = self.create_jax_var_list(
@@ -458,7 +458,7 @@ def _create_initial_input(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         self.sdfg.arg_names = []
 
         # The output list is populated by `self._translate_jaxpr_internal()`
-        self._ctx.inp_names = tuple(init_in_var_names)
+        self._ctx.input_names = tuple(init_in_var_names)
 
     def _create_constants(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         """
@@ -634,7 +634,7 @@ def _handle_null_jaxpr(self, jaxpr: jax_core.ClosedJaxpr) -> list[str]:
             The function will _not_ update the `out_names` field of the current context.
         """
         assert self._ctx.terminal_state is self._ctx.start_state
-        assert isinstance(self._ctx.inp_names, tuple)
+        assert isinstance(self._ctx.input_names, tuple)
         assert self._ctx.out_names is None
 
         # There is not output so we do not have to copy anything around.
@@ -662,10 +662,10 @@ def _handle_null_jaxpr(self, jaxpr: jax_core.ClosedJaxpr) -> list[str]:
 
             # Now we perform the copy from the input variable in the newly created
             #  output variable.
-            inp_acc = self._start_state.add_read(sdfg_in_name)
+            input_acc = self._start_state.add_read(sdfg_in_name)
             out_acc = self._start_state.add_write(sdfg_out_name)
             self._start_state.add_nedge(
-                src=inp_acc,
+                src=input_acc,
                 dst=out_acc,
                 data=dace.Memlet.from_array(sdfg_in_name, self.get_array(sdfg_in_name)),
             )
@@ -703,7 +703,7 @@ class TranslationContext:
 
     Attributes:
         sdfg: The encapsulated SDFG object.
-        inp_names: A list of the SDFG variables that are used as input
+        input_names: A list of the SDFG variables that are used as input
         out_names: A list of the SDFG variables that are used as output.
         start_state: The first state in the SDFG state machine.
         terminal_state: The (currently) last state in the state machine.
@@ -718,7 +718,7 @@ class TranslationContext:
     """
 
     sdfg: dace.SDFG
-    inp_names: tuple[str, ...] | None
+    input_names: tuple[str, ...] | None
     out_names: tuple[str, ...] | None
     start_state: dace.SDFGState
     terminal_state: dace.SDFGState
@@ -729,7 +729,7 @@ def __init__(self, name: str | None, jaxpr: jax_core.ClosedJaxpr) -> None:
             raise ValueError(f"'{name}' is not a valid SDFG name.")
 
         self.sdfg = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
-        self.inp_names = None
+        self.input_names = None
         self.out_names = None
         self.start_state = self.sdfg.add_state(label="initial_state", is_start_block=True)
         self.terminal_state = self.start_state
@@ -757,11 +757,11 @@ def validate(self) -> bool:
                 self.sdfg.node_id(self.terminal_state),
             )
         if not (
-            self.inp_names is None
-            or all(inp_name in self.sdfg.arrays for inp_name in self.inp_names)
+            self.input_names is None
+            or all(input_name in self.sdfg.arrays for input_name in self.input_names)
         ):
             raise dace.sdfg.InvalidSDFGError(
-                f"Missing input arguments: {(inp_name for inp_name in self.inp_names if inp_name not in self.sdfg.arrays)}",
+                f"Missing input arguments: {(input_name for input_name in self.input_names if input_name not in self.sdfg.arrays)}",
                 self.sdfg,
                 self.sdfg.node_id(self.terminal_state),
             )
diff --git a/src/jace/translator/pre_post_translation.py b/src/jace/translator/post_translation.py
similarity index 93%
rename from src/jace/translator/pre_post_translation.py
rename to src/jace/translator/post_translation.py
index c5cc204..8242060 100644
--- a/src/jace/translator/pre_post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -10,6 +10,7 @@
 from __future__ import annotations
 
 import copy
+from collections.abc import Callable, Sequence
 from typing import TYPE_CHECKING, Any
 
 import dace
@@ -18,8 +19,6 @@
 
 
 if TYPE_CHECKING:
-    from collections.abc import Callable, Sequence
-
     from jace import translator
 
 
@@ -81,7 +80,7 @@ def _create_output_state(trans_ctx: translator.TranslationContext) -> None:
     Args:
         trans_ctx: The translation context to process.
     """
-    assert trans_ctx.inp_names is not None and trans_ctx.out_names is not None
+    assert trans_ctx.input_names is not None and trans_ctx.out_names is not None
 
     # NOTE: Currently we do not support to write back into an input argument, as JAX.
     #  However, this is a requirement for handling ICON stencils, that we will support
@@ -149,21 +148,21 @@ def _create_input_state(
     Todo:
         Handle transfer of scalar input in GPU mode.
     """
-    assert trans_ctx.inp_names is not None and trans_ctx.out_names is not None
+    assert trans_ctx.input_names is not None and trans_ctx.out_names is not None
 
     # NOTE: This function will create a distinct variable for every input. Once we
     #  allow write back arguments they will be handled in the `_create_output_state()`
     #  function anyway, also see the comment in that function.
 
-    if len(flat_call_args) != len(trans_ctx.inp_names):
-        raise ValueError(f"Expected {len(trans_ctx.inp_names)}, but got {len(flat_call_args)}.")
+    if len(flat_call_args) != len(trans_ctx.input_names):
+        raise ValueError(f"Expected {len(trans_ctx.input_names)}, but got {len(flat_call_args)}.")
 
     sdfg = trans_ctx.sdfg
     new_input_state: dace.SDFGState = sdfg.add_state(f"{sdfg.name}__start_state")
     new_input_names: list[str] = []
     input_pattern = "__jace_input_{}"
 
-    for i, (org_input_name, call_arg) in enumerate(zip(trans_ctx.inp_names, flat_call_args)):
+    for i, (org_input_name, call_arg) in enumerate(zip(trans_ctx.input_names, flat_call_args)):
         org_input_desc: dace.data.Data = sdfg.arrays[org_input_name]
         new_input_name = input_pattern.format(i)
 
@@ -198,7 +197,7 @@ def _create_input_state(
     sdfg.add_edge(new_input_state, trans_ctx.start_state, dace.InterstateEdge())
     sdfg.start_block = sdfg.node_id(new_input_state)
     trans_ctx.start_state = new_input_state
-    trans_ctx.inp_names = tuple(new_input_names)
+    trans_ctx.input_names = tuple(new_input_names)
 
 
 def finalize_translation_context(
@@ -222,23 +221,23 @@ def finalize_translation_context(
         validate: Call the validate function after the finalizing.
     """
     trans_ctx.validate()
-    if trans_ctx.inp_names is None:
+    if trans_ctx.input_names is None:
         raise ValueError("Input names are not specified.")
     if trans_ctx.out_names is None:
         raise ValueError("Output names are not specified.")
-    if not (trans_ctx.out_names or trans_ctx.inp_names):
+    if not (trans_ctx.out_names or trans_ctx.input_names):
         raise ValueError("No input nor output.")
 
     # We guarantee decoupling
     tsdfg = tjsdfg.TranslatedJaxprSDFG(
         sdfg=copy.deepcopy(trans_ctx.sdfg),
-        inp_names=trans_ctx.inp_names,
+        input_names=trans_ctx.input_names,
         out_names=trans_ctx.out_names,
     )
 
     # Make inputs and outputs to globals.
     sdfg_arg_names: list[str] = []
-    for arg_name in tsdfg.inp_names + tsdfg.out_names:
+    for arg_name in tsdfg.input_names + tsdfg.out_names:
         if arg_name in sdfg_arg_names:
             continue
         tsdfg.sdfg.arrays[arg_name].transient = False
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index 5fa5e6c..bcc0b8b 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -14,21 +14,16 @@
 from __future__ import annotations
 
 import abc
+from collections.abc import Callable, Sequence
 from typing import TYPE_CHECKING, Literal, Protocol, cast, overload, runtime_checkable
 
 
 if TYPE_CHECKING:
-    from collections.abc import Callable, Sequence
-
     import dace
     from jax import core as jax_core
 
     from jace import translator
 
-#: Global registry of the active primitive translators.
-#:  The `dict` maps the name of a primitive to its associated translators.
-_PRIMITIVE_TRANSLATORS_REGISTRY: dict[str, translator.PrimitiveTranslator] = {}
-
 
 class PrimitiveTranslatorCallable(Protocol):
     """Callable version of the primitive translators."""
@@ -158,6 +153,17 @@ def wrapper(
     return wrapper if primitive_translator is None else wrapper(primitive_translator)
 
 
+# <--------------------------- Managing translators
+
+
+_PRIMITIVE_TRANSLATORS_REGISTRY: dict[str, translator.PrimitiveTranslator] = {}
+"""Global registry of the active primitive translators.
+
+Use `register_primitive_translator()` to add a translator to the registry and
+`get_registered_primitive_translators()` get the current active set.
+"""
+
+
 @overload
 def register_primitive_translator(
     primitive_translator: Literal[None] = None, overwrite: bool = False
diff --git a/src/jace/translator/primitive_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
index 436cebd..f217924 100644
--- a/src/jace/translator/primitive_translators/alu_translator.py
+++ b/src/jace/translator/primitive_translators/alu_translator.py
@@ -10,7 +10,8 @@
 
 from __future__ import annotations
 
-from typing import TYPE_CHECKING, Any, Final, cast
+from collections.abc import Sequence
+from typing import Any, Final, cast
 
 import dace
 import numpy as np
@@ -20,10 +21,6 @@
 from jace import translator, util
 
 
-if TYPE_CHECKING:
-    from collections.abc import Sequence
-
-
 class ALUTranslator(translator.PrimitiveTranslator):
     """
     This translator handles all arithmetic and logical operations.
@@ -68,8 +65,8 @@ def __call__(
 
         # Determine what kind of input we got and how we should proceed.
         is_scalar = len(util.get_jax_var_shape(eqn.outvars[0])) == 0
-        inp_scalars = [len(util.get_jax_var_shape(Inp)) == 0 for i, Inp in enumerate(eqn.invars)]
-        has_scalars_as_inputs = any(inp_scalars)
+        input_scalars = [len(util.get_jax_var_shape(Inp)) == 0 for i, Inp in enumerate(eqn.invars)]
+        has_scalars_as_inputs = any(input_scalars)
         has_some_literals = any(x is None for x in in_var_names)
         inps_same_shape = all(
             util.get_jax_var_shape(eqn.invars[0]) == util.get_jax_var_shape(eqn.invars[i])
@@ -105,15 +102,19 @@ def __call__(
             #  We further assume that if the size in a dimension differs then one must have size 1.
             #  This is the size we broadcast over, i.e. conceptually replicated.
             out_shps = tuple(util.get_jax_var_shape(eqn.outvars[0]))  # Shape of the output
-            inp_shpl = tuple(util.get_jax_var_shape(eqn.invars[0]))  # Shape of the left/first input
-            inp_shpr = tuple(
+            input_shpl = tuple(
+                util.get_jax_var_shape(eqn.invars[0])
+            )  # Shape of the left/first input
+            input_shpr = tuple(
                 util.get_jax_var_shape(eqn.invars[1])
             )  # Shape of the right/second input
 
-            if not ((len(inp_shpl) == len(inp_shpr)) and (len(out_shps) == len(inp_shpr))):
+            if not ((len(input_shpl) == len(input_shpr)) and (len(out_shps) == len(input_shpr))):
                 raise NotImplementedError("Can not broadcast over different ranks.")
 
-            for dim, (shp_lft, shp_rgt, out_shp) in enumerate(zip(inp_shpl, inp_shpr, out_shps)):
+            for dim, (shp_lft, shp_rgt, out_shp) in enumerate(
+                zip(input_shpl, input_shpr, out_shps)
+            ):
                 if shp_lft == shp_rgt:
                     assert out_shp == shp_lft
                 elif shp_lft == 1:
@@ -139,7 +140,7 @@ def __call__(
             if in_var_names[i] is None:  # Literal: No input needed.
                 tskl_inputs.append((None, None))
                 continue
-            if inp_scalars[i]:  # Scalar
+            if input_scalars[i]:  # Scalar
                 assert len(dims_to_bcast) == 0
                 i_memlet = dace.Memlet.simple(in_var_names[i], "0")
             else:  # Array: We may have to broadcast
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index c462798..71d3660 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -16,7 +16,8 @@
 
 import dataclasses
 import itertools
-from typing import TYPE_CHECKING, Any
+from collections.abc import Mapping
+from typing import Any
 
 import dace
 import jax
@@ -26,10 +27,6 @@
 from jace import util
 
 
-if TYPE_CHECKING:
-    from collections.abc import Mapping
-
-
 @dataclasses.dataclass(repr=True, frozen=True, eq=False)
 class JaCeVar:
     """
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index 264097e..cbec1ba 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -33,14 +33,21 @@
 if TYPE_CHECKING:
     from jace import stages
 
-#: Caches used to store the state transition.
-#: The caches are on a per stage and not per instant basis.
 _TRANSLATION_CACHES: dict[type[CachingStage], StageCache] = {}
+"""Caches used to store the state transition.
+
+The caches are on a per stage and not per instant basis.
+"""
 
 
-# Denotes the stage that follows the current one.
-#  Used by the `CachingStage` mixin.
+# Type annotation for the caching.
+P = ParamSpec("P")
 NextStage = TypeVar("NextStage", bound="stages.Stage")
+TransitionFunction: TypeAlias = "Callable[Concatenate[CachingStage[NextStage], P], NextStage]"
+CachingStageType = TypeVar("CachingStageType", bound="CachingStage")
+
+# Type to describe a single argument either in an abstract or concrete way.
+CallArgsSpec: TypeAlias = tuple["_AbstractCallArgument | Hashable"]
 
 
 class CachingStage(Generic[NextStage]):
@@ -83,12 +90,6 @@ def _make_call_description(
         ...
 
 
-# Type annotation for the caching.
-P = ParamSpec("P")
-TransitionFunction = Callable[Concatenate[CachingStage[NextStage], P], NextStage]
-CachingStageType = TypeVar("CachingStageType", bound=CachingStage)
-
-
 def cached_transition(
     transition: Callable[Concatenate[CachingStageType, P], NextStage],
 ) -> Callable[Concatenate[CachingStage[NextStage], P], NextStage]:
@@ -191,10 +192,6 @@ def from_value(cls, value: Any) -> _AbstractCallArgument:
         raise TypeError(f"Can not make 'an abstract description from '{type(value).__name__}'.")
 
 
-#: Type to describe a single argument either in an abstract or concrete way.
-CallArgsSpec: TypeAlias = tuple[_AbstractCallArgument | Hashable]
-
-
 @dataclasses.dataclass(frozen=True)
 class StageTransformationSpec:
     """
@@ -241,9 +238,12 @@ class StageCache(Generic[StageType]):
     _memory: collections.OrderedDict[StageTransformationSpec, StageType]
     _capacity: int
 
-    def __init__(self, capachity: int = 256) -> None:
+    def __init__(
+        self,
+        capacity: int = 256,
+    ) -> None:
+        self._capacity = capacity
         self._memory = collections.OrderedDict()
-        self._capacity = capachity
 
     def __contains__(self, key: StageTransformationSpec) -> bool:
         return key in self._memory
diff --git a/tests/test_caching.py b/tests/test_caching.py
index 0cf1526..01fabc9 100644
--- a/tests/test_caching.py
+++ b/tests/test_caching.py
@@ -191,8 +191,11 @@ def jaceWrapped(A: np.ndarray, B: np.ndarray) -> np.ndarray:
     # Because of the way how things work the optimized must have more than the
     #  unoptimized. If there is sharing, then this would not be the case.
     assert unoptiCompiled is not optiCompiled
-    assert optiCompiled._csdfg.sdfg.number_of_nodes() == 1
-    assert optiCompiled._csdfg.sdfg.number_of_nodes() < unoptiCompiled._csdfg.sdfg.number_of_nodes()
+    assert optiCompiled._compiled_sdfg.sdfg.number_of_nodes() == 1
+    assert (
+        optiCompiled._compiled_sdfg.sdfg.number_of_nodes()
+        < unoptiCompiled._compiled_sdfg.sdfg.number_of_nodes()
+    )
 
 
 def test_caching_dtype():

From 744738b595d0af8b4c27f00a9500f56a0fb62b4a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 21 Jun 2024 17:09:43 +0200
Subject: [PATCH 393/458] DaCe does not consider dashes as valid names.

---
 src/jace/translated_jaxpr_sdfg.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/jace/translated_jaxpr_sdfg.py b/src/jace/translated_jaxpr_sdfg.py
index 5ad00c6..9bcec78 100644
--- a/src/jace/translated_jaxpr_sdfg.py
+++ b/src/jace/translated_jaxpr_sdfg.py
@@ -201,7 +201,7 @@ def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> CompiledJaxprSDFG:
         # We need to give the SDFG another name, this is needed to prevent a DaCe
         #  error/warning. This happens if we compile the same lowered SDFG multiple
         #  times with different options.
-        sdfg.name = f"{sdfg.name}__{uuid.uuid1()}"
+        sdfg.name = f"{sdfg.name}__{str(uuid.uuid1()).replace('-', '_')}"
         assert len(sdfg.name) < 255  # noqa: PLR2004 magic-value-comparison  # 255 maximal file name size on UNIX.
 
         with dace.config.temporary_config():

From 71b6422a1dea2486a628b665907777e7fae50f40 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 23 Jun 2024 12:23:05 +0200
Subject: [PATCH 394/458] Changed `finalize_compilation_options()` to
 `make_final_compilation_options()` which should be a bit better.

---
 src/jace/stages.py | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index 327017c..5d9e68f 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -49,8 +49,8 @@
     "JaCeLowered",
     "JaCeWrapped",
     "Stage",
-    "finalize_compilation_options",
     "get_active_compiler_options",
+    "make_final_compilation_options",
     "update_active_compiler_options",
 ]
 
@@ -243,7 +243,7 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
 
         To perform the optimizations `jace_optimize()` is used. The actual options that
         are forwarded to it are obtained by passing `compiler_options` to
-        `finalize_compilation_options()`.
+        `make_final_compilation_options()`.
 
         Args:
             compiler_options: The optimization options to use.
@@ -251,7 +251,7 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
         # We **must** deepcopy before we do any optimization, because all optimizations
         #  are in place, to properly cache stages, stages needs to be immutable.
         tsdfg: tjsdfg.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
-        optimization.jace_optimize(tsdfg=tsdfg, **finalize_compilation_options(compiler_options))
+        optimization.jace_optimize(tsdfg=tsdfg, **make_final_compilation_options(compiler_options))
 
         return JaCeCompiled(
             compiled_sdfg=tjsdfg.compile_jaxpr_sdfg(tsdfg),
@@ -289,7 +289,7 @@ def _make_call_description(
         unflatted_args, unflatted_kwargs = jax_tree.tree_unflatten(in_tree, flat_call_args)
         assert (not unflatted_kwargs) and (len(unflatted_args) <= 1)
 
-        options = finalize_compilation_options(unflatted_args[0] if unflatted_args else {})
+        options = make_final_compilation_options(unflatted_args[0] if unflatted_args else {})
         flat_options, option_tree = jax_tree.tree_flatten(options)
         return tcache.StageTransformationSpec(
             stage_id=id(self), flat_call_args=tuple(flat_options), in_tree=option_tree
@@ -354,7 +354,7 @@ def __call__(self, *args: Any, **kwargs: Any) -> _ReturnType:
 The global set is initialized with `jace.optimization.DEFAULT_OPTIMIZATIONS`. It can be
 managed through `update_active_compiler_options()` and accessed through
 `get_active_compiler_options()`, however, it is advised that a user should use
-`finalize_compilation_options()` for getting the final options that should be used
+`make_final_compilation_options()` for getting the final options that should be used
 for optimization.
 """
 
@@ -383,7 +383,7 @@ def get_active_compiler_options() -> CompilerOptions:
     return _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
 
 
-def finalize_compilation_options(compiler_options: CompilerOptions | None) -> CompilerOptions:
+def make_final_compilation_options(compiler_options: CompilerOptions | None) -> CompilerOptions:
     """
     Returns the final compilation options.
 

From bcd941f48f96b7cd7639c06ec4ecb99431fb68d8 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 23 Jun 2024 13:01:31 +0200
Subject: [PATCH 395/458] It seems that `dace.is_array()` does not considers
 zero dimensional arrays as arrays.

I am not sure why it worked before, but think it is related to a change in JAX itself, i.e. the parts that failed now, would actually go through the `is_jax_array()` function before, but now no longer.
I also changed the Typeguard, it is technically still wrong, but it no longer considers scalars as problems.
I think in th elong run we need our own array defintion.
---
 src/jace/util/traits.py | 11 ++++++-----
 1 file changed, 6 insertions(+), 5 deletions(-)

diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 07cec9a..af7affe 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -32,16 +32,17 @@ def is_jax_array(obj: Any) -> TypeGuard[jax.Array]:
     """
     Tests if `obj` is a JAX array.
 
-    Note:
-     JAX arrays are special as they can not be mutated. Furthermore, they always
-     allocate on the CPU _and_ on the GPU, if present.
+    Notes:
+        JAX arrays are special as they can not be mutated. Furthermore, they always
+        allocate on the CPU _and_ on the GPU, if present.
     """
     return isinstance(obj, jax.Array)
 
 
-def is_array(obj: Any) -> TypeGuard[jax.typing.ArrayLike]:
+def is_array(obj: Any) -> TypeGuard[jax.Array]:
     """Identifies arrays, this also includes JAX arrays."""
-    return dace.is_array(obj) or is_jax_array(obj)
+    # `dace.is_array()` does not seem to recognise shape zero arrays.
+    return isinstance(obj, np.ndarray) or dace.is_array(obj) or is_jax_array(obj)
 
 
 def is_scalar(obj: Any) -> bool:

From 4be66b1a0383a72c6ee5a7250f1c8e95d5d587f0 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 23 Jun 2024 13:05:39 +0200
Subject: [PATCH 396/458] Fixed a bug in `is_tracing_ongoing()`.

I also now made the assignement outside, it is just better to understand.
---
 src/jace/util/jax_helper.py | 8 +++-----
 1 file changed, 3 insertions(+), 5 deletions(-)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 0f59c0b..41f4c20 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -146,12 +146,10 @@ def is_tracing_ongoing(*args: Any, **kwargs: Any) -> bool:
     #  See also: https://github.com/google/jax/pull/3370
     if any(isinstance(x, jax_core.Tracer) for x in itertools.chain(args, kwargs.values())):
         return True
-    if (
-        trace_stack_length := (len(jax._src.core.thread_local_state.trace_state.trace_stack.stack))
-        == 1
-    ):
+    trace_stack_height = len(jax._src.core.thread_local_state.trace_state.trace_stack.stack)
+    if trace_stack_height == 1:
         return False
-    if trace_stack_length > 1:
+    if trace_stack_height > 1:
         return True
     raise RuntimeError("Failed to determine if tracing is ongoing.")
 

From 617c5c1273204df2ab5b3838b13bb15402ab9899 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 23 Jun 2024 13:11:57 +0200
Subject: [PATCH 397/458] Updated the `get_jax_literal_value()` function.

It seems that in newer JAX versions literals are passed either as arrays (with zero dimensions) or as scalars.
---
 src/jace/util/jax_helper.py | 18 ++++++++++++------
 1 file changed, 12 insertions(+), 6 deletions(-)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 41f4c20..bc2de21 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -17,16 +17,19 @@
 import dataclasses
 import itertools
 from collections.abc import Mapping
-from typing import Any, overload
+from typing import TYPE_CHECKING, Any, overload
 
 import dace
 import jax
 import jax.core as jax_core
-import numpy as np
 
 from jace import util
 
 
+if TYPE_CHECKING:
+    import numpy as np
+
+
 @dataclasses.dataclass(repr=True, frozen=True, eq=False)
 class JaCeVar:
     """
@@ -225,9 +228,12 @@ def get_jax_literal_value(lit: jax_core.Atom) -> bool | float | int | np.generic
     if not isinstance(lit, jax_core.Literal):
         raise TypeError(f"Can only extract literals not '{type(lit)}'.")
     val = lit.val
-    if isinstance(val, np.ndarray):
+    # In previous versions of JAX literals were always 0-dim arrays, but it seems
+    #  that in newer versions the values are either arrays or scalars.
+    #  I saw both thus we have to keep both branches.
+    if util.is_array(val):
         assert val.shape == ()
-        return val.max()
-    if isinstance(val, (bool, float, int)):
+        return val.dtype.type(val.max())
+    if util.is_scalar(val):
         return val
-    raise TypeError(f"Failed to extract value from '{lit}'.")
+    raise TypeError(f"Failed to extract value from '{lit}' ('{val}' type: {type(val).__name__}).")

From 031b33f9a4f6faffb4f6d67539944b31f5217de7 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 23 Jun 2024 13:12:42 +0200
Subject: [PATCH 398/458] Updated the tests after merging the new PR into the
 development branch.

---
 tests/conftest.py                              | 12 ++++++------
 ..._primitive_arithmetic_logical_operations.py |  2 +-
 .../test_primitive_concatenate.py              |  4 ++--
 .../test_primitive_squeeze_expand_dims.py      |  2 +-
 tests/integration_tests/test_empty_jaxpr.py    |  4 ++--
 .../test_jaxpr_translator_builder.py           | 18 +++++++++---------
 tests/unit_tests/test_caching.py               |  6 +++---
 tests/unit_tests/test_jax_api.py               | 12 ++++++------
 8 files changed, 30 insertions(+), 30 deletions(-)

diff --git a/tests/conftest.py b/tests/conftest.py
index f5c9a23..607e7e6 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -29,11 +29,11 @@
 
 @pytest.fixture(autouse=True)
 def _enable_x64_mode_in_jax() -> Generator[None, None, None]:
-    """Fixture of enable the `x64` mode in Jax.
+    """Fixture of enable the `x64` mode in JAX.
 
-    Currently, JaCe requires that `x64` mode is enabled and will do all Jax
-    things with it enabled. However, if we use Jax with the intend to compare
-    it against JaCe we must also enable it for Jax.
+    Currently, JaCe requires that `x64` mode is enabled and will do all JAX
+    things with it enabled. However, if we use JAX with the intend to compare
+    it against JaCe we must also enable it for JAX.
     """
     with jax.experimental.enable_x64():
         yield
@@ -41,9 +41,9 @@ def _enable_x64_mode_in_jax() -> Generator[None, None, None]:
 
 @pytest.fixture(autouse=True)
 def _disable_jit() -> Generator[None, None, None]:
-    """Fixture for disable the dynamic jiting in Jax.
+    """Fixture for disable the dynamic jiting in JAX.
 
-    For certain reasons Jax puts certain primitives inside a `pjit` primitive,
+    For certain reasons JAX puts certain primitives inside a `pjit` primitive,
     i.e. nested Jaxpr. The intent is, that these operations can/should run on
     an accelerator.
 
diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index fc15ecf..76afe44 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -44,7 +44,7 @@ class such as
 def _only_alt_translators() -> Generator[None, None, None]:
     """Removes all non arithmetic/logical translator from the registry.
 
-    This ensures that Jax is not doing some stuff that is supposed to be handled by the
+    This ensures that JAX is not doing some stuff that is supposed to be handled by the
     test class, such as broadcasting. It makes writing tests a bit harder, but it is
     worth. For some reasons also type conversion s allowed.
     """
diff --git a/tests/integration_tests/primitive_translators/test_primitive_concatenate.py b/tests/integration_tests/primitive_translators/test_primitive_concatenate.py
index 29f44a8..12fe735 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_concatenate.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_concatenate.py
@@ -59,11 +59,11 @@ def testee(inputs: list[np.ndarray]) -> np.ndarray | jax.Array:
         assert np.all(ref == res)
 
 
-@pytest.mark.skip(reason="Jax does not support scalars as inputs.")
+@pytest.mark.skip(reason="JAX does not support scalars as inputs.")
 def test_cat_1d_array_scalars():
     """Concatenate an 1d array with scalars.
 
-    This does not work, it is to observe Jax.
+    This does not work, it is to observe JAX.
     """
 
     a1 = testutil.make_array(10)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
index 5ff6a49..672458b 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
@@ -50,7 +50,7 @@ def _roundtrip_implementation(shape: Sequence[int], axis: int | Sequence[int]) -
         assert ref.shape == res.shape, f"a.shape = {shape}; Expected: {ref.shape}; Got: {res.shape}"
         assert ref.dtype == res.dtype
         assert np.all(ref == res), f"Value error for shape '{shape}' and axis={axis}"
-        a = np.array(ref, copy=True)  # It is a Jax array, and we have to reverse this.
+        a = np.array(ref, copy=True)  # It is a JAX array, and we have to reverse this.
     assert a_org.shape == res.shape
     assert np.all(a_org == res)
 
diff --git a/tests/integration_tests/test_empty_jaxpr.py b/tests/integration_tests/test_empty_jaxpr.py
index 58f8f65..68d7716 100644
--- a/tests/integration_tests/test_empty_jaxpr.py
+++ b/tests/integration_tests/test_empty_jaxpr.py
@@ -59,8 +59,8 @@ def wrapped(a: np.ndarray, b: np.float64) -> np.ndarray:  # noqa: ARG001  # Expl
     compiled = lowered.compile()
     res = compiled(a, b)
 
-    assert len(lowered._translated_sdfg.inp_names) == 2
-    assert len(compiled._csdfg.inp_names) == 2
+    assert len(lowered._translated_sdfg.input_names) == 2
+    assert len(compiled._compiled_sdfg.input_names) == 2
     assert isinstance(res, np.ndarray)
     assert np.all(res == a)
     assert res.__array_interface__["data"][0] != a.__array_interface__["data"][0]
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index ebbc075..b1a85c5 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -231,7 +231,7 @@ def test_builder_nested(translation_builder: translator.JaxprTranslationBuilder)
     with pytest.raises(
         expected_exception=KeyError,
         match=re.escape(
-            f"Jax variable '{array1}' was supposed to map to '{name_1}', but no such SDFG variable is known."
+            f"JAX variable '{array1}' was supposed to map to '{name_1}', but no such SDFG variable is known."
         ),
     ):
         _ = translation_builder.map_jax_var_to_sdfg(array1)
@@ -265,7 +265,7 @@ def test_builder_nested(translation_builder: translator.JaxprTranslationBuilder)
     with pytest.raises(
         expected_exception=KeyError,
         match=re.escape(
-            f"Jax variable '{array2}' was supposed to map to '{name_2}', but no such SDFG variable is known."
+            f"JAX variable '{array2}' was supposed to map to '{name_2}', but no such SDFG variable is known."
         ),
     ):
         _ = translation_builder.map_jax_var_to_sdfg(array2)
@@ -514,7 +514,7 @@ def wrapped(a: float) -> float:
 
 
 def test_builder_scalar_return_type() -> None:
-    """As Jax we always return an array, even for a scalar."""
+    """As JAX we always return an array, even for a scalar."""
 
     @jace.jit
     def wrapped(a: np.float64) -> np.float64:
@@ -546,10 +546,10 @@ def wrapped(a: np.ndarray, b: np.ndarray) -> tuple[np.ndarray, np.ndarray]:
     ref = (a + b, a - b)
     res = compiled(a, b)
 
-    assert len(lowered._translated_sdfg.inp_names) == 2
-    assert len(compiled._csdfg.inp_names) == 2
+    assert len(lowered._translated_sdfg.input_names) == 2
+    assert len(compiled._compiled_sdfg.input_names) == 2
     assert len(lowered._translated_sdfg.out_names) == 2
-    assert len(compiled._csdfg.out_names) == 2
+    assert len(compiled._compiled_sdfg.out_names) == 2
     assert isinstance(res, tuple), f"Expected 'tuple', but got '{type(res).__name__}'."
     assert len(res) == 2
     assert np.allclose(ref, res)
@@ -562,7 +562,7 @@ def test_builder_direct_return() -> None:
         The test function below will not return a reference to its input,
         but perform an actual copy. This behaviour does look strange from a
         Python point of view, however, it is (at the time of writing)
-        consistent with what Jax does, even when passing Jax arrays directly.
+        consistent with what JAX does, even when passing JAX arrays directly.
     """
 
     @jace.jit
@@ -619,8 +619,8 @@ def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:  # noqa: ARG001  # Expli
     res1 = compiled(a, b)  # Correct call
     res2 = compiled(a, c)  # wrong call to show that nothing is affected.
 
-    assert len(lowered._translated_sdfg.inp_names) == 2
-    assert len(compiled._csdfg.inp_names) == 2
+    assert len(lowered._translated_sdfg.input_names) == 2
+    assert len(compiled._compiled_sdfg.input_names) == 2
     assert np.all(res1 == res2)
     assert np.allclose(ref, res1)
 
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index a6fa29b..564d0ea 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -201,10 +201,10 @@ def jace_wrapped(a: np.ndarray, b: np.ndarray) -> np.ndarray:
     # Because of the way how things work the optimized must have more than the
     #  unoptimized. If there is sharing, then this would not be the case.
     assert unoptized_compiled is not optized_compiled
-    assert optized_compiled._csdfg.sdfg.number_of_nodes() == 1
+    assert optized_compiled._compiled_sdfg.sdfg.number_of_nodes() == 1
     assert (
-        optized_compiled._csdfg.sdfg.number_of_nodes()
-        < unoptized_compiled._csdfg.sdfg.number_of_nodes()
+        optized_compiled._compiled_sdfg.sdfg.number_of_nodes()
+        < unoptized_compiled._compiled_sdfg.sdfg.number_of_nodes()
     )
 
     # Now we check if they are still inside the cache.
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index 6cd7860..534650a 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Tests the compatibility of the JaCe api to Jax."""
+"""Tests the compatibility of the JaCe api to JAX."""
 
 from __future__ import annotations
 
@@ -78,7 +78,7 @@ def ddf(x):
 
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_composition_with_jax() -> None:
-    """Tests if JaCe can interact with Jax and vice versa."""
+    """Tests if JaCe can interact with JAX and vice versa."""
 
     def base_fun(a, b, c):
         return a + b * jnp.sin(c) - a * b
@@ -97,7 +97,7 @@ def jax_fun(a, b, c):
 
 @pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_composition_with_jax_2() -> None:
-    """Second test if JaCe can interact with Jax and vice versa."""
+    """Second test if JaCe can interact with JAX and vice versa."""
 
     @jax.jit
     def f1_jax(a, b):
@@ -121,7 +121,7 @@ def f3_jace(a, b, c, d):
     res_jax = f3_jax(a, b, c, d)
     res_jace = f3_jace(a, b, c, d)
 
-    assert np.allclose(ref, res_jax), "Jax failed."
+    assert np.allclose(ref, res_jax), "JAX failed."
     assert np.allclose(ref, res_jace), "JaCe Failed."
 
 
@@ -202,7 +202,7 @@ def testee(a: np.ndarray, b: np.float64) -> np.ndarray:
         trans_ctx=trans_ctx, fun=testee, flat_call_args=flat_call_args
     )
 
-    # Because x64 is disabled Jax traces the input as float32, even if we have passed
+    # Because x64 is disabled JAX traces the input as float32, even if we have passed
     #  float64 as input! Calling the resulting SDFG with the arguments we used for
     #  lowering will result in an error, because of the situation,
     #  `sizeof(float32) < sizeof(float64)`, no out of bound error would result, but the
@@ -252,7 +252,7 @@ def ones10x10() -> jax.Array:
 
 
 def test_jax_array_as_input() -> None:
-    """This function tests if we use Jax arrays as inputs."""
+    """This function tests if we use JAX arrays as inputs."""
 
     def testee(a: jax.Array) -> jax.Array:
         return jnp.sin(a + 1.0)

From c5826694a4f91b0643d23ee8fc25e31396f727e3 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 23 Jun 2024 13:05:39 +0200
Subject: [PATCH 399/458] Fixed a bug in `is_tracing_ongoing()`.

I also now made the assignement outside, it is just better to understand.
---
 src/jace/util/jax_helper.py | 8 +++-----
 1 file changed, 3 insertions(+), 5 deletions(-)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 71d3660..6075343 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -138,12 +138,10 @@ def is_tracing_ongoing(*args: Any, **kwargs: Any) -> bool:
     #  See also: https://github.com/google/jax/pull/3370
     if any(isinstance(x, jax_core.Tracer) for x in itertools.chain(args, kwargs.values())):
         return True
-    if (
-        trace_stack_length := (len(jax._src.core.thread_local_state.trace_state.trace_stack.stack))
-        == 1
-    ):
+    trace_stack_height = len(jax._src.core.thread_local_state.trace_state.trace_stack.stack)
+    if trace_stack_height == 1:
         return False
-    if trace_stack_length > 1:
+    if trace_stack_height > 1:
         return True
     raise RuntimeError("Failed to determine if tracing is ongoing.")
 

From 565c69d30c7a11bf83b4f912289a0b9769556158 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 23 Jun 2024 13:11:57 +0200
Subject: [PATCH 400/458] Updated the `get_jax_literal_value()` function.

It seems that in newer JAX versions literals are passed either as arrays (with zero dimensions) or as scalars.
---
 src/jace/util/jax_helper.py | 18 ++++++++++++------
 1 file changed, 12 insertions(+), 6 deletions(-)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 6075343..51bf2e4 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -17,16 +17,19 @@
 import dataclasses
 import itertools
 from collections.abc import Mapping
-from typing import Any
+from typing import TYPE_CHECKING, Any
 
 import dace
 import jax
 import jax.core as jax_core
-import numpy as np
 
 from jace import util
 
 
+if TYPE_CHECKING:
+    import numpy as np
+
+
 @dataclasses.dataclass(repr=True, frozen=True, eq=False)
 class JaCeVar:
     """
@@ -217,9 +220,12 @@ def get_jax_literal_value(lit: jax_core.Atom) -> bool | float | int | np.generic
     if not isinstance(lit, jax_core.Literal):
         raise TypeError(f"Can only extract literals not '{type(lit)}'.")
     val = lit.val
-    if isinstance(val, np.ndarray):
+    # In previous versions of JAX literals were always 0-dim arrays, but it seems
+    #  that in newer versions the values are either arrays or scalars.
+    #  I saw both thus we have to keep both branches.
+    if util.is_array(val):
         assert val.shape == ()
-        return val.max()
-    if isinstance(val, (bool, float, int)):
+        return val.dtype.type(val.max())
+    if util.is_scalar(val):
         return val
-    raise TypeError(f"Failed to extract value from '{lit}'.")
+    raise TypeError(f"Failed to extract value from '{lit}' ('{val}' type: {type(val).__name__}).")

From 0dd9404719d72875f97898dc24d00c6d40804ace Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Sun, 23 Jun 2024 13:16:37 +0200
Subject: [PATCH 401/458] Imported some files to silence mypy.

---
 src/jace/util/jax_helper.py | 10 +++++++++-
 src/jace/util/traits.py     | 11 ++++++-----
 2 files changed, 15 insertions(+), 6 deletions(-)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index 51bf2e4..bc2de21 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -17,7 +17,7 @@
 import dataclasses
 import itertools
 from collections.abc import Mapping
-from typing import TYPE_CHECKING, Any
+from typing import TYPE_CHECKING, Any, overload
 
 import dace
 import jax
@@ -102,6 +102,14 @@ def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
             )
 
 
+@overload
+def get_jax_var_shape(jax_var: jax_core.Atom) -> tuple[int, ...]: ...
+
+
+@overload
+def get_jax_var_shape(jax_var: JaCeVar) -> tuple[int | dace.symbol | str, ...]: ...
+
+
 def get_jax_var_shape(jax_var: jax_core.Atom | JaCeVar) -> tuple[int | dace.symbol | str, ...]:
     """Returns the shape of `jax_var`."""
     match jax_var:
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index 07cec9a..af7affe 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -32,16 +32,17 @@ def is_jax_array(obj: Any) -> TypeGuard[jax.Array]:
     """
     Tests if `obj` is a JAX array.
 
-    Note:
-     JAX arrays are special as they can not be mutated. Furthermore, they always
-     allocate on the CPU _and_ on the GPU, if present.
+    Notes:
+        JAX arrays are special as they can not be mutated. Furthermore, they always
+        allocate on the CPU _and_ on the GPU, if present.
     """
     return isinstance(obj, jax.Array)
 
 
-def is_array(obj: Any) -> TypeGuard[jax.typing.ArrayLike]:
+def is_array(obj: Any) -> TypeGuard[jax.Array]:
     """Identifies arrays, this also includes JAX arrays."""
-    return dace.is_array(obj) or is_jax_array(obj)
+    # `dace.is_array()` does not seem to recognise shape zero arrays.
+    return isinstance(obj, np.ndarray) or dace.is_array(obj) or is_jax_array(obj)
 
 
 def is_scalar(obj: Any) -> bool:

From 6b69a456f9b009d2c6b242a196eb6e3734e88c86 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 07:19:31 +0200
Subject: [PATCH 402/458] Fixed a naming error.

---
 src/jace/stages.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index 5d9e68f..28dad20 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -36,7 +36,7 @@
 
 from jace import api, optimization, tracing, translated_jaxpr_sdfg as tjsdfg, translator, util
 from jace.optimization import CompilerOptions
-from jace.translator import post_translation as ptrans
+from jace.translator import post_translation as ptranslation
 from jace.util import translation_cache as tcache
 
 
@@ -168,7 +168,7 @@ def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered[_ReturnType]
         trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
 
         flat_call_args = jax_tree.tree_leaves((args, kwargs))
-        tsdfg: tjsdfg.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
+        tsdfg: tjsdfg.TranslatedJaxprSDFG = ptranslation.postprocess_jaxpr_sdfg(
             trans_ctx=trans_ctx,
             fun=self.wrapped_fun,
             flat_call_args=flat_call_args,

From f7ee981fb2fb764c5c1f4c9eebc9bb62334ffbb3 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 07:20:20 +0200
Subject: [PATCH 403/458] Fixed a naming issue.

---
 src/jace/stages.py               | 4 ++--
 tests/unit_tests/test_jax_api.py | 4 ++--
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index 5d9e68f..28dad20 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -36,7 +36,7 @@
 
 from jace import api, optimization, tracing, translated_jaxpr_sdfg as tjsdfg, translator, util
 from jace.optimization import CompilerOptions
-from jace.translator import post_translation as ptrans
+from jace.translator import post_translation as ptranslation
 from jace.util import translation_cache as tcache
 
 
@@ -168,7 +168,7 @@ def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered[_ReturnType]
         trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
 
         flat_call_args = jax_tree.tree_leaves((args, kwargs))
-        tsdfg: tjsdfg.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
+        tsdfg: tjsdfg.TranslatedJaxprSDFG = ptranslation.postprocess_jaxpr_sdfg(
             trans_ctx=trans_ctx,
             fun=self.wrapped_fun,
             flat_call_args=flat_call_args,
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index 534650a..f73c535 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -16,7 +16,7 @@
 
 import jace
 from jace import translated_jaxpr_sdfg as tjsdfg, translator, util
-from jace.translator import post_translation as ptrans
+from jace.translator import post_translation as ptranslation
 
 from tests import util as testutil
 
@@ -198,7 +198,7 @@ def testee(a: np.ndarray, b: np.float64) -> np.ndarray:
     )
     trans_ctx: translator.TranslationContext = builder.translate_jaxpr(jaxpr)
 
-    tsdfg: tjsdfg.TranslatedJaxprSDFG = ptrans.postprocess_jaxpr_sdfg(
+    tsdfg: tjsdfg.TranslatedJaxprSDFG = ptranslation.postprocess_jaxpr_sdfg(
         trans_ctx=trans_ctx, fun=testee, flat_call_args=flat_call_args
     )
 

From 8698397f6e1b42d0fcc9cd9c075441d4ec6d58ef Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 07:28:54 +0200
Subject: [PATCH 404/458] Specified that a transient is exactly written once.

This si not fully true, actually there is onyl one access node that writes to the transient.
This is needed to implement primitives such as `concatenation`.
However, by a special prefix a variable can be written to multiple time, this is needed to implement the scans.
However, it might be possiblt to avoid that.
---
 src/jace/translator/jaxpr_translator_builder.py | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 7ef6d06..8562686 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -35,8 +35,11 @@ class JaxprTranslationBuilder:
     - there are only transient variables inside the SDFG,
     - it lacks the special `__return` variable,
     - the `arg_names` parameter is not set,
-    - for all scalar values a ` Scalar` SDFG variable is used, thus they cannot
-        be used to return anything.
+    - for all scalar values a `Scalar` SDFG variable is used, thus they cannot
+        be used for return values,
+    - for every transient there is exactly one access node that writes to it,
+        except the name of the array starts with `__jace_mutable_`, which can
+        be written to multiple times.
 
     For these reasons the SDFG is not directly usable, and further manipulations
     have to be performed. Especially, DaCe's validation function will fail and

From f3a65d6725c2b360622ecfd72c3e76ebf89b2ea6 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 08:03:04 +0200
Subject: [PATCH 405/458] Fixed the noxfile, it now uses the correct Sphinx
 version.

---
 noxfile.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/noxfile.py b/noxfile.py
index b6aec1b..76e0a2e 100644
--- a/noxfile.py
+++ b/noxfile.py
@@ -134,7 +134,10 @@ def docs(session: nox.Session) -> None:
 @nox.session(reuse_venv=True)
 def api_docs(session: nox.Session) -> None:
     """Build (regenerate) API docs."""
-    session.install(f"sphinx=={REQUIREMENTS['sphinx']}")
+    sphinx_req = REQUIREMENTS["sphinx"]
+    if sphinx_req.isdigit():
+        sphinx_req = "==" + sphinx_req
+    session.install(f"sphinx{sphinx_req}")
     session.chdir("docs")
     session.run(
         "sphinx-apidoc",

From 969f2f88ad472e48154faac3a853411dc809356a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 08:04:03 +0200
Subject: [PATCH 406/458] The README is now included in the documentation.

---
 docs/index.md | 2 --
 1 file changed, 2 deletions(-)

diff --git a/docs/index.md b/docs/index.md
index e447b26..c395a73 100644
--- a/docs/index.md
+++ b/docs/index.md
@@ -3,11 +3,9 @@
 ```{toctree}
 :maxdepth: 2
 :hidden:
-
 ```
 
 ```{include} ../README.md
-:start-after: <!-- SPHINX-START -->
 ```
 
 ## Indices and tables

From 29d09e77e8411e6df775847cb595d03b1beab017 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 08:04:53 +0200
Subject: [PATCH 407/458] It should be `Note:` instead of `Notes:`.

---
 src/jace/api.py                                        |  2 +-
 src/jace/stages.py                                     |  2 +-
 src/jace/translated_jaxpr_sdfg.py                      |  2 +-
 src/jace/translator/jaxpr_translator_builder.py        | 10 +++++-----
 .../translator/mapped_operation_base_translator.py     |  2 +-
 src/jace/translator/primitive_translator.py            |  2 +-
 .../arithmetic_logical_translators.py                  |  2 +-
 .../convert_element_type_translator.py                 |  2 +-
 src/jace/translator/primitive_translators/slicing.py   |  2 +-
 src/jace/util/traits.py                                |  4 ++--
 10 files changed, 15 insertions(+), 15 deletions(-)

diff --git a/src/jace/api.py b/src/jace/api.py
index 18a81e6..05bfa1e 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -30,7 +30,7 @@ class JITOptions(TypedDict, total=False):
     """
     All known options to `jace.jit` that influence tracing.
 
-    Notes:
+    Note:
         Currently there are no known options, but essentially it is a subset of some
         of the options that are supported by `jax.jit` together with some additional
         JaCe specific ones.
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 28dad20..b51fac0 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -191,7 +191,7 @@ def _make_call_description(
         For all non static arguments the function will generate an abstract description
         of an argument and for all static arguments the concrete value.
 
-        Notes:
+        Note:
             The abstract description also includes storage location, i.e. if on CPU or
             on GPU, and the strides of the arrays.
         """
diff --git a/src/jace/translated_jaxpr_sdfg.py b/src/jace/translated_jaxpr_sdfg.py
index 9bcec78..04eae37 100644
--- a/src/jace/translated_jaxpr_sdfg.py
+++ b/src/jace/translated_jaxpr_sdfg.py
@@ -110,7 +110,7 @@ class CompiledJaxprSDFG:
         input_names: Names of the SDFG variables used as inputs.
         out_names: Names of the SDFG variables used as outputs.
 
-    Notes:
+    Note:
         Currently the strides of the input arguments must match the ones that were used
         for lowering the SDFG.
         In DaCe the return values are allocated on a per `CompiledSDFG` basis. Thus
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 8562686..ea4606d 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -69,7 +69,7 @@ class JaxprTranslationBuilder:
     Args:
         primitive_translators: Primitive translators to use in the translation.
 
-    Notes:
+    Note:
         After a translation has been performed the translator object can be used
         again.
     """
@@ -150,7 +150,7 @@ def append_new_state(
             assignments: Symbol assignments on the `InterstateEdge`.
             prev_state: Alternative state at which we append.
 
-        Notes:
+        Note:
             It is potentially dangerous to not append to the current terminal
             state, as a canonical SDFG only has one sink state. If this is done
             the user has to ensure, that at the end of the processing the SDFG
@@ -183,7 +183,7 @@ def arrays(self) -> Mapping[str, dace_data.Data]:
         """
         Get all data descriptors that are currently known to the SDFG.
 
-        Notes:
+        Note:
             Essentially a shorthand and preferred way for `self.sdfg.arrays`.
             For getting a specific data descriptor use `self.get_array()`.
         """
@@ -446,7 +446,7 @@ def _create_initial_input(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         """
         Creates the input variables of `jaxpr`.
 
-        Notes:
+        Note:
             The function will populate the `input_names` member of the current context.
         """
         assert self._ctx.input_names is None
@@ -589,7 +589,7 @@ def _translate_jaxpr_internal(self, jaxpr: jax_core.ClosedJaxpr) -> TranslationC
         Args:
             jaxpr: The Jaxpr to translate.
 
-        Notes:
+        Note:
             Equations that store into drop variables, i.e. with name `_`,
             will be ignored.
         """
diff --git a/src/jace/translator/mapped_operation_base_translator.py b/src/jace/translator/mapped_operation_base_translator.py
index f5a4103..9f0f402 100644
--- a/src/jace/translator/mapped_operation_base_translator.py
+++ b/src/jace/translator/mapped_operation_base_translator.py
@@ -53,7 +53,7 @@ class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
     Args:
         primitive_name:     The name of the primitive `self` should bind to.
 
-    Notes:
+    Note:
         This class will always generate a mapped Tasklet, even if a scalar is handled.
     """
 
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index bcc0b8b..ab84c5d 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -135,7 +135,7 @@ def make_primitive_translator(
     that it satisfy the `PrimitiveTranslator` protocol. However, it does not add
     it to the registry, for that `register_primitive_translator()` has to be used.
 
-    Notes:
+    Note:
         This function can also be used as decorator.
     """
 
diff --git a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
index d901682..59494e9 100644
--- a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
+++ b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
@@ -92,7 +92,7 @@ class LogicalOperationTranslator(mapped_base.MappedOperationTranslatorBase):
         int_tmpl:       The template used for the integer case.
         bool_tmpl:      The template used for the bool case.
 
-    Notes:
+    Note:
         Since it does not make sense to single out `not` and keep the other
         logical operations in `ArithmeticOperationTranslator` all of them are
         handled by this class.
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index 28838e5..ee05a2a 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -33,7 +33,7 @@ class ConvertElementTypeTranslator(mapped_base.MappedOperationTranslatorBase):
     However, in cases where the input type is the same as the output type,
     the Tasklet will just be a copy Tasklet, that can then be removed by DaCe.
 
-    Notes:
+    Note:
         This translator ignores the `new_dtype` and `weak_type` parameters of
         the equation and only performs the casting based on the type of the fields.
     """
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index 3000377..1741fef 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -31,7 +31,7 @@ class SlicingTranslator(mapped_base.MappedOperationTranslatorBase):
     This is the classical slicing operation which extracts a fixed sized window
     from a fixed initial position. The slicing is implemented using a partial copy.
 
-    Notes:
+    Note:
         Slices are essentially optimization barriers as they can not be fused
         with Maps before them.
     """
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index af7affe..d7efb30 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -32,7 +32,7 @@ def is_jax_array(obj: Any) -> TypeGuard[jax.Array]:
     """
     Tests if `obj` is a JAX array.
 
-    Notes:
+    Note:
         JAX arrays are special as they can not be mutated. Furthermore, they always
         allocate on the CPU _and_ on the GPU, if present.
     """
@@ -83,7 +83,7 @@ def get_strides_for_dace(obj: Any) -> tuple[int, ...] | None:
     DaCe and not in bytes as it is inside NumPy. As in NumPy and DaCe the function
     returns `None` to indicate standard C order.
 
-    Notes:
+    Note:
         If `obj` is not array like an error is generated.
     """
     if not is_array(obj):

From d029d1316ee450931f51c6783651407ba1561ae8 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 08:06:15 +0200
Subject: [PATCH 408/458] It should be `Note:` insteed of `Notes:`.

---
 src/jace/api.py                                 |  2 +-
 src/jace/stages.py                              |  2 +-
 src/jace/translated_jaxpr_sdfg.py               |  2 +-
 src/jace/translator/jaxpr_translator_builder.py | 10 +++++-----
 src/jace/translator/primitive_translator.py     |  2 +-
 src/jace/util/traits.py                         |  4 ++--
 6 files changed, 11 insertions(+), 11 deletions(-)

diff --git a/src/jace/api.py b/src/jace/api.py
index 18a81e6..05bfa1e 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -30,7 +30,7 @@ class JITOptions(TypedDict, total=False):
     """
     All known options to `jace.jit` that influence tracing.
 
-    Notes:
+    Note:
         Currently there are no known options, but essentially it is a subset of some
         of the options that are supported by `jax.jit` together with some additional
         JaCe specific ones.
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 28dad20..b51fac0 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -191,7 +191,7 @@ def _make_call_description(
         For all non static arguments the function will generate an abstract description
         of an argument and for all static arguments the concrete value.
 
-        Notes:
+        Note:
             The abstract description also includes storage location, i.e. if on CPU or
             on GPU, and the strides of the arrays.
         """
diff --git a/src/jace/translated_jaxpr_sdfg.py b/src/jace/translated_jaxpr_sdfg.py
index 9bcec78..04eae37 100644
--- a/src/jace/translated_jaxpr_sdfg.py
+++ b/src/jace/translated_jaxpr_sdfg.py
@@ -110,7 +110,7 @@ class CompiledJaxprSDFG:
         input_names: Names of the SDFG variables used as inputs.
         out_names: Names of the SDFG variables used as outputs.
 
-    Notes:
+    Note:
         Currently the strides of the input arguments must match the ones that were used
         for lowering the SDFG.
         In DaCe the return values are allocated on a per `CompiledSDFG` basis. Thus
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 7ef6d06..9285323 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -66,7 +66,7 @@ class JaxprTranslationBuilder:
     Args:
         primitive_translators: Primitive translators to use in the translation.
 
-    Notes:
+    Note:
         After a translation has been performed the translator object can be used
         again.
     """
@@ -147,7 +147,7 @@ def append_new_state(
             assignments: Symbol assignments on the `InterstateEdge`.
             prev_state: Alternative state at which we append.
 
-        Notes:
+        Note:
             It is potentially dangerous to not append to the current terminal
             state, as a canonical SDFG only has one sink state. If this is done
             the user has to ensure, that at the end of the processing the SDFG
@@ -180,7 +180,7 @@ def arrays(self) -> Mapping[str, dace_data.Data]:
         """
         Get all data descriptors that are currently known to the SDFG.
 
-        Notes:
+        Note:
             Essentially a shorthand and preferred way for `self.sdfg.arrays`.
             For getting a specific data descriptor use `self.get_array()`.
         """
@@ -443,7 +443,7 @@ def _create_initial_input(self, jaxpr: jax_core.ClosedJaxpr) -> None:
         """
         Creates the input variables of `jaxpr`.
 
-        Notes:
+        Note:
             The function will populate the `input_names` member of the current context.
         """
         assert self._ctx.input_names is None
@@ -586,7 +586,7 @@ def _translate_jaxpr_internal(self, jaxpr: jax_core.ClosedJaxpr) -> TranslationC
         Args:
             jaxpr: The Jaxpr to translate.
 
-        Notes:
+        Note:
             Equations that store into drop variables, i.e. with name `_`,
             will be ignored.
         """
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index bcc0b8b..ab84c5d 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -135,7 +135,7 @@ def make_primitive_translator(
     that it satisfy the `PrimitiveTranslator` protocol. However, it does not add
     it to the registry, for that `register_primitive_translator()` has to be used.
 
-    Notes:
+    Note:
         This function can also be used as decorator.
     """
 
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index af7affe..d7efb30 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -32,7 +32,7 @@ def is_jax_array(obj: Any) -> TypeGuard[jax.Array]:
     """
     Tests if `obj` is a JAX array.
 
-    Notes:
+    Note:
         JAX arrays are special as they can not be mutated. Furthermore, they always
         allocate on the CPU _and_ on the GPU, if present.
     """
@@ -83,7 +83,7 @@ def get_strides_for_dace(obj: Any) -> tuple[int, ...] | None:
     DaCe and not in bytes as it is inside NumPy. As in NumPy and DaCe the function
     returns `None` to indicate standard C order.
 
-    Notes:
+    Note:
         If `obj` is not array like an error is generated.
     """
     if not is_array(obj):

From 4f343b31c0c778efba9eb86da74f78b41c6f897e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 08:42:21 +0200
Subject: [PATCH 409/458] Started with a document that outlines differences
 between JaCe and JAX, mostly a reminder for me.

---
 docs/main_differences.md | 20 ++++++++++++++++++++
 1 file changed, 20 insertions(+)
 create mode 100644 docs/main_differences.md

diff --git a/docs/main_differences.md b/docs/main_differences.md
new file mode 100644
index 0000000..953bef0
--- /dev/null
+++ b/docs/main_differences.md
@@ -0,0 +1,20 @@
+# Main Differences Between DaCe and JaCe and JAX and JaCe
+
+Essentially JaCe is a frontend that allows DaCe to process JAX code, thus it has to be compatible with both, at least in some sense.
+We will now list the main differences between them, furthermore, you should also consult the ROADMAP.
+
+### JAX vs. JaCe:
+
+- JaCe always traces with enabled `x64` mode.
+  This is a restriction that might be lifted in the future.
+- JAX returns scalars as zero-dimensional arrays, JaCe returns them as array with shape `(1, )`.
+- In JAX parts of the computation runs on CPU parts on GPU, in JaCe everything runs (currently) either on CPU or GPU.
+- Currently JaCe is only able to run on CPU (will be lifted soon).
+- Currently JaCe is not able to run distributed (will be lifted later).
+- Currently not all primitives are supported.
+- JaCe does not return `jax.Array` instances, but NumPy/CuPy arrays.
+
+### DaCe vs. JaCe:
+
+- JaCe accepts complex objects using JAX' pytrees.
+- JaCe will support scalar inputs on GPU.

From 72d6771359121cfc5cc306b0c55e0ebdd6204597 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 09:28:24 +0200
Subject: [PATCH 410/458] Added the clamp primitive, that we will need later.

This also introduces ternary operations.
---
 .../arithmetic_logical_translators.py          |  3 +++
 ..._primitive_arithmetic_logical_operations.py | 18 ++++++++++++++++++
 2 files changed, 21 insertions(+)

diff --git a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
index 59494e9..c9c0a35 100644
--- a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
+++ b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
@@ -175,6 +175,9 @@ def write_tasklet_code(
     "atan2": "__out = atan2((__in0), (__in1))",
 
     "nextafter": "__out = nextafter((__in0), (__in1))",
+
+    # Ternary operations
+    "clamp": "__out = (__in0 if __in1 < __in0 else (__in1 if __in1 < __in2 else __in2))"
 }
 
 
diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index 76afe44..71e92eb 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -330,6 +330,24 @@ def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:
     _perform_alt_test(testee, *alt_binary_ops_float[1])
 
 
+def test_alt_ternary_clamp() -> None:
+    """Tests `jax.lax.clamp()` primitive.
+
+    This primitive is similar to `numpy.clip()` but with a different signature.
+    Furthermore, this is a ternary operation.
+    """
+
+    def testee(min_: np.ndarray, val_: np.ndarray, max_: np.ndarray) -> np.ndarray:
+        return jax.lax.clamp(min_, val_, max_)  # type: ignore[return-value]
+
+    shape = (20, 20)
+    min_ = testutil.make_array(shape) / 2.0
+    max_ = testutil.make_array(shape) / 2.0 + 0.5
+    val_ = testutil.make_array(shape)
+
+    _perform_alt_test(testee, min_, val_, max_)
+
+
 def test_alt_compare_operation(
     alt_binary_compare_ops: tuple[Callable, tuple[np.ndarray, np.ndarray]],
 ) -> None:

From 1766bc390684cbee146cbb9ab8b8967a7991ce4a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 09:36:36 +0200
Subject: [PATCH 411/458] Modified the test function.

---
 .../test_primitive_arithmetic_logical_operations.py | 13 ++++++++++---
 1 file changed, 10 insertions(+), 3 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index 71e92eb..e7dc93f 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -184,8 +184,11 @@ def broadcast_input(request) -> tuple[np.ndarray, np.ndarray]:
     return tuple(testutil.make_array(shape) for shape in request.param)  # type: ignore[return-value] # can not deduce that it is only size 2.
 
 
-def _perform_alt_test(testee: Callable, *args: Any) -> None:
-    """General function that just performs the test."""
+def _perform_alt_test(testee: Callable, *args: Any) -> Any:
+    """General function that just performs the test.
+
+    The function returns the JaCe result.
+    """
     wrapped = jace.jit(testee)
 
     ref = testee(*args)
@@ -197,6 +200,7 @@ def _perform_alt_test(testee: Callable, *args: Any) -> None:
         assert ref.shape == res.shape
     assert ref.dtype == res.dtype
     assert np.allclose(ref, res), f"Expected '{ref.tolist()}' got '{res.tolist()}'"
+    return res
 
 
 # <------------ Tests for `MappedOperationTranslatorBase`
@@ -345,7 +349,10 @@ def testee(min_: np.ndarray, val_: np.ndarray, max_: np.ndarray) -> np.ndarray:
     max_ = testutil.make_array(shape) / 2.0 + 0.5
     val_ = testutil.make_array(shape)
 
-    _perform_alt_test(testee, min_, val_, max_)
+    jace_res = _perform_alt_test(testee, min_, val_, max_)
+
+    # Ensure that all branches were taken.
+    assert not any(np.all(jace_res == x) for x in (min_, val_, max_))
 
 
 def test_alt_compare_operation(

From d3dac222a89809e530381900a12d79d655cfbf47 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 09:49:46 +0200
Subject: [PATCH 412/458] Added a test for proper broadcasting of ternary
 operators.

---
 ...primitive_arithmetic_logical_operations.py | 44 ++++++++++++++++---
 1 file changed, 39 insertions(+), 5 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index e7dc93f..14d8cb1 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -179,11 +179,36 @@ def alt_binary_compare_ops(request) -> tuple[Callable, tuple[np.ndarray, np.ndar
         [(5, 1, 3, 4, 1, 5), (5, 1, 3, 1, 2, 5)],
     ]
 )
-def broadcast_input(request) -> tuple[np.ndarray, np.ndarray]:
-    """Inputs to be used for the broadcast test."""
+def binary_broadcast_input(request) -> tuple[np.ndarray, np.ndarray]:
+    """Inputs to be used for the binary broadcast test."""
     return tuple(testutil.make_array(shape) for shape in request.param)  # type: ignore[return-value] # can not deduce that it is only size 2.
 
 
+@pytest.fixture(
+    params=[
+        [(100, 100), (100, 100), (100, 100)],
+        [(100, 1), (100, 100), (100, 100)],
+        [(100, 100), (100, 1), (100, 100)],
+        [(100, 100), (100, 100), (100, 1)],
+        [(100, 1), (100, 1), (100, 100)],
+        [(100, 100), (100, 1), (100, 1)],
+        [(100, 1), (100, 100), (100, 1)],
+        [(100, 100), (), ()],
+        [(), (100, 100), ()],
+        [(), (), (100, 100)],
+        [(), (100, 100), (100, 100)],
+        [(100, 100), (), (100, 100)],
+    ]
+)
+def ternary_broadcast_input(request) -> tuple[np.ndarray, np.ndarray, np.ndarray]:
+    """Inputs to be used for the ternary broadcast test."""
+
+    min_val = testutil.make_array(request.param[0]) / 2.0
+    value = testutil.make_array(request.param[1])
+    max_val = testutil.make_array(request.param[2]) / 2.0 + 0.5
+    return (min_val, value, max_val)
+
+
 def _perform_alt_test(testee: Callable, *args: Any) -> Any:
     """General function that just performs the test.
 
@@ -289,16 +314,25 @@ def testee(a: np.ndarray) -> np.ndarray:
     _perform_alt_test(testee, a)
 
 
-def test_mapped_broadcast(broadcast_input: tuple[np.ndarray, np.ndarray]) -> None:
+def test_mapped_broadcast_binary(binary_broadcast_input: tuple[np.ndarray, np.ndarray]) -> None:
     def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:
         return a + b
 
-    a = broadcast_input[0]
-    b = broadcast_input[1]
+    a = binary_broadcast_input[0]
+    b = binary_broadcast_input[1]
     _perform_alt_test(testee, a, b)
     _perform_alt_test(testee, b, a)
 
 
+def test_mapped_broadcast_ternary(
+    ternary_broadcast_input: tuple[np.ndarray, np.ndarray, np.ndarray],
+) -> None:
+    def testee(min_val: np.ndarray, value: np.ndarray, max_val: np.ndarray) -> np.ndarray:
+        return jax.numpy.clip(value, min_val, max_val)  # type: ignore[return-value]  # JAX returns JAX Arrays.
+
+    _perform_alt_test(testee, *ternary_broadcast_input)
+
+
 # <------------ Tests for arithmetic and logical translators/operations
 
 
From 25f52a9fbccec407d96ef0a9cc3e8c9e525023ff Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 10:58:43 +0200
Subject: [PATCH 413/458] Added a function that is able to incorporate a
 context into an other context as nested SDFG.

---
 src/jace/translator/post_translation.py | 92 +++++++++++++++++++++++++
 1 file changed, 92 insertions(+)

diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index 8242060..dcc851a 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -19,6 +19,8 @@
 
 
 if TYPE_CHECKING:
+    from dace.sdfg import nodes as dace_nodes
+
     from jace import translator
 
 
@@ -247,3 +249,93 @@ def finalize_translation_context(
     if validate:
         tsdfg.validate()
     return tsdfg
+
+
+def add_nested_sdfg(
+    state: dace.SDFGState,
+    child_ctx: translator.TranslationContext,
+    parent_ctx: translator.TranslationContext,
+    in_var_names: Sequence[str],
+    out_var_names: Sequence[str],
+) -> dace_nodes.NestedSDFG:
+    """
+    Adds the SDFG in `child_ctx` as nested SDFG at state `state` in `parent_ctx`.
+
+    The function is a convenience wrapper that operates directly on translation
+    contexts instead of SDFGs. The function will also create the necessary Memlet
+    connections.
+
+    Args:
+        state: The state at which the nested SDFG should be inserted.
+            Must be part of `parent_ctx`.
+        child_ctx: The translation context representing the SDFG that should be added.
+        parent_ctx: The parent SDFG to which `child_ctx` should be added as nested
+            SDFG in state `state`.
+        in_var_names: Names of the variables in `parent_ctx` that are used as inputs for
+            the nested SDFG, must have the same order as `child_ctx.input_names`.
+        out_var_names: Names of the variables in `parent_ctx` that are used as outputs
+            for the nested SDFG, must have the same order as `child_ctx.out_names`.
+
+    Returns:
+        The nested SDFG object.
+
+    Note:
+        The function will not add `child_ctx` directly as nested SDFG. Instead it
+        will first pass it to `finalize_translation_context()` and operates on the
+        return values. This means that `child_ctx` will be modified in place, and
+        a copy will be added to `parent_ctx`.
+        It is highly recommended that `state` is empty.
+    """
+    if child_ctx.sdfg.free_symbols:
+        raise NotImplementedError("Symbol Mapping is not implemented.")
+    assert not (child_ctx.input_names is None or child_ctx.out_names is None)  # Silence mypy
+    assert len(child_ctx.input_names) == len(in_var_names)
+    assert len(child_ctx.out_names) == len(out_var_names)
+    assert state in parent_ctx.sdfg.nodes()
+    assert not set(in_var_names).intersection(out_var_names)
+
+    if any(input_name.startswith("__jace_mutable_") for input_name in in_var_names):
+        raise NotImplementedError(
+            "'__jace_mutable_' variables are not yet handled in 'add_nested_sdfg()'."
+        )
+    if len(set(in_var_names)) != len(in_var_names):
+        raise ValueError(
+            f"An input can only be passed once, but { {in_var_name for in_var_name in in_var_names if in_var_names.count(in_var_name) > 1} } were passed multiple times."
+        )
+    if len(set(out_var_names)) != len(out_var_names):
+        raise NotImplementedError(
+            f"Tried to write multiple times to variables: { {out_var_name for out_var_name in out_var_names if out_var_names.count(out_var_name) > 1} }."
+        )
+
+    final_child_ctx = finalize_translation_context(child_ctx)
+    nested_sdfg: dace_nodes.NestedSDFG = state.add_nested_sdfg(
+        sdfg=final_child_ctx.sdfg,
+        parent=parent_ctx.sdfg,
+        # Bug in DaCe must be a set.
+        inputs=set(final_child_ctx.input_names),
+        outputs=set(final_child_ctx.out_names),
+    )
+
+    # Now create the connections for the input.
+    for outer_name, inner_name in zip(in_var_names, final_child_ctx.input_names):
+        outer_array = parent_ctx.sdfg.arrays[outer_name]
+        state.add_edge(
+            state.add_read(outer_name),
+            None,
+            nested_sdfg,
+            inner_name,
+            dace.Memlet.from_array(outer_name, outer_array),
+        )
+
+    # Now we create the output connections.
+    for outer_name, inner_name in zip(out_var_names, final_child_ctx.out_names):
+        outer_array = parent_ctx.sdfg.arrays[outer_name]
+        state.add_edge(
+            nested_sdfg,
+            inner_name,
+            state.add_write(outer_name),
+            None,
+            dace.Memlet.from_array(outer_name, outer_array),
+        )
+
+    return nested_sdfg

From ed8f6531e7a6eefc90d7ddb1868491bc7532c26f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 11:28:14 +0200
Subject: [PATCH 414/458] Fixed the concatenate translator.

---
 src/jace/translator/primitive_translators/__init__.py     | 2 +-
 .../{concatenate.py => concatenate_translator.py}         | 8 +++++---
 2 files changed, 6 insertions(+), 4 deletions(-)
 rename src/jace/translator/primitive_translators/{concatenate.py => concatenate_translator.py} (93%)

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index cf3e866..79704cb 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -13,7 +13,7 @@
     LogicalOperationTranslator,
 )
 from .broadcast_in_dim_translator import BroadcastInDimTranslator
-from .concatenate import ConcatenateTranslator
+from .concatenate_translator import ConcatenateTranslator
 from .convert_element_type_translator import ConvertElementTypeTranslator
 from .copy_translator import CopyTranslator, DevicePutTranslator
 from .iota_translator import IotaTranslator
diff --git a/src/jace/translator/primitive_translators/concatenate.py b/src/jace/translator/primitive_translators/concatenate_translator.py
similarity index 93%
rename from src/jace/translator/primitive_translators/concatenate.py
rename to src/jace/translator/primitive_translators/concatenate_translator.py
index 916d507..e8bd144 100644
--- a/src/jace/translator/primitive_translators/concatenate.py
+++ b/src/jace/translator/primitive_translators/concatenate_translator.py
@@ -12,6 +12,7 @@
 from typing import TYPE_CHECKING
 
 import dace
+from typing_extensions import override
 
 from jace import translator, util
 
@@ -22,7 +23,7 @@
     from jax import core as jax_core
 
 
-class ConcatenateTranslator:
+class ConcatenateTranslator(translator.PrimitiveTranslator):
     """
     Implements the `concatenate` primitive.
 
@@ -34,9 +35,10 @@ class ConcatenateTranslator:
     def primitive(self) -> str:  # noqa: D102  # No docstring needed.
         return "concatenate"
 
-    def __call__(  # noqa: D102  # No docstring
+    @override
+    def __call__(
         self,
-        builder: translator.JaxprTranslationBuilder,  # noqa: ARG002  # Unused.
+        builder: translator.JaxprTranslationBuilder,
         in_var_names: Sequence[str | None],
         out_var_names: Sequence[str],
         eqn: jax_core.JaxprEqn,

From f4104b865bb7cbe1448fdd299247f0a25627d659 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 11:34:23 +0200
Subject: [PATCH 415/458] Added a translator for the `pjit` primitive.

---
 .../primitive_translators/__init__.py         |  2 +
 .../primitive_translators/pjit_translator.py  | 93 +++++++++++++++++++
 2 files changed, 95 insertions(+)
 create mode 100644 src/jace/translator/primitive_translators/pjit_translator.py

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 79704cb..429fb6f 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -17,6 +17,7 @@
 from .convert_element_type_translator import ConvertElementTypeTranslator
 from .copy_translator import CopyTranslator, DevicePutTranslator
 from .iota_translator import IotaTranslator
+from .pjit_translator import PJITTranslator
 from .reshape_translator import ReshapeTranslator
 from .select_n_translator import SelectNTranslator
 from .slicing import SlicingTranslator
@@ -32,6 +33,7 @@
     "DevicePutTranslator",
     "IotaTranslator",
     "LogicalOperationTranslator",
+    "PJITTranslator",
     "ReshapeTranslator",
     "SelectNTranslator",
     "SlicingTranslator",
diff --git a/src/jace/translator/primitive_translators/pjit_translator.py b/src/jace/translator/primitive_translators/pjit_translator.py
new file mode 100644
index 0000000..eeb26aa
--- /dev/null
+++ b/src/jace/translator/primitive_translators/pjit_translator.py
@@ -0,0 +1,93 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements the `pjit` translator, i.e. nested Jaxpr expressions."""
+
+from __future__ import annotations
+
+import re
+from collections.abc import Sequence
+from typing import TYPE_CHECKING, Any
+
+from jax._src import sharding_impls as jax_sharding  # noqa: PLC2701 [import-private-name]
+
+from jace import translator
+from jace.translator import post_translation as ptranslation
+
+
+if TYPE_CHECKING:
+    import dace
+    from jax._src import core as jax_core
+
+
+@translator.register_primitive_translator()
+@translator.make_primitive_translator("pjit")
+def PJITTranslator(  # noqa: N802 [invalid-function-name]
+    builder: translator.JaxprTranslationBuilder,
+    in_var_names: Sequence[str | None],
+    out_var_names: Sequence[str],
+    eqn: jax_core.JaxprEqn,
+    eqn_state: dace.SDFGState,
+) -> None:
+    """
+    Implements the `pjit` translator that handles nested Jaxpr.
+
+    `pjit` primitives in JAX represents nested calls, for example the body of a scan
+    is inside a nested Jaxpr. However, `pjit` is used to indicate that a computation
+    should be done on the device or on sharded memory.
+
+    However, due to the current state and working of JaCe, this aspect is essentially
+    ignored and the computation is always inlined.
+
+    Args:
+        builder: The builder object of the translation.
+        in_var_names: Names of the SDFG variables that should be used as inputs
+            inside the parent SDFG.
+        out_var_names: Names of SDFG variables that should be used as outputs
+            inside the parent SDFG.
+        eqn: The equation that contains the `pjit` primitive.
+        eqn_state: State into which the nested SDFG should be constructed.
+    """
+    params: dict[str, Any] = eqn.params
+    nested_jaxpr: jax_core.ClosedJaxpr = params["jaxpr"]
+    in_shardings = params["in_shardings"]
+    out_shardings = params["out_shardings"]
+    _ = params["donated_invars"]  # Always ignored
+    _ = params["keep_unused"]
+    _ = params["inline"]
+
+    # TODO(phimuell): Controlflow region and name
+    pjit_name = params["name"]
+
+    if not all(in_sharding is jax_sharding.UNSPECIFIED for in_sharding in in_shardings):
+        raise NotImplementedError("Currently 'pjit' does not support sharding in its input.")
+    if not all(out_sharding is jax_sharding.UNSPECIFIED for out_sharding in out_shardings):
+        raise NotImplementedError("Currently 'pjit' does not support sharding in its output.")
+    if any(in_var_name is None for in_var_name in in_var_names):
+        raise NotImplementedError("Literal inputs to 'pjit' are not implemented.")
+
+    # TODO(phimuell): Controlflow region and name
+    #  They will introduce a feature like that to address them in optimizations.
+    pjit_name = params["name"]
+
+    # Name in SDFG must be unique, thus we mangle it, furthermore, we have to clean it.
+    sdfg_name = f"pjit_{re.subn('[^a-zA-Z0-9_]', '_', pjit_name)[0]}__{'_'.join(out_var_names)}"
+
+    # Now get the translated SDFG.
+    nested_context: translator.TranslationContext = builder.translate_jaxpr(
+        jaxpr=nested_jaxpr,
+        name=sdfg_name,
+    )
+
+    # Now lets add the nested SDFG
+    ptranslation.add_nested_sdfg(
+        state=eqn_state,
+        child_ctx=nested_context,
+        parent_ctx=builder._ctx,
+        in_var_names=in_var_names,  # type: ignore[arg-type]  # Is checked above.
+        out_var_names=out_var_names,
+    )

From 95853a3f13677814f1d4d262533b1a63c69dbcda Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 13:09:50 +0200
Subject: [PATCH 416/458] Added a constructor to `JaCeVar` to construct it from
 an JAX Atom.

---
 src/jace/util/jax_helper.py | 21 +++++++++++++++++++++
 1 file changed, 21 insertions(+)

diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index bc2de21..7c9f2f0 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -81,6 +81,27 @@ def __eq__(self, other: Any) -> bool:
             return NotImplemented
         return id(self) == id(other)
 
+    @classmethod
+    def from_atom(
+        cls,
+        jax_var: jax_core.Atom,
+        name: str | None,
+    ) -> JaCeVar:
+        """
+        Generates a `JaCeVar` from the JAX variable `jax_var`.
+
+        If `jax_var` is a literal its value is ignored.
+
+        Args:
+            jax_var: The variable to process.
+            name: The optional name of the variable.
+        """
+        return cls(
+            shape=get_jax_var_shape(jax_var),
+            dtype=get_jax_var_dtype(jax_var),
+            name=name,
+        )
+
 
 def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
     """Returns the name of `jax_var` as a string."""

From 67e546c28043c5dc423850b5bbeb752b9e53106f Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 13:12:23 +0200
Subject: [PATCH 417/458] Added the functionality to the `pjit` translator to
 handle literal inputs.

They are translated to a constant and then feeded in.
I did not use a Tasklet, because this could block inline.
However, this also blocks literal substitution.
---
 .../primitive_translators/pjit_translator.py  | 34 +++++++++++++++----
 1 file changed, 28 insertions(+), 6 deletions(-)

diff --git a/src/jace/translator/primitive_translators/pjit_translator.py b/src/jace/translator/primitive_translators/pjit_translator.py
index eeb26aa..291cddf 100644
--- a/src/jace/translator/primitive_translators/pjit_translator.py
+++ b/src/jace/translator/primitive_translators/pjit_translator.py
@@ -15,7 +15,7 @@
 
 from jax._src import sharding_impls as jax_sharding  # noqa: PLC2701 [import-private-name]
 
-from jace import translator
+from jace import translator, util
 from jace.translator import post_translation as ptranslation
 
 
@@ -43,6 +43,8 @@ def PJITTranslator(  # noqa: N802 [invalid-function-name]
     However, due to the current state and working of JaCe, this aspect is essentially
     ignored and the computation is always inlined.
 
+    In case an input is a literal the translator will create a constant for it.
+
     Args:
         builder: The builder object of the translation.
         in_var_names: Names of the SDFG variables that should be used as inputs
@@ -60,15 +62,13 @@ def PJITTranslator(  # noqa: N802 [invalid-function-name]
     _ = params["keep_unused"]
     _ = params["inline"]
 
-    # TODO(phimuell): Controlflow region and name
-    pjit_name = params["name"]
-
     if not all(in_sharding is jax_sharding.UNSPECIFIED for in_sharding in in_shardings):
         raise NotImplementedError("Currently 'pjit' does not support sharding in its input.")
     if not all(out_sharding is jax_sharding.UNSPECIFIED for out_sharding in out_shardings):
         raise NotImplementedError("Currently 'pjit' does not support sharding in its output.")
-    if any(in_var_name is None for in_var_name in in_var_names):
-        raise NotImplementedError("Literal inputs to 'pjit' are not implemented.")
+
+    # TODO(phimuell): Controlflow region and name
+    pjit_name = params["name"]
 
     # TODO(phimuell): Controlflow region and name
     #  They will introduce a feature like that to address them in optimizations.
@@ -77,6 +77,28 @@ def PJITTranslator(  # noqa: N802 [invalid-function-name]
     # Name in SDFG must be unique, thus we mangle it, furthermore, we have to clean it.
     sdfg_name = f"pjit_{re.subn('[^a-zA-Z0-9_]', '_', pjit_name)[0]}__{'_'.join(out_var_names)}"
 
+    # If needed turn literal inputs into constants.
+    # TODO(phimuell): Is using constants really a good idea?
+    if any(in_var_name is None for in_var_name in in_var_names):
+        final_input_names: list[str] = []
+        for i, in_var_name in enumerate(in_var_names):
+            if in_var_name is None:
+                new_input_name = f"__const_{sdfg_name}_literal_input_{i}"
+                jax_input: jax_core.Atom = eqn.invars[i]
+                new_input_var = util.JaCeVar.from_atom(
+                    jax_var=jax_input,
+                    name=new_input_name,
+                )
+                builder.add_array(new_input_var)
+                builder.sdfg.add_constant(
+                    new_input_name,
+                    util.get_jax_literal_value(jax_input),
+                    builder.arrays[new_input_name],
+                )
+                in_var_name = new_input_name  # noqa: PLW2901 [redefined-loop-name]
+            final_input_names.append(in_var_name)
+        in_var_names = final_input_names
+
     # Now get the translated SDFG.
     nested_context: translator.TranslationContext = builder.translate_jaxpr(
         jaxpr=nested_jaxpr,

From 0ec665b2e65ec9b3243cd5040b91b2443ab3cdcd Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 13:21:14 +0200
Subject: [PATCH 418/458] The Jaxpr that is translated is now aviable in the
 lowered object.

This is mostly for debugging.
---
 src/jace/stages.py | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index b51fac0..32e1af8 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -42,6 +42,7 @@
 
 if TYPE_CHECKING:
     import dace
+    from jax import core as jax_core
 
 __all__ = [
     "CompilerOptions",  # export for compatibility with JAX.
@@ -128,7 +129,8 @@ def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> _ReturnType:
         Note:
             This function is also aware if a JAX tracing is going on. In this
             case, it will forward the computation.
-            Currently, this function ignores the value of `jax.disable_jit()`.
+            Currently, this function ignores the value of `jax.disable_jit()`,
+            however, tracing will consider this value.
         """
         if util.is_tracing_ongoing(*args, **kwargs):
             return self._fun(*args, **kwargs)
@@ -175,7 +177,7 @@ def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered[_ReturnType]
         )
 
         # NOTE: `tsdfg` is deepcopied as a side effect of post processing.
-        return JaCeLowered(tsdfg, out_tree)
+        return JaCeLowered(tsdfg, out_tree, trans_ctx.jaxpr)
 
     @property
     def wrapped_fun(self) -> Callable:
@@ -217,6 +219,7 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"], Generic[_ReturnType]):
     Args:
         tsdfg: The lowered SDFG with metadata.
         out_tree: The pytree describing how to unflatten the output.
+        jaxpr: The Jaxpr expression that was translated.
 
     Note:
         `self` will manage the passed `tsdfg` object. Modifying it results is undefined
@@ -226,15 +229,18 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"], Generic[_ReturnType]):
 
     _translated_sdfg: tjsdfg.TranslatedJaxprSDFG
     _out_tree: jax_tree.PyTreeDef
+    _jaxpr: jax_core.ClosedJaxpr
 
     def __init__(
         self,
         tsdfg: tjsdfg.TranslatedJaxprSDFG,
         out_tree: jax_tree.PyTreeDef,
+        jaxpr: jax_core.ClosedJaxpr,
     ) -> None:
         super().__init__()
         self._translated_sdfg = tsdfg
         self._out_tree = out_tree
+        self._jaxpr = jaxpr
 
     @tcache.cached_transition
     def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled[_ReturnType]:

From 5bc6220cbbe035eee2ab93ba501f4de9ff68f4c9 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 14:00:49 +0200
Subject: [PATCH 419/458] Added tests for the `pjit` primitives.

---
 tests/conftest.py                             | 24 ++++---
 ...primitive_arithmetic_logical_operations.py |  2 +-
 .../test_primitive_pjit.py                    | 68 +++++++++++++++++++
 .../test_primitive_select_n.py                |  7 +-
 .../test_primitive_translator_managing.py     |  6 ++
 tests/unit_tests/test_jax_api.py              |  1 -
 tests/util.py                                 |  2 +-
 7 files changed, 91 insertions(+), 19 deletions(-)
 create mode 100644 tests/integration_tests/primitive_translators/test_primitive_pjit.py

diff --git a/tests/conftest.py b/tests/conftest.py
index 607e7e6..cf23878 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -41,21 +41,22 @@ def _enable_x64_mode_in_jax() -> Generator[None, None, None]:
 
 @pytest.fixture(autouse=True)
 def _disable_jit() -> Generator[None, None, None]:
-    """Fixture for disable the dynamic jiting in JAX.
+    """Fixture for disable the dynamic jiting in JAX, used by default.
 
-    For certain reasons JAX puts certain primitives inside a `pjit` primitive,
-    i.e. nested Jaxpr. The intent is, that these operations can/should run on
-    an accelerator.
+    Using this fixture has two effects.
+    - JAX will not cache the results, i.e. every call to a jitted function will
+        result in a tracing operation.
+    - JAX will not use implicit jit operations, i.e. nested Jaxpr expressions
+        using `pjit` are avoided.
 
-    But this is a problem, since JaCe can not handle this primitive, it leads
-    to an error. To overcome this problem, we will globally disable this feature
-    until we can handle `pjit`.
-
-    Note this essentially disable the `jax.jit` decorator, however, the `jace.jit`
+    This essentially disable the `jax.jit` decorator, however, the `jace.jit`
     decorator is still working.
 
-    Todo:
-        Remove as soon as we can handle nested `jit`.
+    Note:
+        The second point, i.e. preventing JAX from running certain things in `pjit`,
+        is the main reason why this fixture is used by default, without it
+        literal substitution is useless and essentially untestable.
+        In certain situation it can be disabled.
     """
     with jax.disable_jit(disable=True):
         yield
@@ -66,6 +67,7 @@ def _enable_jit() -> Generator[None, None, None]:
     """Fixture to enable jit compilation.
 
     Essentially it undoes the effects of the `_disable_jit()` fixture.
+    It is important that this fixture is not automatically activated.
     """
     with jax.disable_jit(disable=False):
         yield
diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index 14d8cb1..a833786 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -58,7 +58,7 @@ def _only_alt_translators() -> Generator[None, None, None]:
     allowed_translators = (
         _LOGICAL_OPERATION_TEMPLATES.keys()
         | _ARITMETIC_OPERATION_TEMPLATES.keys()
-        | {"convert_element_type"}
+        | {"convert_element_type", "pjit"}
     )
     testutil.set_active_primitive_translators_to({
         p: t for p, t in primitive_translators.items() if p in allowed_translators
diff --git a/tests/integration_tests/primitive_translators/test_primitive_pjit.py b/tests/integration_tests/primitive_translators/test_primitive_pjit.py
new file mode 100644
index 0000000..512185b
--- /dev/null
+++ b/tests/integration_tests/primitive_translators/test_primitive_pjit.py
@@ -0,0 +1,68 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Tests for the `pjit` primitive."""
+
+from __future__ import annotations
+
+from collections.abc import Generator
+
+import jax
+import numpy as np
+import pytest
+from jax import numpy as jnp
+
+import jace
+
+from tests import util as testutil
+
+
+@pytest.fixture(autouse=True)
+def _disable_jit() -> Generator[None, None, None]:
+    """Overwrites the global `_disable_jit` fixture and enables jit operations."""
+    with jax.disable_jit(disable=False):
+        yield
+
+
+def test_pjit_simple() -> None:
+    """Simple nested Jaxpr expression."""
+
+    def testee(a: np.ndarray) -> np.ndarray:
+        return jax.jit(lambda a: jnp.sin(a))(a)  # noqa: PLW0108 [unnecessary-lambda]  # Lambda needed to trigger a `pjit` level.
+
+    a = testutil.make_array((10, 10))
+
+    jace_wrapped = jace.jit(testee)
+    jace_lowered = jace_wrapped.lower(a)
+    res = jace_wrapped(a)
+    ref = testee(a)
+
+    assert jace_lowered._jaxpr.eqns[0].primitive.name == "pjit"
+    assert np.allclose(res, ref)
+    assert res.dtype == ref.dtype
+    assert res.shape == ref.shape
+
+
+@pytest.mark.parametrize("shape", [(10, 10), ()])
+def test_pjit_literal(shape) -> None:
+    """Test for `pjit` with literal inputs."""
+
+    def testee(pred: np.ndarray, fbranch: np.ndarray) -> jax.Array:
+        return jnp.where(pred, 2, fbranch)
+
+    pred = testutil.make_array(shape, np.bool_)
+    fbranch = pred * 0
+
+    jace_wrapped = jace.jit(testee)
+    jace_lowered = jace_wrapped.lower(pred, fbranch)
+    res = jace_wrapped(pred, fbranch)
+    ref = testee(pred, fbranch)
+
+    assert np.all(ref == res)
+    assert jace_lowered._jaxpr.eqns[0].primitive.name == "pjit"
+    assert any(isinstance(invar, jax.core.Literal) for invar in jace_lowered._jaxpr.eqns[0].invars)
+    assert res.dtype == ref.dtype
diff --git a/tests/integration_tests/primitive_translators/test_primitive_select_n.py b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
index 0981c97..a87088f 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_select_n.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
@@ -9,7 +9,8 @@
 
 from __future__ import annotations
 
-from typing import TYPE_CHECKING, Any
+from collections.abc import Callable
+from typing import Any
 
 import jax
 import numpy as np
@@ -20,10 +21,6 @@
 from tests import util as testutil
 
 
-if TYPE_CHECKING:
-    from collections.abc import Callable
-
-
 def _perform_test(testee: Callable, *args: Any) -> None:
     res = testee(*args)
     ref = jace.jit(testee)(*args)
diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index 7cab00b..1655d40 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -72,6 +72,12 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
     raise NotImplementedError("'fake_add_translator()' was called.")
 
 
+def test_has_pjit():
+    print(f"ADDRESS: {translator.get_registered_primitive_translators()['pjit']}")
+    print(f"FUN ADDRESS: {translator.primitive_translators.pjit_translator.PJITTranslator}")
+    assert "pjit" in translator.get_registered_primitive_translators()
+
+
 @pytest.mark.usefixtures("no_builtin_translators")
 def test_subtranslatior_managing() -> None:
     """Basic functionality of the subtranslators."""
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index f73c535..23f7503 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -213,7 +213,6 @@ def testee(a: np.ndarray, b: np.float64) -> np.ndarray:
     )
 
 
-@pytest.mark.usefixtures("_enable_jit")
 def test_tracing_detection() -> None:
     """Tests our ability to detect if tracing is going on."""
     expected_tracing_state = False
diff --git a/tests/util.py b/tests/util.py
index 45af5aa..3b61d26 100644
--- a/tests/util.py
+++ b/tests/util.py
@@ -40,7 +40,7 @@ def make_array(
     """
 
     if shape == ():
-        return make_array((1,), dtype)[0]
+        return dtype(make_array((1,), dtype)[0])
     if isinstance(shape, int):
         shape = (shape,)
 

From 5385a5c484993343bc345d5b1a9e95482bdbde0d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 14:13:21 +0200
Subject: [PATCH 420/458] Cleared a bit the tests.

---
 tests/conftest.py                             |  8 ++------
 .../primitive_translators/conftest.py         |  6 +-----
 ...primitive_arithmetic_logical_operations.py | 13 +++++--------
 .../test_primitive_concatenate.py             |  2 +-
 .../test_primitive_reshape.py                 |  6 +-----
 .../test_primitive_squeeze_expand_dims.py     |  8 ++------
 tests/integration_tests/test_empty_jaxpr.py   |  2 +-
 .../test_jaxpr_translator_builder.py          |  4 ++--
 .../test_primitive_translator_managing.py     | 17 +++++++----------
 tests/unit_tests/test_misc.py                 |  2 +-
 tests/util.py                                 | 19 +++++++++----------
 11 files changed, 32 insertions(+), 55 deletions(-)

diff --git a/tests/conftest.py b/tests/conftest.py
index cf23878..94cd805 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -13,7 +13,7 @@
 
 from __future__ import annotations
 
-from typing import TYPE_CHECKING
+from collections.abc import Generator
 
 import jax
 import numpy as np
@@ -23,10 +23,6 @@
 from jace.util import translation_cache as tcache
 
 
-if TYPE_CHECKING:
-    from collections.abc import Generator
-
-
 @pytest.fixture(autouse=True)
 def _enable_x64_mode_in_jax() -> Generator[None, None, None]:
     """Fixture of enable the `x64` mode in JAX.
@@ -91,7 +87,7 @@ def _reset_random_seed() -> None:
     This ensures that for every test the random seed of NumPy is reset.
     This seed is used by the `util.mkarray()` helper.
     """
-    np.random.seed(42)  # noqa: NPY002  # We use this seed for the time being.
+    np.random.seed(42)  # noqa: NPY002 [numpy-legacy-random]
 
 
 @pytest.fixture(autouse=True)
diff --git a/tests/integration_tests/primitive_translators/conftest.py b/tests/integration_tests/primitive_translators/conftest.py
index 1c4008b..677d9ed 100644
--- a/tests/integration_tests/primitive_translators/conftest.py
+++ b/tests/integration_tests/primitive_translators/conftest.py
@@ -9,17 +9,13 @@
 
 from __future__ import annotations
 
-from typing import TYPE_CHECKING
+from collections.abc import Generator
 
 import pytest
 
 from jace import optimization, stages
 
 
-if TYPE_CHECKING:
-    from collections.abc import Generator
-
-
 @pytest.fixture(
     autouse=True,
     params=[
diff --git a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
index a833786..7573de5 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_arithmetic_logical_operations.py
@@ -23,7 +23,8 @@ class such as
 
 from __future__ import annotations
 
-from typing import TYPE_CHECKING, Any
+from collections.abc import Callable, Generator
+from typing import Any
 
 import dace
 import jax
@@ -36,10 +37,6 @@ class such as
 from tests import util as testutil
 
 
-if TYPE_CHECKING:
-    from collections.abc import Callable, Generator
-
-
 @pytest.fixture(autouse=True)
 def _only_alt_translators() -> Generator[None, None, None]:
     """Removes all non arithmetic/logical translator from the registry.
@@ -48,9 +45,9 @@ def _only_alt_translators() -> Generator[None, None, None]:
     test class, such as broadcasting. It makes writing tests a bit harder, but it is
     worth. For some reasons also type conversion s allowed.
     """
-    from jace.translator.primitive_translators.arithmetic_logical_translators import (  # noqa: PLC0415  # Direct import.
-        _ARITMETIC_OPERATION_TEMPLATES,  # noqa: PLC2701  # Import of private variables.
-        _LOGICAL_OPERATION_TEMPLATES,  # noqa: PLC2701
+    from jace.translator.primitive_translators.arithmetic_logical_translators import (  # noqa: PLC0415  [import-outside-top-level]
+        _ARITMETIC_OPERATION_TEMPLATES,  # noqa: PLC2701 [import-private-name]
+        _LOGICAL_OPERATION_TEMPLATES,  # noqa: PLC2701 [import-private-name]
     )
 
     # Remove all non ALU translators from the registry
diff --git a/tests/integration_tests/primitive_translators/test_primitive_concatenate.py b/tests/integration_tests/primitive_translators/test_primitive_concatenate.py
index 12fe735..e09160d 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_concatenate.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_concatenate.py
@@ -50,7 +50,7 @@ def test_cat_nd() -> None:
             input_arrays.append(testutil.make_array(shape))
 
         def testee(inputs: list[np.ndarray]) -> np.ndarray | jax.Array:
-            return jax.lax.concatenate(inputs, cat_dim)  # noqa: B023  # Iteration variable capture.
+            return jax.lax.concatenate(inputs, cat_dim)  # noqa: B023 [function-uses-loop-variable]
 
         ref = testee(input_arrays)
         res = jace.jit(testee)(input_arrays)
diff --git a/tests/integration_tests/primitive_translators/test_primitive_reshape.py b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
index 9d3948f..bd1d6ab 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_reshape.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
@@ -9,7 +9,7 @@
 
 from __future__ import annotations
 
-from typing import TYPE_CHECKING
+from collections.abc import Sequence
 
 import jax
 import numpy as np
@@ -21,10 +21,6 @@
 from tests import util as testutil
 
 
-if TYPE_CHECKING:
-    from collections.abc import Sequence
-
-
 def _test_impl_reshaping(
     src_shape: Sequence[int], dst_shape: Sequence[int], order: str = "C"
 ) -> None:
diff --git a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
index 672458b..c823cf6 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_squeeze_expand_dims.py
@@ -14,7 +14,7 @@
 
 from __future__ import annotations
 
-from typing import TYPE_CHECKING
+from collections.abc import Sequence
 
 import jax
 import numpy as np
@@ -26,10 +26,6 @@
 from tests import util as testutil
 
 
-if TYPE_CHECKING:
-    from collections.abc import Sequence
-
-
 def _roundtrip_implementation(shape: Sequence[int], axis: int | Sequence[int]) -> None:
     """Implementation of the test for `expand_dims()` and `squeeze()`.
 
@@ -45,7 +41,7 @@ def _roundtrip_implementation(shape: Sequence[int], axis: int | Sequence[int]) -
     for ops in [jnp.expand_dims, jnp.squeeze]:
         with jax.experimental.enable_x64():
             ref = ops(a, axis)  # type: ignore[operator]  # Function of unknown type.
-            res = jace.jit(lambda a: ops(a, axis))(a)  # type: ignore[operator]  # noqa: B023
+            res = jace.jit(lambda a: ops(a, axis))(a)  # type: ignore[operator]  # noqa: B023 [function-uses-loop-variable]
 
         assert ref.shape == res.shape, f"a.shape = {shape}; Expected: {ref.shape}; Got: {res.shape}"
         assert ref.dtype == res.dtype
diff --git a/tests/integration_tests/test_empty_jaxpr.py b/tests/integration_tests/test_empty_jaxpr.py
index 68d7716..29ba9a4 100644
--- a/tests/integration_tests/test_empty_jaxpr.py
+++ b/tests/integration_tests/test_empty_jaxpr.py
@@ -50,7 +50,7 @@ def test_empty_unused_argument() -> None:
     """Empty body and an unused input argument."""
 
     @jace.jit
-    def wrapped(a: np.ndarray, b: np.float64) -> np.ndarray:  # noqa: ARG001  # Explicitly unused.
+    def wrapped(a: np.ndarray, b: np.float64) -> np.ndarray:  # noqa: ARG001 [unused-function-argument]
         return a
 
     a = np.arange(12, dtype=np.float64).reshape((4, 3))
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index b1a85c5..e71a189 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -604,7 +604,7 @@ def testee(a: np.ndarray) -> tuple[np.ndarray, np.float64, np.ndarray]:
 def test_builder_unused_arg() -> None:
     """Tests if there is an unused argument."""
 
-    def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:  # noqa: ARG001  # Explicitly unused.
+    def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:  # noqa: ARG001 [unused-function-argument]
         return a + 3.0
 
     a = testutil.make_array((10, 10))
@@ -634,7 +634,7 @@ def test_builder_jace_var() -> None:
             _ = JaCeVar((), dace.int8, name=iname)
 
 
-def test_builder_FORTRAN_strides() -> None:  # noqa: N802  # Function name
+def test_builder_FORTRAN_strides() -> None:  # noqa: N802 [invalid-function-name]
     """Tests if we can lower without a standard stride.
 
     Notes:
diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index 1655d40..a52ab01 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -10,7 +10,8 @@
 from __future__ import annotations
 
 import re
-from typing import TYPE_CHECKING, Any
+from collections.abc import Generator, Mapping
+from typing import Any
 
 import numpy as np
 import pytest
@@ -21,10 +22,6 @@
 from tests import util as testutil
 
 
-if TYPE_CHECKING:
-    from collections.abc import Generator, Mapping
-
-
 @pytest.fixture(autouse=True)
 def _conserve_builtin_translators() -> Generator[None, None, None]:
     """Restores the set of registered subtranslators after a test."""
@@ -34,7 +31,7 @@ def _conserve_builtin_translators() -> Generator[None, None, None]:
 
 
 @pytest.fixture()
-def no_builtin_translators() -> Generator[None, None, None]:  # noqa: PT004  # This is how you should do it: https://docs.pytest.org/en/7.1.x/how-to/fixtures.html#use-fixtures-in-classes-and-modules-with-usefixtures
+def no_builtin_translators() -> Generator[None, None, None]:  # noqa: PT004 [pytest-missing-fixture-name-underscore] # This is how you should do it: https://docs.pytest.org/en/7.1.x/how-to/fixtures.html#use-fixtures-in-classes-and-modules-with-usefixtures
     """This fixture can be used if the test does not want any builtin translators."""
     initial_translators = testutil.set_active_primitive_translators_to({})
     yield
@@ -63,12 +60,12 @@ def __call__(self) -> None:  # type: ignore[override]  # Arguments
 
 
 @translator.make_primitive_translator("non_existing_callable_primitive3")
-def primitive_translator_3_callable(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
+def primitive_translator_3_callable(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001 [unused-function-argument]
     raise NotImplementedError
 
 
 @translator.make_primitive_translator("add")
-def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
+def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001 [unused-function-argument]
     raise NotImplementedError("'fake_add_translator()' was called.")
 
 
@@ -131,7 +128,7 @@ def test_subtranslatior_managing_callable_annotation() -> None:
     prim_name = "non_existing_property"
 
     @translator.make_primitive_translator(prim_name)
-    def non_existing_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
+    def non_existing_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001 [unused-function-argument]
         raise NotImplementedError
 
     assert hasattr(non_existing_translator, "primitive")
@@ -170,7 +167,7 @@ def test_subtranslatior_managing_overwriting_2() -> None:
 
     @translator.register_primitive_translator(overwrite=True)
     @translator.make_primitive_translator("add")
-    def still_useless_but_a_bit_less(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
+    def still_useless_but_a_bit_less(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001 [unused-function-argument]
         trans_cnt[0] += 1
 
     @jace.jit
diff --git a/tests/unit_tests/test_misc.py b/tests/unit_tests/test_misc.py
index fa235f8..263df3e 100644
--- a/tests/unit_tests/test_misc.py
+++ b/tests/unit_tests/test_misc.py
@@ -38,5 +38,5 @@ def testee(a: np.ndarray) -> np.ndarray:
     callee = testee.lower(a1).compile()
 
     # But calling with the second type
-    with pytest.raises(Exception):  # noqa: B017, PT011 # Unknown exception.
+    with pytest.raises(Exception):  # noqa: B017, PT011 [assert-raises-exception, pytest-raises-too-broad]  # Unknown exception.
         _ = callee(a2)
diff --git a/tests/util.py b/tests/util.py
index 3b61d26..aa89d2b 100644
--- a/tests/util.py
+++ b/tests/util.py
@@ -9,22 +9,21 @@
 
 from __future__ import annotations
 
-from typing import TYPE_CHECKING
+from collections.abc import Mapping, Sequence
+from typing import Literal
 
 import numpy as np
 
 from jace import translator
 
 
-if TYPE_CHECKING:
-    from collections.abc import Mapping, Sequence
-
-
 __all__ = ["make_array"]
 
 
 def make_array(
-    shape: Sequence[int] | int, dtype: type = np.float64, order: str = "C"
+    shape: Sequence[int] | int,
+    dtype: type = np.float64,
+    order: Literal[None, "K", "A", "C", "F"] = "C",
 ) -> np.ndarray:
     """Generates a NumPy ndarray with shape `shape`.
 
@@ -45,17 +44,17 @@ def make_array(
         shape = (shape,)
 
     if dtype == np.bool_:
-        res = np.random.random(shape) > 0.5  # noqa: NPY002
+        res = np.random.random(shape) > 0.5  # noqa: NPY002 [numpy-legacy-random]
     elif np.issubdtype(dtype, np.integer):
         iinfo: np.iinfo = np.iinfo(dtype)
-        res = np.random.randint(  # noqa: NPY002
+        res = np.random.randint(  # noqa: NPY002 [numpy-legacy-random]
             low=iinfo.min, high=iinfo.max, size=shape, dtype=dtype
         )
     elif np.issubdtype(dtype, np.complexfloating):
         res = make_array(shape, np.float64) + 1.0j * make_array(shape, np.float64)
     else:
-        res = np.random.random(shape)  # type: ignore[assignment]  # noqa: NPY002
-    return np.array(res, order=order, dtype=dtype)  # type: ignore[call-overload]
+        res = np.random.random(shape)  # type: ignore[assignment]  # noqa: NPY002 [numpy-legacy-random]
+    return np.array(res, order=order, dtype=dtype)
 
 
 def set_active_primitive_translators_to(

From 1296b9dcba029c60fbb6420397ecef41616e966d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 15:33:51 +0200
Subject: [PATCH 421/458] The function to promote literals to constant is now a
 free function, however it is only aviable at a strange location.

---
 .../primitive_translators/pjit_translator.py  | 76 +++++++++++++------
 1 file changed, 54 insertions(+), 22 deletions(-)

diff --git a/src/jace/translator/primitive_translators/pjit_translator.py b/src/jace/translator/primitive_translators/pjit_translator.py
index 291cddf..59bfd7e 100644
--- a/src/jace/translator/primitive_translators/pjit_translator.py
+++ b/src/jace/translator/primitive_translators/pjit_translator.py
@@ -24,6 +24,52 @@
     from jax._src import core as jax_core
 
 
+def _promote_literals_to_constants(
+    builder: translator.JaxprTranslationBuilder,
+    var_names: Sequence[str | None],
+    jax_vars: Sequence[jax_core.Atom],
+    name_pattern: str,
+) -> list[str]:
+    """
+    Promotes all literals in `var_names` to DaCe constants and add them to the SDFG.
+
+    The function assumes that `var_names` are the SDFG variables equivalents of
+    `jax_vars`, as by convention `None` indicates a literal. The function will create
+    a constant for each literal and return `var_names` cleared of all literals.
+    For naming the variables the function will use `name_pattern`.
+
+    Args:
+        builder: The builder that is used for translation.
+        var_names: Names of the SDFG variables, `None` indicates a literal.
+        jax_vars: The JAX variables, in the same order than `var_names`.
+        name_pattern: A pattern to generate a unique name for the variables.
+
+    Todo:
+        Is a constant the right idea or should we generate a symbol?
+    """
+    promoted_var_names: list[str] = []
+    for i, var_name in enumerate(var_names):
+        if var_name is None:
+            promoted_var_name = f"__const_{name_pattern}_literal_promotion_{i}"
+            jax_var = jax_vars[i]
+            promoted_jace_var = util.JaCeVar.from_atom(
+                jax_var=jax_var,
+                name=promoted_var_name,
+            )
+            builder.add_array(promoted_jace_var)
+            builder.sdfg.add_constant(
+                promoted_var_name,
+                util.get_jax_literal_value(jax_var),
+                builder.arrays[promoted_var_name],
+            )
+
+        else:
+            # Already an SDFG variable, so nothing to do.
+            promoted_var_name = var_name
+        promoted_var_names.append(promoted_var_name)
+    return promoted_var_names
+
+
 @translator.register_primitive_translator()
 @translator.make_primitive_translator("pjit")
 def PJITTranslator(  # noqa: N802 [invalid-function-name]
@@ -77,27 +123,13 @@ def PJITTranslator(  # noqa: N802 [invalid-function-name]
     # Name in SDFG must be unique, thus we mangle it, furthermore, we have to clean it.
     sdfg_name = f"pjit_{re.subn('[^a-zA-Z0-9_]', '_', pjit_name)[0]}__{'_'.join(out_var_names)}"
 
-    # If needed turn literal inputs into constants.
-    # TODO(phimuell): Is using constants really a good idea?
-    if any(in_var_name is None for in_var_name in in_var_names):
-        final_input_names: list[str] = []
-        for i, in_var_name in enumerate(in_var_names):
-            if in_var_name is None:
-                new_input_name = f"__const_{sdfg_name}_literal_input_{i}"
-                jax_input: jax_core.Atom = eqn.invars[i]
-                new_input_var = util.JaCeVar.from_atom(
-                    jax_var=jax_input,
-                    name=new_input_name,
-                )
-                builder.add_array(new_input_var)
-                builder.sdfg.add_constant(
-                    new_input_name,
-                    util.get_jax_literal_value(jax_input),
-                    builder.arrays[new_input_name],
-                )
-                in_var_name = new_input_name  # noqa: PLW2901 [redefined-loop-name]
-            final_input_names.append(in_var_name)
-        in_var_names = final_input_names
+    # Ensure that all inputs are SDFG variables
+    final_input_names = _promote_literals_to_constants(
+        builder=builder,
+        var_names=in_var_names,
+        jax_vars=eqn.invars,
+        name_pattern=sdfg_name,
+    )
 
     # Now get the translated SDFG.
     nested_context: translator.TranslationContext = builder.translate_jaxpr(
@@ -110,6 +142,6 @@ def PJITTranslator(  # noqa: N802 [invalid-function-name]
         state=eqn_state,
         child_ctx=nested_context,
         parent_ctx=builder._ctx,
-        in_var_names=in_var_names,  # type: ignore[arg-type]  # Is checked above.
+        in_var_names=final_input_names,
         out_var_names=out_var_names,
     )

From 7615be3c203a10d5dc76bf30176ebed8a8366122 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 24 Jun 2024 15:35:09 +0200
Subject: [PATCH 422/458] Why was that thing there?

---
 src/jace/translator/primitive_translators/slicing.py | 2 --
 1 file changed, 2 deletions(-)

diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index 1741fef..ae4f167 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -193,8 +193,6 @@ def __call__(
             )
             map_entry.add_in_connector(window_start_index_name)
 
-        builder.sdfg.view()
-
 
 translator.register_primitive_translator(SlicingTranslator())
 translator.register_primitive_translator(DynamicSlicingTranslator())

From 70710c13f6b59964a9d261fa3ec3c2171ffa831a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 25 Jun 2024 09:56:49 +0200
Subject: [PATCH 423/458] First implementation of the conditional primitive.

Only the integer version is used, but it seems JAX only uses that.
The boolean version is provided but only to generate an error to notice if JAX now implements it.
---
 .../primitive_translators/conditions.py       | 182 ++++++++++++++++++
 1 file changed, 182 insertions(+)
 create mode 100644 src/jace/translator/primitive_translators/conditions.py

diff --git a/src/jace/translator/primitive_translators/conditions.py b/src/jace/translator/primitive_translators/conditions.py
new file mode 100644
index 0000000..d291016
--- /dev/null
+++ b/src/jace/translator/primitive_translators/conditions.py
@@ -0,0 +1,182 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements all conditions that are supported in JAX."""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+from typing import TYPE_CHECKING
+
+import dace
+
+from jace import translator, util
+from jace.translator import post_translation as ptranslation
+from jace.translator.primitive_translators import pjit_translator as pjit
+
+
+if TYPE_CHECKING:
+    from jax._src import core as jax_core
+
+
+@translator.register_primitive_translator()
+@translator.make_primitive_translator("cond")
+def condition_translator(
+    builder: translator.JaxprTranslationBuilder,
+    in_var_names: Sequence[str | None],
+    out_var_names: Sequence[str],
+    eqn: jax_core.JaxprEqn,
+    eqn_state: dace.SDFGState,
+) -> dace.SDFGState:
+    """
+    Implements the translation of the `cond` primitive, i.e. a scalar if.
+
+    XLA, JAX' backend, supports two versions, one in which the selector, i.e. the
+    variable indicating which branch should be executed is an integer or a boolean.
+
+    Args:
+        builder: The builder object of the translation.
+        in_var_names: The SDFG variables used an input arguments. First is the index,
+            the variable that selects the branch, the remaining ones are passed as
+            inputs to the branches.
+        out_var_names: Names of SDFG variables that should be used as outputs.
+        eqn: The equation that should be translated.
+        eqn_state: State into which the nested SDFG should be constructed.
+
+    Returns:
+        Because of the nature of this primitive, the translator has to construct
+        new states and will return the new SDFG state that serves as terminal state.
+
+    Note:
+        The implementation assumes that the selector, i.e. the variables indicating
+        which branch should be taken is inside its bound.
+    """
+    if util.get_jax_var_dtype(eqn.invars[0]) is dace.bool_:
+        return _cond_primitive_boolean_impl(
+            builder=builder,
+            in_var_names=in_var_names,
+            out_var_names=out_var_names,
+            eqn=eqn,
+            eqn_state=eqn_state,
+        )
+    return _cond_primitive_multi_switch_impl(
+        builder=builder,
+        in_var_names=in_var_names,
+        out_var_names=out_var_names,
+        eqn=eqn,
+        eqn_state=eqn_state,
+    )
+
+
+def _cond_primitive_multi_switch_impl(
+    builder: translator.JaxprTranslationBuilder,
+    in_var_names: Sequence[str | None],
+    out_var_names: Sequence[str],
+    eqn: jax_core.JaxprEqn,
+    eqn_state: dace.SDFGState,
+) -> dace.SDFGState:
+    """
+    Implements the integer version of the conditional primitive.
+
+    For arguments see `ConditionTranslator`.
+
+    This [version](https://openxla.org/xla/operation_semantics#conditional) is
+    essentially a C switch statement without a default branch.
+    """
+    # To make names in the SDFG unique we use the name of the equation state
+    name_pattern = eqn_state.name
+
+    # Promote all inputs to the branches to variables, this are all except the first
+    #  which is the selection variable.
+    branch_input_variable_names: list[str] = pjit._promote_literals_to_constants(
+        builder=builder,
+        var_names=in_var_names[1:],
+        jax_vars=eqn.invars[1:],
+        name_pattern=name_pattern,
+    )
+
+    if in_var_names[0] is None:
+        # The selection variable is a literal, so we will now pretend it is a symbol.
+        #  This also means that we do not need a state transition to promote the
+        #  variable to a symbol.
+        selection_symbol = str(util.get_jax_literal_value(eqn.invars[0]))
+        selection_state = eqn_state
+
+    else:
+        # The selection variable is an input.
+        #  For the implementation of the condition we need to promote the selection
+        #  variable to a symbol, for which we need an interstate edge.
+        #  As a side effect it will update the terminal state.
+        selection_variable_name = in_var_names[0]
+        selection_symbol = f"{selection_variable_name}_symb"
+
+        selection_state = builder.append_new_state(
+            label=f"{name_pattern}_fork",
+            assignments={selection_symbol: selection_variable_name},
+            prev_state=eqn_state,
+        )
+
+    # Now iterate through all branches, translate them and integrate them
+    #  for each branch we will generate a dedicated state.
+    branch_states: list[dace.SDFGState] = []
+    for i, branch_jaxpr in enumerate(eqn.params["branches"]):
+        branch_pattern = f"{name_pattern}_{{}}_branch_{i}"
+        branch_ctx = builder.translate_jaxpr(jaxpr=branch_jaxpr, name=branch_pattern.format("sdfg"))
+
+        # This will update the terminal state only the first time.
+        branch_state = builder.append_new_state(
+            label=branch_pattern.format("state"),
+            condition=f"{selection_symbol} == {i}",
+            prev_state=selection_state,
+        )
+
+        # Integrating it.
+        ptranslation.add_nested_sdfg(
+            state=branch_state,
+            child_ctx=branch_ctx,
+            parent_ctx=builder._ctx,
+            in_var_names=branch_input_variable_names,
+            out_var_names=out_var_names,
+        )
+        branch_states.append(branch_state)
+
+    # Now we have to generate a join state that will serve as new terminal state.
+    #  We append it to the first branch state, which is the current terminal state.
+    assert builder._terminal_sdfg_state is branch_states[0]
+    terminal_state = builder.append_new_state(
+        label=f"{name_pattern}_join",
+        prev_state=branch_states[0],
+    )
+    for branch_state in branch_states[1:]:
+        builder.sdfg.add_edge(
+            branch_state,
+            terminal_state,
+            dace.sdfg.InterstateEdge(),
+        )
+
+    # We return it, because otherwise the builder will assume that `eqn_state` was used.
+    return terminal_state
+
+
+def _cond_primitive_boolean_impl(
+    builder: translator.JaxprTranslationBuilder,  # noqa: ARG001 [unused-function-argument]
+    in_var_names: Sequence[str | None],  # noqa: ARG001 [unused-function-argument]
+    out_var_names: Sequence[str],  # noqa: ARG001 [unused-function-argument]
+    eqn: jax_core.JaxprEqn,  # noqa: ARG001 [unused-function-argument]
+    eqn_state: dace.SDFGState,  # noqa: ARG001 [unused-function-argument]
+) -> dace.SDFGState:
+    """
+    Implements the case the selector of the primitive is a bool.
+
+    XLA explicitly provides this
+    [form of the primitive](https://openxla.org/xla/operation_semantics#conditional)
+    JAX however, does not seem to use it and instead forwards it to the integer
+    implementation.
+    JaCe will not implement it and instead generate an error.
+    """
+    # NOTE: This is mostly to notice if JAX decided to implement that branch.
+    raise NotImplementedError("The boolean conditional primitive is not implemented.")

From 44a8a80dc0f874ef3ce26b729370bfd7791e4443 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 25 Jun 2024 13:47:05 +0200
Subject: [PATCH 424/458] Addressed Enruiques Suggestions.

---
 CODING_GUIDELINES.md              | 14 +++++++++++++-
 src/jace/api.py                   | 17 +++++++---------
 src/jace/optimization.py          |  3 ++-
 src/jace/stages.py                | 21 ++++++++++----------
 src/jace/tracing.py               |  6 +++---
 src/jace/translated_jaxpr_sdfg.py | 32 ++++++++++++++-----------------
 src/jace/util/traits.py           |  4 ++--
 7 files changed, 52 insertions(+), 45 deletions(-)

diff --git a/CODING_GUIDELINES.md b/CODING_GUIDELINES.md
index 3e7fabb..72cff79 100644
--- a/CODING_GUIDELINES.md
+++ b/CODING_GUIDELINES.md
@@ -29,6 +29,18 @@ We deviate from the [Google Python Style Guide][google-style-guide] only in the
 
 - According to subsection [_3.19.12 Imports For Typing_](https://google.github.io/styleguide/pyguide.html#31912-imports-for-typing), symbols from `typing` and `collections.abc` modules used in type annotations _"can be imported directly to keep common annotations concise and match standard typing practices"_. Following the same spirit, we allow symbols to be imported directly from third-party or internal modules when they only contain a collection of frequently used typying definitions.
 
+### Aliasing of Modules
+
+According to subsection [2.2](https://google.github.io/styleguide/pyguide.html#22-imports) in certain cases it is allowed to introduce an alias for an import.
+Inside JaCe the following convention is applied:
+
+- If the module has a standard abbreviation use that, e.g. `import numpy as np`.
+- For a JaCe module use:
+  - If the module name is only a single word use it directly, e.g. `from jace import translator`
+  - If the module name consists of multiple words use the last word prefixed with the first letters of the others, e.g. `from jace.translator import post_translator as ptranslator` or `from jace import translated_jaxpr_sdfg as tjsdfg`.
+  - In case of a clash use your best judgment.
+- For an external module use the rule above, but prefix the name with the main package's name, e.g. `from dace.codegen import compiled_sdfg as dace_csdfg`.
+
 ### Python usage recommendations
 
 - `pass` vs `...` (`Ellipsis`)
@@ -104,7 +116,7 @@ We generate the API documentation automatically from the docstrings using [Sphin
 Sphinx supports the [reStructuredText][sphinx-rest] (reST) markup language for defining additional formatting options in the generated documentation, however section [_3.8 Comments and Docstrings_](https://google.github.io/styleguide/pyguide.html#38-comments-and-docstrings) of the Google Python Style Guide does not specify how to use markups in docstrings. As a result, we decided to forbid reST markup in docstrings, except for the following cases:
 
 - Cross-referencing other objects using Sphinx text roles for the [Python domain](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#the-python-domain) (as explained [here](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#python-roles)).
-- Very basic formatting markup to improve _readability_ of the generated documentation without obscuring the source docstring (e.g. ``` ``literal`` ``` strings, bulleted lists).
+- Very basic formatting markup to improve _readability_ of the generated documentation without obscuring the source docstring (e.g. `"literal"` strings, bulleted lists).
 
 We highly encourage the [doctest] format for code examples in docstrings. In fact, doctest runs code examples and makes sure they are in sync with the codebase.
 
diff --git a/src/jace/api.py b/src/jace/api.py
index 05bfa1e..6def2f4 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -23,7 +23,7 @@
 
 # Used for type annotation, see the notes in `jace.stages` for more.
 _P = ParamSpec("_P")
-_ReturnType = TypeVar("_ReturnType")
+_R = TypeVar("_R")
 
 
 class JITOptions(TypedDict, total=False):
@@ -43,27 +43,24 @@ def jit(
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Unpack[JITOptions],
-) -> Callable[[Callable[_P, _ReturnType]], stages.JaCeWrapped[_P, _ReturnType]]: ...
+) -> Callable[[Callable[_P, _R]], stages.JaCeWrapped[_P, _R]]: ...
 
 
 @overload
 def jit(
-    fun: Callable[_P, _ReturnType],
+    fun: Callable[_P, _R],
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Unpack[JITOptions],
-) -> stages.JaCeWrapped[_P, _ReturnType]: ...
+) -> stages.JaCeWrapped[_P, _R]: ...
 
 
 def jit(
-    fun: Callable[_P, _ReturnType] | None = None,
+    fun: Callable[_P, _R] | None = None,
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Unpack[JITOptions],
-) -> (
-    Callable[[Callable[_P, _ReturnType]], stages.JaCeWrapped[_P, _ReturnType]]
-    | stages.JaCeWrapped[_P, _ReturnType]
-):
+) -> Callable[[Callable[_P, _R]], stages.JaCeWrapped[_P, _R]] | stages.JaCeWrapped[_P, _R]:
     """
     JaCe's replacement for `jax.jit` (just-in-time) wrapper.
 
@@ -87,7 +84,7 @@ def jit(
             f"The following arguments to 'jace.jit' are not yet supported: {', '.join(kwargs)}."
         )
 
-    def wrapper(f: Callable[_P, _ReturnType]) -> stages.JaCeWrapped[_P, _ReturnType]:
+    def wrapper(f: Callable[_P, _R]) -> stages.JaCeWrapped[_P, _R]:
         jace_wrapper = stages.JaCeWrapped(
             fun=f,
             primitive_translators=(
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index 65e97b4..5dc159b 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -68,7 +68,8 @@ def jace_optimize(tsdfg: tjsdfg.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOp
             in the SDFG to `AllocationLifetime.Persistent`, i.e. keep them allocated
             between different invocations.
     """
-    # Currently this function exists primarily for the same of existing.
+    # TODO(phimuell): Implement the functionality.
+    # Currently this function exists primarily for the sake of existing.
 
     simplify = kwargs.get("simplify", False)
     auto_optimize = kwargs.get("auto_optimize", False)
diff --git a/src/jace/stages.py b/src/jace/stages.py
index b51fac0..1b1fa16 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -67,10 +67,10 @@
 #  changing that, but from a semantic point they behave the same so it should not
 #  matter too much.
 _P = ParamSpec("_P")
-_ReturnType = TypeVar("_ReturnType")
+_R = TypeVar("_R")
 
 
-class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P, _ReturnType]):
+class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P, _R]):
     """
     A function ready to be specialized, lowered, and compiled.
 
@@ -100,16 +100,17 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P, _ReturnType]):
         which is implicitly and temporary activated during tracing.
     """
 
-    _fun: Callable[_P, _ReturnType]
+    _fun: Callable[_P, _R]
     _primitive_translators: dict[str, translator.PrimitiveTranslator]
     _jit_options: api.JITOptions
 
     def __init__(
         self,
-        fun: Callable[_P, _ReturnType],
+        fun: Callable[_P, _R],
         primitive_translators: Mapping[str, translator.PrimitiveTranslator],
         jit_options: api.JITOptions,
     ) -> None:
+        # TODO(phimuell): Test if this restriction is needed.
         assert all(
             param.default is param.empty for param in inspect.signature(fun).parameters.values()
         )
@@ -118,7 +119,7 @@ def __init__(
         self._jit_options = {**jit_options}
         self._fun = fun
 
-    def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> _ReturnType:
+    def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> _R:
         """
         Executes the wrapped function, lowering and compiling as needed in one step.
 
@@ -139,7 +140,7 @@ def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> _ReturnType:
         return compiled(*args, **kwargs)
 
     @tcache.cached_transition
-    def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered[_ReturnType]:
+    def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered[_R]:
         """
         Lower the wrapped computation for the given arguments.
 
@@ -202,7 +203,7 @@ def _make_call_description(
         )
 
 
-class JaCeLowered(tcache.CachingStage["JaCeCompiled"], Generic[_ReturnType]):
+class JaCeLowered(tcache.CachingStage["JaCeCompiled"], Generic[_R]):
     """
     Represents the original computation as an SDFG.
 
@@ -237,7 +238,7 @@ def __init__(
         self._out_tree = out_tree
 
     @tcache.cached_transition
-    def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled[_ReturnType]:
+    def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled[_R]:
         """
         Optimize and compile the lowered SDFG using `compiler_options`.
 
@@ -296,7 +297,7 @@ def _make_call_description(
         )
 
 
-class JaCeCompiled(Generic[_ReturnType]):
+class JaCeCompiled(Generic[_R]):
     """
     Compiled version of the SDFG.
 
@@ -331,7 +332,7 @@ def __init__(
         self._compiled_sdfg = compiled_sdfg
         self._out_tree = out_tree
 
-    def __call__(self, *args: Any, **kwargs: Any) -> _ReturnType:
+    def __call__(self, *args: Any, **kwargs: Any) -> _R:
         """
         Calls the embedded computation.
 
diff --git a/src/jace/tracing.py b/src/jace/tracing.py
index c28101d..2e51251 100644
--- a/src/jace/tracing.py
+++ b/src/jace/tracing.py
@@ -27,12 +27,12 @@
     from jace import api
 
 _P = ParamSpec("_P")
-_ReturnType = TypeVar("_ReturnType")
+_R = TypeVar("_R")
 
 
 @overload
 def make_jaxpr(
-    fun: Callable[_P, _ReturnType],
+    fun: Callable[_P, _R],
     trace_options: api.JITOptions,
     return_out_tree: Literal[True],
 ) -> Callable[_P, tuple[jax_core.ClosedJaxpr, jax_tree.PyTreeDef]]: ...
@@ -40,7 +40,7 @@ def make_jaxpr(
 
 @overload
 def make_jaxpr(
-    fun: Callable[_P, _ReturnType],
+    fun: Callable[_P, _R],
     trace_options: api.JITOptions,
     return_out_tree: Literal[False] = False,
 ) -> Callable[_P, jax_core.ClosedJaxpr]: ...
diff --git a/src/jace/translated_jaxpr_sdfg.py b/src/jace/translated_jaxpr_sdfg.py
index 04eae37..78c7c8b 100644
--- a/src/jace/translated_jaxpr_sdfg.py
+++ b/src/jace/translated_jaxpr_sdfg.py
@@ -23,8 +23,7 @@
 
 if TYPE_CHECKING:
     import numpy as np
-    from dace.codegen import compiled_sdfg
-    from dace.codegen.compiled_sdfg import CompiledSDFG
+    from dace.codegen import compiled_sdfg as dace_csdfg
 
 
 @dataclasses.dataclass(frozen=True, kw_only=True)
@@ -100,12 +99,12 @@ class CompiledJaxprSDFG:
     `compile_jaxpr_sdfg()`.
 
     Args:
-        compiled_sdfg: The `CompiledSDFG` object.
+        dace_csdfg: The `CompiledSDFG` object.
         input_names: Names of the SDFG variables used as inputs.
         out_names: Names of the SDFG variables used as outputs.
 
     Attributes:
-        compiled_sdfg: The `CompiledSDFG` object.
+        dace_csdfg: The `CompiledSDFG` object.
         sdfg: The encapsulated SDFG object.
         input_names: Names of the SDFG variables used as inputs.
         out_names: Names of the SDFG variables used as outputs.
@@ -119,13 +118,13 @@ class CompiledJaxprSDFG:
         arrays of length one.
     """
 
-    compiled_sdfg: compiled_sdfg.CompiledSDFG
+    csdfg: dace_csdfg.CompiledSDFG
     input_names: tuple[str, ...]
     out_names: tuple[str, ...]
 
     @property
     def sdfg(self) -> dace.SDFG:  # noqa: D102 [undocumented-public-method]
-        return self.compiled_sdfg.sdfg
+        return self.csdfg.sdfg
 
     def __call__(
         self,
@@ -138,7 +137,7 @@ def __call__(
         the output.
 
         Args:
-            compiled_sdfg: The compiled SDFG to call.
+            dace_csdfg: The compiled SDFG to call.
             flat_call_args: Flattened input arguments.
         """
         if len(self.input_names) != len(flat_call_args):
@@ -164,25 +163,24 @@ def __call__(
             else:
                 sdfg_call_args[out_name] = dace_data.make_array_from_descriptor(sdfg_array)
 
-        assert len(sdfg_call_args) == len(self.compiled_sdfg.argnames), (
+        assert len(sdfg_call_args) == len(self.csdfg.argnames), (
             "Failed to construct the call arguments,"
-            f" expected {len(self.compiled_sdfg.argnames)} but got {len(flat_call_args)}."
-            f"\nExpected: {self.compiled_sdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
+            f" expected {len(self.csdfg.argnames)} but got {len(flat_call_args)}."
+            f"\nExpected: {self.csdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
         )
 
         # Calling the SDFG
         with dace.config.temporary_config():
             dace.Config.set("compiler", "allow_view_arguments", value=True)
-            self.compiled_sdfg(**sdfg_call_args)
+            self.csdfg(**sdfg_call_args)
 
         return [sdfg_call_args[out_name] for out_name in self.out_names]
 
 
-def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> CompiledJaxprSDFG:
+def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> dace_csdfg.CompiledJaxprSDFG:
     """Compile `tsdfg` and return a `CompiledJaxprSDFG` object with the result."""
     if any(  # We do not support the DaCe return mechanism
-        array_name.startswith("__return")
-        for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118 [in-dict-keys]  # We can not use `in` because we are not interested in `my_mangled_variable__return_zulu`!
+        array_name.startswith("__return") for array_name in tsdfg.sdfg.arrays
     ):
         raise ValueError("Only support SDFGs without '__return' members.")
     if tsdfg.sdfg.free_symbols:  # This is a simplification that makes our life simple.
@@ -211,13 +209,11 @@ def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> CompiledJaxprSDFG:
             dace.Config.set("default_build_folder", value=pathlib.Path(".jacecache").resolve())
             sdfg._recompile = True
             sdfg._regenerate_code = True
-            compiled_sdfg: CompiledSDFG = sdfg.compile()
+            csdfg: dace_csdfg.CompiledSDFG = sdfg.compile()
 
     finally:
         sdfg.name = original_sdfg_name
         sdfg._recompile = original_recompile
         sdfg._regenerate_code = original_regenerate_code
 
-    return CompiledJaxprSDFG(
-        compiled_sdfg=compiled_sdfg, input_names=tsdfg.input_names, out_names=tsdfg.out_names
-    )
+    return CompiledJaxprSDFG(csdfg=csdfg, input_names=tsdfg.input_names, out_names=tsdfg.out_names)
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index d7efb30..af2b290 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -80,8 +80,8 @@ def get_strides_for_dace(obj: Any) -> tuple[int, ...] | None:
     Get the strides of `obj` in a DaCe compatible format.
 
     The function returns the strides in number of elements, as it is used inside
-    DaCe and not in bytes as it is inside NumPy. As in NumPy and DaCe the function
-    returns `None` to indicate standard C order.
+    DaCe and not in bytes as it is inside NumPy. As in DaCe `None` is returned to
+    indicate standard C order.
 
     Note:
         If `obj` is not array like an error is generated.

From c8a6aa8a4724111119ff9a790bd9fe08583c2b90 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 25 Jun 2024 13:51:04 +0200
Subject: [PATCH 425/458] Squashed commit of the following:

commit 44a8a80dc0f874ef3ce26b729370bfd7791e4443
Author: Philip Mueller <philip.mueller@cscs.ch>
Date:   Tue Jun 25 13:47:05 2024 +0200

    Addressed Enruiques Suggestions.
---
 CODING_GUIDELINES.md              | 14 +++++++++++++-
 src/jace/api.py                   | 17 +++++++---------
 src/jace/optimization.py          |  3 ++-
 src/jace/stages.py                | 21 ++++++++++----------
 src/jace/tracing.py               |  6 +++---
 src/jace/translated_jaxpr_sdfg.py | 32 ++++++++++++++-----------------
 src/jace/util/traits.py           |  4 ++--
 7 files changed, 52 insertions(+), 45 deletions(-)

diff --git a/CODING_GUIDELINES.md b/CODING_GUIDELINES.md
index 3e7fabb..72cff79 100644
--- a/CODING_GUIDELINES.md
+++ b/CODING_GUIDELINES.md
@@ -29,6 +29,18 @@ We deviate from the [Google Python Style Guide][google-style-guide] only in the
 
 - According to subsection [_3.19.12 Imports For Typing_](https://google.github.io/styleguide/pyguide.html#31912-imports-for-typing), symbols from `typing` and `collections.abc` modules used in type annotations _"can be imported directly to keep common annotations concise and match standard typing practices"_. Following the same spirit, we allow symbols to be imported directly from third-party or internal modules when they only contain a collection of frequently used typying definitions.
 
+### Aliasing of Modules
+
+According to subsection [2.2](https://google.github.io/styleguide/pyguide.html#22-imports) in certain cases it is allowed to introduce an alias for an import.
+Inside JaCe the following convention is applied:
+
+- If the module has a standard abbreviation use that, e.g. `import numpy as np`.
+- For a JaCe module use:
+  - If the module name is only a single word use it directly, e.g. `from jace import translator`
+  - If the module name consists of multiple words use the last word prefixed with the first letters of the others, e.g. `from jace.translator import post_translator as ptranslator` or `from jace import translated_jaxpr_sdfg as tjsdfg`.
+  - In case of a clash use your best judgment.
+- For an external module use the rule above, but prefix the name with the main package's name, e.g. `from dace.codegen import compiled_sdfg as dace_csdfg`.
+
 ### Python usage recommendations
 
 - `pass` vs `...` (`Ellipsis`)
@@ -104,7 +116,7 @@ We generate the API documentation automatically from the docstrings using [Sphin
 Sphinx supports the [reStructuredText][sphinx-rest] (reST) markup language for defining additional formatting options in the generated documentation, however section [_3.8 Comments and Docstrings_](https://google.github.io/styleguide/pyguide.html#38-comments-and-docstrings) of the Google Python Style Guide does not specify how to use markups in docstrings. As a result, we decided to forbid reST markup in docstrings, except for the following cases:
 
 - Cross-referencing other objects using Sphinx text roles for the [Python domain](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#the-python-domain) (as explained [here](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#python-roles)).
-- Very basic formatting markup to improve _readability_ of the generated documentation without obscuring the source docstring (e.g. ``` ``literal`` ``` strings, bulleted lists).
+- Very basic formatting markup to improve _readability_ of the generated documentation without obscuring the source docstring (e.g. `"literal"` strings, bulleted lists).
 
 We highly encourage the [doctest] format for code examples in docstrings. In fact, doctest runs code examples and makes sure they are in sync with the codebase.
 
diff --git a/src/jace/api.py b/src/jace/api.py
index 05bfa1e..6def2f4 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -23,7 +23,7 @@
 
 # Used for type annotation, see the notes in `jace.stages` for more.
 _P = ParamSpec("_P")
-_ReturnType = TypeVar("_ReturnType")
+_R = TypeVar("_R")
 
 
 class JITOptions(TypedDict, total=False):
@@ -43,27 +43,24 @@ def jit(
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Unpack[JITOptions],
-) -> Callable[[Callable[_P, _ReturnType]], stages.JaCeWrapped[_P, _ReturnType]]: ...
+) -> Callable[[Callable[_P, _R]], stages.JaCeWrapped[_P, _R]]: ...
 
 
 @overload
 def jit(
-    fun: Callable[_P, _ReturnType],
+    fun: Callable[_P, _R],
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Unpack[JITOptions],
-) -> stages.JaCeWrapped[_P, _ReturnType]: ...
+) -> stages.JaCeWrapped[_P, _R]: ...
 
 
 def jit(
-    fun: Callable[_P, _ReturnType] | None = None,
+    fun: Callable[_P, _R] | None = None,
     /,
     primitive_translators: Mapping[str, translator.PrimitiveTranslator] | None = None,
     **kwargs: Unpack[JITOptions],
-) -> (
-    Callable[[Callable[_P, _ReturnType]], stages.JaCeWrapped[_P, _ReturnType]]
-    | stages.JaCeWrapped[_P, _ReturnType]
-):
+) -> Callable[[Callable[_P, _R]], stages.JaCeWrapped[_P, _R]] | stages.JaCeWrapped[_P, _R]:
     """
     JaCe's replacement for `jax.jit` (just-in-time) wrapper.
 
@@ -87,7 +84,7 @@ def jit(
             f"The following arguments to 'jace.jit' are not yet supported: {', '.join(kwargs)}."
         )
 
-    def wrapper(f: Callable[_P, _ReturnType]) -> stages.JaCeWrapped[_P, _ReturnType]:
+    def wrapper(f: Callable[_P, _R]) -> stages.JaCeWrapped[_P, _R]:
         jace_wrapper = stages.JaCeWrapped(
             fun=f,
             primitive_translators=(
diff --git a/src/jace/optimization.py b/src/jace/optimization.py
index 65e97b4..5dc159b 100644
--- a/src/jace/optimization.py
+++ b/src/jace/optimization.py
@@ -68,7 +68,8 @@ def jace_optimize(tsdfg: tjsdfg.TranslatedJaxprSDFG, **kwargs: Unpack[CompilerOp
             in the SDFG to `AllocationLifetime.Persistent`, i.e. keep them allocated
             between different invocations.
     """
-    # Currently this function exists primarily for the same of existing.
+    # TODO(phimuell): Implement the functionality.
+    # Currently this function exists primarily for the sake of existing.
 
     simplify = kwargs.get("simplify", False)
     auto_optimize = kwargs.get("auto_optimize", False)
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 32e1af8..e642212 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -68,10 +68,10 @@
 #  changing that, but from a semantic point they behave the same so it should not
 #  matter too much.
 _P = ParamSpec("_P")
-_ReturnType = TypeVar("_ReturnType")
+_R = TypeVar("_R")
 
 
-class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P, _ReturnType]):
+class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P, _R]):
     """
     A function ready to be specialized, lowered, and compiled.
 
@@ -101,16 +101,17 @@ class JaCeWrapped(tcache.CachingStage["JaCeLowered"], Generic[_P, _ReturnType]):
         which is implicitly and temporary activated during tracing.
     """
 
-    _fun: Callable[_P, _ReturnType]
+    _fun: Callable[_P, _R]
     _primitive_translators: dict[str, translator.PrimitiveTranslator]
     _jit_options: api.JITOptions
 
     def __init__(
         self,
-        fun: Callable[_P, _ReturnType],
+        fun: Callable[_P, _R],
         primitive_translators: Mapping[str, translator.PrimitiveTranslator],
         jit_options: api.JITOptions,
     ) -> None:
+        # TODO(phimuell): Test if this restriction is needed.
         assert all(
             param.default is param.empty for param in inspect.signature(fun).parameters.values()
         )
@@ -119,7 +120,7 @@ def __init__(
         self._jit_options = {**jit_options}
         self._fun = fun
 
-    def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> _ReturnType:
+    def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> _R:
         """
         Executes the wrapped function, lowering and compiling as needed in one step.
 
@@ -141,7 +142,7 @@ def __call__(self, *args: _P.args, **kwargs: _P.kwargs) -> _ReturnType:
         return compiled(*args, **kwargs)
 
     @tcache.cached_transition
-    def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered[_ReturnType]:
+    def lower(self, *args: _P.args, **kwargs: _P.kwargs) -> JaCeLowered[_R]:
         """
         Lower the wrapped computation for the given arguments.
 
@@ -204,7 +205,7 @@ def _make_call_description(
         )
 
 
-class JaCeLowered(tcache.CachingStage["JaCeCompiled"], Generic[_ReturnType]):
+class JaCeLowered(tcache.CachingStage["JaCeCompiled"], Generic[_R]):
     """
     Represents the original computation as an SDFG.
 
@@ -243,7 +244,7 @@ def __init__(
         self._jaxpr = jaxpr
 
     @tcache.cached_transition
-    def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled[_ReturnType]:
+    def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompiled[_R]:
         """
         Optimize and compile the lowered SDFG using `compiler_options`.
 
@@ -302,7 +303,7 @@ def _make_call_description(
         )
 
 
-class JaCeCompiled(Generic[_ReturnType]):
+class JaCeCompiled(Generic[_R]):
     """
     Compiled version of the SDFG.
 
@@ -337,7 +338,7 @@ def __init__(
         self._compiled_sdfg = compiled_sdfg
         self._out_tree = out_tree
 
-    def __call__(self, *args: Any, **kwargs: Any) -> _ReturnType:
+    def __call__(self, *args: Any, **kwargs: Any) -> _R:
         """
         Calls the embedded computation.
 
diff --git a/src/jace/tracing.py b/src/jace/tracing.py
index c28101d..2e51251 100644
--- a/src/jace/tracing.py
+++ b/src/jace/tracing.py
@@ -27,12 +27,12 @@
     from jace import api
 
 _P = ParamSpec("_P")
-_ReturnType = TypeVar("_ReturnType")
+_R = TypeVar("_R")
 
 
 @overload
 def make_jaxpr(
-    fun: Callable[_P, _ReturnType],
+    fun: Callable[_P, _R],
     trace_options: api.JITOptions,
     return_out_tree: Literal[True],
 ) -> Callable[_P, tuple[jax_core.ClosedJaxpr, jax_tree.PyTreeDef]]: ...
@@ -40,7 +40,7 @@ def make_jaxpr(
 
 @overload
 def make_jaxpr(
-    fun: Callable[_P, _ReturnType],
+    fun: Callable[_P, _R],
     trace_options: api.JITOptions,
     return_out_tree: Literal[False] = False,
 ) -> Callable[_P, jax_core.ClosedJaxpr]: ...
diff --git a/src/jace/translated_jaxpr_sdfg.py b/src/jace/translated_jaxpr_sdfg.py
index 04eae37..78c7c8b 100644
--- a/src/jace/translated_jaxpr_sdfg.py
+++ b/src/jace/translated_jaxpr_sdfg.py
@@ -23,8 +23,7 @@
 
 if TYPE_CHECKING:
     import numpy as np
-    from dace.codegen import compiled_sdfg
-    from dace.codegen.compiled_sdfg import CompiledSDFG
+    from dace.codegen import compiled_sdfg as dace_csdfg
 
 
 @dataclasses.dataclass(frozen=True, kw_only=True)
@@ -100,12 +99,12 @@ class CompiledJaxprSDFG:
     `compile_jaxpr_sdfg()`.
 
     Args:
-        compiled_sdfg: The `CompiledSDFG` object.
+        dace_csdfg: The `CompiledSDFG` object.
         input_names: Names of the SDFG variables used as inputs.
         out_names: Names of the SDFG variables used as outputs.
 
     Attributes:
-        compiled_sdfg: The `CompiledSDFG` object.
+        dace_csdfg: The `CompiledSDFG` object.
         sdfg: The encapsulated SDFG object.
         input_names: Names of the SDFG variables used as inputs.
         out_names: Names of the SDFG variables used as outputs.
@@ -119,13 +118,13 @@ class CompiledJaxprSDFG:
         arrays of length one.
     """
 
-    compiled_sdfg: compiled_sdfg.CompiledSDFG
+    csdfg: dace_csdfg.CompiledSDFG
     input_names: tuple[str, ...]
     out_names: tuple[str, ...]
 
     @property
     def sdfg(self) -> dace.SDFG:  # noqa: D102 [undocumented-public-method]
-        return self.compiled_sdfg.sdfg
+        return self.csdfg.sdfg
 
     def __call__(
         self,
@@ -138,7 +137,7 @@ def __call__(
         the output.
 
         Args:
-            compiled_sdfg: The compiled SDFG to call.
+            dace_csdfg: The compiled SDFG to call.
             flat_call_args: Flattened input arguments.
         """
         if len(self.input_names) != len(flat_call_args):
@@ -164,25 +163,24 @@ def __call__(
             else:
                 sdfg_call_args[out_name] = dace_data.make_array_from_descriptor(sdfg_array)
 
-        assert len(sdfg_call_args) == len(self.compiled_sdfg.argnames), (
+        assert len(sdfg_call_args) == len(self.csdfg.argnames), (
             "Failed to construct the call arguments,"
-            f" expected {len(self.compiled_sdfg.argnames)} but got {len(flat_call_args)}."
-            f"\nExpected: {self.compiled_sdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
+            f" expected {len(self.csdfg.argnames)} but got {len(flat_call_args)}."
+            f"\nExpected: {self.csdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
         )
 
         # Calling the SDFG
         with dace.config.temporary_config():
             dace.Config.set("compiler", "allow_view_arguments", value=True)
-            self.compiled_sdfg(**sdfg_call_args)
+            self.csdfg(**sdfg_call_args)
 
         return [sdfg_call_args[out_name] for out_name in self.out_names]
 
 
-def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> CompiledJaxprSDFG:
+def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> dace_csdfg.CompiledJaxprSDFG:
     """Compile `tsdfg` and return a `CompiledJaxprSDFG` object with the result."""
     if any(  # We do not support the DaCe return mechanism
-        array_name.startswith("__return")
-        for array_name in tsdfg.sdfg.arrays.keys()  # noqa: SIM118 [in-dict-keys]  # We can not use `in` because we are not interested in `my_mangled_variable__return_zulu`!
+        array_name.startswith("__return") for array_name in tsdfg.sdfg.arrays
     ):
         raise ValueError("Only support SDFGs without '__return' members.")
     if tsdfg.sdfg.free_symbols:  # This is a simplification that makes our life simple.
@@ -211,13 +209,11 @@ def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> CompiledJaxprSDFG:
             dace.Config.set("default_build_folder", value=pathlib.Path(".jacecache").resolve())
             sdfg._recompile = True
             sdfg._regenerate_code = True
-            compiled_sdfg: CompiledSDFG = sdfg.compile()
+            csdfg: dace_csdfg.CompiledSDFG = sdfg.compile()
 
     finally:
         sdfg.name = original_sdfg_name
         sdfg._recompile = original_recompile
         sdfg._regenerate_code = original_regenerate_code
 
-    return CompiledJaxprSDFG(
-        compiled_sdfg=compiled_sdfg, input_names=tsdfg.input_names, out_names=tsdfg.out_names
-    )
+    return CompiledJaxprSDFG(csdfg=csdfg, input_names=tsdfg.input_names, out_names=tsdfg.out_names)
diff --git a/src/jace/util/traits.py b/src/jace/util/traits.py
index d7efb30..af2b290 100644
--- a/src/jace/util/traits.py
+++ b/src/jace/util/traits.py
@@ -80,8 +80,8 @@ def get_strides_for_dace(obj: Any) -> tuple[int, ...] | None:
     Get the strides of `obj` in a DaCe compatible format.
 
     The function returns the strides in number of elements, as it is used inside
-    DaCe and not in bytes as it is inside NumPy. As in NumPy and DaCe the function
-    returns `None` to indicate standard C order.
+    DaCe and not in bytes as it is inside NumPy. As in DaCe `None` is returned to
+    indicate standard C order.
 
     Note:
         If `obj` is not array like an error is generated.

From 819eebbbe3050a53885730c53f8af0bba1d1206b Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 25 Jun 2024 14:02:43 +0200
Subject: [PATCH 426/458] Made a fix to the tests.

---
 tests/unit_tests/test_jax_api.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index 23f7503..f73c535 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -213,6 +213,7 @@ def testee(a: np.ndarray, b: np.float64) -> np.ndarray:
     )
 
 
+@pytest.mark.usefixtures("_enable_jit")
 def test_tracing_detection() -> None:
     """Tests our ability to detect if tracing is going on."""
     expected_tracing_state = False

From 110b6f4565796edccbcee888c9814881933a20a7 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 25 Jun 2024 14:03:27 +0200
Subject: [PATCH 427/458] WIP: Started with a primitive.

---
 .../test_primitive_cond.py                    | 31 +++++++++++++++++++
 1 file changed, 31 insertions(+)
 create mode 100644 tests/integration_tests/primitive_translators/test_primitive_cond.py

diff --git a/tests/integration_tests/primitive_translators/test_primitive_cond.py b/tests/integration_tests/primitive_translators/test_primitive_cond.py
new file mode 100644
index 0000000..895e042
--- /dev/null
+++ b/tests/integration_tests/primitive_translators/test_primitive_cond.py
@@ -0,0 +1,31 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+from __future__ import annotations
+
+import jax
+import numpy as np
+import pytest
+from jax import numpy as jnp
+
+import jace
+from jace.util import translation_cache as tcache
+
+from tests import util as testutil
+
+
+def test_cond_simple1() -> None:
+
+    def testee(val: np.float64, cond_arg: tuple[np.ndarray, np.ndarray]) -> np.ndarray:
+        return jax.lax.cond(
+                0.5 > val.
+                lambda arg: arg[0],
+                lambda arg: jnp.array([13]) + arg[1],
+                cond_arg,
+        )
+
+    vals: list[np.float64] = list(

From 380399a2c38b3f5fadec2045028f0edba7a216a8 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 25 Jun 2024 16:46:09 +0200
Subject: [PATCH 428/458] Updated the list of differences.

---
 docs/main_differences.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/docs/main_differences.md b/docs/main_differences.md
index 953bef0..5ac19aa 100644
--- a/docs/main_differences.md
+++ b/docs/main_differences.md
@@ -13,6 +13,7 @@ We will now list the main differences between them, furthermore, you should also
 - Currently JaCe is not able to run distributed (will be lifted later).
 - Currently not all primitives are supported.
 - JaCe does not return `jax.Array` instances, but NumPy/CuPy arrays.
+- The execution is not asynchronous.
 
 ### DaCe vs. JaCe:
 

From 320c528905492d467fa6361c0d2ba901cd9458d9 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 25 Jun 2024 16:53:16 +0200
Subject: [PATCH 429/458] Added tests for the condition.

---
 .../primitive_translators/__init__.py         |   2 +
 .../test_primitive_cond.py                    | 184 +++++++++++++++++-
 tests/integration_tests/test_empty_jaxpr.py   |   1 -
 tests/unit_tests/test_jax_api.py              |   2 -
 4 files changed, 179 insertions(+), 10 deletions(-)

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 429fb6f..e0ef301 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -14,6 +14,7 @@
 )
 from .broadcast_in_dim_translator import BroadcastInDimTranslator
 from .concatenate_translator import ConcatenateTranslator
+from .conditions import condition_translator
 from .convert_element_type_translator import ConvertElementTypeTranslator
 from .copy_translator import CopyTranslator, DevicePutTranslator
 from .iota_translator import IotaTranslator
@@ -38,4 +39,5 @@
     "SelectNTranslator",
     "SlicingTranslator",
     "SqueezeTranslator",
+    "condition_translator",
 ]
diff --git a/tests/integration_tests/primitive_translators/test_primitive_cond.py b/tests/integration_tests/primitive_translators/test_primitive_cond.py
index 895e042..5be5e19 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_cond.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_cond.py
@@ -7,6 +7,9 @@
 
 from __future__ import annotations
 
+from collections.abc import Callable
+from typing import Any
+
 import jax
 import numpy as np
 import pytest
@@ -18,14 +21,181 @@
 from tests import util as testutil
 
 
-def test_cond_simple1() -> None:
+def _perform_cond_test(
+    testee: Callable[[np.float64, tuple[Any, ...]], Any], branch_args: tuple[Any, ...]
+) -> None:
+    """
+    Performs a test for the condition primitives.
+
+    It assumes that the first argument is used for the condition and that the
+    conditions is applied at `0.5`.
+    The test function adds a prologue, that performs some operations on the
+    `branch_args` and performs some computations on the final value.
+    This is done to simulate the typical usage, as it was observed that
+    sometimes the optimization fails.
+    """
+    tcache.clear_translation_cache()
+
+    def prologue(branch_args: tuple[Any, ...]) -> tuple[Any, ...]:
+        return tuple(
+            jnp.exp(jnp.cos(jnp.sin(branch_arg))) ** i
+            for i, branch_arg in enumerate(branch_args, 2)
+        )
+
+    def epilogue(result: Any) -> Any:
+        return jnp.exp(jnp.sin(jnp.sin(result)))
+
+    def final_testee(
+        val: np.float64,
+        branch_args: tuple[Any, ...],
+    ) -> Any:
+        return epilogue(testee(jnp.sin(val) + 0.5, prologue(branch_args)))  # type: ignore[arg-type]
 
-    def testee(val: np.float64, cond_arg: tuple[np.ndarray, np.ndarray]) -> np.ndarray:
+    vals: list[np.float64] = [np.float64(-0.5), np.float64(0.6)]
+    wrapped = jace.jit(testee)
+
+    for val in vals:
+        res = wrapped(val, branch_args)
+        ref = testee(val, branch_args)
+
+        assert np.all(res == ref)
+        assert ref.shape == res.shape
+
+
+def test_cond_full_branches() -> None:
+    def testee(val: np.float64, branch_args: tuple[np.ndarray, np.ndarray]) -> np.ndarray:
         return jax.lax.cond(
-                0.5 > val.
-                lambda arg: arg[0],
-                lambda arg: jnp.array([13]) + arg[1],
-                cond_arg,
+            val < 0.5,
+            lambda arg: jnp.sin(arg[0]),
+            lambda arg: jnp.cos(arg[1]),
+            branch_args,
         )
 
-    vals: list[np.float64] = list(
+    branch_args = tuple(testutil.make_array(1) for _ in range(2))
+    _perform_cond_test(testee, branch_args)
+
+
+def test_cond_literal_bool() -> None:
+    for branch_sel in [True, False]:
+
+        def testee(val: np.float64, branch_args: tuple[np.ndarray, np.ndarray]) -> np.ndarray:
+            return jax.lax.cond(
+                branch_sel,  # noqa: B023 [function-uses-loop-variable]
+                lambda arg: jnp.sin(arg[0]) + val,
+                lambda arg: jnp.cos(arg[1]),
+                branch_args,
+            )
+
+        branch_args = tuple(testutil.make_array(1) for _ in range(2))
+        _perform_cond_test(testee, branch_args)
+
+
+def test_cond_one_empty_branch() -> None:
+    def testee(val, branch_args: tuple[np.ndarray, np.ndarray]) -> np.ndarray:
+        return jax.lax.cond(
+            val < 0.5,
+            lambda xtrue: xtrue[0],
+            lambda xfalse: jnp.array([1]) + xfalse[1],
+            branch_args,
+        )
+
+    branch_args = tuple(testutil.make_array(1) for _ in range(2))
+    _perform_cond_test(testee, branch_args)
+
+
+@pytest.mark.skip(reason="Literal return value is not implemented.")
+def test_cond_literal_branch() -> None:
+    def testee(val: np.float64, branch_args: tuple[np.ndarray, np.ndarray]) -> np.ndarray:
+        return jax.lax.cond(
+            val < 0.5,
+            lambda xtrue: 1.0,  # noqa: ARG005 [unused-lambda-argument]
+            lambda xfalse: xfalse[1],
+            branch_args,
+        )
+
+    branch_args = tuple(testutil.make_array(()) for _ in range(2))
+    _perform_cond_test(testee, branch_args)
+
+
+def test_cond_complex_branches() -> None:
+    def true_branch(arg: np.ndarray) -> np.ndarray:
+        return jnp.where(
+            jnp.asin(arg) <= 0.0,
+            jnp.exp(jnp.cos(jnp.sin(arg))),
+            arg * 4.0,
+        )
+
+    def false_branch(arg: np.ndarray) -> np.ndarray:
+        return true_branch(jnp.exp(jnp.cos(arg) ** 7))  # type: ignore[arg-type]
+
+    def testee(val: np.float64, branch_args: tuple[np.ndarray, np.ndarray]) -> np.ndarray:
+        cond_res = jax.lax.cond(
+            val < 0.5,
+            lambda arg: true_branch(arg[0]),
+            lambda arg: false_branch(arg[1]),
+            branch_args,
+        )
+        return true_branch(cond_res)
+
+    branch_args = tuple(testutil.make_array((100, 100)) for _ in range(2))
+    _perform_cond_test(testee, branch_args)
+
+
+def test_cond_switch() -> None:
+    def testee(
+        selector: int,
+        branch_args: tuple[Any, ...],
+    ) -> np.ndarray:
+        return jax.lax.switch(
+            selector,
+            (
+                lambda args: jnp.sin(args[0]),
+                lambda args: jnp.exp(args[1]),
+                lambda args: jnp.cos(args[2]),
+            ),
+            branch_args,
+        )
+
+    wrapped = jace.jit(testee)
+    branch_args = tuple(testutil.make_array((100, 100)) for _ in range(3))
+
+    # These are the values that we will use for the selector.
+    #  Note that we also use some invalid values.
+    selectors = [-1, 0, 1, 2, 3, 4]
+
+    for selector in selectors:
+        ref = testee(selector, branch_args)
+        res = wrapped(selector, branch_args)
+
+        assert ref.shape == res.shape
+        assert np.allclose(ref, res)
+
+
+@pytest.mark.skip("DaCe is not able to optimize it away.")
+def test_cond_switch_literal_selector() -> None:
+    def testee(
+        branch_args: tuple[Any, ...],
+    ) -> np.ndarray:
+        return jax.lax.switch(
+            2,
+            (
+                lambda args: jnp.sin(args[0]),
+                lambda args: jnp.exp(args[1]),
+                lambda args: jnp.cos(args[2]),
+            ),
+            branch_args,
+        )
+
+    branch_args = tuple(testutil.make_array((100, 100)) for _ in range(3))
+
+    wrapped = jace.jit(testee)
+    lowered = wrapped.lower(branch_args)
+    compiled = lowered.compile(jace.optimization.DEFAULT_OPTIMIZATIONS)
+
+    ref = testee(branch_args)
+    res = wrapped(branch_args)
+
+    assert ref.shape == res.shape
+    assert np.allclose(ref, res)
+    lowered.as_sdfg().view()
+    assert compiled._compiled_sdfg.sdfg.number_of_nodes() == 1
diff --git a/tests/integration_tests/test_empty_jaxpr.py b/tests/integration_tests/test_empty_jaxpr.py
index 29ba9a4..598efc9 100644
--- a/tests/integration_tests/test_empty_jaxpr.py
+++ b/tests/integration_tests/test_empty_jaxpr.py
@@ -76,7 +76,6 @@ def wrapped(a: np.float64) -> np.float64:
     assert np.all(wrapped(a) == a)
 
 
-@pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_empty_nested() -> None:
     @jace.jit
     def wrapped(a: np.float64) -> np.float64:
diff --git a/tests/unit_tests/test_jax_api.py b/tests/unit_tests/test_jax_api.py
index f73c535..b4327b7 100644
--- a/tests/unit_tests/test_jax_api.py
+++ b/tests/unit_tests/test_jax_api.py
@@ -76,7 +76,6 @@ def ddf(x):
         assert np.allclose(ref, res), f"f: Expected '{ref}', got '{res}'."
 
 
-@pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_composition_with_jax() -> None:
     """Tests if JaCe can interact with JAX and vice versa."""
 
@@ -95,7 +94,6 @@ def jax_fun(a, b, c):
     assert np.allclose(jace_fun(a, b, c), jax_fun(a, b, c))
 
 
-@pytest.mark.skip(reason="Nested Jaxpr are not handled.")
 def test_composition_with_jax_2() -> None:
     """Second test if JaCe can interact with JAX and vice versa."""
 

From e2ebc4e81c58d167c4db5d8aa8491c8a2c45f0eb Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 26 Jun 2024 11:00:20 +0200
Subject: [PATCH 430/458] Implemented propagation of Memlets in the generated
 graphs.

---
 .../translator/jaxpr_translator_builder.py    | 52 ++++++++++++++++++-
 src/jace/translator/primitive_translator.py   |  3 ++
 2 files changed, 53 insertions(+), 2 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index ea4606d..908580a 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -14,6 +14,7 @@
 
 import dace
 from dace import data as dace_data, properties as dace_properties
+from dace.sdfg import propagation as dace_propagation
 from jax import core as jax_core
 
 from jace import util
@@ -553,6 +554,7 @@ def _translate_single_eqn(self, eqn: jax_core.JaxprEqn) -> None:
         translator = self._primitive_translators[primitive_name]
 
         # Create the state into which the equation should be translated
+        prev_terminal_state = self._ctx.terminal_state
         eqn_state = self.append_new_state(
             label=f"{primitive_name}_{'_'.join(out_var_names)}",
             prev_state=None,  # forces the creation of a new terminal state
@@ -572,8 +574,13 @@ def _translate_single_eqn(self, eqn: jax_core.JaxprEqn) -> None:
             if eqn_state is not self._ctx.terminal_state:
                 raise RuntimeError("Inconsistent terminal state was detected.")
             new_sdfg_term_state = eqn_state
-        if not self._ctx.validate():
-            raise RuntimeError("Detected an invalid SDFG under construction.")
+
+        # Propagate the Memlets through the newly created state machine
+        self._propagate_memlets_in_new_states(
+            prev_terminal_state,
+            new_sdfg_term_state,
+        )
+        self._ctx.validate()
 
         # Modify terminal root state of 'self'
         self._ctx.terminal_state = new_sdfg_term_state
@@ -682,6 +689,47 @@ def _handle_null_jaxpr(self, jaxpr: jax_core.ClosedJaxpr) -> list[str]:
 
         return out_var_names
 
+    def _propagate_memlets_in_new_states(
+        self,
+        prev_terminal_state: dace.SDFGState,
+        new_terminal_state: dace.SDFGState,
+    ) -> None:
+        """
+        Propagate the Memlets inside the newly added parts of the state machine.
+
+        This function performs BFS starting at `prev_terminal_state` that is bound
+        by `new_terminal_state`.
+
+        Args:
+            prev_terminal_state: Terminal state before the expansion of the
+                state machine.
+            new_terminal_state: Terminal state after the expansion.
+        """
+        seen: set[dace.SDFGState] = {prev_terminal_state}
+        nodes_to_process: list[dace.SDFGState] = [
+            edge.dst for edge in self.sdfg.out_edges(prev_terminal_state)
+        ]
+
+        while nodes_to_process:
+            currently_processing = nodes_to_process.pop(-1)
+            if (
+                self.sdfg.out_degree(currently_processing) == 0
+                and currently_processing != new_terminal_state
+            ):
+                raise dace.sdfg.InvalidSDFGError(
+                    f"Found leaf node '{currently_processing}' that is not the terminal node.",
+                    self.sdfg,
+                    self.sdfg.node_id(currently_processing),
+                )
+
+            seen.add(currently_processing)
+            dace_propagation.propagate_memlets_state(self.sdfg, currently_processing)
+            nodes_to_process.extend(
+                edge.dst
+                for edge in self.sdfg.out_edges(currently_processing)
+                if edge.dst not in seen
+            )
+
     @property
     def _start_state(self) -> dace.SDFGState:
         return cast(dace.SDFGState, self._ctx.start_state)
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index ab84c5d..2000731 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -64,6 +64,9 @@ def __call__(
         primitive translator was able to fully construct the dataflow graph
         within `eqn_state`.
 
+        After the primitive translator returns, the builder will propagate the
+        Memlets in all states that were newly created.
+
         A primitive translator has to use the passed input variables,
         `in_var_names` and must write its output into the variables indicated
         by `out_var_names`. But it is allowed that a primitive translator

From 071923c28bad3338a40d3538483da36c3544c5d2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 27 Jun 2024 11:21:22 +0200
Subject: [PATCH 431/458] Added a test for scalar branches.

---
 .../primitive_translators/test_primitive_cond.py  | 15 ++++++++++++++-
 1 file changed, 14 insertions(+), 1 deletion(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_cond.py b/tests/integration_tests/primitive_translators/test_primitive_cond.py
index 5be5e19..da8e61d 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_cond.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_cond.py
@@ -59,7 +59,7 @@ def final_testee(
         ref = testee(val, branch_args)
 
         assert np.all(res == ref)
-        assert ref.shape == res.shape
+        assert (1,) if ref.shape == () else ref.shape == res.shape
 
 
 def test_cond_full_branches() -> None:
@@ -75,6 +75,19 @@ def testee(val: np.float64, branch_args: tuple[np.ndarray, np.ndarray]) -> np.nd
     _perform_cond_test(testee, branch_args)
 
 
+def test_cond_scalar_brnaches() -> None:
+    def testee(val: np.float64, branch_args: tuple[np.float64, np.float64]) -> np.float64:
+        return jax.lax.cond(
+            val < 0.5,
+            lambda arg: arg[0] + 2.0,
+            lambda arg: arg[1] + 3.0,
+            branch_args,
+        )
+
+    branch_args = tuple(testutil.make_array(()) for _ in range(2))
+    _perform_cond_test(testee, branch_args)
+
+
 def test_cond_literal_bool() -> None:
     for branch_sel in [True, False]:
 

From 086928720e0df793b797f4db0a3970d2d1ba0455 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 1 Jul 2024 10:55:05 +0200
Subject: [PATCH 432/458] Added Enriques suggestions.

---
 CODING_GUIDELINES.md                          |  4 +-
 src/jace/api.py                               |  1 -
 src/jace/stages.py                            | 88 +++++++++----------
 src/jace/tracing.py                           |  1 +
 src/jace/translated_jaxpr_sdfg.py             | 74 +++++++++-------
 .../translator/jaxpr_translator_builder.py    | 29 +++---
 src/jace/translator/post_translation.py       | 45 ++++------
 src/jace/util/translation_cache.py            | 18 ++--
 8 files changed, 126 insertions(+), 134 deletions(-)

diff --git a/CODING_GUIDELINES.md b/CODING_GUIDELINES.md
index 72cff79..2fd6961 100644
--- a/CODING_GUIDELINES.md
+++ b/CODING_GUIDELINES.md
@@ -36,7 +36,7 @@ Inside JaCe the following convention is applied:
 
 - If the module has a standard abbreviation use that, e.g. `import numpy as np`.
 - For a JaCe module use:
-  - If the module name is only a single word use it directly, e.g. `from jace import translator`
+  - If the module name is only a single word use it directly, e.g. `from jace import translator`.
   - If the module name consists of multiple words use the last word prefixed with the first letters of the others, e.g. `from jace.translator import post_translator as ptranslator` or `from jace import translated_jaxpr_sdfg as tjsdfg`.
   - In case of a clash use your best judgment.
 - For an external module use the rule above, but prefix the name with the main package's name, e.g. `from dace.codegen import compiled_sdfg as dace_csdfg`.
@@ -116,7 +116,7 @@ We generate the API documentation automatically from the docstrings using [Sphin
 Sphinx supports the [reStructuredText][sphinx-rest] (reST) markup language for defining additional formatting options in the generated documentation, however section [_3.8 Comments and Docstrings_](https://google.github.io/styleguide/pyguide.html#38-comments-and-docstrings) of the Google Python Style Guide does not specify how to use markups in docstrings. As a result, we decided to forbid reST markup in docstrings, except for the following cases:
 
 - Cross-referencing other objects using Sphinx text roles for the [Python domain](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#the-python-domain) (as explained [here](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#python-roles)).
-- Very basic formatting markup to improve _readability_ of the generated documentation without obscuring the source docstring (e.g. `"literal"` strings, bulleted lists).
+- Very basic formatting markup to improve _readability_ of the generated documentation without obscuring the source docstring (e.g. `` `literal` `` strings, bulleted lists).
 
 We highly encourage the [doctest] format for code examples in docstrings. In fact, doctest runs code examples and makes sure they are in sync with the codebase.
 
diff --git a/src/jace/api.py b/src/jace/api.py
index 6def2f4..35d722a 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -21,7 +21,6 @@
 
 __all__ = ["JITOptions", "grad", "jacfwd", "jacrev", "jit"]
 
-# Used for type annotation, see the notes in `jace.stages` for more.
 _P = ParamSpec("_P")
 _R = TypeVar("_R")
 
diff --git a/src/jace/stages.py b/src/jace/stages.py
index e642212..ea3312f 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -27,15 +27,15 @@
 
 from __future__ import annotations
 
+import contextlib
 import copy
-import inspect
-from collections.abc import Callable, Mapping, Sequence
+from collections.abc import Callable, Generator, Mapping, Sequence
 from typing import TYPE_CHECKING, Any, Generic, ParamSpec, TypeVar, Union
 
 from jax import tree_util as jax_tree
 
 from jace import api, optimization, tracing, translated_jaxpr_sdfg as tjsdfg, translator, util
-from jace.optimization import CompilerOptions
+from jace.optimization import CompilerOptions  # Reexport for compatibility with JAX.
 from jace.translator import post_translation as ptranslation
 from jace.util import translation_cache as tcache
 
@@ -45,14 +45,14 @@
     from jax import core as jax_core
 
 __all__ = [
-    "CompilerOptions",  # export for compatibility with JAX.
+    "CompilerOptions",
     "JaCeCompiled",
     "JaCeLowered",
     "JaCeWrapped",
     "Stage",
     "get_active_compiler_options",
-    "make_final_compilation_options",
-    "update_active_compiler_options",
+    "get_active_compiler_options",
+    "temporary_compiler_options",
 ]
 
 #: Known compilation stages in JaCe.
@@ -111,10 +111,6 @@ def __init__(
         primitive_translators: Mapping[str, translator.PrimitiveTranslator],
         jit_options: api.JITOptions,
     ) -> None:
-        # TODO(phimuell): Test if this restriction is needed.
-        assert all(
-            param.default is param.empty for param in inspect.signature(fun).parameters.values()
-        )
         super().__init__()
         self._primitive_translators = {**primitive_translators}
         self._jit_options = {**jit_options}
@@ -250,7 +246,8 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
 
         To perform the optimizations `jace_optimize()` is used. The actual options that
         are forwarded to it are obtained by passing `compiler_options` to
-        `make_final_compilation_options()`.
+        `get_active_compiler_options()`, these options are also included in the
+        key used to cache the result.
 
         Args:
             compiler_options: The optimization options to use.
@@ -258,7 +255,7 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
         # We **must** deepcopy before we do any optimization, because all optimizations
         #  are in place, to properly cache stages, stages needs to be immutable.
         tsdfg: tjsdfg.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
-        optimization.jace_optimize(tsdfg=tsdfg, **make_final_compilation_options(compiler_options))
+        optimization.jace_optimize(tsdfg=tsdfg, **get_active_compiler_options(compiler_options))
 
         return JaCeCompiled(
             compiled_sdfg=tjsdfg.compile_jaxpr_sdfg(tsdfg),
@@ -296,7 +293,7 @@ def _make_call_description(
         unflatted_args, unflatted_kwargs = jax_tree.tree_unflatten(in_tree, flat_call_args)
         assert (not unflatted_kwargs) and (len(unflatted_args) <= 1)
 
-        options = make_final_compilation_options(unflatted_args[0] if unflatted_args else {})
+        options = get_active_compiler_options(unflatted_args[0] if unflatted_args else None)
         flat_options, option_tree = jax_tree.tree_flatten(options)
         return tcache.StageTransformationSpec(
             stage_id=id(self), flat_call_args=tuple(flat_options), in_tree=option_tree
@@ -317,7 +314,7 @@ class JaCeCompiled(Generic[_R]):
     Args:
         compiled_sdfg: The compiled SDFG object.
         input_names: SDFG variables used as inputs.
-        out_names: SDFG variables used as outputs.
+        output_names: SDFG variables used as outputs.
         out_tree: Pytree describing how to unflatten the output.
 
     Note:
@@ -358,55 +355,54 @@ def __call__(self, *args: Any, **kwargs: Any) -> _R:
 _JACELOWERED_ACTIVE_COMPILE_OPTIONS: CompilerOptions = optimization.DEFAULT_OPTIMIZATIONS.copy()
 """Global set of currently active compilation/optimization options.
 
-The global set is initialized with `jace.optimization.DEFAULT_OPTIMIZATIONS`. It can be
-managed through `update_active_compiler_options()` and accessed through
-`get_active_compiler_options()`, however, it is advised that a user should use
-`make_final_compilation_options()` for getting the final options that should be used
-for optimization.
+The global set is initialized to `jace.optimization.DEFAULT_OPTIMIZATIONS`.
+For modifying the set of active options the the `temporary_compiler_options()`
+context manager is provided.
+To obtain the currently active compiler options use `get_active_compiler_options()`.
 """
 
 
-def update_active_compiler_options(new_active_options: CompilerOptions) -> CompilerOptions:
+@contextlib.contextmanager
+def temporary_compiler_options(new_active_options: CompilerOptions) -> Generator[None, None, None]:
     """
-    Updates the set of active compiler options.
+    Temporary modifies the set of active compiler options.
 
-    Merges the options passed as `new_active_options` with the currently active
-    compiler options. This set is used by `JaCeLowered.compile()` to determine
-    which options should be used.
-    The function will return the set of options that was active before the call.
+    During the activation of this context the active set of active compiler option
+    consists of the set of option that were previously active merged with the ones
+    passed through `new_active_options`.
 
-    To obtain the set of currently active options use `get_active_compiler_options()`.
+    Args:
+        new_active_options: Options that should be temporary merged with the currently
+            active options.
 
-    Todo:
-        Make a proper context manager.
+    See Also:
+        `get_active_compiler_options()` to get the set of active options that is
+        currently active.
     """
+    global _JACELOWERED_ACTIVE_COMPILE_OPTIONS  # noqa: PLW0603 [global-statement]
     previous_active_options = _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
-    _JACELOWERED_ACTIVE_COMPILE_OPTIONS.update(new_active_options)
-    return previous_active_options
-
+    try:
+        _JACELOWERED_ACTIVE_COMPILE_OPTIONS.update(new_active_options)
+        yield None
+    finally:
+        _JACELOWERED_ACTIVE_COMPILE_OPTIONS = previous_active_options
 
-def get_active_compiler_options() -> CompilerOptions:
-    """Returns the set of currently active compiler options."""
-    return _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
 
-
-def make_final_compilation_options(compiler_options: CompilerOptions | None) -> CompilerOptions:
+def get_active_compiler_options(compiler_options: CompilerOptions | None) -> CompilerOptions:
     """
-    Returns the final compilation options.
+    Get the final compiler options.
 
     There are two different sources of optimization options. The first one is the global
-    set of currently active compiler options. The second one is the options that are
-    passed to this function, which takes precedence. Thus, the `compiler_options`
-    argument describes the difference from the currently active global options.
-
-    This function is used by `JaCeLowered` if it has to determine which options to use
-    for optimization, either for compiling the lowered SDFG or for computing the key.
+    set of currently active compiler options, which is returned if `None` is passed.
+    The second one is the options that are passed to this function, which takes
+    precedence. This mode is also used by `JaCeLowered.compile()` to determine the
+    final compiler options.
 
     Args:
         compiler_options: The local compilation options.
 
     See Also:
-        `get_active_compiler_options()` to inspect the set of currently active options
-        and `update_active_compiler_options()` to modify them.
+        `temporary_compiler_options()` to modify the currently active set of compiler
+        options.
     """
-    return get_active_compiler_options() | (compiler_options or {})
+    return _JACELOWERED_ACTIVE_COMPILE_OPTIONS | (compiler_options or {})
diff --git a/src/jace/tracing.py b/src/jace/tracing.py
index 2e51251..4df5d00 100644
--- a/src/jace/tracing.py
+++ b/src/jace/tracing.py
@@ -82,6 +82,7 @@ def make_jaxpr(
         raise NotImplementedError(
             f"Not supported tracing options: {', '.join(f'{k}' for k in trace_options)}"
         )
+    # TODO(phimuell): Test if this restriction is needed.
     assert all(param.default is param.empty for param in inspect.signature(fun).parameters.values())
 
     def tracer_impl(
diff --git a/src/jace/translated_jaxpr_sdfg.py b/src/jace/translated_jaxpr_sdfg.py
index 78c7c8b..9cb9908 100644
--- a/src/jace/translated_jaxpr_sdfg.py
+++ b/src/jace/translated_jaxpr_sdfg.py
@@ -36,12 +36,14 @@ class TranslatedJaxprSDFG:
     - It does not have `__return*` variables, instead all return arguments are
         passed by arguments.
     - All input arguments are passed through arguments mentioned in `input_names`,
-        while the outputs are passed through `out_names`.
+        while the outputs are passed through `output_names`.
     - Only variables listed as in/outputs are non transient.
-    - The order of `input_names` and `out_names` is the same as in the original Jaxpr.
-    - If an input is used as outputs it appears in both `input_names` and `out_names`.
-    - Its `arg_names` is set to `input_names + out_names`, but arguments that are
+    - The order of `input_names` and `output_names` is the same as in the Jaxpr.
+    - Its `arg_names` is set to `input_names + output_names`, but arguments that are
         input and outputs are only listed as inputs.
+    - For every transient there is exactly one access node that writes to it,
+        except the name of the array starts with `__jace_mutable_`, which can
+        be written to multiple times.
 
     The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a
     `TranslationContext`, that was in turn constructed by
@@ -52,7 +54,7 @@ class TranslatedJaxprSDFG:
     Attributes:
         sdfg: The encapsulated SDFG object.
         input_names: SDFG variables used as inputs.
-        out_names: SDFG variables used as outputs.
+        output_names: SDFG variables used as outputs.
 
     Todo:
         After the SDFG is compiled a lot of code looks strange, because there is
@@ -62,7 +64,7 @@ class TranslatedJaxprSDFG:
 
     sdfg: dace.SDFG
     input_names: tuple[str, ...]
-    out_names: tuple[str, ...]
+    output_names: tuple[str, ...]
 
     def validate(self) -> bool:
         """Validate the underlying SDFG."""
@@ -72,9 +74,9 @@ def validate(self) -> bool:
                 self.sdfg,
                 self.sdfg.node_id(self.sdfg.start_state),
             )
-        if any(self.sdfg.arrays[out].transient for out in self.out_names):
+        if any(self.sdfg.arrays[out].transient for out in self.output_names):
             raise dace.sdfg.InvalidSDFGError(
-                f"Found transient outputs: {(out for out in self.out_names if self.sdfg.arrays[out].transient)}",
+                f"Found transient outputs: {(out for out in self.output_names if self.sdfg.arrays[out].transient)}",
                 self.sdfg,
                 self.sdfg.node_id(self.sdfg.start_state),
             )
@@ -84,6 +86,14 @@ def validate(self) -> bool:
                 self.sdfg,
                 self.sdfg.node_id(self.sdfg.start_state),
             )
+        if (self.output_names is not None and self.input_names is not None) and (
+            set(self.output_names).intersection(self.input_names)
+        ):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Inputs can not be outputs: {set(self.output_names).intersection(self.input_names)}.",
+                self.sdfg,
+                None,
+            )
         self.sdfg.validate()
         return True
 
@@ -99,15 +109,15 @@ class CompiledJaxprSDFG:
     `compile_jaxpr_sdfg()`.
 
     Args:
-        dace_csdfg: The `CompiledSDFG` object.
+        compiled_sdfg: The `CompiledSDFG` object.
         input_names: Names of the SDFG variables used as inputs.
-        out_names: Names of the SDFG variables used as outputs.
+        output_names: Names of the SDFG variables used as outputs.
 
     Attributes:
-        dace_csdfg: The `CompiledSDFG` object.
-        sdfg: The encapsulated SDFG object.
+        compiled_sdfg: The `CompiledSDFG` object.
+        sdfg: SDFG object used to generate/compile `self.compiled_sdfg`.
         input_names: Names of the SDFG variables used as inputs.
-        out_names: Names of the SDFG variables used as outputs.
+        output_names: Names of the SDFG variables used as outputs.
 
     Note:
         Currently the strides of the input arguments must match the ones that were used
@@ -118,13 +128,13 @@ class CompiledJaxprSDFG:
         arrays of length one.
     """
 
-    csdfg: dace_csdfg.CompiledSDFG
+    compiled_sdfg: dace_csdfg.CompiledSDFG
     input_names: tuple[str, ...]
-    out_names: tuple[str, ...]
+    output_names: tuple[str, ...]
 
     @property
     def sdfg(self) -> dace.SDFG:  # noqa: D102 [undocumented-public-method]
-        return self.csdfg.sdfg
+        return self.compiled_sdfg.sdfg
 
     def __call__(
         self,
@@ -137,7 +147,6 @@ def __call__(
         the output.
 
         Args:
-            dace_csdfg: The compiled SDFG to call.
             flat_call_args: Flattened input arguments.
         """
         if len(self.input_names) != len(flat_call_args):
@@ -155,26 +164,21 @@ def __call__(
             sdfg_call_args[in_name] = in_val
 
         arrays = self.sdfg.arrays
-        for out_name in self.out_names:
-            sdfg_array = arrays[out_name]
-            if out_name in sdfg_call_args:
-                if util.is_jax_array(sdfg_call_args[out_name]):
-                    raise ValueError("Passed an immutable JAX array as output.")
-            else:
-                sdfg_call_args[out_name] = dace_data.make_array_from_descriptor(sdfg_array)
-
-        assert len(sdfg_call_args) == len(self.csdfg.argnames), (
+        for output_name in self.output_names:
+            sdfg_call_args[output_name] = dace_data.make_array_from_descriptor(arrays[output_name])
+
+        assert len(sdfg_call_args) == len(self.compiled_sdfg.argnames), (
             "Failed to construct the call arguments,"
-            f" expected {len(self.csdfg.argnames)} but got {len(flat_call_args)}."
-            f"\nExpected: {self.csdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
+            f" expected {len(self.compiled_sdfg.argnames)} but got {len(flat_call_args)}."
+            f"\nExpected: {self.compiled_sdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
         )
 
         # Calling the SDFG
         with dace.config.temporary_config():
             dace.Config.set("compiler", "allow_view_arguments", value=True)
-            self.csdfg(**sdfg_call_args)
+            self.compiled_sdfg(**sdfg_call_args)
 
-        return [sdfg_call_args[out_name] for out_name in self.out_names]
+        return [sdfg_call_args[output_name] for output_name in self.output_names]
 
 
 def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> dace_csdfg.CompiledJaxprSDFG:
@@ -185,7 +189,7 @@ def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> dace_csdfg.CompiledJaxprSD
         raise ValueError("Only support SDFGs without '__return' members.")
     if tsdfg.sdfg.free_symbols:  # This is a simplification that makes our life simple.
         raise NotImplementedError(f"No free symbols allowed, found: {tsdfg.sdfg.free_symbols}")
-    if not (tsdfg.out_names or tsdfg.input_names):
+    if not (tsdfg.output_names or tsdfg.input_names):
         raise ValueError("No input nor output.")
 
     # To ensure that the SDFG is compiled and to get rid of a warning we must modify
@@ -200,7 +204,7 @@ def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> dace_csdfg.CompiledJaxprSD
         #  error/warning. This happens if we compile the same lowered SDFG multiple
         #  times with different options.
         sdfg.name = f"{sdfg.name}__{str(uuid.uuid1()).replace('-', '_')}"
-        assert len(sdfg.name) < 255  # noqa: PLR2004 magic-value-comparison  # 255 maximal file name size on UNIX.
+        assert len(sdfg.name) < 255  # noqa: PLR2004 [magic-value-comparison]  # 255 maximal file name size on UNIX.
 
         with dace.config.temporary_config():
             dace.Config.set("compiler", "use_cache", value=False)
@@ -209,11 +213,13 @@ def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> dace_csdfg.CompiledJaxprSD
             dace.Config.set("default_build_folder", value=pathlib.Path(".jacecache").resolve())
             sdfg._recompile = True
             sdfg._regenerate_code = True
-            csdfg: dace_csdfg.CompiledSDFG = sdfg.compile()
+            compiled_sdfg: dace_csdfg.CompiledSDFG = sdfg.compile()
 
     finally:
         sdfg.name = original_sdfg_name
         sdfg._recompile = original_recompile
         sdfg._regenerate_code = original_regenerate_code
 
-    return CompiledJaxprSDFG(csdfg=csdfg, input_names=tsdfg.input_names, out_names=tsdfg.out_names)
+    return CompiledJaxprSDFG(
+        compiled_sdfg=compiled_sdfg, input_names=tsdfg.input_names, output_names=tsdfg.output_names
+    )
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 908580a..7ccd47c 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -618,7 +618,7 @@ def _translate_jaxpr_internal(self, jaxpr: jax_core.ClosedJaxpr) -> TranslationC
                 jaxpr.jaxpr.outvars, prevent_creation=True, handle_literals=False
             )
 
-        self._ctx.out_names = tuple(out_var_names)
+        self._ctx.output_names = tuple(out_var_names)
 
         return cast(TranslationContext, self._clear_translation_ctx())
 
@@ -641,11 +641,12 @@ def _handle_null_jaxpr(self, jaxpr: jax_core.ClosedJaxpr) -> list[str]:
             - Handle the case if if the output is a literal.
 
         Note:
-            The function will _not_ update the `out_names` field of the current context.
+            The function will _not_ update the `output_names` field of the current
+            context.
         """
         assert self._ctx.terminal_state is self._ctx.start_state
         assert isinstance(self._ctx.input_names, tuple)
-        assert self._ctx.out_names is None
+        assert self._ctx.output_names is None
 
         # There is not output so we do not have to copy anything around.
         if not jaxpr.out_avals:
@@ -755,7 +756,7 @@ class TranslationContext:
     Attributes:
         sdfg: The encapsulated SDFG object.
         input_names: A list of the SDFG variables that are used as input
-        out_names: A list of the SDFG variables that are used as output.
+        output_names: A list of the SDFG variables that are used as output.
         start_state: The first state in the SDFG state machine.
         terminal_state: The (currently) last state in the state machine.
         jaxpr: The Jaxpr that was used to translate.
@@ -766,11 +767,13 @@ class TranslationContext:
     Note:
         Access of any attribute of this class by an outside user is considered
         undefined behaviour.
+        Furthermore, the encapsulated SDFG should be seen as a verbatim translation
+        of the initial Jaxpr.
     """
 
     sdfg: dace.SDFG
     input_names: tuple[str, ...] | None
-    out_names: tuple[str, ...] | None
+    output_names: tuple[str, ...] | None
     start_state: dace.SDFGState
     terminal_state: dace.SDFGState
     jaxpr: jax_core.ClosedJaxpr
@@ -781,7 +784,7 @@ def __init__(self, name: str | None, jaxpr: jax_core.ClosedJaxpr) -> None:
 
         self.sdfg = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
         self.input_names = None
-        self.out_names = None
+        self.output_names = None
         self.start_state = self.sdfg.add_state(label="initial_state", is_start_block=True)
         self.terminal_state = self.start_state
         self.jaxpr = jaxpr
@@ -798,14 +801,14 @@ def validate(self) -> bool:
                 f"Expected to find '{self.start_state}' as start state,"
                 f" but instead found '{self.sdfg.start_block}'.",
                 self.sdfg,
-                self.sdfg.node_id(self.start_state),
+                None,
             )
         if {self.terminal_state} != set(self.sdfg.sink_nodes()):
             raise dace.sdfg.InvalidSDFGError(
                 f"Expected to find as terminal state '{self.terminal_state}',"
                 f" but instead found '{self.sdfg.sink_nodes()}'.",
                 self.sdfg,
-                self.sdfg.node_id(self.terminal_state),
+                None,
             )
         if not (
             self.input_names is None
@@ -814,15 +817,15 @@ def validate(self) -> bool:
             raise dace.sdfg.InvalidSDFGError(
                 f"Missing input arguments: {(input_name for input_name in self.input_names if input_name not in self.sdfg.arrays)}",
                 self.sdfg,
-                self.sdfg.node_id(self.terminal_state),
+                None,
             )
         if not (
-            self.out_names is None
-            or all(out_name in self.sdfg.arrays for out_name in self.out_names)
+            self.output_names is None
+            or all(output_name in self.sdfg.arrays for output_name in self.output_names)
         ):
             raise dace.sdfg.InvalidSDFGError(
-                f"Missing output arguments: {(out_name for out_name in self.out_names if out_name not in self.sdfg.arrays)}",
+                f"Missing output arguments: {(output_name for output_name in self.output_names if output_name not in self.sdfg.arrays)}",
                 self.sdfg,
-                self.sdfg.node_id(self.terminal_state),
+                None,
             )
         return True
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index dcc851a..9831f35 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -45,6 +45,7 @@ def postprocess_jaxpr_sdfg(
     Todo:
         - Fixing the scalar input problem on GPU.
         - Fixing stride problem of the input.
+        - Make it such that the context is not modified as a side effect.
     """
     trans_ctx.validate()  # Always validate, it is cheap.
     create_input_output_stages(trans_ctx=trans_ctx, flat_call_args=flat_call_args)
@@ -75,29 +76,21 @@ def _create_output_state(trans_ctx: translator.TranslationContext) -> None:
     Creates the output processing stage for the SDFG in place.
 
     The function will create a new terminal state, in which all outputs, denoted
-    in `trans_ctx.out_names`, will be written into new SDFG variables. In case the
+    in `trans_ctx.output_names`, will be written into new SDFG variables. In case the
     output variable is a scalar, the output will be replaced by an array of length one.
     This behaviour is consistent with JAX.
 
     Args:
         trans_ctx: The translation context to process.
     """
-    assert trans_ctx.input_names is not None and trans_ctx.out_names is not None
-
-    # NOTE: Currently we do not support to write back into an input argument, as JAX.
-    #  However, this is a requirement for handling ICON stencils, that we will support
-    #  eventually. If we get a translation context that lists a variable name in the
-    #  inputs and outputs, this means that it was returned unmodified. In JAX this
-    #  will lead to a copy and we also do it. This is implemented by just naïvely
-    #  creating a separate output variable for every output we have, irrespectively
-    #  of its name inside the Jaxpr.
+    assert trans_ctx.input_names is not None and trans_ctx.output_names is not None
 
     output_pattern = "__jace_output_{}"
     sdfg = trans_ctx.sdfg
     new_output_state: dace.SDFGState = sdfg.add_state("output_processing_stage")
     new_output_names: list[str] = []
 
-    for i, org_output_name in enumerate(trans_ctx.out_names):
+    for i, org_output_name in enumerate(trans_ctx.output_names):
         new_output_name = output_pattern.format(i)
         org_output_desc: dace.data.Data = sdfg.arrays[org_output_name]
         assert org_output_desc.transient
@@ -128,7 +121,7 @@ def _create_output_state(trans_ctx: translator.TranslationContext) -> None:
 
     sdfg.add_edge(trans_ctx.terminal_state, new_output_state, dace.InterstateEdge())
     trans_ctx.terminal_state = new_output_state
-    trans_ctx.out_names = tuple(new_output_names)
+    trans_ctx.output_names = tuple(new_output_names)
 
 
 def _create_input_state(
@@ -150,11 +143,7 @@ def _create_input_state(
     Todo:
         Handle transfer of scalar input in GPU mode.
     """
-    assert trans_ctx.input_names is not None and trans_ctx.out_names is not None
-
-    # NOTE: This function will create a distinct variable for every input. Once we
-    #  allow write back arguments they will be handled in the `_create_output_state()`
-    #  function anyway, also see the comment in that function.
+    assert trans_ctx.input_names is not None and trans_ctx.output_names is not None
 
     if len(flat_call_args) != len(trans_ctx.input_names):
         raise ValueError(f"Expected {len(trans_ctx.input_names)}, but got {len(flat_call_args)}.")
@@ -207,7 +196,7 @@ def finalize_translation_context(
     validate: bool = True,
 ) -> tjsdfg.TranslatedJaxprSDFG:
     """
-    Finalizes the supplied translation context `trans_ctx`.
+    Finalizes the translation context and returns a `TranslatedJaxprSDFG` object.
 
     The function will process the SDFG that is encapsulated inside the context, i.e. a
     canonical one, into a proper SDFG, as it is described in `TranslatedJaxprSDFG`. It
@@ -225,23 +214,21 @@ def finalize_translation_context(
     trans_ctx.validate()
     if trans_ctx.input_names is None:
         raise ValueError("Input names are not specified.")
-    if trans_ctx.out_names is None:
+    if trans_ctx.output_names is None:
         raise ValueError("Output names are not specified.")
-    if not (trans_ctx.out_names or trans_ctx.input_names):
+    if not (trans_ctx.output_names or trans_ctx.input_names):
         raise ValueError("No input nor output.")
 
     # We guarantee decoupling
     tsdfg = tjsdfg.TranslatedJaxprSDFG(
         sdfg=copy.deepcopy(trans_ctx.sdfg),
         input_names=trans_ctx.input_names,
-        out_names=trans_ctx.out_names,
+        output_names=trans_ctx.output_names,
     )
 
     # Make inputs and outputs to globals.
     sdfg_arg_names: list[str] = []
-    for arg_name in tsdfg.input_names + tsdfg.out_names:
-        if arg_name in sdfg_arg_names:
-            continue
+    for arg_name in tsdfg.input_names + tsdfg.output_names:
         tsdfg.sdfg.arrays[arg_name].transient = False
         sdfg_arg_names.append(arg_name)
     tsdfg.sdfg.arg_names = sdfg_arg_names
@@ -274,7 +261,7 @@ def add_nested_sdfg(
         in_var_names: Names of the variables in `parent_ctx` that are used as inputs for
             the nested SDFG, must have the same order as `child_ctx.input_names`.
         out_var_names: Names of the variables in `parent_ctx` that are used as outputs
-            for the nested SDFG, must have the same order as `child_ctx.out_names`.
+            for the nested SDFG, must have the same order as `child_ctx.output_names`.
 
     Returns:
         The nested SDFG object.
@@ -288,9 +275,9 @@ def add_nested_sdfg(
     """
     if child_ctx.sdfg.free_symbols:
         raise NotImplementedError("Symbol Mapping is not implemented.")
-    assert not (child_ctx.input_names is None or child_ctx.out_names is None)  # Silence mypy
+    assert not (child_ctx.input_names is None or child_ctx.output_names is None)  # Silence mypy
     assert len(child_ctx.input_names) == len(in_var_names)
-    assert len(child_ctx.out_names) == len(out_var_names)
+    assert len(child_ctx.output_names) == len(out_var_names)
     assert state in parent_ctx.sdfg.nodes()
     assert not set(in_var_names).intersection(out_var_names)
 
@@ -313,7 +300,7 @@ def add_nested_sdfg(
         parent=parent_ctx.sdfg,
         # Bug in DaCe must be a set.
         inputs=set(final_child_ctx.input_names),
-        outputs=set(final_child_ctx.out_names),
+        outputs=set(final_child_ctx.output_names),
     )
 
     # Now create the connections for the input.
@@ -328,7 +315,7 @@ def add_nested_sdfg(
         )
 
     # Now we create the output connections.
-    for outer_name, inner_name in zip(out_var_names, final_child_ctx.out_names):
+    for outer_name, inner_name in zip(out_var_names, final_child_ctx.output_names):
         outer_array = parent_ctx.sdfg.arrays[outer_name]
         state.add_edge(
             nested_sdfg,
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index cbec1ba..bbb214c 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -44,7 +44,7 @@
 P = ParamSpec("P")
 NextStage = TypeVar("NextStage", bound="stages.Stage")
 TransitionFunction: TypeAlias = "Callable[Concatenate[CachingStage[NextStage], P], NextStage]"
-CachingStageType = TypeVar("CachingStageType", bound="CachingStage")
+CachingStageT = TypeVar("CachingStageT", bound="CachingStage")
 
 # Type to describe a single argument either in an abstract or concrete way.
 CallArgsSpec: TypeAlias = tuple["_AbstractCallArgument | Hashable"]
@@ -91,7 +91,7 @@ def _make_call_description(
 
 
 def cached_transition(
-    transition: Callable[Concatenate[CachingStageType, P], NextStage],
+    transition: Callable[Concatenate[CachingStageT, P], NextStage],
 ) -> Callable[Concatenate[CachingStage[NextStage], P], NextStage]:
     """
     Decorator for making the transition function of the stage cacheable.
@@ -107,7 +107,7 @@ def cached_transition(
     """
 
     @functools.wraps(transition)
-    def transition_wrapper(self: CachingStageType, *args: P.args, **kwargs: P.kwargs) -> NextStage:
+    def transition_wrapper(self: CachingStageT, *args: P.args, **kwargs: P.kwargs) -> NextStage:
         flat_call_args, in_tree = jax_tree.tree_flatten((args, kwargs))
         key = self._make_call_description(flat_call_args=flat_call_args, in_tree=in_tree)
         if key not in self._cache:
@@ -223,10 +223,10 @@ class StageTransformationSpec:
 
 
 #: Denotes the stage that is stored inside the cache.
-StageType = TypeVar("StageType", bound="stages.Stage")
+StageT = TypeVar("StageT", bound="stages.Stage")
 
 
-class StageCache(Generic[StageType]):
+class StageCache(Generic[StageT]):
     """
     Simple LRU cache to cache the results of the stage transition function.
 
@@ -235,7 +235,7 @@ class StageCache(Generic[StageType]):
     """
 
     # The most recently used entry is at the end of the `OrderedDict`.
-    _memory: collections.OrderedDict[StageTransformationSpec, StageType]
+    _memory: collections.OrderedDict[StageTransformationSpec, StageT]
     _capacity: int
 
     def __init__(
@@ -248,13 +248,13 @@ def __init__(
     def __contains__(self, key: StageTransformationSpec) -> bool:
         return key in self._memory
 
-    def __getitem__(self, key: StageTransformationSpec) -> StageType:
+    def __getitem__(self, key: StageTransformationSpec) -> StageT:
         if key not in self:
             raise KeyError(f"Key '{key}' is unknown.")
         self._memory.move_to_end(key, last=True)
         return self._memory[key]
 
-    def __setitem__(self, key: StageTransformationSpec, res: StageType) -> None:
+    def __setitem__(self, key: StageTransformationSpec, res: StageT) -> None:
         if key in self:
             self._memory.move_to_end(key, last=True)
             self._memory[key] = res
@@ -287,7 +287,7 @@ def __len__(self) -> int:
     def capacity(self) -> int:  # noqa: D102 [undocumented-public-method]
         return self._capacity
 
-    def front(self) -> tuple[StageTransformationSpec, StageType]:
+    def front(self) -> tuple[StageTransformationSpec, StageT]:
         """Returns the front of the cache, i.e. its newest entry."""
         return next(reversed(self._memory.items()))
 

From e7fa770e4672c3f2fb863a181e37dedc53200749 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 1 Jul 2024 11:25:24 +0200
Subject: [PATCH 433/458] Adapted the tests.

---
 tests/conftest.py                             |  5 +--
 .../primitive_translators/conftest.py         |  5 +--
 .../test_jaxpr_translator_builder.py          |  4 +-
 tests/unit_tests/test_caching.py              | 39 ++++++++-----------
 4 files changed, 23 insertions(+), 30 deletions(-)

diff --git a/tests/conftest.py b/tests/conftest.py
index 94cd805..bbf0eb3 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -98,6 +98,5 @@ def _set_compile_options() -> Generator[None, None, None]:
     perform any optimizations.
     Please not that certain tests might override this fixture.
     """
-    initial_compile_options = stages.update_active_compiler_options(optimization.NO_OPTIMIZATIONS)
-    yield
-    stages.update_active_compiler_options(initial_compile_options)
+    with stages.temporary_compiler_options(optimization.NO_OPTIMIZATIONS):
+        yield
diff --git a/tests/integration_tests/primitive_translators/conftest.py b/tests/integration_tests/primitive_translators/conftest.py
index 677d9ed..841f1f2 100644
--- a/tests/integration_tests/primitive_translators/conftest.py
+++ b/tests/integration_tests/primitive_translators/conftest.py
@@ -34,6 +34,5 @@ def _set_compile_options(request) -> Generator[None, None, None]:
     Todo:
         Implement a system that only runs the optimization case in CI.
     """
-    initial_compile_options = stages.update_active_compiler_options(request.param)
-    yield
-    stages.update_active_compiler_options(initial_compile_options)
+    with stages.temporary_compiler_options(request.param):
+        yield
diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index e71a189..df708dc 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -548,8 +548,8 @@ def wrapped(a: np.ndarray, b: np.ndarray) -> tuple[np.ndarray, np.ndarray]:
 
     assert len(lowered._translated_sdfg.input_names) == 2
     assert len(compiled._compiled_sdfg.input_names) == 2
-    assert len(lowered._translated_sdfg.out_names) == 2
-    assert len(compiled._compiled_sdfg.out_names) == 2
+    assert len(lowered._translated_sdfg.output_names) == 2
+    assert len(compiled._compiled_sdfg.output_names) == 2
     assert isinstance(res, tuple), f"Expected 'tuple', but got '{type(res).__name__}'."
     assert len(res) == 2
     assert np.allclose(ref, res)
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index 564d0ea..8f388b3 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -214,25 +214,23 @@ def jace_wrapped(a: np.ndarray, b: np.ndarray) -> np.ndarray:
 
 def test_caching_compilation_options() -> None:
     """Tests if the global optimization managing works."""
-    original_compile_options = stages.get_active_compiler_options()
-    try:
-        lowering_cnt = [0]
+    lowering_cnt = [0]
 
-        @jace.jit
-        def wrapped(a: float) -> float:
-            lowering_cnt[0] += 1
-            return a + 1.0
+    @jace.jit
+    def wrapped(a: float) -> float:
+        lowering_cnt[0] += 1
+        return a + 1.0
 
-        lower_cache = wrapped._cache
-        lowered = wrapped.lower(1.0)
-        compile_cache = lowered._cache
+    lower_cache = wrapped._cache
+    lowered = wrapped.lower(1.0)
+    compile_cache = lowered._cache
 
-        assert len(lower_cache) == 1
-        assert len(compile_cache) == 0
-        assert lowering_cnt[0] == 1
+    assert len(lower_cache) == 1
+    assert len(compile_cache) == 0
+    assert lowering_cnt[0] == 1
 
-        # Using the first set of options.
-        stages.update_active_compiler_options(optimization.NO_OPTIMIZATIONS)
+    # Using the first set of options.
+    with stages.temporary_compiler_options(optimization.NO_OPTIMIZATIONS):
         _ = wrapped(2.0)
 
         # Except from one entry in the compile cache, nothing should have changed.
@@ -241,9 +239,9 @@ def wrapped(a: float) -> float:
         assert compile_cache.front()[0].stage_id == id(lowered)
         assert lowering_cnt[0] == 1
 
-        # Now we change the options again which then will lead to another compilation,
-        #  but not to another lowering.
-        stages.update_active_compiler_options(optimization.DEFAULT_OPTIMIZATIONS)
+    # Now we change the options again which then will lead to another compilation,
+    #  but not to another lowering.
+    with stages.temporary_compiler_options(optimization.DEFAULT_OPTIMIZATIONS):
         _ = wrapped(2.0)
 
         assert len(lower_cache) == 1
@@ -251,9 +249,6 @@ def wrapped(a: float) -> float:
         assert compile_cache.front()[0].stage_id == id(lowered)
         assert lowering_cnt[0] == 1
 
-    finally:
-        stages.update_active_compiler_options(original_compile_options)
-
 
 def test_caching_dtype() -> None:
     """Tests if the data type is properly included in the test."""
@@ -396,7 +391,7 @@ def wrapped(a: np.ndarray) -> np.ndarray:
         return a + 10.0
 
     shape = (10, 100, 1000)
-    array_c = testutil.make_array(shape, order="c")
+    array_c = testutil.make_array(shape, order="C")
     array_f = np.array(array_c, copy=True, order="F")
 
     # First we compile run it with c strides.

From aa92f01f0825496f263bc994d0022a8f4cb55971 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Mon, 1 Jul 2024 11:33:23 +0200
Subject: [PATCH 434/458] Applied Enrique's suggestions.

---
 CODING_GUIDELINES.md                          |  4 +-
 src/jace/api.py                               |  1 -
 src/jace/stages.py                            | 88 +++++++++----------
 src/jace/tracing.py                           |  1 +
 src/jace/translated_jaxpr_sdfg.py             | 74 +++++++++-------
 .../translator/jaxpr_translator_builder.py    | 29 +++---
 src/jace/translator/post_translation.py       | 35 +++-----
 src/jace/util/translation_cache.py            | 18 ++--
 8 files changed, 121 insertions(+), 129 deletions(-)

diff --git a/CODING_GUIDELINES.md b/CODING_GUIDELINES.md
index 72cff79..2fd6961 100644
--- a/CODING_GUIDELINES.md
+++ b/CODING_GUIDELINES.md
@@ -36,7 +36,7 @@ Inside JaCe the following convention is applied:
 
 - If the module has a standard abbreviation use that, e.g. `import numpy as np`.
 - For a JaCe module use:
-  - If the module name is only a single word use it directly, e.g. `from jace import translator`
+  - If the module name is only a single word use it directly, e.g. `from jace import translator`.
   - If the module name consists of multiple words use the last word prefixed with the first letters of the others, e.g. `from jace.translator import post_translator as ptranslator` or `from jace import translated_jaxpr_sdfg as tjsdfg`.
   - In case of a clash use your best judgment.
 - For an external module use the rule above, but prefix the name with the main package's name, e.g. `from dace.codegen import compiled_sdfg as dace_csdfg`.
@@ -116,7 +116,7 @@ We generate the API documentation automatically from the docstrings using [Sphin
 Sphinx supports the [reStructuredText][sphinx-rest] (reST) markup language for defining additional formatting options in the generated documentation, however section [_3.8 Comments and Docstrings_](https://google.github.io/styleguide/pyguide.html#38-comments-and-docstrings) of the Google Python Style Guide does not specify how to use markups in docstrings. As a result, we decided to forbid reST markup in docstrings, except for the following cases:
 
 - Cross-referencing other objects using Sphinx text roles for the [Python domain](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#the-python-domain) (as explained [here](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#python-roles)).
-- Very basic formatting markup to improve _readability_ of the generated documentation without obscuring the source docstring (e.g. `"literal"` strings, bulleted lists).
+- Very basic formatting markup to improve _readability_ of the generated documentation without obscuring the source docstring (e.g. `` `literal` `` strings, bulleted lists).
 
 We highly encourage the [doctest] format for code examples in docstrings. In fact, doctest runs code examples and makes sure they are in sync with the codebase.
 
diff --git a/src/jace/api.py b/src/jace/api.py
index 6def2f4..35d722a 100644
--- a/src/jace/api.py
+++ b/src/jace/api.py
@@ -21,7 +21,6 @@
 
 __all__ = ["JITOptions", "grad", "jacfwd", "jacrev", "jit"]
 
-# Used for type annotation, see the notes in `jace.stages` for more.
 _P = ParamSpec("_P")
 _R = TypeVar("_R")
 
diff --git a/src/jace/stages.py b/src/jace/stages.py
index 1b1fa16..d16c8f1 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -27,15 +27,15 @@
 
 from __future__ import annotations
 
+import contextlib
 import copy
-import inspect
-from collections.abc import Callable, Mapping, Sequence
+from collections.abc import Callable, Generator, Mapping, Sequence
 from typing import TYPE_CHECKING, Any, Generic, ParamSpec, TypeVar, Union
 
 from jax import tree_util as jax_tree
 
 from jace import api, optimization, tracing, translated_jaxpr_sdfg as tjsdfg, translator, util
-from jace.optimization import CompilerOptions
+from jace.optimization import CompilerOptions  # Reexport for compatibility with JAX.
 from jace.translator import post_translation as ptranslation
 from jace.util import translation_cache as tcache
 
@@ -44,14 +44,14 @@
     import dace
 
 __all__ = [
-    "CompilerOptions",  # export for compatibility with JAX.
+    "CompilerOptions",
     "JaCeCompiled",
     "JaCeLowered",
     "JaCeWrapped",
     "Stage",
     "get_active_compiler_options",
-    "make_final_compilation_options",
-    "update_active_compiler_options",
+    "get_active_compiler_options",
+    "temporary_compiler_options",
 ]
 
 #: Known compilation stages in JaCe.
@@ -110,10 +110,6 @@ def __init__(
         primitive_translators: Mapping[str, translator.PrimitiveTranslator],
         jit_options: api.JITOptions,
     ) -> None:
-        # TODO(phimuell): Test if this restriction is needed.
-        assert all(
-            param.default is param.empty for param in inspect.signature(fun).parameters.values()
-        )
         super().__init__()
         self._primitive_translators = {**primitive_translators}
         self._jit_options = {**jit_options}
@@ -244,7 +240,8 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
 
         To perform the optimizations `jace_optimize()` is used. The actual options that
         are forwarded to it are obtained by passing `compiler_options` to
-        `make_final_compilation_options()`.
+        `get_active_compiler_options()`, these options are also included in the
+        key used to cache the result.
 
         Args:
             compiler_options: The optimization options to use.
@@ -252,7 +249,7 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
         # We **must** deepcopy before we do any optimization, because all optimizations
         #  are in place, to properly cache stages, stages needs to be immutable.
         tsdfg: tjsdfg.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
-        optimization.jace_optimize(tsdfg=tsdfg, **make_final_compilation_options(compiler_options))
+        optimization.jace_optimize(tsdfg=tsdfg, **get_active_compiler_options(compiler_options))
 
         return JaCeCompiled(
             compiled_sdfg=tjsdfg.compile_jaxpr_sdfg(tsdfg),
@@ -290,7 +287,7 @@ def _make_call_description(
         unflatted_args, unflatted_kwargs = jax_tree.tree_unflatten(in_tree, flat_call_args)
         assert (not unflatted_kwargs) and (len(unflatted_args) <= 1)
 
-        options = make_final_compilation_options(unflatted_args[0] if unflatted_args else {})
+        options = get_active_compiler_options(unflatted_args[0] if unflatted_args else None)
         flat_options, option_tree = jax_tree.tree_flatten(options)
         return tcache.StageTransformationSpec(
             stage_id=id(self), flat_call_args=tuple(flat_options), in_tree=option_tree
@@ -311,7 +308,7 @@ class JaCeCompiled(Generic[_R]):
     Args:
         compiled_sdfg: The compiled SDFG object.
         input_names: SDFG variables used as inputs.
-        out_names: SDFG variables used as outputs.
+        output_names: SDFG variables used as outputs.
         out_tree: Pytree describing how to unflatten the output.
 
     Note:
@@ -352,55 +349,54 @@ def __call__(self, *args: Any, **kwargs: Any) -> _R:
 _JACELOWERED_ACTIVE_COMPILE_OPTIONS: CompilerOptions = optimization.DEFAULT_OPTIMIZATIONS.copy()
 """Global set of currently active compilation/optimization options.
 
-The global set is initialized with `jace.optimization.DEFAULT_OPTIMIZATIONS`. It can be
-managed through `update_active_compiler_options()` and accessed through
-`get_active_compiler_options()`, however, it is advised that a user should use
-`make_final_compilation_options()` for getting the final options that should be used
-for optimization.
+The global set is initialized to `jace.optimization.DEFAULT_OPTIMIZATIONS`.
+For modifying the set of active options the the `temporary_compiler_options()`
+context manager is provided.
+To obtain the currently active compiler options use `get_active_compiler_options()`.
 """
 
 
-def update_active_compiler_options(new_active_options: CompilerOptions) -> CompilerOptions:
+@contextlib.contextmanager
+def temporary_compiler_options(new_active_options: CompilerOptions) -> Generator[None, None, None]:
     """
-    Updates the set of active compiler options.
+    Temporary modifies the set of active compiler options.
 
-    Merges the options passed as `new_active_options` with the currently active
-    compiler options. This set is used by `JaCeLowered.compile()` to determine
-    which options should be used.
-    The function will return the set of options that was active before the call.
+    During the activation of this context the active set of active compiler option
+    consists of the set of option that were previously active merged with the ones
+    passed through `new_active_options`.
 
-    To obtain the set of currently active options use `get_active_compiler_options()`.
+    Args:
+        new_active_options: Options that should be temporary merged with the currently
+            active options.
 
-    Todo:
-        Make a proper context manager.
+    See Also:
+        `get_active_compiler_options()` to get the set of active options that is
+        currently active.
     """
+    global _JACELOWERED_ACTIVE_COMPILE_OPTIONS  # noqa: PLW0603 [global-statement]
     previous_active_options = _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
-    _JACELOWERED_ACTIVE_COMPILE_OPTIONS.update(new_active_options)
-    return previous_active_options
-
+    try:
+        _JACELOWERED_ACTIVE_COMPILE_OPTIONS.update(new_active_options)
+        yield None
+    finally:
+        _JACELOWERED_ACTIVE_COMPILE_OPTIONS = previous_active_options
 
-def get_active_compiler_options() -> CompilerOptions:
-    """Returns the set of currently active compiler options."""
-    return _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
 
-
-def make_final_compilation_options(compiler_options: CompilerOptions | None) -> CompilerOptions:
+def get_active_compiler_options(compiler_options: CompilerOptions | None) -> CompilerOptions:
     """
-    Returns the final compilation options.
+    Get the final compiler options.
 
     There are two different sources of optimization options. The first one is the global
-    set of currently active compiler options. The second one is the options that are
-    passed to this function, which takes precedence. Thus, the `compiler_options`
-    argument describes the difference from the currently active global options.
-
-    This function is used by `JaCeLowered` if it has to determine which options to use
-    for optimization, either for compiling the lowered SDFG or for computing the key.
+    set of currently active compiler options, which is returned if `None` is passed.
+    The second one is the options that are passed to this function, which takes
+    precedence. This mode is also used by `JaCeLowered.compile()` to determine the
+    final compiler options.
 
     Args:
         compiler_options: The local compilation options.
 
     See Also:
-        `get_active_compiler_options()` to inspect the set of currently active options
-        and `update_active_compiler_options()` to modify them.
+        `temporary_compiler_options()` to modify the currently active set of compiler
+        options.
     """
-    return get_active_compiler_options() | (compiler_options or {})
+    return _JACELOWERED_ACTIVE_COMPILE_OPTIONS | (compiler_options or {})
diff --git a/src/jace/tracing.py b/src/jace/tracing.py
index 2e51251..4df5d00 100644
--- a/src/jace/tracing.py
+++ b/src/jace/tracing.py
@@ -82,6 +82,7 @@ def make_jaxpr(
         raise NotImplementedError(
             f"Not supported tracing options: {', '.join(f'{k}' for k in trace_options)}"
         )
+    # TODO(phimuell): Test if this restriction is needed.
     assert all(param.default is param.empty for param in inspect.signature(fun).parameters.values())
 
     def tracer_impl(
diff --git a/src/jace/translated_jaxpr_sdfg.py b/src/jace/translated_jaxpr_sdfg.py
index 78c7c8b..9cb9908 100644
--- a/src/jace/translated_jaxpr_sdfg.py
+++ b/src/jace/translated_jaxpr_sdfg.py
@@ -36,12 +36,14 @@ class TranslatedJaxprSDFG:
     - It does not have `__return*` variables, instead all return arguments are
         passed by arguments.
     - All input arguments are passed through arguments mentioned in `input_names`,
-        while the outputs are passed through `out_names`.
+        while the outputs are passed through `output_names`.
     - Only variables listed as in/outputs are non transient.
-    - The order of `input_names` and `out_names` is the same as in the original Jaxpr.
-    - If an input is used as outputs it appears in both `input_names` and `out_names`.
-    - Its `arg_names` is set to `input_names + out_names`, but arguments that are
+    - The order of `input_names` and `output_names` is the same as in the Jaxpr.
+    - Its `arg_names` is set to `input_names + output_names`, but arguments that are
         input and outputs are only listed as inputs.
+    - For every transient there is exactly one access node that writes to it,
+        except the name of the array starts with `__jace_mutable_`, which can
+        be written to multiple times.
 
     The only valid way to obtain a `TranslatedJaxprSDFG` is by passing a
     `TranslationContext`, that was in turn constructed by
@@ -52,7 +54,7 @@ class TranslatedJaxprSDFG:
     Attributes:
         sdfg: The encapsulated SDFG object.
         input_names: SDFG variables used as inputs.
-        out_names: SDFG variables used as outputs.
+        output_names: SDFG variables used as outputs.
 
     Todo:
         After the SDFG is compiled a lot of code looks strange, because there is
@@ -62,7 +64,7 @@ class TranslatedJaxprSDFG:
 
     sdfg: dace.SDFG
     input_names: tuple[str, ...]
-    out_names: tuple[str, ...]
+    output_names: tuple[str, ...]
 
     def validate(self) -> bool:
         """Validate the underlying SDFG."""
@@ -72,9 +74,9 @@ def validate(self) -> bool:
                 self.sdfg,
                 self.sdfg.node_id(self.sdfg.start_state),
             )
-        if any(self.sdfg.arrays[out].transient for out in self.out_names):
+        if any(self.sdfg.arrays[out].transient for out in self.output_names):
             raise dace.sdfg.InvalidSDFGError(
-                f"Found transient outputs: {(out for out in self.out_names if self.sdfg.arrays[out].transient)}",
+                f"Found transient outputs: {(out for out in self.output_names if self.sdfg.arrays[out].transient)}",
                 self.sdfg,
                 self.sdfg.node_id(self.sdfg.start_state),
             )
@@ -84,6 +86,14 @@ def validate(self) -> bool:
                 self.sdfg,
                 self.sdfg.node_id(self.sdfg.start_state),
             )
+        if (self.output_names is not None and self.input_names is not None) and (
+            set(self.output_names).intersection(self.input_names)
+        ):
+            raise dace.sdfg.InvalidSDFGError(
+                f"Inputs can not be outputs: {set(self.output_names).intersection(self.input_names)}.",
+                self.sdfg,
+                None,
+            )
         self.sdfg.validate()
         return True
 
@@ -99,15 +109,15 @@ class CompiledJaxprSDFG:
     `compile_jaxpr_sdfg()`.
 
     Args:
-        dace_csdfg: The `CompiledSDFG` object.
+        compiled_sdfg: The `CompiledSDFG` object.
         input_names: Names of the SDFG variables used as inputs.
-        out_names: Names of the SDFG variables used as outputs.
+        output_names: Names of the SDFG variables used as outputs.
 
     Attributes:
-        dace_csdfg: The `CompiledSDFG` object.
-        sdfg: The encapsulated SDFG object.
+        compiled_sdfg: The `CompiledSDFG` object.
+        sdfg: SDFG object used to generate/compile `self.compiled_sdfg`.
         input_names: Names of the SDFG variables used as inputs.
-        out_names: Names of the SDFG variables used as outputs.
+        output_names: Names of the SDFG variables used as outputs.
 
     Note:
         Currently the strides of the input arguments must match the ones that were used
@@ -118,13 +128,13 @@ class CompiledJaxprSDFG:
         arrays of length one.
     """
 
-    csdfg: dace_csdfg.CompiledSDFG
+    compiled_sdfg: dace_csdfg.CompiledSDFG
     input_names: tuple[str, ...]
-    out_names: tuple[str, ...]
+    output_names: tuple[str, ...]
 
     @property
     def sdfg(self) -> dace.SDFG:  # noqa: D102 [undocumented-public-method]
-        return self.csdfg.sdfg
+        return self.compiled_sdfg.sdfg
 
     def __call__(
         self,
@@ -137,7 +147,6 @@ def __call__(
         the output.
 
         Args:
-            dace_csdfg: The compiled SDFG to call.
             flat_call_args: Flattened input arguments.
         """
         if len(self.input_names) != len(flat_call_args):
@@ -155,26 +164,21 @@ def __call__(
             sdfg_call_args[in_name] = in_val
 
         arrays = self.sdfg.arrays
-        for out_name in self.out_names:
-            sdfg_array = arrays[out_name]
-            if out_name in sdfg_call_args:
-                if util.is_jax_array(sdfg_call_args[out_name]):
-                    raise ValueError("Passed an immutable JAX array as output.")
-            else:
-                sdfg_call_args[out_name] = dace_data.make_array_from_descriptor(sdfg_array)
-
-        assert len(sdfg_call_args) == len(self.csdfg.argnames), (
+        for output_name in self.output_names:
+            sdfg_call_args[output_name] = dace_data.make_array_from_descriptor(arrays[output_name])
+
+        assert len(sdfg_call_args) == len(self.compiled_sdfg.argnames), (
             "Failed to construct the call arguments,"
-            f" expected {len(self.csdfg.argnames)} but got {len(flat_call_args)}."
-            f"\nExpected: {self.csdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
+            f" expected {len(self.compiled_sdfg.argnames)} but got {len(flat_call_args)}."
+            f"\nExpected: {self.compiled_sdfg.argnames}\nGot: {list(sdfg_call_args.keys())}"
         )
 
         # Calling the SDFG
         with dace.config.temporary_config():
             dace.Config.set("compiler", "allow_view_arguments", value=True)
-            self.csdfg(**sdfg_call_args)
+            self.compiled_sdfg(**sdfg_call_args)
 
-        return [sdfg_call_args[out_name] for out_name in self.out_names]
+        return [sdfg_call_args[output_name] for output_name in self.output_names]
 
 
 def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> dace_csdfg.CompiledJaxprSDFG:
@@ -185,7 +189,7 @@ def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> dace_csdfg.CompiledJaxprSD
         raise ValueError("Only support SDFGs without '__return' members.")
     if tsdfg.sdfg.free_symbols:  # This is a simplification that makes our life simple.
         raise NotImplementedError(f"No free symbols allowed, found: {tsdfg.sdfg.free_symbols}")
-    if not (tsdfg.out_names or tsdfg.input_names):
+    if not (tsdfg.output_names or tsdfg.input_names):
         raise ValueError("No input nor output.")
 
     # To ensure that the SDFG is compiled and to get rid of a warning we must modify
@@ -200,7 +204,7 @@ def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> dace_csdfg.CompiledJaxprSD
         #  error/warning. This happens if we compile the same lowered SDFG multiple
         #  times with different options.
         sdfg.name = f"{sdfg.name}__{str(uuid.uuid1()).replace('-', '_')}"
-        assert len(sdfg.name) < 255  # noqa: PLR2004 magic-value-comparison  # 255 maximal file name size on UNIX.
+        assert len(sdfg.name) < 255  # noqa: PLR2004 [magic-value-comparison]  # 255 maximal file name size on UNIX.
 
         with dace.config.temporary_config():
             dace.Config.set("compiler", "use_cache", value=False)
@@ -209,11 +213,13 @@ def compile_jaxpr_sdfg(tsdfg: TranslatedJaxprSDFG) -> dace_csdfg.CompiledJaxprSD
             dace.Config.set("default_build_folder", value=pathlib.Path(".jacecache").resolve())
             sdfg._recompile = True
             sdfg._regenerate_code = True
-            csdfg: dace_csdfg.CompiledSDFG = sdfg.compile()
+            compiled_sdfg: dace_csdfg.CompiledSDFG = sdfg.compile()
 
     finally:
         sdfg.name = original_sdfg_name
         sdfg._recompile = original_recompile
         sdfg._regenerate_code = original_regenerate_code
 
-    return CompiledJaxprSDFG(csdfg=csdfg, input_names=tsdfg.input_names, out_names=tsdfg.out_names)
+    return CompiledJaxprSDFG(
+        compiled_sdfg=compiled_sdfg, input_names=tsdfg.input_names, output_names=tsdfg.output_names
+    )
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 9285323..0d6adaa 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -608,7 +608,7 @@ def _translate_jaxpr_internal(self, jaxpr: jax_core.ClosedJaxpr) -> TranslationC
                 jaxpr.jaxpr.outvars, prevent_creation=True, handle_literals=False
             )
 
-        self._ctx.out_names = tuple(out_var_names)
+        self._ctx.output_names = tuple(out_var_names)
 
         return cast(TranslationContext, self._clear_translation_ctx())
 
@@ -631,11 +631,12 @@ def _handle_null_jaxpr(self, jaxpr: jax_core.ClosedJaxpr) -> list[str]:
             - Handle the case if if the output is a literal.
 
         Note:
-            The function will _not_ update the `out_names` field of the current context.
+            The function will _not_ update the `output_names` field of the current
+            context.
         """
         assert self._ctx.terminal_state is self._ctx.start_state
         assert isinstance(self._ctx.input_names, tuple)
-        assert self._ctx.out_names is None
+        assert self._ctx.output_names is None
 
         # There is not output so we do not have to copy anything around.
         if not jaxpr.out_avals:
@@ -704,7 +705,7 @@ class TranslationContext:
     Attributes:
         sdfg: The encapsulated SDFG object.
         input_names: A list of the SDFG variables that are used as input
-        out_names: A list of the SDFG variables that are used as output.
+        output_names: A list of the SDFG variables that are used as output.
         start_state: The first state in the SDFG state machine.
         terminal_state: The (currently) last state in the state machine.
         jaxpr: The Jaxpr that was used to translate.
@@ -715,11 +716,13 @@ class TranslationContext:
     Note:
         Access of any attribute of this class by an outside user is considered
         undefined behaviour.
+        Furthermore, the encapsulated SDFG should be seen as a verbatim translation
+        of the initial Jaxpr.
     """
 
     sdfg: dace.SDFG
     input_names: tuple[str, ...] | None
-    out_names: tuple[str, ...] | None
+    output_names: tuple[str, ...] | None
     start_state: dace.SDFGState
     terminal_state: dace.SDFGState
     jaxpr: jax_core.ClosedJaxpr
@@ -730,7 +733,7 @@ def __init__(self, name: str | None, jaxpr: jax_core.ClosedJaxpr) -> None:
 
         self.sdfg = dace.SDFG(name=(name or f"unnamed_SDFG_{id(self)}"))
         self.input_names = None
-        self.out_names = None
+        self.output_names = None
         self.start_state = self.sdfg.add_state(label="initial_state", is_start_block=True)
         self.terminal_state = self.start_state
         self.jaxpr = jaxpr
@@ -747,14 +750,14 @@ def validate(self) -> bool:
                 f"Expected to find '{self.start_state}' as start state,"
                 f" but instead found '{self.sdfg.start_block}'.",
                 self.sdfg,
-                self.sdfg.node_id(self.start_state),
+                None,
             )
         if {self.terminal_state} != set(self.sdfg.sink_nodes()):
             raise dace.sdfg.InvalidSDFGError(
                 f"Expected to find as terminal state '{self.terminal_state}',"
                 f" but instead found '{self.sdfg.sink_nodes()}'.",
                 self.sdfg,
-                self.sdfg.node_id(self.terminal_state),
+                None,
             )
         if not (
             self.input_names is None
@@ -763,15 +766,15 @@ def validate(self) -> bool:
             raise dace.sdfg.InvalidSDFGError(
                 f"Missing input arguments: {(input_name for input_name in self.input_names if input_name not in self.sdfg.arrays)}",
                 self.sdfg,
-                self.sdfg.node_id(self.terminal_state),
+                None,
             )
         if not (
-            self.out_names is None
-            or all(out_name in self.sdfg.arrays for out_name in self.out_names)
+            self.output_names is None
+            or all(output_name in self.sdfg.arrays for output_name in self.output_names)
         ):
             raise dace.sdfg.InvalidSDFGError(
-                f"Missing output arguments: {(out_name for out_name in self.out_names if out_name not in self.sdfg.arrays)}",
+                f"Missing output arguments: {(output_name for output_name in self.output_names if output_name not in self.sdfg.arrays)}",
                 self.sdfg,
-                self.sdfg.node_id(self.terminal_state),
+                None,
             )
         return True
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index 8242060..a00b651 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -43,6 +43,7 @@ def postprocess_jaxpr_sdfg(
     Todo:
         - Fixing the scalar input problem on GPU.
         - Fixing stride problem of the input.
+        - Make it such that the context is not modified as a side effect.
     """
     trans_ctx.validate()  # Always validate, it is cheap.
     create_input_output_stages(trans_ctx=trans_ctx, flat_call_args=flat_call_args)
@@ -73,29 +74,21 @@ def _create_output_state(trans_ctx: translator.TranslationContext) -> None:
     Creates the output processing stage for the SDFG in place.
 
     The function will create a new terminal state, in which all outputs, denoted
-    in `trans_ctx.out_names`, will be written into new SDFG variables. In case the
+    in `trans_ctx.output_names`, will be written into new SDFG variables. In case the
     output variable is a scalar, the output will be replaced by an array of length one.
     This behaviour is consistent with JAX.
 
     Args:
         trans_ctx: The translation context to process.
     """
-    assert trans_ctx.input_names is not None and trans_ctx.out_names is not None
-
-    # NOTE: Currently we do not support to write back into an input argument, as JAX.
-    #  However, this is a requirement for handling ICON stencils, that we will support
-    #  eventually. If we get a translation context that lists a variable name in the
-    #  inputs and outputs, this means that it was returned unmodified. In JAX this
-    #  will lead to a copy and we also do it. This is implemented by just naïvely
-    #  creating a separate output variable for every output we have, irrespectively
-    #  of its name inside the Jaxpr.
+    assert trans_ctx.input_names is not None and trans_ctx.output_names is not None
 
     output_pattern = "__jace_output_{}"
     sdfg = trans_ctx.sdfg
     new_output_state: dace.SDFGState = sdfg.add_state("output_processing_stage")
     new_output_names: list[str] = []
 
-    for i, org_output_name in enumerate(trans_ctx.out_names):
+    for i, org_output_name in enumerate(trans_ctx.output_names):
         new_output_name = output_pattern.format(i)
         org_output_desc: dace.data.Data = sdfg.arrays[org_output_name]
         assert org_output_desc.transient
@@ -126,7 +119,7 @@ def _create_output_state(trans_ctx: translator.TranslationContext) -> None:
 
     sdfg.add_edge(trans_ctx.terminal_state, new_output_state, dace.InterstateEdge())
     trans_ctx.terminal_state = new_output_state
-    trans_ctx.out_names = tuple(new_output_names)
+    trans_ctx.output_names = tuple(new_output_names)
 
 
 def _create_input_state(
@@ -148,11 +141,7 @@ def _create_input_state(
     Todo:
         Handle transfer of scalar input in GPU mode.
     """
-    assert trans_ctx.input_names is not None and trans_ctx.out_names is not None
-
-    # NOTE: This function will create a distinct variable for every input. Once we
-    #  allow write back arguments they will be handled in the `_create_output_state()`
-    #  function anyway, also see the comment in that function.
+    assert trans_ctx.input_names is not None and trans_ctx.output_names is not None
 
     if len(flat_call_args) != len(trans_ctx.input_names):
         raise ValueError(f"Expected {len(trans_ctx.input_names)}, but got {len(flat_call_args)}.")
@@ -205,7 +194,7 @@ def finalize_translation_context(
     validate: bool = True,
 ) -> tjsdfg.TranslatedJaxprSDFG:
     """
-    Finalizes the supplied translation context `trans_ctx`.
+    Finalizes the translation context and returns a `TranslatedJaxprSDFG` object.
 
     The function will process the SDFG that is encapsulated inside the context, i.e. a
     canonical one, into a proper SDFG, as it is described in `TranslatedJaxprSDFG`. It
@@ -223,23 +212,21 @@ def finalize_translation_context(
     trans_ctx.validate()
     if trans_ctx.input_names is None:
         raise ValueError("Input names are not specified.")
-    if trans_ctx.out_names is None:
+    if trans_ctx.output_names is None:
         raise ValueError("Output names are not specified.")
-    if not (trans_ctx.out_names or trans_ctx.input_names):
+    if not (trans_ctx.output_names or trans_ctx.input_names):
         raise ValueError("No input nor output.")
 
     # We guarantee decoupling
     tsdfg = tjsdfg.TranslatedJaxprSDFG(
         sdfg=copy.deepcopy(trans_ctx.sdfg),
         input_names=trans_ctx.input_names,
-        out_names=trans_ctx.out_names,
+        output_names=trans_ctx.output_names,
     )
 
     # Make inputs and outputs to globals.
     sdfg_arg_names: list[str] = []
-    for arg_name in tsdfg.input_names + tsdfg.out_names:
-        if arg_name in sdfg_arg_names:
-            continue
+    for arg_name in tsdfg.input_names + tsdfg.output_names:
         tsdfg.sdfg.arrays[arg_name].transient = False
         sdfg_arg_names.append(arg_name)
     tsdfg.sdfg.arg_names = sdfg_arg_names
diff --git a/src/jace/util/translation_cache.py b/src/jace/util/translation_cache.py
index cbec1ba..bbb214c 100644
--- a/src/jace/util/translation_cache.py
+++ b/src/jace/util/translation_cache.py
@@ -44,7 +44,7 @@
 P = ParamSpec("P")
 NextStage = TypeVar("NextStage", bound="stages.Stage")
 TransitionFunction: TypeAlias = "Callable[Concatenate[CachingStage[NextStage], P], NextStage]"
-CachingStageType = TypeVar("CachingStageType", bound="CachingStage")
+CachingStageT = TypeVar("CachingStageT", bound="CachingStage")
 
 # Type to describe a single argument either in an abstract or concrete way.
 CallArgsSpec: TypeAlias = tuple["_AbstractCallArgument | Hashable"]
@@ -91,7 +91,7 @@ def _make_call_description(
 
 
 def cached_transition(
-    transition: Callable[Concatenate[CachingStageType, P], NextStage],
+    transition: Callable[Concatenate[CachingStageT, P], NextStage],
 ) -> Callable[Concatenate[CachingStage[NextStage], P], NextStage]:
     """
     Decorator for making the transition function of the stage cacheable.
@@ -107,7 +107,7 @@ def cached_transition(
     """
 
     @functools.wraps(transition)
-    def transition_wrapper(self: CachingStageType, *args: P.args, **kwargs: P.kwargs) -> NextStage:
+    def transition_wrapper(self: CachingStageT, *args: P.args, **kwargs: P.kwargs) -> NextStage:
         flat_call_args, in_tree = jax_tree.tree_flatten((args, kwargs))
         key = self._make_call_description(flat_call_args=flat_call_args, in_tree=in_tree)
         if key not in self._cache:
@@ -223,10 +223,10 @@ class StageTransformationSpec:
 
 
 #: Denotes the stage that is stored inside the cache.
-StageType = TypeVar("StageType", bound="stages.Stage")
+StageT = TypeVar("StageT", bound="stages.Stage")
 
 
-class StageCache(Generic[StageType]):
+class StageCache(Generic[StageT]):
     """
     Simple LRU cache to cache the results of the stage transition function.
 
@@ -235,7 +235,7 @@ class StageCache(Generic[StageType]):
     """
 
     # The most recently used entry is at the end of the `OrderedDict`.
-    _memory: collections.OrderedDict[StageTransformationSpec, StageType]
+    _memory: collections.OrderedDict[StageTransformationSpec, StageT]
     _capacity: int
 
     def __init__(
@@ -248,13 +248,13 @@ def __init__(
     def __contains__(self, key: StageTransformationSpec) -> bool:
         return key in self._memory
 
-    def __getitem__(self, key: StageTransformationSpec) -> StageType:
+    def __getitem__(self, key: StageTransformationSpec) -> StageT:
         if key not in self:
             raise KeyError(f"Key '{key}' is unknown.")
         self._memory.move_to_end(key, last=True)
         return self._memory[key]
 
-    def __setitem__(self, key: StageTransformationSpec, res: StageType) -> None:
+    def __setitem__(self, key: StageTransformationSpec, res: StageT) -> None:
         if key in self:
             self._memory.move_to_end(key, last=True)
             self._memory[key] = res
@@ -287,7 +287,7 @@ def __len__(self) -> int:
     def capacity(self) -> int:  # noqa: D102 [undocumented-public-method]
         return self._capacity
 
-    def front(self) -> tuple[StageTransformationSpec, StageType]:
+    def front(self) -> tuple[StageTransformationSpec, StageT]:
         """Returns the front of the cache, i.e. its newest entry."""
         return next(reversed(self._memory.items()))
 

From a25ecb79e01ad30bac14fc4b44736fb3d184214c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 2 Jul 2024 08:11:11 +0200
Subject: [PATCH 435/458] Added Enrique's suggestions.

---
 src/jace/stages.py                            | 36 +++++++++----------
 .../translator/jaxpr_translator_builder.py    |  3 +-
 2 files changed, 20 insertions(+), 19 deletions(-)

diff --git a/src/jace/stages.py b/src/jace/stages.py
index ea3312f..93e0f85 100644
--- a/src/jace/stages.py
+++ b/src/jace/stages.py
@@ -50,9 +50,8 @@
     "JaCeLowered",
     "JaCeWrapped",
     "Stage",
-    "get_active_compiler_options",
-    "get_active_compiler_options",
-    "temporary_compiler_options",
+    "get_compiler_options",
+    "set_compiler_options",
 ]
 
 #: Known compilation stages in JaCe.
@@ -216,7 +215,8 @@ class JaCeLowered(tcache.CachingStage["JaCeCompiled"], Generic[_R]):
     Args:
         tsdfg: The lowered SDFG with metadata.
         out_tree: The pytree describing how to unflatten the output.
-        jaxpr: The Jaxpr expression that was translated.
+        jaxpr: The Jaxpr expression that was translated into an SDFG. Intended to be
+            used during debugging and inspection.
 
     Note:
         `self` will manage the passed `tsdfg` object. Modifying it results is undefined
@@ -246,7 +246,7 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
 
         To perform the optimizations `jace_optimize()` is used. The actual options that
         are forwarded to it are obtained by passing `compiler_options` to
-        `get_active_compiler_options()`, these options are also included in the
+        `get_compiler_options()`, these options are also included in the
         key used to cache the result.
 
         Args:
@@ -255,7 +255,7 @@ def compile(self, compiler_options: CompilerOptions | None = None) -> JaCeCompil
         # We **must** deepcopy before we do any optimization, because all optimizations
         #  are in place, to properly cache stages, stages needs to be immutable.
         tsdfg: tjsdfg.TranslatedJaxprSDFG = copy.deepcopy(self._translated_sdfg)
-        optimization.jace_optimize(tsdfg=tsdfg, **get_active_compiler_options(compiler_options))
+        optimization.jace_optimize(tsdfg=tsdfg, **get_compiler_options(compiler_options))
 
         return JaCeCompiled(
             compiled_sdfg=tjsdfg.compile_jaxpr_sdfg(tsdfg),
@@ -293,7 +293,7 @@ def _make_call_description(
         unflatted_args, unflatted_kwargs = jax_tree.tree_unflatten(in_tree, flat_call_args)
         assert (not unflatted_kwargs) and (len(unflatted_args) <= 1)
 
-        options = get_active_compiler_options(unflatted_args[0] if unflatted_args else None)
+        options = get_compiler_options(unflatted_args[0] if unflatted_args else None)
         flat_options, option_tree = jax_tree.tree_flatten(options)
         return tcache.StageTransformationSpec(
             stage_id=id(self), flat_call_args=tuple(flat_options), in_tree=option_tree
@@ -356,39 +356,39 @@ def __call__(self, *args: Any, **kwargs: Any) -> _R:
 """Global set of currently active compilation/optimization options.
 
 The global set is initialized to `jace.optimization.DEFAULT_OPTIMIZATIONS`.
-For modifying the set of active options the the `temporary_compiler_options()`
+For modifying the set of active options the the `set_compiler_options()`
 context manager is provided.
-To obtain the currently active compiler options use `get_active_compiler_options()`.
+To obtain the currently active compiler options use `get_compiler_options()`.
 """
 
 
 @contextlib.contextmanager
-def temporary_compiler_options(new_active_options: CompilerOptions) -> Generator[None, None, None]:
+def set_compiler_options(compiler_options: CompilerOptions) -> Generator[None, None, None]:
     """
     Temporary modifies the set of active compiler options.
 
     During the activation of this context the active set of active compiler option
     consists of the set of option that were previously active merged with the ones
-    passed through `new_active_options`.
+    passed through `compiler_options`.
 
     Args:
-        new_active_options: Options that should be temporary merged with the currently
+        compiler_options: Options that should be temporary merged with the currently
             active options.
 
     See Also:
-        `get_active_compiler_options()` to get the set of active options that is
+        `get_compiler_options()` to get the set of active options that is
         currently active.
     """
     global _JACELOWERED_ACTIVE_COMPILE_OPTIONS  # noqa: PLW0603 [global-statement]
-    previous_active_options = _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
+    previous_compiler_options = _JACELOWERED_ACTIVE_COMPILE_OPTIONS.copy()
     try:
-        _JACELOWERED_ACTIVE_COMPILE_OPTIONS.update(new_active_options)
+        _JACELOWERED_ACTIVE_COMPILE_OPTIONS.update(compiler_options)
         yield None
     finally:
-        _JACELOWERED_ACTIVE_COMPILE_OPTIONS = previous_active_options
+        _JACELOWERED_ACTIVE_COMPILE_OPTIONS = previous_compiler_options
 
 
-def get_active_compiler_options(compiler_options: CompilerOptions | None) -> CompilerOptions:
+def get_compiler_options(compiler_options: CompilerOptions | None) -> CompilerOptions:
     """
     Get the final compiler options.
 
@@ -402,7 +402,7 @@ def get_active_compiler_options(compiler_options: CompilerOptions | None) -> Com
         compiler_options: The local compilation options.
 
     See Also:
-        `temporary_compiler_options()` to modify the currently active set of compiler
+        `set_compiler_options()` to modify the currently active set of compiler
         options.
     """
     return _JACELOWERED_ACTIVE_COMPILE_OPTIONS | (compiler_options or {})
diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 7ccd47c..9b76407 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -759,7 +759,8 @@ class TranslationContext:
         output_names: A list of the SDFG variables that are used as output.
         start_state: The first state in the SDFG state machine.
         terminal_state: The (currently) last state in the state machine.
-        jaxpr: The Jaxpr that was used to translate.
+        jaxpr: The Jaxpr expression that was translated into an SDFG. Intended to be
+            used during debugging and inspection.
 
     Args:
         name: The name of the SDFG.

From 3048019fc896ec5481531593e868e78214f24ea2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 2 Jul 2024 08:11:25 +0200
Subject: [PATCH 436/458] Updated the tests.

---
 tests/conftest.py                                         | 2 +-
 tests/integration_tests/primitive_translators/conftest.py | 2 +-
 tests/unit_tests/test_caching.py                          | 4 ++--
 3 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/tests/conftest.py b/tests/conftest.py
index bbf0eb3..9f454a1 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -98,5 +98,5 @@ def _set_compile_options() -> Generator[None, None, None]:
     perform any optimizations.
     Please not that certain tests might override this fixture.
     """
-    with stages.temporary_compiler_options(optimization.NO_OPTIMIZATIONS):
+    with stages.set_compiler_options(optimization.NO_OPTIMIZATIONS):
         yield
diff --git a/tests/integration_tests/primitive_translators/conftest.py b/tests/integration_tests/primitive_translators/conftest.py
index 841f1f2..9ff54e6 100644
--- a/tests/integration_tests/primitive_translators/conftest.py
+++ b/tests/integration_tests/primitive_translators/conftest.py
@@ -34,5 +34,5 @@ def _set_compile_options(request) -> Generator[None, None, None]:
     Todo:
         Implement a system that only runs the optimization case in CI.
     """
-    with stages.temporary_compiler_options(request.param):
+    with stages.set_compiler_options(request.param):
         yield
diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index 8f388b3..60be130 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -230,7 +230,7 @@ def wrapped(a: float) -> float:
     assert lowering_cnt[0] == 1
 
     # Using the first set of options.
-    with stages.temporary_compiler_options(optimization.NO_OPTIMIZATIONS):
+    with stages.set_compiler_options(optimization.NO_OPTIMIZATIONS):
         _ = wrapped(2.0)
 
         # Except from one entry in the compile cache, nothing should have changed.
@@ -241,7 +241,7 @@ def wrapped(a: float) -> float:
 
     # Now we change the options again which then will lead to another compilation,
     #  but not to another lowering.
-    with stages.temporary_compiler_options(optimization.DEFAULT_OPTIMIZATIONS):
+    with stages.set_compiler_options(optimization.DEFAULT_OPTIMIZATIONS):
         _ = wrapped(2.0)
 
         assert len(lower_cache) == 1

From f9ee01a66c083f25621a57bec0035a31ca886369 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 13 Sep 2024 13:59:12 +0200
Subject: [PATCH 437/458] Made some small modifications.

---
 src/jace/translator/primitive_translators/copy_translator.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/jace/translator/primitive_translators/copy_translator.py b/src/jace/translator/primitive_translators/copy_translator.py
index 650b483..6de5ab9 100644
--- a/src/jace/translator/primitive_translators/copy_translator.py
+++ b/src/jace/translator/primitive_translators/copy_translator.py
@@ -23,7 +23,7 @@
     from jax import core as jax_core
 
 
-class CopyTranslator:
+class CopyTranslator(translator.PrimitiveTranslator):
     """
     Implements the `copy` primitive.
 

From fa65ee7744b3028cbc27f02ddc1cbb3bdbc11ceb Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 13 Sep 2024 14:17:48 +0200
Subject: [PATCH 438/458] Ported the gather translator.

It is just ported and some variables are renamed.
---
 .../primitive_translators/__init__.py         |   2 +
 .../gather_translator.py                      | 211 ++++++++++++++++++
 2 files changed, 213 insertions(+)
 create mode 100644 src/jace/translator/primitive_translators/gather_translator.py

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index e0ef301..9e2fec0 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -17,6 +17,7 @@
 from .conditions import condition_translator
 from .convert_element_type_translator import ConvertElementTypeTranslator
 from .copy_translator import CopyTranslator, DevicePutTranslator
+from .gather_translator import GatherTranslator
 from .iota_translator import IotaTranslator
 from .pjit_translator import PJITTranslator
 from .reshape_translator import ReshapeTranslator
@@ -32,6 +33,7 @@
     "ConvertElementTypeTranslator",
     "CopyTranslator",
     "DevicePutTranslator",
+    "GatherTranslator",
     "IotaTranslator",
     "LogicalOperationTranslator",
     "PJITTranslator",
diff --git a/src/jace/translator/primitive_translators/gather_translator.py b/src/jace/translator/primitive_translators/gather_translator.py
new file mode 100644
index 0000000..343ee15
--- /dev/null
+++ b/src/jace/translator/primitive_translators/gather_translator.py
@@ -0,0 +1,211 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements the translator for the `gather` primitive."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import dace
+from jax import lax as jax_lax
+from typing_extensions import override
+
+from jace import translator, util
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
+class GatherTranslator(translator.PrimitiveTranslator):
+    """
+    Garther Translator.
+
+    The gather operation extracts patches of a certain size, known as `slice_size`,
+    from an array, called source or input array. Where these patches starts is
+    given by another array, the index array.
+
+    See Also:
+        https://www.tensorflow.org/xla/operation_semantics#gather
+        https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.gather.html
+    """
+
+    @property
+    def primitive(self) -> str:  # noqa: D102  # No docstring needed.
+        return "gather"
+
+    @override
+    def __call__(  # noqa: PLR0914, PLR0915  # Just ported from the prototype, cleanup postponed.
+        self,
+        builder: translator.JaxprTranslationBuilder,
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        """
+        Performs the gather operation.
+
+        Args:
+            builder: The builder object that is active.
+            in_var_names: The names of the input variables, the first array is
+                assumed as source array and the second is the index array.
+            out_var_names: The names of the output variables.
+            eqn: The equation to translate.
+            eqn_state: The state in which we put the extraction.
+        """
+        assert len(eqn.invars) == 2  # noqa: PLR2004  # XLA supports more inputs.
+
+        out_name = out_var_names[0]
+        out_shape = util.get_jax_var_shape(eqn.outvars[0])
+
+        src_name = in_var_names[0]
+        src_shape = util.get_jax_var_shape(eqn.invars[0])
+
+        idx_name = in_var_names[1]
+        idx_shape = util.get_jax_var_shape(eqn.invars[1])
+
+        dimension_numbers = eqn.params["dimension_numbers"]
+        offset_dims: Sequence[int] = dimension_numbers.offset_dims
+        collapsed_slice_dims: Sequence[int] = dimension_numbers.collapsed_slice_dims
+        start_index_map: Sequence[int] = dimension_numbers.start_index_map
+        slice_sizes: Sequence[int] = eqn.params["slice_sizes"]
+        mode: jax_lax.GatherScatterMode = eqn.params["mode"]
+        assert len(start_index_map) == idx_shape[-1]
+
+        if mode != jax_lax.GatherScatterMode.PROMISE_IN_BOUNDS:
+            raise NotImplementedError(f"The mode {mode} is not implemented.")
+
+        # Over these dimensions the copy of the patches goes.
+        batch_dims = tuple(d for d in range(len(out_shape)) if d not in offset_dims)
+
+        # Every batch dimension is associated with one dimension of of the index
+        #  array, but there is always one dimension more in the index array. This
+        #  dimension contains the start indexes of the slice, if there is only
+        #  one index that should be loaded is not strictly necessary, but Jax
+        #  (currently adds) it implicitly, probably to make life easier.
+        if (len(batch_dims) + 1) != len(idx_shape):
+            raise ValueError(
+                f"Expected that the index array has {len(batch_dims) + 1} dimensions, but it had {len(idx_shape)}."
+            )
+
+        # These are the dimensions (of the input) for which a map index is created.
+        #  Note that we exclude collapsed dimensions here.
+        src_dim_with_map_idx = tuple(
+            dim for dim in range(len(slice_sizes)) if dim not in collapsed_slice_dims
+        )
+        assert len(src_dim_with_map_idx) == len(offset_dims)
+
+        # The final map is the composition of two loops. The first map iterates over
+        #  the index array, except the last dimension, and is used to "copy" the
+        #  different patches from the source to the output array. These map parameters
+        #  follow the pattern `__i{out_name}_gather{bd}`, where `bd` is a batch
+        #  dimension. These variables are used to access the index array.
+        #  The second loop performs the actual copy of the slices. For these
+        #  the variables `__i{i}` is used were, these are known as offset
+        #  dimensions.
+        #  What is a bit difficult, that the actual access/dereferencing of the source
+        #  array is done within the tasklet.
+
+        # Access pattern of the source array _within_ the tasklet.
+        src_access_pattern: list[str] = []
+
+        # These are the map ranges for the coying of the slicing.
+        slice_map_ranges: list[tuple[str, str]] = []
+
+        # Compute the access pattern within the tasklet.
+        #  As a side effect we also compute the map ranges, but only for the slices.
+        for dim, slice_size in enumerate(slice_sizes):
+            # Order is important!
+            if dim not in start_index_map:
+                # This dimension is fully copied
+                slice_map_ranges.append((f"__i{dim}", f"0:{slice_size}"))
+                src_access_pattern.append(slice_map_ranges[-1][0])
+                assert dim in src_dim_with_map_idx
+                assert slice_size == src_shape[dim]
+
+            elif dim in collapsed_slice_dims:
+                # This dimension is only partially copied, however, since the
+                #  dimension is collapsed, only a single element is copied that
+                #  comes from the index array.
+                src_access_pattern.append(f"__gather_{dim}")
+
+            else:
+                # This dimension is partially copied, but is _not colapsed_, we need
+                #  a map index to copy the range. However, there is also an offset
+                #  that is involved from copying.
+                slice_map_ranges.append((f"__i{dim}", f"0:{slice_size}"))
+                src_access_pattern.append(f"__gather_{dim} + {slice_map_ranges[-1][0]}")
+                assert dim in src_dim_with_map_idx
+                assert slice_size <= src_shape[dim]
+
+        # These are the map variable that go over the index array.
+        patch_loop_vars = tuple(f"__i{out_name}_gather{bd}" for bd in batch_dims)
+        patch_map_ranges = [
+            (map_param, f"0:{patch_loop_bound}")
+            for map_param, patch_loop_bound in zip(patch_loop_vars, idx_shape[:-1])
+        ]
+
+        # Creating the input memlet that allows us to access the source array from
+        #  inside the tasklet and make it accessible through the name `__arr`. At
+        #  this point it is not possible to tell where we access, because we are
+        #  missing a index variables, they will only be accessible inside the
+        #  tasklet (see below), however, we know that we will access only one
+        #  element from the array.
+        tasklet_inputs: dict[str, dace.Memlet] = {
+            "__arr": dace.Memlet.simple(
+                data=src_name,
+                subset_str=", ".join(f"0:{size}" for size in src_shape),
+                num_accesses=1,
+            ),
+        }
+
+        # Now we are creating the memlets that access the index array.
+        for i, dim in enumerate(start_index_map):
+            tasklet_inputs[f"__gather_{dim}"] = dace.Memlet.simple(
+                data=idx_name, subset_str=(", ".join(patch_loop_vars) + f", {i}")
+            )
+
+        # The tasklet code.
+        tasklet_code = "__out = __arr[" + ", ".join(src_access_pattern) + "]"
+
+        # Now we generate the output memlet.
+        outpt_access_pattern: list[str] = []
+        dim_counter = 0
+        for dim in range(len(out_shape)):
+            if dim in batch_dims:
+                # This is a batch dimension, thus a loop variable is used for it.
+                patch_loop_var = patch_loop_vars[batch_dims.index(dim)]
+                outpt_access_pattern.append(str(patch_loop_var))
+
+            else:
+                # This is a dimension for copying the slices.
+                assert dim_counter <= len(src_dim_with_map_idx)
+                associated_map_idx = src_dim_with_map_idx[dim_counter]
+                dim_counter += 1
+                outpt_access_pattern.append(f"__i{associated_map_idx}")
+        assert dim_counter == len(src_dim_with_map_idx)
+
+        tasklet_outputs: dict[str, dace.Memlet] = {
+            "__out": dace.Memlet.simple(data=out_name, subset_str=", ".join(outpt_access_pattern))
+        }
+        assert len(patch_map_ranges) + len(slice_map_ranges) == len(out_shape)
+
+        eqn_state.add_mapped_tasklet(
+            name=f"_gather_map_{out_name}",
+            map_ranges=patch_map_ranges + slice_map_ranges,
+            inputs=tasklet_inputs,
+            code=tasklet_code,
+            outputs=tasklet_outputs,
+            external_edges=True,
+        )
+
+
+_ = translator.register_primitive_translator(GatherTranslator())

From b9f94274fd7680aec7e7e48ccbb7608b8a0be4e0 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 13 Sep 2024 14:52:11 +0200
Subject: [PATCH 439/458] Made it possible the the `make_array()` function is
 able scale automatically.

---
 tests/util.py | 29 ++++++++++++++++++++++-------
 1 file changed, 22 insertions(+), 7 deletions(-)

diff --git a/tests/util.py b/tests/util.py
index aa89d2b..1fa2e07 100644
--- a/tests/util.py
+++ b/tests/util.py
@@ -10,7 +10,7 @@
 from __future__ import annotations
 
 from collections.abc import Mapping, Sequence
-from typing import Literal
+from typing import Any, Literal
 
 import numpy as np
 
@@ -24,6 +24,8 @@ def make_array(
     shape: Sequence[int] | int,
     dtype: type = np.float64,
     order: Literal[None, "K", "A", "C", "F"] = "C",
+    low: Any = None,
+    high: Any = None,
 ) -> np.ndarray:
     """Generates a NumPy ndarray with shape `shape`.
 
@@ -31,11 +33,17 @@ def make_array(
     fixture. Thus inside a function the value will be deterministic.
 
     Args:
-        shape:      The shape to use.
-        dtype:      The data type to use.
-
-    Notes:
-        Floating point based values are generated in the range 0 to 1.0.
+        shape: The shape to use.
+        dtype: The data type to use.
+        order: The order of the underlying array
+        low: Minimal value.
+        high: Maximal value.
+
+    Note:
+        The exact meaning of `low` and `high` depend on the type. For `bool` they
+        are ignored. For float both must be specified and then values inside
+        `[low, high)` are generated. For integer it is possible to specify only one.
+        The appropriate numeric limit is used for the other.
     """
 
     if shape == ():
@@ -48,12 +56,19 @@ def make_array(
     elif np.issubdtype(dtype, np.integer):
         iinfo: np.iinfo = np.iinfo(dtype)
         res = np.random.randint(  # noqa: NPY002 [numpy-legacy-random]
-            low=iinfo.min, high=iinfo.max, size=shape, dtype=dtype
+            low=iinfo.min if low is None else low,
+            high=iinfo.max if high is None else high,
+            size=shape,
+            dtype=dtype,
         )
     elif np.issubdtype(dtype, np.complexfloating):
         res = make_array(shape, np.float64) + 1.0j * make_array(shape, np.float64)
     else:
         res = np.random.random(shape)  # type: ignore[assignment]  # noqa: NPY002 [numpy-legacy-random]
+        if low is not None and high is not None:
+            res = low + (high - low) * res
+        assert (low is None) == (high is None)
+
     return np.array(res, order=order, dtype=dtype)
 
 
From 5a3c87fc69c53fe675e0a4a71b85db274781d2c4 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 13 Sep 2024 14:55:24 +0200
Subject: [PATCH 440/458] Added tests for the gather primitive.

---
 .../test_primitive_gather.py                  | 83 +++++++++++++++++++
 1 file changed, 83 insertions(+)
 create mode 100644 tests/integration_tests/primitive_translators/test_primitive_gather.py

diff --git a/tests/integration_tests/primitive_translators/test_primitive_gather.py b/tests/integration_tests/primitive_translators/test_primitive_gather.py
new file mode 100644
index 0000000..35cfbb2
--- /dev/null
+++ b/tests/integration_tests/primitive_translators/test_primitive_gather.py
@@ -0,0 +1,83 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+from __future__ import annotations
+
+from collections.abc import Callable
+from typing import Any
+
+import numpy as np
+from jax import numpy as jnp
+
+import jace
+
+from tests import util as testutil
+
+
+def _perform_gather_test(
+    testee: Callable,
+    *args: Any,
+) -> None:
+    wrapped = jace.jit(testee)
+
+    expected = testee(*args)
+    result = wrapped(*args)
+
+    assert np.allclose(expected, result)
+
+
+def test_gather_simple_1():
+    def testee(
+        a: np.ndarray,
+        idx: np.ndarray,
+    ) -> np.ndarray:
+        return a[idx]
+
+    a = testutil.make_array(100)
+    idx = testutil.make_array(300, dtype=np.int32, low=0, high=100)
+    _perform_gather_test(testee, a, idx)
+
+
+def test_gather_1():
+    def testee(
+        a: np.ndarray,
+        idx: np.ndarray,
+    ) -> np.ndarray:
+        return a[idx, :, idx]
+
+    a = testutil.make_array((300, 3, 300))
+    idx = testutil.make_array(400, dtype=np.int32, low=1, high=300)
+    _perform_gather_test(testee, a, idx)
+
+
+def test_gather_2():
+    def testee(
+        a: np.ndarray,
+        idx: np.ndarray,
+    ) -> np.ndarray:
+        return a[idx, :, :]
+
+    a = testutil.make_array((300, 3, 300))
+    idx = testutil.make_array(400, dtype=np.int32, low=1, high=300)
+    _perform_gather_test(testee, a, idx)
+
+
+def test_gather_3():
+    def testee(
+        a: np.ndarray,
+        b: np.ndarray,
+        idx: np.ndarray,
+        idx2: np.ndarray,
+    ) -> np.ndarray:
+        c = jnp.sin(a) + b
+        return jnp.exp(c[idx, :, idx2])  # type: ignore[return-value]  # Type confusion.
+
+    a = testutil.make_array((300, 3, 300))
+    b = testutil.make_array((300, 3, 300))
+    idx = testutil.make_array(400, dtype=np.int32, low=1, high=300)
+    idx2 = testutil.make_array(400, dtype=np.int32, low=1, high=300)
+    _perform_gather_test(testee, a, b, idx, idx2)

From d6265bc55a7516563400a4063907fc60d526be7c Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 13 Sep 2024 15:03:41 +0200
Subject: [PATCH 441/458] Added all translators from teh development branch.

I just copied them and did not do a merge, which is not so nice.
Furthermore, the tests are not yet there, in my view it makes sense to first have something that can be checked.
---
 .../translator/jaxpr_translator_builder.py    |  59 +++-
 .../mapped_operation_base_translator.py       | 214 +++++++++++++
 src/jace/translator/post_translation.py       |  92 ++++++
 src/jace/translator/primitive_translator.py   |   3 +
 .../primitive_translators/__init__.py         |  35 ++-
 .../primitive_translators/alu_translator.py   | 287 ------------------
 .../arithmetic_logical_translators.py         | 200 ++++++++++++
 .../broadcast_in_dim_translator.py            |  67 ++++
 .../concatenate_translator.py                 |  87 ++++++
 .../primitive_translators/conditions.py       | 182 +++++++++++
 .../convert_element_type_translator.py        |  85 ++++++
 .../primitive_translators/copy_translator.py  |  92 ++++++
 .../gather_translator.py                      | 211 +++++++++++++
 .../primitive_translators/iota_translator.py  |  56 ++++
 .../primitive_translators/pjit_translator.py  | 147 +++++++++
 .../reshape_translator.py                     |  67 ++++
 .../select_n_translator.py                    |  94 ++++++
 .../primitive_translators/slicing.py          | 198 ++++++++++++
 .../squeeze_translator.py                     |  69 +++++
 src/jace/util/jax_helper.py                   |  21 ++
 20 files changed, 1973 insertions(+), 293 deletions(-)
 create mode 100644 src/jace/translator/mapped_operation_base_translator.py
 delete mode 100644 src/jace/translator/primitive_translators/alu_translator.py
 create mode 100644 src/jace/translator/primitive_translators/arithmetic_logical_translators.py
 create mode 100644 src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
 create mode 100644 src/jace/translator/primitive_translators/concatenate_translator.py
 create mode 100644 src/jace/translator/primitive_translators/conditions.py
 create mode 100644 src/jace/translator/primitive_translators/convert_element_type_translator.py
 create mode 100644 src/jace/translator/primitive_translators/copy_translator.py
 create mode 100644 src/jace/translator/primitive_translators/gather_translator.py
 create mode 100644 src/jace/translator/primitive_translators/iota_translator.py
 create mode 100644 src/jace/translator/primitive_translators/pjit_translator.py
 create mode 100644 src/jace/translator/primitive_translators/reshape_translator.py
 create mode 100644 src/jace/translator/primitive_translators/select_n_translator.py
 create mode 100644 src/jace/translator/primitive_translators/slicing.py
 create mode 100644 src/jace/translator/primitive_translators/squeeze_translator.py

diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 3d7d04c..9b76407 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -14,6 +14,7 @@
 
 import dace
 from dace import data as dace_data, properties as dace_properties
+from dace.sdfg import propagation as dace_propagation
 from jax import core as jax_core
 
 from jace import util
@@ -35,8 +36,11 @@ class JaxprTranslationBuilder:
     - there are only transient variables inside the SDFG,
     - it lacks the special `__return` variable,
     - the `arg_names` parameter is not set,
-    - for all scalar values a ` Scalar` SDFG variable is used, thus they cannot
-        be used to return anything.
+    - for all scalar values a `Scalar` SDFG variable is used, thus they cannot
+        be used for return values,
+    - for every transient there is exactly one access node that writes to it,
+        except the name of the array starts with `__jace_mutable_`, which can
+        be written to multiple times.
 
     For these reasons the SDFG is not directly usable, and further manipulations
     have to be performed. Especially, DaCe's validation function will fail and
@@ -550,6 +554,7 @@ def _translate_single_eqn(self, eqn: jax_core.JaxprEqn) -> None:
         translator = self._primitive_translators[primitive_name]
 
         # Create the state into which the equation should be translated
+        prev_terminal_state = self._ctx.terminal_state
         eqn_state = self.append_new_state(
             label=f"{primitive_name}_{'_'.join(out_var_names)}",
             prev_state=None,  # forces the creation of a new terminal state
@@ -569,8 +574,13 @@ def _translate_single_eqn(self, eqn: jax_core.JaxprEqn) -> None:
             if eqn_state is not self._ctx.terminal_state:
                 raise RuntimeError("Inconsistent terminal state was detected.")
             new_sdfg_term_state = eqn_state
-        if not self._ctx.validate():
-            raise RuntimeError("Detected an invalid SDFG under construction.")
+
+        # Propagate the Memlets through the newly created state machine
+        self._propagate_memlets_in_new_states(
+            prev_terminal_state,
+            new_sdfg_term_state,
+        )
+        self._ctx.validate()
 
         # Modify terminal root state of 'self'
         self._ctx.terminal_state = new_sdfg_term_state
@@ -680,6 +690,47 @@ def _handle_null_jaxpr(self, jaxpr: jax_core.ClosedJaxpr) -> list[str]:
 
         return out_var_names
 
+    def _propagate_memlets_in_new_states(
+        self,
+        prev_terminal_state: dace.SDFGState,
+        new_terminal_state: dace.SDFGState,
+    ) -> None:
+        """
+        Propagate the Memlets inside the newly added parts of the state machine.
+
+        This function performs BFS starting at `prev_terminal_state` that is bound
+        by `new_terminal_state`.
+
+        Args:
+            prev_terminal_state: Terminal state before the expansion of the
+                state machine.
+            new_terminal_state: Terminal state after the expansion.
+        """
+        seen: set[dace.SDFGState] = {prev_terminal_state}
+        nodes_to_process: list[dace.SDFGState] = [
+            edge.dst for edge in self.sdfg.out_edges(prev_terminal_state)
+        ]
+
+        while nodes_to_process:
+            currently_processing = nodes_to_process.pop(-1)
+            if (
+                self.sdfg.out_degree(currently_processing) == 0
+                and currently_processing != new_terminal_state
+            ):
+                raise dace.sdfg.InvalidSDFGError(
+                    f"Found leaf node '{currently_processing}' that is not the terminal node.",
+                    self.sdfg,
+                    self.sdfg.node_id(currently_processing),
+                )
+
+            seen.add(currently_processing)
+            dace_propagation.propagate_memlets_state(self.sdfg, currently_processing)
+            nodes_to_process.extend(
+                edge.dst
+                for edge in self.sdfg.out_edges(currently_processing)
+                if edge.dst not in seen
+            )
+
     @property
     def _start_state(self) -> dace.SDFGState:
         return cast(dace.SDFGState, self._ctx.start_state)
diff --git a/src/jace/translator/mapped_operation_base_translator.py b/src/jace/translator/mapped_operation_base_translator.py
new file mode 100644
index 0000000..9f0f402
--- /dev/null
+++ b/src/jace/translator/mapped_operation_base_translator.py
@@ -0,0 +1,214 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Module containing all translators related to arithmetic logical operations."""
+
+from __future__ import annotations
+
+from abc import abstractmethod
+from typing import TYPE_CHECKING
+
+import dace
+from typing_extensions import final, override
+
+from jace import translator, util
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
+class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
+    """
+    Implements the base for all "mapped base operations".
+
+    A mapped base operation `f` is an operation that has several inputs arrays
+    that are elementwise combined to a single output array. A prime example for
+    this would be the addition of two arrays. Essentially it assumes that the
+    Tasklet code can be written as:
+    ```
+        __out = f(__in0, __in1, __in3, ...)
+    ```
+    where `__in*` are the connector names of the Tasklet and `__out` is the
+    output connector. For problems such as this, the SDFG API provides the
+    `SDFGState.add_mapped_tasklet()` function, however, in most cases it can not
+    be directly used, for various reasons. Thus this class acts like a
+    convenience wrapper around it.
+
+    To use this class a user has to overwrite the `write_tasklet_code()` function.
+    This function generates the entire code that should be put into the Tasklet,
+    include the assignment to `__out`. If needed the translator will perform
+    literal substitution on the returned code and broadcast the inputs to match
+    the outputs.
+
+    If needed a subclass can also override the `make_input_memlets()` function
+    to generate custom input Memlets, such as adding an offset.
+
+    Args:
+        primitive_name:     The name of the primitive `self` should bind to.
+
+    Note:
+        This class will always generate a mapped Tasklet, even if a scalar is handled.
+    """
+
+    def __init__(self, primitive_name: str) -> None:
+        self._prim_name = primitive_name
+
+    @property
+    def primitive(self) -> str:
+        """Returns the primitive that should be translated."""
+        return self._prim_name
+
+    @final
+    @override
+    def __call__(
+        self,
+        builder: translator.JaxprTranslationBuilder,
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        """
+        Create the mapped Tasklet.
+
+        The function will create the map ranges and based on the shape of the
+        output array. It will then call `make_input_memlets()` to get the input
+        Memlets. After that it calls `write_tasklet_code()` to get the Tasklet
+        code and perform literal substitution by forwarding it to
+        `self.literal_substitution()`. After that it will create the mapped Tasklet.
+
+        Note:
+            For a description of the arguments see `PrimitiveTranslatorCallable`.
+        """
+        assert len(out_var_names) == 1
+        if util.get_jax_var_shape(eqn.outvars[0]) != ():
+            tskl_ranges: list[tuple[str, str]] = [
+                (f"__i{dim}", f"0:{N}")
+                for dim, N in enumerate(util.get_jax_var_shape(eqn.outvars[0]))
+            ]
+            tskl_output: dict[str, dace.Memlet] = {
+                "__out": dace.Memlet.simple(
+                    out_var_names[0], ", ".join(name for name, _ in tskl_ranges)
+                )
+            }
+
+        else:
+            # If we have a scalar we will generate a Map, but it will be trivial.
+            tskl_ranges = [("__jace_iterator_SCALAR", "0:1")]
+            tskl_output = {"__out": dace.Memlet.simple(out_var_names[0], "0")}
+
+        tskl_inputs: dict[str, dace.Memlet] = self.make_input_memlets(
+            tskl_ranges, in_var_names, eqn
+        )
+        tskl_name = f"{self.primitive}_{out_var_names[0]}"
+        tskl_code = self.write_tasklet_code(tskl_ranges, in_var_names, eqn)
+        tskl_code = self.literal_substitution(tskl_code, in_var_names, eqn)
+
+        eqn_state.add_mapped_tasklet(
+            name=tskl_name,
+            map_ranges=tskl_ranges,
+            inputs=tskl_inputs,
+            code=tskl_code,
+            outputs=tskl_output,
+            external_edges=True,
+        )
+
+        return eqn_state
+
+    @abstractmethod
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        """
+        Return the (Python) code that should be put inside the Tasklet.
+
+        This also includes the assignment statement, i.e. `__out`.
+        However, the base will do literal substitution on the returned object.
+
+        Args:
+            tskl_ranges:    List of pairs used as map parameter, first element
+                is the name iteration index of the dimension, second is its range.
+            in_var_names:   The list of SDFG variables used as input, `None` if literal.
+            eqn:            The equation.
+        """
+        ...
+
+    def make_input_memlets(  # noqa: PLR6301  # Subclasses might need them.
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        """
+        Generate the input Memlets for the non literal operators of the primitive.
+
+        The returned `dict` maps the input connector of the Tasklet to the Memlet
+        that is used to connect it to the Map entry node.
+
+        Args:
+            tskl_ranges:    List of pairs used as map parameter, first element
+                is the name iteration index of the dimension, second is its range
+            in_var_names:   The list of SDFG variables used as input, `None` if literal.
+            eqn:            The equation object.
+        """
+        out_shp = tuple(util.get_jax_var_shape(eqn.outvars[0]))  # Shape of the output
+        out_rank = len(out_shp)
+        if any(len(util.get_jax_var_shape(invar)) not in {0, out_rank} for invar in eqn.invars):
+            raise NotImplementedError(
+                f"'MappedOperationTranslatorBase' Inputs must have the same rank as the output! "
+                f"Eqn: {eqn} || {tuple(util.get_jax_var_shape(eqn.outvars[0]))}"
+            )
+
+        # Now we will generate the input Memlets.
+        tskl_inputs: dict[str, dace.Memlet] = {}
+        for i, (in_var_name, inp_shp) in enumerate(
+            zip(in_var_names, (util.get_jax_var_shape(invar) for invar in eqn.invars))
+        ):
+            if in_var_name is None:  # Input is a literal: No Memlet needed
+                continue
+
+            if inp_shp == ():  # Scalars
+                tskl_inputs[f"__in{i}"] = dace.Memlet.simple(in_var_name, "0")  # Scalar
+                continue
+
+            # We have to to broadcasting (combine yes and no together)
+            dims_to_bcast: Sequence[int] = [dim for dim in range(out_rank) if inp_shp[dim] == 1]
+            tskl_inputs[f"__in{i}"] = dace.Memlet.simple(
+                in_var_name,
+                ", ".join(
+                    ("0" if i in dims_to_bcast else it_var)
+                    for i, (it_var, _) in enumerate(tskl_ranges)
+                ),
+            )
+        return tskl_inputs
+
+    def literal_substitution(  # noqa: PLR6301  # Subclasses might need it.
+        self, tskl_code: str, in_var_names: Sequence[str | None], eqn: jax_core.JaxprEqn
+    ) -> str:
+        """
+        Perform literal substitution on the proto Tasklet code `tskl_code`.
+
+        Args:
+            tskl_code:      The proto Tasklet code with literal.
+            in_var_names:   The list of SDFG variables used as input.
+            eqn:            The equation.
+
+        Note:
+            It is allowed but not recommended to override this function.
+        """
+        for i, in_var_name in enumerate(in_var_names):
+            if in_var_name is not None:
+                continue
+            t_val = util.get_jax_literal_value(eqn.invars[i])
+            tskl_code = tskl_code.replace(f"__in{i}", str(t_val))
+        return tskl_code
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index a00b651..9831f35 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -19,6 +19,8 @@
 
 
 if TYPE_CHECKING:
+    from dace.sdfg import nodes as dace_nodes
+
     from jace import translator
 
 
@@ -234,3 +236,93 @@ def finalize_translation_context(
     if validate:
         tsdfg.validate()
     return tsdfg
+
+
+def add_nested_sdfg(
+    state: dace.SDFGState,
+    child_ctx: translator.TranslationContext,
+    parent_ctx: translator.TranslationContext,
+    in_var_names: Sequence[str],
+    out_var_names: Sequence[str],
+) -> dace_nodes.NestedSDFG:
+    """
+    Adds the SDFG in `child_ctx` as nested SDFG at state `state` in `parent_ctx`.
+
+    The function is a convenience wrapper that operates directly on translation
+    contexts instead of SDFGs. The function will also create the necessary Memlet
+    connections.
+
+    Args:
+        state: The state at which the nested SDFG should be inserted.
+            Must be part of `parent_ctx`.
+        child_ctx: The translation context representing the SDFG that should be added.
+        parent_ctx: The parent SDFG to which `child_ctx` should be added as nested
+            SDFG in state `state`.
+        in_var_names: Names of the variables in `parent_ctx` that are used as inputs for
+            the nested SDFG, must have the same order as `child_ctx.input_names`.
+        out_var_names: Names of the variables in `parent_ctx` that are used as outputs
+            for the nested SDFG, must have the same order as `child_ctx.output_names`.
+
+    Returns:
+        The nested SDFG object.
+
+    Note:
+        The function will not add `child_ctx` directly as nested SDFG. Instead it
+        will first pass it to `finalize_translation_context()` and operates on the
+        return values. This means that `child_ctx` will be modified in place, and
+        a copy will be added to `parent_ctx`.
+        It is highly recommended that `state` is empty.
+    """
+    if child_ctx.sdfg.free_symbols:
+        raise NotImplementedError("Symbol Mapping is not implemented.")
+    assert not (child_ctx.input_names is None or child_ctx.output_names is None)  # Silence mypy
+    assert len(child_ctx.input_names) == len(in_var_names)
+    assert len(child_ctx.output_names) == len(out_var_names)
+    assert state in parent_ctx.sdfg.nodes()
+    assert not set(in_var_names).intersection(out_var_names)
+
+    if any(input_name.startswith("__jace_mutable_") for input_name in in_var_names):
+        raise NotImplementedError(
+            "'__jace_mutable_' variables are not yet handled in 'add_nested_sdfg()'."
+        )
+    if len(set(in_var_names)) != len(in_var_names):
+        raise ValueError(
+            f"An input can only be passed once, but { {in_var_name for in_var_name in in_var_names if in_var_names.count(in_var_name) > 1} } were passed multiple times."
+        )
+    if len(set(out_var_names)) != len(out_var_names):
+        raise NotImplementedError(
+            f"Tried to write multiple times to variables: { {out_var_name for out_var_name in out_var_names if out_var_names.count(out_var_name) > 1} }."
+        )
+
+    final_child_ctx = finalize_translation_context(child_ctx)
+    nested_sdfg: dace_nodes.NestedSDFG = state.add_nested_sdfg(
+        sdfg=final_child_ctx.sdfg,
+        parent=parent_ctx.sdfg,
+        # Bug in DaCe must be a set.
+        inputs=set(final_child_ctx.input_names),
+        outputs=set(final_child_ctx.output_names),
+    )
+
+    # Now create the connections for the input.
+    for outer_name, inner_name in zip(in_var_names, final_child_ctx.input_names):
+        outer_array = parent_ctx.sdfg.arrays[outer_name]
+        state.add_edge(
+            state.add_read(outer_name),
+            None,
+            nested_sdfg,
+            inner_name,
+            dace.Memlet.from_array(outer_name, outer_array),
+        )
+
+    # Now we create the output connections.
+    for outer_name, inner_name in zip(out_var_names, final_child_ctx.output_names):
+        outer_array = parent_ctx.sdfg.arrays[outer_name]
+        state.add_edge(
+            nested_sdfg,
+            inner_name,
+            state.add_write(outer_name),
+            None,
+            dace.Memlet.from_array(outer_name, outer_array),
+        )
+
+    return nested_sdfg
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index ab84c5d..2000731 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -64,6 +64,9 @@ def __call__(
         primitive translator was able to fully construct the dataflow graph
         within `eqn_state`.
 
+        After the primitive translator returns, the builder will propagate the
+        Memlets in all states that were newly created.
+
         A primitive translator has to use the passed input variables,
         `in_var_names` and must write its output into the variables indicated
         by `out_var_names`. But it is allowed that a primitive translator
diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 65f9153..9e2fec0 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -8,7 +8,38 @@
 
 from __future__ import annotations
 
-from .alu_translator import ALUTranslator
+from .arithmetic_logical_translators import (
+    ArithmeticOperationTranslator,
+    LogicalOperationTranslator,
+)
+from .broadcast_in_dim_translator import BroadcastInDimTranslator
+from .concatenate_translator import ConcatenateTranslator
+from .conditions import condition_translator
+from .convert_element_type_translator import ConvertElementTypeTranslator
+from .copy_translator import CopyTranslator, DevicePutTranslator
+from .gather_translator import GatherTranslator
+from .iota_translator import IotaTranslator
+from .pjit_translator import PJITTranslator
+from .reshape_translator import ReshapeTranslator
+from .select_n_translator import SelectNTranslator
+from .slicing import SlicingTranslator
+from .squeeze_translator import SqueezeTranslator
 
 
-__all__ = ["ALUTranslator"]
+__all__ = [
+    "ArithmeticOperationTranslator",
+    "BroadcastInDimTranslator",
+    "ConcatenateTranslator",
+    "ConvertElementTypeTranslator",
+    "CopyTranslator",
+    "DevicePutTranslator",
+    "GatherTranslator",
+    "IotaTranslator",
+    "LogicalOperationTranslator",
+    "PJITTranslator",
+    "ReshapeTranslator",
+    "SelectNTranslator",
+    "SlicingTranslator",
+    "SqueezeTranslator",
+    "condition_translator",
+]
diff --git a/src/jace/translator/primitive_translators/alu_translator.py b/src/jace/translator/primitive_translators/alu_translator.py
deleted file mode 100644
index f217924..0000000
--- a/src/jace/translator/primitive_translators/alu_translator.py
+++ /dev/null
@@ -1,287 +0,0 @@
-# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
-#
-# Copyright (c) 2024, ETH Zurich
-# All rights reserved.
-#
-# SPDX-License-Identifier: BSD-3-Clause
-
-"""This module contains the `ALUTranslator` which translates all arithmetic and logic primitives."""
-# ruff: noqa: W505 PLR0912 C901 PLR0914 PLR0915 D417
-
-from __future__ import annotations
-
-from collections.abc import Sequence
-from typing import Any, Final, cast
-
-import dace
-import numpy as np
-from jax import core as jax_core
-from typing_extensions import override
-
-from jace import translator, util
-
-
-class ALUTranslator(translator.PrimitiveTranslator):
-    """
-    This translator handles all arithmetic and logical operations.
-
-    This translator will be reworked soon, it just exists that the initial PR can do anything at all!!
-    """
-
-    def __init__(self, prim_name: str, prim_tmpl: str) -> None:
-        """Initialize the `ALUTranslator`."""
-        self._prim_name = prim_name
-        self._prim_tmpl = prim_tmpl
-
-    @property
-    @override
-    def primitive(self) -> str:
-        return self._prim_name
-
-    @override
-    def __call__(
-        self,
-        builder: translator.JaxprTranslationBuilder,
-        in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
-        eqn: jax_core.JaxprEqn,
-        eqn_state: dace.SDFGState,
-    ) -> None:
-        """
-        Perform the translation.
-
-        Deepening on the shapes of the input the function will either create a Tasklet or a mapped Tasklet.
-        The translator is able to handle broadcasting with NumPy rules.
-        The function will always perform the translation inside the provided state.
-
-        Args:
-            builder:         The builder object of the translation.
-            in_var_names:   List of the names of the arrays created inside the SDFG for the inpts or 'None' in case of a literal.
-            out_var_names:  List of the names of the arrays created inside the SDFG for the outputs.
-            eqn:            The JAX equation that is translated.
-            eqn_state:      State into which the primitive's SDFG representation is constructed.
-        """
-        assert self._prim_name == eqn.primitive.name
-
-        # Determine what kind of input we got and how we should proceed.
-        is_scalar = len(util.get_jax_var_shape(eqn.outvars[0])) == 0
-        input_scalars = [len(util.get_jax_var_shape(Inp)) == 0 for i, Inp in enumerate(eqn.invars)]
-        has_scalars_as_inputs = any(input_scalars)
-        has_some_literals = any(x is None for x in in_var_names)
-        inps_same_shape = all(
-            util.get_jax_var_shape(eqn.invars[0]) == util.get_jax_var_shape(eqn.invars[i])
-            for i in range(1, len(eqn.invars))
-        )
-
-        # We will now look which dimensions have to be broadcasted on which operator.
-        #  I.e. in the dimensions in the lists below there will be no map iteration index.
-        dims_to_bcastl: list[int] = []
-        dims_to_bcastr: list[int] = []
-
-        # Determine if and how we have to broadcast.
-        if inps_same_shape or is_scalar:
-            pass
-
-        elif has_some_literals or has_scalars_as_inputs:
-            # This is essentially an array plus a scalar, that is eitehr a literal or a variable.
-            assert (not has_some_literals) or all(
-                util.get_jax_var_shape(invar) == util.get_jax_var_shape(eqn.outvars[0])
-                for (invar, x) in zip(eqn.invars, in_var_names, strict=False)
-                if x is not None
-            )
-            assert (not has_scalars_as_inputs) or all(
-                util.get_jax_var_shape(invar) in {util.get_jax_var_shape(eqn.outvars[0]), ()}
-                for (invar, x) in zip(eqn.invars, in_var_names, strict=False)
-                if x is not None
-            )
-
-        else:
-            # This is the general broadcasting case
-            #  We assume that both inputs and the output have the same rank but different sizes in each dimension.
-            #  It seems that JAX ensures this.
-            #  We further assume that if the size in a dimension differs then one must have size 1.
-            #  This is the size we broadcast over, i.e. conceptually replicated.
-            out_shps = tuple(util.get_jax_var_shape(eqn.outvars[0]))  # Shape of the output
-            input_shpl = tuple(
-                util.get_jax_var_shape(eqn.invars[0])
-            )  # Shape of the left/first input
-            input_shpr = tuple(
-                util.get_jax_var_shape(eqn.invars[1])
-            )  # Shape of the right/second input
-
-            if not ((len(input_shpl) == len(input_shpr)) and (len(out_shps) == len(input_shpr))):
-                raise NotImplementedError("Can not broadcast over different ranks.")
-
-            for dim, (shp_lft, shp_rgt, out_shp) in enumerate(
-                zip(input_shpl, input_shpr, out_shps)
-            ):
-                if shp_lft == shp_rgt:
-                    assert out_shp == shp_lft
-                elif shp_lft == 1:
-                    assert shp_rgt == out_shp
-                    dims_to_bcastl.append(dim)
-                elif shp_rgt == 1:
-                    assert shp_lft == out_shp
-                    dims_to_bcastr.append(dim)
-                else:
-                    raise ValueError(f"Invalid shapes in dimension {dim} for broadcasting.")
-
-        # Now we create the Tasklet in which the calculation is performed.
-        tskl_code: str = self._write_tasklet_code(in_var_names, eqn)
-        tskl_name: str = eqn.primitive.name
-        tskl_map_ranges: list[tuple[str, str]] = [
-            (f"__i{dim}", f"0:{N}") for dim, N in enumerate(util.get_jax_var_shape(eqn.outvars[0]))
-        ]
-        tskl_output: tuple[str, dace.Memlet] = None  # type: ignore[assignment]
-        tskl_inputs: list[tuple[str, dace.Memlet] | tuple[None, None]] = []
-
-        # Generate the Memlets for the input.
-        for i, dims_to_bcast in zip(range(len(in_var_names)), [dims_to_bcastl, dims_to_bcastr]):
-            if in_var_names[i] is None:  # Literal: No input needed.
-                tskl_inputs.append((None, None))
-                continue
-            if input_scalars[i]:  # Scalar
-                assert len(dims_to_bcast) == 0
-                i_memlet = dace.Memlet.simple(in_var_names[i], "0")
-            else:  # Array: We may have to broadcast
-                inputs_: list[str] = []
-                for dim, (map_var, _) in enumerate(tskl_map_ranges):
-                    if dim in dims_to_bcast:
-                        inputs_.append("0")
-                    else:
-                        inputs_.append(map_var)
-                i_memlet = dace.Memlet.simple(in_var_names[i], ", ".join(inputs_))
-                del inputs_
-            tskl_inputs.append((f"__in{i}", i_memlet))
-
-        # Now generate the Memlets for the output
-        if is_scalar:
-            tskl_output = ("__out0", dace.Memlet.simple(out_var_names[0], "0"))
-        else:
-            tskl_output = (
-                "__out0",
-                dace.Memlet.simple(out_var_names[0], ", ".join([X[0] for X in tskl_map_ranges])),
-            )
-
-        if is_scalar:
-            tskl_tasklet = eqn_state.add_tasklet(
-                tskl_name,
-                _list_to_dict(tskl_inputs).keys(),
-                _list_to_dict([tskl_output]).keys(),
-                tskl_code,
-            )
-            for in_var, (in_connector, in_memlet) in zip(in_var_names, tskl_inputs, strict=False):
-                if in_var is None:  # So access node for literal
-                    continue
-                eqn_state.add_edge(
-                    eqn_state.add_read(in_var), None, tskl_tasklet, in_connector, in_memlet
-                )
-            eqn_state.add_edge(
-                tskl_tasklet,
-                tskl_output[0],
-                eqn_state.add_write(out_var_names[0]),
-                None,
-                tskl_output[1],
-            )
-        else:
-            eqn_state.add_mapped_tasklet(
-                name=tskl_name,
-                map_ranges=_list_to_dict(tskl_map_ranges),
-                inputs=_list_to_dict(tskl_inputs),
-                code=tskl_code,
-                outputs=_list_to_dict([tskl_output]),
-                external_edges=True,
-            )
-
-        return eqn_state
-
-    def _write_tasklet_code(
-        self, in_var_names: Sequence[str | None], eqn: jax_core.JaxprEqn
-    ) -> str:
-        """
-        This function generates the Tasklet code based on a primitive.
-
-        The function will also perform literal substitution and parameter handling.
-
-        Args:
-            in_var_names:   The list of SDFG variables used as input.
-        """
-        t_code = self._prim_tmpl
-
-        # Now we handle Literal substitution
-        for i, in_var_name in enumerate(in_var_names):
-            if in_var_name is not None:
-                continue
-
-            jax_in_var: jax_core.Literal = cast(jax_core.Literal, eqn.invars[i])
-            if util.get_jax_var_shape(jax_in_var) == ():
-                t_val = jax_in_var.val
-                if isinstance(t_val, np.ndarray):
-                    t_val = jax_in_var.val.max()  # I do not know a better way in that case
-                t_code = t_code.replace(f"__in{i}", str(t_val))
-            else:
-                raise ValueError(
-                    f"Can not handle the literal case of shape: {util.get_jax_var_shape(jax_in_var)}"
-                )
-
-        # Now replace the parameters
-        if len(eqn.params) != 0:
-            t_code = t_code.format(**eqn.params)
-
-        return t_code
-
-
-def _list_to_dict(inp: Sequence[tuple[None | Any, Any]]) -> dict[Any, Any]:
-    """
-    This method turns a `list` of pairs into a `dict` and applies a `None` filter.
-
-    The function will only include pairs whose key, i.e. first element is not `None`.
-    """
-    return {k: v for k, v in inp if k is not None}
-
-
-# Contains all the templates for ALU operations.
-_ALU_OPS_TASKLET_TEMPLATES: Final[dict[str, str]] = {
-    # Unary operations
-    "pos": "__out0 = +(__in0)",
-    "neg": "__out0 = -(__in0)",
-    "not": "__out0 = not (__in0)",
-    "floor": "__out0 = floor(__in0)",
-    "ceil": "__out0 = ceil(__in0)",
-    "round": "__out0 = round(__in0)",
-    "abs": "__out0 = abs(__in0)",
-    "sign": "__out0 = sign(__in0)",
-    "sqrt": "__out0 = sqrt(__in0)",
-    "log": "__out0 = log(__in0)",
-    "exp": "__out0 = exp(__in0)",
-    "integer_pow": "__out0 = (__in0)**({y})",  # 'y' is a parameter of the primitive
-    "sin": "__out0 = sin(__in0)",
-    "asin": "__out0 = asin(__in0)",
-    "cos": "__out0 = cos(__in0)",
-    "acos": "__out0 = acos(__in0)",
-    "tan": "__out0 = tan(__in0)",
-    "atan": "__out0 = atan(__in0)",
-    "tanh": "__out0 = tanh(__in0)",
-    # Binary operations
-    "add": "__out0 = (__in0)+(__in1)",
-    "add_any": "__out0 = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
-    "sub": "__out0 = (__in0)-(__in1)",
-    "mul": "__out0 = (__in0)*(__in1)",
-    "div": "__out0 = (__in0)/(__in1)",
-    "rem": "__out0 = (__in0)%(__in1)",
-    "and": "__out0 = (__in0) and (__in1)",
-    "or": "__out0 = (__in0) or  (__in1)",
-    "pow": "__out0 = (__in0)**(__in1)",
-    "ipow": "__out0 = (__in0)**(int(__in1))",
-    "min": "__out0 = min(__in0, __in1)",
-    "max": "__out0 = max(__in0, __in1)",
-    "eq": "__out0 = __in0 == __in1",
-    "ne": "__out0 = __in0 != __in1",
-    "ge": "__out0 = __in0 >= __in1",
-    "gt": "__out0 = __in0 > __in1",
-    "le": "__out0 = __in0 <= __in1",
-    "lt": "__out0 = __in0 < __in1",
-}
-
-for prim_name, prim_tmpl in _ALU_OPS_TASKLET_TEMPLATES.items():
-    translator.register_primitive_translator(ALUTranslator(prim_name, prim_tmpl))
diff --git a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
new file mode 100644
index 0000000..c9c0a35
--- /dev/null
+++ b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
@@ -0,0 +1,200 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""
+Module containing all translators related to arithmetic and logical operations.
+
+Todo:
+    - Hijack Jax to inject a proper modulo operation.
+"""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING, Final
+
+import dace
+from typing_extensions import override
+
+from jace import translator, util
+from jace.translator import mapped_operation_base_translator as mapped_base
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
+class ArithmeticOperationTranslator(mapped_base.MappedOperationTranslatorBase):
+    """
+    Translator for all arithmetic operations.
+
+    The class is derived from `MappedOperationTranslatorBase` and overwrites the
+    `write_tasklet_code()` function for the Tasklet code.
+
+    Args:
+        prim_name:      The name of the primitive that should be handled.
+        tskl_tmpl:      Template used for generating the Tasklet code.
+
+    Note:
+        - It does not implement the logical operations, they are implemented by
+            the `LogicalOperationTranslator` class.
+        - Despite its name this class also provides the comparison operators.
+        - It does not implement `mod` nor `fmod` as they are translated to some
+            nested `pjit` implementation by Jax for unknown reasons.
+    """
+
+    def __init__(self, prim_name: str, tskl_tmpl: str) -> None:
+        super().__init__(primitive_name=prim_name)
+        self._tskl_tmpl = tskl_tmpl
+
+    @override
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        """Returns the code for the Tasklet, with all parameters replaced."""
+        tskl_code = self._tskl_tmpl
+        if len(eqn.params) != 0:
+            tskl_code = tskl_code.format(**eqn.params)
+        return tskl_code
+
+
+class LogicalOperationTranslator(mapped_base.MappedOperationTranslatorBase):
+    """
+    Translator for all logical operations.
+
+    The reason why the logical operations are separated from the arithmetic
+    operations is quite complicated and in fact the whole thing is harder than
+    it should be. NumPy has two kinds of these operations, i.e.
+    `logical_{and, or, xor, not}()` and `bitwise_{and, or, xor, not}()`, but Jax
+    has only a single kind of logical operation, that operate in bitwise mode.
+    The first idea would be to use `ArithmeticOperationTranslator` with a template
+    such as `__out = __in0 & __in1` or `__out = ~__in0`. Since DaCe eventually
+    generates C++ code and C++ has a native bool type, and `true` is guaranteed
+    to be `1` and `false` equals `0`, this works for all operations except `not`,
+    as `~true` in C++ is essentially `~1`, which is again `true`!
+    Thus the `not` primitive must be handled separately.
+
+    The solution to the problem is, to introduce two templates, one used for the
+    bool context and one used in the integer context. This works because depending
+    if the `logical_*()` or `bitwise_*()` functions are used the input is either
+    of type bool or an integer.
+
+    Args:
+        prim_name:      The name of the primitive that should be handled.
+        int_tmpl:       The template used for the integer case.
+        bool_tmpl:      The template used for the bool case.
+
+    Note:
+        Since it does not make sense to single out `not` and keep the other
+        logical operations in `ArithmeticOperationTranslator` all of them are
+        handled by this class.
+    """
+
+    def __init__(self, prim_name: str, int_tmpl: str, bool_tmpl: str) -> None:
+        super().__init__(primitive_name=prim_name)
+        self._int_tmpl = int_tmpl
+        self._bool_tmpl = bool_tmpl
+
+    @override
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        if all(util.get_jax_var_dtype(invar) is dace.bool_ for invar in eqn.invars):
+            return self._bool_tmpl
+        return self._int_tmpl
+
+
+# Contains the code templates for all supported arithmetic operations.
+# fmt: off
+_ARITMETIC_OPERATION_TEMPLATES: Final[dict[str, str]] = {
+    # Unary operations
+    "pos": "__out = +(__in0)",
+    "neg": "__out = -(__in0)",
+
+    "floor": "__out = floor(__in0)",
+    "ceil": "__out = ceil(__in0)",
+    "round": "__out = round(__in0)",
+
+    "abs": "__out = abs(__in0)",
+    "sign": "__out = sign(__in0)",
+    "exp": "__out = exp(__in0)",
+    "exp2": "__out = exp2(__in0)",
+    "expm1": "__out = expm1(__in0)",
+    "log": "__out = log(__in0)",
+    "log1p": "__out = log1p(__in0)",
+    "conj": "__out = conj(__in0)",
+    "sqrt": "__out = sqrt(__in0)",
+    "cbrt": "__out = cbrt(__in0)",
+
+    "integer_pow": "__out = (__in0)**({y})",  # 'y' is a parameter of the primitive
+    "is_finite": "__out = isfinite(__in0)",
+
+    "sin": "__out = sin(__in0)",
+    "asin": "__out = asin(__in0)",
+    "cos": "__out = cos(__in0)",
+    "acos": "__out = acos(__in0)",
+    "tan": "__out = tan(__in0)",
+    "atan": "__out = atan(__in0)",
+
+    "sinh": "__out = sinh(__in0)",
+    "asinh": "__out = asinh(__in0)",
+    "cosh": "__out = cosh(__in0)",
+    "acosh": "__out = acosh(__in0)",
+    "tanh": "__out = tanh(__in0)",
+    "atanh": "__out = atanh(__in0)",
+
+    # Binary operations
+    "add": "__out = (__in0)+(__in1)",
+    "add_any": "__out = (__in0)+(__in1)",  # No idea what makes `add_any` differ from `add`
+    "sub": "__out = (__in0)-(__in1)",
+    "mul": "__out = (__in0)*(__in1)",
+    "div": "__out = (__in0)/(__in1)",
+    "rem": "__out = (__in0)%(__in1)",
+    "pow": "__out = (__in0)**(__in1)",
+    "min": "__out = min((__in0), (__in1))",
+    "max": "__out = max((__in0), (__in1))",
+
+    "eq": "__out = (__in0) == (__in1)",
+    "ne": "__out = (__in0) != (__in1)",
+    "ge": "__out = (__in0) >= (__in1)",
+    "gt": "__out = (__in0) > (__in1)",
+    "le": "__out = (__in0) <= (__in1)",
+    "lt": "__out = (__in0) < (__in1)",
+
+    "atan2": "__out = atan2((__in0), (__in1))",
+
+    "nextafter": "__out = nextafter((__in0), (__in1))",
+
+    # Ternary operations
+    "clamp": "__out = (__in0 if __in1 < __in0 else (__in1 if __in1 < __in2 else __in2))"
+}
+
+
+# Contains the code templates for all logical operations.
+#  The first one is for the integer case, the second for the bool case.
+_LOGICAL_OPERATION_TEMPLATES: Final[dict[str, tuple[str, str]]] = {
+    "or": ("__out = (__in0) | (__in1)",  "__out = (__in0) or (__in1)"),
+    "not": ("__out = ~(__in0)", "__out = not (__in0)"),
+    "and": ("__out = (__in0) & (__in1)", "__out = (__in0) and (__in1)"),
+    "xor": ("__out = (__in0) ^ (__in1)", "__out = (__in0) != (__in1)"),
+}
+
+
+# Create the arithmetic translators
+for pname, ptmpl in _ARITMETIC_OPERATION_TEMPLATES.items():
+    translator.register_primitive_translator(ArithmeticOperationTranslator(pname, ptmpl))
+
+# Create the logical translators.
+for pname, (itmpl, btmpl) in _LOGICAL_OPERATION_TEMPLATES.items():
+    translator.register_primitive_translator(LogicalOperationTranslator(pname, itmpl, btmpl))
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
new file mode 100644
index 0000000..7f24160
--- /dev/null
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -0,0 +1,67 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""This implements the `broadcast_in_dim` primitive."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import dace
+from typing_extensions import override
+
+from jace import translator
+from jace.translator import mapped_operation_base_translator as mapped_base
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
+class BroadcastInDimTranslator(mapped_base.MappedOperationTranslatorBase):
+    """
+    Implements the `broadcast_in_dim` primitive.
+
+    The primitive is implemented through the `MappedOperationTranslatorBase` base.
+    Essentially it creates a copy, but also creates special Memlets that replicate
+    the content of the input.
+    """
+
+    def __init__(self) -> None:
+        super().__init__(primitive_name="broadcast_in_dim")
+
+    @override
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        return "__out = __in0"
+
+    @override
+    def make_input_memlets(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        if in_var_names[0] is None:
+            return {}
+        return {
+            "__in0": dace.Memlet.simple(
+                in_var_names[0],
+                ", ".join(tskl_ranges[bdim][0] for bdim in eqn.params["broadcast_dimensions"])
+                if eqn.params["broadcast_dimensions"]
+                else "0",
+            )
+        }
+
+
+translator.register_primitive_translator(BroadcastInDimTranslator())
diff --git a/src/jace/translator/primitive_translators/concatenate_translator.py b/src/jace/translator/primitive_translators/concatenate_translator.py
new file mode 100644
index 0000000..e8bd144
--- /dev/null
+++ b/src/jace/translator/primitive_translators/concatenate_translator.py
@@ -0,0 +1,87 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements the concatenation primitive."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import dace
+from typing_extensions import override
+
+from jace import translator, util
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
+class ConcatenateTranslator(translator.PrimitiveTranslator):
+    """
+    Implements the `concatenate` primitive.
+
+    It is implemented by a series of map that writes to the same access node.
+    It is probably the largest stretch of "written once" in the entire core.
+    """
+
+    @property
+    def primitive(self) -> str:  # noqa: D102  # No docstring needed.
+        return "concatenate"
+
+    @override
+    def __call__(
+        self,
+        builder: translator.JaxprTranslationBuilder,
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        if any(in_var_name is None for in_var_name in in_var_names):
+            raise NotImplementedError("Concatenate: No literal inputs supported.")
+
+        # Dimension along we concatenate.
+        cat_dim = eqn.params["dimension"]
+
+        # Offset counter for write back.
+        already_copied = 0
+
+        # This is the access node we use for the output
+        #  Is inside a dict for input to `add_mapped_tasklet()`.
+        output_nodes = {out_var_names[0]: eqn_state.add_write(out_var_names[0])}
+
+        # Now going over each input and copying the input in the correct location
+        #  of the output array.
+        for i, in_var_name in enumerate(in_var_names):
+            input_shape = util.get_jax_var_shape(eqn.invars[i])
+
+            tskl_range = [(f"__dim{d}", f"0:{dim_size}") for d, dim_size in enumerate(input_shape)]
+            tskl_input_access = [it_var for it_var, _ in tskl_range]
+
+            tskl_output_access = tskl_input_access.copy()
+            tskl_output_access[cat_dim] = f"{tskl_output_access[cat_dim]} + {already_copied}"
+
+            eqn_state.add_mapped_tasklet(
+                f"_concatenate_{out_var_names[0]}_{in_var_name}",
+                map_ranges=tskl_range,
+                inputs={"__in": dace.Memlet.simple(in_var_name, ", ".join(tskl_input_access))},
+                code="__out = __in",
+                outputs={
+                    "__out": dace.Memlet.simple(out_var_names[0], ",".join(tskl_output_access))
+                },
+                output_nodes=output_nodes,
+                external_edges=True,
+            )
+
+            # Update the counter that we have copied
+            already_copied += input_shape[cat_dim]
+
+
+_ = translator.register_primitive_translator(ConcatenateTranslator())
diff --git a/src/jace/translator/primitive_translators/conditions.py b/src/jace/translator/primitive_translators/conditions.py
new file mode 100644
index 0000000..d291016
--- /dev/null
+++ b/src/jace/translator/primitive_translators/conditions.py
@@ -0,0 +1,182 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements all conditions that are supported in JAX."""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+from typing import TYPE_CHECKING
+
+import dace
+
+from jace import translator, util
+from jace.translator import post_translation as ptranslation
+from jace.translator.primitive_translators import pjit_translator as pjit
+
+
+if TYPE_CHECKING:
+    from jax._src import core as jax_core
+
+
+@translator.register_primitive_translator()
+@translator.make_primitive_translator("cond")
+def condition_translator(
+    builder: translator.JaxprTranslationBuilder,
+    in_var_names: Sequence[str | None],
+    out_var_names: Sequence[str],
+    eqn: jax_core.JaxprEqn,
+    eqn_state: dace.SDFGState,
+) -> dace.SDFGState:
+    """
+    Implements the translation of the `cond` primitive, i.e. a scalar if.
+
+    XLA, JAX' backend, supports two versions, one in which the selector, i.e. the
+    variable indicating which branch should be executed is an integer or a boolean.
+
+    Args:
+        builder: The builder object of the translation.
+        in_var_names: The SDFG variables used an input arguments. First is the index,
+            the variable that selects the branch, the remaining ones are passed as
+            inputs to the branches.
+        out_var_names: Names of SDFG variables that should be used as outputs.
+        eqn: The equation that should be translated.
+        eqn_state: State into which the nested SDFG should be constructed.
+
+    Returns:
+        Because of the nature of this primitive, the translator has to construct
+        new states and will return the new SDFG state that serves as terminal state.
+
+    Note:
+        The implementation assumes that the selector, i.e. the variables indicating
+        which branch should be taken is inside its bound.
+    """
+    if util.get_jax_var_dtype(eqn.invars[0]) is dace.bool_:
+        return _cond_primitive_boolean_impl(
+            builder=builder,
+            in_var_names=in_var_names,
+            out_var_names=out_var_names,
+            eqn=eqn,
+            eqn_state=eqn_state,
+        )
+    return _cond_primitive_multi_switch_impl(
+        builder=builder,
+        in_var_names=in_var_names,
+        out_var_names=out_var_names,
+        eqn=eqn,
+        eqn_state=eqn_state,
+    )
+
+
+def _cond_primitive_multi_switch_impl(
+    builder: translator.JaxprTranslationBuilder,
+    in_var_names: Sequence[str | None],
+    out_var_names: Sequence[str],
+    eqn: jax_core.JaxprEqn,
+    eqn_state: dace.SDFGState,
+) -> dace.SDFGState:
+    """
+    Implements the integer version of the conditional primitive.
+
+    For arguments see `ConditionTranslator`.
+
+    This [version](https://openxla.org/xla/operation_semantics#conditional) is
+    essentially a C switch statement without a default branch.
+    """
+    # To make names in the SDFG unique we use the name of the equation state
+    name_pattern = eqn_state.name
+
+    # Promote all inputs to the branches to variables, this are all except the first
+    #  which is the selection variable.
+    branch_input_variable_names: list[str] = pjit._promote_literals_to_constants(
+        builder=builder,
+        var_names=in_var_names[1:],
+        jax_vars=eqn.invars[1:],
+        name_pattern=name_pattern,
+    )
+
+    if in_var_names[0] is None:
+        # The selection variable is a literal, so we will now pretend it is a symbol.
+        #  This also means that we do not need a state transition to promote the
+        #  variable to a symbol.
+        selection_symbol = str(util.get_jax_literal_value(eqn.invars[0]))
+        selection_state = eqn_state
+
+    else:
+        # The selection variable is an input.
+        #  For the implementation of the condition we need to promote the selection
+        #  variable to a symbol, for which we need an interstate edge.
+        #  As a side effect it will update the terminal state.
+        selection_variable_name = in_var_names[0]
+        selection_symbol = f"{selection_variable_name}_symb"
+
+        selection_state = builder.append_new_state(
+            label=f"{name_pattern}_fork",
+            assignments={selection_symbol: selection_variable_name},
+            prev_state=eqn_state,
+        )
+
+    # Now iterate through all branches, translate them and integrate them
+    #  for each branch we will generate a dedicated state.
+    branch_states: list[dace.SDFGState] = []
+    for i, branch_jaxpr in enumerate(eqn.params["branches"]):
+        branch_pattern = f"{name_pattern}_{{}}_branch_{i}"
+        branch_ctx = builder.translate_jaxpr(jaxpr=branch_jaxpr, name=branch_pattern.format("sdfg"))
+
+        # This will update the terminal state only the first time.
+        branch_state = builder.append_new_state(
+            label=branch_pattern.format("state"),
+            condition=f"{selection_symbol} == {i}",
+            prev_state=selection_state,
+        )
+
+        # Integrating it.
+        ptranslation.add_nested_sdfg(
+            state=branch_state,
+            child_ctx=branch_ctx,
+            parent_ctx=builder._ctx,
+            in_var_names=branch_input_variable_names,
+            out_var_names=out_var_names,
+        )
+        branch_states.append(branch_state)
+
+    # Now we have to generate a join state that will serve as new terminal state.
+    #  We append it to the first branch state, which is the current terminal state.
+    assert builder._terminal_sdfg_state is branch_states[0]
+    terminal_state = builder.append_new_state(
+        label=f"{name_pattern}_join",
+        prev_state=branch_states[0],
+    )
+    for branch_state in branch_states[1:]:
+        builder.sdfg.add_edge(
+            branch_state,
+            terminal_state,
+            dace.sdfg.InterstateEdge(),
+        )
+
+    # We return it, because otherwise the builder will assume that `eqn_state` was used.
+    return terminal_state
+
+
+def _cond_primitive_boolean_impl(
+    builder: translator.JaxprTranslationBuilder,  # noqa: ARG001 [unused-function-argument]
+    in_var_names: Sequence[str | None],  # noqa: ARG001 [unused-function-argument]
+    out_var_names: Sequence[str],  # noqa: ARG001 [unused-function-argument]
+    eqn: jax_core.JaxprEqn,  # noqa: ARG001 [unused-function-argument]
+    eqn_state: dace.SDFGState,  # noqa: ARG001 [unused-function-argument]
+) -> dace.SDFGState:
+    """
+    Implements the case the selector of the primitive is a bool.
+
+    XLA explicitly provides this
+    [form of the primitive](https://openxla.org/xla/operation_semantics#conditional)
+    JAX however, does not seem to use it and instead forwards it to the integer
+    implementation.
+    JaCe will not implement it and instead generate an error.
+    """
+    # NOTE: This is mostly to notice if JAX decided to implement that branch.
+    raise NotImplementedError("The boolean conditional primitive is not implemented.")
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
new file mode 100644
index 0000000..ee05a2a
--- /dev/null
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -0,0 +1,85 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements the translator for the `convert_element_type` primitive."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import dace
+from typing_extensions import override
+
+from jace import translator, util
+from jace.translator import mapped_operation_base_translator as mapped_base
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
+class ConvertElementTypeTranslator(mapped_base.MappedOperationTranslatorBase):
+    """
+    Implements the `convert_element_type` primitive.
+
+    The primitive will expand to a "copy Map", however, the Tasklet will not
+    simply copy the input to the output, but also perform type conversion.
+    However, in cases where the input type is the same as the output type,
+    the Tasklet will just be a copy Tasklet, that can then be removed by DaCe.
+
+    Note:
+        This translator ignores the `new_dtype` and `weak_type` parameters of
+        the equation and only performs the casting based on the type of the fields.
+    """
+
+    def __init__(self) -> None:
+        super().__init__(primitive_name="convert_element_type")
+
+    @override
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        if in_var_names[0] is None:
+            raise NotImplementedError("'convert_element_type' is not supported for literals.")
+
+        in_dtype = util.get_jax_var_dtype(eqn.invars[0]).type
+        in_dtype_s: str = in_dtype.__name__
+        out_dtype = util.get_jax_var_dtype(eqn.outvars[0]).type
+        out_dtype_s: str = out_dtype.__name__
+
+        # This is the base of the template that we use for conversion. You should notice
+        #  that the Tasklet `__out = __in0` will fail, see commit `f5aabc3` of the
+        #  prototype. Thus we have to do it in this way.
+        conv_code = "__in0"
+
+        if in_dtype == out_dtype:
+            # For some reason Jax sometimes adds conversions where no are needed. In
+            #  these cases we explicitly create a copy Tasklet, which is trivial and can
+            #  be removed by DaCe.
+            # TODO(phimuell): Create a Memlet instead.
+            return f"__out = {conv_code}"
+
+        if in_dtype_s.startswith("bool"):
+            # Interestingly `__out = int(__in0)` will not work.
+            conv_code = f"(1 if {conv_code} else 0)"
+        if out_dtype_s.startswith("bool"):
+            conv_code = f"dace.bool_({conv_code})"
+        elif hasattr(dace.dtypes, out_dtype_s):
+            conv_code = f"dace.{out_dtype_s}({conv_code})"
+        else:
+            raise NotImplementedError(
+                f"Cannot convert '{in_dtype}' to '{out_dtype}' as this type is not known to DaCe."
+            )
+        return f"__out = {conv_code}"
+
+
+_ = translator.register_primitive_translator(ConvertElementTypeTranslator())
diff --git a/src/jace/translator/primitive_translators/copy_translator.py b/src/jace/translator/primitive_translators/copy_translator.py
new file mode 100644
index 0000000..6de5ab9
--- /dev/null
+++ b/src/jace/translator/primitive_translators/copy_translator.py
@@ -0,0 +1,92 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements the translator related to data movement."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import dace
+from typing_extensions import override
+
+from jace import translator
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
+class CopyTranslator(translator.PrimitiveTranslator):
+    """
+    Implements the `copy` primitive.
+
+    The translator is implemented by using a Memlet.
+    """
+
+    @property
+    def primitive(self) -> str:  # noqa: D102  # No docstring needed.
+        return "copy"
+
+    def __call__(  # noqa: D102  # No docstring
+        self,
+        builder: translator.JaxprTranslationBuilder,
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jax_core.JaxprEqn,  # noqa: ARG002
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        eqn_state.add_nedge(
+            eqn_state.add_read(in_var_names[0]),
+            eqn_state.add_write(out_var_names[0]),
+            dace.Memlet.from_array(
+                in_var_names[0],
+                builder.arrays[in_var_names[0]],  # type: ignore[index]  # Guaranteed to be a string
+            ),
+        )
+
+
+class DevicePutTranslator(CopyTranslator):
+    """
+    Implements the `device_put` primitive.
+
+    In Jax this primitive is used to copy data between the host and the device,
+    in DaCe Memlets can do this. However, because of the way JaCe operates, at
+    least in the beginning a computation is either fully on the host or on the
+    device this copy will essentially perform a copying.
+    """
+
+    @property
+    def primitive(self) -> str:  # noqa: D102  # No docstring
+        return "device_put"
+
+    @override
+    def __call__(  # No docstring
+        self,
+        builder: translator.JaxprTranslationBuilder,
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        if not (eqn.params["device"] is None and eqn.params["src"] is None):
+            raise NotImplementedError(
+                f"Can only copy on the host, but not from {eqn.params['src']} to {eqn.params['device']}."
+            )
+        return super().__call__(
+            builder=builder,
+            in_var_names=in_var_names,
+            out_var_names=out_var_names,
+            eqn=eqn,
+            eqn_state=eqn_state,
+        )
+
+
+_ = translator.register_primitive_translator(CopyTranslator())
+_ = translator.register_primitive_translator(DevicePutTranslator())
diff --git a/src/jace/translator/primitive_translators/gather_translator.py b/src/jace/translator/primitive_translators/gather_translator.py
new file mode 100644
index 0000000..343ee15
--- /dev/null
+++ b/src/jace/translator/primitive_translators/gather_translator.py
@@ -0,0 +1,211 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements the translator for the `gather` primitive."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import dace
+from jax import lax as jax_lax
+from typing_extensions import override
+
+from jace import translator, util
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
+class GatherTranslator(translator.PrimitiveTranslator):
+    """
+    Garther Translator.
+
+    The gather operation extracts patches of a certain size, known as `slice_size`,
+    from an array, called source or input array. Where these patches starts is
+    given by another array, the index array.
+
+    See Also:
+        https://www.tensorflow.org/xla/operation_semantics#gather
+        https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.gather.html
+    """
+
+    @property
+    def primitive(self) -> str:  # noqa: D102  # No docstring needed.
+        return "gather"
+
+    @override
+    def __call__(  # noqa: PLR0914, PLR0915  # Just ported from the prototype, cleanup postponed.
+        self,
+        builder: translator.JaxprTranslationBuilder,
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        """
+        Performs the gather operation.
+
+        Args:
+            builder: The builder object that is active.
+            in_var_names: The names of the input variables, the first array is
+                assumed as source array and the second is the index array.
+            out_var_names: The names of the output variables.
+            eqn: The equation to translate.
+            eqn_state: The state in which we put the extraction.
+        """
+        assert len(eqn.invars) == 2  # noqa: PLR2004  # XLA supports more inputs.
+
+        out_name = out_var_names[0]
+        out_shape = util.get_jax_var_shape(eqn.outvars[0])
+
+        src_name = in_var_names[0]
+        src_shape = util.get_jax_var_shape(eqn.invars[0])
+
+        idx_name = in_var_names[1]
+        idx_shape = util.get_jax_var_shape(eqn.invars[1])
+
+        dimension_numbers = eqn.params["dimension_numbers"]
+        offset_dims: Sequence[int] = dimension_numbers.offset_dims
+        collapsed_slice_dims: Sequence[int] = dimension_numbers.collapsed_slice_dims
+        start_index_map: Sequence[int] = dimension_numbers.start_index_map
+        slice_sizes: Sequence[int] = eqn.params["slice_sizes"]
+        mode: jax_lax.GatherScatterMode = eqn.params["mode"]
+        assert len(start_index_map) == idx_shape[-1]
+
+        if mode != jax_lax.GatherScatterMode.PROMISE_IN_BOUNDS:
+            raise NotImplementedError(f"The mode {mode} is not implemented.")
+
+        # Over these dimensions the copy of the patches goes.
+        batch_dims = tuple(d for d in range(len(out_shape)) if d not in offset_dims)
+
+        # Every batch dimension is associated with one dimension of of the index
+        #  array, but there is always one dimension more in the index array. This
+        #  dimension contains the start indexes of the slice, if there is only
+        #  one index that should be loaded is not strictly necessary, but Jax
+        #  (currently adds) it implicitly, probably to make life easier.
+        if (len(batch_dims) + 1) != len(idx_shape):
+            raise ValueError(
+                f"Expected that the index array has {len(batch_dims) + 1} dimensions, but it had {len(idx_shape)}."
+            )
+
+        # These are the dimensions (of the input) for which a map index is created.
+        #  Note that we exclude collapsed dimensions here.
+        src_dim_with_map_idx = tuple(
+            dim for dim in range(len(slice_sizes)) if dim not in collapsed_slice_dims
+        )
+        assert len(src_dim_with_map_idx) == len(offset_dims)
+
+        # The final map is the composition of two loops. The first map iterates over
+        #  the index array, except the last dimension, and is used to "copy" the
+        #  different patches from the source to the output array. These map parameters
+        #  follow the pattern `__i{out_name}_gather{bd}`, where `bd` is a batch
+        #  dimension. These variables are used to access the index array.
+        #  The second loop performs the actual copy of the slices. For these
+        #  the variables `__i{i}` is used were, these are known as offset
+        #  dimensions.
+        #  What is a bit difficult, that the actual access/dereferencing of the source
+        #  array is done within the tasklet.
+
+        # Access pattern of the source array _within_ the tasklet.
+        src_access_pattern: list[str] = []
+
+        # These are the map ranges for the coying of the slicing.
+        slice_map_ranges: list[tuple[str, str]] = []
+
+        # Compute the access pattern within the tasklet.
+        #  As a side effect we also compute the map ranges, but only for the slices.
+        for dim, slice_size in enumerate(slice_sizes):
+            # Order is important!
+            if dim not in start_index_map:
+                # This dimension is fully copied
+                slice_map_ranges.append((f"__i{dim}", f"0:{slice_size}"))
+                src_access_pattern.append(slice_map_ranges[-1][0])
+                assert dim in src_dim_with_map_idx
+                assert slice_size == src_shape[dim]
+
+            elif dim in collapsed_slice_dims:
+                # This dimension is only partially copied, however, since the
+                #  dimension is collapsed, only a single element is copied that
+                #  comes from the index array.
+                src_access_pattern.append(f"__gather_{dim}")
+
+            else:
+                # This dimension is partially copied, but is _not colapsed_, we need
+                #  a map index to copy the range. However, there is also an offset
+                #  that is involved from copying.
+                slice_map_ranges.append((f"__i{dim}", f"0:{slice_size}"))
+                src_access_pattern.append(f"__gather_{dim} + {slice_map_ranges[-1][0]}")
+                assert dim in src_dim_with_map_idx
+                assert slice_size <= src_shape[dim]
+
+        # These are the map variable that go over the index array.
+        patch_loop_vars = tuple(f"__i{out_name}_gather{bd}" for bd in batch_dims)
+        patch_map_ranges = [
+            (map_param, f"0:{patch_loop_bound}")
+            for map_param, patch_loop_bound in zip(patch_loop_vars, idx_shape[:-1])
+        ]
+
+        # Creating the input memlet that allows us to access the source array from
+        #  inside the tasklet and make it accessible through the name `__arr`. At
+        #  this point it is not possible to tell where we access, because we are
+        #  missing a index variables, they will only be accessible inside the
+        #  tasklet (see below), however, we know that we will access only one
+        #  element from the array.
+        tasklet_inputs: dict[str, dace.Memlet] = {
+            "__arr": dace.Memlet.simple(
+                data=src_name,
+                subset_str=", ".join(f"0:{size}" for size in src_shape),
+                num_accesses=1,
+            ),
+        }
+
+        # Now we are creating the memlets that access the index array.
+        for i, dim in enumerate(start_index_map):
+            tasklet_inputs[f"__gather_{dim}"] = dace.Memlet.simple(
+                data=idx_name, subset_str=(", ".join(patch_loop_vars) + f", {i}")
+            )
+
+        # The tasklet code.
+        tasklet_code = "__out = __arr[" + ", ".join(src_access_pattern) + "]"
+
+        # Now we generate the output memlet.
+        outpt_access_pattern: list[str] = []
+        dim_counter = 0
+        for dim in range(len(out_shape)):
+            if dim in batch_dims:
+                # This is a batch dimension, thus a loop variable is used for it.
+                patch_loop_var = patch_loop_vars[batch_dims.index(dim)]
+                outpt_access_pattern.append(str(patch_loop_var))
+
+            else:
+                # This is a dimension for copying the slices.
+                assert dim_counter <= len(src_dim_with_map_idx)
+                associated_map_idx = src_dim_with_map_idx[dim_counter]
+                dim_counter += 1
+                outpt_access_pattern.append(f"__i{associated_map_idx}")
+        assert dim_counter == len(src_dim_with_map_idx)
+
+        tasklet_outputs: dict[str, dace.Memlet] = {
+            "__out": dace.Memlet.simple(data=out_name, subset_str=", ".join(outpt_access_pattern))
+        }
+        assert len(patch_map_ranges) + len(slice_map_ranges) == len(out_shape)
+
+        eqn_state.add_mapped_tasklet(
+            name=f"_gather_map_{out_name}",
+            map_ranges=patch_map_ranges + slice_map_ranges,
+            inputs=tasklet_inputs,
+            code=tasklet_code,
+            outputs=tasklet_outputs,
+            external_edges=True,
+        )
+
+
+_ = translator.register_primitive_translator(GatherTranslator())
diff --git a/src/jace/translator/primitive_translators/iota_translator.py b/src/jace/translator/primitive_translators/iota_translator.py
new file mode 100644
index 0000000..ce0d99f
--- /dev/null
+++ b/src/jace/translator/primitive_translators/iota_translator.py
@@ -0,0 +1,56 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""This implements the `iota` primitive."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+from typing_extensions import override
+
+from jace import translator
+from jace.translator import mapped_operation_base_translator as mapped_base
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    import dace
+    from jax import core as jax_core
+
+
+class IotaTranslator(mapped_base.MappedOperationTranslatorBase):
+    """
+    Implements the `iota` primitive.
+
+    Essentially, a very general `jnp.arange()` function.
+    """
+
+    def __init__(self) -> None:
+        super().__init__(primitive_name="iota")
+
+    @override
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        return f"__out = {tskl_ranges[eqn.params['dimension']][0]}"
+
+    @override
+    def make_input_memlets(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        return {}
+
+
+translator.register_primitive_translator(IotaTranslator())
diff --git a/src/jace/translator/primitive_translators/pjit_translator.py b/src/jace/translator/primitive_translators/pjit_translator.py
new file mode 100644
index 0000000..59bfd7e
--- /dev/null
+++ b/src/jace/translator/primitive_translators/pjit_translator.py
@@ -0,0 +1,147 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements the `pjit` translator, i.e. nested Jaxpr expressions."""
+
+from __future__ import annotations
+
+import re
+from collections.abc import Sequence
+from typing import TYPE_CHECKING, Any
+
+from jax._src import sharding_impls as jax_sharding  # noqa: PLC2701 [import-private-name]
+
+from jace import translator, util
+from jace.translator import post_translation as ptranslation
+
+
+if TYPE_CHECKING:
+    import dace
+    from jax._src import core as jax_core
+
+
+def _promote_literals_to_constants(
+    builder: translator.JaxprTranslationBuilder,
+    var_names: Sequence[str | None],
+    jax_vars: Sequence[jax_core.Atom],
+    name_pattern: str,
+) -> list[str]:
+    """
+    Promotes all literals in `var_names` to DaCe constants and add them to the SDFG.
+
+    The function assumes that `var_names` are the SDFG variables equivalents of
+    `jax_vars`, as by convention `None` indicates a literal. The function will create
+    a constant for each literal and return `var_names` cleared of all literals.
+    For naming the variables the function will use `name_pattern`.
+
+    Args:
+        builder: The builder that is used for translation.
+        var_names: Names of the SDFG variables, `None` indicates a literal.
+        jax_vars: The JAX variables, in the same order than `var_names`.
+        name_pattern: A pattern to generate a unique name for the variables.
+
+    Todo:
+        Is a constant the right idea or should we generate a symbol?
+    """
+    promoted_var_names: list[str] = []
+    for i, var_name in enumerate(var_names):
+        if var_name is None:
+            promoted_var_name = f"__const_{name_pattern}_literal_promotion_{i}"
+            jax_var = jax_vars[i]
+            promoted_jace_var = util.JaCeVar.from_atom(
+                jax_var=jax_var,
+                name=promoted_var_name,
+            )
+            builder.add_array(promoted_jace_var)
+            builder.sdfg.add_constant(
+                promoted_var_name,
+                util.get_jax_literal_value(jax_var),
+                builder.arrays[promoted_var_name],
+            )
+
+        else:
+            # Already an SDFG variable, so nothing to do.
+            promoted_var_name = var_name
+        promoted_var_names.append(promoted_var_name)
+    return promoted_var_names
+
+
+@translator.register_primitive_translator()
+@translator.make_primitive_translator("pjit")
+def PJITTranslator(  # noqa: N802 [invalid-function-name]
+    builder: translator.JaxprTranslationBuilder,
+    in_var_names: Sequence[str | None],
+    out_var_names: Sequence[str],
+    eqn: jax_core.JaxprEqn,
+    eqn_state: dace.SDFGState,
+) -> None:
+    """
+    Implements the `pjit` translator that handles nested Jaxpr.
+
+    `pjit` primitives in JAX represents nested calls, for example the body of a scan
+    is inside a nested Jaxpr. However, `pjit` is used to indicate that a computation
+    should be done on the device or on sharded memory.
+
+    However, due to the current state and working of JaCe, this aspect is essentially
+    ignored and the computation is always inlined.
+
+    In case an input is a literal the translator will create a constant for it.
+
+    Args:
+        builder: The builder object of the translation.
+        in_var_names: Names of the SDFG variables that should be used as inputs
+            inside the parent SDFG.
+        out_var_names: Names of SDFG variables that should be used as outputs
+            inside the parent SDFG.
+        eqn: The equation that contains the `pjit` primitive.
+        eqn_state: State into which the nested SDFG should be constructed.
+    """
+    params: dict[str, Any] = eqn.params
+    nested_jaxpr: jax_core.ClosedJaxpr = params["jaxpr"]
+    in_shardings = params["in_shardings"]
+    out_shardings = params["out_shardings"]
+    _ = params["donated_invars"]  # Always ignored
+    _ = params["keep_unused"]
+    _ = params["inline"]
+
+    if not all(in_sharding is jax_sharding.UNSPECIFIED for in_sharding in in_shardings):
+        raise NotImplementedError("Currently 'pjit' does not support sharding in its input.")
+    if not all(out_sharding is jax_sharding.UNSPECIFIED for out_sharding in out_shardings):
+        raise NotImplementedError("Currently 'pjit' does not support sharding in its output.")
+
+    # TODO(phimuell): Controlflow region and name
+    pjit_name = params["name"]
+
+    # TODO(phimuell): Controlflow region and name
+    #  They will introduce a feature like that to address them in optimizations.
+    pjit_name = params["name"]
+
+    # Name in SDFG must be unique, thus we mangle it, furthermore, we have to clean it.
+    sdfg_name = f"pjit_{re.subn('[^a-zA-Z0-9_]', '_', pjit_name)[0]}__{'_'.join(out_var_names)}"
+
+    # Ensure that all inputs are SDFG variables
+    final_input_names = _promote_literals_to_constants(
+        builder=builder,
+        var_names=in_var_names,
+        jax_vars=eqn.invars,
+        name_pattern=sdfg_name,
+    )
+
+    # Now get the translated SDFG.
+    nested_context: translator.TranslationContext = builder.translate_jaxpr(
+        jaxpr=nested_jaxpr,
+        name=sdfg_name,
+    )
+
+    # Now lets add the nested SDFG
+    ptranslation.add_nested_sdfg(
+        state=eqn_state,
+        child_ctx=nested_context,
+        parent_ctx=builder._ctx,
+        in_var_names=final_input_names,
+        out_var_names=out_var_names,
+    )
diff --git a/src/jace/translator/primitive_translators/reshape_translator.py b/src/jace/translator/primitive_translators/reshape_translator.py
new file mode 100644
index 0000000..241cc94
--- /dev/null
+++ b/src/jace/translator/primitive_translators/reshape_translator.py
@@ -0,0 +1,67 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements the translator for the `reshape` primitive."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import dace
+from typing_extensions import override
+
+from jace import translator, util
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
+class ReshapeTranslator(translator.PrimitiveTranslator):
+    """
+    Implements the `reshape` primitive.
+
+    The current implementation uses a Memlet for this and essentially acts as
+    an optimization barrier. Furthermore the Jax primitive also has the optional
+    `dimensions` parameters which allows to permute the input, this is not
+    supported.
+    """
+
+    @property
+    def primitive(self) -> str:  # noqa: D102  # No docstring needed.
+        return "reshape"
+
+    @override
+    def __call__(
+        self,
+        builder: translator.JaxprTranslationBuilder,
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        """
+        Performs the reshaping.
+
+        Currently a copy using a Memlet is performed.
+        """
+        if eqn.params["dimensions"] is not None:
+            raise NotImplementedError("Currently 'dimensions' must be 'None'.")
+        eqn_state.add_nedge(
+            eqn_state.add_read(in_var_names[0]),
+            eqn_state.add_write(out_var_names[0]),
+            dace.Memlet(
+                data=in_var_names[0],
+                subset=", ".join(f"0:{size}" for size in util.get_jax_var_shape(eqn.invars[0])),
+                other_subset=", ".join(f"0:{size}" for size in eqn.params["new_sizes"]),
+            ),
+        )
+
+
+translator.register_primitive_translator(ReshapeTranslator())
diff --git a/src/jace/translator/primitive_translators/select_n_translator.py b/src/jace/translator/primitive_translators/select_n_translator.py
new file mode 100644
index 0000000..51b27b3
--- /dev/null
+++ b/src/jace/translator/primitive_translators/select_n_translator.py
@@ -0,0 +1,94 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements `select_n`."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import dace
+from typing_extensions import override
+
+from jace import translator, util
+from jace.translator import mapped_operation_base_translator as mapped_base
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
+class SelectNTranslator(mapped_base.MappedOperationTranslatorBase):
+    """
+    Implements the `select_n` primitive.
+
+    The `select_n` primitive is a generalization of `np.where`, that can take an
+    arbitrary number of branches, which are selected by an integer predicate.
+    The behaviour is undefined if the predicate is out of bound.
+
+    Note:
+        For a better understanding this function renames its input connectors.
+        The first one, which is the predicate, is renamed to `__cond` and the
+        others are renamed again to `__in{i}`, starting with zero.
+
+    Todo:
+        Implement the primitive as a nested SDFG.
+    """
+
+    def __init__(self) -> None:
+        super().__init__(primitive_name="select_n")
+
+    @override
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        if len(in_var_names) == 3:  # noqa: PLR2004  # `3` is not magic.
+            # This order is correct, since `False` is interpreted as `0`, which means
+            #  the first case. DaCe seems to have some problems with bools and integer
+            #  casting around, so we handle the bool case explicitly here.
+            #  See also `ConvertElementTypeTranslator`.
+            return "__out = __in1 if __cond else __in0"
+
+        return "\n".join(
+            ["if __cond == 0:  __out = __in0"]
+            + [f"elif __cond == {i}: __out = __in{i}" for i in range(1, len(in_var_names) - 1)]
+        )
+
+    @override
+    def make_input_memlets(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        return {
+            f"__in{i - 1}" if i else "__cond": dace.Memlet.simple(
+                in_var_name, ", ".join(f"{it_idx}" for it_idx, _ in tskl_ranges)
+            )
+            for i, in_var_name in enumerate(in_var_names)
+            if in_var_name
+        }
+
+    @override
+    def literal_substitution(
+        self, tskl_code: str, in_var_names: Sequence[str | None], eqn: jax_core.JaxprEqn
+    ) -> str:
+        assert in_var_names[0]  # Condition can never be a literal.
+        for i, in_var_name in enumerate(in_var_names[1:]):
+            if in_var_name is not None:
+                continue
+            t_val = util.get_jax_literal_value(eqn.invars[i + 1])
+            tskl_code = tskl_code.replace(f"__in{i}", str(t_val))
+        return tskl_code
+
+
+translator.register_primitive_translator(SelectNTranslator())
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
new file mode 100644
index 0000000..ae4f167
--- /dev/null
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -0,0 +1,198 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements slicing."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import dace
+from typing_extensions import override
+
+from jace import translator, util
+from jace.translator import mapped_operation_base_translator as mapped_base
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
+class SlicingTranslator(mapped_base.MappedOperationTranslatorBase):
+    """
+    Implements the `slice` primitive.
+
+    This is the classical slicing operation which extracts a fixed sized window
+    from a fixed initial position. The slicing is implemented using a partial copy.
+
+    Note:
+        Slices are essentially optimization barriers as they can not be fused
+        with Maps before them.
+    """
+
+    def __init__(self) -> None:
+        super().__init__(primitive_name="slice")
+
+    @override
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        return "__out = __in0"
+
+    @override
+    def make_input_memlets(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        """We have to add the offsets to the Memlet accesses."""
+        strides: Sequence[int] = (
+            ((1,) * len(tskl_ranges)) if eqn.params["strides"] is None else eqn.params["strides"]
+        )
+        start_indices: Sequence[int] = eqn.params["start_indices"]  # Fist index to slice
+        return {
+            "__in0": dace.Memlet.simple(
+                in_var_names[0],
+                ", ".join(
+                    f"{start_index} + {it_idx} * {stride}"
+                    for (it_idx, _), start_index, stride in zip(tskl_ranges, start_indices, strides)
+                ),
+            )
+        }
+
+
+class DynamicSlicingTranslator(translator.PrimitiveTranslator):
+    """
+    Implements the `dynamic_slice` primitive.
+
+    [Dynamic slicing](https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.dynamic_slice.html)
+    performs a slicing of a _fixed_ window, but the start of the window is
+    not fix, instead it is passed by variables. Furthermore, (as it is in Jax),
+    if the window would overrun the start indexes are adjusted.
+
+    Todo:
+        - Prevent that the modified start indexes are promoted to symbols,
+            to ensure mergability.
+    """
+
+    @property
+    def primitive(self) -> str:  # noqa: D102  # No docstring needed.
+        return "dynamic_slice"
+
+    @override
+    def __call__(
+        self,
+        builder: translator.JaxprTranslationBuilder,
+        in_var_names: Sequence[str | None],
+        out_var_names: Sequence[str],
+        eqn: jax_core.JaxprEqn,
+        eqn_state: dace.SDFGState,
+    ) -> None:
+        assert in_var_names[0]
+        assert len(in_var_names) == len(util.get_jax_var_shape(eqn.invars[0])) + 1
+
+        # This is the sizes of the slice window.
+        window_sizes: Sequence[int] = eqn.params["slice_sizes"]
+
+        # Maps the variable name, that stores the start index of the window in one
+        #  dimensions to the access node, that holds the value. The variable name
+        #  is also used as dynamic range offset.
+        #  Only present if the index is not a literal.
+        in_access: dict[str, dace.nodes.AccessNode] = {}
+
+        # Name of the variable from where we get the start index of the window
+        #  or the value itself, if it is a literal; in the order of the dimension.
+        #  If the value is `None` then the literal was not yet processed.
+        window_start_indices: list[str | None] = list(in_var_names[1:])
+
+        # We will always adapt the start indexes and not check if it is needed.
+        for dim, (window_start_index, dim_size, window_size) in enumerate(
+            zip(window_start_indices, util.get_jax_var_shape(eqn.invars[0]), window_sizes)
+        ):
+            if window_start_index is None:
+                # Jax does not adjust the literals on its own
+                raw_window_start = int(util.get_jax_literal_value(eqn.invars[dim + 1]))  # type: ignore[arg-type]  # type confusion
+                adjusted_window_start = min(dim_size, raw_window_start + window_size) - window_size
+                window_start_indices[dim] = str(adjusted_window_start)
+                continue
+
+            # We do not use a symbol for the start of the window but a Tasklet, as
+            #  a symbol would need an interstage edge, which is an optimization barrier.
+            tasklet = dace.nodes.Tasklet(
+                label=f"adjustment_of_slice_start_{window_start_index}_for_{out_var_names[0]}",
+                inputs={"unadjusted_start_idx": None},
+                outputs={"adjusted_start_idx": None},
+                code=f"adjusted_start_idx = min(unadjusted_start_idx + {window_size}, {dim_size}) - {window_size}",
+            )
+            new_start_idx_var_name = builder.add_array(
+                eqn.invars[dim + 1], name_prefix="__jace_adapted_start_idx_"
+            )
+            new_start_idx_acc = eqn_state.add_access(new_start_idx_var_name)
+
+            eqn_state.add_edge(
+                eqn_state.add_read(window_start_index),
+                None,
+                tasklet,
+                "unadjusted_start_idx",
+                dace.Memlet.simple(window_start_index, "0"),
+            )
+            eqn_state.add_edge(
+                tasklet,
+                "adjusted_start_idx",
+                new_start_idx_acc,
+                None,
+                dace.Memlet.simple(new_start_idx_var_name, "0"),
+            )
+            # Update the name of the start index, and store the access
+            #  node for later use.
+            window_start_indices[dim] = new_start_idx_var_name
+            in_access[new_start_idx_var_name] = new_start_idx_acc
+
+        tskl_ranges: list[tuple[str, str]] = [
+            (f"__i{dim}", f"0:{N}") for dim, N in enumerate(util.get_jax_var_shape(eqn.outvars[0]))
+        ]
+
+        memlet_accesses: list[str] = []
+
+        for (it_var, _), offset_symbol_name in zip(tskl_ranges, window_start_indices):
+            assert offset_symbol_name is not None
+            memlet_accesses.append(f"{it_var} + {offset_symbol_name}")
+
+        tskl_input = dace.Memlet.simple(in_var_names[0], ", ".join(memlet_accesses))
+        tskl_output = dace.Memlet.simple(
+            out_var_names[0], ", ".join(name for name, _ in tskl_ranges)
+        )
+        _, map_entry, _ = eqn_state.add_mapped_tasklet(
+            name=f"{self.primitive}_{out_var_names[0]}",
+            map_ranges=tskl_ranges,
+            inputs={"__in": tskl_input},
+            code="__out = __in",
+            outputs={"__out": tskl_output},
+            external_edges=True,
+        )
+
+        # Creating the inputs for the dynamic map ranges. We have to use the same
+        #  access nodes as above, to ensure a single order of computation.
+        for window_start_index_name, windows_start_access_node in in_access.items():
+            eqn_state.add_edge(
+                windows_start_access_node,
+                None,
+                map_entry,
+                window_start_index_name,
+                dace.Memlet.simple(window_start_index_name, "0"),
+            )
+            map_entry.add_in_connector(window_start_index_name)
+
+
+translator.register_primitive_translator(SlicingTranslator())
+translator.register_primitive_translator(DynamicSlicingTranslator())
diff --git a/src/jace/translator/primitive_translators/squeeze_translator.py b/src/jace/translator/primitive_translators/squeeze_translator.py
new file mode 100644
index 0000000..de6f1f4
--- /dev/null
+++ b/src/jace/translator/primitive_translators/squeeze_translator.py
@@ -0,0 +1,69 @@
+# JaCe - JAX Just-In-Time compilation using DaCe (Data Centric Parallel Programming)
+#
+# Copyright (c) 2024, ETH Zurich
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+
+"""Implements the `squeeze` primitive."""
+
+from __future__ import annotations
+
+import itertools
+from typing import TYPE_CHECKING
+
+import dace
+from typing_extensions import override
+
+from jace import translator, util
+from jace.translator import mapped_operation_base_translator as mapped_base
+
+
+if TYPE_CHECKING:
+    from collections.abc import Sequence
+
+    from jax import core as jax_core
+
+
+class SqueezeTranslator(mapped_base.MappedOperationTranslatorBase):
+    """
+    Implements the `squeeze` primitive.
+
+    The primitives allows to remove dimensions of size one. Essentially
+    equivalent to `np.squeeze` and the inverse to `np.expand_dims()`.
+    """
+
+    def __init__(self) -> None:
+        super().__init__(primitive_name="squeeze")
+
+    @override
+    def write_tasklet_code(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> str:
+        return "__out = __in0"
+
+    @override
+    def make_input_memlets(
+        self,
+        tskl_ranges: Sequence[tuple[str, str]],
+        in_var_names: Sequence[str | None],
+        eqn: jax_core.JaxprEqn,
+    ) -> dict[str, dace.Memlet]:
+        dims_to_delete: Sequence[str] = eqn.params["dimensions"]
+        in_rank: int = len(util.get_jax_var_shape(eqn.invars[0]))
+        cnt = itertools.count(0)
+        return {
+            "__in0": dace.Memlet.simple(
+                in_var_names[0],
+                ", ".join(
+                    "0" if dim in dims_to_delete else tskl_ranges[next(cnt)][0]
+                    for dim in range(in_rank)
+                ),
+            )
+        }
+
+
+translator.register_primitive_translator(SqueezeTranslator())
diff --git a/src/jace/util/jax_helper.py b/src/jace/util/jax_helper.py
index bc2de21..7c9f2f0 100644
--- a/src/jace/util/jax_helper.py
+++ b/src/jace/util/jax_helper.py
@@ -81,6 +81,27 @@ def __eq__(self, other: Any) -> bool:
             return NotImplemented
         return id(self) == id(other)
 
+    @classmethod
+    def from_atom(
+        cls,
+        jax_var: jax_core.Atom,
+        name: str | None,
+    ) -> JaCeVar:
+        """
+        Generates a `JaCeVar` from the JAX variable `jax_var`.
+
+        If `jax_var` is a literal its value is ignored.
+
+        Args:
+            jax_var: The variable to process.
+            name: The optional name of the variable.
+        """
+        return cls(
+            shape=get_jax_var_shape(jax_var),
+            dtype=get_jax_var_dtype(jax_var),
+            name=name,
+        )
+
 
 def get_jax_var_name(jax_var: jax_core.Atom | JaCeVar) -> str:
     """Returns the name of `jax_var` as a string."""

From 25616ae13f12a4d4d6574e9740b632496b5e757e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 13 Sep 2024 15:20:35 +0200
Subject: [PATCH 442/458] Modified the condition primitive.

Before it was implementewd as a switch, for the case JAX would use the bool overload of XLA.
The check for this was now essentially moved inside the function.
---
 .../primitive_translators/conditions.py       | 58 ++-----------------
 1 file changed, 6 insertions(+), 52 deletions(-)

diff --git a/src/jace/translator/primitive_translators/conditions.py b/src/jace/translator/primitive_translators/conditions.py
index d291016..38ba2c2 100644
--- a/src/jace/translator/primitive_translators/conditions.py
+++ b/src/jace/translator/primitive_translators/conditions.py
@@ -52,41 +52,15 @@ def condition_translator(
         new states and will return the new SDFG state that serves as terminal state.
 
     Note:
-        The implementation assumes that the selector, i.e. the variables indicating
-        which branch should be taken is inside its bound.
+        This function essentially implements a C `switch` statement, however, there
+        is no default branch.
     """
     if util.get_jax_var_dtype(eqn.invars[0]) is dace.bool_:
-        return _cond_primitive_boolean_impl(
-            builder=builder,
-            in_var_names=in_var_names,
-            out_var_names=out_var_names,
-            eqn=eqn,
-            eqn_state=eqn_state,
-        )
-    return _cond_primitive_multi_switch_impl(
-        builder=builder,
-        in_var_names=in_var_names,
-        out_var_names=out_var_names,
-        eqn=eqn,
-        eqn_state=eqn_state,
-    )
-
+        # XLA explicitly provides this [form of the primitive](https://openxla.org/xla/operation_semantics#conditional)
+        # JAX however, does not seem to use it at the moment and instead forwards it
+        #  to the integer implementation.
+        raise NotImplementedError("The boolean conditional primitive is not implemented.")
 
-def _cond_primitive_multi_switch_impl(
-    builder: translator.JaxprTranslationBuilder,
-    in_var_names: Sequence[str | None],
-    out_var_names: Sequence[str],
-    eqn: jax_core.JaxprEqn,
-    eqn_state: dace.SDFGState,
-) -> dace.SDFGState:
-    """
-    Implements the integer version of the conditional primitive.
-
-    For arguments see `ConditionTranslator`.
-
-    This [version](https://openxla.org/xla/operation_semantics#conditional) is
-    essentially a C switch statement without a default branch.
-    """
     # To make names in the SDFG unique we use the name of the equation state
     name_pattern = eqn_state.name
 
@@ -160,23 +134,3 @@ def _cond_primitive_multi_switch_impl(
 
     # We return it, because otherwise the builder will assume that `eqn_state` was used.
     return terminal_state
-
-
-def _cond_primitive_boolean_impl(
-    builder: translator.JaxprTranslationBuilder,  # noqa: ARG001 [unused-function-argument]
-    in_var_names: Sequence[str | None],  # noqa: ARG001 [unused-function-argument]
-    out_var_names: Sequence[str],  # noqa: ARG001 [unused-function-argument]
-    eqn: jax_core.JaxprEqn,  # noqa: ARG001 [unused-function-argument]
-    eqn_state: dace.SDFGState,  # noqa: ARG001 [unused-function-argument]
-) -> dace.SDFGState:
-    """
-    Implements the case the selector of the primitive is a bool.
-
-    XLA explicitly provides this
-    [form of the primitive](https://openxla.org/xla/operation_semantics#conditional)
-    JAX however, does not seem to use it and instead forwards it to the integer
-    implementation.
-    JaCe will not implement it and instead generate an error.
-    """
-    # NOTE: This is mostly to notice if JAX decided to implement that branch.
-    raise NotImplementedError("The boolean conditional primitive is not implemented.")

From 24d97fb47ee759fd601c29c9191ade23fbc0b01e Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 13 Sep 2024 15:23:18 +0200
Subject: [PATCH 443/458] Nobody needs that thest in this form.

---
 tests/test_subtranslator_helper.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_subtranslator_helper.py b/tests/test_subtranslator_helper.py
index a4c4ad9..52672b0 100644
--- a/tests/test_subtranslator_helper.py
+++ b/tests/test_subtranslator_helper.py
@@ -75,7 +75,7 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001
 def test_are_subtranslators_imported():
     """Tests if something is inside the list of subtranslators."""
     # Must be adapted if new primitives are implemented.
-    assert len(get_registered_primitive_translators()) == 37
+    assert len(get_registered_primitive_translators()) > 0
 
 
 @pytest.mark.usefixtures("no_builtin_translators")

From 411bd7bdbae121d897b6792bc0397e08044ba940 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 13 Sep 2024 15:39:17 +0200
Subject: [PATCH 444/458] Since the bug mention in DaCe issue |1595 was
 resolved we can enable it.

However, a similar issue (#1644) in DaCe is still open.
---
 tests/integration_tests/primitive_translators/conftest.py | 5 +----
 1 file changed, 1 insertion(+), 4 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/conftest.py b/tests/integration_tests/primitive_translators/conftest.py
index 9ff54e6..b914da2 100644
--- a/tests/integration_tests/primitive_translators/conftest.py
+++ b/tests/integration_tests/primitive_translators/conftest.py
@@ -20,10 +20,7 @@
     autouse=True,
     params=[
         optimization.NO_OPTIMIZATIONS,
-        pytest.param(
-            optimization.DEFAULT_OPTIMIZATIONS,
-            marks=pytest.mark.skip("Simplify bug 'https://github.com/spcl/dace/issues/1595'"),
-        ),
+        optimization.DEFAULT_OPTIMIZATIONS,
     ],
 )
 def _set_compile_options(request) -> Generator[None, None, None]:

From c8b7d86e5f7a6158a7e02768ec1ac6627a538817 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 24 Sep 2024 09:00:01 +0200
Subject: [PATCH 445/458] First batch of Enrique's suggestions, but still not
 done.

---
 .../translator/jaxpr_translator_builder.py    |  29 ++-
 .../mapped_operation_base_translator.py       |  50 ++---
 src/jace/translator/post_translation.py       |  51 +++++-
 src/jace/translator/primitive_translator.py   |   2 +-
 .../primitive_translators/__init__.py         |  21 ++-
 .../arithmetic_logical_translators.py         |  54 +++---
 .../broadcast_in_dim_translator.py            |  23 +--
 .../concatenate_translator.py                 |  99 ++++------
 .../primitive_translators/conditions.py       |  80 ++++----
 .../convert_element_type_translator.py        |  31 ++--
 .../primitive_translators/copy_translator.py  |  99 +++++-----
 .../gather_translator.py                      |   2 +-
 .../primitive_translators/iota_translator.py  |   2 +-
 .../primitive_translators/pjit_translator.py  |  74 ++------
 .../reshape_translator.py                     |  66 +++----
 .../select_n_translator.py                    |  22 +--
 .../primitive_translators/slicing.py          | 171 ++++++++----------
 .../squeeze_translator.py                     |   2 +-
 18 files changed, 401 insertions(+), 477 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 9b76407..c82c277 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -37,10 +37,10 @@ class JaxprTranslationBuilder:
     - it lacks the special `__return` variable,
     - the `arg_names` parameter is not set,
     - for all scalar values a `Scalar` SDFG variable is used, thus they cannot
-        be used for return values,
+        be used for returning values,
     - for every transient there is exactly one access node that writes to it,
-        except the name of the array starts with `__jace_mutable_`, which can
-        be written to multiple times.
+        except if the name of the array starts with `__jace_mutable_`, in which case
+        it can be written to multiple times.
 
     For these reasons the SDFG is not directly usable, and further manipulations
     have to be performed. Especially, DaCe's validation function will fail and
@@ -179,6 +179,24 @@ def append_new_state(
             self._ctx.terminal_state = new_state
         return new_state
 
+    def add_orphan_state(
+        self,
+        label: str,
+    ) -> dace.SDFGState:
+        """
+        Add a new orphan state to the SDFG.
+
+        The state is not connected to any other state, nor it is the new start state.
+        Except you know what you are doing you should not use this function and
+        instead use `self.append_new_state()`.
+
+        Args:
+            label: The name of the state.
+        """
+        if not self.is_allocated():
+            raise RuntimeError("Builder is not allocated.")
+        return self._ctx.sdfg.add_state(label=label, is_start_block=False)
+
     @property
     def arrays(self) -> Mapping[str, dace_data.Data]:
         """
@@ -712,7 +730,7 @@ def _propagate_memlets_in_new_states(
         ]
 
         while nodes_to_process:
-            currently_processing = nodes_to_process.pop(-1)
+            currently_processing = nodes_to_process.pop()
             if (
                 self.sdfg.out_degree(currently_processing) == 0
                 and currently_processing != new_terminal_state
@@ -790,7 +808,7 @@ def __init__(self, name: str | None, jaxpr: jax_core.ClosedJaxpr) -> None:
         self.terminal_state = self.start_state
         self.jaxpr = jaxpr
 
-    def validate(self) -> bool:
+    def validate(self) -> None:
         """
         Validate internal state of `self`.
 
@@ -829,4 +847,3 @@ def validate(self) -> bool:
                 self.sdfg,
                 None,
             )
-        return True
diff --git a/src/jace/translator/mapped_operation_base_translator.py b/src/jace/translator/mapped_operation_base_translator.py
index 9f0f402..17a5c35 100644
--- a/src/jace/translator/mapped_operation_base_translator.py
+++ b/src/jace/translator/mapped_operation_base_translator.py
@@ -37,11 +37,10 @@ class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
     ```
     where `__in*` are the connector names of the Tasklet and `__out` is the
     output connector. For problems such as this, the SDFG API provides the
-    `SDFGState.add_mapped_tasklet()` function, however, in most cases it can not
-    be directly used, for various reasons. Thus this class acts like a
-    convenience wrapper around it.
+    `SDFGState.add_mapped_tasklet()` function, however, because it is very low
+    level and very verbose to use, this class acts as a convenience wrapper around it.
 
-    To use this class a user has to overwrite the `write_tasklet_code()` function.
+    To use this class a user has to define the abstract `write_tasklet_code()` method.
     This function generates the entire code that should be put into the Tasklet,
     include the assignment to `__out`. If needed the translator will perform
     literal substitution on the returned code and broadcast the inputs to match
@@ -51,7 +50,7 @@ class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
     to generate custom input Memlets, such as adding an offset.
 
     Args:
-        primitive_name:     The name of the primitive `self` should bind to.
+        primitive_name: The name of the primitive `self` should bind to.
 
     Note:
         This class will always generate a mapped Tasklet, even if a scalar is handled.
@@ -78,7 +77,7 @@ def __call__(
         """
         Create the mapped Tasklet.
 
-        The function will create the map ranges and based on the shape of the
+        The function will create the map ranges based on the shape of the
         output array. It will then call `make_input_memlets()` to get the input
         Memlets. After that it calls `write_tasklet_code()` to get the Tasklet
         code and perform literal substitution by forwarding it to
@@ -88,7 +87,7 @@ def __call__(
             For a description of the arguments see `PrimitiveTranslatorCallable`.
         """
         assert len(out_var_names) == 1
-        if util.get_jax_var_shape(eqn.outvars[0]) != ():
+        if util.get_jax_var_shape(eqn.outvars[0]):
             tskl_ranges: list[tuple[str, str]] = [
                 (f"__i{dim}", f"0:{N}")
                 for dim, N in enumerate(util.get_jax_var_shape(eqn.outvars[0]))
@@ -130,20 +129,20 @@ def write_tasklet_code(
         eqn: jax_core.JaxprEqn,
     ) -> str:
         """
-        Return the (Python) code that should be put inside the Tasklet.
+        Return the Python code that should be put inside the Tasklet.
 
         This also includes the assignment statement, i.e. `__out`.
         However, the base will do literal substitution on the returned object.
 
         Args:
-            tskl_ranges:    List of pairs used as map parameter, first element
+            tskl_ranges: List of pairs used as map parameter, first element
                 is the name iteration index of the dimension, second is its range.
-            in_var_names:   The list of SDFG variables used as input, `None` if literal.
-            eqn:            The equation.
+            in_var_names: The list of SDFG variables used as input, `None` if literal.
+            eqn: The equation.
         """
         ...
 
-    def make_input_memlets(  # noqa: PLR6301  # Subclasses might need them.
+    def make_input_memlets(  # noqa: PLR6301 [no-self-use]  # Subclasses might need them.
         self,
         tskl_ranges: Sequence[tuple[str, str]],
         in_var_names: Sequence[str | None],
@@ -156,10 +155,10 @@ def make_input_memlets(  # noqa: PLR6301  # Subclasses might need them.
         that is used to connect it to the Map entry node.
 
         Args:
-            tskl_ranges:    List of pairs used as map parameter, first element
+            tskl_ranges: List of pairs used as map parameter, first element
                 is the name iteration index of the dimension, second is its range
-            in_var_names:   The list of SDFG variables used as input, `None` if literal.
-            eqn:            The equation object.
+            in_var_names: The list of SDFG variables used as input, `None` if literal.
+            eqn: The equation object.
         """
         out_shp = tuple(util.get_jax_var_shape(eqn.outvars[0]))  # Shape of the output
         out_rank = len(out_shp)
@@ -181,7 +180,11 @@ def make_input_memlets(  # noqa: PLR6301  # Subclasses might need them.
                 tskl_inputs[f"__in{i}"] = dace.Memlet.simple(in_var_name, "0")  # Scalar
                 continue
 
-            # We have to to broadcasting (combine yes and no together)
+            # We might have to do broadcasting.
+            #  We ensured that input and output have the same rank (JAX is doing that
+            #  for us). So we must do broadcasting, i.e. replicating that input
+            #  dimension, if its size is 1. We threat the case where the output has
+            #  size 1 in that dimension as broadcasting as well.
             dims_to_bcast: Sequence[int] = [dim for dim in range(out_rank) if inp_shp[dim] == 1]
             tskl_inputs[f"__in{i}"] = dace.Memlet.simple(
                 in_var_name,
@@ -192,23 +195,22 @@ def make_input_memlets(  # noqa: PLR6301  # Subclasses might need them.
             )
         return tskl_inputs
 
-    def literal_substitution(  # noqa: PLR6301  # Subclasses might need it.
+    def literal_substitution(  # noqa: PLR6301 [no-self-use]  # Subclasses might need it.
         self, tskl_code: str, in_var_names: Sequence[str | None], eqn: jax_core.JaxprEqn
     ) -> str:
         """
         Perform literal substitution on the proto Tasklet code `tskl_code`.
 
         Args:
-            tskl_code:      The proto Tasklet code with literal.
-            in_var_names:   The list of SDFG variables used as input.
-            eqn:            The equation.
+            tskl_code: The proto Tasklet code with literal.
+            in_var_names: The list of SDFG variables used as input.
+            eqn: The equation.
 
         Note:
             It is allowed but not recommended to override this function.
         """
         for i, in_var_name in enumerate(in_var_names):
-            if in_var_name is not None:
-                continue
-            t_val = util.get_jax_literal_value(eqn.invars[i])
-            tskl_code = tskl_code.replace(f"__in{i}", str(t_val))
+            if in_var_name is None:
+                t_val = util.get_jax_literal_value(eqn.invars[i])
+                tskl_code = tskl_code.replace(f"__in{i}", str(t_val))
         return tskl_code
diff --git a/src/jace/translator/post_translation.py b/src/jace/translator/post_translation.py
index 9831f35..6b27b4f 100644
--- a/src/jace/translator/post_translation.py
+++ b/src/jace/translator/post_translation.py
@@ -20,6 +20,7 @@
 
 if TYPE_CHECKING:
     from dace.sdfg import nodes as dace_nodes
+    from jax import core as jax_core
 
     from jace import translator
 
@@ -271,7 +272,8 @@ def add_nested_sdfg(
         will first pass it to `finalize_translation_context()` and operates on the
         return values. This means that `child_ctx` will be modified in place, and
         a copy will be added to `parent_ctx`.
-        It is highly recommended that `state` is empty.
+        It is highly recommended that `state` is empty, this makes subsequent
+        inlining of the nested SDFG simpler.
     """
     if child_ctx.sdfg.free_symbols:
         raise NotImplementedError("Symbol Mapping is not implemented.")
@@ -298,7 +300,6 @@ def add_nested_sdfg(
     nested_sdfg: dace_nodes.NestedSDFG = state.add_nested_sdfg(
         sdfg=final_child_ctx.sdfg,
         parent=parent_ctx.sdfg,
-        # Bug in DaCe must be a set.
         inputs=set(final_child_ctx.input_names),
         outputs=set(final_child_ctx.output_names),
     )
@@ -326,3 +327,49 @@ def add_nested_sdfg(
         )
 
     return nested_sdfg
+
+
+def promote_literals_to_constants(
+    builder: translator.JaxprTranslationBuilder,
+    var_names: Sequence[str | None],
+    jax_vars: Sequence[jax_core.Atom],
+    name_pattern: str,
+) -> list[str]:
+    """
+    Promotes all literals in `var_names` to DaCe constants and add them to the SDFG.
+
+    The function assumes that `var_names` are the SDFG variables equivalents of
+    `jax_vars`, as by convention `None` indicates a literal. The function will create
+    a constant for each literal and return `var_names` cleared of all literals.
+    For naming the variables the function will use `name_pattern`.
+
+    Args:
+        builder: The builder that is used for translation.
+        var_names: Names of the SDFG variables, `None` indicates a literal.
+        jax_vars: The JAX variables, in the same order than `var_names`.
+        name_pattern: A pattern to generate a unique name for the variables.
+
+    Todo:
+        Is a constant the right idea or should we generate a symbol?
+    """
+    promoted_var_names: list[str] = []
+    for i, var_name in enumerate(var_names):
+        if var_name is None:
+            promoted_var_name = f"__const_{name_pattern}_literal_promotion_{i}"
+            jax_var = jax_vars[i]
+            promoted_jace_var = util.JaCeVar.from_atom(
+                jax_var=jax_var,
+                name=promoted_var_name,
+            )
+            builder.add_array(promoted_jace_var)
+            builder.sdfg.add_constant(
+                promoted_var_name,
+                util.get_jax_literal_value(jax_var),
+                builder.arrays[promoted_var_name],
+            )
+
+        else:
+            # Already an SDFG variable, so nothing to do.
+            promoted_var_name = var_name
+        promoted_var_names.append(promoted_var_name)
+    return promoted_var_names
diff --git a/src/jace/translator/primitive_translator.py b/src/jace/translator/primitive_translator.py
index 2000731..71aa067 100644
--- a/src/jace/translator/primitive_translator.py
+++ b/src/jace/translator/primitive_translator.py
@@ -77,7 +77,7 @@ def __call__(
         Args:
             builder: The builder object of the translation.
             in_var_names: List of the names of the arrays created inside the
-                SDFG for the inpts or `None` in case of a literal.
+                SDFG for the inputs or `None` in case of a literal.
             out_var_names: List of the names of the arrays created inside the
                 SDFG for the outputs.
             eqn: The JAX primitive that should be translated.
diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 9e2fec0..757743e 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -13,33 +13,34 @@
     LogicalOperationTranslator,
 )
 from .broadcast_in_dim_translator import BroadcastInDimTranslator
-from .concatenate_translator import ConcatenateTranslator
+from .concatenate_translator import concatenate_translator
 from .conditions import condition_translator
 from .convert_element_type_translator import ConvertElementTypeTranslator
-from .copy_translator import CopyTranslator, DevicePutTranslator
+from .copy_translator import copy_translator, device_put_translator
 from .gather_translator import GatherTranslator
 from .iota_translator import IotaTranslator
-from .pjit_translator import PJITTranslator
-from .reshape_translator import ReshapeTranslator
+from .pjit_translator import pjit_translator
+from .reshape_translator import reshape_translator
 from .select_n_translator import SelectNTranslator
-from .slicing import SlicingTranslator
+from .slicing import SlicingTranslator, dynamic_slicing_translator
 from .squeeze_translator import SqueezeTranslator
 
 
 __all__ = [
     "ArithmeticOperationTranslator",
     "BroadcastInDimTranslator",
-    "ConcatenateTranslator",
     "ConvertElementTypeTranslator",
-    "CopyTranslator",
-    "DevicePutTranslator",
     "GatherTranslator",
     "IotaTranslator",
     "LogicalOperationTranslator",
-    "PJITTranslator",
-    "ReshapeTranslator",
     "SelectNTranslator",
     "SlicingTranslator",
     "SqueezeTranslator",
+    "concatenate_translator",
     "condition_translator",
+    "copy_translator",
+    "device_put_translator",
+    "dynamic_slicing_translator",
+    "pjit_translator",
+    "reshape_translator",
 ]
diff --git a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
index c9c0a35..667e1ac 100644
--- a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
+++ b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
@@ -6,7 +6,7 @@
 # SPDX-License-Identifier: BSD-3-Clause
 
 """
-Module containing all translators related to arithmetic and logical operations.
+Primitive translators related to all arithmetic, logical and comparison operations.
 
 Todo:
     - Hijack Jax to inject a proper modulo operation.
@@ -31,21 +31,14 @@
 
 class ArithmeticOperationTranslator(mapped_base.MappedOperationTranslatorBase):
     """
-    Translator for all arithmetic operations.
-
-    The class is derived from `MappedOperationTranslatorBase` and overwrites the
-    `write_tasklet_code()` function for the Tasklet code.
+    Translator for all arithmetic operations and comparisons.
 
     Args:
-        prim_name:      The name of the primitive that should be handled.
-        tskl_tmpl:      Template used for generating the Tasklet code.
+        prim_name: The name of the primitive that should be handled.
+        tskl_tmpl: Template used for generating the Tasklet code.
 
     Note:
-        - It does not implement the logical operations, they are implemented by
-            the `LogicalOperationTranslator` class.
-        - Despite its name this class also provides the comparison operators.
-        - It does not implement `mod` nor `fmod` as they are translated to some
-            nested `pjit` implementation by Jax for unknown reasons.
+        Logical and bitwise operations are implemented by `LogicalOperationTranslator`.
     """
 
     def __init__(self, prim_name: str, tskl_tmpl: str) -> None:
@@ -60,10 +53,7 @@ def write_tasklet_code(
         eqn: jax_core.JaxprEqn,
     ) -> str:
         """Returns the code for the Tasklet, with all parameters replaced."""
-        tskl_code = self._tskl_tmpl
-        if len(eqn.params) != 0:
-            tskl_code = tskl_code.format(**eqn.params)
-        return tskl_code
+        return self._tskl_tmpl.format(**eqn.params)
 
 
 class LogicalOperationTranslator(mapped_base.MappedOperationTranslatorBase):
@@ -82,15 +72,15 @@ class LogicalOperationTranslator(mapped_base.MappedOperationTranslatorBase):
     as `~true` in C++ is essentially `~1`, which is again `true`!
     Thus the `not` primitive must be handled separately.
 
-    The solution to the problem is, to introduce two templates, one used for the
+    The solution to the problem is to introduce two templates, one used for the
     bool context and one used in the integer context. This works because depending
     if the `logical_*()` or `bitwise_*()` functions are used the input is either
     of type bool or an integer.
 
     Args:
-        prim_name:      The name of the primitive that should be handled.
-        int_tmpl:       The template used for the integer case.
-        bool_tmpl:      The template used for the bool case.
+        prim_name: The name of the primitive that should be handled.
+        int_tmpl: The template used for the integer case.
+        bool_tmpl: The template used for the bool case.
 
     Note:
         Since it does not make sense to single out `not` and keep the other
@@ -110,12 +100,16 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        if all(util.get_jax_var_dtype(invar) is dace.bool_ for invar in eqn.invars):
-            return self._bool_tmpl
-        return self._int_tmpl
+        return (
+            self._bool_tmpl
+            if all(util.get_jax_var_dtype(invar) is dace.bool_ for invar in eqn.invars)
+            else self._int_tmpl
+        )
 
 
-# Contains the code templates for all supported arithmetic operations.
+# Maps the name of an arithmetic primitives to the code template that is used to
+#  generate the body of the mapped tasklet. These are used to instantiate the
+#  `ArithmeticOperationTranslator` objects.
 # fmt: off
 _ARITMETIC_OPERATION_TEMPLATES: Final[dict[str, str]] = {
     # Unary operations
@@ -177,24 +171,24 @@ def write_tasklet_code(
     "nextafter": "__out = nextafter((__in0), (__in1))",
 
     # Ternary operations
-    "clamp": "__out = (__in0 if __in1 < __in0 else (__in1 if __in1 < __in2 else __in2))"
+    "clamp": "__out = ((__in0) if (__in1) < (__in0) else ((__in1) if (__in1) < (__in2) else (__in2)))"
 }
 
 
-# Contains the code templates for all logical operations.
-#  The first one is for the integer case, the second for the bool case.
+# Maps the name of a logical primitive to the two code templates (first the integer
+#  case and second the boolean case) used to create the body of the mapped tasklet.
+#  They are used to instantiate the `LogicalOperationTranslator` translators.
 _LOGICAL_OPERATION_TEMPLATES: Final[dict[str, tuple[str, str]]] = {
     "or": ("__out = (__in0) | (__in1)",  "__out = (__in0) or (__in1)"),
     "not": ("__out = ~(__in0)", "__out = not (__in0)"),
     "and": ("__out = (__in0) & (__in1)", "__out = (__in0) and (__in1)"),
     "xor": ("__out = (__in0) ^ (__in1)", "__out = (__in0) != (__in1)"),
 }
+# fmt: on
 
 
-# Create the arithmetic translators
+# Instantiate the arithmetic and logical translators from the templates.
 for pname, ptmpl in _ARITMETIC_OPERATION_TEMPLATES.items():
     translator.register_primitive_translator(ArithmeticOperationTranslator(pname, ptmpl))
-
-# Create the logical translators.
 for pname, (itmpl, btmpl) in _LOGICAL_OPERATION_TEMPLATES.items():
     translator.register_primitive_translator(LogicalOperationTranslator(pname, itmpl, btmpl))
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
index 7f24160..964a2f6 100644
--- a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""This implements the `broadcast_in_dim` primitive."""
+"""Primitive translator for broadcasting operations."""
 
 from __future__ import annotations
 
@@ -28,9 +28,8 @@ class BroadcastInDimTranslator(mapped_base.MappedOperationTranslatorBase):
     """
     Implements the `broadcast_in_dim` primitive.
 
-    The primitive is implemented through the `MappedOperationTranslatorBase` base.
-    Essentially it creates a copy, but also creates special Memlets that replicate
-    the content of the input.
+    Essentially creates a copy tasklet, however, the memlets are made in such a
+    way that some dimensions are replicated.
     """
 
     def __init__(self) -> None:
@@ -52,16 +51,14 @@ def make_input_memlets(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> dict[str, dace.Memlet]:
-        if in_var_names[0] is None:
+        if in_var_names[0] is None:  # Broadcast a literal (scalar) to a matrix.
             return {}
-        return {
-            "__in0": dace.Memlet.simple(
-                in_var_names[0],
-                ", ".join(tskl_ranges[bdim][0] for bdim in eqn.params["broadcast_dimensions"])
-                if eqn.params["broadcast_dimensions"]
-                else "0",
-            )
-        }
+        subset_str = (
+            ", ".join(tskl_ranges[bdim][0] for bdim in eqn.params["broadcast_dimensions"])
+            if eqn.params["broadcast_dimensions"]
+            else "0",
+        )
+        return {"__in0": dace.Memlet.simple(in_var_names[0], subset_str)}
 
 
 translator.register_primitive_translator(BroadcastInDimTranslator())
diff --git a/src/jace/translator/primitive_translators/concatenate_translator.py b/src/jace/translator/primitive_translators/concatenate_translator.py
index e8bd144..1b5f679 100644
--- a/src/jace/translator/primitive_translators/concatenate_translator.py
+++ b/src/jace/translator/primitive_translators/concatenate_translator.py
@@ -5,14 +5,13 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements the concatenation primitive."""
+"""Primitive translator for concatenation operations."""
 
 from __future__ import annotations
 
 from typing import TYPE_CHECKING
 
 import dace
-from typing_extensions import override
 
 from jace import translator, util
 
@@ -23,65 +22,45 @@
     from jax import core as jax_core
 
 
-class ConcatenateTranslator(translator.PrimitiveTranslator):
+@translator.register_primitive_translator()
+@translator.make_primitive_translator("concatenate")
+def concatenate_translator(
+    builder: translator.JaxprTranslationBuilder,  # noqa: ARG001  # Required by the interface.
+    in_var_names: Sequence[str | None],
+    out_var_names: Sequence[str],
+    eqn: jax_core.JaxprEqn,
+    eqn_state: dace.SDFGState,
+) -> None:
     """
     Implements the `concatenate` primitive.
 
-    It is implemented by a series of map that writes to the same access node.
-    It is probably the largest stretch of "written once" in the entire core.
+    Each source array is copied by its own map, but all maps write to the same
+    access node.
     """
-
-    @property
-    def primitive(self) -> str:  # noqa: D102  # No docstring needed.
-        return "concatenate"
-
-    @override
-    def __call__(
-        self,
-        builder: translator.JaxprTranslationBuilder,
-        in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
-        eqn: jax_core.JaxprEqn,
-        eqn_state: dace.SDFGState,
-    ) -> None:
-        if any(in_var_name is None for in_var_name in in_var_names):
-            raise NotImplementedError("Concatenate: No literal inputs supported.")
-
-        # Dimension along we concatenate.
-        cat_dim = eqn.params["dimension"]
-
-        # Offset counter for write back.
-        already_copied = 0
-
-        # This is the access node we use for the output
-        #  Is inside a dict for input to `add_mapped_tasklet()`.
-        output_nodes = {out_var_names[0]: eqn_state.add_write(out_var_names[0])}
-
-        # Now going over each input and copying the input in the correct location
-        #  of the output array.
-        for i, in_var_name in enumerate(in_var_names):
-            input_shape = util.get_jax_var_shape(eqn.invars[i])
-
-            tskl_range = [(f"__dim{d}", f"0:{dim_size}") for d, dim_size in enumerate(input_shape)]
-            tskl_input_access = [it_var for it_var, _ in tskl_range]
-
-            tskl_output_access = tskl_input_access.copy()
-            tskl_output_access[cat_dim] = f"{tskl_output_access[cat_dim]} + {already_copied}"
-
-            eqn_state.add_mapped_tasklet(
-                f"_concatenate_{out_var_names[0]}_{in_var_name}",
-                map_ranges=tskl_range,
-                inputs={"__in": dace.Memlet.simple(in_var_name, ", ".join(tskl_input_access))},
-                code="__out = __in",
-                outputs={
-                    "__out": dace.Memlet.simple(out_var_names[0], ",".join(tskl_output_access))
-                },
-                output_nodes=output_nodes,
-                external_edges=True,
-            )
-
-            # Update the counter that we have copied
-            already_copied += input_shape[cat_dim]
-
-
-_ = translator.register_primitive_translator(ConcatenateTranslator())
+    if any(in_var_name is None for in_var_name in in_var_names):
+        raise NotImplementedError("Concatenate: No literal inputs supported.")
+
+    # Access node that is used by all maps.
+    output_nodes = {out_var_names[0]: eqn_state.add_write(out_var_names[0])}
+
+    cat_dim = eqn.params["dimension"]
+    cat_offset = 0
+    for i, in_var_name in enumerate(in_var_names):
+        input_shape = util.get_jax_var_shape(eqn.invars[i])
+
+        tskl_range = [(f"__dim{d}", f"0:{dim_size}") for d, dim_size in enumerate(input_shape)]
+        tskl_input_access = [it_var for it_var, _ in tskl_range]
+
+        tskl_output_access = tskl_input_access.copy()
+        tskl_output_access[cat_dim] = f"{tskl_output_access[cat_dim]} + {cat_offset}"
+
+        eqn_state.add_mapped_tasklet(
+            f"_concatenate_{out_var_names[0]}_{in_var_name}",
+            map_ranges=tskl_range,
+            inputs={"__in": dace.Memlet.simple(in_var_name, ", ".join(tskl_input_access))},
+            code="__out = __in",
+            outputs={"__out": dace.Memlet.simple(out_var_names[0], ",".join(tskl_output_access))},
+            output_nodes=output_nodes,
+            external_edges=True,
+        )
+        cat_offset += input_shape[cat_dim]
diff --git a/src/jace/translator/primitive_translators/conditions.py b/src/jace/translator/primitive_translators/conditions.py
index 38ba2c2..4f7363d 100644
--- a/src/jace/translator/primitive_translators/conditions.py
+++ b/src/jace/translator/primitive_translators/conditions.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements all conditions that are supported in JAX."""
+"""Primitive translator for condition operations, i.e. scalar `if` and `switch`."""
 
 from __future__ import annotations
 
@@ -16,7 +16,6 @@
 
 from jace import translator, util
 from jace.translator import post_translation as ptranslation
-from jace.translator.primitive_translators import pjit_translator as pjit
 
 
 if TYPE_CHECKING:
@@ -33,10 +32,12 @@ def condition_translator(
     eqn_state: dace.SDFGState,
 ) -> dace.SDFGState:
     """
-    Implements the translation of the `cond` primitive, i.e. a scalar if.
+    Implements the translation of scalar conditional branches.
 
-    XLA, JAX' backend, supports two versions, one in which the selector, i.e. the
-    variable indicating which branch should be executed is an integer or a boolean.
+    This translator handles both `jax.lax.cond()` and `jax.lax.switch()` cases.
+    The sub expression of the branches are each translated into a separate nested
+    SDFG, each located in their own state. These state are then connected to the
+    joint state which is returned.
 
     Args:
         builder: The builder object of the translation.
@@ -47,68 +48,62 @@ def condition_translator(
         eqn: The equation that should be translated.
         eqn_state: State into which the nested SDFG should be constructed.
 
-    Returns:
-        Because of the nature of this primitive, the translator has to construct
-        new states and will return the new SDFG state that serves as terminal state.
-
-    Note:
-        This function essentially implements a C `switch` statement, however, there
-        is no default branch.
+    Notes:
+        According to the JAX documentation (https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.switch.html)
+        the selector is clamped. But according to XLA (https://openxla.org/xla/operation_semantics#conditional)
+        an out of range selector uses the last branch. JaCe conforms to JAX semantic.
+        After this function the terminal state of the `builder` is unspecific.
     """
     if util.get_jax_var_dtype(eqn.invars[0]) is dace.bool_:
-        # XLA explicitly provides this [form of the primitive](https://openxla.org/xla/operation_semantics#conditional)
-        # JAX however, does not seem to use it at the moment and instead forwards it
-        #  to the integer implementation.
+        # XLA explicitly provides a binary form of the primitive
+        #  (https://openxla.org/xla/operation_semantics#conditional) JAX however,
+        #  does not seem to use it at the moment and instead forwards it to the
+        #  integer implementation.
         raise NotImplementedError("The boolean conditional primitive is not implemented.")
 
-    # To make names in the SDFG unique we use the name of the equation state
+    # To make names in the (nested) SDFG unique we use the name of the equation state
     name_pattern = eqn_state.name
 
-    # Promote all inputs to the branches to variables, this are all except the first
-    #  which is the selection variable.
-    branch_input_variable_names: list[str] = pjit._promote_literals_to_constants(
+    # To avoid special cases promote all symbols to constants.
+    branch_input_variable_names: list[str] = ptranslation.promote_literals_to_constants(
         builder=builder,
         var_names=in_var_names[1:],
         jax_vars=eqn.invars[1:],
         name_pattern=name_pattern,
     )
 
+    # expressions of the branches.
+    branches: list[jax_core.ClosedJaxpr] = eqn.params["branches"]
+
+    # Make sure that the selection variable is a DaCe symbol.
     if in_var_names[0] is None:
-        # The selection variable is a literal, so we will now pretend it is a symbol.
-        #  This also means that we do not need a state transition to promote the
-        #  variable to a symbol.
-        selection_symbol = str(util.get_jax_literal_value(eqn.invars[0]))
+        literal_selection_value = str(util.get_jax_literal_value(eqn.invars[0]))
+        selection_symbol = f"max({len(branches)}, min(0, {literal_selection_value}))"
         selection_state = eqn_state
 
     else:
-        # The selection variable is an input.
-        #  For the implementation of the condition we need to promote the selection
-        #  variable to a symbol, for which we need an interstate edge.
-        #  As a side effect it will update the terminal state.
+        # Promotion of a scalar to a symbol through a state transition.
         selection_variable_name = in_var_names[0]
         selection_symbol = f"{selection_variable_name}_symb"
-
         selection_state = builder.append_new_state(
             label=f"{name_pattern}_fork",
-            assignments={selection_symbol: selection_variable_name},
+            assignments={
+                selection_symbol: f"max({len(branches)}, min(0, {selection_variable_name}[0]))"
+            },
             prev_state=eqn_state,
         )
 
-    # Now iterate through all branches, translate them and integrate them
-    #  for each branch we will generate a dedicated state.
     branch_states: list[dace.SDFGState] = []
-    for i, branch_jaxpr in enumerate(eqn.params["branches"]):
+    for i, branch_jaxpr in enumerate(branches):
         branch_pattern = f"{name_pattern}_{{}}_branch_{i}"
         branch_ctx = builder.translate_jaxpr(jaxpr=branch_jaxpr, name=branch_pattern.format("sdfg"))
 
-        # This will update the terminal state only the first time.
+        # This will update the terminal state only for the first branch
         branch_state = builder.append_new_state(
             label=branch_pattern.format("state"),
             condition=f"{selection_symbol} == {i}",
             prev_state=selection_state,
         )
-
-        # Integrating it.
         ptranslation.add_nested_sdfg(
             state=branch_state,
             child_ctx=branch_ctx,
@@ -118,19 +113,12 @@ def condition_translator(
         )
         branch_states.append(branch_state)
 
-    # Now we have to generate a join state that will serve as new terminal state.
-    #  We append it to the first branch state, which is the current terminal state.
-    assert builder._terminal_sdfg_state is branch_states[0]
-    terminal_state = builder.append_new_state(
-        label=f"{name_pattern}_join",
-        prev_state=branch_states[0],
-    )
-    for branch_state in branch_states[1:]:
+    join_state = builder.add_orphan_state(f"{name_pattern}__join_state")
+    for branch_state in branch_states:
         builder.sdfg.add_edge(
             branch_state,
-            terminal_state,
+            join_state,
             dace.sdfg.InterstateEdge(),
         )
 
-    # We return it, because otherwise the builder will assume that `eqn_state` was used.
-    return terminal_state
+    return join_state
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index ee05a2a..118f4e3 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements the translator for the `convert_element_type` primitive."""
+"""Primitive translator for type casting operations."""
 
 from __future__ import annotations
 
@@ -28,14 +28,12 @@ class ConvertElementTypeTranslator(mapped_base.MappedOperationTranslatorBase):
     """
     Implements the `convert_element_type` primitive.
 
-    The primitive will expand to a "copy Map", however, the Tasklet will not
-    simply copy the input to the output, but also perform type conversion.
-    However, in cases where the input type is the same as the output type,
-    the Tasklet will just be a copy Tasklet, that can then be removed by DaCe.
+    The primitive is implemented as a copy operation. However, the tasklet body
+    will perform the type conversion operation.
 
     Note:
-        This translator ignores the `new_dtype` and `weak_type` parameters of
-        the equation and only performs the casting based on the type of the fields.
+        The type to cast to id inferred from the output variable and the `new_dtype`
+        parameter of the equation is ignored.
     """
 
     def __init__(self) -> None:
@@ -56,20 +54,19 @@ def write_tasklet_code(
         out_dtype = util.get_jax_var_dtype(eqn.outvars[0]).type
         out_dtype_s: str = out_dtype.__name__
 
-        # This is the base of the template that we use for conversion. You should notice
-        #  that the Tasklet `__out = __in0` will fail, see commit `f5aabc3` of the
-        #  prototype. Thus we have to do it in this way.
-        conv_code = "__in0"
-
         if in_dtype == out_dtype:
-            # For some reason Jax sometimes adds conversions where no are needed. In
-            #  these cases we explicitly create a copy Tasklet, which is trivial and can
-            #  be removed by DaCe.
+            # JAX sometimes adds conversions which are not needed. In these cases
+            #  we perform a copy.
             # TODO(phimuell): Create a Memlet instead.
-            return f"__out = {conv_code}"
+            return "__out = __in0"
+
+        # A simple copy tasklet `__out = __in0` and rely on the implicit type
+        #  conversion of the C++ compiler, is not enough. Due to a bug in DaCe
+        #  (see https://github.com/spcl/dace/issues/1665) this conversion might be
+        #  lost, thus we have to perform the conversion explicitly in the tasklet.
+        conv_code = "__in0"
 
         if in_dtype_s.startswith("bool"):
-            # Interestingly `__out = int(__in0)` will not work.
             conv_code = f"(1 if {conv_code} else 0)"
         if out_dtype_s.startswith("bool"):
             conv_code = f"dace.bool_({conv_code})"
diff --git a/src/jace/translator/primitive_translators/copy_translator.py b/src/jace/translator/primitive_translators/copy_translator.py
index 6de5ab9..5cc0d3c 100644
--- a/src/jace/translator/primitive_translators/copy_translator.py
+++ b/src/jace/translator/primitive_translators/copy_translator.py
@@ -5,14 +5,13 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements the translator related to data movement."""
+"""Primitive translators related to data movement operations."""
 
 from __future__ import annotations
 
 from typing import TYPE_CHECKING
 
 import dace
-from typing_extensions import override
 
 from jace import translator
 
@@ -23,70 +22,56 @@
     from jax import core as jax_core
 
 
-class CopyTranslator(translator.PrimitiveTranslator):
+@translator.register_primitive_translator()
+@translator.make_primitive_translator("copy")
+def copy_translator(
+    builder: translator.JaxprTranslationBuilder,
+    in_var_names: Sequence[str | None],
+    out_var_names: Sequence[str],
+    eqn: jax_core.JaxprEqn,  # noqa: ARG001  # Required by the interface.
+    eqn_state: dace.SDFGState,
+) -> None:
     """
     Implements the `copy` primitive.
 
-    The translator is implemented by using a Memlet.
+    Todo:
+        Investigate if operation should expand to a map.
     """
-
-    @property
-    def primitive(self) -> str:  # noqa: D102  # No docstring needed.
-        return "copy"
-
-    def __call__(  # noqa: D102  # No docstring
-        self,
-        builder: translator.JaxprTranslationBuilder,
-        in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
-        eqn: jax_core.JaxprEqn,  # noqa: ARG002
-        eqn_state: dace.SDFGState,
-    ) -> None:
-        eqn_state.add_nedge(
-            eqn_state.add_read(in_var_names[0]),
-            eqn_state.add_write(out_var_names[0]),
-            dace.Memlet.from_array(
-                in_var_names[0],
-                builder.arrays[in_var_names[0]],  # type: ignore[index]  # Guaranteed to be a string
-            ),
-        )
-
-
-class DevicePutTranslator(CopyTranslator):
+    eqn_state.add_nedge(
+        eqn_state.add_read(in_var_names[0]),
+        eqn_state.add_write(out_var_names[0]),
+        dace.Memlet.from_array(
+            in_var_names[0],
+            builder.arrays[in_var_names[0]],  # type: ignore[index]  # Guaranteed to be a string
+        ),
+    )
+
+
+@translator.register_primitive_translator()
+@translator.make_primitive_translator("device_put")
+def device_put_translator(
+    builder: translator.JaxprTranslationBuilder,
+    in_var_names: Sequence[str | None],
+    out_var_names: Sequence[str],
+    eqn: jax_core.JaxprEqn,
+    eqn_state: dace.SDFGState,
+) -> None:
     """
     Implements the `device_put` primitive.
 
-    In Jax this primitive is used to copy data between the host and the device,
+    In JAX this primitive is used to copy data between the host and the device,
     in DaCe Memlets can do this. However, because of the way JaCe operates, at
     least in the beginning a computation is either fully on the host or on the
     device this copy will essentially perform a copying.
     """
-
-    @property
-    def primitive(self) -> str:  # noqa: D102  # No docstring
-        return "device_put"
-
-    @override
-    def __call__(  # No docstring
-        self,
-        builder: translator.JaxprTranslationBuilder,
-        in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
-        eqn: jax_core.JaxprEqn,
-        eqn_state: dace.SDFGState,
-    ) -> None:
-        if not (eqn.params["device"] is None and eqn.params["src"] is None):
-            raise NotImplementedError(
-                f"Can only copy on the host, but not from {eqn.params['src']} to {eqn.params['device']}."
-            )
-        return super().__call__(
-            builder=builder,
-            in_var_names=in_var_names,
-            out_var_names=out_var_names,
-            eqn=eqn,
-            eqn_state=eqn_state,
+    if not (eqn.params["device"] is None and eqn.params["src"] is None):
+        raise NotImplementedError(
+            f"Can only copy on the host, but not from {eqn.params['src']} to {eqn.params['device']}."
         )
-
-
-_ = translator.register_primitive_translator(CopyTranslator())
-_ = translator.register_primitive_translator(DevicePutTranslator())
+    copy_translator(
+        builder=builder,
+        in_var_names=in_var_names,
+        out_var_names=out_var_names,
+        eqn=eqn,
+        eqn_state=eqn_state,
+    )
diff --git a/src/jace/translator/primitive_translators/gather_translator.py b/src/jace/translator/primitive_translators/gather_translator.py
index 343ee15..4b58e70 100644
--- a/src/jace/translator/primitive_translators/gather_translator.py
+++ b/src/jace/translator/primitive_translators/gather_translator.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements the translator for the `gather` primitive."""
+"""Primitive translator for indexing operations."""
 
 from __future__ import annotations
 
diff --git a/src/jace/translator/primitive_translators/iota_translator.py b/src/jace/translator/primitive_translators/iota_translator.py
index ce0d99f..035caf7 100644
--- a/src/jace/translator/primitive_translators/iota_translator.py
+++ b/src/jace/translator/primitive_translators/iota_translator.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""This implements the `iota` primitive."""
+"""Primitive translator for the `iota` primitive."""
 
 from __future__ import annotations
 
diff --git a/src/jace/translator/primitive_translators/pjit_translator.py b/src/jace/translator/primitive_translators/pjit_translator.py
index 59bfd7e..b3b9d97 100644
--- a/src/jace/translator/primitive_translators/pjit_translator.py
+++ b/src/jace/translator/primitive_translators/pjit_translator.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements the `pjit` translator, i.e. nested Jaxpr expressions."""
+"""Primitive translator related handling nested Jaxpr operations."""
 
 from __future__ import annotations
 
@@ -15,7 +15,7 @@
 
 from jax._src import sharding_impls as jax_sharding  # noqa: PLC2701 [import-private-name]
 
-from jace import translator, util
+from jace import translator
 from jace.translator import post_translation as ptranslation
 
 
@@ -24,55 +24,9 @@
     from jax._src import core as jax_core
 
 
-def _promote_literals_to_constants(
-    builder: translator.JaxprTranslationBuilder,
-    var_names: Sequence[str | None],
-    jax_vars: Sequence[jax_core.Atom],
-    name_pattern: str,
-) -> list[str]:
-    """
-    Promotes all literals in `var_names` to DaCe constants and add them to the SDFG.
-
-    The function assumes that `var_names` are the SDFG variables equivalents of
-    `jax_vars`, as by convention `None` indicates a literal. The function will create
-    a constant for each literal and return `var_names` cleared of all literals.
-    For naming the variables the function will use `name_pattern`.
-
-    Args:
-        builder: The builder that is used for translation.
-        var_names: Names of the SDFG variables, `None` indicates a literal.
-        jax_vars: The JAX variables, in the same order than `var_names`.
-        name_pattern: A pattern to generate a unique name for the variables.
-
-    Todo:
-        Is a constant the right idea or should we generate a symbol?
-    """
-    promoted_var_names: list[str] = []
-    for i, var_name in enumerate(var_names):
-        if var_name is None:
-            promoted_var_name = f"__const_{name_pattern}_literal_promotion_{i}"
-            jax_var = jax_vars[i]
-            promoted_jace_var = util.JaCeVar.from_atom(
-                jax_var=jax_var,
-                name=promoted_var_name,
-            )
-            builder.add_array(promoted_jace_var)
-            builder.sdfg.add_constant(
-                promoted_var_name,
-                util.get_jax_literal_value(jax_var),
-                builder.arrays[promoted_var_name],
-            )
-
-        else:
-            # Already an SDFG variable, so nothing to do.
-            promoted_var_name = var_name
-        promoted_var_names.append(promoted_var_name)
-    return promoted_var_names
-
-
 @translator.register_primitive_translator()
 @translator.make_primitive_translator("pjit")
-def PJITTranslator(  # noqa: N802 [invalid-function-name]
+def pjit_translator(
     builder: translator.JaxprTranslationBuilder,
     in_var_names: Sequence[str | None],
     out_var_names: Sequence[str],
@@ -82,13 +36,9 @@ def PJITTranslator(  # noqa: N802 [invalid-function-name]
     """
     Implements the `pjit` translator that handles nested Jaxpr.
 
-    `pjit` primitives in JAX represents nested calls, for example the body of a scan
-    is inside a nested Jaxpr. However, `pjit` is used to indicate that a computation
-    should be done on the device or on sharded memory.
-
-    However, due to the current state and working of JaCe, this aspect is essentially
-    ignored and the computation is always inlined.
-
+    `pjit` primitives in JAX represents nested calls, for example the branches of a
+    conditional are nested Jaxpr. However, in JAX `pjit` is also used to indicate that
+    a computation should be done on the device or on sharded memory.
     In case an input is a literal the translator will create a constant for it.
 
     Args:
@@ -99,6 +49,10 @@ def PJITTranslator(  # noqa: N802 [invalid-function-name]
             inside the parent SDFG.
         eqn: The equation that contains the `pjit` primitive.
         eqn_state: State into which the nested SDFG should be constructed.
+
+    Note:
+        The translator ignores the `donated_invars`, the `keep_unused` and the
+        `inline` parameter and let's DaCe handle it.
     """
     params: dict[str, Any] = eqn.params
     nested_jaxpr: jax_core.ClosedJaxpr = params["jaxpr"]
@@ -116,22 +70,18 @@ def PJITTranslator(  # noqa: N802 [invalid-function-name]
     # TODO(phimuell): Controlflow region and name
     pjit_name = params["name"]
 
-    # TODO(phimuell): Controlflow region and name
-    #  They will introduce a feature like that to address them in optimizations.
-    pjit_name = params["name"]
-
     # Name in SDFG must be unique, thus we mangle it, furthermore, we have to clean it.
     sdfg_name = f"pjit_{re.subn('[^a-zA-Z0-9_]', '_', pjit_name)[0]}__{'_'.join(out_var_names)}"
 
     # Ensure that all inputs are SDFG variables
-    final_input_names = _promote_literals_to_constants(
+    final_input_names = ptranslation.promote_literals_to_constants(
         builder=builder,
         var_names=in_var_names,
         jax_vars=eqn.invars,
         name_pattern=sdfg_name,
     )
 
-    # Now get the translated SDFG.
+    # Translate the nested expression
     nested_context: translator.TranslationContext = builder.translate_jaxpr(
         jaxpr=nested_jaxpr,
         name=sdfg_name,
diff --git a/src/jace/translator/primitive_translators/reshape_translator.py b/src/jace/translator/primitive_translators/reshape_translator.py
index 241cc94..1bcbc5a 100644
--- a/src/jace/translator/primitive_translators/reshape_translator.py
+++ b/src/jace/translator/primitive_translators/reshape_translator.py
@@ -5,14 +5,13 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements the translator for the `reshape` primitive."""
+"""Primitive translator for reshaping operations."""
 
 from __future__ import annotations
 
 from typing import TYPE_CHECKING
 
 import dace
-from typing_extensions import override
 
 from jace import translator, util
 
@@ -23,45 +22,30 @@
     from jax import core as jax_core
 
 
-class ReshapeTranslator(translator.PrimitiveTranslator):
+@translator.register_primitive_translator()
+@translator.make_primitive_translator("reshape")
+def reshape_translator(
+    builder: translator.JaxprTranslationBuilder,  # noqa: ARG001  # Required by the interface.
+    in_var_names: Sequence[str | None],
+    out_var_names: Sequence[str],
+    eqn: jax_core.JaxprEqn,
+    eqn_state: dace.SDFGState,
+) -> None:
     """
-    Implements the `reshape` primitive.
+    Implements the `reshape` primitive, through a memlet.
 
-    The current implementation uses a Memlet for this and essentially acts as
-    an optimization barrier. Furthermore the Jax primitive also has the optional
-    `dimensions` parameters which allows to permute the input, this is not
-    supported.
+    Note:
+        The optional `dimensions` parameters which allows to permute the input
+        is not supported.
     """
-
-    @property
-    def primitive(self) -> str:  # noqa: D102  # No docstring needed.
-        return "reshape"
-
-    @override
-    def __call__(
-        self,
-        builder: translator.JaxprTranslationBuilder,
-        in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
-        eqn: jax_core.JaxprEqn,
-        eqn_state: dace.SDFGState,
-    ) -> None:
-        """
-        Performs the reshaping.
-
-        Currently a copy using a Memlet is performed.
-        """
-        if eqn.params["dimensions"] is not None:
-            raise NotImplementedError("Currently 'dimensions' must be 'None'.")
-        eqn_state.add_nedge(
-            eqn_state.add_read(in_var_names[0]),
-            eqn_state.add_write(out_var_names[0]),
-            dace.Memlet(
-                data=in_var_names[0],
-                subset=", ".join(f"0:{size}" for size in util.get_jax_var_shape(eqn.invars[0])),
-                other_subset=", ".join(f"0:{size}" for size in eqn.params["new_sizes"]),
-            ),
-        )
-
-
-translator.register_primitive_translator(ReshapeTranslator())
+    if eqn.params["dimensions"] is not None:
+        raise NotImplementedError("Currently 'dimensions' must be 'None'.")
+    eqn_state.add_nedge(
+        eqn_state.add_read(in_var_names[0]),
+        eqn_state.add_write(out_var_names[0]),
+        dace.Memlet(
+            data=in_var_names[0],
+            subset=", ".join(f"0:{size}" for size in util.get_jax_var_shape(eqn.invars[0])),
+            other_subset=", ".join(f"0:{size}" for size in eqn.params["new_sizes"]),
+        ),
+    )
diff --git a/src/jace/translator/primitive_translators/select_n_translator.py b/src/jace/translator/primitive_translators/select_n_translator.py
index 51b27b3..0b9a0d1 100644
--- a/src/jace/translator/primitive_translators/select_n_translator.py
+++ b/src/jace/translator/primitive_translators/select_n_translator.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements `select_n`."""
+"""Primitive translator for select operations, i.e. generalized `np.where()`."""
 
 from __future__ import annotations
 
@@ -29,16 +29,13 @@ class SelectNTranslator(mapped_base.MappedOperationTranslatorBase):
     Implements the `select_n` primitive.
 
     The `select_n` primitive is a generalization of `np.where`, that can take an
-    arbitrary number of branches, which are selected by an integer predicate.
+    arbitrary number of cases, which are selected by an integer predicate.
     The behaviour is undefined if the predicate is out of bound.
 
     Note:
         For a better understanding this function renames its input connectors.
         The first one, which is the predicate, is renamed to `__cond` and the
         others are renamed again to `__in{i}`, starting with zero.
-
-    Todo:
-        Implement the primitive as a nested SDFG.
     """
 
     def __init__(self) -> None:
@@ -51,11 +48,9 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        if len(in_var_names) == 3:  # noqa: PLR2004  # `3` is not magic.
-            # This order is correct, since `False` is interpreted as `0`, which means
-            #  the first case. DaCe seems to have some problems with bools and integer
-            #  casting around, so we handle the bool case explicitly here.
-            #  See also `ConvertElementTypeTranslator`.
+        if len(in_var_names) == 3:  # noqa: PLR2004  # Ternary conditional expression.
+            # The order is correct, since `False` is interpreted as `0`,
+            #  which means "the first case".
             return "__out = __in1 if __cond else __in0"
 
         return "\n".join(
@@ -84,10 +79,9 @@ def literal_substitution(
     ) -> str:
         assert in_var_names[0]  # Condition can never be a literal.
         for i, in_var_name in enumerate(in_var_names[1:]):
-            if in_var_name is not None:
-                continue
-            t_val = util.get_jax_literal_value(eqn.invars[i + 1])
-            tskl_code = tskl_code.replace(f"__in{i}", str(t_val))
+            if in_var_name is None:
+                t_val = util.get_jax_literal_value(eqn.invars[i + 1])
+                tskl_code = tskl_code.replace(f"__in{i}", str(t_val))
         return tskl_code
 
 
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index ae4f167..c53c3d0 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements slicing."""
+"""Primitive translators for slicing operations."""
 
 from __future__ import annotations
 
@@ -28,12 +28,13 @@ class SlicingTranslator(mapped_base.MappedOperationTranslatorBase):
     """
     Implements the `slice` primitive.
 
-    This is the classical slicing operation which extracts a fixed sized window
-    from a fixed initial position. The slicing is implemented using a partial copy.
+    The `slice` primitive represents the static case of slicing, i.e. a fixed
+    window starting from a fixed starting point.
+    The slicing is implemented by performing a partial copy.
 
     Note:
         Slices are essentially optimization barriers as they can not be fused
-        with Maps before them.
+        with Maps _before_ them.
     """
 
     def __init__(self) -> None:
@@ -55,7 +56,6 @@ def make_input_memlets(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> dict[str, dace.Memlet]:
-        """We have to add the offsets to the Memlet accesses."""
         strides: Sequence[int] = (
             ((1,) * len(tskl_ranges)) if eqn.params["strides"] is None else eqn.params["strides"]
         )
@@ -64,76 +64,71 @@ def make_input_memlets(
             "__in0": dace.Memlet.simple(
                 in_var_names[0],
                 ", ".join(
-                    f"{start_index} + {it_idx} * {stride}"
+                    f"{start_index} + ({it_idx} * {stride})"
                     for (it_idx, _), start_index, stride in zip(tskl_ranges, start_indices, strides)
                 ),
             )
         }
 
 
-class DynamicSlicingTranslator(translator.PrimitiveTranslator):
+@translator.register_primitive_translator()
+@translator.make_primitive_translator("dynamic_slice")
+def dynamic_slicing_translator(
+    builder: translator.JaxprTranslationBuilder,
+    in_var_names: Sequence[str | None],
+    out_var_names: Sequence[str],
+    eqn: jax_core.JaxprEqn,
+    eqn_state: dace.SDFGState,
+) -> None:
     """
     Implements the `dynamic_slice` primitive.
 
-    [Dynamic slicing](https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.dynamic_slice.html)
-    performs a slicing of a _fixed_ window, but the start of the window is
-    not fix, instead it is passed by variables. Furthermore, (as it is in Jax),
-    if the window would overrun the start indexes are adjusted.
+    Dynamic slicing (see: https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.dynamic_slice.html)
+    performs a slicing of a _fixed_ window, but the start of the window is defined
+    through some input variables. Furthermore, if the window would overrun the
+    start indexes are adjusted.
 
     Todo:
         - Prevent that the modified start indexes are promoted to symbols,
             to ensure mergability.
     """
-
-    @property
-    def primitive(self) -> str:  # noqa: D102  # No docstring needed.
-        return "dynamic_slice"
-
-    @override
-    def __call__(
-        self,
-        builder: translator.JaxprTranslationBuilder,
-        in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
-        eqn: jax_core.JaxprEqn,
-        eqn_state: dace.SDFGState,
-    ) -> None:
-        assert in_var_names[0]
-        assert len(in_var_names) == len(util.get_jax_var_shape(eqn.invars[0])) + 1
-
-        # This is the sizes of the slice window.
-        window_sizes: Sequence[int] = eqn.params["slice_sizes"]
-
-        # Maps the variable name, that stores the start index of the window in one
-        #  dimensions to the access node, that holds the value. The variable name
-        #  is also used as dynamic range offset.
-        #  Only present if the index is not a literal.
-        in_access: dict[str, dace.nodes.AccessNode] = {}
-
-        # Name of the variable from where we get the start index of the window
-        #  or the value itself, if it is a literal; in the order of the dimension.
-        #  If the value is `None` then the literal was not yet processed.
-        window_start_indices: list[str | None] = list(in_var_names[1:])
-
-        # We will always adapt the start indexes and not check if it is needed.
-        for dim, (window_start_index, dim_size, window_size) in enumerate(
-            zip(window_start_indices, util.get_jax_var_shape(eqn.invars[0]), window_sizes)
-        ):
-            if window_start_index is None:
-                # Jax does not adjust the literals on its own
-                raw_window_start = int(util.get_jax_literal_value(eqn.invars[dim + 1]))  # type: ignore[arg-type]  # type confusion
-                adjusted_window_start = min(dim_size, raw_window_start + window_size) - window_size
-                window_start_indices[dim] = str(adjusted_window_start)
-                continue
-
-            # We do not use a symbol for the start of the window but a Tasklet, as
-            #  a symbol would need an interstage edge, which is an optimization barrier.
+    assert in_var_names[0]
+    assert len(in_var_names) == len(util.get_jax_var_shape(eqn.invars[0])) + 1
+
+    window_sizes: Sequence[int] = eqn.params["slice_sizes"]
+
+    # Maps the variable name, that stores the _adjusted_ start index of the window
+    #  of a dimension to the access node that holds the value. Needed to ensure the
+    #  correct order of computation.
+    in_access: dict[str, dace.nodes.AccessNode] = {}
+
+    # Name of the variables (DaCe arrays) from where we get the start index of the
+    #  window or the value itself if it is a literal (`None` means not yet processed).
+    # The first input argument is always the array we slice from.
+    window_start_indices: list[str | None] = list(in_var_names[1:])
+
+    for dim, (window_start_index, dim_size, window_size) in enumerate(
+        zip(window_start_indices, util.get_jax_var_shape(eqn.invars[0]), window_sizes)
+    ):
+        if window_start_index is None:
+            # The start is a literal value.
+            #  Jax does not adjust the literals on its own so we have to do it.
+            raw_window_start = int(util.get_jax_literal_value(eqn.invars[dim + 1]))  # type: ignore[arg-type]  # type confusion
+            adjusted_window_start = min(dim_size, raw_window_start + window_size) - window_size
+            window_start_indices[dim] = str(adjusted_window_start)
+
+        else:
             tasklet = dace.nodes.Tasklet(
                 label=f"adjustment_of_slice_start_{window_start_index}_for_{out_var_names[0]}",
                 inputs={"unadjusted_start_idx": None},
                 outputs={"adjusted_start_idx": None},
                 code=f"adjusted_start_idx = min(unadjusted_start_idx + {window_size}, {dim_size}) - {window_size}",
             )
+            # Name of the variable holding the (adjusted) start of the window.
+            #  It is important that this name is also used for the dynamic map range
+            #  symbols created below. This prevents some errors if DaCe promotes them
+            #  to symbols and does not handle the DMR correctly.
+            #  (see https://github.com/spcl/dace/issues/1665)
             new_start_idx_var_name = builder.add_array(
                 eqn.invars[dim + 1], name_prefix="__jace_adapted_start_idx_"
             )
@@ -153,46 +148,40 @@ def __call__(
                 None,
                 dace.Memlet.simple(new_start_idx_var_name, "0"),
             )
-            # Update the name of the start index, and store the access
-            #  node for later use.
             window_start_indices[dim] = new_start_idx_var_name
             in_access[new_start_idx_var_name] = new_start_idx_acc
 
-        tskl_ranges: list[tuple[str, str]] = [
-            (f"__i{dim}", f"0:{N}") for dim, N in enumerate(util.get_jax_var_shape(eqn.outvars[0]))
-        ]
-
-        memlet_accesses: list[str] = []
-
-        for (it_var, _), offset_symbol_name in zip(tskl_ranges, window_start_indices):
-            assert offset_symbol_name is not None
-            memlet_accesses.append(f"{it_var} + {offset_symbol_name}")
-
-        tskl_input = dace.Memlet.simple(in_var_names[0], ", ".join(memlet_accesses))
-        tskl_output = dace.Memlet.simple(
-            out_var_names[0], ", ".join(name for name, _ in tskl_ranges)
+    tskl_ranges: list[tuple[str, str]] = [
+        (f"__i{dim}", f"0:{N}") for dim, N in enumerate(util.get_jax_var_shape(eqn.outvars[0]))
+    ]
+    tskl_input = dace.Memlet.simple(
+        in_var_names[0],
+        ", ".join(
+            f"{it_var} + {offset_symbol_name}"
+            for (it_var, _), offset_symbol_name in zip(tskl_ranges, window_start_indices)
+        ),
+    )
+    tskl_output = dace.Memlet.simple(out_var_names[0], ", ".join(name for name, _ in tskl_ranges))
+    _, map_entry, _ = eqn_state.add_mapped_tasklet(
+        name=f"dynamic_slice_{out_var_names[0]}",
+        map_ranges=tskl_ranges,
+        inputs={"__in": tskl_input},
+        code="__out = __in",
+        outputs={"__out": tskl_output},
+        external_edges=True,
+    )
+
+    # Create the dynamic ranges, i.e. read the start indexes for the window
+    #  from variable and create symbols out of it, without an interstate edge.
+    for window_start_index_name, windows_start_access_node in in_access.items():
+        eqn_state.add_edge(
+            windows_start_access_node,
+            None,
+            map_entry,
+            window_start_index_name,
+            dace.Memlet.simple(window_start_index_name, "0"),
         )
-        _, map_entry, _ = eqn_state.add_mapped_tasklet(
-            name=f"{self.primitive}_{out_var_names[0]}",
-            map_ranges=tskl_ranges,
-            inputs={"__in": tskl_input},
-            code="__out = __in",
-            outputs={"__out": tskl_output},
-            external_edges=True,
-        )
-
-        # Creating the inputs for the dynamic map ranges. We have to use the same
-        #  access nodes as above, to ensure a single order of computation.
-        for window_start_index_name, windows_start_access_node in in_access.items():
-            eqn_state.add_edge(
-                windows_start_access_node,
-                None,
-                map_entry,
-                window_start_index_name,
-                dace.Memlet.simple(window_start_index_name, "0"),
-            )
-            map_entry.add_in_connector(window_start_index_name)
+        map_entry.add_in_connector(window_start_index_name)
 
 
 translator.register_primitive_translator(SlicingTranslator())
-translator.register_primitive_translator(DynamicSlicingTranslator())
diff --git a/src/jace/translator/primitive_translators/squeeze_translator.py b/src/jace/translator/primitive_translators/squeeze_translator.py
index de6f1f4..dbaa548 100644
--- a/src/jace/translator/primitive_translators/squeeze_translator.py
+++ b/src/jace/translator/primitive_translators/squeeze_translator.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Implements the `squeeze` primitive."""
+"""Primitive translator for squeezing (the removal of size 1 dimensions) operations."""
 
 from __future__ import annotations
 

From cb600d397aaa8d12a9bb82467457a522aab5d4c2 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 24 Sep 2024 12:37:20 +0200
Subject: [PATCH 446/458] Refactored the gather translator.

It is now better confiugured.
---
 .../primitive_translators/__init__.py         |   4 +-
 .../gather_translator.py                      | 333 +++++++++---------
 2 files changed, 160 insertions(+), 177 deletions(-)

diff --git a/src/jace/translator/primitive_translators/__init__.py b/src/jace/translator/primitive_translators/__init__.py
index 757743e..f019964 100644
--- a/src/jace/translator/primitive_translators/__init__.py
+++ b/src/jace/translator/primitive_translators/__init__.py
@@ -17,7 +17,7 @@
 from .conditions import condition_translator
 from .convert_element_type_translator import ConvertElementTypeTranslator
 from .copy_translator import copy_translator, device_put_translator
-from .gather_translator import GatherTranslator
+from .gather_translator import gather_translator
 from .iota_translator import IotaTranslator
 from .pjit_translator import pjit_translator
 from .reshape_translator import reshape_translator
@@ -30,7 +30,6 @@
     "ArithmeticOperationTranslator",
     "BroadcastInDimTranslator",
     "ConvertElementTypeTranslator",
-    "GatherTranslator",
     "IotaTranslator",
     "LogicalOperationTranslator",
     "SelectNTranslator",
@@ -41,6 +40,7 @@
     "copy_translator",
     "device_put_translator",
     "dynamic_slicing_translator",
+    "gather_translator",
     "pjit_translator",
     "reshape_translator",
 ]
diff --git a/src/jace/translator/primitive_translators/gather_translator.py b/src/jace/translator/primitive_translators/gather_translator.py
index 4b58e70..8d0f60f 100644
--- a/src/jace/translator/primitive_translators/gather_translator.py
+++ b/src/jace/translator/primitive_translators/gather_translator.py
@@ -13,7 +13,6 @@
 
 import dace
 from jax import lax as jax_lax
-from typing_extensions import override
 
 from jace import translator, util
 
@@ -24,188 +23,172 @@
     from jax import core as jax_core
 
 
-class GatherTranslator(translator.PrimitiveTranslator):
+@translator.register_primitive_translator()
+@translator.make_primitive_translator("gather")
+def gather_translator(  # noqa: PLR0914 [too-many-locals]  # Can not reduce any further.
+    builder: translator.JaxprTranslationBuilder,  # noqa: ARG001  # Required by the interface.
+    in_var_names: Sequence[str | None],
+    out_var_names: Sequence[str],
+    eqn: jax_core.JaxprEqn,
+    eqn_state: dace.SDFGState,
+) -> None:
     """
-    Garther Translator.
+    Implements the `gather` primitive.
 
-    The gather operation extracts patches of a certain size, known as `slice_size`,
-    from an array, called source or input array. Where these patches starts is
-    given by another array, the index array.
+    These primitive is used to implement the `array.at[...].get()` access. In the
+    end the primitive extracts patches/windows of a certain size, known as
+    `slice_size`, from an array, which is called source or input array. The start
+    points of these windows are given by another array, the so called index array.
+
+    Args:
+        builder: The builder object that is active.
+        in_var_names: The names of the input variables, the first array is
+            assumed as source array and the second is the index array.
+        out_var_names: The names of the output variables.
+        eqn: The equation to translate.
+        eqn_state: The state in which we put the extraction.
 
     See Also:
         https://www.tensorflow.org/xla/operation_semantics#gather
         https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.gather.html
     """
-
-    @property
-    def primitive(self) -> str:  # noqa: D102  # No docstring needed.
-        return "gather"
-
-    @override
-    def __call__(  # noqa: PLR0914, PLR0915  # Just ported from the prototype, cleanup postponed.
-        self,
-        builder: translator.JaxprTranslationBuilder,
-        in_var_names: Sequence[str | None],
-        out_var_names: Sequence[str],
-        eqn: jax_core.JaxprEqn,
-        eqn_state: dace.SDFGState,
-    ) -> None:
-        """
-        Performs the gather operation.
-
-        Args:
-            builder: The builder object that is active.
-            in_var_names: The names of the input variables, the first array is
-                assumed as source array and the second is the index array.
-            out_var_names: The names of the output variables.
-            eqn: The equation to translate.
-            eqn_state: The state in which we put the extraction.
-        """
-        assert len(eqn.invars) == 2  # noqa: PLR2004  # XLA supports more inputs.
-
-        out_name = out_var_names[0]
-        out_shape = util.get_jax_var_shape(eqn.outvars[0])
-
-        src_name = in_var_names[0]
-        src_shape = util.get_jax_var_shape(eqn.invars[0])
-
-        idx_name = in_var_names[1]
-        idx_shape = util.get_jax_var_shape(eqn.invars[1])
-
-        dimension_numbers = eqn.params["dimension_numbers"]
-        offset_dims: Sequence[int] = dimension_numbers.offset_dims
-        collapsed_slice_dims: Sequence[int] = dimension_numbers.collapsed_slice_dims
-        start_index_map: Sequence[int] = dimension_numbers.start_index_map
-        slice_sizes: Sequence[int] = eqn.params["slice_sizes"]
-        mode: jax_lax.GatherScatterMode = eqn.params["mode"]
-        assert len(start_index_map) == idx_shape[-1]
-
-        if mode != jax_lax.GatherScatterMode.PROMISE_IN_BOUNDS:
-            raise NotImplementedError(f"The mode {mode} is not implemented.")
-
-        # Over these dimensions the copy of the patches goes.
-        batch_dims = tuple(d for d in range(len(out_shape)) if d not in offset_dims)
-
-        # Every batch dimension is associated with one dimension of of the index
-        #  array, but there is always one dimension more in the index array. This
-        #  dimension contains the start indexes of the slice, if there is only
-        #  one index that should be loaded is not strictly necessary, but Jax
-        #  (currently adds) it implicitly, probably to make life easier.
-        if (len(batch_dims) + 1) != len(idx_shape):
-            raise ValueError(
-                f"Expected that the index array has {len(batch_dims) + 1} dimensions, but it had {len(idx_shape)}."
-            )
-
-        # These are the dimensions (of the input) for which a map index is created.
-        #  Note that we exclude collapsed dimensions here.
-        src_dim_with_map_idx = tuple(
-            dim for dim in range(len(slice_sizes)) if dim not in collapsed_slice_dims
+    out_name = out_var_names[0]
+    out_shape = util.get_jax_var_shape(eqn.outvars[0])
+    src_name = in_var_names[0]
+    src_shape = util.get_jax_var_shape(eqn.invars[0])
+    idx_name = in_var_names[1]
+    idx_shape = util.get_jax_var_shape(eqn.invars[1])
+    dimension_numbers = eqn.params["dimension_numbers"]
+
+    if eqn.params["mode"] != jax_lax.GatherScatterMode.PROMISE_IN_BOUNDS:
+        raise NotImplementedError(f"The mode {eqn.params['mode']} is not implemented.")
+
+    # This is the size of the slice window that is copied. Its length equal the rank
+    #  of the source array, dimensions that should not be copied are listed in
+    #  `collapsed_slice_dims`.
+    slice_sizes: Sequence[int] = eqn.params["slice_sizes"]
+    collapsed_slice_dims: Sequence[int] = dimension_numbers.collapsed_slice_dims
+    not_collapsed_slice_dims = tuple(
+        dim for dim in range(len(slice_sizes)) if dim not in collapsed_slice_dims
+    )
+    assert len(slice_sizes) == len(src_shape)
+
+    # The batch dimensions are used to iterate through the slice windows, thus access
+    #  the index array, with the exception of the last dimension, see below.
+    # NOTE: In pure XLA this last dimension might not be present, however, JAX
+    #   adds it and our implementation relies on it.
+    batch_dims = tuple(d for d in range(len(out_shape)) if d not in dimension_numbers.offset_dims)
+    if (len(batch_dims) + 1) != len(idx_shape):
+        raise ValueError(
+            f"Expected that the index array has {len(batch_dims) + 1} dimensions, but it had {len(idx_shape)}."
         )
-        assert len(src_dim_with_map_idx) == len(offset_dims)
-
-        # The final map is the composition of two loops. The first map iterates over
-        #  the index array, except the last dimension, and is used to "copy" the
-        #  different patches from the source to the output array. These map parameters
-        #  follow the pattern `__i{out_name}_gather{bd}`, where `bd` is a batch
-        #  dimension. These variables are used to access the index array.
-        #  The second loop performs the actual copy of the slices. For these
-        #  the variables `__i{i}` is used were, these are known as offset
-        #  dimensions.
-        #  What is a bit difficult, that the actual access/dereferencing of the source
-        #  array is done within the tasklet.
-
-        # Access pattern of the source array _within_ the tasklet.
-        src_access_pattern: list[str] = []
-
-        # These are the map ranges for the coying of the slicing.
-        slice_map_ranges: list[tuple[str, str]] = []
-
-        # Compute the access pattern within the tasklet.
-        #  As a side effect we also compute the map ranges, but only for the slices.
-        for dim, slice_size in enumerate(slice_sizes):
-            # Order is important!
-            if dim not in start_index_map:
-                # This dimension is fully copied
-                slice_map_ranges.append((f"__i{dim}", f"0:{slice_size}"))
-                src_access_pattern.append(slice_map_ranges[-1][0])
-                assert dim in src_dim_with_map_idx
-                assert slice_size == src_shape[dim]
-
-            elif dim in collapsed_slice_dims:
-                # This dimension is only partially copied, however, since the
-                #  dimension is collapsed, only a single element is copied that
-                #  comes from the index array.
-                src_access_pattern.append(f"__gather_{dim}")
-
-            else:
-                # This dimension is partially copied, but is _not colapsed_, we need
-                #  a map index to copy the range. However, there is also an offset
-                #  that is involved from copying.
-                slice_map_ranges.append((f"__i{dim}", f"0:{slice_size}"))
-                src_access_pattern.append(f"__gather_{dim} + {slice_map_ranges[-1][0]}")
-                assert dim in src_dim_with_map_idx
-                assert slice_size <= src_shape[dim]
-
-        # These are the map variable that go over the index array.
-        patch_loop_vars = tuple(f"__i{out_name}_gather{bd}" for bd in batch_dims)
-        patch_map_ranges = [
-            (map_param, f"0:{patch_loop_bound}")
-            for map_param, patch_loop_bound in zip(patch_loop_vars, idx_shape[:-1])
-        ]
-
-        # Creating the input memlet that allows us to access the source array from
-        #  inside the tasklet and make it accessible through the name `__arr`. At
-        #  this point it is not possible to tell where we access, because we are
-        #  missing a index variables, they will only be accessible inside the
-        #  tasklet (see below), however, we know that we will access only one
-        #  element from the array.
-        tasklet_inputs: dict[str, dace.Memlet] = {
-            "__arr": dace.Memlet.simple(
-                data=src_name,
-                subset_str=", ".join(f"0:{size}" for size in src_shape),
-                num_accesses=1,
+
+    # The last dimension is special, as it contains the actual start point for the
+    #  slice window when the dimension is only partially copied. The `start_index_map`
+    #  associates each position element in the last dimension with the corresponding
+    #  dimension of the source array.
+    start_index_map: Sequence[int] = dimension_numbers.start_index_map
+    assert len(start_index_map) == idx_shape[-1]
+
+    # The final map has two parts. The first part iterates through all the slice
+    #  windows that are given through the index array (except last dimension).
+    #  If a dimension is not fully copied then the start index of the window is
+    #  given through the elements of the last dimensions of the index array.
+    #  Map variables that are used for this use the pattern `__i{out_name}_gather{bd}`.
+    #  The second loop is used to copy the slice windows themselves, their map
+    #  variables follow the pattern `__i{i}`.
+
+    # Because the offsets of the slice window (which are given by the elements of
+    #  the last dimension of the index array) are variables and not symbols, it
+    #  can not be included in the memlets. Instead we generate an tasklet that
+    #  performs an indirect access and get all elements of the last dimension of the
+    #  index array (with the names `__gather_{dim}`), together with the full source
+    #  array as input.
+
+    # Access pattern of the source array _inside_ the tasklet.
+    src_access_pattern: list[str] = []
+
+    # The ranges of the second part implicit loop (the one that copies the windows).
+    inside_window_map_ranges: list[tuple[str, str]] = []
+
+    for dim, slice_size in enumerate(slice_sizes):
+        # Order is important!
+        if dim not in start_index_map:
+            # This dimension is fully copied
+            inside_window_map_ranges.append((f"__i{dim}", f"0:{slice_size}"))
+            src_access_pattern.append(inside_window_map_ranges[-1][0])
+            assert dim in not_collapsed_slice_dims
+            assert dim not in batch_dims
+
+        elif dim in collapsed_slice_dims:
+            # This dimension is only partially copied, but because it is collapsed,
+            #  only a single element is copied. Thus the offset is only given by the
+            #  index array.
+            src_access_pattern.append(f"__gather_{dim}")
+            assert dim in batch_dims
+
+        else:
+            # This dimension is partially copied, but _not colapsed_. This creates a
+            #  slice index and the offset (of a single element) is given by the static
+            #  start of the window and the current position inside of the window.
+            inside_window_map_ranges.append((f"__i{dim}", f"0:{slice_size}"))
+            src_access_pattern.append(f"__gather_{dim} + {inside_window_map_ranges[-1][0]}")
+            assert dim in batch_dims
+            assert dim in not_collapsed_slice_dims
+
+    # These are the map variables that are associated to the first implicit loop (the
+    #  iteration over the index array, excluding the last dimension).
+    batch_map_ranges = [
+        (f"__i{out_name}_gather{batch_dim}", f"0:{batch_loop_bound}")
+        for batch_dim, batch_loop_bound in zip(batch_dims, idx_shape[:-1])
+    ]
+    assert len(batch_map_ranges) + len(inside_window_map_ranges) == len(out_shape)
+
+    tasklet_inputs: dict[str, dace.Memlet] = {}
+
+    # We need to pass the full array into the tasklet, however, we know that we
+    #  will read only one element.
+    tasklet_inputs["__arr"] = dace.Memlet.simple(
+        data=src_name,
+        subset_str=", ".join(f"0:{size}" for size in src_shape),
+        num_accesses=1,
+    )
+
+    # The static offset of the slice window, which is given through the elements
+    #  of the last dimensions of the index array, for every element in that dimension
+    #  there is an input.
+    for i, dim in enumerate(start_index_map):
+        tasklet_inputs[f"__gather_{dim}"] = dace.Memlet.simple(
+            data=idx_name,
+            subset_str=(
+                ", ".join(batch_loop_var for batch_loop_var, _ in batch_map_ranges) + f", {i}"
             ),
-        }
-
-        # Now we are creating the memlets that access the index array.
-        for i, dim in enumerate(start_index_map):
-            tasklet_inputs[f"__gather_{dim}"] = dace.Memlet.simple(
-                data=idx_name, subset_str=(", ".join(patch_loop_vars) + f", {i}")
-            )
-
-        # The tasklet code.
-        tasklet_code = "__out = __arr[" + ", ".join(src_access_pattern) + "]"
-
-        # Now we generate the output memlet.
-        outpt_access_pattern: list[str] = []
-        dim_counter = 0
-        for dim in range(len(out_shape)):
-            if dim in batch_dims:
-                # This is a batch dimension, thus a loop variable is used for it.
-                patch_loop_var = patch_loop_vars[batch_dims.index(dim)]
-                outpt_access_pattern.append(str(patch_loop_var))
-
-            else:
-                # This is a dimension for copying the slices.
-                assert dim_counter <= len(src_dim_with_map_idx)
-                associated_map_idx = src_dim_with_map_idx[dim_counter]
-                dim_counter += 1
-                outpt_access_pattern.append(f"__i{associated_map_idx}")
-        assert dim_counter == len(src_dim_with_map_idx)
-
-        tasklet_outputs: dict[str, dace.Memlet] = {
-            "__out": dace.Memlet.simple(data=out_name, subset_str=", ".join(outpt_access_pattern))
-        }
-        assert len(patch_map_ranges) + len(slice_map_ranges) == len(out_shape)
-
-        eqn_state.add_mapped_tasklet(
-            name=f"_gather_map_{out_name}",
-            map_ranges=patch_map_ranges + slice_map_ranges,
-            inputs=tasklet_inputs,
-            code=tasklet_code,
-            outputs=tasklet_outputs,
-            external_edges=True,
         )
 
-
-_ = translator.register_primitive_translator(GatherTranslator())
+    # The output shape is given by the combination of the non collapsed slice sizes
+    #  and the index array (without the last dimension) with some permutation.
+    #  Note that the relative order of slice sizes can not be changed, but they
+    #  might be interleaved with the batch variables.
+    output_memlet_pattern: list[str] = []
+    dim_counter = 0
+    for dim in range(len(out_shape)):
+        if dim in batch_dims:
+            batch_loop_var = batch_map_ranges[batch_dims.index(dim)][0]
+            output_memlet_pattern.append(str(batch_loop_var))
+
+        else:
+            associated_map_idx = not_collapsed_slice_dims[dim_counter]
+            dim_counter += 1
+            output_memlet_pattern.append(f"__i{associated_map_idx}")
+    assert dim_counter == len(not_collapsed_slice_dims)
+
+    eqn_state.add_mapped_tasklet(
+        name=f"_gather_map_{out_name}",
+        map_ranges=batch_map_ranges + inside_window_map_ranges,
+        inputs=tasklet_inputs,
+        code="__out = __arr[" + ", ".join(src_access_pattern) + "]",
+        outputs={
+            "__out": dace.Memlet.simple(data=out_name, subset_str=", ".join(output_memlet_pattern))
+        },
+        external_edges=True,
+    )

From c29fc0dbf0377e67baea172d282e6b1da0995c7a Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 24 Sep 2024 14:15:02 +0200
Subject: [PATCH 447/458] Some more corrections.

Now let's test if it works.
---
 .../mapped_operation_base_translator.py       | 50 +++++++--------
 .../arithmetic_logical_translators.py         | 16 ++---
 .../concatenate_translator.py                 | 11 +++-
 .../primitive_translators/conditions.py       | 25 ++++----
 .../convert_element_type_translator.py        |  2 +-
 .../primitive_translators/copy_translator.py  | 27 ++++++--
 .../gather_translator.py                      | 64 ++++++++++---------
 .../primitive_translators/pjit_translator.py  | 17 +++--
 .../reshape_translator.py                     | 18 +++++-
 .../select_n_translator.py                    |  2 +-
 10 files changed, 136 insertions(+), 96 deletions(-)

diff --git a/src/jace/translator/mapped_operation_base_translator.py b/src/jace/translator/mapped_operation_base_translator.py
index 17a5c35..508ad13 100644
--- a/src/jace/translator/mapped_operation_base_translator.py
+++ b/src/jace/translator/mapped_operation_base_translator.py
@@ -5,7 +5,7 @@
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
-"""Module containing all translators related to arithmetic logical operations."""
+"""Module implementing the `MappedOperationTranslatorBase` helper class."""
 
 from __future__ import annotations
 
@@ -37,8 +37,9 @@ class MappedOperationTranslatorBase(translator.PrimitiveTranslator):
     ```
     where `__in*` are the connector names of the Tasklet and `__out` is the
     output connector. For problems such as this, the SDFG API provides the
-    `SDFGState.add_mapped_tasklet()` function, however, because it is very low
-    level and very verbose to use, this class acts as a convenience wrapper around it.
+    `SDFGState.add_mapped_tasklet()` function. However, because the function
+    operates on a very low level and is very verbose to use, this class acts
+    as a convenience wrapper around it.
 
     To use this class a user has to define the abstract `write_tasklet_code()` method.
     This function generates the entire code that should be put into the Tasklet,
@@ -160,8 +161,8 @@ def make_input_memlets(  # noqa: PLR6301 [no-self-use]  # Subclasses might need
             in_var_names: The list of SDFG variables used as input, `None` if literal.
             eqn: The equation object.
         """
-        out_shp = tuple(util.get_jax_var_shape(eqn.outvars[0]))  # Shape of the output
-        out_rank = len(out_shp)
+        out_shape = tuple(util.get_jax_var_shape(eqn.outvars[0]))
+        out_rank = len(out_shape)
         if any(len(util.get_jax_var_shape(invar)) not in {0, out_rank} for invar in eqn.invars):
             raise NotImplementedError(
                 f"'MappedOperationTranslatorBase' Inputs must have the same rank as the output! "
@@ -170,29 +171,26 @@ def make_input_memlets(  # noqa: PLR6301 [no-self-use]  # Subclasses might need
 
         # Now we will generate the input Memlets.
         tskl_inputs: dict[str, dace.Memlet] = {}
-        for i, (in_var_name, inp_shp) in enumerate(
+        for i, (in_var_name, in_shape) in enumerate(
             zip(in_var_names, (util.get_jax_var_shape(invar) for invar in eqn.invars))
         ):
-            if in_var_name is None:  # Input is a literal: No Memlet needed
-                continue
-
-            if inp_shp == ():  # Scalars
-                tskl_inputs[f"__in{i}"] = dace.Memlet.simple(in_var_name, "0")  # Scalar
-                continue
-
-            # We might have to do broadcasting.
-            #  We ensured that input and output have the same rank (JAX is doing that
-            #  for us). So we must do broadcasting, i.e. replicating that input
-            #  dimension, if its size is 1. We threat the case where the output has
-            #  size 1 in that dimension as broadcasting as well.
-            dims_to_bcast: Sequence[int] = [dim for dim in range(out_rank) if inp_shp[dim] == 1]
-            tskl_inputs[f"__in{i}"] = dace.Memlet.simple(
-                in_var_name,
-                ", ".join(
-                    ("0" if i in dims_to_bcast else it_var)
-                    for i, (it_var, _) in enumerate(tskl_ranges)
-                ),
-            )
+            if in_var_name is None:
+                pass
+
+            elif in_shape == ():
+                tskl_inputs[f"__in{i}"] = dace.Memlet.simple(in_var_name, "0")
+
+            else:
+                dims_to_bcast = [
+                    dim for dim in range(out_rank) if in_shape[dim] == 1 and out_shape[dim] != 1
+                ]
+                tskl_inputs[f"__in{i}"] = dace.Memlet.simple(
+                    in_var_name,
+                    ", ".join(
+                        ("0" if i in dims_to_bcast else it_var)
+                        for i, (it_var, _) in enumerate(tskl_ranges)
+                    ),
+                )
         return tskl_inputs
 
     def literal_substitution(  # noqa: PLR6301 [no-self-use]  # Subclasses might need it.
diff --git a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
index 667e1ac..7cf321f 100644
--- a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
+++ b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
@@ -100,14 +100,12 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        return (
-            self._bool_tmpl
-            if all(util.get_jax_var_dtype(invar) is dace.bool_ for invar in eqn.invars)
-            else self._int_tmpl
-        )
+        if all(util.get_jax_var_dtype(invar) is dace.bool_ for invar in eqn.invars):
+            return self._bool_tmpl
+        return self._int_tmpl
 
 
-# Maps the name of an arithmetic primitives to the code template that is used to
+# Maps the name of an arithmetic JAX primitive to the code template that is used to
 #  generate the body of the mapped tasklet. These are used to instantiate the
 #  `ArithmeticOperationTranslator` objects.
 # fmt: off
@@ -175,9 +173,9 @@ def write_tasklet_code(
 }
 
 
-# Maps the name of a logical primitive to the two code templates (first the integer
-#  case and second the boolean case) used to create the body of the mapped tasklet.
-#  They are used to instantiate the `LogicalOperationTranslator` translators.
+# Maps the name of a logical primitive to the two code templates, first the integer
+#  case and second the boolean case, that are used to create the body of the mapped
+#  tasklet. They are used to instantiate the `LogicalOperationTranslator` translators.
 _LOGICAL_OPERATION_TEMPLATES: Final[dict[str, tuple[str, str]]] = {
     "or": ("__out = (__in0) | (__in1)",  "__out = (__in0) or (__in1)"),
     "not": ("__out = ~(__in0)", "__out = not (__in0)"),
diff --git a/src/jace/translator/primitive_translators/concatenate_translator.py b/src/jace/translator/primitive_translators/concatenate_translator.py
index 1b5f679..b327bde 100644
--- a/src/jace/translator/primitive_translators/concatenate_translator.py
+++ b/src/jace/translator/primitive_translators/concatenate_translator.py
@@ -25,7 +25,7 @@
 @translator.register_primitive_translator()
 @translator.make_primitive_translator("concatenate")
 def concatenate_translator(
-    builder: translator.JaxprTranslationBuilder,  # noqa: ARG001  # Required by the interface.
+    builder: translator.JaxprTranslationBuilder,  # noqa: ARG001 [unused-function-argument]  # Required by the interface.
     in_var_names: Sequence[str | None],
     out_var_names: Sequence[str],
     eqn: jax_core.JaxprEqn,
@@ -36,6 +36,15 @@ def concatenate_translator(
 
     Each source array is copied by its own map, but all maps write to the same
     access node.
+
+    Args:
+        builder: The builder object of the translation; unused.
+        in_var_names: The SDFG variables used an input arguments in order as they
+            should be concatenated.
+        out_var_names: Names of SDFG variables that should be used as outputs.
+        eqn: The equation that should be translated, the concatenation dimensions
+            is read from the `dimension` parameter.
+        eqn_state: State into which the nested SDFG should be constructed.
     """
     if any(in_var_name is None for in_var_name in in_var_names):
         raise NotImplementedError("Concatenate: No literal inputs supported.")
diff --git a/src/jace/translator/primitive_translators/conditions.py b/src/jace/translator/primitive_translators/conditions.py
index 4f7363d..6e37a7a 100644
--- a/src/jace/translator/primitive_translators/conditions.py
+++ b/src/jace/translator/primitive_translators/conditions.py
@@ -41,18 +41,19 @@ def condition_translator(
 
     Args:
         builder: The builder object of the translation.
-        in_var_names: The SDFG variables used an input arguments. First is the index,
-            the variable that selects the branch, the remaining ones are passed as
-            inputs to the branches.
+        in_var_names: The SDFG variables used an input arguments. First is the
+            selection variable. The remaining ones are passed to the branches as
+            inputs.
         out_var_names: Names of SDFG variables that should be used as outputs.
         eqn: The equation that should be translated.
         eqn_state: State into which the nested SDFG should be constructed.
 
     Notes:
-        According to the JAX documentation (https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.switch.html)
-        the selector is clamped. But according to XLA (https://openxla.org/xla/operation_semantics#conditional)
-        an out of range selector uses the last branch. JaCe conforms to JAX semantic.
-        After this function the terminal state of the `builder` is unspecific.
+        - According to the JAX documentation (https://jax.readthedocs.io/en/latest/_autosummary/jax.lax.switch.html)
+            the selector is clamped. But according to XLA (https://openxla.org/xla/operation_semantics#conditional)
+            an out of range selector uses the last branch. JaCe conforms to JAX
+            semantic.
+        - After this function the terminal state of the `builder` is unspecific.
     """
     if util.get_jax_var_dtype(eqn.invars[0]) is dace.bool_:
         # XLA explicitly provides a binary form of the primitive
@@ -61,7 +62,7 @@ def condition_translator(
         #  integer implementation.
         raise NotImplementedError("The boolean conditional primitive is not implemented.")
 
-    # To make names in the (nested) SDFG unique we use the name of the equation state
+    # Used as prefix to give all additional states/variables a unique name.
     name_pattern = eqn_state.name
 
     # To avoid special cases promote all symbols to constants.
@@ -80,9 +81,7 @@ def condition_translator(
         literal_selection_value = str(util.get_jax_literal_value(eqn.invars[0]))
         selection_symbol = f"max({len(branches)}, min(0, {literal_selection_value}))"
         selection_state = eqn_state
-
     else:
-        # Promotion of a scalar to a symbol through a state transition.
         selection_variable_name = in_var_names[0]
         selection_symbol = f"{selection_variable_name}_symb"
         selection_state = builder.append_new_state(
@@ -93,12 +92,15 @@ def condition_translator(
             prev_state=eqn_state,
         )
 
+    # Translate the subbranches, the branches are all connected from `selection_state`.
     branch_states: list[dace.SDFGState] = []
     for i, branch_jaxpr in enumerate(branches):
         branch_pattern = f"{name_pattern}_{{}}_branch_{i}"
         branch_ctx = builder.translate_jaxpr(jaxpr=branch_jaxpr, name=branch_pattern.format("sdfg"))
 
-        # This will update the terminal state only for the first branch
+        # The first time it is called it will update the builder's terminal state
+        #  but since we will return the join state it will be updated later. But
+        #  until then the terminal state of the builder is invalid.
         branch_state = builder.append_new_state(
             label=branch_pattern.format("state"),
             condition=f"{selection_symbol} == {i}",
@@ -113,6 +115,7 @@ def condition_translator(
         )
         branch_states.append(branch_state)
 
+    # Connect all branch states to the join state
     join_state = builder.add_orphan_state(f"{name_pattern}__join_state")
     for branch_state in branch_states:
         builder.sdfg.add_edge(
diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index 118f4e3..a9f179c 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -56,7 +56,7 @@ def write_tasklet_code(
 
         if in_dtype == out_dtype:
             # JAX sometimes adds conversions which are not needed. In these cases
-            #  we perform a copy.
+            #  make a copy out of it.
             # TODO(phimuell): Create a Memlet instead.
             return "__out = __in0"
 
diff --git a/src/jace/translator/primitive_translators/copy_translator.py b/src/jace/translator/primitive_translators/copy_translator.py
index 5cc0d3c..9e0d2d1 100644
--- a/src/jace/translator/primitive_translators/copy_translator.py
+++ b/src/jace/translator/primitive_translators/copy_translator.py
@@ -28,21 +28,31 @@ def copy_translator(
     builder: translator.JaxprTranslationBuilder,
     in_var_names: Sequence[str | None],
     out_var_names: Sequence[str],
-    eqn: jax_core.JaxprEqn,  # noqa: ARG001  # Required by the interface.
+    eqn: jax_core.JaxprEqn,  # noqa: ARG001 [unused-function-argument]  # Required by the interface.
     eqn_state: dace.SDFGState,
 ) -> None:
     """
     Implements the `copy` primitive.
 
+    The copy is implemented by creating a memlet between the source and destination.
+
+    Args:
+        builder: The builder object of the translation.
+        in_var_names: The SDFG variable that acts as source.
+        out_var_names: The SDFG variable that acts as destination of the copy.
+        eqn: The equation that should be translated; unused.
+        eqn_state: State into which the nested SDFG should be constructed.
+
     Todo:
         Investigate if operation should expand to a map.
     """
+    assert in_var_names[0] is not None
     eqn_state.add_nedge(
         eqn_state.add_read(in_var_names[0]),
         eqn_state.add_write(out_var_names[0]),
         dace.Memlet.from_array(
             in_var_names[0],
-            builder.arrays[in_var_names[0]],  # type: ignore[index]  # Guaranteed to be a string
+            builder.arrays[in_var_names[0]],
         ),
     )
 
@@ -60,9 +70,16 @@ def device_put_translator(
     Implements the `device_put` primitive.
 
     In JAX this primitive is used to copy data between the host and the device,
-    in DaCe Memlets can do this. However, because of the way JaCe operates, at
-    least in the beginning a computation is either fully on the host or on the
-    device this copy will essentially perform a copying.
+    in DaCe only memlets can do this. However, because of the way JaCe (currently)
+    operates (a computation is either fully on the host or on GPU), the `device_put`
+    primitive essentially decays to a copy.
+
+    Args:
+        builder: The builder object of the translation.
+        in_var_names: The SDFG variable that acts as source.
+        out_var_names: The SDFG variable that acts as destination of the copy.
+        eqn: The equation that should be translated.
+        eqn_state: State into which the nested SDFG should be constructed.
     """
     if not (eqn.params["device"] is None and eqn.params["src"] is None):
         raise NotImplementedError(
diff --git a/src/jace/translator/primitive_translators/gather_translator.py b/src/jace/translator/primitive_translators/gather_translator.py
index 8d0f60f..daacb56 100644
--- a/src/jace/translator/primitive_translators/gather_translator.py
+++ b/src/jace/translator/primitive_translators/gather_translator.py
@@ -26,7 +26,7 @@
 @translator.register_primitive_translator()
 @translator.make_primitive_translator("gather")
 def gather_translator(  # noqa: PLR0914 [too-many-locals]  # Can not reduce any further.
-    builder: translator.JaxprTranslationBuilder,  # noqa: ARG001  # Required by the interface.
+    builder: translator.JaxprTranslationBuilder,  # noqa: ARG001 [unused-function-argument]  # Required by the interface.
     in_var_names: Sequence[str | None],
     out_var_names: Sequence[str],
     eqn: jax_core.JaxprEqn,
@@ -64,8 +64,8 @@ def gather_translator(  # noqa: PLR0914 [too-many-locals]  # Can not reduce any
         raise NotImplementedError(f"The mode {eqn.params['mode']} is not implemented.")
 
     # This is the size of the slice window that is copied. Its length equal the rank
-    #  of the source array, dimensions that should not be copied are listed in
-    #  `collapsed_slice_dims`.
+    #  of the source array, dimensions that are excluded from copying are listed
+    #  in `collapsed_slice_dims`.
     slice_sizes: Sequence[int] = eqn.params["slice_sizes"]
     collapsed_slice_dims: Sequence[int] = dimension_numbers.collapsed_slice_dims
     not_collapsed_slice_dims = tuple(
@@ -73,34 +73,38 @@ def gather_translator(  # noqa: PLR0914 [too-many-locals]  # Can not reduce any
     )
     assert len(slice_sizes) == len(src_shape)
 
-    # The batch dimensions are used to iterate through the slice windows, thus access
-    #  the index array, with the exception of the last dimension, see below.
-    # NOTE: In pure XLA this last dimension might not be present, however, JAX
-    #   adds it and our implementation relies on it.
+    # The batch dimensions are used to iterate through the different slice windows
+    #  (not inside them) thus they access the index array, with the exception of the
+    #  last dimension, see below.
+    # NOTE: In pure XLA this last dimension is in certain cases optional, however,
+    #   JAX adds it and our implementation relies on it.
     batch_dims = tuple(d for d in range(len(out_shape)) if d not in dimension_numbers.offset_dims)
     if (len(batch_dims) + 1) != len(idx_shape):
         raise ValueError(
             f"Expected that the index array has {len(batch_dims) + 1} dimensions, but it had {len(idx_shape)}."
         )
 
-    # The last dimension is special, as it contains the actual start point for the
-    #  slice window when the dimension is only partially copied. The `start_index_map`
-    #  associates each position element in the last dimension with the corresponding
+    # The last dimension of the index array is special, as it contains the actual
+    #  start point for the slice windows when the dimension is only partially copied.
+    #  Thus the last dimension must be seen as a list of start indexes and the other
+    #  dimensions are used to enumerate the slice windows. The `start_index_map`
+    #  associates each position in the last dimension with the corresponding
     #  dimension of the source array.
     start_index_map: Sequence[int] = dimension_numbers.start_index_map
     assert len(start_index_map) == idx_shape[-1]
 
-    # The final map has two parts. The first part iterates through all the slice
-    #  windows that are given through the index array (except last dimension).
-    #  If a dimension is not fully copied then the start index of the window is
-    #  given through the elements of the last dimensions of the index array.
-    #  Map variables that are used for this use the pattern `__i{out_name}_gather{bd}`.
-    #  The second loop is used to copy the slice windows themselves, their map
-    #  variables follow the pattern `__i{i}`.
+    # The iteration variable of the final map can be divided into two parts or
+    #  categories. The first part iterates through all the slice windows that are
+    #  given through the index array. If a dimension is not fully copied then the
+    #  start index of the window is given through the elements of the last dimensions
+    #  of the index array. Map variables that are used for this use the pattern
+    #  `__i{out_name}_gather{bd}`. The second kind of variables are used to copy the
+    #  content of the slice windows themselves, these map variables follow the
+    #  pattern `__i{i}`.
 
     # Because the offsets of the slice window (which are given by the elements of
-    #  the last dimension of the index array) are variables and not symbols, it
-    #  can not be included in the memlets. Instead we generate an tasklet that
+    #  the last dimension of the index array) are variables and not symbols, they
+    #  can not be included in the memlets. Instead we generate a tasklet that
     #  performs an indirect access and get all elements of the last dimension of the
     #  index array (with the names `__gather_{dim}`), together with the full source
     #  array as input.
@@ -108,7 +112,8 @@ def gather_translator(  # noqa: PLR0914 [too-many-locals]  # Can not reduce any
     # Access pattern of the source array _inside_ the tasklet.
     src_access_pattern: list[str] = []
 
-    # The ranges of the second part implicit loop (the one that copies the windows).
+    # The map variables and their ranges of the second part implicit loop; the one
+    #  that copy the content inside the window.
     inside_window_map_ranges: list[tuple[str, str]] = []
 
     for dim, slice_size in enumerate(slice_sizes):
@@ -123,14 +128,14 @@ def gather_translator(  # noqa: PLR0914 [too-many-locals]  # Can not reduce any
         elif dim in collapsed_slice_dims:
             # This dimension is only partially copied, but because it is collapsed,
             #  only a single element is copied. Thus the offset is only given by the
-            #  index array.
+            #  what we read from the index array.
             src_access_pattern.append(f"__gather_{dim}")
             assert dim in batch_dims
 
         else:
-            # This dimension is partially copied, but _not colapsed_. This creates a
-            #  slice index and the offset (of a single element) is given by the static
-            #  start of the window and the current position inside of the window.
+            # This dimension is partially copied, but _not colapsed_. This the element
+            #  that is read depends on the (static) offset of this window and the
+            #  current position within the slicing window.
             inside_window_map_ranges.append((f"__i{dim}", f"0:{slice_size}"))
             src_access_pattern.append(f"__gather_{dim} + {inside_window_map_ranges[-1][0]}")
             assert dim in batch_dims
@@ -154,9 +159,8 @@ def gather_translator(  # noqa: PLR0914 [too-many-locals]  # Can not reduce any
         num_accesses=1,
     )
 
-    # The static offset of the slice window, which is given through the elements
-    #  of the last dimensions of the index array, for every element in that dimension
-    #  there is an input.
+    # The static offsets of the slice window, are given through the elements of the
+    #  last dimensions of the index array.
     for i, dim in enumerate(start_index_map):
         tasklet_inputs[f"__gather_{dim}"] = dace.Memlet.simple(
             data=idx_name,
@@ -165,10 +169,10 @@ def gather_translator(  # noqa: PLR0914 [too-many-locals]  # Can not reduce any
             ),
         )
 
-    # The output shape is given by the combination of the non collapsed slice sizes
+    # The output shape is given by the combination of the not collapsed slice sizes
     #  and the index array (without the last dimension) with some permutation.
-    #  Note that the relative order of slice sizes can not be changed, but they
-    #  might be interleaved with the batch variables.
+    #  While the relative order of slice window does not change, `start_index_map`
+    #  already applied a permutation, it might be interleaved with batch dimensions.
     output_memlet_pattern: list[str] = []
     dim_counter = 0
     for dim in range(len(out_shape)):
diff --git a/src/jace/translator/primitive_translators/pjit_translator.py b/src/jace/translator/primitive_translators/pjit_translator.py
index b3b9d97..43bc3ea 100644
--- a/src/jace/translator/primitive_translators/pjit_translator.py
+++ b/src/jace/translator/primitive_translators/pjit_translator.py
@@ -11,7 +11,7 @@
 
 import re
 from collections.abc import Sequence
-from typing import TYPE_CHECKING, Any
+from typing import TYPE_CHECKING
 
 from jax._src import sharding_impls as jax_sharding  # noqa: PLC2701 [import-private-name]
 
@@ -54,13 +54,12 @@ def pjit_translator(
         The translator ignores the `donated_invars`, the `keep_unused` and the
         `inline` parameter and let's DaCe handle it.
     """
-    params: dict[str, Any] = eqn.params
-    nested_jaxpr: jax_core.ClosedJaxpr = params["jaxpr"]
-    in_shardings = params["in_shardings"]
-    out_shardings = params["out_shardings"]
-    _ = params["donated_invars"]  # Always ignored
-    _ = params["keep_unused"]
-    _ = params["inline"]
+    nested_jaxpr: jax_core.ClosedJaxpr = eqn.params["jaxpr"]
+    in_shardings = eqn.params["in_shardings"]
+    out_shardings = eqn.params["out_shardings"]
+    _ = eqn.params["donated_invars"]  # Always ignored
+    _ = eqn.params["keep_unused"]
+    _ = eqn.params["inline"]
 
     if not all(in_sharding is jax_sharding.UNSPECIFIED for in_sharding in in_shardings):
         raise NotImplementedError("Currently 'pjit' does not support sharding in its input.")
@@ -68,7 +67,7 @@ def pjit_translator(
         raise NotImplementedError("Currently 'pjit' does not support sharding in its output.")
 
     # TODO(phimuell): Controlflow region and name
-    pjit_name = params["name"]
+    pjit_name = eqn.params["name"]
 
     # Name in SDFG must be unique, thus we mangle it, furthermore, we have to clean it.
     sdfg_name = f"pjit_{re.subn('[^a-zA-Z0-9_]', '_', pjit_name)[0]}__{'_'.join(out_var_names)}"
diff --git a/src/jace/translator/primitive_translators/reshape_translator.py b/src/jace/translator/primitive_translators/reshape_translator.py
index 1bcbc5a..79b9bb0 100644
--- a/src/jace/translator/primitive_translators/reshape_translator.py
+++ b/src/jace/translator/primitive_translators/reshape_translator.py
@@ -25,17 +25,29 @@
 @translator.register_primitive_translator()
 @translator.make_primitive_translator("reshape")
 def reshape_translator(
-    builder: translator.JaxprTranslationBuilder,  # noqa: ARG001  # Required by the interface.
+    builder: translator.JaxprTranslationBuilder,  # noqa: ARG001 [unused-function-argument]  # Required by the interface.
     in_var_names: Sequence[str | None],
     out_var_names: Sequence[str],
     eqn: jax_core.JaxprEqn,
     eqn_state: dace.SDFGState,
 ) -> None:
     """
-    Implements the `reshape` primitive, through a memlet.
+    Implements the `reshape` primitive.
+
+    The function creates a memlet between the input (old shape) and output (final
+    shape). Because of this, it is best if both arrays do not have any paddings.
+
+    Args:
+        builder: The builder object of the translation.
+        in_var_names: Name of the SDFG variable of the source array,
+            with the old shape.
+        out_var_names: Name of SDFG variable that acts as destination,
+            with the new shape.
+        eqn: The equation that contains the `pjit` primitive.
+        eqn_state: State into which the nested SDFG should be constructed.
 
     Note:
-        The optional `dimensions` parameters which allows to permute the input
+        The optional `dimensions` parameters, which allows to permute the input,
         is not supported.
     """
     if eqn.params["dimensions"] is not None:
diff --git a/src/jace/translator/primitive_translators/select_n_translator.py b/src/jace/translator/primitive_translators/select_n_translator.py
index 0b9a0d1..aa96922 100644
--- a/src/jace/translator/primitive_translators/select_n_translator.py
+++ b/src/jace/translator/primitive_translators/select_n_translator.py
@@ -48,7 +48,7 @@ def write_tasklet_code(
         in_var_names: Sequence[str | None],
         eqn: jax_core.JaxprEqn,
     ) -> str:
-        if len(in_var_names) == 3:  # noqa: PLR2004  # Ternary conditional expression.
+        if len(in_var_names) == 3:  # noqa: PLR2004 [magic-value-comparison]  # Ternary conditional expression.
             # The order is correct, since `False` is interpreted as `0`,
             #  which means "the first case".
             return "__out = __in1 if __cond else __in0"

From 3ee8dad963fb1f45a26622ffc9e896c505ef164d Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 24 Sep 2024 14:37:42 +0200
Subject: [PATCH 448/458] Made it run again.

---
 src/jace/translator/jaxpr_translator_builder.py               | 3 +--
 .../primitive_translators/broadcast_in_dim_translator.py      | 2 +-
 src/jace/translator/primitive_translators/conditions.py       | 4 ++--
 .../translator/primitive_translators/gather_translator.py     | 3 ---
 4 files changed, 4 insertions(+), 8 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index c82c277..288593f 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -598,10 +598,9 @@ def _translate_single_eqn(self, eqn: jax_core.JaxprEqn) -> None:
             prev_terminal_state,
             new_sdfg_term_state,
         )
-        self._ctx.validate()
-
         # Modify terminal root state of 'self'
         self._ctx.terminal_state = new_sdfg_term_state
+        self._ctx.validate()
 
     def _translate_jaxpr_internal(self, jaxpr: jax_core.ClosedJaxpr) -> TranslationContext:
         """
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
index 964a2f6..d8bd388 100644
--- a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -56,7 +56,7 @@ def make_input_memlets(
         subset_str = (
             ", ".join(tskl_ranges[bdim][0] for bdim in eqn.params["broadcast_dimensions"])
             if eqn.params["broadcast_dimensions"]
-            else "0",
+            else "0"
         )
         return {"__in0": dace.Memlet.simple(in_var_names[0], subset_str)}
 
diff --git a/src/jace/translator/primitive_translators/conditions.py b/src/jace/translator/primitive_translators/conditions.py
index 6e37a7a..945baf1 100644
--- a/src/jace/translator/primitive_translators/conditions.py
+++ b/src/jace/translator/primitive_translators/conditions.py
@@ -79,7 +79,7 @@ def condition_translator(
     # Make sure that the selection variable is a DaCe symbol.
     if in_var_names[0] is None:
         literal_selection_value = str(util.get_jax_literal_value(eqn.invars[0]))
-        selection_symbol = f"max({len(branches)}, min(0, {literal_selection_value}))"
+        selection_symbol = f"min({len(branches)}, max(0, {literal_selection_value}))"
         selection_state = eqn_state
     else:
         selection_variable_name = in_var_names[0]
@@ -87,7 +87,7 @@ def condition_translator(
         selection_state = builder.append_new_state(
             label=f"{name_pattern}_fork",
             assignments={
-                selection_symbol: f"max({len(branches)}, min(0, {selection_variable_name}[0]))"
+                selection_symbol: f"min({len(branches)}, max(0, {selection_variable_name}))"
             },
             prev_state=eqn_state,
         )
diff --git a/src/jace/translator/primitive_translators/gather_translator.py b/src/jace/translator/primitive_translators/gather_translator.py
index daacb56..4f459d9 100644
--- a/src/jace/translator/primitive_translators/gather_translator.py
+++ b/src/jace/translator/primitive_translators/gather_translator.py
@@ -123,14 +123,12 @@ def gather_translator(  # noqa: PLR0914 [too-many-locals]  # Can not reduce any
             inside_window_map_ranges.append((f"__i{dim}", f"0:{slice_size}"))
             src_access_pattern.append(inside_window_map_ranges[-1][0])
             assert dim in not_collapsed_slice_dims
-            assert dim not in batch_dims
 
         elif dim in collapsed_slice_dims:
             # This dimension is only partially copied, but because it is collapsed,
             #  only a single element is copied. Thus the offset is only given by the
             #  what we read from the index array.
             src_access_pattern.append(f"__gather_{dim}")
-            assert dim in batch_dims
 
         else:
             # This dimension is partially copied, but _not colapsed_. This the element
@@ -138,7 +136,6 @@ def gather_translator(  # noqa: PLR0914 [too-many-locals]  # Can not reduce any
             #  current position within the slicing window.
             inside_window_map_ranges.append((f"__i{dim}", f"0:{slice_size}"))
             src_access_pattern.append(f"__gather_{dim} + {inside_window_map_ranges[-1][0]}")
-            assert dim in batch_dims
             assert dim in not_collapsed_slice_dims
 
     # These are the map variables that are associated to the first implicit loop (the

From e787ee98a05a708a6fc6b3e7374b23197951639b Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 24 Sep 2024 14:41:39 +0200
Subject: [PATCH 449/458] Fixed an error in the tests.

---
 tests/integration_tests/test_primitive_translator_managing.py | 2 --
 1 file changed, 2 deletions(-)

diff --git a/tests/integration_tests/test_primitive_translator_managing.py b/tests/integration_tests/test_primitive_translator_managing.py
index a52ab01..b7cf3d9 100644
--- a/tests/integration_tests/test_primitive_translator_managing.py
+++ b/tests/integration_tests/test_primitive_translator_managing.py
@@ -70,8 +70,6 @@ def fake_add_translator(*args: Any, **kwargs: Any) -> None:  # noqa: ARG001 [unu
 
 
 def test_has_pjit():
-    print(f"ADDRESS: {translator.get_registered_primitive_translators()['pjit']}")
-    print(f"FUN ADDRESS: {translator.primitive_translators.pjit_translator.PJITTranslator}")
     assert "pjit" in translator.get_registered_primitive_translators()
 
 
From 846a34512c1ba674c040c41ce28cf5a349703dec Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Tue, 24 Sep 2024 14:37:42 +0200
Subject: [PATCH 450/458] Fixed some errors.

---
 src/jace/translator/jaxpr_translator_builder.py               | 3 +--
 .../primitive_translators/broadcast_in_dim_translator.py      | 2 +-
 src/jace/translator/primitive_translators/conditions.py       | 4 ++--
 .../translator/primitive_translators/gather_translator.py     | 3 ---
 4 files changed, 4 insertions(+), 8 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index c82c277..288593f 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -598,10 +598,9 @@ def _translate_single_eqn(self, eqn: jax_core.JaxprEqn) -> None:
             prev_terminal_state,
             new_sdfg_term_state,
         )
-        self._ctx.validate()
-
         # Modify terminal root state of 'self'
         self._ctx.terminal_state = new_sdfg_term_state
+        self._ctx.validate()
 
     def _translate_jaxpr_internal(self, jaxpr: jax_core.ClosedJaxpr) -> TranslationContext:
         """
diff --git a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
index 964a2f6..d8bd388 100644
--- a/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
+++ b/src/jace/translator/primitive_translators/broadcast_in_dim_translator.py
@@ -56,7 +56,7 @@ def make_input_memlets(
         subset_str = (
             ", ".join(tskl_ranges[bdim][0] for bdim in eqn.params["broadcast_dimensions"])
             if eqn.params["broadcast_dimensions"]
-            else "0",
+            else "0"
         )
         return {"__in0": dace.Memlet.simple(in_var_names[0], subset_str)}
 
diff --git a/src/jace/translator/primitive_translators/conditions.py b/src/jace/translator/primitive_translators/conditions.py
index 6e37a7a..945baf1 100644
--- a/src/jace/translator/primitive_translators/conditions.py
+++ b/src/jace/translator/primitive_translators/conditions.py
@@ -79,7 +79,7 @@ def condition_translator(
     # Make sure that the selection variable is a DaCe symbol.
     if in_var_names[0] is None:
         literal_selection_value = str(util.get_jax_literal_value(eqn.invars[0]))
-        selection_symbol = f"max({len(branches)}, min(0, {literal_selection_value}))"
+        selection_symbol = f"min({len(branches)}, max(0, {literal_selection_value}))"
         selection_state = eqn_state
     else:
         selection_variable_name = in_var_names[0]
@@ -87,7 +87,7 @@ def condition_translator(
         selection_state = builder.append_new_state(
             label=f"{name_pattern}_fork",
             assignments={
-                selection_symbol: f"max({len(branches)}, min(0, {selection_variable_name}[0]))"
+                selection_symbol: f"min({len(branches)}, max(0, {selection_variable_name}))"
             },
             prev_state=eqn_state,
         )
diff --git a/src/jace/translator/primitive_translators/gather_translator.py b/src/jace/translator/primitive_translators/gather_translator.py
index daacb56..4f459d9 100644
--- a/src/jace/translator/primitive_translators/gather_translator.py
+++ b/src/jace/translator/primitive_translators/gather_translator.py
@@ -123,14 +123,12 @@ def gather_translator(  # noqa: PLR0914 [too-many-locals]  # Can not reduce any
             inside_window_map_ranges.append((f"__i{dim}", f"0:{slice_size}"))
             src_access_pattern.append(inside_window_map_ranges[-1][0])
             assert dim in not_collapsed_slice_dims
-            assert dim not in batch_dims
 
         elif dim in collapsed_slice_dims:
             # This dimension is only partially copied, but because it is collapsed,
             #  only a single element is copied. Thus the offset is only given by the
             #  what we read from the index array.
             src_access_pattern.append(f"__gather_{dim}")
-            assert dim in batch_dims
 
         else:
             # This dimension is partially copied, but _not colapsed_. This the element
@@ -138,7 +136,6 @@ def gather_translator(  # noqa: PLR0914 [too-many-locals]  # Can not reduce any
             #  current position within the slicing window.
             inside_window_map_ranges.append((f"__i{dim}", f"0:{slice_size}"))
             src_access_pattern.append(f"__gather_{dim} + {inside_window_map_ranges[-1][0]}")
-            assert dim in batch_dims
             assert dim in not_collapsed_slice_dims
 
     # These are the map variables that are associated to the first implicit loop (the

From 090c3a2488297f6bd5f78aa36a7bd61e4fa54fcd Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 25 Sep 2024 14:17:26 +0200
Subject: [PATCH 451/458] Updated the `make_array()` function.

Before the `order` argument was a `Literal` but this caused more truble now it is a string.
---
 .../primitive_translators/test_primitive_reshape.py         | 3 +--
 tests/util.py                                               | 6 +++---
 2 files changed, 4 insertions(+), 5 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_reshape.py b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
index bd1d6ab..4a504c5 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_reshape.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_reshape.py
@@ -25,8 +25,7 @@ def _test_impl_reshaping(
     src_shape: Sequence[int], dst_shape: Sequence[int], order: str = "C"
 ) -> None:
     """Performs a reshaping from `src_shape` to `dst_shape`."""
-    a = testutil.make_array(src_shape)
-    a = np.array(a, order=order)  # type: ignore[call-overload]  # MyPy wants a literal as order.
+    a = testutil.make_array(src_shape, order=order)
 
     def testee(a: np.ndarray) -> jax.Array:
         return jnp.reshape(a, dst_shape)
diff --git a/tests/util.py b/tests/util.py
index 1fa2e07..3b38bfe 100644
--- a/tests/util.py
+++ b/tests/util.py
@@ -10,7 +10,7 @@
 from __future__ import annotations
 
 from collections.abc import Mapping, Sequence
-from typing import Any, Literal
+from typing import Any
 
 import numpy as np
 
@@ -23,7 +23,7 @@
 def make_array(
     shape: Sequence[int] | int,
     dtype: type = np.float64,
-    order: Literal[None, "K", "A", "C", "F"] = "C",
+    order: str = "C",
     low: Any = None,
     high: Any = None,
 ) -> np.ndarray:
@@ -69,7 +69,7 @@ def make_array(
             res = low + (high - low) * res
         assert (low is None) == (high is None)
 
-    return np.array(res, order=order, dtype=dtype)
+    return np.array(res, order=order, dtype=dtype)  # type: ignore[call-overload]  # Because we use `str` as `order`.
 
 
 def set_active_primitive_translators_to(

From e66785435887bca284c585f09d862941915fd7f0 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 25 Sep 2024 15:12:09 +0200
Subject: [PATCH 452/458] Disabled the simplify pass again in the tests.

I enabled the simplify pass in commit `411bd7bd` and it worked locally.
However, this was because I was not running it inside nox and using my own version of DaCe.
The bug in simplify was fixed in [PR#1603](https://github.com/spcl/dace/pull/1603) which was merged _after_ 16.1 was released, thus the fix is not avaliable.
---
 tests/integration_tests/primitive_translators/conftest.py | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/tests/integration_tests/primitive_translators/conftest.py b/tests/integration_tests/primitive_translators/conftest.py
index b914da2..6f81b09 100644
--- a/tests/integration_tests/primitive_translators/conftest.py
+++ b/tests/integration_tests/primitive_translators/conftest.py
@@ -20,7 +20,12 @@
     autouse=True,
     params=[
         optimization.NO_OPTIMIZATIONS,
-        optimization.DEFAULT_OPTIMIZATIONS,
+        pytest.param(
+            optimization.DEFAULT_OPTIMIZATIONS,
+            marks=pytest.mark.skip(
+                "Simplify bug 'https://github.com/spcl/dace/issues/1595'; resolved > 16.1"
+            ),
+        ),
     ],
 )
 def _set_compile_options(request) -> Generator[None, None, None]:

From 6fe78b07446fda85889c593bea98b296c7f70ad7 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 25 Sep 2024 15:44:14 +0200
Subject: [PATCH 453/458] Fixed an error in the tests.

It seems JAX has updated the `make_jaxpr()` function and now that thing caches itself.
This is now accounted for.
---
 tests/unit_tests/test_caching.py | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/tests/unit_tests/test_caching.py b/tests/unit_tests/test_caching.py
index 60be130..85e5b3b 100644
--- a/tests/unit_tests/test_caching.py
+++ b/tests/unit_tests/test_caching.py
@@ -402,9 +402,15 @@ def wrapped(a: np.ndarray) -> np.ndarray:
     res_f = lower_f.compile()(array_f)
 
     assert res_c is not res_f
-    assert np.allclose(res_f, res_c)
     assert lower_f is not lower_c
-    assert lower_cnt[0] == 2
+    assert np.allclose(res_f, res_c)
+
+    # In previous versions JAX did not cached the result of the tracing,
+    #  but in newer version the tracing itself is also cached
+    if lower_c._jaxpr is lower_f._jaxpr:
+        assert lower_cnt[0] == 1
+    else:
+        assert lower_cnt[0] == 2
 
 
 def test_caching_jax_numpy_array() -> None:

From d88752aa210961e8801e18f9e5157abb7170d9c7 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Wed, 25 Sep 2024 16:16:13 +0200
Subject: [PATCH 454/458] The test was not really testing anything, okay if it
 was working.

But the new function really tests if the loweing works, if teh strides are honored and infered.
---
 .../test_jaxpr_translator_builder.py          | 28 +++++++++++--------
 1 file changed, 17 insertions(+), 11 deletions(-)

diff --git a/tests/integration_tests/test_jaxpr_translator_builder.py b/tests/integration_tests/test_jaxpr_translator_builder.py
index df708dc..40b4fff 100644
--- a/tests/integration_tests/test_jaxpr_translator_builder.py
+++ b/tests/integration_tests/test_jaxpr_translator_builder.py
@@ -634,23 +634,29 @@ def test_builder_jace_var() -> None:
             _ = JaCeVar((), dace.int8, name=iname)
 
 
-def test_builder_FORTRAN_strides() -> None:  # noqa: N802 [invalid-function-name]
-    """Tests if we can lower without a standard stride.
+def test_builder_strides_lowering() -> None:
+    """Tests if we can lower without standard strides."""
 
-    Notes:
-        This tests if the restriction is currently in place.
-        See also `tests/test_caching.py::test_caching_strides`.
-    """
-
-    def testee(a: np.ndarray) -> np.ndarray:
-        return a + 10.0
+    def testee(a: np.ndarray, b: np.ndarray) -> np.ndarray:
+        return a + b
 
     a = testutil.make_array((4, 3), order="F")
-    ref = testee(a)
-    res = jace.jit(testee)(a)
+    b = testutil.make_array((4, 3), order="C")
+    ref = testee(a, b)
+    a_ref_strides = (1, 4)
+    b_ref_strides = (3, 1)
+
+    lowered = jace.jit(testee).lower(a, b)
+    a_res_strides = lowered.as_sdfg().arrays["__jace_input_0"].strides
+    b_res_strides = lowered.as_sdfg().arrays["__jace_input_1"].strides
+
+    compiled = lowered.compile()
+    res = compiled(a, b)
 
     assert ref.shape == res.shape
     assert np.allclose(ref, res)
+    assert a_ref_strides == a_res_strides
+    assert b_ref_strides == b_res_strides
 
 
 def test_builder_drop_variables() -> None:

From 2c7b3c8819daaf74bc721c43a2fe08e2ac51b5ec Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 26 Sep 2024 15:35:16 +0200
Subject: [PATCH 455/458] Applied Enriques primarly fixes.

---
 .../translator/jaxpr_translator_builder.py    | 21 +---------
 .../arithmetic_logical_translators.py         | 40 ++++++++++++-------
 .../primitive_translators/conditions.py       |  2 +-
 .../primitive_translators/slicing.py          |  2 +-
 4 files changed, 30 insertions(+), 35 deletions(-)

diff --git a/src/jace/translator/jaxpr_translator_builder.py b/src/jace/translator/jaxpr_translator_builder.py
index 288593f..3e48964 100644
--- a/src/jace/translator/jaxpr_translator_builder.py
+++ b/src/jace/translator/jaxpr_translator_builder.py
@@ -179,24 +179,6 @@ def append_new_state(
             self._ctx.terminal_state = new_state
         return new_state
 
-    def add_orphan_state(
-        self,
-        label: str,
-    ) -> dace.SDFGState:
-        """
-        Add a new orphan state to the SDFG.
-
-        The state is not connected to any other state, nor it is the new start state.
-        Except you know what you are doing you should not use this function and
-        instead use `self.append_new_state()`.
-
-        Args:
-            label: The name of the state.
-        """
-        if not self.is_allocated():
-            raise RuntimeError("Builder is not allocated.")
-        return self._ctx.sdfg.add_state(label=label, is_start_block=False)
-
     @property
     def arrays(self) -> Mapping[str, dace_data.Data]:
         """
@@ -520,7 +502,8 @@ def _allocate_translation_ctx(
     @property
     def _ctx(self) -> TranslationContext:
         """Returns the currently active translation context."""
-        assert len(self._ctx_stack) != 0, "No context is active."
+        if not self.is_allocated():
+            raise RuntimeError("The context is not allocated.")
         return self._ctx_stack[-1]
 
     def _clear_translation_ctx(self) -> TranslationContext | None:
diff --git a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
index 7cf321f..28f9a3a 100644
--- a/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
+++ b/src/jace/translator/primitive_translators/arithmetic_logical_translators.py
@@ -79,8 +79,8 @@ class LogicalOperationTranslator(mapped_base.MappedOperationTranslatorBase):
 
     Args:
         prim_name: The name of the primitive that should be handled.
-        int_tmpl: The template used for the integer case.
-        bool_tmpl: The template used for the bool case.
+        bitwise_tmpl: The template used for the bitwise case.
+        logical_tmpl: The template used for the logical case.
 
     Note:
         Since it does not make sense to single out `not` and keep the other
@@ -88,10 +88,10 @@ class LogicalOperationTranslator(mapped_base.MappedOperationTranslatorBase):
         handled by this class.
     """
 
-    def __init__(self, prim_name: str, int_tmpl: str, bool_tmpl: str) -> None:
+    def __init__(self, prim_name: str, bitwise_tmpl: str, logical_tmpl: str) -> None:
         super().__init__(primitive_name=prim_name)
-        self._int_tmpl = int_tmpl
-        self._bool_tmpl = bool_tmpl
+        self._bitwise_tmpl = bitwise_tmpl
+        self._logical_tmpl = logical_tmpl
 
     @override
     def write_tasklet_code(
@@ -101,8 +101,8 @@ def write_tasklet_code(
         eqn: jax_core.JaxprEqn,
     ) -> str:
         if all(util.get_jax_var_dtype(invar) is dace.bool_ for invar in eqn.invars):
-            return self._bool_tmpl
-        return self._int_tmpl
+            return self._logical_tmpl
+        return self._bitwise_tmpl
 
 
 # Maps the name of an arithmetic JAX primitive to the code template that is used to
@@ -176,11 +176,23 @@ def write_tasklet_code(
 # Maps the name of a logical primitive to the two code templates, first the integer
 #  case and second the boolean case, that are used to create the body of the mapped
 #  tasklet. They are used to instantiate the `LogicalOperationTranslator` translators.
-_LOGICAL_OPERATION_TEMPLATES: Final[dict[str, tuple[str, str]]] = {
-    "or": ("__out = (__in0) | (__in1)",  "__out = (__in0) or (__in1)"),
-    "not": ("__out = ~(__in0)", "__out = not (__in0)"),
-    "and": ("__out = (__in0) & (__in1)", "__out = (__in0) and (__in1)"),
-    "xor": ("__out = (__in0) ^ (__in1)", "__out = (__in0) != (__in1)"),
+_LOGICAL_OPERATION_TEMPLATES: Final[dict[str, dict[str, str]]] = {
+    "or": {
+        "bitwise_tmpl": "__out = (__in0) | (__in1)",
+        "logical_tmpl": "__out = (__in0) or (__in1)",
+    },
+    "not": {
+        "bitwise_tmpl": "__out = ~(__in0)",
+        "logical_tmpl": "__out = not (__in0)",
+    },
+    "and": {
+        "bitwise_tmpl": "__out = (__in0) & (__in1)",
+        "logical_tmpl": "__out = (__in0) and (__in1)",
+    },
+    "xor": {
+        "bitwise_tmpl": "__out = (__in0) ^ (__in1)",
+        "logical_tmpl": "__out = (__in0) != (__in1)",
+    },
 }
 # fmt: on
 
@@ -188,5 +200,5 @@ def write_tasklet_code(
 # Instantiate the arithmetic and logical translators from the templates.
 for pname, ptmpl in _ARITMETIC_OPERATION_TEMPLATES.items():
     translator.register_primitive_translator(ArithmeticOperationTranslator(pname, ptmpl))
-for pname, (itmpl, btmpl) in _LOGICAL_OPERATION_TEMPLATES.items():
-    translator.register_primitive_translator(LogicalOperationTranslator(pname, itmpl, btmpl))
+for pname, ptmpl in _LOGICAL_OPERATION_TEMPLATES.items():  # type: ignore[assignment]  # Type confusion
+    translator.register_primitive_translator(LogicalOperationTranslator(pname, **ptmpl))  # type: ignore[arg-type]  # Type confusion
diff --git a/src/jace/translator/primitive_translators/conditions.py b/src/jace/translator/primitive_translators/conditions.py
index 945baf1..e13920b 100644
--- a/src/jace/translator/primitive_translators/conditions.py
+++ b/src/jace/translator/primitive_translators/conditions.py
@@ -116,7 +116,7 @@ def condition_translator(
         branch_states.append(branch_state)
 
     # Connect all branch states to the join state
-    join_state = builder.add_orphan_state(f"{name_pattern}__join_state")
+    join_state = builder._ctx.sdfg.add_state(label=f"{name_pattern}__join_state")
     for branch_state in branch_states:
         builder.sdfg.add_edge(
             branch_state,
diff --git a/src/jace/translator/primitive_translators/slicing.py b/src/jace/translator/primitive_translators/slicing.py
index c53c3d0..6d9ae26 100644
--- a/src/jace/translator/primitive_translators/slicing.py
+++ b/src/jace/translator/primitive_translators/slicing.py
@@ -57,7 +57,7 @@ def make_input_memlets(
         eqn: jax_core.JaxprEqn,
     ) -> dict[str, dace.Memlet]:
         strides: Sequence[int] = (
-            ((1,) * len(tskl_ranges)) if eqn.params["strides"] is None else eqn.params["strides"]
+            eqn.params["strides"] if eqn.params["strides"] else ((1,) * len(tskl_ranges))
         )
         start_indices: Sequence[int] = eqn.params["start_indices"]  # Fist index to slice
         return {

From cc10a483d4a9542d608ea86222d35bcc52a8e318 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Thu, 26 Sep 2024 16:22:59 +0200
Subject: [PATCH 456/458] Splited a test into multiple one, for better
 pinpointing.

---
 .../test_primitive_select_n.py                | 34 ++++++++++++-------
 1 file changed, 22 insertions(+), 12 deletions(-)

diff --git a/tests/integration_tests/primitive_translators/test_primitive_select_n.py b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
index a87088f..a0cab1f 100644
--- a/tests/integration_tests/primitive_translators/test_primitive_select_n.py
+++ b/tests/integration_tests/primitive_translators/test_primitive_select_n.py
@@ -14,6 +14,7 @@
 
 import jax
 import numpy as np
+import pytest
 from jax import numpy as jnp
 
 import jace
@@ -21,6 +22,12 @@
 from tests import util as testutil
 
 
+@pytest.fixture(params=[True, False])
+def pred(request) -> np.bool_:
+    """Predicate used in the `test_mapped_unary_scalar_literal_*` tests."""
+    return np.bool_(request.param)
+
+
 def _perform_test(testee: Callable, *args: Any) -> None:
     res = testee(*args)
     ref = jace.jit(testee)(*args)
@@ -38,24 +45,27 @@ def testee(pred: np.ndarray, tbranch: np.ndarray, fbranch: np.ndarray) -> jax.Ar
     _perform_test(testee, pred, tbranch, fbranch)
 
 
-def test_select_n_where_literal() -> None:
-    def testee1(pred: np.ndarray, fbranch: np.ndarray) -> jax.Array:
+def test_select_n_where_literal_1(pred) -> None:
+    def testee(pred: np.ndarray, fbranch: np.ndarray) -> jax.Array:
         return jnp.where(pred, 2, fbranch)
 
-    def testee2(pred: np.ndarray, tbranch: np.ndarray) -> jax.Array:
+    fbranch = 1
+    _perform_test(testee, pred, fbranch)
+
+
+def test_select_n_where_literal_2(pred) -> None:
+    def testee(pred: np.ndarray, tbranch: np.ndarray) -> jax.Array:
         return jnp.where(pred, tbranch, 3)
 
-    def testee3(pred: np.ndarray) -> jax.Array:
-        return jnp.where(pred, 8, 9)
+    tbranch = 2
+    _perform_test(testee, pred, tbranch)
 
-    shape = ()
-    pred = testutil.make_array(shape, np.bool_)
-    tbranch = testutil.make_array(shape, np.int_)
-    fbranch = tbranch + 1
 
-    _perform_test(testee1, pred, fbranch)
-    _perform_test(testee2, pred, tbranch)
-    _perform_test(testee3, pred)
+def test_select_n_where_literal_3(pred) -> None:
+    def testee(pred: np.ndarray) -> jax.Array:
+        return jnp.where(pred, 8, 9)
+
+    _perform_test(testee, pred)
 
 
 def test_select_n_many_inputs() -> None:

From 18bdee9326ba2307100d08badb45f9f7fdd12442 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Philip=20M=C3=BCller?=
 <147368808+philip-paul-mueller@users.noreply.github.com>
Date: Thu, 26 Sep 2024 16:27:38 +0200
Subject: [PATCH 457/458] Apply suggestions from code review
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Co-authored-by: Enrique González Paredes <enriqueg@cscs.ch>
---
 .../primitive_translators/convert_element_type_translator.py  | 2 +-
 .../translator/primitive_translators/gather_translator.py     | 2 +-
 src/jace/translator/primitive_translators/pjit_translator.py  | 4 +---
 3 files changed, 3 insertions(+), 5 deletions(-)

diff --git a/src/jace/translator/primitive_translators/convert_element_type_translator.py b/src/jace/translator/primitive_translators/convert_element_type_translator.py
index a9f179c..e1fb8e5 100644
--- a/src/jace/translator/primitive_translators/convert_element_type_translator.py
+++ b/src/jace/translator/primitive_translators/convert_element_type_translator.py
@@ -32,7 +32,7 @@ class ConvertElementTypeTranslator(mapped_base.MappedOperationTranslatorBase):
     will perform the type conversion operation.
 
     Note:
-        The type to cast to id inferred from the output variable and the `new_dtype`
+        The type to cast to is inferred from the output variable and the `new_dtype`
         parameter of the equation is ignored.
     """
 
diff --git a/src/jace/translator/primitive_translators/gather_translator.py b/src/jace/translator/primitive_translators/gather_translator.py
index 4f459d9..51f5730 100644
--- a/src/jace/translator/primitive_translators/gather_translator.py
+++ b/src/jace/translator/primitive_translators/gather_translator.py
@@ -63,7 +63,7 @@ def gather_translator(  # noqa: PLR0914 [too-many-locals]  # Can not reduce any
     if eqn.params["mode"] != jax_lax.GatherScatterMode.PROMISE_IN_BOUNDS:
         raise NotImplementedError(f"The mode {eqn.params['mode']} is not implemented.")
 
-    # This is the size of the slice window that is copied. Its length equal the rank
+    # This is the size of the slice window that is copied. Its length is the rank
     #  of the source array, dimensions that are excluded from copying are listed
     #  in `collapsed_slice_dims`.
     slice_sizes: Sequence[int] = eqn.params["slice_sizes"]
diff --git a/src/jace/translator/primitive_translators/pjit_translator.py b/src/jace/translator/primitive_translators/pjit_translator.py
index 43bc3ea..95cb3d4 100644
--- a/src/jace/translator/primitive_translators/pjit_translator.py
+++ b/src/jace/translator/primitive_translators/pjit_translator.py
@@ -57,9 +57,7 @@ def pjit_translator(
     nested_jaxpr: jax_core.ClosedJaxpr = eqn.params["jaxpr"]
     in_shardings = eqn.params["in_shardings"]
     out_shardings = eqn.params["out_shardings"]
-    _ = eqn.params["donated_invars"]  # Always ignored
-    _ = eqn.params["keep_unused"]
-    _ = eqn.params["inline"]
+    # "donated_invars", "keep_unused", "inline" parameters are just ignored
 
     if not all(in_sharding is jax_sharding.UNSPECIFIED for in_sharding in in_shardings):
         raise NotImplementedError("Currently 'pjit' does not support sharding in its input.")

From 2169470cf600bd68a7632e75711befe6a9cb9754 Mon Sep 17 00:00:00 2001
From: Philip Mueller <philip.mueller@cscs.ch>
Date: Fri, 27 Sep 2024 11:12:47 +0200
Subject: [PATCH 458/458] The import error that panda is not found is now
 ignored.

---
 pyproject.toml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/pyproject.toml b/pyproject.toml
index fabd4a3..a03a349 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -113,6 +113,7 @@ addopts = ["-ra", "--showlocals", "--strict-markers", "--strict-config"]
 filterwarnings = [
   "error",
   "ignore:numpy\\..*:DeprecationWarning",  # DaCe is not NumPy v2.0 ready so ignore the usage of deprecated features.
+  "ignore:pandas not found, skipping conversion test\\.:ImportWarning",  # Pandas is not installed on the CI.
 ]
 log_cli_level = "INFO"
 minversion = "6.0"