Skip to content

[mlir] Python: write bytecode to a file path #127118

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
merged 7 commits into from
Feb 25, 2025
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
15 changes: 9 additions & 6 deletions mlir/lib/Bindings/Python/IRCore.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -6,22 +6,25 @@
//
//===----------------------------------------------------------------------===//

#include <optional>
#include <utility>

#include "Globals.h"
#include "IRModule.h"
#include "NanobindUtils.h"
#include "mlir-c/Bindings/Python/Interop.h" // This is expected after nanobind.
#include "mlir-c/BuiltinAttributes.h"
#include "mlir-c/Debug.h"
#include "mlir-c/Diagnostics.h"
#include "mlir-c/IR.h"
#include "mlir-c/Support.h"
#include "mlir/Bindings/Python/Nanobind.h"
#include "mlir/Bindings/Python/NanobindAdaptors.h"
#include "mlir-c/Bindings/Python/Interop.h" // This is expected after nanobind.
#include "nanobind/nanobind.h"
#include "llvm/ADT/ArrayRef.h"
#include "llvm/ADT/SmallVector.h"
#include "llvm/Support/raw_ostream.h"

#include <optional>
#include <system_error>
#include <utility>

namespace nb = nanobind;
using namespace nb::literals;
Expand Down Expand Up @@ -1329,11 +1332,11 @@ void PyOperationBase::print(PyAsmState &state, nb::object fileObject,
accum.getUserData());
}

void PyOperationBase::writeBytecode(const nb::object &fileObject,
void PyOperationBase::writeBytecode(const nb::object &fileOrStringObject,
std::optional<int64_t> bytecodeVersion) {
PyOperation &operation = getOperation();
operation.checkValid();
PyFileAccumulator accum(fileObject, /*binary=*/true);
PyFileAccumulator accum(fileOrStringObject, /*binary=*/true);

if (!bytecodeVersion.has_value())
return mlirOperationWriteBytecode(operation, accum.getCallback(),
Expand Down
49 changes: 40 additions & 9 deletions mlir/lib/Bindings/Python/NanobindUtils.h
Original file line number Diff line number Diff line change
Expand Up @@ -13,8 +13,13 @@
#include "mlir-c/Support.h"
#include "mlir/Bindings/Python/Nanobind.h"
#include "llvm/ADT/STLExtras.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/ADT/Twine.h"
#include "llvm/Support/DataTypes.h"
#include "llvm/Support/raw_ostream.h"

#include <string>
#include <variant>

template <>
struct std::iterator_traits<nanobind::detail::fast_iterator> {
Expand Down Expand Up @@ -128,33 +133,59 @@ struct PyPrintAccumulator {
}
};

/// Accumulates int a python file-like object, either writing text (default)
/// or binary.
/// Accumulates into a file, either writing text (default)
/// or binary. The file may be a Python file-like object or a path to a file.
class PyFileAccumulator {
public:
PyFileAccumulator(const nanobind::object &fileObject, bool binary)
: pyWriteFunction(fileObject.attr("write")), binary(binary) {}
PyFileAccumulator(const nanobind::object &fileOrStringObject, bool binary)
: binary(binary) {
std::string filePath;
if (nanobind::try_cast<std::string>(fileOrStringObject, filePath)) {
std::error_code ec;
writeTarget.emplace<llvm::raw_fd_ostream>(filePath, ec);
if (ec) {
throw nanobind::value_error(
(std::string("Unable to open file for writing: ") + ec.message())
.c_str());
}
} else {
writeTarget.emplace<nanobind::object>(fileOrStringObject.attr("write"));
}
}

MlirStringCallback getCallback() {
return writeTarget.index() == 0 ? getPyWriteCallback()
: getOstreamCallback();
}

void *getUserData() { return this; }

MlirStringCallback getCallback() {
private:
MlirStringCallback getPyWriteCallback() {
return [](MlirStringRef part, void *userData) {
nanobind::gil_scoped_acquire acquire;
PyFileAccumulator *accum = static_cast<PyFileAccumulator *>(userData);
if (accum->binary) {
// Note: The data still has to be copied; this is not avoidable with this API.
nanobind::bytes pyBytes(part.data, part.length);
accum->pyWriteFunction(pyBytes);
std::get<nanobind::object>(accum->writeTarget)(pyBytes);
} else {
nanobind::str pyStr(part.data,
part.length); // Decodes as UTF-8 by default.
accum->pyWriteFunction(pyStr);
std::get<nanobind::object>(accum->writeTarget)(pyStr);
}
};
}

private:
nanobind::object pyWriteFunction;
MlirStringCallback getOstreamCallback() {
return [](MlirStringRef part, void *userData) {
PyFileAccumulator *accum = static_cast<PyFileAccumulator *>(userData);
std::get<llvm::raw_fd_ostream>(accum->writeTarget)
.write(part.data, part.length);
};
}

std::variant<nanobind::object, llvm::raw_fd_ostream> writeTarget;
bool binary;
};

Expand Down
6 changes: 3 additions & 3 deletions mlir/python/mlir/_mlir_libs/_mlir/ir.pyi
Original file line number Diff line number Diff line change
Expand Up @@ -47,7 +47,7 @@ import collections
from collections.abc import Callable, Sequence
import io
from pathlib import Path
from typing import Any, ClassVar, TypeVar, overload
from typing import Any, BinaryIO, ClassVar, TypeVar, overload

__all__ = [
"AffineAddExpr",
Expand Down Expand Up @@ -285,12 +285,12 @@ class _OperationBase:
"""
Verify the operation. Raises MLIRError if verification fails, and returns true otherwise.
"""
def write_bytecode(self, file: Any, desired_version: int | None = None) -> None:
def write_bytecode(self, file: BinaryIO | str, desired_version: int | None = None) -> None:
"""
Write the bytecode form of the operation to a file-like object or a file path.

Args:
file: The file like object to write to.
file: The file like object or path to write to.
desired_version: The version of bytecode to emit.
Returns:
The bytecode writer status.
Expand Down
7 changes: 7 additions & 0 deletions mlir/test/python/ir/operation.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,7 @@
import gc
import io
import itertools
from tempfile import NamedTemporaryFile
from mlir.ir import *
from mlir.dialects.builtin import ModuleOp
from mlir.dialects import arith
Expand Down Expand Up @@ -617,6 +618,12 @@ def testOperationPrint():
module.operation.write_bytecode(bytecode_stream, desired_version=1)
bytecode = bytecode_stream.getvalue()
assert bytecode.startswith(b"ML\xefR"), "Expected bytecode to start with MLïR"
with NamedTemporaryFile() as tmpfile:
module.operation.write_bytecode(str(tmpfile.name), desired_version=1)
tmpfile.seek(0)
assert tmpfile.read().startswith(
b"ML\xefR"
), "Expected bytecode to start with MLïR"
ctx2 = Context()
module_roundtrip = Module.parse(bytecode, ctx2)
f = io.StringIO()
Expand Down