core/maxframe/io/objects/tensor.py (50 lines of code) (raw):
# Copyright 1999-2025 Alibaba Group Holding Ltd.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import struct
from io import BytesIO
from typing import Any, Dict
import msgpack
import numpy as np
from ...lib import wrapped_pickle as pickle
from ...tensor.core import TensorData
from ...typing_ import SlicesType, TileableType
from ..odpsio import ODPSVolumeReader, ODPSVolumeWriter
from .core import AbstractObjectIOHandler, register_object_io_handler
@register_object_io_handler(TensorData)
class TensorIOHandler(AbstractObjectIOHandler):
    """Object IO handler registered for ``TensorData``.

    The whole value is stored in a single volume file named ``0,0.dat``
    with the following layout::

        <uint32 little-endian: header length>
        <msgpack header: [len(pickle bytes), len(buffer 0), len(buffer 1), ...]>
        <pickle bytes>
        <buffer 0> <buffer 1> ...

    The buffers are the out-of-band buffers collected through the
    ``buffer_callback`` argument of ``pickle.dumps``.
    """

    def write_object_meta(
        self,
        writer: ODPSVolumeWriter,
        tileable: TileableType,
        extra_meta: Dict[str, Any] = None,
    ):
        """Write object meta, forcing the ``nsplits`` entry to ``((nan,),)``.

        Parameters
        ----------
        writer
            Volume writer forwarded to the parent implementation.
        tileable
            Tileable forwarded to the parent implementation.
        extra_meta
            Optional additional meta entries. The mapping passed in is not
            modified; a copy with ``nsplits`` overridden is forwarded.
        """
        # fixme upload in real slices when tensors are supported in DPE
        # Work on a copy so that the caller's dict is never mutated.
        extra_meta = dict(extra_meta or ())
        # NOTE(review): presumably marks a single chunk of unknown size;
        # confirm against the consumer of this meta.
        extra_meta["nsplits"] = ((np.nan,),)
        super().write_object_meta(writer, tileable, extra_meta=extra_meta)

    def _read_object_body(
        self,
        reader: ODPSVolumeReader,
        tileable: TileableType,
        meta: Dict[str, Any],
        slices: SlicesType = None,
    ) -> Any:
        """Read ``0,0.dat`` and rebuild the stored object.

        ``tileable``, ``meta`` and ``slices`` are currently ignored: the
        whole object is always read from the single file.

        Returns
        -------
        Any
            The object produced by unpickling the stored payload together
            with its out-of-band buffers.
        """
        # fixme read data with slices when tensors are supported in DPE
        body = reader.read_file("0,0.dat")
        bio = BytesIO(body)
        # 4-byte little-endian unsigned length of the msgpack header
        (header_len,) = struct.unpack("<I", bio.read(4))
        # header is [pickle size, buffer 0 size, buffer 1 size, ...]
        header_data = msgpack.loads(bio.read(header_len))
        pickled = bio.read(header_data[0])
        bufs = [bio.read(size) for size in header_data[1:]]
        # NOTE(security): unpickling executes code embedded in the payload;
        # the volume content must come from a trusted writer.
        return pickle.loads(pickled, buffers=bufs)

    def _write_object_body(
        self, writer: ODPSVolumeWriter, tileable: TileableType, value: Any
    ):
        """Pickle ``value`` and write it into ``0,0.dat``.

        ``tileable`` is currently ignored: the whole value is always
        written as a single file.
        """
        # fixme upload in real slices when tensors are supported in DPE

        def data_gen():
            """Lazily yield the file content piece by piece."""
            bufs = []
            pickled = pickle.dumps(value, buffer_callback=bufs.append)
            # Take the flat byte view of every out-of-band buffer once, so
            # the sizes recorded in the header are measured on exactly the
            # objects that are written afterwards.
            raw_bufs = [buf.raw() for buf in bufs]
            header_data = msgpack.dumps(
                [len(pickled)] + [len(raw) for raw in raw_bufs]
            )
            yield struct.pack("<I", len(header_data))
            yield header_data
            yield pickled
            yield from raw_bufs

        writer.write_file("0,0.dat", data_gen())