7.1.6. Example: Explicitly Transferring Data Between Host And Device
A sample program, based on Example: Inference With A Model, that uses the API for explicitly transferring data between the host and the device.
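The steps specific to explicit transfer are allocating device-side proxies for the inputs, loading host tensors into them, and loading each registered parameter into its proxy. The core of that flow, excerpted from the full sample program below, looks like this:

input_proxies = compiled_infer.allocate_input_proxy()        # device-side input buffers
input_proxies["x"].load_from(torch.ones(4, 4), clone=False)  # host -> device copy

for p in model.parameters():
    # Each parameter registered with the context has a device-side proxy.
    context.get_registered_value_proxy(p).load_from(p)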
How to run
$ cd /opt/pfn/pfcomp/codegen/examples/
$ ./exec_with_env.sh python3 explicit_data_transfer_api.py
Expected output
The inference result from the randomly initialized model (it should match the result from infer.py). All four rows are identical because every row of the torch.ones(4, 4) input loaded into the input proxy is the same:
tensor([[-0.3188, 0.6279, -0.5000, -1.2148],
[-0.3188, 0.6279, -0.5000, -1.2148],
[-0.3188, 0.6279, -0.5000, -1.2148],
[-0.3188, 0.6279, -0.5000, -1.2148]])
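Because the sample loads torch.ones(4, 4) into the input proxy, the expected numbers can be reproduced on the host with plain PyTorch (a sketch; the exact values depend on the PyTorch version's RNG and initializer):

import torch

# Same seed and model construction as the sample program below,
# evaluated on the CPU with the same all-ones input.
torch.manual_seed(0)
model = torch.nn.Linear(4, 4)
model.eval()
with torch.no_grad():
    print(model(torch.ones(4, 4)))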
Related links
Sample program
import torch
from mlsdk import Context, MNDevice, set_tensor_name_in_module, storage

torch.manual_seed(0)


def run_explicit_data_transfer():
    # Create a device handle and make its context the current one.
    device = MNDevice("mncore2:auto")
    context = Context(device)
    Context.switch_context(context)

    # Build the model and register its parameters and buffers with the
    # context so that device-side proxies can be obtained for them later.
    model = torch.nn.Linear(4, 4)
    model.eval()
    set_tensor_name_in_module(model, "model")
    for p in model.parameters():
        context.register_param(p)
    for b in model.buffers():
        context.register_buffer(b)

    def infer(input: dict[str, torch.Tensor]) -> dict[str, torch.Tensor]:
        x = input["x"]
        y = model(x)
        return {"out": y}

    # A sample input that fixes the shapes and dtypes for compilation.
    sample = {"x": torch.randn(4, 4)}

    compiled_infer = context.compile(
        infer,
        sample,
        storage.path("/tmp/proxy_transfer"),
    )

    # Explicitly allocate device-side proxies for the inputs and copy
    # the actual input tensor from the host into them.
    input_proxies_allocated = compiled_infer.allocate_input_proxy()
    input_proxies_allocated["x"].load_from(torch.ones(4, 4), clone=False)

    # Explicitly transfer the registered parameters to the device
    # through their proxies.
    for model_param in model.parameters():
        model_param_proxy = context.get_registered_value_proxy(model_param)
        model_param_proxy.load_from(model_param)

    # Run the compiled function on the device and copy the result back
    # to the host.
    result = compiled_infer(input_proxies_allocated)
    result_on_cpu = result["out"].cpu()
    print(result_on_cpu)


if __name__ == "__main__":
    run_explicit_data_transfer()
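A natural follow-up, not shown in the sample (and an assumption about the API, since this page does not confirm that proxies are reusable): load fresh host data into the already allocated proxies and invoke the compiled function again, skipping re-allocation.

# Hypothetical reuse of the allocated proxies (assumption: a proxy may be
# loaded into and executed more than once).
input_proxies_allocated["x"].load_from(torch.full((4, 4), 2.0))
result = compiled_infer(input_proxies_allocated)
print(result["out"].cpu())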