File: device_op_overrides.py

package info (click to toggle)
pytorch-cuda 2.6.0%2Bdfsg-7
  • links: PTS, VCS
  • area: contrib
  • in suites: forky, sid, trixie
  • size: 161,620 kB
  • sloc: python: 1,278,832; cpp: 900,322; ansic: 82,710; asm: 7,754; java: 3,363; sh: 2,811; javascript: 2,443; makefile: 597; ruby: 195; xml: 84; objc: 68
file content (79 lines) | stat: -rw-r--r-- 2,154 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
# mypy: allow-untyped-defs
from ..common import DeviceOpOverrides, register_device_op_overrides


class XPUDeviceOpOverrides(DeviceOpOverrides):
    def import_get_raw_stream_as(self, name):
        return f"from torch._C import _xpu_getCurrentRawStream as {name}"

    def set_device(self, device_idx):
        return f"torch.xpu.set_device({device_idx})"

    def synchronize(self):
        return "torch.xpu.synchronize()"

    def device_guard(self, device_idx):
        return f"torch.xpu._DeviceGuard({device_idx})"

    def cpp_device_guard(self):
        return "at::DeviceGuard"

    def cpp_aoti_device_guard(self):
        return "AOTIXpuGuard"

    def cpp_stream_guard(self):
        return "at::xpu::XPUStreamGuard"

    def cpp_aoti_stream_guard(self):
        return "AOTIXpuStreamGuard"

    def cpp_getStreamFromExternal(self):
        return "at::xpu::getStreamFromExternal"

    def kernel_header(self):
        source_codes = """
        #include <torch/csrc/inductor/aoti_runtime/sycl_runtime_wrappers.h>
        """
        return source_codes

    def kernel_driver(self):
        source_codes = """
            namespace {

            struct Grid {
                Grid(uint32_t x, uint32_t y, uint32_t z)
                  : grid_x(x), grid_y(y), grid_z(z) {}
                uint32_t grid_x;
                uint32_t grid_y;
                uint32_t grid_z;

                bool is_non_zero() {
                    return grid_x > 0 && grid_y > 0 && grid_z > 0;
                }
            };

            }  // anonymous namespace

        """
        return source_codes

    def abi_compatible_header(self):
        return """
        #include <torch/csrc/inductor/aoti_runtime/utils_xpu.h>
        #include <torch/csrc/inductor/aoti_runtime/sycl_runtime_wrappers.h>
        """

    def cpp_stream_type(self):
        return "sycl::queue*"

    def aoti_get_stream(self):
        return "aoti_torch_get_current_xpu_stream"

    def cpp_kernel_type(self):
        return "std::unique_ptr<sycl::kernel>"

    def cpp_device_ptr(self):
        return "void *"


register_device_op_overrides("xpu", XPUDeviceOpOverrides())