Kernels
kernels-bot committed on
Commit
3415ddf
·
verified ·
1 Parent(s): d33a099

Uploaded using `kernel-builder`.

Browse files
Files changed (22) hide show
  1. build/torch210-cxx11-cu126-x86_64-linux/_ops.py +3 -3
  2. build/torch210-cxx11-cu126-x86_64-linux/{_rotary_cuda_17de4fe.abi3.so → _rotary_cuda_1ff2c4a.abi3.so} +1 -1
  3. build/torch210-cxx11-cu128-x86_64-linux/_ops.py +3 -3
  4. build/torch210-cxx11-cu128-x86_64-linux/{_rotary_cuda_17de4fe.abi3.so → _rotary_cuda_1ff2c4a.abi3.so} +1 -1
  5. build/torch210-cxx11-cu130-x86_64-linux/_ops.py +3 -3
  6. build/torch210-cxx11-cu130-x86_64-linux/{_rotary_cuda_17de4fe.abi3.so → _rotary_cuda_1ff2c4a.abi3.so} +2 -2
  7. build/torch210-cxx11-xpu20253-x86_64-linux/_ops.py +3 -3
  8. build/torch210-cxx11-xpu20253-x86_64-linux/{_rotary_xpu_17de4fe.abi3.so → _rotary_xpu_1ff2c4a.abi3.so} +1 -1
  9. build/torch211-cxx11-cu126-x86_64-linux/_ops.py +3 -3
  10. build/torch211-cxx11-cu126-x86_64-linux/{_rotary_cuda_17de4fe.abi3.so → _rotary_cuda_1ff2c4a.abi3.so} +1 -1
  11. build/torch211-cxx11-cu128-x86_64-linux/_ops.py +3 -3
  12. build/torch211-cxx11-cu128-x86_64-linux/{_rotary_cuda_17de4fe.abi3.so → _rotary_cuda_1ff2c4a.abi3.so} +1 -1
  13. build/torch211-cxx11-cu130-x86_64-linux/_ops.py +3 -3
  14. build/torch211-cxx11-cu130-x86_64-linux/_rotary_cuda_17de4fe.abi3.so +0 -3
  15. build/torch211-cxx11-cu130-x86_64-linux/_rotary_cuda_1ff2c4a.abi3.so +3 -0
  16. build/torch211-cxx11-xpu20253-x86_64-linux/__init__.py +52 -0
  17. build/torch211-cxx11-xpu20253-x86_64-linux/_ops.py +9 -0
  18. build/torch211-cxx11-xpu20253-x86_64-linux/_rotary_xpu_1ff2c4a.abi3.so +3 -0
  19. build/torch211-cxx11-xpu20253-x86_64-linux/metadata.json +8 -0
  20. build/torch211-cxx11-xpu20253-x86_64-linux/rotary/__init__.py +26 -0
  21. build/torch29-cxx11-cu129-x86_64-linux/_ops.py +3 -3
  22. build/torch29-cxx11-cu129-x86_64-linux/{_rotary_cuda_17de4fe.abi3.so → _rotary_cuda_1ff2c4a.abi3.so} +1 -1
build/torch210-cxx11-cu126-x86_64-linux/_ops.py CHANGED
@@ -1,9 +1,9 @@
1
  import torch
2
- from . import _rotary_cuda_17de4fe
3
- ops = torch.ops._rotary_cuda_17de4fe
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
- return f"_rotary_cuda_17de4fe::{op_name}"
 
1
  import torch
2
+ from . import _rotary_cuda_1ff2c4a
3
+ ops = torch.ops._rotary_cuda_1ff2c4a
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
+ return f"_rotary_cuda_1ff2c4a::{op_name}"
build/torch210-cxx11-cu126-x86_64-linux/{_rotary_cuda_17de4fe.abi3.so → _rotary_cuda_1ff2c4a.abi3.so} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2dc06be886cf33ed300ddf18a4b47a0c6bf86ecaf3fcf1270f7c76e2155475ff
3
  size 8200568
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2ca4629138cc61e16f0e0440f65c0f012cce964a49394a3c011e61bbeed789f
3
  size 8200568
build/torch210-cxx11-cu128-x86_64-linux/_ops.py CHANGED
@@ -1,9 +1,9 @@
1
  import torch
2
- from . import _rotary_cuda_17de4fe
3
- ops = torch.ops._rotary_cuda_17de4fe
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
- return f"_rotary_cuda_17de4fe::{op_name}"
 
1
  import torch
2
+ from . import _rotary_cuda_1ff2c4a
3
+ ops = torch.ops._rotary_cuda_1ff2c4a
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
+ return f"_rotary_cuda_1ff2c4a::{op_name}"
build/torch210-cxx11-cu128-x86_64-linux/{_rotary_cuda_17de4fe.abi3.so → _rotary_cuda_1ff2c4a.abi3.so} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29271f8a63c361c613578dd95dcf90de69567dc6711dc0bbd3741626d54ae07a
3
  size 11905904
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f661db8bac0b471dbe2a53a72ac0a3060294002c0158fd1c2dfc1fb635bf3b1a
3
  size 11905904
build/torch210-cxx11-cu130-x86_64-linux/_ops.py CHANGED
@@ -1,9 +1,9 @@
1
  import torch
2
- from . import _rotary_cuda_17de4fe
3
- ops = torch.ops._rotary_cuda_17de4fe
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
- return f"_rotary_cuda_17de4fe::{op_name}"
 
1
  import torch
2
+ from . import _rotary_cuda_1ff2c4a
3
+ ops = torch.ops._rotary_cuda_1ff2c4a
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
+ return f"_rotary_cuda_1ff2c4a::{op_name}"
build/torch210-cxx11-cu130-x86_64-linux/{_rotary_cuda_17de4fe.abi3.so → _rotary_cuda_1ff2c4a.abi3.so} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:92f83279a8fe700b52af5bcb004ece45dd678061d90d790f6576961a040b3a3e
3
- size 10310752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5de9e68f719d1e9f5feb466c2ab6844e64191923103f83bce9636992f8c79e2
3
+ size 10307160
build/torch210-cxx11-xpu20253-x86_64-linux/_ops.py CHANGED
@@ -1,9 +1,9 @@
1
  import torch
2
- from . import _rotary_xpu_17de4fe
3
- ops = torch.ops._rotary_xpu_17de4fe
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
- return f"_rotary_xpu_17de4fe::{op_name}"
 
1
  import torch
2
+ from . import _rotary_xpu_1ff2c4a
3
+ ops = torch.ops._rotary_xpu_1ff2c4a
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
+ return f"_rotary_xpu_1ff2c4a::{op_name}"
build/torch210-cxx11-xpu20253-x86_64-linux/{_rotary_xpu_17de4fe.abi3.so → _rotary_xpu_1ff2c4a.abi3.so} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53435ac1dc220c7bacfff30fe0f9119269d8f08928780ef8d53f664cc8d462fa
3
  size 2301504
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:071f6c80b72223f9640eeb229ded44d36f13826714ed1ec90dc3317b0400b539
3
  size 2301504
build/torch211-cxx11-cu126-x86_64-linux/_ops.py CHANGED
@@ -1,9 +1,9 @@
1
  import torch
2
- from . import _rotary_cuda_17de4fe
3
- ops = torch.ops._rotary_cuda_17de4fe
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
- return f"_rotary_cuda_17de4fe::{op_name}"
 
1
  import torch
2
+ from . import _rotary_cuda_1ff2c4a
3
+ ops = torch.ops._rotary_cuda_1ff2c4a
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
+ return f"_rotary_cuda_1ff2c4a::{op_name}"
build/torch211-cxx11-cu126-x86_64-linux/{_rotary_cuda_17de4fe.abi3.so → _rotary_cuda_1ff2c4a.abi3.so} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e784ee2ad7a9c68601fc0e40734f940e15e83b738e514b275c164f7bb5740cf
3
  size 8193600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26abf96731f0a53085c242187f0955d70cc20e8c9f6047a2d4d1569efc07d87e
3
  size 8193600
build/torch211-cxx11-cu128-x86_64-linux/_ops.py CHANGED
@@ -1,9 +1,9 @@
1
  import torch
2
- from . import _rotary_cuda_17de4fe
3
- ops = torch.ops._rotary_cuda_17de4fe
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
- return f"_rotary_cuda_17de4fe::{op_name}"
 
1
  import torch
2
+ from . import _rotary_cuda_1ff2c4a
3
+ ops = torch.ops._rotary_cuda_1ff2c4a
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
+ return f"_rotary_cuda_1ff2c4a::{op_name}"
build/torch211-cxx11-cu128-x86_64-linux/{_rotary_cuda_17de4fe.abi3.so → _rotary_cuda_1ff2c4a.abi3.so} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5b56c5504c4f8fccd032bb25a6dcfd168ba35b62edb22b68a31cb48e64113aa
3
  size 11894840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c5c9ff2340b8a94fbc7920c238556b18498c903d8d931da93fda84c1d9ae675
3
  size 11894840
build/torch211-cxx11-cu130-x86_64-linux/_ops.py CHANGED
@@ -1,9 +1,9 @@
1
  import torch
2
- from . import _rotary_cuda_17de4fe
3
- ops = torch.ops._rotary_cuda_17de4fe
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
- return f"_rotary_cuda_17de4fe::{op_name}"
 
1
  import torch
2
+ from . import _rotary_cuda_1ff2c4a
3
+ ops = torch.ops._rotary_cuda_1ff2c4a
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
+ return f"_rotary_cuda_1ff2c4a::{op_name}"
build/torch211-cxx11-cu130-x86_64-linux/_rotary_cuda_17de4fe.abi3.so DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:807bdc834886287cbf730c475412278109a6f43131e95b15b66fe75686f54634
3
- size 10303784
 
 
 
 
build/torch211-cxx11-cu130-x86_64-linux/_rotary_cuda_1ff2c4a.abi3.so ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ef1f14ac10914f04945d5512be813414ebe128499b81267a1e2d41bf15b0393
3
+ size 10296096
build/torch211-cxx11-xpu20253-x86_64-linux/__init__.py ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Optional, Tuple
2
+ import torch
3
+
4
+ from ._ops import ops
5
+
6
+
7
+ def apply_rotary(
8
+ x1: torch.Tensor,
9
+ x2: torch.Tensor,
10
+ cos: torch.Tensor,
11
+ sin: torch.Tensor,
12
+ out1: torch.Tensor,
13
+ out2: torch.Tensor,
14
+ conj: bool,
15
+ ) -> None:
16
+ ops.apply_rotary(x1, x2, cos, sin, out1, out2, conj)
17
+
18
+
19
+ def apply_rotary_transformers(
20
+ q: torch.Tensor,
21
+ k: torch.Tensor,
22
+ cos: torch.Tensor,
23
+ sin: torch.Tensor,
24
+ unsqueeze_dim: int = 1,
25
+ ) -> Tuple[torch.Tensor, torch.Tensor]:
26
+ """
27
+ Rotary kernel implementation wrapper
28
+ Adapts rotary kernel implementation to match transformers apply_rotary_pos_emb signature
29
+ """
30
+ cos = cos.unsqueeze(unsqueeze_dim)
31
+ sin = sin.unsqueeze(unsqueeze_dim)
32
+
33
+ q_rotated = q.clone()
34
+ k_rotated = k.clone()
35
+
36
+ # Get half dimension for rotation
37
+ half_dim = q.shape[-1] // 2
38
+ q1 = q_rotated[..., :half_dim]
39
+ q2 = q_rotated[..., half_dim:]
40
+ k1 = k_rotated[..., :half_dim]
41
+ k2 = k_rotated[..., half_dim:]
42
+ if cos.shape[-1] != half_dim:
43
+ # Trim cos/sin to match half_dim
44
+ cos = cos[..., :half_dim]
45
+ sin = sin[..., :half_dim]
46
+
47
+ apply_rotary(q1, q2, cos, sin, q1, q2, False)
48
+ apply_rotary(k1, k2, cos, sin, k1, k2, False)
49
+ return q_rotated, k_rotated
50
+
51
+
52
+ __all__ = ["apply_rotary", "apply_rotary_transformers"]
build/torch211-cxx11-xpu20253-x86_64-linux/_ops.py ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ import torch
2
+ from . import _rotary_xpu_1ff2c4a
3
+ ops = torch.ops._rotary_xpu_1ff2c4a
4
+
5
+ def add_op_namespace_prefix(op_name: str):
6
+ """
7
+ Prefix op by namespace.
8
+ """
9
+ return f"_rotary_xpu_1ff2c4a::{op_name}"
build/torch211-cxx11-xpu20253-x86_64-linux/_rotary_xpu_1ff2c4a.abi3.so ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:866dec73565cc4bc480f07f9b176b617a445e79a23c030820cf36f4c667f1040
3
+ size 2301504
build/torch211-cxx11-xpu20253-x86_64-linux/metadata.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": 1,
3
+ "license": "BSD-3-Clause",
4
+ "python-depends": [],
5
+ "backend": {
6
+ "type": "xpu"
7
+ }
8
+ }
build/torch211-cxx11-xpu20253-x86_64-linux/rotary/__init__.py ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import ctypes
2
+ import importlib.util
3
+ import sys
4
+ from pathlib import Path
5
+ from types import ModuleType
6
+
7
+
8
+ def _import_from_path(file_path: Path) -> ModuleType:
9
+ # We cannot use the module name as-is, after adding it to `sys.modules`,
10
+ # it would also be used for other imports. So, we make a module name that
11
+ # depends on the path for it to be unique using the hex-encoded hash of
12
+ # the path.
13
+ path_hash = "{:x}".format(ctypes.c_size_t(hash(file_path.absolute())).value)
14
+ module_name = path_hash
15
+ spec = importlib.util.spec_from_file_location(module_name, file_path)
16
+ if spec is None:
17
+ raise ImportError(f"Cannot load spec for {module_name} from {file_path}")
18
+ module = importlib.util.module_from_spec(spec)
19
+ if module is None:
20
+ raise ImportError(f"Cannot load module {module_name} from spec")
21
+ sys.modules[module_name] = module
22
+ spec.loader.exec_module(module) # type: ignore
23
+ return module
24
+
25
+
26
+ globals().update(vars(_import_from_path(Path(__file__).parent.parent / "__init__.py")))
build/torch29-cxx11-cu129-x86_64-linux/_ops.py CHANGED
@@ -1,9 +1,9 @@
1
  import torch
2
- from . import _rotary_cuda_17de4fe
3
- ops = torch.ops._rotary_cuda_17de4fe
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
- return f"_rotary_cuda_17de4fe::{op_name}"
 
1
  import torch
2
+ from . import _rotary_cuda_1ff2c4a
3
+ ops = torch.ops._rotary_cuda_1ff2c4a
4
 
5
  def add_op_namespace_prefix(op_name: str):
6
  """
7
  Prefix op by namespace.
8
  """
9
+ return f"_rotary_cuda_1ff2c4a::{op_name}"
build/torch29-cxx11-cu129-x86_64-linux/{_rotary_cuda_17de4fe.abi3.so → _rotary_cuda_1ff2c4a.abi3.so} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bcd3ab1517eabfaf2fcca055deaf85cc8031f097d7982df460a891bea5206add
3
  size 11964176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73512553b334acb47e085a7975ead67470641381044836837d819adffd22e1b5
3
  size 11964176