Build for Torch 2.8 (x86_64-linux)
Browse files
- build/torch28-cxx11-cu126-x86_64-linux/quantization_eetq/__init__.py +3 -0
- build/torch28-cxx11-cu126-x86_64-linux/quantization_eetq/__pycache__/__init__.cpython-313.pyc +0 -0
- build/torch28-cxx11-cu126-x86_64-linux/quantization_eetq/__pycache__/_ops.cpython-313.pyc +0 -0
- build/torch28-cxx11-cu126-x86_64-linux/quantization_eetq/__pycache__/custom_ops.cpython-313.pyc +0 -0
- build/torch28-cxx11-cu126-x86_64-linux/quantization_eetq/_ops.py +9 -0
- build/torch28-cxx11-cu126-x86_64-linux/quantization_eetq/_quantization_eetq_0c60fb4.abi3.so +3 -0
- build/torch28-cxx11-cu126-x86_64-linux/quantization_eetq/custom_ops.py +36 -0
- build/torch28-cxx11-cu128-x86_64-linux/quantization_eetq/__init__.py +3 -0
- build/torch28-cxx11-cu128-x86_64-linux/quantization_eetq/__pycache__/__init__.cpython-313.pyc +0 -0
- build/torch28-cxx11-cu128-x86_64-linux/quantization_eetq/__pycache__/_ops.cpython-313.pyc +0 -0
- build/torch28-cxx11-cu128-x86_64-linux/quantization_eetq/__pycache__/custom_ops.cpython-313.pyc +0 -0
- build/torch28-cxx11-cu128-x86_64-linux/quantization_eetq/_ops.py +9 -0
- build/torch28-cxx11-cu128-x86_64-linux/quantization_eetq/_quantization_eetq_0c60fb4.abi3.so +3 -0
- build/torch28-cxx11-cu128-x86_64-linux/quantization_eetq/custom_ops.py +36 -0
- build/torch28-cxx11-cu129-x86_64-linux/quantization_eetq/__init__.py +3 -0
- build/torch28-cxx11-cu129-x86_64-linux/quantization_eetq/__pycache__/__init__.cpython-313.pyc +0 -0
- build/torch28-cxx11-cu129-x86_64-linux/quantization_eetq/__pycache__/_ops.cpython-313.pyc +0 -0
- build/torch28-cxx11-cu129-x86_64-linux/quantization_eetq/__pycache__/custom_ops.cpython-313.pyc +0 -0
- build/torch28-cxx11-cu129-x86_64-linux/quantization_eetq/_ops.py +9 -0
- build/torch28-cxx11-cu129-x86_64-linux/quantization_eetq/_quantization_eetq_0c60fb4.abi3.so +3 -0
- build/torch28-cxx11-cu129-x86_64-linux/quantization_eetq/custom_ops.py +36 -0
build/torch28-cxx11-cu126-x86_64-linux/quantization_eetq/__init__.py
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
from .custom_ops import w8_a16_gemm, w8_a16_gemm_, preprocess_weights, quant_weights
|
2 |
+
|
3 |
+
# Public API of the package: the four wrappers imported from .custom_ops.
__all__ = ["w8_a16_gemm", "w8_a16_gemm_", "preprocess_weights", "quant_weights"]
|
build/torch28-cxx11-cu126-x86_64-linux/quantization_eetq/__pycache__/__init__.cpython-313.pyc
ADDED
Binary file (334 Bytes). View file
|
|
build/torch28-cxx11-cu126-x86_64-linux/quantization_eetq/__pycache__/_ops.cpython-313.pyc
ADDED
Binary file (547 Bytes). View file
|
|
build/torch28-cxx11-cu126-x86_64-linux/quantization_eetq/__pycache__/custom_ops.cpython-313.pyc
ADDED
Binary file (1.84 kB). View file
|
|
build/torch28-cxx11-cu126-x86_64-linux/quantization_eetq/_ops.py
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import torch
|
2 |
+
from . import _quantization_eetq_0c60fb4
|
3 |
+
# Handle to the extension's op namespace under torch.ops.
# NOTE(review): presumably populated as a side effect of importing the
# compiled module above -- confirm.
ops = torch.ops._quantization_eetq_0c60fb4
|
4 |
+
|
5 |
+
def add_op_namespace_prefix(op_name: str) -> str:
    """
    Prefix op by namespace.

    Args:
        op_name: Bare operator name, without any namespace.

    Returns:
        ``op_name`` qualified as ``_quantization_eetq_0c60fb4::<op_name>``.
    """
    return f"_quantization_eetq_0c60fb4::{op_name}"
|
build/torch28-cxx11-cu126-x86_64-linux/quantization_eetq/_quantization_eetq_0c60fb4.abi3.so
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:854740b7499076f0f7c54be036dc9a66bdf4aa0bab322f8f2ef7e92723f76f93
|
3 |
+
size 30881144
|
build/torch28-cxx11-cu126-x86_64-linux/quantization_eetq/custom_ops.py
ADDED
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
from typing import List
|
2 |
+
import torch
|
3 |
+
|
4 |
+
from ._ops import ops
|
5 |
+
|
6 |
+
|
7 |
+
def w8_a16_gemm(
    input: torch.Tensor, weight: torch.Tensor, scale: torch.Tensor
) -> torch.Tensor:
    """Call the compiled ``w8_a16_gemm`` op and return its result.

    Thin wrapper: the three tensors are passed through unchanged to
    ``ops.w8_a16_gemm``.

    Args:
        input: Activation tensor (presumably 16-bit floating point, going
            by the op name -- confirm against the kernel).
        weight: Weight tensor (presumably 8-bit quantized -- confirm).
        scale: Scale tensor forwarded alongside ``weight``.

    Returns:
        The tensor returned by the op.
    """
    return ops.w8_a16_gemm(input, weight, scale)
|
11 |
+
|
12 |
+
|
13 |
+
def w8_a16_gemm_(
    input: torch.Tensor,
    weight: torch.Tensor,
    scale: torch.Tensor,
    output: torch.Tensor,
    m: int,
    n: int,
    k: int,
) -> torch.Tensor:
    """Call the compiled ``w8_a16_gemm_`` op with a caller-supplied output.

    Thin wrapper: all arguments are passed through unchanged, in order, to
    ``ops.w8_a16_gemm_``.

    Args:
        input: Activation tensor.
        weight: Weight tensor.
        scale: Scale tensor forwarded alongside ``weight``.
        output: Tensor handed to the op as its output argument.
            NOTE(review): presumably written in place (trailing-underscore
            convention) -- confirm against the kernel.
        m: Integer forwarded to the op (presumably a GEMM dimension -- confirm).
        n: Integer forwarded to the op (presumably a GEMM dimension -- confirm).
        k: Integer forwarded to the op (presumably a GEMM dimension -- confirm).

    Returns:
        The tensor returned by the op.
    """
    return ops.w8_a16_gemm_(input, weight, scale, output, m, n, k)
|
23 |
+
|
24 |
+
|
25 |
+
def preprocess_weights(origin_weight: torch.Tensor, is_int4: bool) -> torch.Tensor:
    """Call the compiled ``preprocess_weights`` op and return its result.

    Thin wrapper: both arguments are passed through unchanged to
    ``ops.preprocess_weights``.

    Args:
        origin_weight: Weight tensor to preprocess.
        is_int4: Flag forwarded to the op (presumably selects int4 rather
            than int8 handling -- confirm against the kernel).

    Returns:
        The tensor returned by the op.
    """
    return ops.preprocess_weights(origin_weight, is_int4)
|
27 |
+
|
28 |
+
|
29 |
+
def quant_weights(
    origin_weight: torch.Tensor,
    quant_type: torch.dtype,
    return_unprocessed_quantized_tensor: bool,
) -> List[torch.Tensor]:
    """Call the compiled ``quant_weights`` op and return its result.

    Thin wrapper: the arguments are passed through unchanged, in order, to
    ``ops.quant_weights``.

    Args:
        origin_weight: Weight tensor to quantize.
        quant_type: Target dtype forwarded to the op.
        return_unprocessed_quantized_tensor: Flag forwarded to the op
            (presumably adds the unprocessed quantized tensor to the
            result -- confirm against the kernel).

    Returns:
        The list of tensors returned by the op.
    """
    return ops.quant_weights(
        origin_weight, quant_type, return_unprocessed_quantized_tensor
    )
|
build/torch28-cxx11-cu128-x86_64-linux/quantization_eetq/__init__.py
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
from .custom_ops import w8_a16_gemm, w8_a16_gemm_, preprocess_weights, quant_weights
|
2 |
+
|
3 |
+
# Public API of the package: the four wrappers imported from .custom_ops.
__all__ = ["w8_a16_gemm", "w8_a16_gemm_", "preprocess_weights", "quant_weights"]
|
build/torch28-cxx11-cu128-x86_64-linux/quantization_eetq/__pycache__/__init__.cpython-313.pyc
ADDED
Binary file (334 Bytes). View file
|
|
build/torch28-cxx11-cu128-x86_64-linux/quantization_eetq/__pycache__/_ops.cpython-313.pyc
ADDED
Binary file (547 Bytes). View file
|
|
build/torch28-cxx11-cu128-x86_64-linux/quantization_eetq/__pycache__/custom_ops.cpython-313.pyc
ADDED
Binary file (1.84 kB). View file
|
|
build/torch28-cxx11-cu128-x86_64-linux/quantization_eetq/_ops.py
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import torch
|
2 |
+
from . import _quantization_eetq_0c60fb4
|
3 |
+
# Handle to the extension's op namespace under torch.ops.
# NOTE(review): presumably populated as a side effect of importing the
# compiled module above -- confirm.
ops = torch.ops._quantization_eetq_0c60fb4
|
4 |
+
|
5 |
+
def add_op_namespace_prefix(op_name: str) -> str:
    """
    Prefix op by namespace.

    Args:
        op_name: Bare operator name, without any namespace.

    Returns:
        ``op_name`` qualified as ``_quantization_eetq_0c60fb4::<op_name>``.
    """
    return f"_quantization_eetq_0c60fb4::{op_name}"
|
build/torch28-cxx11-cu128-x86_64-linux/quantization_eetq/_quantization_eetq_0c60fb4.abi3.so
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:213e1c9f8e5db3152b870ed377f10e7acd1f3c1fd584bce8721c1b88c612a5e9
|
3 |
+
size 37476304
|
build/torch28-cxx11-cu128-x86_64-linux/quantization_eetq/custom_ops.py
ADDED
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
from typing import List
|
2 |
+
import torch
|
3 |
+
|
4 |
+
from ._ops import ops
|
5 |
+
|
6 |
+
|
7 |
+
def w8_a16_gemm(
    input: torch.Tensor, weight: torch.Tensor, scale: torch.Tensor
) -> torch.Tensor:
    """Call the compiled ``w8_a16_gemm`` op and return its result.

    Thin wrapper: the three tensors are passed through unchanged to
    ``ops.w8_a16_gemm``.

    Args:
        input: Activation tensor (presumably 16-bit floating point, going
            by the op name -- confirm against the kernel).
        weight: Weight tensor (presumably 8-bit quantized -- confirm).
        scale: Scale tensor forwarded alongside ``weight``.

    Returns:
        The tensor returned by the op.
    """
    return ops.w8_a16_gemm(input, weight, scale)
|
11 |
+
|
12 |
+
|
13 |
+
def w8_a16_gemm_(
    input: torch.Tensor,
    weight: torch.Tensor,
    scale: torch.Tensor,
    output: torch.Tensor,
    m: int,
    n: int,
    k: int,
) -> torch.Tensor:
    """Call the compiled ``w8_a16_gemm_`` op with a caller-supplied output.

    Thin wrapper: all arguments are passed through unchanged, in order, to
    ``ops.w8_a16_gemm_``.

    Args:
        input: Activation tensor.
        weight: Weight tensor.
        scale: Scale tensor forwarded alongside ``weight``.
        output: Tensor handed to the op as its output argument.
            NOTE(review): presumably written in place (trailing-underscore
            convention) -- confirm against the kernel.
        m: Integer forwarded to the op (presumably a GEMM dimension -- confirm).
        n: Integer forwarded to the op (presumably a GEMM dimension -- confirm).
        k: Integer forwarded to the op (presumably a GEMM dimension -- confirm).

    Returns:
        The tensor returned by the op.
    """
    return ops.w8_a16_gemm_(input, weight, scale, output, m, n, k)
|
23 |
+
|
24 |
+
|
25 |
+
def preprocess_weights(origin_weight: torch.Tensor, is_int4: bool) -> torch.Tensor:
    """Call the compiled ``preprocess_weights`` op and return its result.

    Thin wrapper: both arguments are passed through unchanged to
    ``ops.preprocess_weights``.

    Args:
        origin_weight: Weight tensor to preprocess.
        is_int4: Flag forwarded to the op (presumably selects int4 rather
            than int8 handling -- confirm against the kernel).

    Returns:
        The tensor returned by the op.
    """
    return ops.preprocess_weights(origin_weight, is_int4)
|
27 |
+
|
28 |
+
|
29 |
+
def quant_weights(
    origin_weight: torch.Tensor,
    quant_type: torch.dtype,
    return_unprocessed_quantized_tensor: bool,
) -> List[torch.Tensor]:
    """Call the compiled ``quant_weights`` op and return its result.

    Thin wrapper: the arguments are passed through unchanged, in order, to
    ``ops.quant_weights``.

    Args:
        origin_weight: Weight tensor to quantize.
        quant_type: Target dtype forwarded to the op.
        return_unprocessed_quantized_tensor: Flag forwarded to the op
            (presumably adds the unprocessed quantized tensor to the
            result -- confirm against the kernel).

    Returns:
        The list of tensors returned by the op.
    """
    return ops.quant_weights(
        origin_weight, quant_type, return_unprocessed_quantized_tensor
    )
|
build/torch28-cxx11-cu129-x86_64-linux/quantization_eetq/__init__.py
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
from .custom_ops import w8_a16_gemm, w8_a16_gemm_, preprocess_weights, quant_weights
|
2 |
+
|
3 |
+
# Public API of the package: the four wrappers imported from .custom_ops.
__all__ = ["w8_a16_gemm", "w8_a16_gemm_", "preprocess_weights", "quant_weights"]
|
build/torch28-cxx11-cu129-x86_64-linux/quantization_eetq/__pycache__/__init__.cpython-313.pyc
ADDED
Binary file (334 Bytes). View file
|
|
build/torch28-cxx11-cu129-x86_64-linux/quantization_eetq/__pycache__/_ops.cpython-313.pyc
ADDED
Binary file (547 Bytes). View file
|
|
build/torch28-cxx11-cu129-x86_64-linux/quantization_eetq/__pycache__/custom_ops.cpython-313.pyc
ADDED
Binary file (1.84 kB). View file
|
|
build/torch28-cxx11-cu129-x86_64-linux/quantization_eetq/_ops.py
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import torch
|
2 |
+
from . import _quantization_eetq_0c60fb4
|
3 |
+
# Handle to the extension's op namespace under torch.ops.
# NOTE(review): presumably populated as a side effect of importing the
# compiled module above -- confirm.
ops = torch.ops._quantization_eetq_0c60fb4
|
4 |
+
|
5 |
+
def add_op_namespace_prefix(op_name: str) -> str:
    """
    Prefix op by namespace.

    Args:
        op_name: Bare operator name, without any namespace.

    Returns:
        ``op_name`` qualified as ``_quantization_eetq_0c60fb4::<op_name>``.
    """
    return f"_quantization_eetq_0c60fb4::{op_name}"
|
build/torch28-cxx11-cu129-x86_64-linux/quantization_eetq/_quantization_eetq_0c60fb4.abi3.so
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91d74be2ae273fc4826b1d9f6c725e9462217e45705df2dd3aa4574479ae4e1b
|
3 |
+
size 38205656
|
build/torch28-cxx11-cu129-x86_64-linux/quantization_eetq/custom_ops.py
ADDED
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
from typing import List
|
2 |
+
import torch
|
3 |
+
|
4 |
+
from ._ops import ops
|
5 |
+
|
6 |
+
|
7 |
+
def w8_a16_gemm(
    input: torch.Tensor, weight: torch.Tensor, scale: torch.Tensor
) -> torch.Tensor:
    """Call the compiled ``w8_a16_gemm`` op and return its result.

    Thin wrapper: the three tensors are passed through unchanged to
    ``ops.w8_a16_gemm``.

    Args:
        input: Activation tensor (presumably 16-bit floating point, going
            by the op name -- confirm against the kernel).
        weight: Weight tensor (presumably 8-bit quantized -- confirm).
        scale: Scale tensor forwarded alongside ``weight``.

    Returns:
        The tensor returned by the op.
    """
    return ops.w8_a16_gemm(input, weight, scale)
|
11 |
+
|
12 |
+
|
13 |
+
def w8_a16_gemm_(
    input: torch.Tensor,
    weight: torch.Tensor,
    scale: torch.Tensor,
    output: torch.Tensor,
    m: int,
    n: int,
    k: int,
) -> torch.Tensor:
    """Call the compiled ``w8_a16_gemm_`` op with a caller-supplied output.

    Thin wrapper: all arguments are passed through unchanged, in order, to
    ``ops.w8_a16_gemm_``.

    Args:
        input: Activation tensor.
        weight: Weight tensor.
        scale: Scale tensor forwarded alongside ``weight``.
        output: Tensor handed to the op as its output argument.
            NOTE(review): presumably written in place (trailing-underscore
            convention) -- confirm against the kernel.
        m: Integer forwarded to the op (presumably a GEMM dimension -- confirm).
        n: Integer forwarded to the op (presumably a GEMM dimension -- confirm).
        k: Integer forwarded to the op (presumably a GEMM dimension -- confirm).

    Returns:
        The tensor returned by the op.
    """
    return ops.w8_a16_gemm_(input, weight, scale, output, m, n, k)
|
23 |
+
|
24 |
+
|
25 |
+
def preprocess_weights(origin_weight: torch.Tensor, is_int4: bool) -> torch.Tensor:
    """Call the compiled ``preprocess_weights`` op and return its result.

    Thin wrapper: both arguments are passed through unchanged to
    ``ops.preprocess_weights``.

    Args:
        origin_weight: Weight tensor to preprocess.
        is_int4: Flag forwarded to the op (presumably selects int4 rather
            than int8 handling -- confirm against the kernel).

    Returns:
        The tensor returned by the op.
    """
    return ops.preprocess_weights(origin_weight, is_int4)
|
27 |
+
|
28 |
+
|
29 |
+
def quant_weights(
    origin_weight: torch.Tensor,
    quant_type: torch.dtype,
    return_unprocessed_quantized_tensor: bool,
) -> List[torch.Tensor]:
    """Call the compiled ``quant_weights`` op and return its result.

    Thin wrapper: the arguments are passed through unchanged, in order, to
    ``ops.quant_weights``.

    Args:
        origin_weight: Weight tensor to quantize.
        quant_type: Target dtype forwarded to the op.
        return_unprocessed_quantized_tensor: Flag forwarded to the op
            (presumably adds the unprocessed quantized tensor to the
            result -- confirm against the kernel).

    Returns:
        The list of tensors returned by the op.
    """
    return ops.quant_weights(
        origin_weight, quant_type, return_unprocessed_quantized_tensor
    )
|