1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
|
From 97c972045ab8bf8f4f4db39da0728b2c41183eff Mon Sep 17 00:00:00 2001
From: zhengchenhui <zhengchenhui1@huawei.com>
Date: Wed, 12 Nov 2025 16:38:50 +0800
Subject: [PATCH] Add python bindings for kernels.
---
...i_def_KPFusedEmbeddingActionIdGather.pbtxt | 3 ++
.../api_def_KPFusedEmbeddingPadding.pbtxt | 3 ++
.../api_def_KPFusedEmbeddingPaddingFast.pbtxt | 3 ++
.../api_def/api_def_KPFusedGather.pbtxt | 3 ++
.../api_def_KPFusedSparseDynamicStitch.pbtxt | 3 ++
.../api_def_KPFusedSparseReshape.pbtxt | 3 ++
.../api_def_KPFusedSparseSegmentReduce.pbtxt | 3 ++
...ef_KPFusedSparseSegmentReduceNonzero.pbtxt | 3 ++
.../api_def/api_def_KPFusedSparseSelect.pbtxt | 3 ++
annc/tensorflow/tf_annc_optimizer.patch | 53 +++++++++++++++++--
10 files changed, 76 insertions(+), 4 deletions(-)
create mode 100644 annc/tensorflow/api_def/api_def_KPFusedEmbeddingActionIdGather.pbtxt
create mode 100644 annc/tensorflow/api_def/api_def_KPFusedEmbeddingPadding.pbtxt
create mode 100644 annc/tensorflow/api_def/api_def_KPFusedEmbeddingPaddingFast.pbtxt
create mode 100644 annc/tensorflow/api_def/api_def_KPFusedGather.pbtxt
create mode 100644 annc/tensorflow/api_def/api_def_KPFusedSparseDynamicStitch.pbtxt
create mode 100644 annc/tensorflow/api_def/api_def_KPFusedSparseReshape.pbtxt
create mode 100644 annc/tensorflow/api_def/api_def_KPFusedSparseSegmentReduce.pbtxt
create mode 100644 annc/tensorflow/api_def/api_def_KPFusedSparseSegmentReduceNonzero.pbtxt
create mode 100644 annc/tensorflow/api_def/api_def_KPFusedSparseSelect.pbtxt
diff --git a/annc/tensorflow/api_def/api_def_KPFusedEmbeddingActionIdGather.pbtxt b/annc/tensorflow/api_def/api_def_KPFusedEmbeddingActionIdGather.pbtxt
new file mode 100644
index 0000000..bb221ad
--- /dev/null
+++ b/annc/tensorflow/api_def/api_def_KPFusedEmbeddingActionIdGather.pbtxt
@@ -0,0 +1,3 @@
+op {
+ graph_op_name: "KPFusedEmbeddingActionIdGather"
+}
diff --git a/annc/tensorflow/api_def/api_def_KPFusedEmbeddingPadding.pbtxt b/annc/tensorflow/api_def/api_def_KPFusedEmbeddingPadding.pbtxt
new file mode 100644
index 0000000..5aef378
--- /dev/null
+++ b/annc/tensorflow/api_def/api_def_KPFusedEmbeddingPadding.pbtxt
@@ -0,0 +1,3 @@
+op {
+ graph_op_name: "KPFusedEmbeddingPadding"
+}
diff --git a/annc/tensorflow/api_def/api_def_KPFusedEmbeddingPaddingFast.pbtxt b/annc/tensorflow/api_def/api_def_KPFusedEmbeddingPaddingFast.pbtxt
new file mode 100644
index 0000000..17e7ebc
--- /dev/null
+++ b/annc/tensorflow/api_def/api_def_KPFusedEmbeddingPaddingFast.pbtxt
@@ -0,0 +1,3 @@
+op {
+ graph_op_name: "KPFusedEmbeddingPaddingFast"
+}
diff --git a/annc/tensorflow/api_def/api_def_KPFusedGather.pbtxt b/annc/tensorflow/api_def/api_def_KPFusedGather.pbtxt
new file mode 100644
index 0000000..63c4eef
--- /dev/null
+++ b/annc/tensorflow/api_def/api_def_KPFusedGather.pbtxt
@@ -0,0 +1,3 @@
+op {
+ graph_op_name: "KPFusedGather"
+}
diff --git a/annc/tensorflow/api_def/api_def_KPFusedSparseDynamicStitch.pbtxt b/annc/tensorflow/api_def/api_def_KPFusedSparseDynamicStitch.pbtxt
new file mode 100644
index 0000000..5b01d70
--- /dev/null
+++ b/annc/tensorflow/api_def/api_def_KPFusedSparseDynamicStitch.pbtxt
@@ -0,0 +1,3 @@
+op {
+ graph_op_name: "KPFusedSparseDynamicStitch"
+}
diff --git a/annc/tensorflow/api_def/api_def_KPFusedSparseReshape.pbtxt b/annc/tensorflow/api_def/api_def_KPFusedSparseReshape.pbtxt
new file mode 100644
index 0000000..8fe3c2f
--- /dev/null
+++ b/annc/tensorflow/api_def/api_def_KPFusedSparseReshape.pbtxt
@@ -0,0 +1,3 @@
+op {
+ graph_op_name: "KPFusedSparseReshape"
+}
diff --git a/annc/tensorflow/api_def/api_def_KPFusedSparseSegmentReduce.pbtxt b/annc/tensorflow/api_def/api_def_KPFusedSparseSegmentReduce.pbtxt
new file mode 100644
index 0000000..b13aa7d
--- /dev/null
+++ b/annc/tensorflow/api_def/api_def_KPFusedSparseSegmentReduce.pbtxt
@@ -0,0 +1,3 @@
+op {
+ graph_op_name: "KPFusedSparseSegmentReduce"
+}
diff --git a/annc/tensorflow/api_def/api_def_KPFusedSparseSegmentReduceNonzero.pbtxt b/annc/tensorflow/api_def/api_def_KPFusedSparseSegmentReduceNonzero.pbtxt
new file mode 100644
index 0000000..c0945af
--- /dev/null
+++ b/annc/tensorflow/api_def/api_def_KPFusedSparseSegmentReduceNonzero.pbtxt
@@ -0,0 +1,3 @@
+op {
+ graph_op_name: "KPFusedSparseSegmentReduceNonzero"
+}
diff --git a/annc/tensorflow/api_def/api_def_KPFusedSparseSelect.pbtxt b/annc/tensorflow/api_def/api_def_KPFusedSparseSelect.pbtxt
new file mode 100644
index 0000000..bafc915
--- /dev/null
+++ b/annc/tensorflow/api_def/api_def_KPFusedSparseSelect.pbtxt
@@ -0,0 +1,3 @@
+op {
+ graph_op_name: "KPFusedSparseSelect"
+}
diff --git a/annc/tensorflow/tf_annc_optimizer.patch b/annc/tensorflow/tf_annc_optimizer.patch
index c92330a..ec0199e 100644
--- a/annc/tensorflow/tf_annc_optimizer.patch
+++ b/annc/tensorflow/tf_annc_optimizer.patch
@@ -1,5 +1,5 @@
diff --git a/tensorflow/core/BUILD b/tensorflow/core/BUILD
-index 538574360ba..b43e0455802 100644
+index 538574360ba..3864064d18c 100644
--- a/tensorflow/core/BUILD
+++ b/tensorflow/core/BUILD
@@ -629,6 +629,7 @@ cc_library(
@@ -10,6 +10,14 @@ index 538574360ba..b43e0455802 100644
] + if_mkl([
"//tensorflow/core/kernels/mkl:mkl_concat_op",
"//tensorflow/core/kernels/mkl:mkl_dequantize_op",
+@@ -907,6 +908,7 @@ filegroup(
+ "candidate_sampling_ops_op_lib",
+ "checkpoint_ops_op_lib",
+ "clustering_ops_op_lib",
++ "embedding_fused_ops_op_lib",
+ "collective_ops_op_lib",
+ "control_flow_ops_op_lib",
+ "count_ops_op_lib",
diff --git a/tensorflow/core/grappler/optimizers/BUILD b/tensorflow/core/grappler/optimizers/BUILD
index ecd559734ea..97a918ead6d 100644
--- a/tensorflow/core/grappler/optimizers/BUILD
@@ -189,6 +197,45 @@ index 91d80b6c2b5..b00b2a5d027 100644
] + select({
# Non-tpu platforms don't need tpu dependency.
"//tensorflow:chromiumos": [],
+diff --git a/tensorflow/python/BUILD b/tensorflow/python/BUILD
+index 9810f8acd2e..3b0b23fec0a 100644
+--- a/tensorflow/python/BUILD
++++ b/tensorflow/python/BUILD
+@@ -269,6 +269,7 @@ py_strict_library(
+ "//tensorflow/python/ops/signal:util_ops",
+ "//tensorflow/python/ops/signal:window_ops",
+ "//tensorflow/python/ops/structured:structured_ops",
++ "//tensorflow/python/ops:embedding_fused_ops_gen",
+ "//tensorflow/python/platform:_pywrap_stacktrace_handler",
+ "//tensorflow/python/platform:app",
+ "//tensorflow/python/platform:client_testlib",
+@@ -389,6 +390,7 @@ py_strict_library(
+ "//tensorflow/python/ops:bitwise_ops",
+ "//tensorflow/python/ops:boosted_trees_ops_gen",
+ "//tensorflow/python/ops:clustering_ops_gen",
++ "//tensorflow/python/ops:embedding_fused_ops_gen",
+ "//tensorflow/python/ops:composite_tensor_ops",
+ "//tensorflow/python/ops:cond_v2",
+ "//tensorflow/python/ops:cudnn_rnn_ops_gen",
+diff --git a/tensorflow/python/ops/BUILD b/tensorflow/python/ops/BUILD
+index b3a3d612a01..185da7da4a8 100644
+--- a/tensorflow/python/ops/BUILD
++++ b/tensorflow/python/ops/BUILD
+@@ -228,6 +228,14 @@ tf_gen_op_strict_wrapper_private_py(
+ ],
+ )
+
++tf_gen_op_strict_wrapper_private_py(
++ name = "embedding_fused_ops_gen",
++ visibility = ["//tensorflow:internal"],
++ deps = [
++ "//tensorflow/core:embedding_fused_ops_op_lib",
++ ],
++)
++
+ tf_gen_op_strict_wrapper_private_py(
+ name = "collective_ops_gen",
+ visibility = ["//tensorflow:internal"],
diff --git a/third_party/xla/xla/service/cpu/BUILD b/third_party/xla/xla/service/cpu/BUILD
index 6e0ea613435..47c346b4e93 100644
--- a/third_party/xla/xla/service/cpu/BUILD
@@ -216,6 +263,4 @@ index 6e0ea613435..47c346b4e93 100644
+
cc_library(
name = "cpu_compiler_pure",
- srcs = ["cpu_compiler.cc"],
-
-
+ srcs = ["cpu_compiler.cc"],
\ No newline at end of file
--
2.33.0
|