jd-opensource
diff --git a/‎xllm/core/layers/CMakeLists.txt‎
Lines changed: 1 addition & 0 deletions b/‎xllm/core/layers/CMakeLists.txt‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎xllm/core/layers/glm4_decoder_layer.h‎
Lines changed: 35 additions & 0 deletions b/‎xllm/core/layers/glm4_decoder_layer.h‎
Lines changed: 35 additions & 0 deletions
diff --git a/‎xllm/core/layers/npu/CMakeLists.txt‎
Lines changed: 2 additions & 0 deletions b/‎xllm/core/layers/npu/CMakeLists.txt‎
Lines changed: 2 additions & 0 deletions
@@ -64,6 +64,7 @@ cc_library(
     qwen3_vision_encode_layer.h
     qwen3_decoder_layer.h
     qwen3_moe_decoder_layer.h
+    glm4_decoder_layer.h
     rms_norm.h
     siglip_encoder_layer.h
     pos_embedding.h
 
@@ -0,0 +1,35 @@
+/* Copyright 2025 The xLLM Authors. All Rights Reserved.
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+    https://github.com/jd-opensource/xllm/blob/main/LICENSE
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+#pragma once
+#include "npu/npu_glm4_decoder_layer_impl.h"
+namespace xllm {
+namespace layer {
+#if defined(USE_NPU)
+class Glm4DecoderLayer  // USE_NPU variant: module holder wrapping NpuGlm4DecoderLayerImpl
+    : public torch::nn::ModuleHolder<NpuGlm4DecoderLayerImpl> {
+ public:
+  using torch::nn::ModuleHolder<NpuGlm4DecoderLayerImpl>::ModuleHolder;  // inherit the holder's constructors
+  using Impl __attribute__((__unused__)) = NpuGlm4DecoderLayerImpl;  // alias for the wrapped impl type; attribute marks it as possibly unused
+  Glm4DecoderLayer(const ModelContext& context)  // constructs the impl from `context` and hands it to the holder
+      : ModuleHolder(std::make_shared<NpuGlm4DecoderLayerImpl>(context)) {}
+};
+#else
+class Glm4DecoderLayer : public torch::nn::ModuleHolder<Qwen2DecoderImpl> {  // non-NPU fallback: module holder wrapping Qwen2DecoderImpl
+ public:
+  using torch::nn::ModuleHolder<Qwen2DecoderImpl>::ModuleHolder;  // inherit the holder's constructors
+  using Impl __attribute__((__unused__)) = Qwen2DecoderImpl;  // NOTE(review): Qwen2DecoderImpl is not declared by any include visible in this header - confirm it is in scope for non-NPU builds
+  Glm4DecoderLayer(const ModelContext& context)  // constructs the impl from `context` and hands it to the holder
+      : ModuleHolder(std::make_shared<Qwen2DecoderImpl>(context)) {}
+};
+#endif
+}  // namespace layer
+}  // namespace xllm
@@ -24,6 +24,7 @@ cc_library(
     npu_llama_decoder_layer_impl.h
     npu_qwen2_decoder_layer_impl.h
     npu_qwen3_decoder_layer_impl.h
+    npu_glm4_decoder_layer_impl.h
     npu_rms_norm_impl.h
     npu_siglip_encoder_layer_impl.h
   SRCS
@@ -45,6 +46,7 @@ cc_library(
     npu_llama_decoder_layer_impl.cpp
     npu_qwen2_decoder_layer_impl.cpp
     npu_qwen3_decoder_layer_impl.cpp
+    npu_glm4_decoder_layer_impl.cpp
     npu_rms_norm_impl.cpp
     npu_siglip_encoder_layer_impl.cpp
   DEPS