diff --git a/aikg/examples/run_torch_triton_parallel.py b/aikg/examples/run_torch_triton_parallel.py
new file mode 100644
index 0000000000000000000000000000000000000000..3c9282bdc9cbc7b25b26dbb23ca9eda13883d6df
--- /dev/null
+++ b/aikg/examples/run_torch_triton_parallel.py
@@ -0,0 +1,118 @@
+# Copyright 2025 Huawei Technologies Co., Ltd
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import asyncio
+from ai_kernel_generator.core.task import Task
+from ai_kernel_generator.core.async_pool.task_pool import TaskPool
+from ai_kernel_generator.core.async_pool.device_pool import DevicePool
+from ai_kernel_generator.config.config_validator import load_config
+from ai_kernel_generator.utils.environment_check import check_env_for_task
+
+
+def get_op_name_and_task_desc():
+    pair1 = ('relu', '''
+import torch
+import torch.nn as nn
+
+
+class Model(nn.Module):
+    """
+    ReLU activation function model
+    """
+    def __init__(self):
+        super(Model, self).__init__()
+
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+
+        return torch.relu(x)
+
+
+batch_size = 16
+dim = 16384
+
+
+def get_inputs():
+    x = torch.randn(batch_size, dim, dtype=torch.float16)
+    return [x]
+
+
+def get_init_inputs():
+    return []  # No special initialization inputs needed
+    ''')
+
+    pair2 = ('tanh', '''
+import torch
+import torch.nn as nn
+
+
+class Model(nn.Module):
+    """
+    Tanh activation function model
+    """
+    def __init__(self):
+        super(Model, self).__init__()
+
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+
+        return torch.tanh(x)
+
+
+batch_size = 16
+dim = 16384
+
+
+def get_inputs():
+    x = torch.randn(batch_size, dim, dtype=torch.float16)
+    return [x]
+
+
+def get_init_inputs():
+    return []  # No special initialization inputs needed
+    ''')
+    return [pair1, pair2]
+
+
+async def run_torch_triton_parallel():
+    op_name_and_task_desc = get_op_name_and_task_desc()
+
+    task_pool = TaskPool()
+    device_pool = DevicePool([0, 1])
+    config = load_config("triton")  # or load_config("/your-path-to-config/xxx_config.yaml")
+
+    check_env_for_task("torch", "ascend", "triton", config)  # or cuda, a100
+
+    for i, (op_name, task_desc) in enumerate(op_name_and_task_desc):
+        task = Task(
+            op_name=op_name,
+            task_desc=task_desc,
+            task_id=str(i),
+            dsl="triton",
+            backend="ascend",  # cuda
+            arch="ascend910b4",  # a100
+            config=config,
+            device_pool=device_pool,
+            framework="torch",
+            workflow="coder_only_workflow"
+        )
+        task_pool.create_task(task.run)
+
+    results = await task_pool.wait_all()
+    for op_name, result, _ in results:
+        if result:
+            print(f"Task {op_name} passed")
+        else:
+            print(f"Task {op_name} failed")
+
+if __name__ == "__main__":
+    asyncio.run(run_torch_triton_parallel())
diff --git a/aikg/examples/run_torch_triton_single.py b/aikg/examples/run_torch_triton_single.py
new file mode 100644
index 0000000000000000000000000000000000000000..6e6b449fa17f6a35266bcaa8f202871999c97d13
--- /dev/null
+++ b/aikg/examples/run_torch_triton_single.py
@@ -0,0 +1,100 @@
+# Copyright 2025 Huawei Technologies Co., Ltd
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+from ai_kernel_generator.config.config_validator import load_config
+from ai_kernel_generator.core.async_pool.device_pool import DevicePool
+from ai_kernel_generator.core.async_pool.task_pool import TaskPool
+from ai_kernel_generator.core.task import Task
+from ai_kernel_generator.utils.environment_check import check_env_for_task
+import asyncio
+import os
+os.environ['AIKG_STREAM_OUTPUT'] = 'on'
+
+
+def get_op_name():
+    return 'relu'
+
+
+def get_task_desc():
+    return '''
+import torch
+import torch.nn as nn
+
+
+class Model(nn.Module):
+    """
+    ReLU activation function model
+    """
+    def __init__(self):
+        super(Model, self).__init__()
+
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """
+        Compute the ReLU activation.
+        Args:
+            x: input tensor
+        Returns:
+            tensor after ReLU activation
+        """
+        return torch.relu(x)
+
+
+batch_size = 16
+dim = 16384
+
+
+def get_inputs():
+    x = torch.randn(batch_size, dim, dtype=torch.float16)
+    return [x]
+
+
+def get_init_inputs():
+    return []  # No special initialization inputs needed
+'''
+
+
+async def run_torch_triton_single():
+    op_name = get_op_name()
+    task_desc = get_task_desc()
+
+    task_pool = TaskPool()
+    device_pool = DevicePool([0])
+    config = load_config("triton")  # use the official DeepSeek API
+    # config = load_config(config_path="./python/ai_kernel_generator/config/vllm_triton_coderonly_config.yaml")
+
+    check_env_for_task("torch", "ascend", "triton", config)  # or cuda, a100
+
+    task = Task(
+        op_name=op_name,
+        task_desc=task_desc,
+        task_id="0",
+        dsl="triton",
+        backend="ascend",  # cuda
+        arch="ascend910b4",  # a100
+        config=config,
+        device_pool=device_pool,
+        framework="torch",
+        workflow="coder_only_workflow"
+    )
+
+    task_pool.create_task(task.run)
+    results = await task_pool.wait_all()
+    for op_name, result, _ in results:
+        if result:
+            print(f"Task {op_name} passed")
+        else:
+            print(f"Task {op_name} failed")
+
+if __name__ == "__main__":
+    asyncio.run(run_torch_triton_single())