From 9658bd6d36fcc888c830506eed43806262a7718a Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=8F=B6=E9=BE=99=E5=89=91?= Date: Thu, 6 Nov 2025 20:26:41 +0800 Subject: [PATCH 1/6] Sub package divide --- CMakeLists.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CMakeLists.txt b/CMakeLists.txt index a26ab9fed8..c866553fd6 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -246,7 +246,7 @@ if (ENABLE_OPEN_SRC) set(CPACK_EXTERNAL_PACKAGE_SCRIPT ${ASCEND_INSTALL_PATH}/toolkit/tools/op_project_templates/ascendc/customize/cmake/makeself.cmake) set(CPACK_EXTERNAL_BUILT_PACKAGES ${CPACK_PACKAGE_DIRECTORY}/_CPack_Packages/Linux/External/${CPACK_PACKAGE_FILE_NAME}/${CPACK_PACKAGE_FILE_NAME}) include(CPack) - else() + elseif(CMAKE_SOURCE_DIR STREQUAL PROJECT_SOURCE_DIR) include(cmake/package.cmake) endif() endif() -- Gitee From baf03625fdc612d12570140a2b9f5919d4da8328 Mon Sep 17 00:00:00 2001 From: j00427146 Date: Mon, 3 Nov 2025 11:20:58 +0800 Subject: [PATCH 2/6] =?UTF-8?q?=E3=80=90=E6=8F=8F=20=20=20=20=E8=BF=B0?= =?UTF-8?q?=E3=80=91=20=20aicpu=20errormessage=20=E3=80=90=E4=BF=AE=20?= =?UTF-8?q?=E6=94=B9=20=E4=BA=BA=E3=80=91=20=20j00427146=20=E3=80=90?= =?UTF-8?q?=E4=BF=AE=E6=94=B9=E6=97=B6=E9=97=B4=E3=80=91=20=202025.11.1?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- error_manager/error_code.json | 123 +++++++++++++++++++++------------- 1 file changed, 78 insertions(+), 45 deletions(-) diff --git a/error_manager/error_code.json b/error_manager/error_code.json index f696a08618..bae1142eb9 100644 --- a/error_manager/error_code.json +++ b/error_manager/error_code.json @@ -1410,35 +1410,35 @@ }, { "errClass": "AI CPU Errors", - "errTitle": "NN_Process_Count_Limit_Exceeded", + "errTitle": "Not_Supported_Specification", "ErrCode": "E30003", "ErrMessage": "The number of started NN processes exceeds the limit.", "Arglist": "", "suggestion": { - "Possible Cause": "Something wrong with queue_schedule.", - 
"Solution": "Wait for 10s after the last training process exited and try again." + "Possible Cause": "The number of processes started in the scheduling queue exceeds the limit. For details about the restrictions, see Processes in https://hiascend.com/document/redirect/CannCommercialCppAppendix.", + "Solution": "Try again 10 seconds after the last training job exits." } }, { "errClass": "AI CPU Errors", "errTitle": "NN_Process_Bin_Error", "ErrCode": "E30004", - "ErrMessage": "The binary file of the NN process is damaged or the file permissions are incorrect.", + "ErrMessage": "The binary file of the NN process is damaged.", "Arglist": "", "suggestion": { - "Possible Cause": "The driver package is incorrectly installed.", - "Solution": "Reinstall the driver package." + "Possible Cause": "An ECC memory error occurs on the device.", + "Solution": "Obtain the device log, check whether ECC errors are reported, and contact technical support at https://www.hiascend.com/support." } }, { "errClass": "AI CPU Errors", - "errTitle": "AI_CPU_Timeout", + "errTitle": "Execution_Error_AICPU_Operator_Timeout", "ErrCode": "E30008", - "ErrMessage": "AI CPU operator execution time out.", + "ErrMessage": "AI CPU operator execution timed out.", "Arglist": "", "suggestion": { - "Possible Cause": "1. For the GetNext operator, its preprocessing duration may be too long. 2. For a custom operator, its logic may be improper.", - "Solution": "1. For the GetNext operator, check its preprocessing or set OpExecuteTimeOut to a larger value. 2. For a custom operator, make sure its logic is proper." + "Possible Cause": "1. For a GetNext operator, its preprocessing time may be too long. 2. For a custom operator, it contains an ultra-large loop in the implementation logic or its input and output shapes are too large. 3. The input and output shapes of a built-in operator are too large.", + "Solution": "1. 
For a GetNext operator, check its preprocessing or use the aclrtSetOpExecuteTimeOut interface to adjust the timeout. 2. For a custom operator, ensure that the logic design is proper or modify the shape. 3. If the input and output shapes are too large, modify the shape or use the aclrtSetOpExecuteTimeOut interface to adjust the timeout." } }, { @@ -1448,19 +1448,19 @@ "ErrMessage": "The argument is invalid.", "Arglist": "", "suggestion": { - "Possible Cause": "The parameter value is null or the parameter length is invalid.", - "Solution": "See the host log for details, and then check the parameter where the error log is reported." + "Possible Cause": "The argument has an empty value or an invalid length.", + "Solution": "View the host log and check the argument in the error log." } }, { "errClass": "AI CPU Errors", - "errTitle": "Driver_Function_Call_Failure", + "errTitle": "Inner_Error_Driver_API_Call_Failed", "ErrCode": "E39002", "ErrMessage": "Failed to obtain the number of devices and the device list.", "Arglist": "", "suggestion": { - "Possible Cause": "Failed to obtain the device information from the driver.", - "Solution": "Check the device logs to see whether the device driver service is normal." + "Possible Cause": "Failed to obtain device information from the device driver.", + "Solution": "Obtain the device log and contact technical support at https://www.hiascend.com/support." } }, { @@ -1470,74 +1470,107 @@ "ErrMessage": "Failed to add the AI CPU scheduler to the Cgroup.", "Arglist": "", "suggestion": { - "Possible Cause": "1. The User have no sudo Permission.\n2. The Cgroup configuration is incorrect.", - "Solution": "1. Check whether the user have sudo Permission or not.\n2. Submit an issue on Gitee at https://gitee.com/ascend." + "Possible Cause": "The Cgroup configuration is incorrect.", + "Solution": "Obtain the device log and contact technical support at https://www.hiascend.com/support." 
} }, { "errClass": "AI CPU Errors", - "errTitle": "AI_CPU_Scheduler_Initialization_Failure", + "errTitle": "Inner_Error_AICPU_Scheduler_Init_Failed", "ErrCode": "E39004", - "ErrMessage": "The AI CPU scheduler is abnormal.", + "ErrMessage": "The AI CPU scheduler process initialization is abnormal.", "Arglist": "", "suggestion": { - "Possible Cause": "Something wrong with aicpu_scheduler", - "Solution": "Check the initialization information from device logs." + "Possible Cause": "The internal processing of the AI CPU scheduler process is abnormal.", + "Solution": "Obtain the device log and contact technical support at https://www.hiascend.com/support." } }, { "errClass": "AI CPU Errors", "errTitle": "Device_Connection_Failure", "ErrCode": "E30005", - "ErrMessage": "The device failed to be connected.", + "ErrMessage": "Failed to connect the device.", "Arglist": "", "suggestion": { - "Possible Cause": "1. The device is broken.\n2. The device failed to be started.", - "Solution": "1.Restart the device.\n2. Submit an issue on Gitee at https://gitee.com/ascend." + "Possible Cause": "1. Heartbeats are missing on the device. 2. The underlying channel is disconnected.", + "Solution": "1. Obtain the device log and contact technical support at https://www.hiascend.com/support. 2. Restart the device." } }, { "errClass": "AI CPU Errors", - "errTitle": "TSDaemon_Process_Abnormal", + "errTitle": "Inner_Error_TSDaemon_Process_Abnormal", "ErrCode": "E39005", - "ErrMessage": "The TSDaemon process is abnormal.", + "ErrMessage": "The TSDaemon process initialization is abnormal.", "Arglist": "", "suggestion": { - "Possible Cause": "The TSDaemon process failed to be started.", - "Solution": "Check the device logs to see if TSDaemon is normal." + "Possible Cause": "The internal processing of the TSDaemon process is abnormal.", + "Solution": "Obtain the device log and contact technical support at https://www.hiascend.com/support." 
} }, { "errClass": "AI CPU Errors", - "errTitle": "Failed_to_Send_OPP_to_device", + "errTitle": "Inner_Error_Failed_Send_OPP_To_Device", "ErrCode": "E39006", "ErrMessage": "Failed to send the OPP to the device.", "Arglist": "", "suggestion": { - "Possible Cause": "1.The HDCD process is abnormal.\n2. The device failed to be connected.", - "Solution": "Check the host and device logs to see if HDC is normal." + "Possible Cause": "1. The HDC link is faulty. 2. The device status is abnormal.", + "Solution": "Obtain the device log and contact technical support at https://www.hiascend.com/support." } }, { "errClass": "AI CPU Errors", - "errTitle": "Device_Subprocess_Startup_Timeout", + "errTitle": "Inner_Error_Device_Subprocess_Startup_Timeout", "ErrCode": "E39007", "ErrMessage": "Starting a subprocess on the device timed out.", "Arglist": "", "suggestion": { - "Possible Cause": "1.The subprocess failed to be started.\n2. HDC is abnormal.", - "Solution": "1. Check the device logs to see if the subprocess is started is started successfully.\n2. Check the host and device logs to see if HDC is normal." + "Possible Cause": "1. Failed to start the subprocess. 2. The HDC link is faulty.", + "Solution": "Obtain the device log and contact technical support at https://www.hiascend.com/support." } }, { "errClass": "AI CPU Errors", - "errTitle": "OPP_Verification_Failure", + "errTitle": "Package_Error_Verify_OPP", "ErrCode": "E30006", - "ErrMessage": "Failed to verify the OPP", + "ErrMessage": "Failed to verify the OPP.", "Arglist": "", "suggestion": { - "Possible Cause": "1.The OPP is incorrect.", - "Solution": "1. Use a correct OPP." + "Possible Cause": "1. The AI CPU OPP on the host is tampered with. 2. An ECC memory error occurs on the device.", + "Solution": "1. Install the correct OPP. 2. Obtain the device log, check whether ECC errors are reported, and contact technical support at https://www.hiascend.com/support."
+ } + }, + { + "errClass": "AI CPU Errors", + "errTitle": "Inner_Error_Verify_NN_Process_Binary", + "ErrCode": "E39008", + "ErrMessage": "The binary file of the NN process is damaged.", + "Arglist": "", + "suggestion": { + "Possible Cause": "An ECC memory error occurs on the device.", + "Solution": "Obtain the device log, check whether ECC errors are reported, and contact technical support at https://www.hiascend.com/support." + } + }, + { + "errClass": "AI CPU Errors", + "errTitle": "Inner_Error_Device_Status_Abnormal", + "ErrCode": "E39009", + "ErrMessage": "Failed to connect the device.", + "Arglist": "", + "suggestion": { + "Possible Cause": "1. Heartbeats are missing on the device. 2. The underlying channel is disconnected.", + "Solution": "1. Obtain the device log and contact technical support at https://www.hiascend.com/support. 2. Restart the device." + } + }, + { + "errClass": "AI CPU Errors", + "errTitle": "Inner_Error_Cgroup_Add_Failed", + "ErrCode": "E39010", + "ErrMessage": "Failed to add the AI CPU scheduler to the Cgroup.", + "Arglist": "", + "suggestion": { + "Possible Cause": "The Cgroup configuration is incorrect.", + "Solution": "Obtain the device log and contact technical support at https://www.hiascend.com/support." } }, { @@ -2455,24 +2488,24 @@ }, { "errClass": "Queue Schedule Errors", - "errTitle": "Group_Attaching_Failure", + "errTitle": "Inner_Error_Group_Attach_Failed", "ErrCode": "EM9001", - "ErrMessage": "Failed to attach the queue_schedule process to the group.", + "ErrMessage": "Failed to attach the queue_schedule process to the shared memory group.", "Arglist": "", "suggestion": { - "Possible Cause": "N/A", - "Solution": "Submit an issue to request for support at https://gitee.com/ascend or contact Huawei technical support." + "Possible Cause": "The queue_schedule process is not added to the shared memory group.", + "Solution": "Obtain the device log and contact technical support at https://www.hiascend.com/support." 
} }, { "errClass": "Queue Schedule Errors", - "errTitle": "Queue_Schedule_Initialization_Failure", + "errTitle": "Inner_Error_Queue_Scheduler_Init_Failed", "ErrCode": "EM9002", "ErrMessage": "Failed to initialize the queue_schedule process.", "Arglist": "", "suggestion": { - "Possible Cause": "N/A", - "Solution": "Submit an issue to request for support at https://gitee.com/ascend or contact Huawei technical support." + "Possible Cause": "The internal processing of the queue_schedule process is abnormal.", + "Solution": "Obtain the device log and contact technical support at https://www.hiascend.com/support." } }, { -- Gitee From fbf4ac0744c80372caf71a05cd7d33838ef72715 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=B5=87=E9=94=B4?= Date: Thu, 6 Nov 2025 22:29:57 +0800 Subject: [PATCH 3/6] fix missing header files in metadef run --- cmake/package.cmake | 11 +++++++++++ scripts/package/metadef/metadef.xml | 1 + scripts/package/module/ascend/MetadefInc.xml | 12 ++++++++++++ 3 files changed, 24 insertions(+) diff --git a/cmake/package.cmake b/cmake/package.cmake index cb6d0be889..186726b8ec 100644 --- a/cmake/package.cmake +++ b/cmake/package.cmake @@ -199,10 +199,17 @@ install(FILES ${CMAKE_SOURCE_DIR}/inc/external/base/registry/op_impl_space_regis ${CMAKE_SOURCE_DIR}/inc/external/base/registry/opp_package_utils.h DESTINATION metadef/pkg_inc/base/registry ) +install(FILES ${CMAKE_SOURCE_DIR}/pkg_inc/base/err_mgr.h + DESTINATION metadef/pkg_inc/base +) install(FILES ${CMAKE_SOURCE_DIR}/inc/external/base/context_builder/context_holder.h ${CMAKE_SOURCE_DIR}/inc/external/base/context_builder/op_context_builder_base.h ${CMAKE_SOURCE_DIR}/inc/external/base/context_builder/op_tiling_parse_context_builder.h ${CMAKE_SOURCE_DIR}/inc/external/base/context_builder/op_tiling_context_builder.h + ${CMAKE_SOURCE_DIR}/inc/external/base/context_builder/op_infer_datatype_context_builder.h + ${CMAKE_SOURCE_DIR}/inc/external/base/context_builder/op_infer_shape_context_builder.h + 
${CMAKE_SOURCE_DIR}/inc/external/base/context_builder/op_infer_shape_range_context_builder.h + ${CMAKE_SOURCE_DIR}/inc/external/base/context_builder/op_kernel_run_context_builder.h DESTINATION metadef/include/base/context_builder ) set(EXTERNAL_REGISTRY_FILES @@ -211,6 +218,10 @@ set(EXTERNAL_REGISTRY_FILES ${CMAKE_SOURCE_DIR}/inc/external/register/register_types.h ${CMAKE_SOURCE_DIR}/inc/external/register/register_fmk_types.h ${CMAKE_SOURCE_DIR}/inc/external/register/register_error_codes.h + ${CMAKE_SOURCE_DIR}/inc/external/register/op_ct_impl_kernel_registry.h + ${CMAKE_SOURCE_DIR}/inc/external/register/op_ct_impl_registry_api.h + ${CMAKE_SOURCE_DIR}/inc/external/register/op_ct_impl_registry.h + ${CMAKE_SOURCE_DIR}/inc/external/register/op_bin_info.h ) install(FILES ${EXTERNAL_REGISTRY_FILES} DESTINATION metadef/include/register diff --git a/scripts/package/metadef/metadef.xml b/scripts/package/metadef/metadef.xml index 80df6f7281..f706bbfa36 100644 --- a/scripts/package/metadef/metadef.xml +++ b/scripts/package/metadef/metadef.xml @@ -49,6 +49,7 @@ + diff --git a/scripts/package/module/ascend/MetadefInc.xml b/scripts/package/module/ascend/MetadefInc.xml index bd171d5c47..5d26c7099b 100644 --- a/scripts/package/module/ascend/MetadefInc.xml +++ b/scripts/package/module/ascend/MetadefInc.xml @@ -8,6 +8,7 @@ + @@ -75,15 +76,26 @@ + + + + + + + + + + + \ No newline at end of file -- Gitee From a40de0ceed57d40398df2d1ae119c8043fb656cd Mon Sep 17 00:00:00 2001 From: likun104 Date: Mon, 10 Nov 2025 09:56:00 +0800 Subject: [PATCH 4/6] fix metadef pkg install error --- scripts/package/metadef/metadef.xml | 11 ++++++++++- scripts/package/module/ascend/MetadefInc.xml | 10 +++++++--- scripts/package/module/ascend/MetadefSo.xml | 6 +++++- 3 files changed, 22 insertions(+), 5 deletions(-) diff --git a/scripts/package/metadef/metadef.xml b/scripts/package/metadef/metadef.xml index f706bbfa36..079de8ba0a 100644 --- a/scripts/package/metadef/metadef.xml +++ 
b/scripts/package/metadef/metadef.xml @@ -36,21 +36,30 @@ + + + + + + + - + + + diff --git a/scripts/package/module/ascend/MetadefInc.xml b/scripts/package/module/ascend/MetadefInc.xml index 5d26c7099b..89d2292afb 100644 --- a/scripts/package/module/ascend/MetadefInc.xml +++ b/scripts/package/module/ascend/MetadefInc.xml @@ -2,14 +2,18 @@ - + + - + + + + @@ -46,7 +50,7 @@ - + diff --git a/scripts/package/module/ascend/MetadefSo.xml b/scripts/package/module/ascend/MetadefSo.xml index 435dcac087..bec59d32e6 100644 --- a/scripts/package/module/ascend/MetadefSo.xml +++ b/scripts/package/module/ascend/MetadefSo.xml @@ -1,11 +1,15 @@ + - + + + + -- Gitee From b694e1f7a50fb8285fd3ab84c209a05b6664d4e2 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E9=99=88=E4=B8=80=E6=BA=90?= Date: Mon, 10 Nov 2025 13:51:55 +0000 Subject: [PATCH 5/6] =?UTF-8?q?!7109=20Export=20tilingdata=5Fbase.h=20Merg?= =?UTF-8?q?e=20pull=20request=20!7109=20from=20=E9=99=88=E4=B8=80=E6=BA=90?= =?UTF-8?q?/master?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- cmake/package.cmake | 1 + scripts/package/module/ascend/MetadefInc.xml | 1 + 2 files changed, 2 insertions(+) diff --git a/cmake/package.cmake b/cmake/package.cmake index 186726b8ec..e6354cb326 100644 --- a/cmake/package.cmake +++ b/cmake/package.cmake @@ -222,6 +222,7 @@ set(EXTERNAL_REGISTRY_FILES ${CMAKE_SOURCE_DIR}/inc/external/register/op_ct_impl_registry_api.h ${CMAKE_SOURCE_DIR}/inc/external/register/op_ct_impl_registry.h ${CMAKE_SOURCE_DIR}/inc/external/register/op_bin_info.h + ${CMAKE_SOURCE_DIR}/inc/external/register/tilingdata_base.h ) install(FILES ${EXTERNAL_REGISTRY_FILES} DESTINATION metadef/include/register diff --git a/scripts/package/module/ascend/MetadefInc.xml b/scripts/package/module/ascend/MetadefInc.xml index 89d2292afb..6d2876668b 100644 --- a/scripts/package/module/ascend/MetadefInc.xml +++ b/scripts/package/module/ascend/MetadefInc.xml @@ -84,6 +84,7 @@ + -- Gitee From 
53f46772ba1b440b189cd77776794b97a2506691 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=8F=B6=E9=BE=99=E5=89=91?= Date: Wed, 12 Nov 2025 14:24:19 +0800 Subject: [PATCH 6/6] Adjusting the subpackage content --- CMakeLists.txt | 2 +- cmake/package.cmake | 5 ----- scripts/package/metadef/metadef.xml | 3 +-- scripts/package/module/ascend/EngineeringCommon.xml | 1 + scripts/package/module/ascend/MetadefInc.xml | 8 +------- 5 files changed, 4 insertions(+), 15 deletions(-) diff --git a/CMakeLists.txt b/CMakeLists.txt index c866553fd6..9bc4ef4f6d 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -123,13 +123,13 @@ if (ENABLE_OPEN_SRC) find_package(msprof MODULE REQUIRED) find_package(SymEngine CONFIG REQUIRED) find_package(Boost CONFIG REQUIRED) + find_package(slog MODULE REQUIRED) else() include(cmake/third_party/json.cmake) endif() # 自研软件包 find_package(securec MODULE REQUIRED) - find_package(slog MODULE REQUIRED) find_package(unified_dlog MODULE REQUIRED) if (NOT (ENABLE_METADEF_UT OR ENABLE_METADEF_ST)) find_package(mmpa MODULE REQUIRED) diff --git a/cmake/package.cmake b/cmake/package.cmake index e6354cb326..1691e08908 100644 --- a/cmake/package.cmake +++ b/cmake/package.cmake @@ -168,12 +168,8 @@ set(EXTERNAL_GRAPH_FILES ${CMAKE_SOURCE_DIR}/inc/external/graph/ge_error_codes.h ${CMAKE_SOURCE_DIR}/inc/external/graph/infer_format_context.h ${CMAKE_SOURCE_DIR}/inc/external/graph/compiler_def.h - ${CMAKE_SOURCE_DIR}/inc/graph/op_desc.h ${CMAKE_SOURCE_DIR}/inc/external/graph/ascend_string.h ${CMAKE_SOURCE_DIR}/inc/external/graph/attr_value.h - ${CMAKE_SOURCE_DIR}/inc/external/graph/operator.h - ${CMAKE_SOURCE_DIR}/inc/external/graph/operator_factory.h - ${CMAKE_SOURCE_DIR}/inc/external/graph/resource_context.h ${CMAKE_SOURCE_DIR}/inc/external/graph/inference_context.h ${CMAKE_SOURCE_DIR}/inc/external/graph/types.h ) @@ -187,7 +183,6 @@ install(FILES ${CMAKE_SOURCE_DIR}/inc/external/utils/extern_math_util.h DESTINATION metadef/include/utils ) install(FILES 
${CMAKE_SOURCE_DIR}/inc/external/ge/ge_allocator.h - ${CMAKE_SOURCE_DIR}/inc/external/ge_common/ge_api_types.h DESTINATION metadef/include/ge ) install(FILES ${CMAKE_SOURCE_DIR}/inc/external/ge_common/ge_api_types.h diff --git a/scripts/package/metadef/metadef.xml b/scripts/package/metadef/metadef.xml index 079de8ba0a..f8a538d172 100644 --- a/scripts/package/metadef/metadef.xml +++ b/scripts/package/metadef/metadef.xml @@ -47,9 +47,9 @@ + - @@ -59,7 +59,6 @@ - diff --git a/scripts/package/module/ascend/EngineeringCommon.xml b/scripts/package/module/ascend/EngineeringCommon.xml index 6f974ee2de..50dfb85834 100644 --- a/scripts/package/module/ascend/EngineeringCommon.xml +++ b/scripts/package/module/ascend/EngineeringCommon.xml @@ -7,6 +7,7 @@ + diff --git a/scripts/package/module/ascend/MetadefInc.xml b/scripts/package/module/ascend/MetadefInc.xml index 6d2876668b..1cf464f9ae 100644 --- a/scripts/package/module/ascend/MetadefInc.xml +++ b/scripts/package/module/ascend/MetadefInc.xml @@ -1,7 +1,7 @@ - + @@ -13,7 +13,6 @@ - @@ -50,12 +49,8 @@ - - - - @@ -67,7 +62,6 @@ - -- Gitee