diff --git a/profiler/cluster_analyse/analysis/cluster_net_checker/README.md b/profiler/cluster_analyse/analysis/cluster_net_checker/README.md new file mode 100644 index 0000000000000000000000000000000000000000..712bb336c1fda32a113393b751c7a2c44c70f59e --- /dev/null +++ b/profiler/cluster_analyse/analysis/cluster_net_checker/README.md @@ -0,0 +1,37 @@ +# 网络工具demo + + +## 功能 + +1. 网络拓扑展示 + + a. 支持万卡+拓扑展示(选择并展示集群中特定通信域拓扑) + + b. 通信域信息准确(从训练中采集) + + c. 物理拓扑获取(调研中) + + +2. 问题rank分析 + + a. 快慢卡 + + b. 慢链路 + + c. rank指标排序 + + +## 使用流程 + +采集+分析+可视化 + +1. 采集: + - profiling工具动态采集 + - 插入到mindspeed的patch代码(获取并行信息,并使用mstx将并行信息写入profiling db) + +2. 分析: + - cluster_net_checker.py + +3. 可视化: + - 快速穿刺版本 stats.ipynb + - 未来使用 insight \ No newline at end of file diff --git a/profiler/cluster_analyse/analysis/cluster_net_checker/__init__.py b/profiler/cluster_analyse/analysis/cluster_net_checker/__init__.py new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/profiler/cluster_analyse/analysis/cluster_net_checker/cluster_net_checker.py b/profiler/cluster_analyse/analysis/cluster_net_checker/cluster_net_checker.py new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/profiler/cluster_analyse/analysis/cluster_net_checker/stats.ipynb b/profiler/cluster_analyse/analysis/cluster_net_checker/stats.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/profiler/cluster_analyse/cluster_statistics_export/cluster_net_checker_export.py b/profiler/cluster_analyse/cluster_statistics_export/cluster_net_checker_export.py new file mode 100644 index 0000000000000000000000000000000000000000..43b5e68b970a656ada47dae61863bf817749eb2d --- /dev/null +++ b/profiler/cluster_analyse/cluster_statistics_export/cluster_net_checker_export.py @@ -0,0 +1,27 @@ +# Copyright (c) 2024, Huawei Technologies Co., 
Ltd. +# All rights reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from cluster_statistics_export.stats_export import StatsExport + + +# NOTE(review): QUERY appears to contain only a newline (no query text yet) - confirm before relying on this export. +QUERY = """ +""" + + +class ClusterNetCheckerExport(StatsExport): + """StatsExport subclass whose query is the module-level QUERY.""" + + def __init__(self, db_path, recipe_name): + """Forward db_path and recipe_name to StatsExport.__init__, then set self._query to QUERY.""" + super().__init__(db_path, recipe_name) + # Assigned after the base initializer runs; how StatsExport consumes _query is not visible here. + self._query = QUERY \ No newline at end of file