Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add dygraph component #1077

Merged
merged 11 commits into from
Jun 21, 2022
Merged
Show file tree
Hide file tree
Changes from 3 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
13 changes: 13 additions & 0 deletions .pre-commit-config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -33,3 +33,16 @@ repos:
hooks:
- id: check-hooks-apply
- id: check-useless-excludes
- repo: https://github.com/asottile/reorder_python_imports
rev: v2.4.0
hooks:
- id: reorder-python-imports

- repo: local
hooks:
- id: yapf
name: yapf
entry: yapf
language: system
args: [-i, --style .style.yapf]
files: \.py$
19 changes: 19 additions & 0 deletions visualdl/component/graph/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,19 @@
# Copyright (c) 2022 VisualDL Authors. All Rights Reserve.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# =======================================================================
from .exporter import translate_graph
from .graph_component import analyse_model
from .netron_graph import Model

__all__ = ['translate_graph', 'analyse_model', 'Model']
37 changes: 37 additions & 0 deletions visualdl/component/graph/exporter.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,37 @@
# Copyright (c) 2022 VisualDL Authors. All Rights Reserve.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# =======================================================================
import json
import os
import tempfile

from .graph_component import analyse_model
from .utils import create_opname_scope


def translate_graph(model, input_spec, verbose=True):
import paddle
with tempfile.TemporaryDirectory() as tmp:
model._full_name = '{}[{}]'.format(model.__class__.__name__, "model")
create_opname_scope(model)
paddle.jit.save(model, os.path.join(tmp, 'temp'), input_spec)
model_data = open(os.path.join(tmp, 'temp.pdmodel'), 'rb').read()
result = analyse_model(model_data)
if verbose:
from paddle.framework import core
ProgramDesc = core.ProgramDesc
program_desc = ProgramDesc(model_data)
print(program_desc)
result = json.dumps(result, indent=2)
return result
319 changes: 319 additions & 0 deletions visualdl/component/graph/graph_component.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,319 @@
# Copyright (c) 2022 VisualDL Authors. All Rights Reserve.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# =======================================================================
import collections
import os.path
import re

from paddle.framework import core
AttrType = core.AttrType

attr_type_name = {
AttrType.INT: "INT",
AttrType.INTS: "INTS",
AttrType.LONG: "LONG",
AttrType.LONGS: "LONGS",
AttrType.FLOAT: "FLOAT",
AttrType.FLOATS: "FLOATS",
AttrType.STRING: "STRING",
AttrType.STRINGS: "STRINGS",
AttrType.BOOL: "BOOL",
AttrType.BOOLS: "BOOLS",
AttrType.BLOCK: "BLOCK",
AttrType.BLOCKS: "BLOCKS"
}

_graph_version = '1.0.0'


def analyse_model(model_pb):
ProgramDesc = core.ProgramDesc
from paddle.utils.unique_name import generate
program_desc = ProgramDesc(model_pb)
all_ops = {}
all_vars = {}
all_edges = {}
op_inputvars_dict = collections.defaultdict(list)
op_outputvars_dict = collections.defaultdict(list)
for i in range(program_desc.num_blocks()):
block_desc = program_desc.block(i)
# vars info
for i, var_desc in enumerate(block_desc.all_vars()):
try:
var_name = var_desc.name()
all_vars[var_name] = {}
all_vars[var_name]['name'] = var_name
all_vars[var_name]['shape'] = var_desc.shape()
all_vars[var_name]['type'] = str(var_desc.type())
all_vars[var_name]['dtype'] = str(var_desc.dtype())
all_vars[var_name]['value'] = []
all_vars[var_name]['persistable'] = var_desc.persistable()
attr_dict = {}
for attr_name in var_desc.attr_names():
attr_dict[attr_name] = var_desc.attr(attr_name)
all_vars[var_name]['attrs'] = attr_dict
all_vars[var_name]['from_node'] = ''
all_vars[var_name]['to_nodes'] = []

except Exception:
# feed, fetch var
var_name = var_desc.name()
all_vars[var_name] = {}
all_vars[var_name]['name'] = var_name
all_vars[var_name]['shape'] = ''
all_vars[var_name]['type'] = str(var_desc.type())
all_vars[var_name]['dtype'] = ''
all_vars[var_name]['value'] = []
all_vars[var_name]['persistable'] = var_desc.persistable()
attr_dict = {}
for attr_name in var_desc.attr_names():
attr_dict[attr_name] = var_desc.attr(attr_name)
all_vars[var_name]['attrs'] = attr_dict
all_vars[var_name]['from_node'] = ''
all_vars[var_name]['to_nodes'] = []

# ops info
for i in range(block_desc.op_size()):
op_desc = block_desc.op(i)
op_name = op_desc.attr('op_namescope') + generate(
str(op_desc.type()))
all_ops[op_name] = {}
all_ops[op_name]['name'] = op_name
all_ops[op_name]['show_name'] = re.sub(r'\[(\w|\.)*\]', '',
op_name)
all_ops[op_name]['type'] = str(op_desc.type())
all_ops[op_name]['input_vars'] = {}
all_ops[op_name]['is_leaf_node'] = True
for input_name, variable_list in op_desc.inputs().items():
all_ops[op_name]['input_vars'][input_name] = variable_list
op_inputvars_dict[op_name].extend(variable_list)
# fill var 'to_nodes'
for variable_name in variable_list:
all_vars[variable_name]['to_nodes'].append(op_name)
all_ops[op_name]['output_vars'] = {}
for output_name, variable_list in op_desc.outputs().items():
all_ops[op_name]['output_vars'][output_name] = variable_list
op_outputvars_dict[op_name].extend(variable_list)
# fill var 'from_node'
for variable_name in variable_list:
all_vars[variable_name]['from_node'] = op_name

attr_dict = {}
attr_type_dict = {}
for attr_name in op_desc.attr_names():
attr_dict[attr_name] = op_desc.attr(attr_name)
attr_type_dict[attr_name] = attr_type_name[op_desc.attr_type(
attr_name)]
all_ops[op_name]['attrs'] = attr_dict
all_ops[op_name]['attr_types'] = attr_type_dict
all_ops[op_name]['children_node'] = []
all_ops[op_name]['input_nodes'] = []
all_ops[op_name]['output_nodes'] = []
all_ops[op_name]['edge_input_nodes'] = []
all_ops[op_name]['edge_output_nodes'] = []
# second pass, create non-leaf nodes, fill 'parent_node', 'children_nodes' of nodes.
for variable_name in all_vars:
if all_vars[variable_name]['from_node'] == '':
continue
# some variable's input and output node are the same, we should prevent to show this situation as a cycle
from_node_name = all_vars[variable_name]['from_node']
for to_node_name in all_vars[variable_name]['to_nodes']:
if to_node_name != from_node_name:
all_ops[from_node_name]['output_nodes'].append(
to_node_name)
all_ops[to_node_name]['input_nodes'].append(from_node_name)

general_children_dict = collections.defaultdict(set)

def create_non_leaf_nodes(parent_node_name, child_node_name):
if parent_node_name == '/' or parent_node_name == '': # root node
parent_node_name = '/'
if parent_node_name not in all_ops:
all_ops[parent_node_name] = {}
all_ops[parent_node_name]['children_node'] = set()
all_ops[parent_node_name]['name'] = parent_node_name
all_ops[parent_node_name]['show_name'] = os.path.dirname(
all_ops[child_node_name]['show_name'])
all_ops[parent_node_name]['attrs'] = {}
all_ops[parent_node_name]['input_nodes'] = set()
all_ops[parent_node_name]['output_nodes'] = set()
all_ops[parent_node_name]['type'] = os.path.basename(
all_ops[parent_node_name]['show_name'])
all_ops[parent_node_name]['input_vars'] = set()
all_ops[parent_node_name]['output_vars'] = set()
all_ops[parent_node_name]['parent_node'] = ''
all_ops[parent_node_name]['edge_input_nodes'] = []
all_ops[parent_node_name]['edge_output_nodes'] = []
all_ops[parent_node_name]['is_leaf_node'] = False

all_ops[child_node_name]['parent_node'] = parent_node_name
all_ops[parent_node_name]['children_node'].add(child_node_name)
general_children_dict[parent_node_name].add(child_node_name)
general_children_dict[parent_node_name].update(
general_children_dict[child_node_name])
if parent_node_name == '/': # root node
return
else:
create_non_leaf_nodes(
os.path.dirname(parent_node_name), parent_node_name)

def construct_edges(var_name):
'''
Construct path edges from var's from_node to to_nodes.
Algorithm:
1. Judge if src_node and dst_node have the same parent node, if yes, link them directly
and fill information in all_edges, return.
2. Find the closest common ancestor, repeat link node and its parent until reach the common ancestor.
Every time construct a new edge, fill information in all_edges.
'''
from_node = all_vars[var_name]['from_node']
to_nodes = all_vars[var_name]['to_nodes']

def _construct_edge(src_node, dst_node):
if all_ops[src_node]['parent_node'] == all_ops[dst_node][
'parent_node']:
if (src_node, dst_node) not in all_edges:
all_edges[(src_node, dst_node)] = {
'from_node': src_node,
'to_node': dst_node,
'vars': {var_name},
'label': ''
}
else:
all_edges[(src_node, dst_node)]['vars'].add(var_name)
else:
common_ancestor = os.path.commonpath([src_node, dst_node])
src_base_node = src_node
while True:
parent_node = all_ops[src_base_node]['parent_node']
if parent_node == common_ancestor:
break
if (src_base_node, parent_node) not in all_edges:
all_edges[(src_base_node, parent_node)] = {
'from_node': src_base_node,
'to_node': parent_node,
'vars': {var_name},
'label': ''
}
else:
all_edges[(src_base_node,
parent_node)]['vars'].add(var_name)
src_base_node = parent_node
dst_base_node = dst_node
while True:
parent_node = all_ops[dst_base_node]['parent_node']
if parent_node == common_ancestor:
break
if (parent_node, dst_base_node) not in all_edges:
all_edges[(parent_node, dst_base_node)] = {
'from_node': parent_node,
'to_node': dst_base_node,
'vars': {var_name},
'label': ''
}
else:
all_edges[(parent_node,
dst_base_node)]['vars'].add(var_name)
dst_base_node = parent_node
if (src_base_node, dst_base_node) not in all_edges:
all_edges[(src_base_node, dst_base_node)] = {
'from_node': src_base_node,
'to_node': dst_base_node,
'vars': {var_name},
'label': ''
}
else:
all_edges[(src_base_node,
dst_base_node)]['vars'].add(var_name)
return

if from_node and to_nodes:
for to_node in to_nodes:
if from_node == to_node:
continue
_construct_edge(from_node, to_node)

all_op_names = list(all_ops.keys())
for op_name in all_op_names:
create_non_leaf_nodes(os.path.dirname(op_name), op_name)

# fill all non-leaf node's 'output_nodes' 'input_nodes' 'output_vars' 'input_vars'
# post-order traverse tree
post_order_results = []

def post_order_traverse(root):
for child in all_ops[root]['children_node']:
post_order_traverse(child)
nonlocal post_order_results
post_order_results.append(root)
return

post_order_traverse('/')

for op_name in post_order_results:
op = all_ops[op_name]
op['children_node'] = list(op['children_node'])

if op['children_node']:
for child_op in op['children_node']:
for input_node in all_ops[child_op]['input_nodes']:
if input_node in general_children_dict[op_name]:
continue
else:
op['input_nodes'].add(input_node)
for output_node in all_ops[child_op]['output_nodes']:
if output_node in general_children_dict[op_name]:
continue
else:
op['output_nodes'].add(output_node)
for input_var in op_inputvars_dict[child_op]:
if all_vars[input_var][
'from_node'] not in general_children_dict[
op_name]:
op['input_vars'].add(input_var)
for output_var in op_outputvars_dict[child_op]:
for to_node_name in all_vars[output_var]['to_nodes']:
if to_node_name not in general_children_dict[
op_name]:
op['output_vars'].add(output_var)
op['input_nodes'] = list(op['input_nodes'])
op['output_nodes'] = list(op['output_nodes'])
op_inputvars_dict[op_name] = list(op['input_vars'])
op_outputvars_dict[op_name] = list(op['output_vars'])
op['input_vars'] = {'X': list(op['input_vars'])}
op['output_vars'] = {'Y': list(op['output_vars'])}

# Supplement edges and 'edge_input_nodes', 'edge_output_nodes' in op to help draw in frontend
for var_name in all_vars.keys():
construct_edges(var_name)

for src_node, to_node in all_edges.keys():
all_ops[src_node]['edge_output_nodes'].append(to_node)
all_ops[to_node]['edge_input_nodes'].append(src_node)
all_edges[(src_node, to_node)]['vars'] = list(
all_edges[(src_node, to_node)]['vars'])
if len(all_edges[(src_node, to_node)]['vars']) > 1:
all_edges[(src_node, to_node)]['label'] = str(
len(all_edges[(src_node, to_node)]['vars'])) + ' tensors'
elif len(all_edges[(src_node, to_node)]['vars']) == 1:
all_edges[(src_node, to_node)]['label'] = str(
all_vars[all_edges[(src_node, to_node)]['vars'][0]]['shape'])

final_data = {
'version': _graph_version,
'nodes': list(all_ops.values()),
'vars': list(all_vars.values()),
'edges': list(all_edges.values())
}
return final_data
Loading