tfcheckpoint2pytorch.py

import os
import sys
import glob
import json
import argparse
import tempfile
import shutil
import tarfile
import zipfile
import collections

import numpy as np
import tensorflow

try:
    from tensorflow.python.pywrap_tensorflow import NewCheckpointReader
except:
    from tensorflow.compat.v1.train import NewCheckpointReader

from tensorflow.python.framework import meta_graph
from tensorflow.core.framework import types_pb2

parser = argparse.ArgumentParser()
parser.add_argument('-i', '--checkpoint')
parser.add_argument('-o', '--output_path', default = '')
parser.add_argument('--tmp', default = tempfile.mkdtemp())
parser.add_argument('--identityop', action = 'append', default = [])
parser.add_argument('--ignoreattr', action = 'append', default = [])
parser.add_argument('--input_name', action = 'append', default = [])
parser.add_argument('--input_shape', action = 'append', nargs = '+', type = int)
parser.add_argument('--input_dtype', action = 'append', type = str)
parser.add_argument('--output_name', action = 'append', default = [])
parser.add_argument('--opset', default = 10, type = int)
parser.add_argument('--onnx')
parser.add_argument('--tensorboard')
parser.add_argument('--graph')
args = parser.parse_args()

if args.checkpoint.endswith('.tar.gz') or args.checkpoint.endswith('.tar'):
    checkpoint_dir = args.tmp
    tarfile.open(args.checkpoint).extractall(checkpoint_dir)
    files = [os.path.join(checkpoint_dir, d) for d in os.listdir(checkpoint_dir)]
    checkpoint_dir = files[0] if os.path.isdir(files[0]) else checkpoint_dir
elif args.checkpoint.endswith('.zip'):
    checkpoint_dir = args.tmp
    zipfile.ZipFile(args.checkpoint).extractall(checkpoint_dir)
    files = [os.path.join(checkpoint_dir, d) for d in os.listdir(checkpoint_dir)]
    checkpoint_dir = files[0] if os.path.isdir(files[0]) else checkpoint_dir
else:
    checkpoint_dir = args.checkpoint

reader = NewCheckpointReader(tensorflow.train.latest_checkpoint(checkpoint_dir))
blobs = {k : reader.get_tensor(k) for k in reader.get_variable_to_shape_map()}
		
if args.output_path.endswith('.json'):
    with open(args.output_path, 'w') as f:
        json.dump({k : blob.tolist() for k, blob in blobs.items()}, f, sort_keys = True, indent = 2)
elif args.output_path.endswith('.h5'):
    import h5py
    with h5py.File(args.output_path, 'w') as h:
        h.update(**blobs)
elif args.output_path.endswith('.npy') or args.output_path.endswith('.npz'):
    (np.savez if args.output_path[-1] == 'z' else numpy.save)(args.output_path, **blobs)
elif args.output_path.endswith('.pt'):
    import torch
    torch.save({k : (torch.as_tensor(blob) if not np.isscalar(blob) else torch.tensor(blob)  )  if isinstance(blob, np.ndarray) else blob for k, blob in blobs.items()}, args.output_path)

if args.onnx or args.tensorboard or args.graph:
	meta_graph_file = glob.glob(os.path.join(checkpoint_dir, '*.meta'))[0]
	graph_def = meta_graph.read_meta_graph_file(meta_graph_file).graph_def

	if args.graph or (not args.input_name) or (args.onnx and not args.output_name):
		print('\n'.join(sorted(f'{v.name} <- {v.op}(' + ', '.join(v.input) for v in graph_def.node)) + ')', file = None if not args.graph else open(args.graph, 'w'))
		sys.exit(0)

	for v in graph_def.node:
		if any(name in v.name for name in args.identityop):
			v.op = 'Identity'
			for a in set(v.attr.keys()) - set(['T']):
				del v.attr[a]

	with_port_id = lambda n: n if ':' in n else n + ':0'
	without_port_id = lambda n: n.split(':')[0]
	port_id = lambda n: int(n.split(':')[1]) if ':' in n else 0

	def input_type_shape(n):
		port = port_id(n)
		name = without_port_id(n)
		i = args.input_name.index(n)
		nodes = [v for v in graph_def.node if name in v.name]

		shape = [None if d == -1 else d for d in args.input_shape[i]] if args.input_shape else [None if d.size == -1 else d.size for d in nodes[0].attr['output_shapes'].list.shape[port].dim]
		dtype = getattr(tensorflow, args.input_dtype[i]) if args.input_dtype else nodes[0].attr['output_types'].list.type[port]

		return dtype, shape

	input_map = {with_port_id(a) : tensorflow.placeholder(*input_type_shape(a), name = without_port_id(a)) for a in args.input_name}

	input_names = [with_port_id(a.name) for a in input_map.values()]
	output_names = [with_port_id(o) for o in args.output_name]

if args.tensorboard or args.onnx:
	tensorflow.import_graph_def(graph_def, input_map = input_map)
	graph = tensorflow.get_default_graph()

if args.tensorboard:
	shutil.rmtree(args.tensorboard, ignore_errors = True)
	tensorflow.summary.FileWriter(args.tensorboard, graph = graph).close()
	
if args.onnx:
	import onnx, tf2onnx
	tf2onnx.utils.TF_TO_ONNX_DTYPE[types_pb2.DT_VARIANT] = tf2onnx.utils.TF_TO_ONNX_DTYPE[types_pb2.DT_FLOAT]
	for t in dir(types_pb2):
		if t.endswith('_REF'):
			tf2onnx.utils.TF_TO_ONNX_DTYPE[getattr(types_pb2, t)] = tf2onnx.utils.TF_TO_ONNX_DTYPE.get(getattr(types_pb2, t[:-len('_REF')], None))
	onnx.helper.make_node = lambda *args_, make_node_ = onnx.helper.make_node, **kwargs_: make_node_(*args_, **{k: v for k, v in kwargs_.items() if k not in args.ignoreattr})
	onnx_graph = tf2onnx.tfonnx.process_tf_graph(graph, input_names = input_names, output_names = ['import/' + o for o in output_names], continue_on_error = True, opset = args.opset)

	model_proto = onnx_graph.make_model(os.path.basename(args.onnx))
	#model_proto = tf2onnx.graph.GraphUtil.optimize_model_proto(model_proto)

	with open(args.onnx, "wb") as f:
		f.write(model_proto.SerializeToString())