mirror of
https://github.com/zebrajr/pytorch.git
synced 2025-12-07 00:21:07 +01:00
Summary: from caffe2.python import workspace; p = workspace.Predictor(init_net, predict_net); outputs = p.run(inputs) Reviewed By: Yangqing Differential Revision: D4576793 fbshipit-source-id: b829bbcaf2e7c34dad85024177433207bd96a234
463 lines
14 KiB
Python
463 lines
14 KiB
Python
import contextlib
|
|
from google.protobuf.message import Message
|
|
from multiprocessing import Process
|
|
import os
|
|
import shutil
|
|
import socket
|
|
import tempfile
|
|
import logging
|
|
|
|
import numpy as np
|
|
from caffe2.proto import caffe2_pb2
|
|
from caffe2.python import scope, utils
|
|
|
|
import caffe2.python._import_c_extension as C
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
Blobs = C.blobs
|
|
CreateBlob = C.create_blob
|
|
CurrentWorkspace = C.current_workspace
|
|
DeserializeBlob = C.deserialize_blob
|
|
GlobalInit = C.global_init
|
|
HasBlob = C.has_blob
|
|
RegisteredOperators = C.registered_operators
|
|
SerializeBlob = C.serialize_blob
|
|
SwitchWorkspace = C.switch_workspace
|
|
RootFolder = C.root_folder
|
|
Workspaces = C.workspaces
|
|
BenchmarkNet = C.benchmark_net
|
|
Predictor = C.Predictor
|
|
|
|
is_asan = C.is_asan
|
|
has_gpu_support = C.has_gpu_support
|
|
if has_gpu_support:
|
|
NumCudaDevices = C.num_cuda_devices
|
|
SetDefaultGPUID = C.set_default_gpu_id
|
|
GetDefaultGPUID = C.get_default_gpu_id
|
|
GetCuDNNVersion = C.get_cudnn_version
|
|
|
|
def GetCudaPeerAccessPattern():
|
|
return np.asarray(C.get_cuda_peer_access_pattern())
|
|
else:
|
|
NumCudaDevices = lambda: 0 # noqa
|
|
SetDefaultGPUID = lambda x: None # noqa
|
|
GetDefaultGPUID = lambda: 0 # noqa
|
|
GetCuDNNVersion = lambda: 0 # noqa
|
|
GetCudaPeerAccessPattern = lambda: np.array([]) # noqa
|
|
|
|
|
|
# Python 2 and 3 compatibility: test if basestring exists
|
|
try:
|
|
basestring # NOQA
|
|
except NameError:
|
|
# This is python3 so we define basestring.
|
|
basestring = str
|
|
|
|
|
|
def _GetFreeFlaskPort():
|
|
"""Get a free flask port."""
|
|
# We will prefer to use 5000. If not, we will then pick a random port.
|
|
sock = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
|
|
result = sock.connect_ex(('127.0.0.1', 5000))
|
|
if result == 0:
|
|
return 5000
|
|
else:
|
|
s = socket.socket()
|
|
s.bind(('', 0))
|
|
port = s.getsockname()[1]
|
|
s.close()
|
|
# Race condition: between the interval we close the socket and actually
|
|
# start a mint process, another process might have occupied the port. We
|
|
# don't do much here as this is mostly for convenience in research
|
|
# rather than 24x7 service.
|
|
return port
|
|
|
|
|
|
def StartMint(root_folder=None, port=None):
|
|
"""Start a mint instance.
|
|
|
|
TODO(Yangqing): this does not work well under ipython yet. According to
|
|
https://github.com/ipython/ipython/issues/5862
|
|
writing up some fix is a todo item.
|
|
"""
|
|
from caffe2.python.mint import app
|
|
if root_folder is None:
|
|
# Get the root folder from the current workspace
|
|
root_folder = C.root_folder()
|
|
if port is None:
|
|
port = _GetFreeFlaskPort()
|
|
process = Process(
|
|
target=app.main,
|
|
args=(
|
|
['-p', str(port), '-r', root_folder],
|
|
)
|
|
)
|
|
process.start()
|
|
print('Mint running at http://{}:{}'.format(socket.getfqdn(), port))
|
|
return process
|
|
|
|
|
|
def StringifyProto(obj):
|
|
"""Stringify a protocol buffer object.
|
|
|
|
Inputs:
|
|
obj: a protocol buffer object, or a Pycaffe2 object that has a Proto()
|
|
function.
|
|
Outputs:
|
|
string: the output protobuf string.
|
|
Raises:
|
|
AttributeError: if the passed in object does not have the right attribute.
|
|
"""
|
|
if type(obj) is str:
|
|
return obj
|
|
else:
|
|
if isinstance(obj, Message):
|
|
# First, see if this object is a protocol buffer, which we can
|
|
# simply serialize with the SerializeToString() call.
|
|
return obj.SerializeToString()
|
|
elif hasattr(obj, 'Proto'):
|
|
return obj.Proto().SerializeToString()
|
|
else:
|
|
raise ValueError("Unexpected argument to StringifyProto of type " +
|
|
type(obj).__name__)
|
|
|
|
|
|
def ResetWorkspace(root_folder=None):
|
|
if root_folder is None:
|
|
# Reset the workspace, but keep the current root folder setting.
|
|
return C.reset_workspace(C.root_folder())
|
|
else:
|
|
if not os.path.exists(root_folder):
|
|
os.makedirs(root_folder)
|
|
return C.reset_workspace(root_folder)
|
|
|
|
|
|
def CreateNet(net, input_blobs=None):
|
|
if input_blobs is None:
|
|
input_blobs = []
|
|
for input_blob in input_blobs:
|
|
C.create_blob(input_blob)
|
|
return C.create_net(StringifyProto(net))
|
|
|
|
|
|
def RunOperatorOnce(operator):
|
|
return C.run_operator_once(StringifyProto(operator))
|
|
|
|
|
|
def RunOperatorsOnce(operators):
|
|
for op in operators:
|
|
success = RunOperatorOnce(op)
|
|
if not success:
|
|
return False
|
|
return True
|
|
|
|
|
|
def RunNetOnce(net):
|
|
return C.run_net_once(StringifyProto(net))
|
|
|
|
|
|
def RunNet(name, num_iter=1):
|
|
"""Runs a given net.
|
|
|
|
Inputs:
|
|
name: the name of the net, or a reference to the net.
|
|
num_iter: number of iterations to run
|
|
Returns:
|
|
True or an exception.
|
|
"""
|
|
return C.run_net(StringifyNetName(name), num_iter)
|
|
|
|
|
|
def RunPlan(plan_or_step):
|
|
# TODO(jiayq): refactor core.py/workspace.py to avoid circular deps
|
|
import caffe2.python.core as core
|
|
if isinstance(plan_or_step, core.ExecutionStep):
|
|
plan_or_step = core.Plan(plan_or_step)
|
|
return C.run_plan(StringifyProto(plan_or_step))
|
|
|
|
|
|
def InferShapesAndTypes(nets, blob_dimensions=None):
|
|
"""Infers the shapes and types for the specified nets.
|
|
|
|
Inputs:
|
|
nets: the list of nets
|
|
blob_dimensions (optional): a dictionary of blobs and their dimensions.
|
|
If not specified, the workspace blobs are used.
|
|
Returns:
|
|
A tuple of (shapes, types) dictionaries keyed by blob name.
|
|
"""
|
|
net_protos = [StringifyProto(n.Proto()) for n in nets]
|
|
if blob_dimensions is None:
|
|
blobdesc_prototxt = C.infer_shapes_and_types_from_workspace(net_protos)
|
|
else:
|
|
blobdesc_prototxt = C.infer_shapes_and_types_from_map(
|
|
net_protos, blob_dimensions
|
|
)
|
|
blobdesc_proto = caffe2_pb2.TensorShapes()
|
|
blobdesc_proto.ParseFromString(blobdesc_prototxt)
|
|
shapes = {}
|
|
types = {}
|
|
for ts in blobdesc_proto.shapes:
|
|
if not ts.unknown_shape:
|
|
shapes[ts.name] = list(ts.dims)
|
|
types[ts.name] = ts.data_type
|
|
|
|
return (shapes, types)
|
|
|
|
|
|
def _StringifyName(name, expected_type):
|
|
if isinstance(name, basestring):
|
|
return name
|
|
assert type(name).__name__ == expected_type, \
|
|
"Expected a string or %s" % expected_type
|
|
return str(name)
|
|
|
|
|
|
def StringifyBlobName(name):
|
|
return _StringifyName(name, "BlobReference")
|
|
|
|
|
|
def StringifyNetName(name):
|
|
return _StringifyName(name, "Net")
|
|
|
|
|
|
def FeedBlob(name, arr, device_option=None):
|
|
"""Feeds a blob into the workspace.
|
|
|
|
Inputs:
|
|
name: the name of the blob.
|
|
arr: either a TensorProto object or a numpy array object to be fed into
|
|
the workspace.
|
|
device_option (optional): the device option to feed the data with.
|
|
Returns:
|
|
True or False, stating whether the feed is successful.
|
|
"""
|
|
if type(arr) is caffe2_pb2.TensorProto:
|
|
arr = utils.Caffe2TensorToNumpyArray(arr)
|
|
if type(arr) is np.ndarray and arr.dtype.kind == 'S':
|
|
# Plain NumPy strings are weird, let's use objects instead
|
|
arr = arr.astype(np.object)
|
|
|
|
if device_option is None:
|
|
device_option = scope.CurrentDeviceScope()
|
|
|
|
if device_option and device_option.device_type == caffe2_pb2.CUDA:
|
|
if arr.dtype == np.dtype('float64'):
|
|
logger.warning(
|
|
"CUDA operators do not support 64-bit doubles, " +
|
|
"please use arr.astype(np.float32) or np.int32 for ints." +
|
|
" Blob: {}".format(name) +
|
|
" type: {}".format(str(arr.dtype))
|
|
)
|
|
|
|
name = StringifyBlobName(name)
|
|
if device_option is not None:
|
|
return C.feed_blob(name, arr, StringifyProto(device_option))
|
|
else:
|
|
return C.feed_blob(name, arr)
|
|
|
|
|
|
def FetchBlobs(names):
|
|
"""Fetches a list of blobs from the workspace.
|
|
|
|
Inputs:
|
|
names: list of names of blobs - strings or BlobReferences
|
|
Returns:
|
|
list of fetched blobs
|
|
"""
|
|
return [FetchBlob(name) for name in names]
|
|
|
|
|
|
def FetchBlob(name):
|
|
"""Fetches a blob from the workspace.
|
|
|
|
Inputs:
|
|
name: the name of the blob - a string or a BlobReference
|
|
Returns:
|
|
Fetched blob (numpy array or string) if successful
|
|
"""
|
|
return C.fetch_blob(StringifyBlobName(name))
|
|
|
|
|
|
def GetNameScope():
|
|
"""Return the current namescope string. To be used to fetch blobs"""
|
|
return scope.CurrentNameScope()
|
|
|
|
|
|
class _BlobDict(object):
|
|
"""Provides python dict compatible way to do fetching and feeding"""
|
|
|
|
def __getitem__(self, key):
|
|
return FetchBlob(key)
|
|
|
|
def __setitem__(self, key, value):
|
|
return FeedBlob(key, value)
|
|
|
|
def __len__(self):
|
|
return len(C.blobs())
|
|
|
|
def __iter__(self):
|
|
return C.blobs().__iter__()
|
|
|
|
def __contains__(self, item):
|
|
return C.has_blob(item)
|
|
|
|
|
|
blobs = _BlobDict()
|
|
|
|
|
|
################################################################################
|
|
# Utilities for immediate mode
|
|
#
|
|
# Caffe2's immediate mode implements the following behavior: between the two
|
|
# function calls StartImmediate() and StopImmediate(), for any operator that is
|
|
# called through CreateOperator(), we will also run that operator in a workspace
|
|
# that is specific to the immediate mode. The user is explicitly expected to
|
|
# make sure that these ops have proper inputs and outputs, i.e. one should not
|
|
# run an op where an external input is not created or fed.
|
|
#
|
|
# Users can use FeedImmediate() and FetchImmediate() to interact with blobs
|
|
# in the immediate workspace.
|
|
#
|
|
# Once StopImmediate() is called, all contents in the immediate workspace is
|
|
# freed up so one can continue using normal runs.
|
|
#
|
|
# The immediate mode is solely for debugging purposes and support will be very
|
|
# sparse.
|
|
################################################################################
|
|
|
|
_immediate_mode = False
|
|
_immediate_workspace_name = "_CAFFE2_IMMEDIATE"
|
|
_immediate_root_folder = ''
|
|
|
|
|
|
def IsImmediate():
|
|
return _immediate_mode
|
|
|
|
|
|
@contextlib.contextmanager
|
|
def WorkspaceGuard(workspace_name):
|
|
current = CurrentWorkspace()
|
|
SwitchWorkspace(workspace_name, True)
|
|
yield
|
|
SwitchWorkspace(current)
|
|
|
|
|
|
def StartImmediate(i_know=False):
|
|
global _immediate_mode
|
|
global _immediate_root_folder
|
|
if IsImmediate():
|
|
# already in immediate mode. We will kill the previous one
|
|
# and start from fresh.
|
|
StopImmediate()
|
|
_immediate_mode = True
|
|
with WorkspaceGuard(_immediate_workspace_name):
|
|
_immediate_root_folder = tempfile.mkdtemp()
|
|
ResetWorkspace(_immediate_root_folder)
|
|
if i_know:
|
|
# if the user doesn't want to see the warning message, sure...
|
|
return
|
|
print("""
|
|
Enabling immediate mode in caffe2 python is an EXTREMELY EXPERIMENTAL
|
|
feature and may very easily go wrong. This is because Caffe2 uses a
|
|
declarative way of defining operators and models, which is essentially
|
|
not meant to run things in an interactive way. Read the following carefully
|
|
to make sure that you understand the caveats.
|
|
|
|
(1) You need to make sure that the sequences of operators you create are
|
|
actually runnable sequentially. For example, if you create an op that takes
|
|
an input X, somewhere earlier you should have already created X.
|
|
|
|
(2) Caffe2 immediate uses one single workspace, so if the set of operators
|
|
you run are intended to be under different workspaces, they will not run.
|
|
To create boundaries between such use cases, you can call FinishImmediate()
|
|
and StartImmediate() manually to flush out everything no longer needed.
|
|
|
|
(3) Underlying objects held by the immediate mode may interfere with your
|
|
normal run. For example, if there is a leveldb that you opened in immediate
|
|
mode and did not close, your main run will fail because leveldb does not
|
|
support double opening. Immediate mode may also occupy a lot of memory esp.
|
|
on GPUs. Call FinishImmediate() as soon as possible when you no longer
|
|
need it.
|
|
|
|
(4) Immediate is designed to be slow. Every immediate call implicitly
|
|
creates a temp operator object, runs it, and destroys the operator. This
|
|
slow-speed run is by design to discourage abuse. For most use cases other
|
|
than debugging, do NOT turn on immediate mode.
|
|
|
|
(5) If there is anything FATAL happening in the underlying C++ code, the
|
|
immediate mode will immediately (pun intended) cause the runtime to crash.
|
|
|
|
Thus you should use immediate mode with extra care. If you still would
|
|
like to, have fun [https://xkcd.com/149/].
|
|
""")
|
|
|
|
|
|
def StopImmediate():
|
|
"""Stops an immediate mode run."""
|
|
# Phew, that was a dangerous ride.
|
|
global _immediate_mode
|
|
global _immediate_root_folder
|
|
if not IsImmediate():
|
|
return
|
|
with WorkspaceGuard(_immediate_workspace_name):
|
|
ResetWorkspace()
|
|
shutil.rmtree(_immediate_root_folder)
|
|
_immediate_root_folder = ''
|
|
_immediate_mode = False
|
|
|
|
|
|
def ImmediateBlobs():
|
|
with WorkspaceGuard(_immediate_workspace_name):
|
|
return Blobs()
|
|
|
|
|
|
def RunOperatorImmediate(op):
|
|
with WorkspaceGuard(_immediate_workspace_name):
|
|
RunOperatorOnce(op)
|
|
|
|
|
|
def FetchImmediate(*args, **kwargs):
|
|
with WorkspaceGuard(_immediate_workspace_name):
|
|
return FetchBlob(*args, **kwargs)
|
|
|
|
|
|
def FeedImmediate(*args, **kwargs):
|
|
with WorkspaceGuard(_immediate_workspace_name):
|
|
return FeedBlob(*args, **kwargs)
|
|
|
|
|
|
# CWorkspace utilities
|
|
|
|
def _Workspace_create_net(ws, net):
|
|
return ws._create_net(StringifyProto(net))
|
|
|
|
|
|
C.Workspace.create_net = _Workspace_create_net
|
|
|
|
|
|
def _Workspace_run(ws, obj):
|
|
if hasattr(obj, 'Proto'):
|
|
obj = obj.Proto()
|
|
if isinstance(obj, caffe2_pb2.PlanDef):
|
|
return ws._run_plan(obj.SerializeToString())
|
|
if isinstance(obj, caffe2_pb2.NetDef):
|
|
return ws._run_net(obj.SerializeToString())
|
|
if isinstance(obj, caffe2_pb2.OperatorDef):
|
|
return ws._run_operator(obj.SerializeToString())
|
|
raise ValueError(
|
|
"Don't know how to do Workspace.run() on {}".format(type(obj)))
|
|
|
|
|
|
C.Workspace.run = _Workspace_run
|
|
|
|
|
|
def _Blob_feed(blob, arg, device_option=None):
|
|
if device_option is not None:
|
|
device_option = StringifyProto(device_option)
|
|
return blob._feed(arg, device_option)
|
|
|
|
|
|
C.Blob.feed = _Blob_feed
|