pytorch/torch/csrc/cuda/Stream.cpp
Shen Li 99d2743863 Move Stream.query() implementation down to C++ (#15737)
Summary:
See #15682

Pushing up this small PR to check if I am doing the right thing. If correct, more will follow for other Stream APIs. Questions will be added inline.
Pull Request resolved: https://github.com/pytorch/pytorch/pull/15737

Differential Revision: D13581400

Pulled By: mrshenli

fbshipit-source-id: 24afed7847b89b62f0692c79a101ec7ff9d9ee4d
2019-01-07 20:58:07 -08:00

116 lines
4.2 KiB
C++

#include <torch/csrc/cuda/Stream.h>
#include <torch/csrc/THP.h>
#include <torch/csrc/cuda/Module.h>
#include <c10/cuda/CUDAGuard.h>
#include <c10/cuda/CUDAStream.h>
#include <structmember.h>
#include <cuda_runtime_api.h>
PyObject *THCPStreamClass = nullptr;
static PyObject * THCPStream_pynew(PyTypeObject *type, PyObject *args, PyObject *kwargs)
{
HANDLE_TH_ERRORS
int current_device;
THCudaCheck(cudaGetDevice(&current_device));
int priority = 0;
uint64_t cdata = 0;
static char *kwlist[] = {"priority", "_cdata", nullptr};
if (!PyArg_ParseTupleAndKeywords(args, kwargs, "|iK", kwlist, &priority, &cdata)) {
return nullptr;
}
THPObjectPtr ptr(type->tp_alloc(type, 0));
if (!ptr) {
return nullptr;
}
at::cuda::CUDAStream stream =
cdata ?
at::cuda::CUDAStream::unpack(cdata) :
at::cuda::getStreamFromPool(/* isHighPriority */ priority < 0 ? true : false);
THCPStream* self = (THCPStream *)ptr.get();
self->cdata = stream.pack();
self->device = stream.device_index();
self->cuda_stream = stream.stream();
return (PyObject *)ptr.release();
END_HANDLE_TH_ERRORS
}
static PyObject * THCPStream_query(THCPStream *self) {
HANDLE_TH_ERRORS
return PyBool_FromLong(at::cuda::CUDAStream::unpack(self->cdata).query());
END_HANDLE_TH_ERRORS
}
static struct PyMemberDef THCPStream_members[] = {
{(char*)"_cdata", T_ULONGLONG, offsetof(THCPStream, cdata), READONLY, nullptr},
{(char*)"device", T_INT, offsetof(THCPStream, device), READONLY, nullptr},
{(char*)"cuda_stream", T_ULONGLONG, offsetof(THCPStream, cuda_stream), READONLY, nullptr},
{nullptr}
};
static PyMethodDef THCPStream_methods[] = {
{(char*)"query", (PyCFunction)THCPStream_query, METH_NOARGS, nullptr},
{nullptr}
};
PyTypeObject THCPStreamType = {
PyVarObject_HEAD_INIT(nullptr, 0)
"torch._C._CudaStreamBase", /* tp_name */
sizeof(THCPStream), /* tp_basicsize */
0, /* tp_itemsize */
0, /* tp_dealloc */
0, /* tp_print */
0, /* tp_getattr */
0, /* tp_setattr */
0, /* tp_reserved */
0, /* tp_repr */
0, /* tp_as_number */
0, /* tp_as_sequence */
0, /* tp_as_mapping */
0, /* tp_hash */
0, /* tp_call */
0, /* tp_str */
0, /* tp_getattro */
0, /* tp_setattro */
0, /* tp_as_buffer */
Py_TPFLAGS_DEFAULT | Py_TPFLAGS_BASETYPE, /* tp_flags */
nullptr, /* tp_doc */
0, /* tp_traverse */
0, /* tp_clear */
0, /* tp_richcompare */
0, /* tp_weaklistoffset */
0, /* tp_iter */
0, /* tp_iternext */
THCPStream_methods, /* tp_methods */
THCPStream_members, /* tp_members */
0, /* tp_getset */
0, /* tp_base */
0, /* tp_dict */
0, /* tp_descr_get */
0, /* tp_descr_set */
0, /* tp_dictoffset */
0, /* tp_init */
0, /* tp_alloc */
THCPStream_pynew, /* tp_new */
};
bool THCPStream_init(PyObject *module)
{
THCPStreamClass = (PyObject*)&THCPStreamType;
if (PyType_Ready(&THCPStreamType) < 0)
return false;
Py_INCREF(&THCPStreamType);
PyModule_AddObject(module, "_CudaStreamBase", (PyObject *)&THCPStreamType);
return true;
}