Skip to content
Snippets Groups Projects
Commit 02b56294 authored by Nicolas Pope's avatar Nicolas Pope
Browse files

Actually use streams in operators

parent a68d53fb
No related branches found
No related tags found
1 merge request!165Implements #224 to use discontinuity mask
Pipeline #16324 passed
...@@ -99,6 +99,7 @@ class Graph : public ftl::Configurable { ...@@ -99,6 +99,7 @@ class Graph : public ftl::Configurable {
private: private:
std::list<ftl::operators::detail::OperatorNode> operators_; std::list<ftl::operators::detail::OperatorNode> operators_;
std::map<std::string, ftl::Configurable*> configs_; std::map<std::string, ftl::Configurable*> configs_;
cudaStream_t stream_;
ftl::Configurable *_append(ftl::operators::detail::ConstructionHelperBase*); ftl::Configurable *_append(ftl::operators::detail::ConstructionHelperBase*);
}; };
......
...@@ -12,6 +12,8 @@ ColourChannels::~ColourChannels() { ...@@ -12,6 +12,8 @@ ColourChannels::~ColourChannels() {
} }
bool ColourChannels::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd::Source *s, cudaStream_t stream) { bool ColourChannels::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd::Source *s, cudaStream_t stream) {
auto cvstream = cv::cuda::StreamAccessor::wrapStream(stream);
// Convert colour from BGR to BGRA if needed // Convert colour from BGR to BGRA if needed
if (in.get<cv::cuda::GpuMat>(Channel::Colour).type() == CV_8UC3) { if (in.get<cv::cuda::GpuMat>(Channel::Colour).type() == CV_8UC3) {
//cv::cuda::Stream cvstream = cv::cuda::StreamAccessor::wrapStream(stream); //cv::cuda::Stream cvstream = cv::cuda::StreamAccessor::wrapStream(stream);
...@@ -19,7 +21,7 @@ bool ColourChannels::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgb ...@@ -19,7 +21,7 @@ bool ColourChannels::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgb
auto &col = in.get<cv::cuda::GpuMat>(Channel::Colour); auto &col = in.get<cv::cuda::GpuMat>(Channel::Colour);
temp_.create(col.size(), CV_8UC4); temp_.create(col.size(), CV_8UC4);
cv::cuda::swap(col, temp_); cv::cuda::swap(col, temp_);
cv::cuda::cvtColor(temp_,col, cv::COLOR_BGR2BGRA, 0); cv::cuda::cvtColor(temp_,col, cv::COLOR_BGR2BGRA, 0, cvstream);
} }
return true; return true;
......
...@@ -22,7 +22,7 @@ bool ScanFieldFill::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd ...@@ -22,7 +22,7 @@ bool ScanFieldFill::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd
in.createTexture<float>(Channel::Depth), in.createTexture<float>(Channel::Depth),
in.createTexture<float>(Channel::Smoothing), in.createTexture<float>(Channel::Smoothing),
thresh, thresh,
s->parameters(), 0 s->parameters(), stream
); );
return true; return true;
......
...@@ -13,19 +13,13 @@ __global__ void discontinuity_kernel(ftl::cuda::TextureObject<int> mask_out, ftl ...@@ -13,19 +13,13 @@ __global__ void discontinuity_kernel(ftl::cuda::TextureObject<int> mask_out, ftl
const float d = depth.tex2D((int)x, (int)y); const float d = depth.tex2D((int)x, (int)y);
// Calculate depth between 0.0 and 1.0
//float p = (d - params.minDepth) / (params.maxDepth - params.minDepth);
if (d >= params.minDepth && d <= params.maxDepth) { if (d >= params.minDepth && d <= params.maxDepth) {
/* Orts-Escolano S. et al. 2016. Holoportation: Virtual 3D teleportation in real-time. */ /* Orts-Escolano S. et al. 2016. Holoportation: Virtual 3D teleportation in real-time. */
// Is there a discontinuity nearby?
//for (int u=-RADIUS; u<=RADIUS; ++u) {
// for (int v=-RADIUS; v<=RADIUS; ++v) {
// If yes, the flag using w = -1
// if (fabs(depth.tex2D((int)x+u, (int)y+v) - d) > 0.1f) mask.isDiscontinuity(true);
// }
//}
// If colour cross support region terminates within the requested
// radius, and the absolute depth difference on the other side is
// greater than threshold, then is is a discontinuity.
// Repeat for left, right, up and down.
const uchar4 sup = support.tex2D((int)x, (int)y); const uchar4 sup = support.tex2D((int)x, (int)y);
if (sup.x <= radius) { if (sup.x <= radius) {
float dS = depth.tex2D((int)x - sup.x - radius, (int)y); float dS = depth.tex2D((int)x - sup.x - radius, (int)y);
......
...@@ -28,7 +28,7 @@ bool Normals::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd::Sour ...@@ -28,7 +28,7 @@ bool Normals::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd::Sour
ftl::cuda::normals( ftl::cuda::normals(
out.createTexture<float4>(Channel::Normals, ftl::rgbd::Format<float4>(in.get<cv::cuda::GpuMat>(Channel::Depth).size())), out.createTexture<float4>(Channel::Normals, ftl::rgbd::Format<float4>(in.get<cv::cuda::GpuMat>(Channel::Depth).size())),
in.createTexture<float>(Channel::Depth), in.createTexture<float>(Channel::Depth),
s->parameters(), 0 s->parameters(), stream
); );
return true; return true;
......
...@@ -31,16 +31,18 @@ bool Operator::apply(FrameSet &in, Frame &out, Source *os, cudaStream_t stream) ...@@ -31,16 +31,18 @@ bool Operator::apply(FrameSet &in, Frame &out, Source *os, cudaStream_t stream)
Graph::Graph(nlohmann::json &config) : ftl::Configurable(config) { Graph::Graph(nlohmann::json &config) : ftl::Configurable(config) {
cudaSafeCall( cudaStreamCreate(&stream_) );
} }
Graph::~Graph() { Graph::~Graph() {
cudaStreamDestroy(stream_);
} }
bool Graph::apply(FrameSet &in, FrameSet &out, cudaStream_t stream) { bool Graph::apply(FrameSet &in, FrameSet &out, cudaStream_t stream) {
if (!value("enabled", true)) return false; if (!value("enabled", true)) return false;
auto stream_actual = (stream == 0) ? stream_ : stream;
if (in.frames.size() != out.frames.size()) return false; if (in.frames.size() != out.frames.size()) return false;
for (auto &i : operators_) { for (auto &i : operators_) {
...@@ -53,11 +55,16 @@ bool Graph::apply(FrameSet &in, FrameSet &out, cudaStream_t stream) { ...@@ -53,11 +55,16 @@ bool Graph::apply(FrameSet &in, FrameSet &out, cudaStream_t stream) {
auto *instance = i.instances[j]; auto *instance = i.instances[j];
if (instance->enabled()) { if (instance->enabled()) {
instance->apply(in.frames[j], out.frames[j], in.sources[j], stream); instance->apply(in.frames[j], out.frames[j], in.sources[j], stream_actual);
} }
} }
} }
if (stream == 0) {
cudaStreamSynchronize(stream_actual);
cudaSafeCall( cudaGetLastError() );
}
return true; return true;
} }
......
...@@ -22,7 +22,7 @@ bool CrossSupport::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd: ...@@ -22,7 +22,7 @@ bool CrossSupport::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd:
out.createTexture<uchar4>(Channel::Support2, ftl::rgbd::Format<uchar4>(in.get<cv::cuda::GpuMat>(Channel::Colour).size())), out.createTexture<uchar4>(Channel::Support2, ftl::rgbd::Format<uchar4>(in.get<cv::cuda::GpuMat>(Channel::Colour).size())),
config()->value("depth_tau", 0.04f), config()->value("depth_tau", 0.04f),
config()->value("v_max", 5), config()->value("v_max", 5),
config()->value("h_max", 5), 0 config()->value("h_max", 5), stream
); );
} //else { } //else {
ftl::cuda::support_region( ftl::cuda::support_region(
...@@ -30,7 +30,7 @@ bool CrossSupport::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd: ...@@ -30,7 +30,7 @@ bool CrossSupport::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd:
out.createTexture<uchar4>(Channel::Support1, ftl::rgbd::Format<uchar4>(in.get<cv::cuda::GpuMat>(Channel::Colour).size())), out.createTexture<uchar4>(Channel::Support1, ftl::rgbd::Format<uchar4>(in.get<cv::cuda::GpuMat>(Channel::Colour).size())),
config()->value("tau", 5.0f), config()->value("tau", 5.0f),
config()->value("v_max", 5), config()->value("v_max", 5),
config()->value("h_max", 5), 0 config()->value("h_max", 5), stream
); );
//} //}
...@@ -62,7 +62,7 @@ bool VisCrossSupport::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rg ...@@ -62,7 +62,7 @@ bool VisCrossSupport::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rg
in.createTexture<float>(Channel::Depth), in.createTexture<float>(Channel::Depth),
in.createTexture<uchar4>(Channel::Support1), in.createTexture<uchar4>(Channel::Support1),
in.createTexture<uchar4>(Channel::Support2), in.createTexture<uchar4>(Channel::Support2),
0 stream
); );
} else { } else {
ftl::cuda::vis_support_region( ftl::cuda::vis_support_region(
...@@ -74,7 +74,7 @@ bool VisCrossSupport::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rg ...@@ -74,7 +74,7 @@ bool VisCrossSupport::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rg
config()->value("offset_y", 0), config()->value("offset_y", 0),
config()->value("spacing_x", 50), config()->value("spacing_x", 50),
config()->value("spacing_y", 50), config()->value("spacing_y", 50),
0 stream
); );
if (show_depth) { if (show_depth) {
...@@ -87,7 +87,7 @@ bool VisCrossSupport::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rg ...@@ -87,7 +87,7 @@ bool VisCrossSupport::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rg
config()->value("offset_y", 0), config()->value("offset_y", 0),
config()->value("spacing_x", 50), config()->value("spacing_x", 50),
config()->value("spacing_y", 50), config()->value("spacing_y", 50),
0 stream
); );
} }
} }
......
...@@ -33,7 +33,7 @@ bool HFSmoother::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd::S ...@@ -33,7 +33,7 @@ bool HFSmoother::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd::S
in.createTexture<float>(Channel::Energy, ftl::rgbd::Format<float>(in.get<cv::cuda::GpuMat>(Channel::Depth).size())), in.createTexture<float>(Channel::Energy, ftl::rgbd::Format<float>(in.get<cv::cuda::GpuMat>(Channel::Depth).size())),
in.createTexture<float>(Channel::Smoothing, ftl::rgbd::Format<float>(in.get<cv::cuda::GpuMat>(Channel::Depth).size())), in.createTexture<float>(Channel::Smoothing, ftl::rgbd::Format<float>(in.get<cv::cuda::GpuMat>(Channel::Depth).size())),
var_thresh, var_thresh,
s->parameters(), 0 s->parameters(), stream
); );
} }
...@@ -158,7 +158,7 @@ bool SimpleMLS::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd::So ...@@ -158,7 +158,7 @@ bool SimpleMLS::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd::So
thresh, thresh,
radius, radius,
s->parameters(), s->parameters(),
0 stream
); );
in.swapChannels(Channel::Depth, Channel::Depth2); in.swapChannels(Channel::Depth, Channel::Depth2);
...@@ -204,7 +204,7 @@ bool ColourMLS::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd::So ...@@ -204,7 +204,7 @@ bool ColourMLS::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd::So
col_smooth, col_smooth,
radius, radius,
s->parameters(), s->parameters(),
0 stream
); );
} else { } else {
ftl::cuda::colour_mls_smooth_csr( ftl::cuda::colour_mls_smooth_csr(
...@@ -218,7 +218,7 @@ bool ColourMLS::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd::So ...@@ -218,7 +218,7 @@ bool ColourMLS::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd::So
col_smooth, col_smooth,
filling, filling,
s->parameters(), s->parameters(),
0 stream
); );
} }
...@@ -259,7 +259,7 @@ bool AdaptiveMLS::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd:: ...@@ -259,7 +259,7 @@ bool AdaptiveMLS::apply(ftl::rgbd::Frame &in, ftl::rgbd::Frame &out, ftl::rgbd::
in.createTexture<float>(Channel::Smoothing), in.createTexture<float>(Channel::Smoothing),
radius, radius,
s->parameters(), s->parameters(),
0 stream
); );
in.swapChannels(Channel::Depth, Channel::Depth2); in.swapChannels(Channel::Depth, Channel::Depth2);
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment