Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
OpenCV
opencv
提交
a9807d8f
O
opencv
项目概览
OpenCV
/
opencv
上一次同步 9 个月
通知
992
Star
71100
Fork
55581
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
O
opencv
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1
Issue
1
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
前往新版Gitcode,体验更适合开发者的 AI 搜索 >>
提交
a9807d8f
编写于
12月 28, 2017
作者:
D
Dmitry Kurtaev
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
Allocate new memory for optimized concat to prevent collisions.
Add a flag to disable memory reusing in dnn module.
上级
3542c98d
变更
2
隐藏空白更改
内联
并排
Showing
2 changed file
with
52 addition
and
49 deletion
+52
-49
modules/dnn/CMakeLists.txt
modules/dnn/CMakeLists.txt
+5
-0
modules/dnn/src/dnn.cpp
modules/dnn/src/dnn.cpp
+47
-49
未找到文件。
modules/dnn/CMakeLists.txt
浏览文件 @
a9807d8f
...
...
@@ -97,3 +97,8 @@ if(BUILD_PERF_TESTS)
endif
()
endif
()
endif
()
ocv_option
(
${
the_module
}
_REUSE_MEMORY
"Enable reusing strategy of memory management"
ON
)
if
(
${
the_module
}
_REUSE_MEMORY
)
add_definitions
(
-DREUSE_DNN_MEMORY=1
)
endif
()
modules/dnn/src/dnn.cpp
浏览文件 @
a9807d8f
...
...
@@ -367,43 +367,42 @@ public:
}
}
void
reuseOrCreate
(
const
MatShape
&
shape
,
const
LayerPin
&
lp
,
Mat
&
dst
,
bool
force
)
void
reuseOrCreate
(
const
MatShape
&
shape
,
const
LayerPin
&
lp
,
Mat
&
dst
)
{
#ifdef REUSE_DNN_MEMORY
Mat
bestBlob
;
LayerPin
bestBlobPin
;
if
(
!
force
)
{
std
::
map
<
LayerPin
,
Mat
>::
iterator
hostIt
;
std
::
map
<
LayerPin
,
int
>::
iterator
refIt
;
std
::
map
<
LayerPin
,
Mat
>::
iterator
hostIt
;
std
::
map
<
LayerPin
,
int
>::
iterator
refIt
;
const
int
targetTotal
=
total
(
shape
);
int
bestBlobTotal
=
INT_MAX
;
const
int
targetTotal
=
total
(
shape
);
int
bestBlobTotal
=
INT_MAX
;
for
(
hostIt
=
memHosts
.
begin
();
hostIt
!=
memHosts
.
end
();
++
hostIt
)
for
(
hostIt
=
memHosts
.
begin
();
hostIt
!=
memHosts
.
end
();
++
hostIt
)
{
refIt
=
refCounter
.
find
(
hostIt
->
first
);
// Use only blobs that had references before because if not,
// it might be used as output.
if
(
refIt
!=
refCounter
.
end
()
&&
refIt
->
second
==
0
)
{
refIt
=
refCounter
.
find
(
hostIt
->
first
);
// Use only blobs that had references before because if not,
// it might be used as output.
if
(
refIt
!=
refCounter
.
end
()
&&
refIt
->
second
==
0
)
Mat
&
unusedBlob
=
hostIt
->
second
;
if
(
unusedBlob
.
total
()
>=
targetTotal
&&
unusedBlob
.
total
()
<
bestBlobTotal
)
{
Mat
&
unusedBlob
=
hostIt
->
second
;
if
(
unusedBlob
.
total
()
>=
targetTotal
&&
unusedBlob
.
total
()
<
bestBlobTotal
)
{
bestBlobPin
=
hostIt
->
first
;
bestBlob
=
unusedBlob
;
bestBlobTotal
=
unusedBlob
.
total
();
}
bestBlobPin
=
hostIt
->
first
;
bestBlob
=
unusedBlob
;
bestBlobTotal
=
unusedBlob
.
total
();
}
}
}
if
(
!
bestBlob
.
empty
())
{
reuse
(
bestBlobPin
,
lp
);
dst
=
Mat
(
shape
,
CV_32F
,
bestBlob
.
data
);
dst
=
bestBlob
.
reshape
(
1
,
1
).
colRange
(
0
,
targetTotal
).
reshape
(
1
,
shape
);
}
else
#endif // REUSE_DNN_MEMORY
{
// if dst already has been allocated with total(shape) elements,
// it won't be recreated and pointer of dst.data remains the same.
...
...
@@ -412,34 +411,32 @@ public:
}
}
void
reuseOrCreate
(
const
MatShape
&
shape
,
const
LayerPin
&
lp
,
UMat
&
umat_dst
,
bool
force
)
void
reuseOrCreate
(
const
MatShape
&
shape
,
const
LayerPin
&
lp
,
UMat
&
umat_dst
)
{
#ifdef REUSE_DNN_MEMORY
UMat
bestBlob
;
LayerPin
bestBlobPin
;
if
(
!
force
)
{
std
::
map
<
LayerPin
,
UMat
>::
iterator
hostIt
;
std
::
map
<
LayerPin
,
int
>::
iterator
refIt
;
std
::
map
<
LayerPin
,
UMat
>::
iterator
hostIt
;
std
::
map
<
LayerPin
,
int
>::
iterator
refIt
;
const
int
targetTotal
=
total
(
shape
);
int
bestBlobTotal
=
INT_MAX
;
const
int
targetTotal
=
total
(
shape
);
int
bestBlobTotal
=
INT_MAX
;
for
(
hostIt
=
umat_memHosts
.
begin
();
hostIt
!=
umat_memHosts
.
end
();
++
hostIt
)
for
(
hostIt
=
umat_memHosts
.
begin
();
hostIt
!=
umat_memHosts
.
end
();
++
hostIt
)
{
refIt
=
refCounter
.
find
(
hostIt
->
first
);
// Use only blobs that had references before because if not,
// it might be used as output.
if
(
refIt
!=
refCounter
.
end
()
&&
refIt
->
second
==
0
)
{
refIt
=
refCounter
.
find
(
hostIt
->
first
);
// Use only blobs that had references before because if not,
// it might be used as output.
if
(
refIt
!=
refCounter
.
end
()
&&
refIt
->
second
==
0
)
UMat
&
unusedBlob
=
hostIt
->
second
;
if
(
unusedBlob
.
total
()
>=
targetTotal
&&
unusedBlob
.
total
()
<
bestBlobTotal
)
{
UMat
&
unusedBlob
=
hostIt
->
second
;
if
(
unusedBlob
.
total
()
>=
targetTotal
&&
unusedBlob
.
total
()
<
bestBlobTotal
)
{
bestBlobPin
=
hostIt
->
first
;
bestBlob
=
unusedBlob
;
bestBlobTotal
=
unusedBlob
.
total
();
}
bestBlobPin
=
hostIt
->
first
;
bestBlob
=
unusedBlob
;
bestBlobTotal
=
unusedBlob
.
total
();
}
}
}
...
...
@@ -449,6 +446,7 @@ public:
umat_dst
.
create
(
shape
,
CV_32F
);
}
else
#endif // REUSE_DNN_MEMORY
{
// if dst already has been allocated with total(shape) elements,
// it won't be recreated and pointer of dst.data remains the same.
...
...
@@ -458,8 +456,7 @@ public:
}
void
allocateBlobsForLayer
(
LayerData
&
ld
,
const
LayerShapes
&
layerShapes
,
std
::
vector
<
LayerPin
>&
pinsForInternalBlobs
,
bool
maximizeReuse
)
std
::
vector
<
LayerPin
>&
pinsForInternalBlobs
)
{
CV_TRACE_FUNCTION
();
bool
use_umat
=
(
preferableBackend
==
DNN_BACKEND_DEFAULT
&&
...
...
@@ -530,7 +527,6 @@ public:
}
std
::
map
<
int
,
std
::
vector
<
int
>
>::
reverse_iterator
it
;
bool
force
=
!
maximizeReuse
&&
ld
.
inputBlobsId
.
size
()
>
1
;
for
(
it
=
idxSizes
.
rbegin
();
it
!=
idxSizes
.
rend
();
it
++
)
{
for
(
int
j
=
0
;
j
<
it
->
second
.
size
();
j
++
)
...
...
@@ -539,7 +535,7 @@ public:
if
(
total
(
shapes
[
index
]))
{
LayerPin
blobPin
(
ld
.
id
,
index
);
if
(
index
<
outShapes
.
size
()
&&
inPlace
&&
!
force
)
if
(
index
<
outShapes
.
size
()
&&
inPlace
)
{
if
(
use_umat
)
{
...
...
@@ -558,9 +554,9 @@ public:
else
{
if
(
use_umat
)
reuseOrCreate
(
shapes
[
index
],
blobPin
,
*
umat_blobs
[
index
]
,
force
);
reuseOrCreate
(
shapes
[
index
],
blobPin
,
*
umat_blobs
[
index
]);
else
reuseOrCreate
(
shapes
[
index
],
blobPin
,
*
blobs
[
index
]
,
force
);
reuseOrCreate
(
shapes
[
index
],
blobPin
,
*
blobs
[
index
]);
}
}
}
...
...
@@ -1111,8 +1107,7 @@ struct Net::Impl
CV_Assert
(
layerShapesIt
!=
layersShapes
.
end
());
std
::
vector
<
LayerPin
>
pinsForInternalBlobs
;
bool
maximizeReuse
=
preferableBackend
==
DNN_BACKEND_HALIDE
;
blobManager
.
allocateBlobsForLayer
(
ld
,
layerShapesIt
->
second
,
pinsForInternalBlobs
,
maximizeReuse
);
blobManager
.
allocateBlobsForLayer
(
ld
,
layerShapesIt
->
second
,
pinsForInternalBlobs
);
ld
.
outputBlobsWrappers
.
resize
(
ld
.
outputBlobs
.
size
());
for
(
int
i
=
0
;
i
<
ld
.
outputBlobs
.
size
();
++
i
)
{
...
...
@@ -1415,6 +1410,9 @@ struct Net::Impl
if
(
i
>=
ninputs
)
{
// Allocate new memory to prevent collisions during memory
// reusing (see https://github.com/opencv/opencv/pull/10456).
output
=
output
.
clone
();
Range
chrange
[]
=
{
Range
::
all
(),
Range
::
all
(),
Range
::
all
(),
Range
::
all
()
};
int
ofs
=
0
;
for
(
i
=
0
;
i
<
ninputs
;
i
++
)
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录