Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in / Register
Toggle navigation
O
opencv_contrib
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Packages
Packages
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
submodule
opencv_contrib
Commits
a2cab071
Commit
a2cab071
authored
Aug 22, 2017
by
sghoshcvc
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
DNN backend initial commit
parent
111b3bed
Expand all
Hide whitespace changes
Inline
Side-by-side
Showing
6 changed files
with
258 additions
and
8 deletions
+258
-8
CMakeLists.txt
modules/text/CMakeLists.txt
+9
-1
ocr.hpp
modules/text/include/opencv2/text/ocr.hpp
+7
-4
textDetector.hpp
modules/text/include/opencv2/text/textDetector.hpp
+2
-2
textbox_demo.cpp
modules/text/samples/textbox_demo.cpp
+2
-1
ocr_holistic.cpp
modules/text/src/ocr_holistic.cpp
+238
-0
text_detectorCNN.cpp
modules/text/src/text_detectorCNN.cpp
+0
-0
No files found.
modules/text/CMakeLists.txt
View file @
a2cab071
...
...
@@ -31,7 +31,7 @@ else()
message
(
STATUS
"Glog: NO"
)
endif
()
ocv_define_module
(
text opencv_ml opencv_imgproc opencv_core opencv_features2d opencv_calib3d WRAP python
)
ocv_define_module
(
text opencv_ml opencv_imgproc opencv_core opencv_features2d opencv_calib3d
OPTIONAL opencv_dnn
WRAP python
)
#ocv_define_module(text ${TEXT_DEPS} WRAP python)
#set(CMAKE_MODULE_PATH ${CMAKE_MODULE_PATH} ${CMAKE_CURRENT_SOURCE_DIR})
...
...
@@ -67,3 +67,11 @@ if()
else
()
message
(
STATUS
"TEXT CAFFE CONFLICT"
)
endif
()
if
(
HAVE_opencv_dnn
)
message
(
STATUS
"dnn module found"
)
add_definitions
(
-DHAVE_DNN
)
set
(
HAVE_DNN 1
)
else
()
message
(
STATUS
"dnn module not found"
)
endif
()
modules/text/include/opencv2/text/ocr.hpp
View file @
a2cab071
...
...
@@ -658,9 +658,12 @@ CV_EXPORTS_W Ptr<OCRBeamSearchDecoder::ClassifierCallback> loadOCRBeamSearchClas
//Classifiers should provide diferent backends
//For the moment only caffe is implemeted
enum
{
OCR_HOLISTIC_BACKEND_NONE
,
OCR_HOLISTIC_BACKEND_CAFFE
OCR_HOLISTIC_BACKEND_NONE
,
//No back end
OCR_HOLISTIC_BACKEND_DNN
,
// dnn backend opencv_dnn
OCR_HOLISTIC_BACKEND_CAFFE
,
// caffe based backend
OCR_HOLISTIC_BACKEND_DEFAULT
// to store default value based on environment
};
class
TextImageClassifier
;
...
...
@@ -831,7 +834,7 @@ public:
* @param backEnd integer parameter selecting the coputation framework. For now OCR_HOLISTIC_BACKEND_CAFFE is
* the only option
*/
CV_WRAP
static
Ptr
<
DeepCNN
>
create
(
String
archFilename
,
String
weightsFilename
,
Ptr
<
ImagePreprocessor
>
preprocessor
,
int
minibatchSz
=
100
,
int
backEnd
=
OCR_HOLISTIC_BACKEND_
CAFFE
);
CV_WRAP
static
Ptr
<
DeepCNN
>
create
(
String
archFilename
,
String
weightsFilename
,
Ptr
<
ImagePreprocessor
>
preprocessor
,
int
minibatchSz
=
100
,
int
backEnd
=
OCR_HOLISTIC_BACKEND_
DEFAULT
);
/** @brief Constructs a DeepCNN intended to be used for word spotting.
*
...
...
@@ -853,7 +856,7 @@ public:
* @param backEnd integer parameter selecting the coputation framework. For now OCR_HOLISTIC_BACKEND_CAFFE is
* the only option
*/
CV_WRAP
static
Ptr
<
DeepCNN
>
createDictNet
(
String
archFilename
,
String
weightsFilename
,
int
backEnd
=
OCR_HOLISTIC_BACKEND_
CAFFE
);
CV_WRAP
static
Ptr
<
DeepCNN
>
createDictNet
(
String
archFilename
,
String
weightsFilename
,
int
backEnd
=
OCR_HOLISTIC_BACKEND_
DEFAULT
);
};
...
...
modules/text/include/opencv2/text/textDetector.hpp
View file @
a2cab071
...
...
@@ -160,7 +160,7 @@ public:
* @param backEnd integer parameter selecting the coputation framework. For now OCR_HOLISTIC_BACKEND_CAFFE is
* the only option
*/
CV_WRAP
static
Ptr
<
DeepCNNTextDetector
>
create
(
String
archFilename
,
String
weightsFilename
,
Ptr
<
ImagePreprocessor
>
preprocessor
,
int
minibatchSz
=
100
,
int
backEnd
=
OCR_HOLISTIC_BACKEND_
CAFFE
);
CV_WRAP
static
Ptr
<
DeepCNNTextDetector
>
create
(
String
archFilename
,
String
weightsFilename
,
Ptr
<
ImagePreprocessor
>
preprocessor
,
int
minibatchSz
=
100
,
int
backEnd
=
OCR_HOLISTIC_BACKEND_
DEFAULT
);
/** @brief Constructs a DeepCNNTextDetector intended to be used for text area detection.
*
...
...
@@ -177,7 +177,7 @@ public:
* @param backEnd integer parameter selecting the coputation framework. For now OCR_HOLISTIC_BACKEND_CAFFE is
* the only option
*/
CV_WRAP
static
Ptr
<
DeepCNNTextDetector
>
createTextBoxNet
(
String
archFilename
,
String
weightsFilename
,
int
backEnd
=
OCR_HOLISTIC_BACKEND_
CAFFE
);
CV_WRAP
static
Ptr
<
DeepCNNTextDetector
>
createTextBoxNet
(
String
archFilename
,
String
weightsFilename
,
int
backEnd
=
OCR_HOLISTIC_BACKEND_
DEFAULT
);
friend
class
ImagePreprocessor
;
};
...
...
modules/text/samples/textbox_demo.cpp
View file @
a2cab071
...
...
@@ -59,9 +59,10 @@ void textbox_draw(cv::Mat &src, std::vector<cv::Rect> &groups,std::vector<float
int
main
(
int
argc
,
const
char
*
argv
[]){
if
(
!
cv
::
text
::
cnn_config
::
caffe_backend
::
getCaffeAvailable
()){
std
::
cout
<<
"The text module was compiled without Caffe which is the only available DeepCNN backend.
\n
Aborting!
\n
"
;
exit
(
1
);
//
exit(1);
}
//set to true if you have a GPU with more than 3GB
if
(
cv
::
text
::
cnn_config
::
caffe_backend
::
getCaffeAvailable
())
cv
::
text
::
cnn_config
::
caffe_backend
::
setCaffeGpuMode
(
true
);
if
(
argc
<
3
){
...
...
modules/text/src/ocr_holistic.cpp
View file @
a2cab071
...
...
@@ -21,6 +21,13 @@
#include "caffe/caffe.hpp"
#endif
#ifdef HAVE_DNN
#include "opencv2/dnn.hpp"
#endif
using
namespace
cv
;
using
namespace
cv
::
dnn
;
using
namespace
std
;
namespace
cv
{
namespace
text
{
//Maybe OpenCV has a routine better suited
...
...
@@ -47,6 +54,7 @@ void ImagePreprocessor::set_mean(Mat mean){
}
class
ResizerPreprocessor
:
public
ImagePreprocessor
{
protected
:
void
preprocess_
(
const
Mat
&
input
,
Mat
&
output
,
Size
outputSize
,
int
outputChannels
){
...
...
@@ -579,6 +587,183 @@ public:
}
};
class
DeepCNNOpenCvDNNImpl
:
public
DeepCNN
{
protected
:
void
classifyMiniBatch
(
std
::
vector
<
Mat
>
inputImageList
,
Mat
outputMat
)
{
//Classifies a list of images containing at most minibatchSz_ images
CV_Assert
(
int
(
inputImageList
.
size
())
<=
this
->
minibatchSz_
);
CV_Assert
(
outputMat
.
isContinuous
());
#ifdef HAVE_DNN
std
::
vector
<
Mat
>
preProcessedImList
;
// to store preprocessed images, should it be handled inside preprocessing class?
Mat
preprocessed
;
// preprocesses each image in the inputImageList and push to preprocessedImList
for
(
size_t
imgNum
=
0
;
imgNum
<
inputImageList
.
size
();
imgNum
++
)
{
this
->
preprocess
(
inputImageList
[
imgNum
],
preprocessed
);
preProcessedImList
.
push_back
(
preprocessed
);
}
// set input data blob in dnn::net
net_
->
setInput
(
blobFromImages
(
preProcessedImList
,
1
,
Size
(
100
,
32
)),
"data"
);
float
*
outputMatData
=
(
float
*
)(
outputMat
.
data
);
//Mat outputNet(inputImageList.size(),this->outputSize_,CV_32FC1,outputMatData) ;
Mat
outputNet
=
this
->
net_
->
forward
();
outputNet
=
outputNet
.
reshape
(
1
,
1
);
float
*
outputNetData
=
(
float
*
)(
outputNet
.
data
);
memcpy
(
outputMatData
,
outputNetData
,
sizeof
(
float
)
*
this
->
outputSize_
*
inputImageList
.
size
());
#endif
}
#ifdef HAVE_DNN
Ptr
<
Net
>
net_
;
#endif
//Size inputGeometry_;
int
minibatchSz_
;
//The existence of the assignment operator mandates this to be nonconst
int
outputSize_
;
public
:
DeepCNNOpenCvDNNImpl
(
const
DeepCNNOpenCvDNNImpl
&
dn
)
:
minibatchSz_
(
dn
.
minibatchSz_
),
outputSize_
(
dn
.
outputSize_
){
channelCount_
=
dn
.
channelCount_
;
inputGeometry_
=
dn
.
inputGeometry_
;
//Implemented to supress Visual Studio warning "assignment operator could not be generated"
#ifdef HAVE_DNN
this
->
net_
=
dn
.
net_
;
#endif
}
DeepCNNOpenCvDNNImpl
&
operator
=
(
const
DeepCNNOpenCvDNNImpl
&
dn
)
{
#ifdef HAVE_DNN
this
->
net_
=
dn
.
net_
;
#endif
this
->
setPreprocessor
(
dn
.
preprocessor_
);
this
->
inputGeometry_
=
dn
.
inputGeometry_
;
this
->
channelCount_
=
dn
.
channelCount_
;
this
->
minibatchSz_
=
dn
.
minibatchSz_
;
this
->
outputSize_
=
dn
.
outputSize_
;
this
->
preprocessor_
=
dn
.
preprocessor_
;
this
->
outputGeometry_
=
dn
.
outputGeometry_
;
return
*
this
;
//Implemented to supress Visual Studio warning "assignment operator could not be generated"
}
DeepCNNOpenCvDNNImpl
(
String
modelArchFilename
,
String
modelWeightsFilename
,
Ptr
<
ImagePreprocessor
>
preprocessor
,
int
maxMinibatchSz
)
:
minibatchSz_
(
maxMinibatchSz
)
{
CV_Assert
(
this
->
minibatchSz_
>
0
);
CV_Assert
(
fileExists
(
modelArchFilename
));
CV_Assert
(
fileExists
(
modelWeightsFilename
));
CV_Assert
(
!
preprocessor
.
empty
());
this
->
setPreprocessor
(
preprocessor
);
#ifdef HAVE_DNN
this
->
net_
=
makePtr
<
Net
>
(
readNetFromCaffe
(
modelArchFilename
,
modelWeightsFilename
));
if
(
this
->
net_
.
empty
())
{
std
::
cerr
<<
"Can't load network by using the following files: "
<<
std
::
endl
;
std
::
cerr
<<
"prototxt: "
<<
modelArchFilename
<<
std
::
endl
;
std
::
cerr
<<
"caffemodel: "
<<
modelWeightsFilename
<<
std
::
endl
;
//std::cerr << "bvlc_googlenet.caffemodel can be downloaded here:" << std::endl;
//std::cerr << "http://dl.caffe.berkeleyvision.org/bvlc_googlenet.caffemodel" << std::endl;
exit
(
-
1
);
}
// find a wa to check the followings in cv::dnn ???
// CV_Assert(net_->num_inputs()==1);
// CV_Assert(net_->num_outputs()==1);
// CV_Assert(this->net_->input_blobs()[0]->channels()==1
// ||this->net_->input_blobs()[0]->channels()==3);
// this->channelCount_=this->net_->input_blobs()[0]->channels();
//this->net_->CopyTrainedLayersFrom(modelWeightsFilename);
//caffe::Blob<float>* inputLayer = this->net_->input_blobs()[0];
//inputLayerId = net_->getLayerId('data');
// inputLayerShape = net_->getLayerShapes(const MatShape& netInputShape,
// inputLayerId,
// std::vector<MatShape>* inLayerShapes,
// std::vector<MatShape>* outLayerShapes) const;
// should not be hard coded ideally
this
->
inputGeometry_
=
Size
(
100
,
32
);
// Size(inputLayer->width(), inputLayer->height());
this
->
channelCount_
=
1
;
//inputLayer->channels();
//inputLayer->Reshape(this->minibatchSz_,this->channelCount_,this->inputGeometry_.height, this->inputGeometry_.width);
//net_->Reshape();
this
->
outputSize_
=
88172
;
//net_->output_blobs()[0]->channels();
this
->
outputGeometry_
=
Size
(
1
,
1
);
//Size(net_->output_blobs()[0]->width(),net_->output_blobs()[0]->height());
#else
CV_Error
(
Error
::
StsError
,
"DNN module not available during compilation!"
);
#endif
}
void
classify
(
InputArray
image
,
OutputArray
classProbabilities
)
{
std
::
vector
<
Mat
>
inputImageList
;
inputImageList
.
push_back
(
image
.
getMat
());
classifyBatch
(
inputImageList
,
classProbabilities
);
}
void
classifyBatch
(
InputArrayOfArrays
inputImageList
,
OutputArray
classProbabilities
)
{
std
::
vector
<
Mat
>
allImageVector
;
inputImageList
.
getMatVector
(
allImageVector
);
size_t
outputSize
=
size_t
(
this
->
outputSize_
);
//temporary variable to avoid int to size_t arithmentic
size_t
minibatchSize
=
size_t
(
this
->
minibatchSz_
);
//temporary variable to avoid int to size_t arithmentic
classProbabilities
.
create
(
Size
(
int
(
outputSize
),
int
(
allImageVector
.
size
())),
CV_32F
);
Mat
outputMat
=
classProbabilities
.
getMat
();
printf
(
"ekhane"
);
for
(
size_t
imgNum
=
0
;
imgNum
<
allImageVector
.
size
();
imgNum
+=
minibatchSize
)
{
size_t
rangeEnd
=
imgNum
+
std
::
min
<
size_t
>
(
allImageVector
.
size
()
-
imgNum
,
minibatchSize
);
std
::
vector
<
Mat
>::
const_iterator
from
=
std
::
vector
<
Mat
>::
const_iterator
(
allImageVector
.
begin
()
+
imgNum
);
std
::
vector
<
Mat
>::
const_iterator
to
=
std
::
vector
<
Mat
>::
const_iterator
(
allImageVector
.
begin
()
+
rangeEnd
);
std
::
vector
<
Mat
>
minibatchInput
(
from
,
to
);
classifyMiniBatch
(
minibatchInput
,
outputMat
.
rowRange
(
int
(
imgNum
),
int
(
rangeEnd
)));
}
}
int
getOutputSize
()
{
return
this
->
outputSize_
;
}
Size
getOutputGeometry
()
{
return
this
->
outputGeometry_
;
}
int
getMinibatchSize
()
{
return
this
->
minibatchSz_
;
}
int
getBackend
()
{
return
OCR_HOLISTIC_BACKEND_DNN
;
}
};
Ptr
<
DeepCNN
>
DeepCNN
::
create
(
String
archFilename
,
String
weightsFilename
,
Ptr
<
ImagePreprocessor
>
preprocessor
,
int
minibatchSz
,
int
backEnd
)
{
...
...
@@ -587,9 +772,25 @@ Ptr<DeepCNN> DeepCNN::create(String archFilename,String weightsFilename,Ptr<Imag
preprocessor
=
ImagePreprocessor
::
createResizer
();
}
switch
(
backEnd
){
case
OCR_HOLISTIC_BACKEND_DEFAULT
:
#ifdef HAVE_CAFFE
return
Ptr
<
DeepCNN
>
(
new
DeepCNNCaffeImpl
(
archFilename
,
weightsFilename
,
preprocessor
,
minibatchSz
));
#elif defined(HAVE_DNN)
return
Ptr
<
DeepCNN
>
(
new
DeepCNNOpenCvDNNImpl
(
archFilename
,
weightsFilename
,
preprocessor
,
minibatchSz
));
#else
CV_Error
(
Error
::
StsError
,
"DeepCNN::create backend not implemented"
);
return
Ptr
<
DeepCNN
>
();
#endif
break
;
case
OCR_HOLISTIC_BACKEND_CAFFE
:
return
Ptr
<
DeepCNN
>
(
new
DeepCNNCaffeImpl
(
archFilename
,
weightsFilename
,
preprocessor
,
minibatchSz
));
break
;
case
OCR_HOLISTIC_BACKEND_DNN
:
return
Ptr
<
DeepCNN
>
(
new
DeepCNNOpenCvDNNImpl
(
archFilename
,
weightsFilename
,
preprocessor
,
minibatchSz
));
break
;
case
OCR_HOLISTIC_BACKEND_NONE
:
default
:
CV_Error
(
Error
::
StsError
,
"DeepCNN::create backend not implemented"
);
...
...
@@ -603,9 +804,25 @@ Ptr<DeepCNN> DeepCNN::createDictNet(String archFilename,String weightsFilename,i
{
Ptr
<
ImagePreprocessor
>
preprocessor
=
ImagePreprocessor
::
createImageStandarizer
(
113
);
switch
(
backEnd
){
case
OCR_HOLISTIC_BACKEND_DEFAULT
:
#ifdef HAVE_CAFFE
return
Ptr
<
DeepCNN
>
(
new
DeepCNNCaffeImpl
(
archFilename
,
weightsFilename
,
preprocessor
,
100
));
#elif defined(HAVE_DNN)
return
Ptr
<
DeepCNN
>
(
new
DeepCNNOpenCvDNNImpl
(
archFilename
,
weightsFilename
,
preprocessor
,
100
));
#else
CV_Error
(
Error
::
StsError
,
"DeepCNN::create backend not implemented"
);
return
Ptr
<
DeepCNN
>
();
#endif
break
;
case
OCR_HOLISTIC_BACKEND_CAFFE
:
return
Ptr
<
DeepCNN
>
(
new
DeepCNNCaffeImpl
(
archFilename
,
weightsFilename
,
preprocessor
,
100
));
break
;
case
OCR_HOLISTIC_BACKEND_DNN
:
return
Ptr
<
DeepCNN
>
(
new
DeepCNNOpenCvDNNImpl
(
archFilename
,
weightsFilename
,
preprocessor
,
100
));
break
;
case
OCR_HOLISTIC_BACKEND_NONE
:
default
:
CV_Error
(
Error
::
StsError
,
"DeepCNN::create backend not implemented"
);
...
...
@@ -639,6 +856,27 @@ bool getCaffeAvailable()
{
return
true
;
}
#elif defined(HAVE_DNN)
bool
getCaffeGpuMode
()
{
CV_Error
(
Error
::
StsError
,
"Caffe not available during compilation!"
);
return
0
;
}
void
setCaffeGpuMode
(
bool
useGpu
)
{
CV_Error
(
Error
::
StsError
,
"Caffe not available during compilation!"
);
CV_Assert
(
useGpu
==
1
);
//Compilation directives force
}
bool
getCaffeAvailable
(){
return
0
;
}
bool
getDNNAvailable
(){
return
true
;
}
#else
...
...
modules/text/src/text_detectorCNN.cpp
View file @
a2cab071
This diff is collapsed.
Click to expand it.
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment