/*M///////////////////////////////////////////////////////////////////////////////////////
//
//  IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING.
//
//  By downloading, copying, installing or using the software you agree to this license.
//  If you do not agree to this license, do not download, install,
//  copy or use the software.
//
//
//                           License Agreement
//                For Open Source Computer Vision Library
//
// Copyright (C) 2014, Itseez Inc, all rights reserved.
// Third party copyrights are property of their respective owners.
//
// Redistribution and use in source and binary forms, with or without modification,
// are permitted provided that the following conditions are met:
//
//   * Redistribution's of source code must retain the above copyright notice,
//     this list of conditions and the following disclaimer.
//
//   * Redistribution's in binary form must reproduce the above copyright notice,
//     this list of conditions and the following disclaimer in the documentation
//     and/or other materials provided with the distribution.
//
//   * The name of the copyright holders may not be used to endorse or promote products
//     derived from this software without specific prior written permission.
//
// This software is provided by the copyright holders and contributors "as is" and
// any express or implied warranties, including, but not limited to, the implied
// warranties of merchantability and fitness for a particular purpose are disclaimed.
// In no event shall the Itseez Inc or contributors be liable for any direct,
// indirect, incidental, special, exemplary, or consequential damages
// (including, but not limited to, procurement of substitute goods or services;
// loss of use, data, or profits; or business interruption) however caused
// and on any theory of liability, whether in contract, strict liability,
// or tort (including negligence or otherwise) arising in any way out of
// the use of this software, even if advised of the possibility of such damage.
//
//M*/

#include "opencv2/datasets/tr_icdar.hpp"
#include "opencv2/datasets/util.hpp"

#include <sstream>
#include <fstream>


namespace cv
{
namespace datasets
{

using namespace std;

class TR_icdarImp CV_FINAL : public TR_icdar
{
public:
    TR_icdarImp() {}
    //TR_icdarImp(const string &path);
    virtual ~TR_icdarImp() CV_OVERRIDE {}

    virtual void load(const string &path) CV_OVERRIDE;

private:
    void loadDataset(const string &path);

    void objParseFiles(const string &path, int img_id, vector<Ptr <Object> > &out);
};

void TR_icdarImp::objParseFiles(const string &path, int img_id, vector<Ptr <Object> > &out)
{
    Ptr<TR_icdarObj> curr(new TR_icdarObj);

    stringstream fileName;
    fileName << "img_" << img_id << ".jpg";
    curr->fileName = fileName.str();

    stringstream gtFileName;
    gtFileName << path << "/gt_img_" << img_id << ".txt";
    ifstream infile(gtFileName.str().c_str());
    if (!infile.is_open()) CV_Error(Error::StsBadArg, gtFileName.str().c_str());
    string line;
    while (getline(infile, line))
    {
        //Ignore EOL characters
        line.erase(remove(line.begin(), line.end(), '\n'), line.end());
        line.erase(remove(line.begin(), line.end(), '\r'), line.end());
        //Ignore byte-order marks (BOM first utf character in W$ files)
        if ( (line[0] == (char)0xEFu) && (line[1] == (char)0xBBu) && (line[2] == (char)0xBFu) )
            line.erase (line.begin(),line.begin()+3);
        vector<string> fields;
        split(line, fields, ',');
        word w;
        w.value  = fields[8];
        w.x      = atoi(fields[0].c_str());
        w.y      = atoi(fields[1].c_str());
        w.width  = atoi(fields[2].c_str()) - atoi(fields[0].c_str());
        w.height = atoi(fields[7].c_str()) - atoi(fields[1].c_str());
        curr->words.push_back(w);
    }
    infile.close();

    stringstream lex100FileName;
    lex100FileName << path << "/voc_img_" << img_id << ".txt";
    infile.open(lex100FileName.str().c_str());
    if (!infile.is_open()) CV_Error(Error::StsBadArg, lex100FileName.str().c_str());
    while (getline(infile, line))
    {
        //Ignore EOL characters
        line.erase(remove(line.begin(), line.end(), '\n'), line.end());
        line.erase(remove(line.begin(), line.end(), '\r'), line.end());
        //Ignore byte-order marks (BOM first utf character in W$ files)
        if ( (line[0] == (char)0xEFu) && (line[1] == (char)0xBBu) && (line[2] == (char)0xBFu) )
            line.erase (line.begin(),line.begin()+3);
        curr->lex100.push_back(line);
    }
    infile.close();

    stringstream lexFullFileName;
    if (path.substr(path.size()-5,4) == string("test"))
        lexFullFileName << path << "ch2_test_vocabulary.txt";
    else
        lexFullFileName << path << "ch2_training_vocabulary.txt";
    infile.open(lexFullFileName.str().c_str());
    if (!infile.is_open()) CV_Error(Error::StsBadArg, lexFullFileName.str().c_str());
    while (getline(infile, line))
    {
        //Ignore EOL characters
        line.erase(remove(line.begin(), line.end(), '\n'), line.end());
        line.erase(remove(line.begin(), line.end(), '\r'), line.end());
        //Ignore byte-order marks (BOM first utf character in W$ files)
        if ( (line[0] == (char)0xEFu) && (line[1] == (char)0xBBu) && (line[2] == (char)0xBFu) )
            line.erase (line.begin(),line.begin()+3);
        curr->lexFull.push_back(line);
    }
    infile.close();

    out.push_back(curr);
}

/*TR_icdarImp::TR_icdarImp(const string &path)
{
    loadDataset(path);
}*/

void TR_icdarImp::load(const string &path)
{
    loadDataset(path);
}

void TR_icdarImp::loadDataset(const string &path)
{
    train.push_back(vector< Ptr<Object> >());
    test.push_back(vector< Ptr<Object> >());
    validation.push_back(vector< Ptr<Object> >());

    string train_path(path + "/train/");
    string test_path (path + "/test/");

    // loading 229 train images descriptions
    for (int i=1; i<230; i++)
        objParseFiles(train_path, i, train.back());

    // loading 233 test images descriptions
    for (int i=1; i<234; i++)
        objParseFiles(test_path, i, test.back());
}

Ptr<TR_icdar> TR_icdar::create()
{
    return Ptr<TR_icdarImp>(new TR_icdarImp);
}

}
}