mirror of
https://github.com/moses-smt/mosesdecoder.git
synced 2024-09-20 07:42:21 +03:00
41a1849437
git-svn-id: https://mosesdecoder.svn.sourceforge.net/svnroot/mosesdecoder/trunk@4184 1f5c12ca-751b-0410-a591-d2e778427230
160 lines
3.2 KiB
C++
160 lines
3.2 KiB
C++
/*
|
|
* FeatureStats.cpp
|
|
* met - Minimum Error Training
|
|
*
|
|
* Created by Nicola Bertoldi on 13/05/08.
|
|
*
|
|
*/
|
|
|
|
#include <fstream>
|
|
#include "FeatureStats.h"
|
|
|
|
#define AVAILABLE_ 8;
|
|
|
|
|
|
FeatureStats::FeatureStats()
|
|
{
|
|
available_ = AVAILABLE_;
|
|
entries_ = 0;
|
|
array_ = new FeatureStatsType[available_];
|
|
};
|
|
|
|
FeatureStats::~FeatureStats()
|
|
{
|
|
delete[] array_;
|
|
};
|
|
|
|
FeatureStats::FeatureStats(const FeatureStats &stats)
|
|
{
|
|
available_ = stats.available();
|
|
entries_ = stats.size();
|
|
array_ = new FeatureStatsType[available_];
|
|
memcpy(array_,stats.getArray(),featbytes_);
|
|
map_ = stats.getSparse();
|
|
};
|
|
|
|
FeatureStats::FeatureStats(const size_t size)
|
|
{
|
|
available_ = size;
|
|
entries_ = size;
|
|
array_ = new FeatureStatsType[available_];
|
|
memset(array_,0,featbytes_);
|
|
};
|
|
|
|
|
|
FeatureStats::FeatureStats(std::string &theString)
|
|
{
|
|
set(theString);
|
|
}
|
|
|
|
void FeatureStats::expand()
|
|
{
|
|
available_*=2;
|
|
featstats_t t_ = new FeatureStatsType[available_];
|
|
memcpy(t_,array_,featbytes_);
|
|
delete array_;
|
|
array_=t_;
|
|
}
|
|
|
|
void FeatureStats::add(FeatureStatsType v)
|
|
{
|
|
if (isfull()) expand();
|
|
array_[entries_++]=v;
|
|
}
|
|
|
|
void FeatureStats::addSparse(string name, FeatureStatsType v)
|
|
{
|
|
map_[name]=v;
|
|
}
|
|
|
|
void FeatureStats::set(std::string &theString)
|
|
{
|
|
std::string substring, stringBuf;
|
|
reset();
|
|
|
|
while (!theString.empty()) {
|
|
getNextPound(theString, substring);
|
|
// regular feature
|
|
if (substring.find(":") == string::npos) {
|
|
add(ATOFST(substring.c_str()));
|
|
}
|
|
// sparse feature
|
|
else {
|
|
size_t separator = substring.find_last_of(":");
|
|
addSparse(substring.substr(0,separator), atof(substring.substr(separator+1).c_str()) );
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
void FeatureStats::loadbin(std::ifstream& inFile)
|
|
{
|
|
inFile.read((char*) array_, featbytes_);
|
|
}
|
|
|
|
void FeatureStats::loadtxt(std::ifstream& inFile)
|
|
{
|
|
std::string theString;
|
|
std::getline(inFile, theString);
|
|
set(theString);
|
|
}
|
|
|
|
void FeatureStats::loadtxt(const std::string &file)
|
|
{
|
|
// TRACE_ERR("loading the stats from " << file << std::endl);
|
|
|
|
std::ifstream inFile(file.c_str(), std::ios::in); // matches a stream with a file. Opens the file
|
|
|
|
loadtxt(inFile);
|
|
}
|
|
|
|
|
|
void FeatureStats::savetxt(const std::string &file)
|
|
{
|
|
// TRACE_ERR("saving the stats into " << file << std::endl);
|
|
|
|
std::ofstream outFile(file.c_str(), std::ios::out); // matches a stream with a file. Opens the file
|
|
|
|
savetxt(outFile);
|
|
}
|
|
|
|
|
|
void FeatureStats::savetxt(std::ofstream& outFile)
|
|
{
|
|
// TRACE_ERR("saving the stats" << std::endl);
|
|
outFile << *this;
|
|
}
|
|
|
|
void FeatureStats::savebin(std::ofstream& outFile)
|
|
{
|
|
outFile.write((char*) array_, featbytes_);
|
|
}
|
|
|
|
FeatureStats& FeatureStats::operator=(const FeatureStats &stats)
|
|
{
|
|
delete array_;
|
|
available_ = stats.available();
|
|
entries_ = stats.size();
|
|
array_ = new FeatureStatsType[available_];
|
|
memcpy(array_,stats.getArray(),featbytes_);
|
|
map_ = stats.getSparse();
|
|
|
|
return *this;
|
|
}
|
|
|
|
|
|
/**write the whole object to a stream*/
|
|
ostream& operator<<(ostream& o, const FeatureStats& e)
|
|
{
|
|
// print regular features
|
|
for (size_t i=0; i< e.size(); i++) {
|
|
o << e.get(i) << " ";
|
|
}
|
|
// sparse features
|
|
const sparse_featstats_t &sparse = e.getSparse();
|
|
for(sparse_featstats_t::const_iterator i = sparse.begin(); i != sparse.end(); i++) {
|
|
o << i->first << i->second << " ";
|
|
}
|
|
return o;
|
|
}
|