2009-11-06 18:06:12 +01:00
|
|
|
/*
 * Copyright 2005-2007 Gerald Schmidt.
 *
 * This file is part of Xml Copy Editor.
 *
 * Xml Copy Editor is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version 2
 * of the License, or (at your option) any later version.
 *
 * Xml Copy Editor is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with Xml Copy Editor; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
 */
|
|
|
|
|
2012-03-14 16:08:20 +01:00
|
|
|
#include <wx/intl.h>
|
2009-11-06 18:06:12 +01:00
|
|
|
#include <cstring>
|
|
|
|
#include "housestyle.h"
|
|
|
|
#include "readfile.h"
|
|
|
|
|
|
|
|
/*
 * Constructs a checker for the given buffer.
 *
 * typeParameter            check type; compared against HS_TYPE_STYLE and
 *                          HS_TYPE_SPELL elsewhere in this file
 * bufferParameter          text to be checked
 * ruleDirectoryParameter   directory that rule files are read from
 * ruleFileParameter        top-level rule file name; in spelling mode it is
 *                          handed to WrapAspell instead (see createReport)
 * filterDirectoryParameter stored only; filters are currently ignored
 * filterFileParameter      stored only; filters are currently ignored
 * pathSeparatorParameter   separator appended to ruleDirectory when a rule
 *                          file path is built
 * aspellDataPathParameter  (__WXMSW__ builds only) passed on to WrapAspell
 * aspellDictPathParameter  (__WXMSW__ builds only) passed on to WrapAspell
 * contextRangeParameter    forwarded to the spelling and rule matchers
 *
 * Besides storing its arguments, the constructor allocates a new rule
 * vector and two new StringSet<char> dictionaries.
 */
HouseStyle::HouseStyle (
    int typeParameter,
    const std::string& bufferParameter,
    const wxString& ruleDirectoryParameter,
    const wxString& ruleFileParameter,
    const wxString& filterDirectoryParameter,
    const wxString& filterFileParameter,
    const wxString& pathSeparatorParameter,
#ifdef __WXMSW__
    const wxString& aspellDataPathParameter,
    const wxString& aspellDictPathParameter,
#endif
    int contextRangeParameter )
	: type ( typeParameter )
	, buffer ( bufferParameter )
	, ruleDirectory ( ruleDirectoryParameter )
	, ruleFile ( ruleFileParameter )
	, filterDirectory ( filterDirectoryParameter )
	, filterFile ( filterFileParameter )
	, pathSeparator ( pathSeparatorParameter )
#ifdef __WXMSW__
	, aspellDataPath ( aspellDataPathParameter )
	, aspellDictPath ( aspellDictPathParameter )
#endif
	, contextRange ( contextRangeParameter )
	, ruleVector ( new std::vector<boost::shared_ptr<Rule> > )
	, dictionary ( new StringSet<char> )
	, passiveDictionary ( new StringSet<char> )
{
}
|
|
|
|
|
|
|
|
// The destructor body is intentionally empty; it performs no explicit cleanup.
HouseStyle::~HouseStyle()
{
}
|
|
|
|
|
|
|
|
/*
 * Filter collection hook.
 *
 * From v. 1.1.0.7 filters are always ignored, so this function returns
 * immediately without touching excludeSet or *filterCount. Before that
 * release the early return was conditional:
 *
 *     if ( type == HS_TYPE_SPELL || fileName == "(No filter)" )
 *
 * The former implementation is preserved below, compiled out, for
 * reference only.
 */
void HouseStyle::collectFilter (
    const std::string& fileName,
    std::set<std::string>& excludeSet,
    int *filterCount )
{
	return;

#if 0
	string filePath, buffer;
	filePath = filterDirectory + pathSeparator + fileName;

	if ( !ReadFile::run ( filePath, buffer ) )
		return;

	XmlFilterReader xfr;
	if ( !xfr.parse ( buffer ) )
	{
		std::string report = xfr.getLastError();
		throw runtime_error ( report.c_str() );
	}

	std::map<std::string, std::map<std::string, std::set<std::string> > >
	temporaryMap;
	std::map<std::string, std::map<std::string, std::set<std::string> > >::iterator
	temporaryMapIterator;
	xfr.getFilterMap ( temporaryMap );

	for ( temporaryMapIterator = temporaryMap.begin();
	        temporaryMapIterator != temporaryMap.end();
	        ++temporaryMapIterator )
	{
		filterMap.insert ( *temporaryMapIterator );
		( *filterCount ) ++;
	}

	// add current file to exclude set
	excludeSet.insert ( fileName );

	// fetch exclude vector
	std::vector<std::string> localExcludeVector;
	std::vector<std::string>::iterator excludeIterator;
	xfr.getExcludeVector ( localExcludeVector );
	for ( excludeIterator = localExcludeVector.begin();
	        excludeIterator != localExcludeVector.end();
	        excludeIterator++ )
		excludeSet.insert ( *excludeIterator );

	// fetch include vector
	std::vector<std::string> includeVector;
	std::vector<std::string>::iterator includeIterator;
	xfr.getIncludeVector ( includeVector );

	if ( includeVector.empty() )
		return;

	for ( includeIterator = includeVector.begin();
	        includeIterator != includeVector.end();
	        includeIterator++ )
	{
		if ( !excludeSet.count ( *includeIterator ) )
			collectFilter ( *includeIterator, excludeSet, filterCount );
	}
#endif
}
|
|
|
|
|
2013-10-19 02:44:17 +02:00
|
|
|
void HouseStyle::collectRules ( const std::string& fileName,
|
2009-11-06 18:06:12 +01:00
|
|
|
boost::shared_ptr<std::vector<boost::shared_ptr<Rule> > > ruleVector,
|
|
|
|
std::set<string>& excludeSet,
|
|
|
|
int *ruleCount )
|
|
|
|
{
|
|
|
|
if (type == HS_TYPE_SPELL)
|
|
|
|
return;
|
|
|
|
|
|
|
|
std::string filePath, buffer;
|
2013-10-19 02:44:17 +02:00
|
|
|
filePath = (const char *) ( ruleDirectory + pathSeparator ).mb_str() + fileName;
|
2009-11-06 18:06:12 +01:00
|
|
|
if ( !ReadFile::run ( filePath, buffer ) )
|
|
|
|
return;
|
|
|
|
|
2019-12-01 15:12:17 +01:00
|
|
|
boost::scoped_ptr<XmlRuleReader> xrr ( new XmlRuleReader (
|
2009-11-06 18:06:12 +01:00
|
|
|
dictionary,
|
|
|
|
passiveDictionary,
|
|
|
|
ruleVector ) );
|
|
|
|
if ( !xrr->parse ( buffer ) )
|
|
|
|
{
|
|
|
|
std::string report = xrr->getIncorrectPatternReport();
|
|
|
|
if ( report != "" )
|
2022-10-05 04:40:20 +02:00
|
|
|
throw std::runtime_error ( report.c_str() );
|
2009-11-06 18:06:12 +01:00
|
|
|
else
|
2022-10-05 04:40:20 +02:00
|
|
|
throw std::runtime_error ( ( const char * ) xrr->getLastError().utf8_str() );
|
2009-11-06 18:06:12 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// add current file to exclude set
|
|
|
|
excludeSet.insert ( fileName );
|
|
|
|
|
|
|
|
// fetch exclude vector
|
|
|
|
std::vector<std::string> localExcludeVector;
|
|
|
|
std::vector<std::string>::iterator excludeIterator;
|
|
|
|
xrr->getExcludeVector ( localExcludeVector );
|
|
|
|
for ( excludeIterator = localExcludeVector.begin();
|
|
|
|
excludeIterator != localExcludeVector.end();
|
2014-03-19 13:21:14 +01:00
|
|
|
++excludeIterator )
|
2009-11-06 18:06:12 +01:00
|
|
|
excludeSet.insert ( *excludeIterator );
|
|
|
|
|
|
|
|
* ( ruleCount ) += xrr->getRuleCount();
|
|
|
|
|
|
|
|
// fetch include vector
|
|
|
|
std::vector<std::string> includeVector;
|
|
|
|
xrr->getIncludeVector ( includeVector );
|
|
|
|
std::vector<std::string>::iterator includeIterator;
|
|
|
|
for ( includeIterator = includeVector.begin();
|
|
|
|
includeIterator != includeVector.end();
|
2014-03-19 13:21:14 +01:00
|
|
|
++includeIterator )
|
2009-11-06 18:06:12 +01:00
|
|
|
{
|
|
|
|
if ( !excludeSet.count ( *includeIterator ) )
|
|
|
|
collectRules ( *includeIterator, ruleVector, excludeSet, ruleCount );
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
bool HouseStyle::createReport()
|
|
|
|
{
|
|
|
|
if ( type == HS_TYPE_STYLE && !updateRules() )
|
|
|
|
{
|
2013-10-19 02:44:17 +02:00
|
|
|
error = _ ( "no rules found" );
|
2009-11-06 18:06:12 +01:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
updateFilter();
|
|
|
|
|
|
|
|
auto_ptr<HouseStyleReader> xtr ( new HouseStyleReader ( filterMap ) );
|
|
|
|
if ( !xtr->parse ( buffer ) )
|
|
|
|
{
|
2013-10-19 02:44:17 +02:00
|
|
|
error = _ ( "file is not well-formed" );
|
2009-11-06 18:06:12 +01:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
*/
|
|
|
|
std::vector<std::pair<std::string, unsigned> > nodeVector;
|
|
|
|
//xtr->getNodeVector ( nodeVector );
|
|
|
|
nodeVector.push_back( make_pair ( buffer, 0 ) ); // new from 1.1.0.7
|
|
|
|
|
|
|
|
int ruleVectorsize, nodeVectorSize;
|
|
|
|
|
|
|
|
std::vector<ContextMatch> contextVector;
|
|
|
|
std::vector<ContextMatch>::iterator matchIterator;
|
|
|
|
ruleVectorsize = ruleVector->size();
|
|
|
|
|
|
|
|
nodeVectorSize = nodeVector.size();
|
|
|
|
|
|
|
|
WrapAspell *spellcheck = NULL;
|
|
|
|
try {
|
|
|
|
if (type == HS_TYPE_SPELL)
|
|
|
|
spellcheck = new WrapAspell(
|
|
|
|
ruleFile // carries lang information
|
|
|
|
#ifdef __WXMSW__
|
|
|
|
, aspellDataPath,
|
|
|
|
aspellDictPath
|
|
|
|
#endif
|
|
|
|
);
|
|
|
|
}
|
|
|
|
catch (...)
|
|
|
|
{
|
2013-10-19 02:44:17 +02:00
|
|
|
error = _ ( "Cannot initialise spellcheck" );
|
2009-11-06 18:06:12 +01:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
std::string nodeBuffer;
|
|
|
|
unsigned elementCount;
|
|
|
|
for ( int j = 0; j < nodeVectorSize; ++j )
|
|
|
|
{
|
|
|
|
nodeBuffer = nodeVector.at ( j ).first;
|
|
|
|
elementCount = nodeVector.at ( j ).second;
|
|
|
|
|
|
|
|
if ( !nodeBuffer.size() )
|
|
|
|
continue;
|
|
|
|
|
|
|
|
// try spelling first
|
|
|
|
if ( type == HS_TYPE_SPELL && spellcheck )
|
|
|
|
{
|
|
|
|
spellcheck->checkString (
|
|
|
|
nodeBuffer,
|
|
|
|
contextVector,
|
|
|
|
contextRange );
|
|
|
|
|
|
|
|
for ( matchIterator = contextVector.begin();
|
|
|
|
matchIterator != contextVector.end();
|
2014-03-19 13:21:14 +01:00
|
|
|
++matchIterator )
|
2009-11-06 18:06:12 +01:00
|
|
|
{
|
|
|
|
matchIterator->report = "Not in dictionary";
|
|
|
|
matchIterator->elementCount = elementCount;
|
|
|
|
matchVector.push_back ( *matchIterator );
|
|
|
|
}
|
|
|
|
contextVector.clear();
|
|
|
|
continue; // bail out before we reach style loop
|
|
|
|
}
|
|
|
|
|
|
|
|
// otherwise, proceed with style check
|
|
|
|
for ( int i = 0; i < ruleVectorsize; i++ )
|
|
|
|
{
|
|
|
|
if ( type == HS_TYPE_STYLE )
|
|
|
|
{
|
|
|
|
boost::shared_ptr<Rule> rule ( ruleVector->at ( i ) );
|
|
|
|
if ( rule->matchPatternGlobal (
|
|
|
|
nodeBuffer,
|
|
|
|
contextVector,
|
|
|
|
elementCount,
|
|
|
|
contextRange ) )
|
|
|
|
{
|
|
|
|
std::string report = rule->getReport();
|
|
|
|
|
|
|
|
for ( matchIterator = contextVector.begin();
|
|
|
|
matchIterator != contextVector.end();
|
2014-03-19 13:21:14 +01:00
|
|
|
++matchIterator )
|
2009-11-06 18:06:12 +01:00
|
|
|
{
|
|
|
|
if ( rule->getAdjustCaseAttribute() )
|
|
|
|
CaseHandler::adjustCase (
|
|
|
|
matchIterator->replace,
|
|
|
|
matchIterator->match );
|
|
|
|
|
|
|
|
// tentative?
|
|
|
|
matchIterator->tentative =
|
|
|
|
( rule->getTentativeAttribute() ) ? true : false;
|
|
|
|
|
|
|
|
matchIterator->report = report;
|
|
|
|
|
|
|
|
matchVector.push_back ( *matchIterator );
|
|
|
|
}
|
|
|
|
contextVector.clear();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
// check spelling
|
|
|
|
else // if ( !dictionary->empty() )
|
|
|
|
{
|
|
|
|
spellcheck->checkString (
|
|
|
|
nodeBuffer,
|
|
|
|
contextVector,
|
|
|
|
contextRange );
|
|
|
|
|
|
|
|
for ( matchIterator = contextVector.begin();
|
|
|
|
matchIterator != contextVector.end();
|
|
|
|
matchIterator++ )
|
|
|
|
{
|
|
|
|
matchIterator->report = "Not in dictionary";
|
|
|
|
matchIterator->elementCount = elementCount;
|
|
|
|
|
|
|
|
matchVector.push_back ( *matchIterator );
|
|
|
|
}
|
|
|
|
contextVector.clear();
|
|
|
|
}
|
|
|
|
*/
|
|
|
|
}
|
|
|
|
}
|
|
|
|
delete spellcheck;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2013-10-19 02:44:17 +02:00
|
|
|
// Returns the 'error' member, which createReport() sets just before it
// returns false.
const wxString &HouseStyle::getLastError()
{
	return error;
}
|
|
|
|
|
2013-10-19 02:44:17 +02:00
|
|
|
const std::vector<ContextMatch> &HouseStyle::getMatchVector()
|
2009-11-06 18:06:12 +01:00
|
|
|
{
|
|
|
|
return matchVector;
|
|
|
|
}
|
|
|
|
|
|
|
|
int HouseStyle::updateRules()
|
|
|
|
{
|
|
|
|
ruleVector->clear();
|
|
|
|
dictionary->clear();
|
|
|
|
passiveDictionary->clear();
|
|
|
|
|
|
|
|
int ruleCount = 0;
|
|
|
|
set<string> excludeSet;
|
2013-10-19 02:44:17 +02:00
|
|
|
collectRules ( ( const char * ) ruleFile.mb_str(), ruleVector, excludeSet, &ruleCount );
|
2009-11-06 18:06:12 +01:00
|
|
|
return ruleCount;
|
|
|
|
}
|
|
|
|
|
|
|
|
int HouseStyle::updateFilter()
|
|
|
|
{
|
|
|
|
filterMap.clear();
|
|
|
|
int filterCount = 0;
|
|
|
|
set<string> excludeSet;
|
2013-10-19 02:44:17 +02:00
|
|
|
collectFilter ( ( const char * ) filterFile.mb_str(), excludeSet, &filterCount );
|
2009-11-06 18:06:12 +01:00
|
|
|
|
|
|
|
return filterCount;
|
|
|
|
}
|