/* * Copyright 2005-2007 Gerald Schmidt. * * This file is part of Xml Copy Editor. * * Xml Copy Editor is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; version 2 of the License. * * Xml Copy Editor is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with Xml Copy Editor; if not, write to the Free Software * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */ #include #include "housestyle.h" #include "readfile.h" HouseStyle::HouseStyle ( int typeParameter, const std::string& bufferParameter, const std::string& ruleDirectoryParameter, const std::string& ruleFileParameter, const std::string& filterDirectoryParameter, const std::string& filterFileParameter, const std::string& pathSeparatorParameter, #ifdef __WXMSW__ const std::string& aspellDataPathParameter, const std::string& aspellDictPathParameter, #endif int contextRangeParameter ) : type ( typeParameter ), buffer ( bufferParameter ), ruleDirectory ( ruleDirectoryParameter ), ruleFile ( ruleFileParameter ), filterDirectory ( filterDirectoryParameter ), filterFile ( filterFileParameter ), pathSeparator ( pathSeparatorParameter ), #ifdef __WXMSW__ aspellDataPath ( aspellDataPathParameter ), aspellDictPath ( aspellDictPathParameter ), #endif contextRange ( contextRangeParameter ), ruleVector ( new std::vector > ), dictionary ( new StringSet ), passiveDictionary ( new StringSet ) { } HouseStyle::~HouseStyle() {} void HouseStyle::collectFilter ( std::string& fileName, std::set& excludeSet, int *filterCount ) { // from v. 1.1.0.7: always ignore //if ( type == HS_TYPE_SPELL || fileName == "(No filter)" ) return; /* string filePath, buffer; filePath = filterDirectory + pathSeparator + fileName; if ( !ReadFile::run ( filePath, buffer ) ) return; XmlFilterReader xfr; if ( !xfr.parse ( buffer ) ) { std::string report = xfr.getLastError(); throw runtime_error ( report.c_str() ); } std::map > > temporaryMap; std::map > >::iterator temporaryMapIterator; xfr.getFilterMap ( temporaryMap ); for ( temporaryMapIterator = temporaryMap.begin(); temporaryMapIterator != temporaryMap.end(); ++temporaryMapIterator ) { filterMap.insert ( *temporaryMapIterator ); ( *filterCount ) ++; } // add current file to exclude set excludeSet.insert ( fileName ); // fetch exclude vector std::vector localExcludeVector; std::vector::iterator excludeIterator; xfr.getExcludeVector ( localExcludeVector ); for ( excludeIterator = localExcludeVector.begin(); excludeIterator != localExcludeVector.end(); excludeIterator++ ) excludeSet.insert ( *excludeIterator ); // fetch include vector std::vector includeVector; std::vector::iterator includeIterator; xfr.getIncludeVector ( includeVector ); if ( includeVector.empty() ) return; for ( includeIterator = includeVector.begin(); includeIterator != includeVector.end(); includeIterator++ ) { if ( !excludeSet.count ( *includeIterator ) ) collectFilter ( *includeIterator, excludeSet, filterCount ); } */ } void HouseStyle::collectRules ( string& fileName, boost::shared_ptr > > ruleVector, std::set& excludeSet, int *ruleCount ) { if (type == HS_TYPE_SPELL) return; std::string filePath, buffer; filePath = ruleDirectory + pathSeparator + fileName; if ( !ReadFile::run ( filePath, buffer ) ) return; std::auto_ptr xrr ( new XmlRuleReader ( dictionary, passiveDictionary, ruleVector ) ); if ( !xrr->parse ( buffer ) ) { std::string report = xrr->getIncorrectPatternReport(); if ( report != "" ) throw runtime_error ( report.c_str() ); else throw runtime_error ( xrr->getLastError().c_str() ); } // add current file to exclude set excludeSet.insert ( fileName ); // fetch exclude vector std::vector localExcludeVector; std::vector::iterator excludeIterator; xrr->getExcludeVector ( localExcludeVector ); for ( excludeIterator = localExcludeVector.begin(); excludeIterator != localExcludeVector.end(); excludeIterator++ ) excludeSet.insert ( *excludeIterator ); * ( ruleCount ) += xrr->getRuleCount(); // fetch include vector std::vector includeVector; xrr->getIncludeVector ( includeVector ); std::vector::iterator includeIterator; for ( includeIterator = includeVector.begin(); includeIterator != includeVector.end(); includeIterator++ ) { if ( !excludeSet.count ( *includeIterator ) ) collectRules ( *includeIterator, ruleVector, excludeSet, ruleCount ); } } bool HouseStyle::createReport() { if ( type == HS_TYPE_STYLE && !updateRules() ) { error = "no rules found"; return false; } /* updateFilter(); auto_ptr xtr ( new HouseStyleReader ( filterMap ) ); if ( !xtr->parse ( buffer ) ) { error = "file is not well-formed"; return false; } */ std::vector > nodeVector; //xtr->getNodeVector ( nodeVector ); nodeVector.push_back( make_pair ( buffer, 0 ) ); // new from 1.1.0.7 int ruleVectorsize, nodeVectorSize; std::vector contextVector; std::vector::iterator matchIterator; ruleVectorsize = ruleVector->size(); nodeVectorSize = nodeVector.size(); WrapAspell *spellcheck = NULL; try { if (type == HS_TYPE_SPELL) spellcheck = new WrapAspell( ruleFile, // carries lang information #ifdef __WXMSW__ aspellDataPath, aspellDictPath #endif ); } catch (...) { error = "Cannot initialise spellcheck"; return false; } std::string nodeBuffer; unsigned elementCount; for ( int j = 0; j < nodeVectorSize; ++j ) { nodeBuffer = nodeVector.at ( j ).first; elementCount = nodeVector.at ( j ).second; if ( !nodeBuffer.size() ) continue; // try spelling first if ( type == HS_TYPE_SPELL && spellcheck ) { spellcheck->checkString ( nodeBuffer, contextVector, contextRange ); for ( matchIterator = contextVector.begin(); matchIterator != contextVector.end(); matchIterator++ ) { matchIterator->report = "Not in dictionary"; matchIterator->elementCount = elementCount; matchVector.push_back ( *matchIterator ); } contextVector.clear(); continue; // bail out before we reach style loop } // otherwise, proceed with style check for ( int i = 0; i < ruleVectorsize; i++ ) { if ( type == HS_TYPE_STYLE ) { boost::shared_ptr rule ( ruleVector->at ( i ) ); if ( rule->matchPatternGlobal ( nodeBuffer, contextVector, elementCount, contextRange ) ) { std::string report = rule->getReport(); for ( matchIterator = contextVector.begin(); matchIterator != contextVector.end(); matchIterator++ ) { if ( rule->getAdjustCaseAttribute() ) CaseHandler::adjustCase ( matchIterator->replace, matchIterator->match ); // tentative? matchIterator->tentative = ( rule->getTentativeAttribute() ) ? true : false; matchIterator->report = report; matchVector.push_back ( *matchIterator ); } contextVector.clear(); } } /* // check spelling else // if ( !dictionary->empty() ) { spellcheck->checkString ( nodeBuffer, contextVector, contextRange ); for ( matchIterator = contextVector.begin(); matchIterator != contextVector.end(); matchIterator++ ) { matchIterator->report = "Not in dictionary"; matchIterator->elementCount = elementCount; matchVector.push_back ( *matchIterator ); } contextVector.clear(); } */ } } delete spellcheck; return true; } std::string HouseStyle::getLastError() { return error; } std::vector HouseStyle::getMatchVector() { return matchVector; } int HouseStyle::updateRules() { ruleVector->clear(); dictionary->clear(); passiveDictionary->clear(); int ruleCount = 0; set excludeSet; collectRules ( ruleFile, ruleVector, excludeSet, &ruleCount ); return ruleCount; } int HouseStyle::updateFilter() { filterMap.clear(); int filterCount = 0; set excludeSet; collectFilter ( filterFile, excludeSet, &filterCount ); return filterCount; }