//============================================================================= // File: boyermor.cpp // Contents: Definitions for DwBoyerMoore // Maintainer: Doug Sauder // WWW: http://www.fwb.gulf.net/~dwsauder/mimepp.html // // Copyright (c) 1996, 1997 Douglas W. Sauder // All rights reserved. // // IN NO EVENT SHALL DOUGLAS W. SAUDER BE LIABLE TO ANY PARTY FOR DIRECT, // INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES ARISING OUT OF // THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN IF DOUGLAS W. SAUDER // HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. // // DOUGLAS W. SAUDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING, BUT // NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A // PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS ON AN "AS IS" // BASIS, AND DOUGLAS W. SAUDER HAS NO OBLIGATION TO PROVIDE MAINTENANCE, // SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS. // //============================================================================= #define DW_IMPLEMENTATION #include #include #include #include #include DwBoyerMoore::DwBoyerMoore(const char* aCstr) : mPat( 0 ), mCiPat( 0 ) { size_t len = strlen(aCstr); _Assign(aCstr, len); } DwBoyerMoore::DwBoyerMoore(const DwString& aStr) : mPat( 0 ), mCiPat( 0 ) { _Assign(aStr.data(), aStr.length()); } DwBoyerMoore::DwBoyerMoore(const DwBoyerMoore & other) : mPat( 0 ), mCiPat( 0 ) { _Assign(other.mPat, other.mPatLen); } DwBoyerMoore::~DwBoyerMoore() { delete[] mPat; mPat = 0; delete[] mCiPat; mCiPat = 0; } const DwBoyerMoore & DwBoyerMoore::operator=( const DwBoyerMoore & other ) { if (this != &other) _Assign(other.mPat, other.mPatLen); return *this; } void DwBoyerMoore::Assign(const char* aCstr) { size_t len = strlen(aCstr); _Assign(aCstr, len); } void DwBoyerMoore::Assign(const DwString& aStr) { _Assign(aStr.data(), aStr.length()); } void DwBoyerMoore::_Assign(const char* aPat, size_t aPatLen) { mPatLen = 0; delete[] mPat; mPat = 0; delete[] mCiPat; mCiPat = 0; mPat = new char[aPatLen+1]; mCiPat = new char[aPatLen+1]; if (mPat != 0 && aPatLen) { mPatLen = aPatLen; strncpy(mPat, aPat, mPatLen); mCiPat[mPatLen] = mPat[mPatLen] = 0; // Initialize the jump table for Boyer-Moore-Horspool algorithm size_t i; for (i=0; i < 256; ++i) mSkipAmt[i] = mCiSkipAmt[i] = (unsigned char) mPatLen; for (i=0; i < mPatLen-1; ++i) { unsigned char skip = mPatLen - i - 1; mCiPat[i] = tolower(mPat[i]); mCiSkipAmt[(unsigned char)mCiPat[i]] = skip; mCiSkipAmt[(unsigned char)toupper(mCiPat[i])] = skip; mSkipAmt[(unsigned char)mPat[i]] = skip; } mCiPat[i] = tolower(mPat[i]); } } size_t DwBoyerMoore::FindIn(const DwString& aStr, size_t aPos, bool aCs) const { char *pat = aCs ? mPat : mCiPat; const unsigned char *skipAmt = aCs ? mSkipAmt : mCiSkipAmt; if (aStr.length() <= aPos) { return (size_t) -1; } if (pat == 0 || mPatLen == 0) { return 0; } size_t bufLen = aStr.length() - aPos; const char* buf = aStr.data() + aPos; size_t i; for (i=mPatLen-1; i < bufLen; i += skipAmt[(unsigned char)buf[i]]) { int iBuf = i; int iPat = mPatLen - 1; while (iPat >= 0 && (aCs ? buf[iBuf] : tolower(buf[iBuf])) == pat[iPat]) { --iBuf; --iPat; } if (iPat == -1) return aPos + iBuf + 1; } return (size_t)-1; }