// Scintilla source code edit control
/** @file RESearch.h
 ** Interface to the regular expression search library.
 **/
// Written by Neil Hodgson <neilh@scintilla.org>
// Based on the work of Ozan S. Yigit.
// This file is in the public domain.
|
|
|
|
|
|
|
|
#ifndef RESEARCH_H
|
|
|
|
#define RESEARCH_H
|
|
|
|
|
2007-06-18 13:02:34 +00:00
|
|
|
#ifdef SCI_NAMESPACE
|
|
|
|
namespace Scintilla {
|
|
|
|
#endif
|
|
|
|
|
2005-11-22 12:26:26 +00:00
|
|
|
/*
 * The following defines are not meant to be changeable.
 * They are for readability only.
 *
 * MAXCHR - presumably the number of distinct 8-bit character values.
 * CHRBIT - presumably the number of bits in one character.
 * BITBLK - MAXCHR divided by CHRBIT; used as the element count of
 *          RESearch::bittab.
 *
 * BITBLK is fully parenthesized so that it behaves as a single value
 * inside any larger expression (for example "x / BITBLK" or
 * "BITBLK * y"); without the parentheses the division would bind to
 * the surrounding operators instead.
 */
#define MAXCHR 256
#define CHRBIT 8
#define BITBLK (MAXCHR/CHRBIT)
|
|
|
|
|
|
|
|
/**
 * Abstract interface that hands out characters by integer position.
 * RESearch receives an object of this type wherever it needs to read
 * the text being searched (GrabMatches, Execute, Substitute, PMatch).
 */
class CharacterIndexer {
public:
	/** Return the character located at position @a index. */
	virtual char CharAt(int index) = 0;

	/** Virtual so implementations can be destroyed through this interface. */
	virtual ~CharacterIndexer() {}
};
|
|
|
|
|
|
|
|
class RESearch {
|
|
|
|
|
|
|
|
public:
|
2006-03-11 02:33:39 +00:00
|
|
|
RESearch(CharClassify *charClassTable);
|
2005-11-22 12:26:26 +00:00
|
|
|
~RESearch();
|
|
|
|
bool GrabMatches(CharacterIndexer &ci);
|
2008-10-18 10:56:10 +00:00
|
|
|
const char *Compile(const char *pattern, int length, bool caseSensitive, bool posix);
|
2005-11-22 12:26:26 +00:00
|
|
|
int Execute(CharacterIndexer &ci, int lp, int endp);
|
|
|
|
int Substitute(CharacterIndexer &ci, char *src, char *dst);
|
|
|
|
|
2007-06-18 13:02:34 +00:00
|
|
|
enum { MAXTAG=10 };
|
|
|
|
enum { MAXNFA=2048 };
|
|
|
|
enum { NOTFOUND=-1 };
|
2005-11-22 12:26:26 +00:00
|
|
|
|
|
|
|
int bopat[MAXTAG];
|
|
|
|
int eopat[MAXTAG];
|
|
|
|
char *pat[MAXTAG];
|
|
|
|
|
|
|
|
private:
|
2006-03-11 02:33:39 +00:00
|
|
|
void Init();
|
|
|
|
void Clear();
|
2007-06-18 13:02:34 +00:00
|
|
|
void ChSet(unsigned char c);
|
|
|
|
void ChSetWithCase(unsigned char c, bool caseSensitive);
|
2008-10-18 10:56:10 +00:00
|
|
|
int GetBackslashExpression(const char *pattern, int &incr);
|
2006-03-11 02:33:39 +00:00
|
|
|
|
2005-11-22 12:26:26 +00:00
|
|
|
int PMatch(CharacterIndexer &ci, int lp, int endp, char *ap);
|
|
|
|
|
|
|
|
int bol;
|
2007-06-18 13:02:34 +00:00
|
|
|
int tagstk[MAXTAG]; /* subpat tag stack */
|
2006-03-11 02:33:39 +00:00
|
|
|
char nfa[MAXNFA]; /* automaton */
|
2005-11-22 12:26:26 +00:00
|
|
|
int sta;
|
2007-06-18 13:02:34 +00:00
|
|
|
unsigned char bittab[BITBLK]; /* bit table for CCL pre-set bits */
|
2005-11-22 12:26:26 +00:00
|
|
|
int failure;
|
2006-03-11 02:33:39 +00:00
|
|
|
CharClassify *charClass;
|
|
|
|
bool iswordc(unsigned char x) {
|
|
|
|
return charClass->IsWord(x);
|
|
|
|
}
|
2005-11-22 12:26:26 +00:00
|
|
|
};
|
|
|
|
|
2007-06-18 13:02:34 +00:00
|
|
|
#ifdef SCI_NAMESPACE
|
|
|
|
}
|
2005-11-22 12:26:26 +00:00
|
|
|
#endif
|
2007-06-18 13:02:34 +00:00
|
|
|
|
|
|
|
#endif
|
|
|
|
|