2001-07-13 12:17:43 -04:00
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
|
|
|
// Name: wx/regex.h
|
|
|
|
// Purpose: regular expression matching
|
2007-12-03 17:09:26 -05:00
|
|
|
// Author: Karsten Ballueder
|
2001-07-13 12:17:43 -04:00
|
|
|
// Modified by: VZ at 13.07.01 (integrated to wxWin)
|
|
|
|
// Created: 05.02.2000
|
2007-12-03 17:09:26 -05:00
|
|
|
// Copyright: (c) 2000 Karsten Ballueder <ballueder@gmx.net>
|
2004-05-23 16:53:33 -04:00
|
|
|
// Licence: wxWindows licence
|
2001-07-13 12:17:43 -04:00
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
|
|
|
|
|
|
|
#ifndef _WX_REGEX_H_
|
|
|
|
#define _WX_REGEX_H_
|
|
|
|
|
|
|
|
#include "wx/defs.h"
|
|
|
|
|
|
|
|
#if wxUSE_REGEX
|
|
|
|
|
2009-01-02 12:29:32 -05:00
|
|
|
#include "wx/string.h"
|
2021-07-17 14:28:39 -04:00
|
|
|
#include "wx/versioninfo.h"
|
2001-07-16 14:07:30 -04:00
|
|
|
|
2001-07-13 12:17:43 -04:00
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
// constants
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
|
|
|
|
// flags for regex compilation: these can be used with Compile()
|
|
|
|
enum
|
|
|
|
{
|
2004-02-19 12:28:56 -05:00
|
|
|
// use extended regex syntax
|
2001-07-13 12:17:43 -04:00
|
|
|
wxRE_EXTENDED = 0,
|
2004-09-21 14:15:59 -04:00
|
|
|
|
2021-07-17 11:40:16 -04:00
|
|
|
// use advanced RE syntax (deprecated, same as wxRE_EXTENDED now)
|
2004-02-19 12:28:56 -05:00
|
|
|
wxRE_ADVANCED = 1,
|
2001-07-13 12:17:43 -04:00
|
|
|
|
|
|
|
// use basic RE syntax
|
|
|
|
wxRE_BASIC = 2,
|
|
|
|
|
|
|
|
// ignore case in match
|
|
|
|
wxRE_ICASE = 4,
|
|
|
|
|
|
|
|
// only check match, don't set back references
|
|
|
|
wxRE_NOSUB = 8,
|
|
|
|
|
|
|
|
// if not set, treat '\n' as an ordinary character, otherwise it is
|
|
|
|
// special: it is not matched by '.' and '^' and '$' always match
|
|
|
|
// after/before it regardless of the setting of wxRE_NOT[BE]OL
|
|
|
|
wxRE_NEWLINE = 16,
|
|
|
|
|
|
|
|
// default flags
|
2001-07-13 13:10:00 -04:00
|
|
|
wxRE_DEFAULT = wxRE_EXTENDED
|
2001-07-13 12:17:43 -04:00
|
|
|
};
|
|
|
|
|
|
|
|
// flags for regex matching: these can be used with Matches()
|
|
|
|
//
|
|
|
|
// these flags are mainly useful when doing several matches in a long string,
|
|
|
|
// they can be used to prevent erroneous matches for '^' and '$'
|
|
|
|
enum
|
|
|
|
{
|
|
|
|
// '^' doesn't match at the start of line
|
|
|
|
wxRE_NOTBOL = 32,
|
|
|
|
|
|
|
|
// '$' doesn't match at the end of line
|
2021-07-17 11:00:19 -04:00
|
|
|
wxRE_NOTEOL = 64,
|
|
|
|
|
|
|
|
// don't accept empty string as valid match, try alternatives or fail
|
|
|
|
wxRE_NOTEMPTY = 128
|
2001-07-13 12:17:43 -04:00
|
|
|
};
|
|
|
|
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
// wxRegEx: a regular expression
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
|
2007-07-09 06:09:52 -04:00
|
|
|
class WXDLLIMPEXP_FWD_BASE wxRegExImpl;
|
2001-07-13 12:17:43 -04:00
|
|
|
|
2003-07-01 21:59:24 -04:00
|
|
|
class WXDLLIMPEXP_BASE wxRegEx
|
2001-07-13 12:17:43 -04:00
|
|
|
{
|
|
|
|
public:
|
|
|
|
// default ctor: use Compile() later
|
|
|
|
wxRegEx() { Init(); }
|
|
|
|
|
|
|
|
// create and compile
|
|
|
|
wxRegEx(const wxString& expr, int flags = wxRE_DEFAULT)
|
|
|
|
{
|
|
|
|
Init();
|
|
|
|
(void)Compile(expr, flags);
|
|
|
|
}
|
|
|
|
|
2004-09-21 14:15:59 -04:00
|
|
|
// return true if this is a valid compiled regular expression
|
2001-07-13 12:17:43 -04:00
|
|
|
bool IsValid() const { return m_impl != NULL; }
|
|
|
|
|
2004-09-21 14:15:59 -04:00
|
|
|
// compile the string into regular expression, return true if ok or false
|
2001-07-13 12:17:43 -04:00
|
|
|
// if string has a syntax error
|
|
|
|
bool Compile(const wxString& pattern, int flags = wxRE_DEFAULT);
|
|
|
|
|
|
|
|
// matches the precompiled regular expression against a string, return
|
2004-09-21 14:15:59 -04:00
|
|
|
// true if matches and false otherwise
|
2001-07-13 12:17:43 -04:00
|
|
|
//
|
|
|
|
// flags may be combination of wxRE_NOTBOL and wxRE_NOTEOL
|
2005-11-20 12:25:33 -05:00
|
|
|
// len may be the length of text (ignored by most system regex libs)
|
2001-07-13 13:10:00 -04:00
|
|
|
//
|
|
|
|
// may only be called after successful call to Compile()
|
2007-03-22 11:20:50 -04:00
|
|
|
bool Matches(const wxString& text, int flags = 0) const;
|
|
|
|
bool Matches(const wxChar *text, int flags, size_t len) const
|
|
|
|
{ return Matches(wxString(text, len), flags); }
|
2001-07-13 12:17:43 -04:00
|
|
|
|
|
|
|
// get the start index and the length of the match of the expression
|
|
|
|
// (index 0) or a bracketed subexpression (index != 0)
|
|
|
|
//
|
2001-07-13 13:10:00 -04:00
|
|
|
// may only be called after successful call to Matches()
|
|
|
|
//
|
2004-09-21 14:15:59 -04:00
|
|
|
// return false if no match or on error
|
2001-07-13 12:17:43 -04:00
|
|
|
bool GetMatch(size_t *start, size_t *len, size_t index = 0) const;
|
|
|
|
|
2001-07-13 13:10:00 -04:00
|
|
|
// return the part of string corresponding to the match, empty string is
|
|
|
|
// returned if match failed
|
|
|
|
//
|
|
|
|
// may only be called after successful call to Matches()
|
|
|
|
wxString GetMatch(const wxString& text, size_t index = 0) const;
|
|
|
|
|
2004-04-21 16:14:14 -04:00
|
|
|
// return the size of the array of matches, i.e. the number of bracketed
|
|
|
|
// subexpressions plus one for the expression itself, or 0 on error.
|
|
|
|
//
|
|
|
|
// may only be called after successful call to Compile()
|
|
|
|
size_t GetMatchCount() const;
|
|
|
|
|
2001-07-13 12:17:43 -04:00
|
|
|
// replaces the current regular expression in the string pointed to by
|
|
|
|
// pattern, with the text in replacement and return number of matches
|
|
|
|
// replaced (maybe 0 if none found) or -1 on error
|
2001-07-14 12:13:32 -04:00
|
|
|
//
|
|
|
|
// the replacement text may contain backreferences (\number) which will be
|
|
|
|
// replaced with the value of the corresponding subexpression in the
|
|
|
|
// pattern match
|
|
|
|
//
|
|
|
|
// maxMatches may be used to limit the number of replacements made, setting
|
2008-09-29 08:10:58 -04:00
|
|
|
// it to 1, for example, will only replace first occurrence (if any) of the
|
2001-07-14 12:13:32 -04:00
|
|
|
// pattern in the text while default value of 0 means replace all
|
|
|
|
int Replace(wxString *text, const wxString& replacement,
|
|
|
|
size_t maxMatches = 0) const;
|
|
|
|
|
2008-09-29 08:10:58 -04:00
|
|
|
// replace the first occurrence
|
2001-07-14 12:13:32 -04:00
|
|
|
int ReplaceFirst(wxString *text, const wxString& replacement) const
|
|
|
|
{ return Replace(text, replacement, 1); }
|
|
|
|
|
2008-09-29 08:10:58 -04:00
|
|
|
// replace all occurrences: this is actually a synonym for Replace()
|
2001-07-14 12:13:32 -04:00
|
|
|
int ReplaceAll(wxString *text, const wxString& replacement) const
|
|
|
|
{ return Replace(text, replacement, 0); }
|
2001-07-13 12:17:43 -04:00
|
|
|
|
2019-08-24 17:26:50 -04:00
|
|
|
static wxString QuoteMeta(const wxString& str);
|
|
|
|
|
2021-06-18 17:56:09 -04:00
|
|
|
// return the extended RE corresponding to the given basic RE
|
|
|
|
static wxString ConvertFromBasic(const wxString& bre);
|
|
|
|
|
2021-07-17 14:28:39 -04:00
|
|
|
// return version information for the underlying regex library
|
|
|
|
static wxVersionInfo GetLibraryVersionInfo();
|
|
|
|
|
2001-07-13 12:17:43 -04:00
|
|
|
// dtor not virtual, don't derive from this class
|
|
|
|
~wxRegEx();
|
|
|
|
|
|
|
|
private:
|
|
|
|
// common part of all ctors
|
|
|
|
void Init();
|
|
|
|
|
|
|
|
// the real guts of this class
|
|
|
|
wxRegExImpl *m_impl;
|
2001-09-06 13:21:00 -04:00
|
|
|
|
|
|
|
// as long as the class wxRegExImpl is not ref-counted,
|
|
|
|
// instances of the handle wxRegEx must not be copied.
|
|
|
|
wxRegEx(const wxRegEx&);
|
|
|
|
wxRegEx &operator=(const wxRegEx&);
|
2001-07-13 12:17:43 -04:00
|
|
|
};
|
|
|
|
|
|
|
|
#endif // wxUSE_REGEX
|
|
|
|
|
|
|
|
#endif // _WX_REGEX_H_
|
|
|
|
|