File: tregex.h

package info (click to toggle)
mp3check 0.8.7-6
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 820 kB
  • sloc: cpp: 14,731; makefile: 182; sh: 3
file content (92 lines) | stat: -rw-r--r-- 3,247 bytes parent folder | download | duplicates (6)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
/*GPL*START*
 *
 * encapsulated POSIX regular expression (regex) interface header
 *
 * Copyright (C) 1998 by Johannes Overmann <Johannes.Overmann@gmx.de>
 * 
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 * 
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 * 
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 * *GPL*END*/  

#ifndef _ngw_tregex_h_
#define _ngw_tregex_h_

#include <sys/types.h>
#include <regex.h>
#include "tstring.h"


class TRegEx {
 public:
   // ctor & dtor
   // cflags: REG_EXTENDED, REG_ICASE, REG_NOSUB, REG_NEWLINE
   TRegEx(const char *regex, int cflags);
   ~TRegEx();

   // matching:
   // eflags: REG_NOTBOL, REG_NOTEOL
   
   // return true if str matches the regex
   bool match(const char *str, int eflags=0) const;
   // return true if str matches the regex and set position
   bool firstMatch(const char *str, int& start, int& len, int eflags=0) const;
   // return true if str matches the regex and return all positions
   // in all: all[0]=start1, all[1]=len1, all[2]=start2, all[3]=len2, ...
   bool allMatches(const char *str, tvector<int>& all, int eflags=0) const;
   // same as above but also recognize substrings in all
   bool allMatchesSubstring(const char *str, tvector<tvector<int> >& all, 
			    int eflags=0, int progress=0, int progmode=0) const;

   // constants for allMatchesSubstring(..., progmode)
   // default: print '.' to stdout
   // P_STDERR: print to stderr
   // P_NUMBER: print number instead of a '.'
   enum {P_STDERR=1, P_NUMBER=2};

   // error exceptions
   class TErroneousRegexException: public TException {
      TExceptionN(TErroneousRegexException);
      TErroneousRegexException(int error_, const regex_t& preg_): error(error_), preg(preg_) {}
      const char *str() const {
	 static char buf[256];
	 regerror(error, &preg, buf, sizeof(buf));
	 return buf;
      }
      int error;
      regex_t preg;
      TExceptionM2("%s (error #%d)", str(), error);
   };
   class TNoSubRegexException: public TException {TExceptionN(TErroneousRegexException);};

 private: 
   // private data
   regex_t preg;
   bool nosub;
   
   // forbid default copy and assignment
   TRegEx(const TRegEx&);                  
   const TRegEx& operator=(const TRegEx&);    
};


// substitute occurences occ in string with sub and write to out
// and use back references in sub from occ (\0 .. \9 \a .. \z)
void parameterSubstitution(const tstring& in, tstring& out, const tstring& sub,
			   const tvector<tvector<int> >& occ, 
			   bool preserve_case=false, int modify_case=0,
			   int progress=0, const tstring& pre_padstring=tstring(), 
			   const tstring& post_padstring=tstring(), tvector<int> *match_pos=0);


#endif /* tregex.h */