[Libreoffice-commits] .: regexp/prj regexp/source
Matus Kukan
mkukan at kemper.freedesktop.org
Tue Sep 27 10:43:23 PDT 2011
regexp/prj/d.lst | 1
regexp/source/reclass.hxx | 388 ----------------------------------------------
2 files changed, 389 deletions(-)
New commits:
commit 31e7820f03badc3c6fe8fdaffb74f2125e05ea96
Author: Matúš Kukan <matus.kukan at gmail.com>
Date: Tue Sep 27 19:41:05 2011 +0200
remove unused header and clean d.lst which should be empty
diff --git a/regexp/prj/d.lst b/regexp/prj/d.lst
index 3f38fbe..e69de29 100644
--- a/regexp/prj/d.lst
+++ b/regexp/prj/d.lst
@@ -1 +0,0 @@
-..\%__SRC%\lib\libi18nregexp*.dll.a %_DEST%\lib\libi18nregexp*.dll.a
diff --git a/regexp/source/reclass.hxx b/regexp/source/reclass.hxx
deleted file mode 100644
index 34d1c27..0000000
--- a/regexp/source/reclass.hxx
+++ /dev/null
@@ -1,388 +0,0 @@
-/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
-/* Definitions for data structures and routines for the regular
- expression library, version 0.12.
- Copyright (C) 1985,89,90,91,92,93,95,96,97,98 Free Software Foundation, Inc.
-
- This file is part of the GNU C Library. Its master source is NOT part of
- the C library, however. The master source lives in /gd/gnu/lib.
-
- The GNU C Library is free software; you can redistribute it and/or
- modify it under the terms of the GNU Library General Public License as
- published by the Free Software Foundation; either version 2 of the
- License, or (at your option) any later version.
-
- The GNU C Library is distributed in the hope that it will be useful,
- but WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- Library General Public License for more details.
-
- You should have received a copy of the GNU Library General Public
- License along with the GNU C Library; see the file COPYING.LIB. If not,
- write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
- Boston, MA 02111-1307, USA. */
-
-/*
- Modified for OpenOffice.org to use sal_Unicode and Transliteration service.
- */
-
-#ifndef INCLUDED_REGEXP_RECLASS_HXX
-#define INCLUDED_REGEXP_RECLASS_HXX
-
-#include <i18nutil/unicode.hxx>
-#include <com/sun/star/util/SearchFlags.hpp>
-#include <com/sun/star/util/SearchOptions.hpp>
-#include <sal/types.h>
-#include <com/sun/star/i18n/XExtendedTransliteration.hpp>
-
-/* If any error codes are removed, changed, or added, update the
- `re_error_msg' table in regex.c. */
-typedef enum
-{
-#ifdef _XOPEN_SOURCE
- REG_ENOSYS = -1, /* This will never happen for this implementation. */
-#endif
-
- REG_NOERROR = 0, /* Success. */
- REG_NOMATCH, /* Didn't find a match (for regexec). */
-
- /* POSIX regcomp return error codes. (In the order listed in the
- standard.) */
- REG_BADPAT, /* Invalid pattern. */
- REG_ECOLLATE, /* Not implemented. */
- REG_ECTYPE, /* Invalid character class name. */
- REG_EESCAPE, /* Trailing backslash. */
- REG_ESUBREG, /* Invalid back reference. */
- REG_EBRACK, /* Unmatched left bracket. */
- REG_EPAREN, /* Parenthesis imbalance. */
- REG_EBRACE, /* Unmatched \{. */
- REG_BADBR, /* Invalid contents of \{\}. */
- REG_ERANGE, /* Invalid range end. */
- REG_ESPACE, /* Ran out of memory. */
- REG_BADRPT, /* No preceding re for repetition op. */
-
- /* Error codes we've added. */
- REG_EEND, /* Premature end. */
- REG_ESIZE, /* Compiled pattern bigger than 2^16 bytes. */
- REG_ERPAREN /* Unmatched ) or \); not returned from regcomp. */
-} reg_errcode_t;
-
-
-/* This data structure represents a compiled pattern. Before calling
- the pattern compiler, the fields `buffer', `allocated', `fastmap',
- can be set. After the pattern has been
- compiled, the `re_nsub' field is available. All other fields are
- private to the regex routines. */
-
-struct re_pattern_buffer
-{
-/* [[[begin pattern_buffer]]] */
- /* Space that holds the compiled pattern. It is declared as
- `unsigned char *' because its elements are
- sometimes used as array indexes. */
- sal_Unicode *buffer;
-
- /* Number of bytes to which `buffer' points. */
- sal_uInt32 allocated;
-
- /* Number of bytes actually used in `buffer'. */
- sal_uInt32 used;
-
- /* Pointer to a fastmap, if any, otherwise zero. re_search uses
- the fastmap, if there is one, to skip over impossible
- starting points for matches. */
- sal_Unicode *fastmap;
-
-
- /* Number of subexpressions found by the compiler. */
- size_t re_nsub;
-
- /* Zero if this pattern cannot match the empty string, one else.
- Well, in truth it's used only in `re_search2', to see
- whether or not we should use the fastmap, so we don't set
- this absolutely perfectly; see `re_compile_fastmap' (the
- `duplicate' case). */
- unsigned can_be_null : 1;
-
- /* Set to zero when `regex_compile' compiles a pattern; set to one
- by `re_compile_fastmap' if it updates the fastmap. */
- unsigned fastmap_accurate : 1;
-
- /* If set, a beginning-of-line anchor doesn't match at the
- beginning of the string. */
- unsigned not_bol : 1;
-
- /* Similarly for an end-of-line anchor. */
- unsigned not_eol : 1;
-
- /* If true, an anchor at a newline matches. */
- unsigned newline_anchor : 1;
-
-/* [[[end pattern_buffer]]] */
-};
-
-/* These are the command codes that appear in compiled regular
- expressions. Some opcodes are followed by argument bytes. A
- command code can specify any interpretation whatsoever for its
- arguments. Zero bytes may appear in the compiled regular expression. */
-
-typedef enum
-{
- no_op = 0,
-
- /* Succeed right away--no more backtracking. */
- succeed,
-
- /* Followed by one byte giving n, then by n literal bytes. */
- exactn,
-
- /* Matches any (more or less) character. */
- anychar,
-
- /* Matches any one char belonging to specified set. First
- following byte is number of bitmap bytes. Then come bytes
- for a bitmap saying which chars are in. Bits in each byte
- are ordered low-bit-first. A character is in the set if its
- bit is 1. A character too large to have a bit in the map is
- automatically not in the set. */
- charset,
-
- /* Same parameters as charset, but match any character that is
- not one of those specified. */
- charset_not,
-
- /* Start remembering the text that is matched, for storing in a
- register. Followed by one byte with the register number, in
- the range 0 to one less than the pattern buffer's re_nsub
- field. Then followed by one byte with the number of groups
- inner to this one. (This last has to be part of the
- start_memory only because we need it in the on_failure_jump
- of re_match2.) */
- start_memory,
- /* Stop remembering the text that is matched and store it in a
- memory register. Followed by one byte with the register
- number, in the range 0 to one less than `re_nsub' in the
- pattern buffer, and one byte with the number of inner groups,
- just like `start_memory'. (We need the number of inner
- groups here because we don't have any easy way of finding the
- corresponding start_memory when we're at a stop_memory.) */
- stop_memory,
-
- /* Match a duplicate of something remembered. Followed by one
- byte containing the register number. */
- duplicate,
-
- /* Fail unless at beginning of line. */
- begline,
-
- /* Fail unless at end of line. */
- endline,
-
- /* Succeeds if at beginning of buffer (if emacs) or at beginning
- of string to be matched (if not). */
- begbuf,
-
- /* Analogously, for end of buffer/string. */
- endbuf,
-
- /* Followed by two byte relative address to which to jump. */
- jump,
-
- /* Same as jump, but marks the end of an alternative. */
- jump_past_alt,
-
- /* Followed by two-byte relative address of place to resume at
- in case of failure. */
- on_failure_jump,
-
- /* Like on_failure_jump, but pushes a placeholder instead of the
- current string position when executed. */
- on_failure_keep_string_jump,
-
- /* Throw away latest failure point and then jump to following
- two-byte relative address. */
- pop_failure_jump,
-
- /* Change to pop_failure_jump if know won't have to backtrack to
- match; otherwise change to jump. This is used to jump
- back to the beginning of a repeat. If what follows this jump
- clearly won't match what the repeat does, such that we can be
- sure that there is no use backtracking out of repetitions
- already matched, then we change it to a pop_failure_jump.
- Followed by two-byte address. */
- maybe_pop_jump,
-
- /* Jump to following two-byte address, and push a dummy failure
- point. This failure point will be thrown away if an attempt
- is made to use it for a failure. A `+' construct makes this
- before the first repeat. Also used as an intermediary kind
- of jump when compiling an alternative. */
- dummy_failure_jump,
-
- /* Push a dummy failure point and continue. Used at the end of
- alternatives. */
- push_dummy_failure,
-
- /* Followed by two-byte relative address and two-byte number n.
- After matching N times, jump to the address upon failure. */
- succeed_n,
-
- /* Followed by two-byte relative address, and two-byte number n.
- Jump to the address N times, then fail. */
- jump_n,
-
- /* Set the following two-byte relative address to the
- subsequent two-byte number. The address *includes* the two
- bytes of number. */
- set_number_at,
-
- wordbeg, /* Succeeds if at word beginning. */
- wordend /* Succeeds if at word end. */
-
-} re_opcode_t;
-
-typedef struct re_pattern_buffer regex_t;
-
-/* Type for byte offsets within the string. POSIX mandates this. */
-typedef sal_Int32 regoff_t;
-
-/* This is the structure we store register match data in. See
- regex.texinfo for a full description of what registers match. */
-struct re_registers
-{
- sal_uInt32 num_regs;
- sal_Int32 *start;
- sal_Int32 *end;
- sal_Int32 num_of_match;
-};
-
-typedef struct {
- sal_Int32 begalt_offset;
- sal_Int32 fixup_alt_jump;
- sal_Int32 inner_group_offset;
- sal_Int32 laststart_offset;
- sal_uInt32 regnum;
-} compile_stack_elt_t;
-
-typedef struct {
- compile_stack_elt_t *stack;
- sal_uInt32 size;
- sal_uInt32 avail;
-} compile_stack_type;
-
-union fail_stack_elt
-{
- sal_Unicode *pointer;
- sal_Int32 integer;
-};
-
-typedef union fail_stack_elt fail_stack_elt_t;
-
-typedef struct
-{
- fail_stack_elt_t *stack;
- sal_uInt32 size;
- sal_uInt32 avail; /* Offset of next open position. */
-} fail_stack_type;
-
-typedef union
-{
- fail_stack_elt_t word;
- struct
- {
- /* This field is one if this group can match the empty string,
- zero if not. If not yet determined, `MATCH_NULL_UNSET_VALUE'. */
-#define MATCH_NULL_UNSET_VALUE 3
- unsigned match_null_string_p : 2;
- unsigned is_active : 1;
- unsigned matched_something : 1;
- unsigned ever_matched_something : 1;
- } bits;
-} register_info_type;
-
-
-class Regexpr
-{
- ::com::sun::star::uno::Reference<
- ::com::sun::star::i18n::XExtendedTransliteration > translit;
-
- const sal_Unicode *line; // line to search in
- sal_Int32 linelen; // length of search string
-
- sal_Unicode *pattern; // RE pattern to match
- sal_Int32 patsize; // Length of pattern
-
- struct re_pattern_buffer *bufp;
-
- sal_Bool isIgnoreCase;
-
- /* Either a translate table to apply to all characters before
- comparing them, or zero for no translation. The translation
- is applied to a pattern when it is compiled and to a string
- when it is matched. */
- int translate;
-
- sal_uInt32 failure_id;
- sal_uInt32 nfailure_points_pushed;
- sal_uInt32 nfailure_points_popped;
- /* Counts the total number of registers pushed. */
- sal_uInt32 num_regs_pushed;
-
- sal_uInt32 re_max_failures;
-
- /* Registers are set to a sentinel when they haven't yet matched. */
- sal_Unicode reg_unset_dummy;
-
- // private instance functions
- inline void store_number( sal_Unicode * destination, sal_Int32 number );
- inline void store_number_and_incr( sal_Unicode *& destination, sal_Int32 number );
- inline void extract_number(sal_Int32 & dest, sal_Unicode *source);
- inline void extract_number_and_incr(sal_Int32 & destination, sal_Unicode *& source);
-
- sal_Bool group_match_null_string_p(sal_Unicode **p, sal_Unicode *end,
- register_info_type *reg_info);
- sal_Bool alt_match_null_string_p(sal_Unicode *p, sal_Unicode *end,
- register_info_type *reg_info);
-
- sal_Bool common_op_match_null_string_p(sal_Unicode **p, sal_Unicode *end,
- register_info_type *reg_info);
- sal_Int32 bcmp_translate(const sal_Unicode *s1,
- const sal_Unicode *s2, sal_Int32 len);
-
- sal_Int32 regcomp(void);
- sal_Int32 regex_compile(void);
- inline void store_op1(re_opcode_t op, sal_Unicode *loc, sal_Int32 arg);
- inline void store_op2(re_opcode_t op, sal_Unicode *loc, sal_Int32 arg1, sal_Int32 arg2);
- void insert_op1(re_opcode_t op, sal_Unicode *loc, sal_Int32 arg,
- sal_Unicode *end);
- void insert_op2(re_opcode_t op, sal_Unicode *loc, sal_Int32 arg1,
- sal_Int32 arg2, sal_Unicode *end);
- sal_Bool at_begline_loc_p(const sal_Unicode *local_pattern,
- const sal_Unicode *p);
- sal_Bool at_endline_loc_p(const sal_Unicode *p, const sal_Unicode *pend);
- reg_errcode_t compile_range(sal_Unicode range_begin, sal_Unicode range_end, sal_Unicode *b);
- sal_Bool group_in_compile_stack(compile_stack_type compile_stack,
- sal_uInt32 regnum);
- sal_Int32 re_match2(struct re_registers *regs, sal_Int32 pos, sal_Int32 range);
-
- sal_Bool iswordbegin(const sal_Unicode *d, sal_Unicode *string, sal_Int32 ssize);
- sal_Bool iswordend(const sal_Unicode *d, sal_Unicode *string, sal_Int32 ssize);
- void set_list_bit(sal_Unicode c, sal_Unicode *b);
-
-public:
- // constructors
- Regexpr( const ::com::sun::star::util::SearchOptions & rOptions,
- ::com::sun::star::uno::Reference<
- ::com::sun::star::i18n::XExtendedTransliteration > XTrans );
-
- // destructor
- ~Regexpr();
-
- void set_line( const sal_Unicode *line, sal_Int32 len );
-
- // function returning pointers to occurrences in regs
- sal_Int32 re_search(struct re_registers *regs, sal_Int32 pOffset); // find pattern in line
-};
-
-#endif
-
-/* vim:set shiftwidth=4 softtabstop=4 expandtab: */
More information about the Libreoffice-commits
mailing list