emacs: src/search.c annotate

author	Dave Love <fx@gnu.org>
date	Fri, 28 Jan 2000 23:14:55 +0000 (2000-01-28)
parents	1121a5da20a5
children	5cd59d1800ad

rev	line source
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	1 /* String search routines for GNU Emacs.
26088 b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings. Paul Eggert <eggert@twinsun.com> parents: 25663 diff changeset	2 Copyright (C) 1985, 86,87,93,94,97,98, 1999 Free Software Foundation, Inc.
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	3
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	4 This file is part of GNU Emacs.
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	5
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	6 GNU Emacs is free software; you can redistribute it and/or modify
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	7 it under the terms of the GNU General Public License as published by
12244 ac7375e60931 Update GPL to version 2. Karl Heuer <kwzh@gnu.org> parents: 12148 diff changeset	8 the Free Software Foundation; either version 2, or (at your option)
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	9 any later version.
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	10
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	11 GNU Emacs is distributed in the hope that it will be useful,
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	12 but WITHOUT ANY WARRANTY; without even the implied warranty of
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	14 GNU General Public License for more details.
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	15
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	16 You should have received a copy of the GNU General Public License
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	17 along with GNU Emacs; see the file COPYING. If not, write to
14186 ee40177f6c68 Update FSF's address in the preamble. Erik Naggum <erik@naggum.no> parents: 14086 diff changeset	18 the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
ee40177f6c68 Update FSF's address in the preamble. Erik Naggum <erik@naggum.no> parents: 14086 diff changeset	19 Boston, MA 02111-1307, USA. */
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	20
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	21
4696 1fc792473491 Include <config.h> instead of "config.h". Roland McGrath <roland@gnu.org> parents: 4635 diff changeset	22 #include <config.h>
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	23 #include "lisp.h"
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	24 #include "syntax.h"
17053 df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	25 #include "category.h"
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	26 #include "buffer.h"
17053 df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	27 #include "charset.h"
9410 8598c3d6f2f0 * search.c: #include "region-cache.h". Jim Blandy <jimb@redhat.com> parents: 9319 diff changeset	28 #include "region-cache.h"
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	29 #include "commands.h"
2439 b6c62e4abf59 Put interrupt input blocking in a separate file from xterm.h. Jim Blandy <jimb@redhat.com> parents: 2393 diff changeset	30 #include "blockinput.h"
20347 d8e5f3c1618b Include "intervals.h" for prototypes. Andreas Schwab <schwab@suse.de> parents: 19541 diff changeset	31 #include "intervals.h"
621 eca8812e61cd * empty log message * Jim Blandy <jimb@redhat.com> parents: 605 diff changeset	32
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	33 #include <sys/types.h>
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	34 #include "regex.h"
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	35
21457 8c6ea32aadfa (min, max): Make these macros, not functions. Karl Heuer <kwzh@gnu.org> parents: 21248 diff changeset	36 #define min(a, b) ((a) < (b) ? (a) : (b))
8c6ea32aadfa (min, max): Make these macros, not functions. Karl Heuer <kwzh@gnu.org> parents: 21248 diff changeset	37 #define max(a, b) ((a) > (b) ? (a) : (b))
8c6ea32aadfa (min, max): Make these macros, not functions. Karl Heuer <kwzh@gnu.org> parents: 21248 diff changeset	38
16275 a4bcfdc9bb66 (REGEXP_CACHE_SIZE): Increase to 20. Richard M. Stallman <rms@gnu.org> parents: 16152 diff changeset	39 #define REGEXP_CACHE_SIZE 20
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	40
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	41 /* If the regexp is non-nil, then the buffer contains the compiled form
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	42 of that regexp, suitable for searching. */
16275 a4bcfdc9bb66 (REGEXP_CACHE_SIZE): Increase to 20. Richard M. Stallman <rms@gnu.org> parents: 16152 diff changeset	43 struct regexp_cache
a4bcfdc9bb66 (REGEXP_CACHE_SIZE): Increase to 20. Richard M. Stallman <rms@gnu.org> parents: 16152 diff changeset	44 {
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	45 struct regexp_cache *next;
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	46 Lisp_Object regexp;
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	47 struct re_pattern_buffer buf;
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	48 char fastmap[0400];
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	49 /* Nonzero means regexp was compiled to do full POSIX backtracking. */
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	50 char posix;
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	51 };
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	52
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	53 /* The instances of that struct. */
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	54 struct regexp_cache searchbufs[REGEXP_CACHE_SIZE];
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	55
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	56 /* The head of the linked list; points to the most recently used buffer. */
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	57 struct regexp_cache *searchbuf_head;
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	58
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	59
621 eca8812e61cd * empty log message * Jim Blandy <jimb@redhat.com> parents: 605 diff changeset	60 /* Every call to re_match, etc., must pass &search_regs as the regs
eca8812e61cd * empty log message * Jim Blandy <jimb@redhat.com> parents: 605 diff changeset	61 argument unless you can show it is unnecessary (i.e., if re_match
eca8812e61cd * empty log message * Jim Blandy <jimb@redhat.com> parents: 605 diff changeset	62 is certainly going to be called again before region-around-match
eca8812e61cd * empty log message * Jim Blandy <jimb@redhat.com> parents: 605 diff changeset	63 can be called).
eca8812e61cd * empty log message * Jim Blandy <jimb@redhat.com> parents: 605 diff changeset	64
eca8812e61cd * empty log message * Jim Blandy <jimb@redhat.com> parents: 605 diff changeset	65 Since the registers are now dynamically allocated, we need to make
eca8812e61cd * empty log message * Jim Blandy <jimb@redhat.com> parents: 605 diff changeset	66 sure not to refer to the Nth register before checking that it has
708 030fb4635335 * empty log message * Jim Blandy <jimb@redhat.com> parents: 648 diff changeset	67 been allocated by checking search_regs.num_regs.
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	68
708 030fb4635335 * empty log message * Jim Blandy <jimb@redhat.com> parents: 648 diff changeset	69 The regex code keeps track of whether it has allocated the search
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	70 buffer using bits in the re_pattern_buffer. This means that whenever
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	71 you compile a new pattern, it completely forgets whether it has
708 030fb4635335 * empty log message * Jim Blandy <jimb@redhat.com> parents: 648 diff changeset	72 allocated any registers, and will allocate new registers the next
030fb4635335 * empty log message * Jim Blandy <jimb@redhat.com> parents: 648 diff changeset	73 time you call a searching or matching function. Therefore, we need
030fb4635335 * empty log message * Jim Blandy <jimb@redhat.com> parents: 648 diff changeset	74 to call re_set_registers after compiling a new pattern or after
030fb4635335 * empty log message * Jim Blandy <jimb@redhat.com> parents: 648 diff changeset	75 setting the match registers, so that the regex functions will be
030fb4635335 * empty log message * Jim Blandy <jimb@redhat.com> parents: 648 diff changeset	76 able to free or re-allocate it properly. */
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	77 static struct re_registers search_regs;
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	78
727 540b047ece4d * empty log message * Jim Blandy <jimb@redhat.com> parents: 708 diff changeset	79 /* The buffer in which the last search was performed, or
540b047ece4d * empty log message * Jim Blandy <jimb@redhat.com> parents: 708 diff changeset	80 Qt if the last search was done in a string;
540b047ece4d * empty log message * Jim Blandy <jimb@redhat.com> parents: 708 diff changeset	81 Qnil if no searching has been done yet. */
540b047ece4d * empty log message * Jim Blandy <jimb@redhat.com> parents: 708 diff changeset	82 static Lisp_Object last_thing_searched;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	83
14036 621a575db6f7 Comment fixes. Karl Heuer <kwzh@gnu.org> parents: 13295 diff changeset	84 /* error condition signaled when regexp compile_pattern fails */
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	85
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	86 Lisp_Object Qinvalid_regexp;
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	87
5556 14161cfec24a (set_search_regs): New subroutine. Richard M. Stallman <rms@gnu.org> parents: 4954 diff changeset	88 static void set_search_regs ();
10055 cb713218845a (save_search_regs): Add declaration. Richard M. Stallman <rms@gnu.org> parents: 10032 diff changeset	89 static void save_search_regs ();
20869 c9f608f889b4 (boyer_moore, simple_search): New subroutines. Richard M. Stallman <rms@gnu.org> parents: 20824 diff changeset	90 static int simple_search ();
c9f608f889b4 (boyer_moore, simple_search): New subroutines. Richard M. Stallman <rms@gnu.org> parents: 20824 diff changeset	91 static int boyer_moore ();
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	92 static int search_buffer ();
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	93
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	94 static void
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	95 matcher_overflow ()
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	96 {
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	97 error ("Stack overflow in regexp matcher");
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	98 }
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	99
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	100 #ifdef __STDC__
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	101 #define CONST const
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	102 #else
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	103 #define CONST
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	104 #endif
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	105
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	106 /* Compile a regexp and signal a Lisp error if anything goes wrong.
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	107 PATTERN is the pattern to compile.
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	108 CP is the place to put the result.
20869 c9f608f889b4 (boyer_moore, simple_search): New subroutines. Richard M. Stallman <rms@gnu.org> parents: 20824 diff changeset	109 TRANSLATE is a translation table for ignoring case, or nil for none.
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	110 REGP is the structure that says where to store the "register"
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	111 values that will result from matching this pattern.
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	112 If it is 0, we should compile the pattern not to record any
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	113 subexpression bounds.
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	114 POSIX is nonzero if we want full backtracking (POSIX style)
17053 df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	115 for this pattern. 0 means backtrack only enough to get a valid match.
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	116 MULTIBYTE is nonzero if we want to handle multibyte characters in
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	117 PATTERN. 0 means all multibyte characters are recognized just as
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	118 sequences of binary data. */
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	119
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	120 static void
17053 df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	121 compile_pattern_1 (cp, pattern, translate, regp, posix, multibyte)
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	122 struct regexp_cache *cp;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	123 Lisp_Object pattern;
20869 c9f608f889b4 (boyer_moore, simple_search): New subroutines. Richard M. Stallman <rms@gnu.org> parents: 20824 diff changeset	124 Lisp_Object translate;
708 030fb4635335 * empty log message * Jim Blandy <jimb@redhat.com> parents: 648 diff changeset	125 struct re_registers *regp;
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	126 int posix;
17053 df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	127 int multibyte;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	128 {
21915 8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern. Richard M. Stallman <rms@gnu.org> parents: 21887 diff changeset	129 unsigned char *raw_pattern;
20671 be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	130 int raw_pattern_size;
18762 12c0de0113af (compile_pattern_1): Don't declare val with CONST. Richard M. Stallman <rms@gnu.org> parents: 18193 diff changeset	131 char *val;
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	132 reg_syntax_t old;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	133
20671 be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	134 /* MULTIBYTE says whether the text to be searched is multibyte.
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	135 We must convert PATTERN to match that, or we will not really
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	136 find things right. */
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	137
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	138 if (multibyte == STRING_MULTIBYTE (pattern))
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	139 {
21915 8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern. Richard M. Stallman <rms@gnu.org> parents: 21887 diff changeset	140 raw_pattern = (unsigned char *) XSTRING (pattern)->data;
21244 50929073a0ba Use STRING_BYTES and SET_STRING_BYTES. Richard M. Stallman <rms@gnu.org> parents: 21171 diff changeset	141 raw_pattern_size = STRING_BYTES (XSTRING (pattern));
20671 be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	142 }
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	143 else if (multibyte)
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	144 {
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	145 raw_pattern_size = count_size_as_multibyte (XSTRING (pattern)->data,
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	146 XSTRING (pattern)->size);
21915 8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern. Richard M. Stallman <rms@gnu.org> parents: 21887 diff changeset	147 raw_pattern = (unsigned char *) alloca (raw_pattern_size + 1);
20671 be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	148 copy_text (XSTRING (pattern)->data, raw_pattern,
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	149 XSTRING (pattern)->size, 0, 1);
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	150 }
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	151 else
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	152 {
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	153 /* Converting multibyte to single-byte.
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	154
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	155 ??? Perhaps this conversion should be done in a special way
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	156 by subtracting nonascii-insert-offset from each non-ASCII char,
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	157 so that only the multibyte chars which really correspond to
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	158 the chosen single-byte character set can possibly match. */
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	159 raw_pattern_size = XSTRING (pattern)->size;
21915 8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern. Richard M. Stallman <rms@gnu.org> parents: 21887 diff changeset	160 raw_pattern = (unsigned char *) alloca (raw_pattern_size + 1);
20671 be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	161 copy_text (XSTRING (pattern)->data, raw_pattern,
21244 50929073a0ba Use STRING_BYTES and SET_STRING_BYTES. Richard M. Stallman <rms@gnu.org> parents: 21171 diff changeset	162 STRING_BYTES (XSTRING (pattern)), 1, 0);
20671 be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	163 }
be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	164
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	165 cp->regexp = Qnil;
21531 5811a3129878 (compile_pattern, compile_pattern_1): Fix mixing of Andreas Schwab <schwab@suse.de> parents: 21514 diff changeset	166 cp->buf.translate = (! NILP (translate) ? translate : make_number (0));
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	167 cp->posix = posix;
17053 df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	168 cp->buf.multibyte = multibyte;
2439 b6c62e4abf59 Put interrupt input blocking in a separate file from xterm.h. Jim Blandy <jimb@redhat.com> parents: 2393 diff changeset	169 BLOCK_INPUT;
25441 d30cff97fb20 (compile_pattern_1): Enable RE_CHAR_CLASSES for regexp. Richard M. Stallman <rms@gnu.org> parents: 24716 diff changeset	170 old = re_set_syntax (RE_SYNTAX_EMACS \| RE_CHAR_CLASSES
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	171 \| (posix ? 0 : RE_NO_POSIX_BACKTRACKING));
21915 8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern. Richard M. Stallman <rms@gnu.org> parents: 21887 diff changeset	172 val = (char ) re_compile_pattern ((char )raw_pattern,
8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern. Richard M. Stallman <rms@gnu.org> parents: 21887 diff changeset	173 raw_pattern_size, &cp->buf);
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	174 re_set_syntax (old);
2439 b6c62e4abf59 Put interrupt input blocking in a separate file from xterm.h. Jim Blandy <jimb@redhat.com> parents: 2393 diff changeset	175 UNBLOCK_INPUT;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	176 if (val)
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	177 Fsignal (Qinvalid_regexp, Fcons (build_string (val), Qnil));
708 030fb4635335 * empty log message * Jim Blandy <jimb@redhat.com> parents: 648 diff changeset	178
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	179 cp->regexp = Fcopy_sequence (pattern);
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	180 }
708 030fb4635335 * empty log message * Jim Blandy <jimb@redhat.com> parents: 648 diff changeset	181
22221 239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	182 /* Shrink each compiled regexp buffer in the cache
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	183 to the size actually used right now.
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	184 This is called from garbage collection. */
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	185
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	186 void
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	187 shrink_regexp_cache ()
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	188 {
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	189 struct regexp_cache cp, *cpp;
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	190
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	191 for (cp = searchbuf_head; cp != 0; cp = cp->next)
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	192 {
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	193 cp->buf.allocated = cp->buf.used;
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	194 cp->buf.buffer
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	195 = (unsigned char *) realloc (cp->buf.buffer, cp->buf.used);
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	196 }
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	197 }
239a4b800303 (shrink_regexp_cache): New function. Richard M. Stallman <rms@gnu.org> parents: 22082 diff changeset	198
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	199 /* Compile a regexp if necessary, but first check to see if there's one in
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	200 the cache.
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	201 PATTERN is the pattern to compile.
20869 c9f608f889b4 (boyer_moore, simple_search): New subroutines. Richard M. Stallman <rms@gnu.org> parents: 20824 diff changeset	202 TRANSLATE is a translation table for ignoring case, or nil for none.
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	203 REGP is the structure that says where to store the "register"
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	204 values that will result from matching this pattern.
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	205 If it is 0, we should compile the pattern not to record any
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	206 subexpression bounds.
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	207 POSIX is nonzero if we want full backtracking (POSIX style)
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	208 for this pattern. 0 means backtrack only enough to get a valid match. */
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	209
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	210 struct re_pattern_buffer *
20588 138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	211 compile_pattern (pattern, regp, translate, posix, multibyte)
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	212 Lisp_Object pattern;
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	213 struct re_registers *regp;
20869 c9f608f889b4 (boyer_moore, simple_search): New subroutines. Richard M. Stallman <rms@gnu.org> parents: 20824 diff changeset	214 Lisp_Object translate;
20588 138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	215 int posix, multibyte;
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	216 {
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	217 struct regexp_cache cp, *cpp;
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	218
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	219 for (cpp = &searchbuf_head; ; cpp = &cp->next)
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	220 {
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	221 cp = *cpp;
16275 a4bcfdc9bb66 (REGEXP_CACHE_SIZE): Increase to 20. Richard M. Stallman <rms@gnu.org> parents: 16152 diff changeset	222 if (XSTRING (cp->regexp)->size == XSTRING (pattern)->size
a4bcfdc9bb66 (REGEXP_CACHE_SIZE): Increase to 20. Richard M. Stallman <rms@gnu.org> parents: 16152 diff changeset	223 && !NILP (Fstring_equal (cp->regexp, pattern))
21531 5811a3129878 (compile_pattern, compile_pattern_1): Fix mixing of Andreas Schwab <schwab@suse.de> parents: 21514 diff changeset	224 && EQ (cp->buf.translate, (! NILP (translate) ? translate : make_number (0)))
17053 df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	225 && cp->posix == posix
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	226 && cp->buf.multibyte == multibyte)
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	227 break;
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	228
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	229 /* If we're at the end of the cache, compile into the last cell. */
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	230 if (cp->next == 0)
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	231 {
17053 df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	232 compile_pattern_1 (cp, pattern, translate, regp, posix, multibyte);
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	233 break;
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	234 }
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	235 }
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	236
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	237 /* When we get here, cp (aka *cpp) contains the compiled pattern,
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	238 either because we found it in the cache or because we just compiled it.
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	239 Move it to the front of the queue to mark it as most recently used. */
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	240 *cpp = cp->next;
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	241 cp->next = searchbuf_head;
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	242 searchbuf_head = cp;
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	243
10141 afe81fd385eb (compile_pattern): Call re_set_registers here. Richard M. Stallman <rms@gnu.org> parents: 10128 diff changeset	244 /* Advise the searching functions about the space we have allocated
afe81fd385eb (compile_pattern): Call re_set_registers here. Richard M. Stallman <rms@gnu.org> parents: 10128 diff changeset	245 for register data. */
afe81fd385eb (compile_pattern): Call re_set_registers here. Richard M. Stallman <rms@gnu.org> parents: 10128 diff changeset	246 if (regp)
afe81fd385eb (compile_pattern): Call re_set_registers here. Richard M. Stallman <rms@gnu.org> parents: 10128 diff changeset	247 re_set_registers (&cp->buf, regp, regp->num_regs, regp->start, regp->end);
afe81fd385eb (compile_pattern): Call re_set_registers here. Richard M. Stallman <rms@gnu.org> parents: 10128 diff changeset	248
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	249 return &cp->buf;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	250 }
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	251
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	252 /* Error condition used for failing searches */
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	253 Lisp_Object Qsearch_failed;
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	254
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	255 Lisp_Object
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	256 signal_failure (arg)
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	257 Lisp_Object arg;
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	258 {
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	259 Fsignal (Qsearch_failed, Fcons (arg, Qnil));
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	260 return Qnil;
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	261 }
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	262
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	263 static Lisp_Object
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	264 looking_at_1 (string, posix)
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	265 Lisp_Object string;
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	266 int posix;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	267 {
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	268 Lisp_Object val;
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	269 unsigned char p1, p2;
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	270 int s1, s2;
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	271 register int i;
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	272 struct re_pattern_buffer *bufp;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	273
10032 f689803caa92 Added code for automatically saving and restoring the match data Francesco Potortì <pot@gnu.org> parents: 10020 diff changeset	274 if (running_asynch_code)
f689803caa92 Added code for automatically saving and restoring the match data Francesco Potortì <pot@gnu.org> parents: 10020 diff changeset	275 save_search_regs ();
f689803caa92 Added code for automatically saving and restoring the match data Francesco Potortì <pot@gnu.org> parents: 10020 diff changeset	276
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	277 CHECK_STRING (string, 0);
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	278 bufp = compile_pattern (string, &search_regs,
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	279 (!NILP (current_buffer->case_fold_search)
20869 c9f608f889b4 (boyer_moore, simple_search): New subroutines. Richard M. Stallman <rms@gnu.org> parents: 20824 diff changeset	280 ? DOWNCASE_TABLE : Qnil),
20588 138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	281 posix,
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	282 !NILP (current_buffer->enable_multibyte_characters));
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	283
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	284 immediate_quit = 1;
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	285 QUIT; /* Do a pending quit right away, to avoid paradoxical behavior */
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	286
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	287 /* Get pointers and sizes of the two strings
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	288 that make up the visible portion of the buffer. */
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	289
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	290 p1 = BEGV_ADDR;
20545 c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	291 s1 = GPT_BYTE - BEGV_BYTE;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	292 p2 = GAP_END_ADDR;
20545 c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	293 s2 = ZV_BYTE - GPT_BYTE;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	294 if (s1 < 0)
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	295 {
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	296 p2 = p1;
20545 c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	297 s2 = ZV_BYTE - BEGV_BYTE;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	298 s1 = 0;
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	299 }
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	300 if (s2 < 0)
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	301 {
20545 c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	302 s1 = ZV_BYTE - BEGV_BYTE;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	303 s2 = 0;
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	304 }
17463 bb9ae80d22e2 (looking_at_1): Set re_match_object. Richard M. Stallman <rms@gnu.org> parents: 17284 diff changeset	305
bb9ae80d22e2 (looking_at_1): Set re_match_object. Richard M. Stallman <rms@gnu.org> parents: 17284 diff changeset	306 re_match_object = Qnil;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	307
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	308 i = re_match_2 (bufp, (char ) p1, s1, (char ) p2, s2,
20545 c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	309 PT_BYTE - BEGV_BYTE, &search_regs,
c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	310 ZV_BYTE - BEGV_BYTE);
26985 1121a5da20a5 (looking_at_1): Reset immediate_quit before modifying Gerd Moellmann <gerd@gnu.org> parents: 26982 diff changeset	311 immediate_quit = 0;
1121a5da20a5 (looking_at_1): Reset immediate_quit before modifying Gerd Moellmann <gerd@gnu.org> parents: 26982 diff changeset	312
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	313 if (i == -2)
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	314 matcher_overflow ();
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	315
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	316 val = (0 <= i ? Qt : Qnil);
20545 c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	317 if (i >= 0)
c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	318 for (i = 0; i < search_regs.num_regs; i++)
c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	319 if (search_regs.start[i] >= 0)
c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	320 {
c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	321 search_regs.start[i]
c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	322 = BYTE_TO_CHAR (search_regs.start[i] + BEGV_BYTE);
c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	323 search_regs.end[i]
c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	324 = BYTE_TO_CHAR (search_regs.end[i] + BEGV_BYTE);
c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2. Richard M. Stallman <rms@gnu.org> parents: 20347 diff changeset	325 }
9278 f2138d548313 (Flooking_at, skip_chars, search_buffer, set_search_regs, Fstore_match_data): Karl Heuer <kwzh@gnu.org> parents: 9113 diff changeset	326 XSETBUFFER (last_thing_searched, current_buffer);
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	327 return val;
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	328 }
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	329
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	330 DEFUN ("looking-at", Flooking_at, Slooking_at, 1, 1, 0,
11213 d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name. Richard M. Stallman <rms@gnu.org> parents: 10250 diff changeset	331 "Return t if text after point matches regular expression REGEXP.\n\
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	332 This function modifies the match data that `match-beginning',\n\
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	333 `match-end' and `match-data' access; save and restore the match\n\
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	334 data if you want to preserve them.")
11213 d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name. Richard M. Stallman <rms@gnu.org> parents: 10250 diff changeset	335 (regexp)
d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name. Richard M. Stallman <rms@gnu.org> parents: 10250 diff changeset	336 Lisp_Object regexp;
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	337 {
11213 d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name. Richard M. Stallman <rms@gnu.org> parents: 10250 diff changeset	338 return looking_at_1 (regexp, 0);
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	339 }
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	340
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	341 DEFUN ("posix-looking-at", Fposix_looking_at, Sposix_looking_at, 1, 1, 0,
11213 d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name. Richard M. Stallman <rms@gnu.org> parents: 10250 diff changeset	342 "Return t if text after point matches regular expression REGEXP.\n\
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	343 Find the longest match, in accord with Posix regular expression rules.\n\
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	344 This function modifies the match data that `match-beginning',\n\
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	345 `match-end' and `match-data' access; save and restore the match\n\
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	346 data if you want to preserve them.")
11213 d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name. Richard M. Stallman <rms@gnu.org> parents: 10250 diff changeset	347 (regexp)
d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name. Richard M. Stallman <rms@gnu.org> parents: 10250 diff changeset	348 Lisp_Object regexp;
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	349 {
11213 d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name. Richard M. Stallman <rms@gnu.org> parents: 10250 diff changeset	350 return looking_at_1 (regexp, 1);
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	351 }
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	352
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	353 static Lisp_Object
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	354 string_match_1 (regexp, string, start, posix)
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	355 Lisp_Object regexp, string, start;
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	356 int posix;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	357 {
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	358 int val;
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	359 struct re_pattern_buffer *bufp;
20588 138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	360 int pos, pos_byte;
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	361 int i;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	362
10032 f689803caa92 Added code for automatically saving and restoring the match data Francesco Potortì <pot@gnu.org> parents: 10020 diff changeset	363 if (running_asynch_code)
f689803caa92 Added code for automatically saving and restoring the match data Francesco Potortì <pot@gnu.org> parents: 10020 diff changeset	364 save_search_regs ();
f689803caa92 Added code for automatically saving and restoring the match data Francesco Potortì <pot@gnu.org> parents: 10020 diff changeset	365
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	366 CHECK_STRING (regexp, 0);
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	367 CHECK_STRING (string, 1);
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	368
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	369 if (NILP (start))
20588 138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	370 pos = 0, pos_byte = 0;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	371 else
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	372 {
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	373 int len = XSTRING (string)->size;
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	374
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	375 CHECK_NUMBER (start, 2);
20588 138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	376 pos = XINT (start);
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	377 if (pos < 0 && -pos <= len)
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	378 pos = len + pos;
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	379 else if (0 > pos \|\| pos > len)
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	380 args_out_of_range (string, start);
20588 138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	381 pos_byte = string_char_to_byte (string, pos);
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	382 }
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	383
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	384 bufp = compile_pattern (regexp, &search_regs,
cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	385 (!NILP (current_buffer->case_fold_search)
20869 c9f608f889b4 (boyer_moore, simple_search): New subroutines. Richard M. Stallman <rms@gnu.org> parents: 20824 diff changeset	386 ? DOWNCASE_TABLE : Qnil),
20588 138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	387 posix,
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	388 STRING_MULTIBYTE (string));
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	389 immediate_quit = 1;
17463 bb9ae80d22e2 (looking_at_1): Set re_match_object. Richard M. Stallman <rms@gnu.org> parents: 17284 diff changeset	390 re_match_object = string;
bb9ae80d22e2 (looking_at_1): Set re_match_object. Richard M. Stallman <rms@gnu.org> parents: 17284 diff changeset	391
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	392 val = re_search (bufp, (char *) XSTRING (string)->data,
21244 50929073a0ba Use STRING_BYTES and SET_STRING_BYTES. Richard M. Stallman <rms@gnu.org> parents: 21171 diff changeset	393 STRING_BYTES (XSTRING (string)), pos_byte,
50929073a0ba Use STRING_BYTES and SET_STRING_BYTES. Richard M. Stallman <rms@gnu.org> parents: 21171 diff changeset	394 STRING_BYTES (XSTRING (string)) - pos_byte,
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	395 &search_regs);
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	396 immediate_quit = 0;
727 540b047ece4d * empty log message * Jim Blandy <jimb@redhat.com> parents: 708 diff changeset	397 last_thing_searched = Qt;
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	398 if (val == -2)
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	399 matcher_overflow ();
470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	400 if (val < 0) return Qnil;
20588 138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	401
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	402 for (i = 0; i < search_regs.num_regs; i++)
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	403 if (search_regs.start[i] >= 0)
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	404 {
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	405 search_regs.start[i]
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	406 = string_byte_to_char (string, search_regs.start[i]);
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	407 search_regs.end[i]
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	408 = string_byte_to_char (string, search_regs.end[i]);
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	409 }
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	410
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	411 return make_number (string_byte_to_char (string, val));
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	412 }
842 5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	413
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	414 DEFUN ("string-match", Fstring_match, Sstring_match, 2, 3, 0,
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	415 "Return index of start of first match for REGEXP in STRING, or nil.\n\
24433 118e66d79d64 (Fstring_match, Fposix_string_match): Doc fix. Karl Heuer <kwzh@gnu.org> parents: 24014 diff changeset	416 Case is ignored if `case-fold-search' is non-nil in the current buffer.\n\
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	417 If third arg START is non-nil, start search at that index in STRING.\n\
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	418 For index of first char beyond the match, do (match-end 0).\n\
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	419 `match-end' and `match-beginning' also give indices of substrings\n\
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	420 matched by parenthesis constructs in the pattern.")
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	421 (regexp, string, start)
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	422 Lisp_Object regexp, string, start;
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	423 {
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	424 return string_match_1 (regexp, string, start, 0);
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	425 }
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	426
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	427 DEFUN ("posix-string-match", Fposix_string_match, Sposix_string_match, 2, 3, 0,
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	428 "Return index of start of first match for REGEXP in STRING, or nil.\n\
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	429 Find the longest match, in accord with Posix regular expression rules.\n\
24433 118e66d79d64 (Fstring_match, Fposix_string_match): Doc fix. Karl Heuer <kwzh@gnu.org> parents: 24014 diff changeset	430 Case is ignored if `case-fold-search' is non-nil in the current buffer.\n\
10020 c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	431 If third arg START is non-nil, start search at that index in STRING.\n\
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	432 For index of first char beyond the match, do (match-end 0).\n\
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	433 `match-end' and `match-beginning' also give indices of substrings\n\
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	434 matched by parenthesis constructs in the pattern.")
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	435 (regexp, string, start)
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	436 Lisp_Object regexp, string, start;
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	437 {
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	438 return string_match_1 (regexp, string, start, 1);
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	439 }
c41ce96785a8 (struct regexp_cache): New field `posix'. Richard M. Stallman <rms@gnu.org> parents: 9605 diff changeset	440
842 5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	441 /* Match REGEXP against STRING, searching all of STRING,
5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	442 and return the index of the match, or negative on failure.
5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	443 This does not clobber the match data. */
5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	444
5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	445 int
5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	446 fast_string_match (regexp, string)
5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	447 Lisp_Object regexp, string;
5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	448 {
5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	449 int val;
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	450 struct re_pattern_buffer *bufp;
842 5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	451
20869 c9f608f889b4 (boyer_moore, simple_search): New subroutines. Richard M. Stallman <rms@gnu.org> parents: 20824 diff changeset	452 bufp = compile_pattern (regexp, 0, Qnil,
c9f608f889b4 (boyer_moore, simple_search): New subroutines. Richard M. Stallman <rms@gnu.org> parents: 20824 diff changeset	453 0, STRING_MULTIBYTE (string));
842 5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	454 immediate_quit = 1;
17463 bb9ae80d22e2 (looking_at_1): Set re_match_object. Richard M. Stallman <rms@gnu.org> parents: 17284 diff changeset	455 re_match_object = string;
bb9ae80d22e2 (looking_at_1): Set re_match_object. Richard M. Stallman <rms@gnu.org> parents: 17284 diff changeset	456
9605 cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and Karl Heuer <kwzh@gnu.org> parents: 9452 diff changeset	457 val = re_search (bufp, (char *) XSTRING (string)->data,
21244 50929073a0ba Use STRING_BYTES and SET_STRING_BYTES. Richard M. Stallman <rms@gnu.org> parents: 21171 diff changeset	458 STRING_BYTES (XSTRING (string)), 0,
50929073a0ba Use STRING_BYTES and SET_STRING_BYTES. Richard M. Stallman <rms@gnu.org> parents: 21171 diff changeset	459 STRING_BYTES (XSTRING (string)), 0);
842 5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	460 immediate_quit = 0;
5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	461 return val;
5ce0a9ac1ea7 entered into RCS Richard M. Stallman <rms@gnu.org> parents: 808 diff changeset	462 }
17053 df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	463
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	464 /* Match REGEXP against STRING, searching all of STRING ignoring case,
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	465 and return the index of the match, or negative on failure.
20588 138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	466 This does not clobber the match data.
138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	467 We assume that STRING contains single-byte characters. */
17053 df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	468
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	469 extern Lisp_Object Vascii_downcase_table;
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	470
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	471 int
18193 4e4c8edb56da (fast_c_string_match_ignore_case): Richard M. Stallman <rms@gnu.org> parents: 18124 diff changeset	472 fast_c_string_match_ignore_case (regexp, string)
17053 df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	473 Lisp_Object regexp;
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	474 char *string;
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	475 {
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	476 int val;
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	477 struct re_pattern_buffer *bufp;
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	478 int len = strlen (string);
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	479
20588 138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case. Richard M. Stallman <rms@gnu.org> parents: 20547 diff changeset	480 regexp = string_make_unibyte (regexp);
18193 4e4c8edb56da (fast_c_string_match_ignore_case): Richard M. Stallman <rms@gnu.org> parents: 18124 diff changeset	481 re_match_object = Qt;
17053 df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	482 bufp = compile_pattern (regexp, 0,
20869 c9f608f889b4 (boyer_moore, simple_search): New subroutines. Richard M. Stallman <rms@gnu.org> parents: 20824 diff changeset	483 Vascii_downcase_table, 0,
20671 be91d6130341 (compile_pattern_1): If representation of STRING Karl Heuer <kwzh@gnu.org> parents: 20588 diff changeset	484 0);
17053 df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	485 immediate_quit = 1;
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	486 val = re_search (bufp, string, len, 0, len, 0);
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	487 immediate_quit = 0;
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	488 return val;
df904355f033 Include category.h and charset.h. Karl Heuer <kwzh@gnu.org> parents: 16880 diff changeset	489 }
603 470f556a9453 Initial revision Jim Blandy <jimb@redhat.com> parents: diff changeset	490
9410 8598c3d6f2f0 * search.c: #include "region-cache.h". Jim Blandy <jimb@redhat.com> parents: 9319 diff changeset	491 /* The newline cache: remembering which sections of text have no newlines. */
8598c3d6f2f0 * search.c: #include "region-cache.h". Jim Blandy <jimb@redhat.com> parents: 9319 diff changeset	492
8598c3d6f2f0 * search.c: #include "region-cache.h". Jim Blandy <jimb@redhat.com> parents: 9319 diff changeset	493 /* If the user has requested newline caching, make sure it's on.
8598c3d6f2f0 * search.c: #include "region-cache.h". Jim Blandy <jimb@redhat.com> parents: 9319 diff changeset	494 Otherwise, make sure it's off.
8598c3d6f2f0 * search.c: #include "region-cache.h". Jim Blandy <jimb@redhat.com> parents: 9319 diff changeset	495 This is our cheezy way of associating an action with the change of
8598c3d6f2f0 * search.c: #include "region-cache.h". Jim Blandy <jimb@redhat.com> parents: 9319 diff changeset	496 state of a buffer-local variable. */
8598c3d6f2f0 * search.c: #include "region-cache.h". Jim Blandy <jimb@redhat.com> parents: 9319 diff changeset	497 static void
8598c3d6f2f0 * search.c: #include "region-cache.h". Jim Blandy <jimb@redhat.com> parents: 9319 diff changeset	498 newline_cache_on_off (buf)
8598c3d6f2f0 * search.c: #include "region-cache.h". Jim Blandy <jimb@redhat.com> parents: 9319 diff changeset	499 struct buffer *buf;
8598c3d6f2f0 * search.c: #include "region-cache.h". Jim Blandy <jimb@redhat.com> parents: 9319 diff changeset	500 {

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1 /* String search routines for GNU Emacs.

26088

b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.

Paul Eggert <eggert@twinsun.com>

parents: 25663

diff changeset

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

3

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

4 This file is part of GNU Emacs.

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

5

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

6 GNU Emacs is free software; you can redistribute it and/or modify

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

7 it under the terms of the GNU General Public License as published by

12244

ac7375e60931 Update GPL to version 2.

Karl Heuer <kwzh@gnu.org>

parents: 12148

diff changeset

8 the Free Software Foundation; either version 2, or (at your option)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

9 any later version.

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

10

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

11 GNU Emacs is distributed in the hope that it will be useful,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

12 but WITHOUT ANY WARRANTY; without even the implied warranty of

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

14 GNU General Public License for more details.

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

15

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

16 You should have received a copy of the GNU General Public License

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

17 along with GNU Emacs; see the file COPYING. If not, write to

14186

ee40177f6c68 Update FSF's address in the preamble.

Erik Naggum <erik@naggum.no>

parents: 14086

diff changeset

18 the Free Software Foundation, Inc., 59 Temple Place - Suite 330,

ee40177f6c68 Update FSF's address in the preamble.

Erik Naggum <erik@naggum.no>

parents: 14086

diff changeset

19 Boston, MA 02111-1307, USA. */

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

20

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

21

4696

1fc792473491 Include <config.h> instead of "config.h".

Roland McGrath <roland@gnu.org>

parents: 4635

diff changeset

22 #include <config.h>

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

23 #include "lisp.h"

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

24 #include "syntax.h"

17053

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

25 #include "category.h"

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

26 #include "buffer.h"

17053

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

27 #include "charset.h"

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

28 #include "region-cache.h"

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

29 #include "commands.h"

2439

b6c62e4abf59 Put interrupt input blocking in a separate file from xterm.h.

Jim Blandy <jimb@redhat.com>

parents: 2393

diff changeset

30 #include "blockinput.h"

20347

d8e5f3c1618b Include "intervals.h" for prototypes.

Andreas Schwab <schwab@suse.de>

parents: 19541

diff changeset

31 #include "intervals.h"

621

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

32

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

33 #include <sys/types.h>

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

34 #include "regex.h"

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

35

21457

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

36 #define min(a, b) ((a) < (b) ? (a) : (b))

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

37 #define max(a, b) ((a) > (b) ? (a) : (b))

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

38

16275

a4bcfdc9bb66 (REGEXP_CACHE_SIZE): Increase to 20.

Richard M. Stallman <rms@gnu.org>

parents: 16152

diff changeset

39 #define REGEXP_CACHE_SIZE 20

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

40

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

41 /* If the regexp is non-nil, then the buffer contains the compiled form

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

42 of that regexp, suitable for searching. */

16275

a4bcfdc9bb66 (REGEXP_CACHE_SIZE): Increase to 20.

Richard M. Stallman <rms@gnu.org>

parents: 16152

diff changeset

43 struct regexp_cache

a4bcfdc9bb66 (REGEXP_CACHE_SIZE): Increase to 20.

Richard M. Stallman <rms@gnu.org>

parents: 16152

diff changeset

44 {

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

45 struct regexp_cache *next;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

46 Lisp_Object regexp;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

47 struct re_pattern_buffer buf;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

48 char fastmap[0400];

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

49 /* Nonzero means regexp was compiled to do full POSIX backtracking. */

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

50 char posix;

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

51 };

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

52

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

53 /* The instances of that struct. */

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

54 struct regexp_cache searchbufs[REGEXP_CACHE_SIZE];

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

55

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

56 /* The head of the linked list; points to the most recently used buffer. */

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

57 struct regexp_cache *searchbuf_head;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

58

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

59

621

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

60 /* Every call to re_match, etc., must pass &search_regs as the regs

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

61 argument unless you can show it is unnecessary (i.e., if re_match

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

62 is certainly going to be called again before region-around-match

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

63 can be called).

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

64

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

65 Since the registers are now dynamically allocated, we need to make

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

66 sure not to refer to the Nth register before checking that it has

708

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

67 been allocated by checking search_regs.num_regs.

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

68

708

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

69 The regex code keeps track of whether it has allocated the search

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

70 buffer using bits in the re_pattern_buffer. This means that whenever

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

71 you compile a new pattern, it completely forgets whether it has

708

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

72 allocated any registers, and will allocate new registers the next

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

73 time you call a searching or matching function. Therefore, we need

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

74 to call re_set_registers after compiling a new pattern or after

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

75 setting the match registers, so that the regex functions will be

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

76 able to free or re-allocate it properly. */

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

77 static struct re_registers search_regs;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

78

727

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

79 /* The buffer in which the last search was performed, or

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

80 Qt if the last search was done in a string;

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

81 Qnil if no searching has been done yet. */

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

82 static Lisp_Object last_thing_searched;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

83

14036

621a575db6f7 Comment fixes.

Karl Heuer <kwzh@gnu.org>

parents: 13295

diff changeset

84 /* error condition signaled when regexp compile_pattern fails */

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

85

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

86 Lisp_Object Qinvalid_regexp;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

87

5556

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

88 static void set_search_regs ();

10055

cb713218845a (save_search_regs): Add declaration.

Richard M. Stallman <rms@gnu.org>

parents: 10032

diff changeset

89 static void save_search_regs ();

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

90 static int simple_search ();

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

91 static int boyer_moore ();

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

92 static int search_buffer ();

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

93

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

94 static void

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

95 matcher_overflow ()

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

96 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

97 error ("Stack overflow in regexp matcher");

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

98 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

99

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

100 #ifdef __STDC__

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

101 #define CONST const

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

102 #else

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

103 #define CONST

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

104 #endif

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

105

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

106 /* Compile a regexp and signal a Lisp error if anything goes wrong.

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

107 PATTERN is the pattern to compile.

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

108 CP is the place to put the result.

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

109 TRANSLATE is a translation table for ignoring case, or nil for none.

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

110 REGP is the structure that says where to store the "register"

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

111 values that will result from matching this pattern.

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

112 If it is 0, we should compile the pattern not to record any

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

113 subexpression bounds.

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

114 POSIX is nonzero if we want full backtracking (POSIX style)

17053

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

115 for this pattern. 0 means backtrack only enough to get a valid match.

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

116 MULTIBYTE is nonzero if we want to handle multibyte characters in

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

117 PATTERN. 0 means all multibyte characters are recognized just as

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

118 sequences of binary data. */

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

119

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

120 static void

17053

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

121 compile_pattern_1 (cp, pattern, translate, regp, posix, multibyte)

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

122 struct regexp_cache *cp;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

123 Lisp_Object pattern;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

124 Lisp_Object translate;

708

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

125 struct re_registers *regp;

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

126 int posix;

17053

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

127 int multibyte;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

128 {

21915

8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern.

Richard M. Stallman <rms@gnu.org>

parents: 21887

diff changeset

129 unsigned char *raw_pattern;

20671

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

130 int raw_pattern_size;

18762

12c0de0113af (compile_pattern_1): Don't declare val with CONST.

Richard M. Stallman <rms@gnu.org>

parents: 18193

diff changeset

131 char *val;

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

132 reg_syntax_t old;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

133

20671

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

134 /* MULTIBYTE says whether the text to be searched is multibyte.

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

135 We must convert PATTERN to match that, or we will not really

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

136 find things right. */

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

137

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

138 if (multibyte == STRING_MULTIBYTE (pattern))

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

139 {

21915

8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern.

Richard M. Stallman <rms@gnu.org>

parents: 21887

diff changeset

140 raw_pattern = (unsigned char *) XSTRING (pattern)->data;

21244

50929073a0ba Use STRING_BYTES and SET_STRING_BYTES.

Richard M. Stallman <rms@gnu.org>

parents: 21171

diff changeset

141 raw_pattern_size = STRING_BYTES (XSTRING (pattern));

20671

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

142 }

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

143 else if (multibyte)

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

144 {

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

145 raw_pattern_size = count_size_as_multibyte (XSTRING (pattern)->data,

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

146 XSTRING (pattern)->size);

21915

8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern.

Richard M. Stallman <rms@gnu.org>

parents: 21887

diff changeset

147 raw_pattern = (unsigned char *) alloca (raw_pattern_size + 1);

20671

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

148 copy_text (XSTRING (pattern)->data, raw_pattern,

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

149 XSTRING (pattern)->size, 0, 1);

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

150 }

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

151 else

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

152 {

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

153 /* Converting multibyte to single-byte.

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

154

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

155 ??? Perhaps this conversion should be done in a special way

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

156 by subtracting nonascii-insert-offset from each non-ASCII char,

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

157 so that only the multibyte chars which really correspond to

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

158 the chosen single-byte character set can possibly match. */

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

159 raw_pattern_size = XSTRING (pattern)->size;

21915

8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern.

Richard M. Stallman <rms@gnu.org>

parents: 21887

diff changeset

160 raw_pattern = (unsigned char *) alloca (raw_pattern_size + 1);

20671

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

161 copy_text (XSTRING (pattern)->data, raw_pattern,

21244

50929073a0ba Use STRING_BYTES and SET_STRING_BYTES.

Richard M. Stallman <rms@gnu.org>

parents: 21171

diff changeset

162 STRING_BYTES (XSTRING (pattern)), 1, 0);

20671

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

163 }

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

164

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

165 cp->regexp = Qnil;

21531

5811a3129878 (compile_pattern, compile_pattern_1): Fix mixing of

Andreas Schwab <schwab@suse.de>

parents: 21514

diff changeset

166 cp->buf.translate = (! NILP (translate) ? translate : make_number (0));

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

167 cp->posix = posix;

17053

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

168 cp->buf.multibyte = multibyte;

2439

b6c62e4abf59 Put interrupt input blocking in a separate file from xterm.h.

Jim Blandy <jimb@redhat.com>

parents: 2393

diff changeset

169 BLOCK_INPUT;

25441

d30cff97fb20 (compile_pattern_1): Enable RE_CHAR_CLASSES for regexp.

Richard M. Stallman <rms@gnu.org>

parents: 24716

diff changeset

170 old = re_set_syntax (RE_SYNTAX_EMACS | RE_CHAR_CLASSES

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

171 | (posix ? 0 : RE_NO_POSIX_BACKTRACKING));

21915

8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern.

Richard M. Stallman <rms@gnu.org>

parents: 21887

diff changeset

172 val = (char *) re_compile_pattern ((char *)raw_pattern,

8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern.

Richard M. Stallman <rms@gnu.org>

parents: 21887

diff changeset

173 raw_pattern_size, &cp->buf);

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

174 re_set_syntax (old);

2439

b6c62e4abf59 Put interrupt input blocking in a separate file from xterm.h.

Jim Blandy <jimb@redhat.com>

parents: 2393

diff changeset

175 UNBLOCK_INPUT;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

176 if (val)

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

177 Fsignal (Qinvalid_regexp, Fcons (build_string (val), Qnil));

708

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

178

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

179 cp->regexp = Fcopy_sequence (pattern);

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

180 }

708

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

181

22221

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

182 /* Shrink each compiled regexp buffer in the cache

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

183 to the size actually used right now.

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

184 This is called from garbage collection. */

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

185

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

186 void

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

187 shrink_regexp_cache ()

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

188 {

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

189 struct regexp_cache *cp, **cpp;

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

190

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

191 for (cp = searchbuf_head; cp != 0; cp = cp->next)

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

192 {

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

193 cp->buf.allocated = cp->buf.used;

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

194 cp->buf.buffer

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

195 = (unsigned char *) realloc (cp->buf.buffer, cp->buf.used);

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

196 }

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

197 }

239a4b800303 (shrink_regexp_cache): New function.

Richard M. Stallman <rms@gnu.org>

parents: 22082

diff changeset

198

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

199 /* Compile a regexp if necessary, but first check to see if there's one in

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

200 the cache.

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

201 PATTERN is the pattern to compile.

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

202 TRANSLATE is a translation table for ignoring case, or nil for none.

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

203 REGP is the structure that says where to store the "register"

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

204 values that will result from matching this pattern.

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

205 If it is 0, we should compile the pattern not to record any

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

206 subexpression bounds.

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

207 POSIX is nonzero if we want full backtracking (POSIX style)

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

208 for this pattern. 0 means backtrack only enough to get a valid match. */

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

209

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

210 struct re_pattern_buffer *

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

211 compile_pattern (pattern, regp, translate, posix, multibyte)

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

212 Lisp_Object pattern;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

213 struct re_registers *regp;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

214 Lisp_Object translate;

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

215 int posix, multibyte;

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

216 {

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

217 struct regexp_cache *cp, **cpp;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

218

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

219 for (cpp = &searchbuf_head; ; cpp = &cp->next)

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

220 {

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

221 cp = *cpp;

16275

a4bcfdc9bb66 (REGEXP_CACHE_SIZE): Increase to 20.

Richard M. Stallman <rms@gnu.org>

parents: 16152

diff changeset

222 if (XSTRING (cp->regexp)->size == XSTRING (pattern)->size

a4bcfdc9bb66 (REGEXP_CACHE_SIZE): Increase to 20.

Richard M. Stallman <rms@gnu.org>

parents: 16152

diff changeset

223 && !NILP (Fstring_equal (cp->regexp, pattern))

21531

5811a3129878 (compile_pattern, compile_pattern_1): Fix mixing of

Andreas Schwab <schwab@suse.de>

parents: 21514

diff changeset

224 && EQ (cp->buf.translate, (! NILP (translate) ? translate : make_number (0)))

17053

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

225 && cp->posix == posix

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

226 && cp->buf.multibyte == multibyte)

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

227 break;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

228

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

229 /* If we're at the end of the cache, compile into the last cell. */

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

230 if (cp->next == 0)

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

231 {

17053

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

232 compile_pattern_1 (cp, pattern, translate, regp, posix, multibyte);

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

233 break;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

234 }

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

235 }

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

236

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

237 /* When we get here, cp (aka *cpp) contains the compiled pattern,

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

238 either because we found it in the cache or because we just compiled it.

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

239 Move it to the front of the queue to mark it as most recently used. */

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

240 *cpp = cp->next;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

241 cp->next = searchbuf_head;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

242 searchbuf_head = cp;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

243

10141

afe81fd385eb (compile_pattern): Call re_set_registers here.

Richard M. Stallman <rms@gnu.org>

parents: 10128

diff changeset

244 /* Advise the searching functions about the space we have allocated

afe81fd385eb (compile_pattern): Call re_set_registers here.

Richard M. Stallman <rms@gnu.org>

parents: 10128

diff changeset

245 for register data. */

afe81fd385eb (compile_pattern): Call re_set_registers here.

Richard M. Stallman <rms@gnu.org>

parents: 10128

diff changeset

246 if (regp)

afe81fd385eb (compile_pattern): Call re_set_registers here.

Richard M. Stallman <rms@gnu.org>

parents: 10128

diff changeset

247 re_set_registers (&cp->buf, regp, regp->num_regs, regp->start, regp->end);

afe81fd385eb (compile_pattern): Call re_set_registers here.

Richard M. Stallman <rms@gnu.org>

parents: 10128

diff changeset

248

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

249 return &cp->buf;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

250 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

251

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

252 /* Error condition used for failing searches */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

253 Lisp_Object Qsearch_failed;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

254

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

255 Lisp_Object

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

256 signal_failure (arg)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

257 Lisp_Object arg;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

258 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

259 Fsignal (Qsearch_failed, Fcons (arg, Qnil));

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

260 return Qnil;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

261 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

262

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

263 static Lisp_Object

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

264 looking_at_1 (string, posix)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

265 Lisp_Object string;

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

266 int posix;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

267 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

268 Lisp_Object val;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

269 unsigned char *p1, *p2;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

270 int s1, s2;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

271 register int i;

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

272 struct re_pattern_buffer *bufp;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

273

10032

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

274 if (running_asynch_code)

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

275 save_search_regs ();

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

276

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

277 CHECK_STRING (string, 0);

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

278 bufp = compile_pattern (string, &search_regs,

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

279 (!NILP (current_buffer->case_fold_search)

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

280 ? DOWNCASE_TABLE : Qnil),

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

281 posix,

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

282 !NILP (current_buffer->enable_multibyte_characters));

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

283

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

284 immediate_quit = 1;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

285 QUIT; /* Do a pending quit right away, to avoid paradoxical behavior */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

286

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

287 /* Get pointers and sizes of the two strings

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

288 that make up the visible portion of the buffer. */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

289

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

290 p1 = BEGV_ADDR;

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

291 s1 = GPT_BYTE - BEGV_BYTE;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

292 p2 = GAP_END_ADDR;

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

293 s2 = ZV_BYTE - GPT_BYTE;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

294 if (s1 < 0)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

295 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

296 p2 = p1;

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

297 s2 = ZV_BYTE - BEGV_BYTE;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

298 s1 = 0;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

299 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

300 if (s2 < 0)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

301 {

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

302 s1 = ZV_BYTE - BEGV_BYTE;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

303 s2 = 0;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

304 }

17463

bb9ae80d22e2 (looking_at_1): Set re_match_object.

Richard M. Stallman <rms@gnu.org>

parents: 17284

diff changeset

305

bb9ae80d22e2 (looking_at_1): Set re_match_object.

Richard M. Stallman <rms@gnu.org>

parents: 17284

diff changeset

306 re_match_object = Qnil;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

307

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

308 i = re_match_2 (bufp, (char *) p1, s1, (char *) p2, s2,

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

309 PT_BYTE - BEGV_BYTE, &search_regs,

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

310 ZV_BYTE - BEGV_BYTE);

26985

1121a5da20a5 (looking_at_1): Reset immediate_quit before modifying

Gerd Moellmann <gerd@gnu.org>

parents: 26982

diff changeset

311 immediate_quit = 0;

1121a5da20a5 (looking_at_1): Reset immediate_quit before modifying

Gerd Moellmann <gerd@gnu.org>

parents: 26982

diff changeset

312

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

313 if (i == -2)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

314 matcher_overflow ();

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

315

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

316 val = (0 <= i ? Qt : Qnil);

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

317 if (i >= 0)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

318 for (i = 0; i < search_regs.num_regs; i++)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

319 if (search_regs.start[i] >= 0)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

320 {

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

321 search_regs.start[i]

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

322 = BYTE_TO_CHAR (search_regs.start[i] + BEGV_BYTE);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

323 search_regs.end[i]

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

324 = BYTE_TO_CHAR (search_regs.end[i] + BEGV_BYTE);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

325 }

9278

f2138d548313 (Flooking_at, skip_chars, search_buffer, set_search_regs, Fstore_match_data):

Karl Heuer <kwzh@gnu.org>

parents: 9113

diff changeset

326 XSETBUFFER (last_thing_searched, current_buffer);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

327 return val;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

328 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

329

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

330 DEFUN ("looking-at", Flooking_at, Slooking_at, 1, 1, 0,

11213

d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name.

Richard M. Stallman <rms@gnu.org>

parents: 10250

diff changeset

331 "Return t if text after point matches regular expression REGEXP.\n\

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

332 This function modifies the match data that `match-beginning',\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

333 `match-end' and `match-data' access; save and restore the match\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

334 data if you want to preserve them.")

11213

d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name.

Richard M. Stallman <rms@gnu.org>

parents: 10250

diff changeset

335 (regexp)

d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name.

Richard M. Stallman <rms@gnu.org>

parents: 10250

diff changeset

336 Lisp_Object regexp;

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

337 {

11213

d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name.

Richard M. Stallman <rms@gnu.org>

parents: 10250

diff changeset

338 return looking_at_1 (regexp, 0);

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

339 }

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

340

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

341 DEFUN ("posix-looking-at", Fposix_looking_at, Sposix_looking_at, 1, 1, 0,

11213

d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name.

Richard M. Stallman <rms@gnu.org>

parents: 10250

diff changeset

342 "Return t if text after point matches regular expression REGEXP.\n\

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

343 Find the longest match, in accord with Posix regular expression rules.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

344 This function modifies the match data that `match-beginning',\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

345 `match-end' and `match-data' access; save and restore the match\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

346 data if you want to preserve them.")

11213

d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name.

Richard M. Stallman <rms@gnu.org>

parents: 10250

diff changeset

347 (regexp)

d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name.

Richard M. Stallman <rms@gnu.org>

parents: 10250

diff changeset

348 Lisp_Object regexp;

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

349 {

11213

d0811ba886f8 (Flooking_at, Fposix_looking_at): Change arg name.

Richard M. Stallman <rms@gnu.org>

parents: 10250

diff changeset

350 return looking_at_1 (regexp, 1);

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

351 }

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

352

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

353 static Lisp_Object

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

354 string_match_1 (regexp, string, start, posix)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

355 Lisp_Object regexp, string, start;

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

356 int posix;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

357 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

358 int val;

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

359 struct re_pattern_buffer *bufp;

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

360 int pos, pos_byte;

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

361 int i;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

362

10032

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

363 if (running_asynch_code)

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

364 save_search_regs ();

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

365

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

366 CHECK_STRING (regexp, 0);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

367 CHECK_STRING (string, 1);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

368

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

369 if (NILP (start))

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

370 pos = 0, pos_byte = 0;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

371 else

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

372 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

373 int len = XSTRING (string)->size;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

374

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

375 CHECK_NUMBER (start, 2);

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

376 pos = XINT (start);

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

377 if (pos < 0 && -pos <= len)

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

378 pos = len + pos;

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

379 else if (0 > pos || pos > len)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

380 args_out_of_range (string, start);

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

381 pos_byte = string_char_to_byte (string, pos);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

382 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

383

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

384 bufp = compile_pattern (regexp, &search_regs,

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

385 (!NILP (current_buffer->case_fold_search)

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

386 ? DOWNCASE_TABLE : Qnil),

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

387 posix,

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

388 STRING_MULTIBYTE (string));

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

389 immediate_quit = 1;

17463

bb9ae80d22e2 (looking_at_1): Set re_match_object.

Richard M. Stallman <rms@gnu.org>

parents: 17284

diff changeset

390 re_match_object = string;

bb9ae80d22e2 (looking_at_1): Set re_match_object.

Richard M. Stallman <rms@gnu.org>

parents: 17284

diff changeset

391

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

392 val = re_search (bufp, (char *) XSTRING (string)->data,

21244

50929073a0ba Use STRING_BYTES and SET_STRING_BYTES.

Richard M. Stallman <rms@gnu.org>

parents: 21171

diff changeset

393 STRING_BYTES (XSTRING (string)), pos_byte,

50929073a0ba Use STRING_BYTES and SET_STRING_BYTES.

Richard M. Stallman <rms@gnu.org>

parents: 21171

diff changeset

394 STRING_BYTES (XSTRING (string)) - pos_byte,

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

395 &search_regs);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

396 immediate_quit = 0;

727

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

397 last_thing_searched = Qt;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

398 if (val == -2)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

399 matcher_overflow ();

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

400 if (val < 0) return Qnil;

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

401

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

402 for (i = 0; i < search_regs.num_regs; i++)

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

403 if (search_regs.start[i] >= 0)

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

404 {

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

405 search_regs.start[i]

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

406 = string_byte_to_char (string, search_regs.start[i]);

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

407 search_regs.end[i]

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

408 = string_byte_to_char (string, search_regs.end[i]);

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

409 }

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

410

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

411 return make_number (string_byte_to_char (string, val));

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

412 }

842

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

413

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

414 DEFUN ("string-match", Fstring_match, Sstring_match, 2, 3, 0,

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

415 "Return index of start of first match for REGEXP in STRING, or nil.\n\

24433

118e66d79d64 (Fstring_match, Fposix_string_match): Doc fix.

Karl Heuer <kwzh@gnu.org>

parents: 24014

diff changeset

416 Case is ignored if `case-fold-search' is non-nil in the current buffer.\n\

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

417 If third arg START is non-nil, start search at that index in STRING.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

418 For index of first char beyond the match, do (match-end 0).\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

419 `match-end' and `match-beginning' also give indices of substrings\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

420 matched by parenthesis constructs in the pattern.")

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

421 (regexp, string, start)

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

422 Lisp_Object regexp, string, start;

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

423 {

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

424 return string_match_1 (regexp, string, start, 0);

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

425 }

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

426

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

427 DEFUN ("posix-string-match", Fposix_string_match, Sposix_string_match, 2, 3, 0,

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

428 "Return index of start of first match for REGEXP in STRING, or nil.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

429 Find the longest match, in accord with Posix regular expression rules.\n\

24433

118e66d79d64 (Fstring_match, Fposix_string_match): Doc fix.

Karl Heuer <kwzh@gnu.org>

parents: 24014

diff changeset

430 Case is ignored if `case-fold-search' is non-nil in the current buffer.\n\

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

431 If third arg START is non-nil, start search at that index in STRING.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

432 For index of first char beyond the match, do (match-end 0).\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

433 `match-end' and `match-beginning' also give indices of substrings\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

434 matched by parenthesis constructs in the pattern.")

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

435 (regexp, string, start)

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

436 Lisp_Object regexp, string, start;

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

437 {

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

438 return string_match_1 (regexp, string, start, 1);

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

439 }

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

440

842

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

441 /* Match REGEXP against STRING, searching all of STRING,

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

442 and return the index of the match, or negative on failure.

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

443 This does not clobber the match data. */

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

444

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

445 int

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

446 fast_string_match (regexp, string)

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

447 Lisp_Object regexp, string;

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

448 {

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

449 int val;

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

450 struct re_pattern_buffer *bufp;

842

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

451

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

452 bufp = compile_pattern (regexp, 0, Qnil,

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

453 0, STRING_MULTIBYTE (string));

842

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

454 immediate_quit = 1;

17463

bb9ae80d22e2 (looking_at_1): Set re_match_object.

Richard M. Stallman <rms@gnu.org>

parents: 17284

diff changeset

455 re_match_object = string;

bb9ae80d22e2 (looking_at_1): Set re_match_object.

Richard M. Stallman <rms@gnu.org>

parents: 17284

diff changeset

456

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

457 val = re_search (bufp, (char *) XSTRING (string)->data,

21244

50929073a0ba Use STRING_BYTES and SET_STRING_BYTES.

Richard M. Stallman <rms@gnu.org>

parents: 21171

diff changeset

458 STRING_BYTES (XSTRING (string)), 0,

50929073a0ba Use STRING_BYTES and SET_STRING_BYTES.

Richard M. Stallman <rms@gnu.org>

parents: 21171

diff changeset

459 STRING_BYTES (XSTRING (string)), 0);

842

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

460 immediate_quit = 0;

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

461 return val;

5ce0a9ac1ea7 entered into RCS

Richard M. Stallman <rms@gnu.org>

parents: 808

diff changeset

462 }

17053

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

463

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

464 /* Match REGEXP against STRING, searching all of STRING ignoring case,

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

465 and return the index of the match, or negative on failure.

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

466 This does not clobber the match data.

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

467 We assume that STRING contains single-byte characters. */

17053

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

468

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

469 extern Lisp_Object Vascii_downcase_table;

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

470

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

471 int

18193

4e4c8edb56da (fast_c_string_match_ignore_case):

Richard M. Stallman <rms@gnu.org>

parents: 18124

diff changeset

472 fast_c_string_match_ignore_case (regexp, string)

17053

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

473 Lisp_Object regexp;

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

474 char *string;

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

475 {

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

476 int val;

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

477 struct re_pattern_buffer *bufp;

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

478 int len = strlen (string);

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

479

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

480 regexp = string_make_unibyte (regexp);

18193

4e4c8edb56da (fast_c_string_match_ignore_case):

Richard M. Stallman <rms@gnu.org>

parents: 18124

diff changeset

481 re_match_object = Qt;

17053

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

482 bufp = compile_pattern (regexp, 0,

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

483 Vascii_downcase_table, 0,

20671

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

484 0);

17053

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

485 immediate_quit = 1;

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

486 val = re_search (bufp, string, len, 0, len, 0);

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

487 immediate_quit = 0;

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

488 return val;

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

489 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

490

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

491 /* The newline cache: remembering which sections of text have no newlines. */

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

492

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

493 /* If the user has requested newline caching, make sure it's on.

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

494 Otherwise, make sure it's off.

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

495 This is our cheezy way of associating an action with the change of

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

496 state of a buffer-local variable. */

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

497 static void

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

498 newline_cache_on_off (buf)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

499 struct buffer *buf;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

500 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

501 if (NILP (buf->cache_long_line_scans))

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

502 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

503 /* It should be off. */

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

504 if (buf->newline_cache)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

505 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

506 free_region_cache (buf->newline_cache);

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

507 buf->newline_cache = 0;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

508 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

509 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

510 else

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

511 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

512 /* It should be on. */

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

513 if (buf->newline_cache == 0)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

514 buf->newline_cache = new_region_cache ();

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

515 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

516 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

517

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

518

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

519 /* Search for COUNT instances of the character TARGET between START and END.

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

520

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

521 If COUNT is positive, search forwards; END must be >= START.

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

522 If COUNT is negative, search backwards for the -COUNTth instance;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

523 END must be <= START.

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

524 If COUNT is zero, do anything you please; run rogue, for all I care.

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

525

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

526 If END is zero, use BEGV or ZV instead, as appropriate for the

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

527 direction indicated by COUNT.

648

70b112526394 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 639

diff changeset

528

70b112526394 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 639

diff changeset

529 If we find COUNT instances, set *SHORTAGE to zero, and return the

1413

527af9fa8676 Comment fix.

Richard M. Stallman <rms@gnu.org>

parents: 842

diff changeset

530 position after the COUNTth match. Note that for reverse motion

527af9fa8676 Comment fix.

Richard M. Stallman <rms@gnu.org>

parents: 842

diff changeset

531 this is not the same as the usual convention for Emacs motion commands.

648

70b112526394 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 639

diff changeset

532

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

533 If we don't find COUNT instances before reaching END, set *SHORTAGE

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

534 to the number of TARGETs left unfound, and return END.

648

70b112526394 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 639

diff changeset

535

5756

a54c236b43c6 (scan_buffer): New arg ALLOW_QUIT.

Richard M. Stallman <rms@gnu.org>

parents: 5556

diff changeset

536 If ALLOW_QUIT is non-zero, set immediate_quit. That's good to do

a54c236b43c6 (scan_buffer): New arg ALLOW_QUIT.

Richard M. Stallman <rms@gnu.org>

parents: 5556

diff changeset

537 except when inside redisplay. */

a54c236b43c6 (scan_buffer): New arg ALLOW_QUIT.

Richard M. Stallman <rms@gnu.org>

parents: 5556

diff changeset

538

21514

fa9ff387d260 Fix -Wimplicit warnings.

Andreas Schwab <schwab@suse.de>

parents: 21457

diff changeset

539 int

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

540 scan_buffer (target, start, end, count, shortage, allow_quit)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

541 register int target;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

542 int start, end;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

543 int count;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

544 int *shortage;

5756

a54c236b43c6 (scan_buffer): New arg ALLOW_QUIT.

Richard M. Stallman <rms@gnu.org>

parents: 5556

diff changeset

545 int allow_quit;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

546 {

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

547 struct region_cache *newline_cache;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

548 int direction;

648

70b112526394 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 639

diff changeset

549

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

550 if (count > 0)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

551 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

552 direction = 1;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

553 if (! end) end = ZV;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

554 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

555 else

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

556 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

557 direction = -1;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

558 if (! end) end = BEGV;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

559 }

648

70b112526394 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 639

diff changeset

560

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

561 newline_cache_on_off (current_buffer);

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

562 newline_cache = current_buffer->newline_cache;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

563

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

564 if (shortage != 0)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

565 *shortage = 0;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

566

5756

a54c236b43c6 (scan_buffer): New arg ALLOW_QUIT.

Richard M. Stallman <rms@gnu.org>

parents: 5556

diff changeset

567 immediate_quit = allow_quit;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

568

648

70b112526394 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 639

diff changeset

569 if (count > 0)

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

570 while (start != end)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

571 {

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

572 /* Our innermost scanning loop is very simple; it doesn't know

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

573 about gaps, buffer ends, or the newline cache. ceiling is

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

574 the position of the last character before the next such

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

575 obstacle --- the last character the dumb search loop should

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

576 examine. */

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

577 int ceiling_byte = CHAR_TO_BYTE (end) - 1;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

578 int start_byte = CHAR_TO_BYTE (start);

21457

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

579 int tem;

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

580

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

581 /* If we're looking for a newline, consult the newline cache

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

582 to see where we can avoid some scanning. */

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

583 if (target == '\n' && newline_cache)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

584 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

585 int next_change;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

586 immediate_quit = 0;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

587 while (region_cache_forward

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

588 (current_buffer, newline_cache, start_byte, &next_change))

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

589 start_byte = next_change;

9452

76f75b9091f1 (scan_buffer): After temporarily turning immediate_quit off, turn it

Jim Blandy <jimb@redhat.com>

parents: 9410

diff changeset

590 immediate_quit = allow_quit;

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

591

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

592 /* START should never be after END. */

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

593 if (start_byte > ceiling_byte)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

594 start_byte = ceiling_byte;

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

595

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

596 /* Now the text after start is an unknown region, and

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

597 next_change is the position of the next known region. */

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

598 ceiling_byte = min (next_change - 1, ceiling_byte);

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

599 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

600

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

601 /* The dumb loop can only scan text stored in contiguous

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

602 bytes. BUFFER_CEILING_OF returns the last character

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

603 position that is contiguous, so the ceiling is the

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

604 position after that. */

21457

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

605 tem = BUFFER_CEILING_OF (start_byte);

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

606 ceiling_byte = min (tem, ceiling_byte);

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

607

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

608 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

609 /* The termination address of the dumb loop. */

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

610 register unsigned char *ceiling_addr

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

611 = BYTE_POS_ADDR (ceiling_byte) + 1;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

612 register unsigned char *cursor

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

613 = BYTE_POS_ADDR (start_byte);

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

614 unsigned char *base = cursor;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

615

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

616 while (cursor < ceiling_addr)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

617 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

618 unsigned char *scan_start = cursor;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

619

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

620 /* The dumb loop. */

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

621 while (*cursor != target && ++cursor < ceiling_addr)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

622 ;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

623

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

624 /* If we're looking for newlines, cache the fact that

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

625 the region from start to cursor is free of them. */

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

626 if (target == '\n' && newline_cache)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

627 know_region_cache (current_buffer, newline_cache,

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

628 start_byte + scan_start - base,

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

629 start_byte + cursor - base);

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

630

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

631 /* Did we find the target character? */

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

632 if (cursor < ceiling_addr)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

633 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

634 if (--count == 0)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

635 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

636 immediate_quit = 0;

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

637 return BYTE_TO_CHAR (start_byte + cursor - base + 1);

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

638 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

639 cursor++;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

640 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

641 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

642

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

643 start = BYTE_TO_CHAR (start_byte + cursor - base);

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

644 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

645 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

646 else

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

647 while (start > end)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

648 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

649 /* The last character to check before the next obstacle. */

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

650 int ceiling_byte = CHAR_TO_BYTE (end);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

651 int start_byte = CHAR_TO_BYTE (start);

21457

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

652 int tem;

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

653

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

654 /* Consult the newline cache, if appropriate. */

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

655 if (target == '\n' && newline_cache)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

656 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

657 int next_change;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

658 immediate_quit = 0;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

659 while (region_cache_backward

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

660 (current_buffer, newline_cache, start_byte, &next_change))

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

661 start_byte = next_change;

9452

76f75b9091f1 (scan_buffer): After temporarily turning immediate_quit off, turn it

Jim Blandy <jimb@redhat.com>

parents: 9410

diff changeset

662 immediate_quit = allow_quit;

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

663

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

664 /* Start should never be at or before end. */

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

665 if (start_byte <= ceiling_byte)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

666 start_byte = ceiling_byte + 1;

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

667

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

668 /* Now the text before start is an unknown region, and

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

669 next_change is the position of the next known region. */

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

670 ceiling_byte = max (next_change, ceiling_byte);

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

671 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

672

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

673 /* Stop scanning before the gap. */

21457

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

674 tem = BUFFER_FLOOR_OF (start_byte - 1);

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

675 ceiling_byte = max (tem, ceiling_byte);

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

676

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

677 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

678 /* The termination address of the dumb loop. */

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

679 register unsigned char *ceiling_addr = BYTE_POS_ADDR (ceiling_byte);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

680 register unsigned char *cursor = BYTE_POS_ADDR (start_byte - 1);

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

681 unsigned char *base = cursor;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

682

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

683 while (cursor >= ceiling_addr)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

684 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

685 unsigned char *scan_start = cursor;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

686

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

687 while (*cursor != target && --cursor >= ceiling_addr)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

688 ;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

689

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

690 /* If we're looking for newlines, cache the fact that

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

691 the region from after the cursor to start is free of them. */

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

692 if (target == '\n' && newline_cache)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

693 know_region_cache (current_buffer, newline_cache,

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

694 start_byte + cursor - base,

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

695 start_byte + scan_start - base);

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

696

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

697 /* Did we find the target character? */

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

698 if (cursor >= ceiling_addr)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

699 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

700 if (++count >= 0)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

701 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

702 immediate_quit = 0;

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

703 return BYTE_TO_CHAR (start_byte + cursor - base);

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

704 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

705 cursor--;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

706 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

707 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

708

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

709 start = BYTE_TO_CHAR (start_byte + cursor - base);

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

710 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

711 }

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

712

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

713 immediate_quit = 0;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

714 if (shortage != 0)

648

70b112526394 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 639

diff changeset

715 *shortage = count * direction;

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

716 return start;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

717 }

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

718

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

719 /* Search for COUNT instances of a line boundary, which means either a

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

720 newline or (if selective display enabled) a carriage return.

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

721 Start at START. If COUNT is negative, search backwards.

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

722

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

723 We report the resulting position by calling TEMP_SET_PT_BOTH.

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

724

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

725 If we find COUNT instances. we position after (always after,

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

726 even if scanning backwards) the COUNTth match, and return 0.

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

727

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

728 If we don't find COUNT instances before reaching the end of the

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

729 buffer (or the beginning, if scanning backwards), we return

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

730 the number of line boundaries left unfound, and position at

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

731 the limit we bumped up against.

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

732

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

733 If ALLOW_QUIT is non-zero, set immediate_quit. That's good to do

20547

07053199a368 (scan_newline): Always restore prev value of immediate_quit.

Richard M. Stallman <rms@gnu.org>

parents: 20545

diff changeset

734 except in special cases. */

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

735

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

736 int

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

737 scan_newline (start, start_byte, limit, limit_byte, count, allow_quit)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

738 int start, start_byte;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

739 int limit, limit_byte;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

740 register int count;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

741 int allow_quit;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

742 {

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

743 int direction = ((count > 0) ? 1 : -1);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

744

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

745 register unsigned char *cursor;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

746 unsigned char *base;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

747

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

748 register int ceiling;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

749 register unsigned char *ceiling_addr;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

750

20547

07053199a368 (scan_newline): Always restore prev value of immediate_quit.

Richard M. Stallman <rms@gnu.org>

parents: 20545

diff changeset

751 int old_immediate_quit = immediate_quit;

07053199a368 (scan_newline): Always restore prev value of immediate_quit.

Richard M. Stallman <rms@gnu.org>

parents: 20545

diff changeset

752

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

753 /* If we are not in selective display mode,

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

754 check only for newlines. */

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

755 int selective_display = (!NILP (current_buffer->selective_display)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

756 && !INTEGERP (current_buffer->selective_display));

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

757

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

758 /* The code that follows is like scan_buffer

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

759 but checks for either newline or carriage return. */

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

760

20547

07053199a368 (scan_newline): Always restore prev value of immediate_quit.

Richard M. Stallman <rms@gnu.org>

parents: 20545

diff changeset

761 if (allow_quit)

07053199a368 (scan_newline): Always restore prev value of immediate_quit.

Richard M. Stallman <rms@gnu.org>

parents: 20545

diff changeset

762 immediate_quit++;

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

763

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

764 start_byte = CHAR_TO_BYTE (start);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

765

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

766 if (count > 0)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

767 {

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

768 while (start_byte < limit_byte)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

769 {

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

770 ceiling = BUFFER_CEILING_OF (start_byte);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

771 ceiling = min (limit_byte - 1, ceiling);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

772 ceiling_addr = BYTE_POS_ADDR (ceiling) + 1;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

773 base = (cursor = BYTE_POS_ADDR (start_byte));

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

774 while (1)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

775 {

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

776 while (*cursor != '\n' && ++cursor != ceiling_addr)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

777 ;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

778

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

779 if (cursor != ceiling_addr)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

780 {

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

781 if (--count == 0)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

782 {

20547

07053199a368 (scan_newline): Always restore prev value of immediate_quit.

Richard M. Stallman <rms@gnu.org>

parents: 20545

diff changeset

783 immediate_quit = old_immediate_quit;

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

784 start_byte = start_byte + cursor - base + 1;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

785 start = BYTE_TO_CHAR (start_byte);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

786 TEMP_SET_PT_BOTH (start, start_byte);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

787 return 0;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

788 }

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

789 else

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

790 if (++cursor == ceiling_addr)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

791 break;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

792 }

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

793 else

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

794 break;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

795 }

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

796 start_byte += cursor - base;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

797 }

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

798 }

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

799 else

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

800 {

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

801 while (start_byte > limit_byte)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

802 {

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

803 ceiling = BUFFER_FLOOR_OF (start_byte - 1);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

804 ceiling = max (limit_byte, ceiling);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

805 ceiling_addr = BYTE_POS_ADDR (ceiling) - 1;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

806 base = (cursor = BYTE_POS_ADDR (start_byte - 1) + 1);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

807 while (1)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

808 {

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

809 while (--cursor != ceiling_addr && *cursor != '\n')

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

810 ;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

811

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

812 if (cursor != ceiling_addr)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

813 {

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

814 if (++count == 0)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

815 {

20547

07053199a368 (scan_newline): Always restore prev value of immediate_quit.

Richard M. Stallman <rms@gnu.org>

parents: 20545

diff changeset

816 immediate_quit = old_immediate_quit;

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

817 /* Return the position AFTER the match we found. */

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

818 start_byte = start_byte + cursor - base + 1;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

819 start = BYTE_TO_CHAR (start_byte);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

820 TEMP_SET_PT_BOTH (start, start_byte);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

821 return 0;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

822 }

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

823 }

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

824 else

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

825 break;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

826 }

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

827 /* Here we add 1 to compensate for the last decrement

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

828 of CURSOR, which took it past the valid range. */

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

829 start_byte += cursor - base + 1;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

830 }

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

831 }

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

832

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

833 TEMP_SET_PT_BOTH (limit, limit_byte);

20547

07053199a368 (scan_newline): Always restore prev value of immediate_quit.

Richard M. Stallman <rms@gnu.org>

parents: 20545

diff changeset

834 immediate_quit = old_immediate_quit;

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

835

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

836 return count * direction;

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

837 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

838

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

839 int

7891

7d8e0f338e4a (find_next_newline_no_quit): New function.

Richard M. Stallman <rms@gnu.org>

parents: 7856

diff changeset

840 find_next_newline_no_quit (from, cnt)

7d8e0f338e4a (find_next_newline_no_quit): New function.

Richard M. Stallman <rms@gnu.org>

parents: 7856

diff changeset

841 register int from, cnt;

7d8e0f338e4a (find_next_newline_no_quit): New function.

Richard M. Stallman <rms@gnu.org>

parents: 7856

diff changeset

842 {

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

843 return scan_buffer ('\n', from, 0, cnt, (int *) 0, 0);

7891

7d8e0f338e4a (find_next_newline_no_quit): New function.

Richard M. Stallman <rms@gnu.org>

parents: 7856

diff changeset

844 }

7d8e0f338e4a (find_next_newline_no_quit): New function.

Richard M. Stallman <rms@gnu.org>

parents: 7856

diff changeset

845

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

846 /* Like find_next_newline, but returns position before the newline,

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

847 not after, and only search up to TO. This isn't just

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

848 find_next_newline (...)-1, because you might hit TO. */

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

849

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

850 int

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

851 find_before_next_newline (from, to, cnt)

9452

76f75b9091f1 (scan_buffer): After temporarily turning immediate_quit off, turn it

Jim Blandy <jimb@redhat.com>

parents: 9410

diff changeset

852 int from, to, cnt;

9410

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

853 {

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

854 int shortage;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

855 int pos = scan_buffer ('\n', from, to, cnt, &shortage, 1);

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

856

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

857 if (shortage == 0)

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

858 pos--;

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

859

8598c3d6f2f0 * search.c: #include "region-cache.h".

Jim Blandy <jimb@redhat.com>

parents: 9319

diff changeset

860 return pos;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

861 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

862

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

863 /* Subroutines of Lisp buffer search functions. */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

864

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

865 static Lisp_Object

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

866 search_command (string, bound, noerror, count, direction, RE, posix)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

867 Lisp_Object string, bound, noerror, count;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

868 int direction;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

869 int RE;

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

870 int posix;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

871 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

872 register int np;

20824

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

873 int lim, lim_byte;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

874 int n = direction;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

875

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

876 if (!NILP (count))

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

877 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

878 CHECK_NUMBER (count, 3);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

879 n *= XINT (count);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

880 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

881

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

882 CHECK_STRING (string, 0);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

883 if (NILP (bound))

20824

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

884 {

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

885 if (n > 0)

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

886 lim = ZV, lim_byte = ZV_BYTE;

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

887 else

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

888 lim = BEGV, lim_byte = BEGV_BYTE;

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

889 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

890 else

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

891 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

892 CHECK_NUMBER_COERCE_MARKER (bound, 1);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

893 lim = XINT (bound);

16039

855c8d8ba0f0 Change all references from point to PT.

Karl Heuer <kwzh@gnu.org>

parents: 15667

diff changeset

894 if (n > 0 ? lim < PT : lim > PT)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

895 error ("Invalid search bound (wrong side of point)");

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

896 if (lim > ZV)

20824

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

897 lim = ZV, lim_byte = ZV_BYTE;

20924

eda7e44ef9d9 (search_command): Check LIM in valid range

Karl Heuer <kwzh@gnu.org>

parents: 20898

diff changeset

898 else if (lim < BEGV)

20824

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

899 lim = BEGV, lim_byte = BEGV_BYTE;

20924

eda7e44ef9d9 (search_command): Check LIM in valid range

Karl Heuer <kwzh@gnu.org>

parents: 20898

diff changeset

900 else

eda7e44ef9d9 (search_command): Check LIM in valid range

Karl Heuer <kwzh@gnu.org>

parents: 20898

diff changeset

901 lim_byte = CHAR_TO_BYTE (lim);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

902 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

903

20824

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

904 np = search_buffer (string, PT, PT_BYTE, lim, lim_byte, n, RE,

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

905 (!NILP (current_buffer->case_fold_search)

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

906 ? current_buffer->case_canon_table

20875

4fac9830041a (search_command): Fix call to search_buffer.

Richard M. Stallman <rms@gnu.org>

parents: 20869

diff changeset

907 : Qnil),

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

908 (!NILP (current_buffer->case_fold_search)

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

909 ? current_buffer->case_eqv_table

20875

4fac9830041a (search_command): Fix call to search_buffer.

Richard M. Stallman <rms@gnu.org>

parents: 20869

diff changeset

910 : Qnil),

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

911 posix);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

912 if (np <= 0)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

913 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

914 if (NILP (noerror))

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

915 return signal_failure (string);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

916 if (!EQ (noerror, Qt))

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

917 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

918 if (lim < BEGV || lim > ZV)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

919 abort ();

20824

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

920 SET_PT_BOTH (lim, lim_byte);

1878

1c26d0049d4f (search_command): #if 0 previous change.

Richard M. Stallman <rms@gnu.org>

parents: 1877

diff changeset

921 return Qnil;

1c26d0049d4f (search_command): #if 0 previous change.

Richard M. Stallman <rms@gnu.org>

parents: 1877

diff changeset

922 #if 0 /* This would be clean, but maybe programs depend on

1c26d0049d4f (search_command): #if 0 previous change.

Richard M. Stallman <rms@gnu.org>

parents: 1877

diff changeset

923 a value of nil here. */

1877

7786f61ec635 (search_command): When moving to LIM on failure, return LIM.

Richard M. Stallman <rms@gnu.org>

parents: 1684

diff changeset

924 np = lim;

1878

1c26d0049d4f (search_command): #if 0 previous change.

Richard M. Stallman <rms@gnu.org>

parents: 1877

diff changeset

925 #endif

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

926 }

1877

7786f61ec635 (search_command): When moving to LIM on failure, return LIM.

Richard M. Stallman <rms@gnu.org>

parents: 1684

diff changeset

927 else

7786f61ec635 (search_command): When moving to LIM on failure, return LIM.

Richard M. Stallman <rms@gnu.org>

parents: 1684

diff changeset

928 return Qnil;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

929 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

930

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

931 if (np < BEGV || np > ZV)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

932 abort ();

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

933

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

934 SET_PT (np);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

935

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

936 return make_number (np);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

937 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

938

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

939 /* Return 1 if REGEXP it matches just one constant string. */

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

940

8950

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

941 static int

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

942 trivial_regexp_p (regexp)

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

943 Lisp_Object regexp;

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

944 {

21244

50929073a0ba Use STRING_BYTES and SET_STRING_BYTES.

Richard M. Stallman <rms@gnu.org>

parents: 21171

diff changeset

945 int len = STRING_BYTES (XSTRING (regexp));

8950

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

946 unsigned char *s = XSTRING (regexp)->data;

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

947 unsigned char c;

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

948 while (--len >= 0)

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

949 {

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

950 switch (*s++)

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

951 {

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

952 case '.': case '*': case '+': case '?': case '[': case '^': case '$':

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

953 return 0;

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

954 case '\\':

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

955 if (--len < 0)

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

956 return 0;

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

957 switch (*s++)

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

958 {

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

959 case '|': case '(': case ')': case '`': case '\'': case 'b':

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

960 case 'B': case '<': case '>': case 'w': case 'W': case 's':

12069

505dc29a68cf (trivial_regexp_p): = is special after \.

Karl Heuer <kwzh@gnu.org>

parents: 11678

diff changeset

961 case 'S': case '=':

17053

df904355f033 Include category.h and charset.h.

Karl Heuer <kwzh@gnu.org>

parents: 16880

diff changeset

962 case 'c': case 'C': /* for categoryspec and notcategoryspec */

12069

505dc29a68cf (trivial_regexp_p): = is special after \.

Karl Heuer <kwzh@gnu.org>

parents: 11678

diff changeset

963 case '1': case '2': case '3': case '4': case '5':

8950

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

964 case '6': case '7': case '8': case '9':

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

965 return 0;

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

966 }

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

967 }

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

968 }

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

969 return 1;

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

970 }

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

971

5556

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

972 /* Search for the n'th occurrence of STRING in the current buffer,

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

973 starting at position POS and stopping at position LIM,

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

974 treating STRING as a literal string if RE is false or as

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

975 a regular expression if RE is true.

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

976

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

977 If N is positive, searching is forward and LIM must be greater than POS.

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

978 If N is negative, searching is backward and LIM must be less than POS.

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

979

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

980 Returns -x if x occurrences remain to be found (x > 0),

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

981 or else the position at the beginning of the Nth occurrence

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

982 (if searching backward) or the end (if searching forward).

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

983

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

984 POSIX is nonzero if we want full backtracking (POSIX style)

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

985 for this pattern. 0 means backtrack only enough to get a valid match. */

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

986

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

987 #define TRANSLATE(out, trt, d) \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

988 do \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

989 { \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

990 if (! NILP (trt)) \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

991 { \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

992 Lisp_Object temp; \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

993 temp = Faref (trt, make_number (d)); \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

994 if (INTEGERP (temp)) \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

995 out = XINT (temp); \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

996 else \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

997 out = d; \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

998 } \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

999 else \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1000 out = d; \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1001 } \

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1002 while (0)

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1003

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

1004 static int

20824

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

1005 search_buffer (string, pos, pos_byte, lim, lim_byte, n,

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

1006 RE, trt, inverse_trt, posix)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1007 Lisp_Object string;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1008 int pos;

20824

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

1009 int pos_byte;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1010 int lim;

20824

97df0c6e753d (search_buffer): New args pos_byte and lim_byte.

Richard M. Stallman <rms@gnu.org>

parents: 20792

diff changeset

1011 int lim_byte;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1012 int n;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1013 int RE;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1014 Lisp_Object trt;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1015 Lisp_Object inverse_trt;

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

1016 int posix;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1017 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1018 int len = XSTRING (string)->size;

21244

50929073a0ba Use STRING_BYTES and SET_STRING_BYTES.

Richard M. Stallman <rms@gnu.org>

parents: 21171

diff changeset

1019 int len_byte = STRING_BYTES (XSTRING (string));

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1020 register int i;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1021

10032

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

1022 if (running_asynch_code)

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

1023 save_search_regs ();

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

1024

22082

84bcdbc46d71 (search_buffer): Set search regs for all success with an empty string.

Richard M. Stallman <rms@gnu.org>

parents: 21988

diff changeset

1025 /* Searching 0 times means don't move. */

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1026 /* Null string is found at starting position. */

22082

84bcdbc46d71 (search_buffer): Set search regs for all success with an empty string.

Richard M. Stallman <rms@gnu.org>

parents: 21988

diff changeset

1027 if (len == 0 || n == 0)

5556

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1028 {

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1029 set_search_regs (pos, 0);

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1030 return pos;

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1031 }

4299

7a2e1d7362c5 (search_buffer): If n is 0, just return POS.

Richard M. Stallman <rms@gnu.org>

parents: 3615

diff changeset

1032

8950

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

1033 if (RE && !trivial_regexp_p (string))

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1034 {

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1035 unsigned char *p1, *p2;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1036 int s1, s2;

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

1037 struct re_pattern_buffer *bufp;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

1038

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1039 bufp = compile_pattern (string, &search_regs, trt, posix,

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1040 !NILP (current_buffer->enable_multibyte_characters));

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1041

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1042 immediate_quit = 1; /* Quit immediately if user types ^G,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1043 because letting this function finish

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1044 can take too long. */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1045 QUIT; /* Do a pending quit right away,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1046 to avoid paradoxical behavior */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1047 /* Get pointers and sizes of the two strings

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1048 that make up the visible portion of the buffer. */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1049

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1050 p1 = BEGV_ADDR;

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1051 s1 = GPT_BYTE - BEGV_BYTE;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1052 p2 = GAP_END_ADDR;

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1053 s2 = ZV_BYTE - GPT_BYTE;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1054 if (s1 < 0)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1055 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1056 p2 = p1;

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1057 s2 = ZV_BYTE - BEGV_BYTE;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1058 s1 = 0;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1059 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1060 if (s2 < 0)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1061 {

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1062 s1 = ZV_BYTE - BEGV_BYTE;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1063 s2 = 0;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1064 }

17463

bb9ae80d22e2 (looking_at_1): Set re_match_object.

Richard M. Stallman <rms@gnu.org>

parents: 17284

diff changeset

1065 re_match_object = Qnil;

bb9ae80d22e2 (looking_at_1): Set re_match_object.

Richard M. Stallman <rms@gnu.org>

parents: 17284

diff changeset

1066

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1067 while (n < 0)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1068 {

2475

052bbdf1b817 (search_buffer): Fix typo in previous change.

Richard M. Stallman <rms@gnu.org>

parents: 2439

diff changeset

1069 int val;

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

1070 val = re_search_2 (bufp, (char *) p1, s1, (char *) p2, s2,

20792

f0aa5cc14e8a (fast_string_match): Give re_search byte size of

Kenichi Handa <handa@m17n.org>

parents: 20706

diff changeset

1071 pos_byte - BEGV_BYTE, lim_byte - pos_byte,

f0aa5cc14e8a (fast_string_match): Give re_search byte size of

Kenichi Handa <handa@m17n.org>

parents: 20706

diff changeset

1072 &search_regs,

2475

052bbdf1b817 (search_buffer): Fix typo in previous change.

Richard M. Stallman <rms@gnu.org>

parents: 2439

diff changeset

1073 /* Don't allow match past current point */

20792

f0aa5cc14e8a (fast_string_match): Give re_search byte size of

Kenichi Handa <handa@m17n.org>

parents: 20706

diff changeset

1074 pos_byte - BEGV_BYTE);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1075 if (val == -2)

8950

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

1076 {

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

1077 matcher_overflow ();

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

1078 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1079 if (val >= 0)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1080 {

20927

765fdbf766e4 (search_buffer): Update POS_BYTE for regexp search.

Kenichi Handa <handa@m17n.org>

parents: 20924

diff changeset

1081 pos_byte = search_regs.start[0] + BEGV_BYTE;

621

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

1082 for (i = 0; i < search_regs.num_regs; i++)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1083 if (search_regs.start[i] >= 0)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1084 {

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1085 search_regs.start[i]

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1086 = BYTE_TO_CHAR (search_regs.start[i] + BEGV_BYTE);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1087 search_regs.end[i]

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1088 = BYTE_TO_CHAR (search_regs.end[i] + BEGV_BYTE);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1089 }

9278

f2138d548313 (Flooking_at, skip_chars, search_buffer, set_search_regs, Fstore_match_data):

Karl Heuer <kwzh@gnu.org>

parents: 9113

diff changeset

1090 XSETBUFFER (last_thing_searched, current_buffer);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1091 /* Set pos to the new position. */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1092 pos = search_regs.start[0];

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1093 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1094 else

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1095 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1096 immediate_quit = 0;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1097 return (n);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1098 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1099 n++;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1100 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1101 while (n > 0)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1102 {

2475

052bbdf1b817 (search_buffer): Fix typo in previous change.

Richard M. Stallman <rms@gnu.org>

parents: 2439

diff changeset

1103 int val;

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

1104 val = re_search_2 (bufp, (char *) p1, s1, (char *) p2, s2,

20792

f0aa5cc14e8a (fast_string_match): Give re_search byte size of

Kenichi Handa <handa@m17n.org>

parents: 20706

diff changeset

1105 pos_byte - BEGV_BYTE, lim_byte - pos_byte,

f0aa5cc14e8a (fast_string_match): Give re_search byte size of

Kenichi Handa <handa@m17n.org>

parents: 20706

diff changeset

1106 &search_regs,

f0aa5cc14e8a (fast_string_match): Give re_search byte size of

Kenichi Handa <handa@m17n.org>

parents: 20706

diff changeset

1107 lim_byte - BEGV_BYTE);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1108 if (val == -2)

8950

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

1109 {

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

1110 matcher_overflow ();

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

1111 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1112 if (val >= 0)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1113 {

20927

765fdbf766e4 (search_buffer): Update POS_BYTE for regexp search.

Kenichi Handa <handa@m17n.org>

parents: 20924

diff changeset

1114 pos_byte = search_regs.end[0] + BEGV_BYTE;

621

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

1115 for (i = 0; i < search_regs.num_regs; i++)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1116 if (search_regs.start[i] >= 0)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1117 {

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1118 search_regs.start[i]

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1119 = BYTE_TO_CHAR (search_regs.start[i] + BEGV_BYTE);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1120 search_regs.end[i]

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1121 = BYTE_TO_CHAR (search_regs.end[i] + BEGV_BYTE);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1122 }

9278

f2138d548313 (Flooking_at, skip_chars, search_buffer, set_search_regs, Fstore_match_data):

Karl Heuer <kwzh@gnu.org>

parents: 9113

diff changeset

1123 XSETBUFFER (last_thing_searched, current_buffer);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1124 pos = search_regs.end[0];

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1125 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1126 else

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1127 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1128 immediate_quit = 0;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1129 return (0 - n);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1130 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1131 n--;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1132 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1133 immediate_quit = 0;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1134 return (pos);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1135 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1136 else /* non-RE case */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1137 {

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1138 unsigned char *raw_pattern, *pat;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1139 int raw_pattern_size;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1140 int raw_pattern_size_byte;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1141 unsigned char *patbuf;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1142 int multibyte = !NILP (current_buffer->enable_multibyte_characters);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1143 unsigned char *base_pat = XSTRING (string)->data;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1144 int charset_base = -1;

23876

8d2f38338c81 (search_buffer): Don't use Boyer-Moore

Kenichi Handa <handa@m17n.org>

parents: 23790

diff changeset

1145 int boyer_moore_ok = 1;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1146

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1147 /* MULTIBYTE says whether the text to be searched is multibyte.

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1148 We must convert PATTERN to match that, or we will not really

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1149 find things right. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1150

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1151 if (multibyte == STRING_MULTIBYTE (string))

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1152 {

21915

8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern.

Richard M. Stallman <rms@gnu.org>

parents: 21887

diff changeset

1153 raw_pattern = (unsigned char *) XSTRING (string)->data;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1154 raw_pattern_size = XSTRING (string)->size;

21244

50929073a0ba Use STRING_BYTES and SET_STRING_BYTES.

Richard M. Stallman <rms@gnu.org>

parents: 21171

diff changeset

1155 raw_pattern_size_byte = STRING_BYTES (XSTRING (string));

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1156 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1157 else if (multibyte)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1158 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1159 raw_pattern_size = XSTRING (string)->size;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1160 raw_pattern_size_byte

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1161 = count_size_as_multibyte (XSTRING (string)->data,

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1162 raw_pattern_size);

21915

8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern.

Richard M. Stallman <rms@gnu.org>

parents: 21887

diff changeset

1163 raw_pattern = (unsigned char *) alloca (raw_pattern_size_byte + 1);

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1164 copy_text (XSTRING (string)->data, raw_pattern,

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1165 XSTRING (string)->size, 0, 1);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1166 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1167 else

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1168 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1169 /* Converting multibyte to single-byte.

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1170

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1171 ??? Perhaps this conversion should be done in a special way

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1172 by subtracting nonascii-insert-offset from each non-ASCII char,

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1173 so that only the multibyte chars which really correspond to

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1174 the chosen single-byte character set can possibly match. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1175 raw_pattern_size = XSTRING (string)->size;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1176 raw_pattern_size_byte = XSTRING (string)->size;

21915

8f1159b417c2 (search_buffer): Fix casts when assigning raw_pattern.

Richard M. Stallman <rms@gnu.org>

parents: 21887

diff changeset

1177 raw_pattern = (unsigned char *) alloca (raw_pattern_size + 1);

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1178 copy_text (XSTRING (string)->data, raw_pattern,

21244

50929073a0ba Use STRING_BYTES and SET_STRING_BYTES.

Richard M. Stallman <rms@gnu.org>

parents: 21171

diff changeset

1179 STRING_BYTES (XSTRING (string)), 1, 0);

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1180 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1181

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1182 /* Copy and optionally translate the pattern. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1183 len = raw_pattern_size;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1184 len_byte = raw_pattern_size_byte;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1185 patbuf = (unsigned char *) alloca (len_byte);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1186 pat = patbuf;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1187 base_pat = raw_pattern;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1188 if (multibyte)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1189 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1190 while (--len >= 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1191 {

26869

cb8fbc50812f (search_buffer): Adjusted for the change of CHAR_STRING.

Kenichi Handa <handa@m17n.org>

parents: 26088

diff changeset

1192 unsigned char str[MAX_MULTIBYTE_LENGTH];

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1193 int c, translated, inverse;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1194 int in_charlen, charlen;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1195

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1196 /* If we got here and the RE flag is set, it's because we're

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1197 dealing with a regexp known to be trivial, so the backslash

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1198 just quotes the next character. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1199 if (RE && *base_pat == '\\')

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1200 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1201 len--;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1202 len_byte--;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1203 base_pat++;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1204 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1205

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1206 c = STRING_CHAR_AND_LENGTH (base_pat, len_byte, in_charlen);

23876

8d2f38338c81 (search_buffer): Don't use Boyer-Moore

Kenichi Handa <handa@m17n.org>

parents: 23790

diff changeset

1207

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1208 /* Translate the character, if requested. */

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1209 TRANSLATE (translated, trt, c);

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1210 /* If translation changed the byte-length, go back

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1211 to the original character. */

26869

cb8fbc50812f (search_buffer): Adjusted for the change of CHAR_STRING.

Kenichi Handa <handa@m17n.org>

parents: 26088

diff changeset

1212 charlen = CHAR_STRING (translated, str);

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1213 if (in_charlen != charlen)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1214 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1215 translated = c;

26869

cb8fbc50812f (search_buffer): Adjusted for the change of CHAR_STRING.

Kenichi Handa <handa@m17n.org>

parents: 26088

diff changeset

1216 charlen = CHAR_STRING (c, str);

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1217 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1218

24014

0997bcfd8827 (search_buffer): Fix previous change.

Richard M. Stallman <rms@gnu.org>

parents: 23876

diff changeset

1219 /* If we are searching for something strange,

0997bcfd8827 (search_buffer): Fix previous change.

Richard M. Stallman <rms@gnu.org>

parents: 23876

diff changeset

1220 an invalid multibyte code, don't use boyer-moore. */

0997bcfd8827 (search_buffer): Fix previous change.

Richard M. Stallman <rms@gnu.org>

parents: 23876

diff changeset

1221 if (! ASCII_BYTE_P (translated)

0997bcfd8827 (search_buffer): Fix previous change.

Richard M. Stallman <rms@gnu.org>

parents: 23876

diff changeset

1222 && (charlen == 1 /* 8bit code */

0997bcfd8827 (search_buffer): Fix previous change.

Richard M. Stallman <rms@gnu.org>

parents: 23876

diff changeset

1223 || charlen != in_charlen /* invalid multibyte code */

0997bcfd8827 (search_buffer): Fix previous change.

Richard M. Stallman <rms@gnu.org>

parents: 23876

diff changeset

1224 ))

0997bcfd8827 (search_buffer): Fix previous change.

Richard M. Stallman <rms@gnu.org>

parents: 23876

diff changeset

1225 boyer_moore_ok = 0;

0997bcfd8827 (search_buffer): Fix previous change.

Richard M. Stallman <rms@gnu.org>

parents: 23876

diff changeset

1226

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1227 TRANSLATE (inverse, inverse_trt, c);

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1228

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1229 /* Did this char actually get translated?

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1230 Would any other char get translated into it? */

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1231 if (translated != c || inverse != c)

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1232 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1233 /* Keep track of which character set row

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1234 contains the characters that need translation. */

24014

0997bcfd8827 (search_buffer): Fix previous change.

Richard M. Stallman <rms@gnu.org>

parents: 23876

diff changeset

1235 int charset_base_code = c & ~CHAR_FIELD3_MASK;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1236 if (charset_base == -1)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1237 charset_base = charset_base_code;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1238 else if (charset_base != charset_base_code)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1239 /* If two different rows appear, needing translation,

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1240 then we cannot use boyer_moore search. */

23876

8d2f38338c81 (search_buffer): Don't use Boyer-Moore

Kenichi Handa <handa@m17n.org>

parents: 23790

diff changeset

1241 boyer_moore_ok = 0;

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1242 }

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1243

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1244 /* Store this character into the translated pattern. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1245 bcopy (str, pat, charlen);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1246 pat += charlen;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1247 base_pat += in_charlen;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1248 len_byte -= in_charlen;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1249 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1250 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1251 else

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1252 {

23876

8d2f38338c81 (search_buffer): Don't use Boyer-Moore

Kenichi Handa <handa@m17n.org>

parents: 23790

diff changeset

1253 /* Unibyte buffer. */

8d2f38338c81 (search_buffer): Don't use Boyer-Moore

Kenichi Handa <handa@m17n.org>

parents: 23790

diff changeset

1254 charset_base = 0;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1255 while (--len >= 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1256 {

23876

8d2f38338c81 (search_buffer): Don't use Boyer-Moore

Kenichi Handa <handa@m17n.org>

parents: 23790

diff changeset

1257 int c, translated;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1258

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1259 /* If we got here and the RE flag is set, it's because we're

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1260 dealing with a regexp known to be trivial, so the backslash

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1261 just quotes the next character. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1262 if (RE && *base_pat == '\\')

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1263 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1264 len--;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1265 base_pat++;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1266 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1267 c = *base_pat++;

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1268 TRANSLATE (translated, trt, c);

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1269 *pat++ = translated;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1270 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1271 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1272

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1273 len_byte = pat - patbuf;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1274 len = raw_pattern_size;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1275 pat = base_pat = patbuf;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1276

23876

8d2f38338c81 (search_buffer): Don't use Boyer-Moore

Kenichi Handa <handa@m17n.org>

parents: 23790

diff changeset

1277 if (boyer_moore_ok)

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1278 return boyer_moore (n, pat, len, len_byte, trt, inverse_trt,

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1279 pos, pos_byte, lim, lim_byte,

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1280 charset_base);

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1281 else

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1282 return simple_search (n, pat, len, len_byte, trt,

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1283 pos, pos_byte, lim, lim_byte);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1284 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1285 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1286

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1287 /* Do a simple string search N times for the string PAT,

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1288 whose length is LEN/LEN_BYTE,

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1289 from buffer position POS/POS_BYTE until LIM/LIM_BYTE.

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1290 TRT is the translation table.

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1291

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1292 Return the character position where the match is found.

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1293 Otherwise, if M matches remained to be found, return -M.

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1294

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1295 This kind of search works regardless of what is in PAT and

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1296 regardless of what is in TRT. It is used in cases where

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1297 boyer_moore cannot work. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1298

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1299 static int

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1300 simple_search (n, pat, len, len_byte, trt, pos, pos_byte, lim, lim_byte)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1301 int n;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1302 unsigned char *pat;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1303 int len, len_byte;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1304 Lisp_Object trt;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1305 int pos, pos_byte;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1306 int lim, lim_byte;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1307 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1308 int multibyte = ! NILP (current_buffer->enable_multibyte_characters);

21117

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1309 int forward = n > 0;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1310

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1311 if (lim > pos && multibyte)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1312 while (n > 0)

8950

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

1313 {

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1314 while (1)

20671

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

1315 {

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1316 /* Try matching at position POS. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1317 int this_pos = pos;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1318 int this_pos_byte = pos_byte;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1319 int this_len = len;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1320 int this_len_byte = len_byte;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1321 unsigned char *p = pat;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1322 if (pos + len > lim)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1323 goto stop;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1324

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1325 while (this_len > 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1326 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1327 int charlen, buf_charlen;

21117

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1328 int pat_ch, buf_ch;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1329

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1330 pat_ch = STRING_CHAR_AND_LENGTH (p, this_len_byte, charlen);

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1331 buf_ch = STRING_CHAR_AND_LENGTH (BYTE_POS_ADDR (this_pos_byte),

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1332 ZV_BYTE - this_pos_byte,

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1333 buf_charlen);

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1334 TRANSLATE (buf_ch, trt, buf_ch);

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1335

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1336 if (buf_ch != pat_ch)

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1337 break;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1338

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1339 this_len_byte -= charlen;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1340 this_len--;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1341 p += charlen;

20671

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

1342

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1343 this_pos_byte += buf_charlen;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1344 this_pos++;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1345 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1346

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1347 if (this_len == 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1348 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1349 pos += len;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1350 pos_byte += len_byte;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1351 break;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1352 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1353

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1354 INC_BOTH (pos, pos_byte);

20671

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

1355 }

be91d6130341 (compile_pattern_1): If representation of STRING

Karl Heuer <kwzh@gnu.org>

parents: 20588

diff changeset

1356

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1357 n--;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1358 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1359 else if (lim > pos)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1360 while (n > 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1361 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1362 while (1)

8950

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

1363 {

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1364 /* Try matching at position POS. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1365 int this_pos = pos;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1366 int this_len = len;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1367 unsigned char *p = pat;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1368

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1369 if (pos + len > lim)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1370 goto stop;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1371

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1372 while (this_len > 0)

8950

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

1373 {

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1374 int pat_ch = *p++;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1375 int buf_ch = FETCH_BYTE (this_pos);

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1376 TRANSLATE (buf_ch, trt, buf_ch);

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1377

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1378 if (buf_ch != pat_ch)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1379 break;

21117

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1380

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1381 this_len--;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1382 this_pos++;

8950

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

1383 }

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1384

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1385 if (this_len == 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1386 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1387 pos += len;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1388 break;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1389 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1390

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1391 pos++;

8950

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

1392 }

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1393

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1394 n--;

8950

68ad2f08d735 (trivial_regexp_p): New function.

Karl Heuer <kwzh@gnu.org>

parents: 8584

diff changeset

1395 }

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1396 /* Backwards search. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1397 else if (lim < pos && multibyte)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1398 while (n < 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1399 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1400 while (1)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1401 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1402 /* Try matching at position POS. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1403 int this_pos = pos - len;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1404 int this_pos_byte = pos_byte - len_byte;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1405 int this_len = len;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1406 int this_len_byte = len_byte;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1407 unsigned char *p = pat;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1408

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1409 if (pos - len < lim)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1410 goto stop;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1411

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1412 while (this_len > 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1413 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1414 int charlen, buf_charlen;

21117

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1415 int pat_ch, buf_ch;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1416

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1417 pat_ch = STRING_CHAR_AND_LENGTH (p, this_len_byte, charlen);

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1418 buf_ch = STRING_CHAR_AND_LENGTH (BYTE_POS_ADDR (this_pos_byte),

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1419 ZV_BYTE - this_pos_byte,

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1420 buf_charlen);

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1421 TRANSLATE (buf_ch, trt, buf_ch);

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1422

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1423 if (buf_ch != pat_ch)

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1424 break;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1425

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1426 this_len_byte -= charlen;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1427 this_len--;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1428 p += charlen;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1429 this_pos_byte += buf_charlen;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1430 this_pos++;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1431 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1432

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1433 if (this_len == 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1434 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1435 pos -= len;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1436 pos_byte -= len_byte;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1437 break;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1438 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1439

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1440 DEC_BOTH (pos, pos_byte);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1441 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1442

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1443 n++;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1444 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1445 else if (lim < pos)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1446 while (n < 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1447 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1448 while (1)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1449 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1450 /* Try matching at position POS. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1451 int this_pos = pos - len;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1452 int this_len = len;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1453 unsigned char *p = pat;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1454

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1455 if (pos - len < lim)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1456 goto stop;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1457

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1458 while (this_len > 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1459 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1460 int pat_ch = *p++;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1461 int buf_ch = FETCH_BYTE (this_pos);

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1462 TRANSLATE (buf_ch, trt, buf_ch);

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1463

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1464 if (buf_ch != pat_ch)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1465 break;

21117

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1466 this_len--;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1467 this_pos++;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1468 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1469

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1470 if (this_len == 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1471 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1472 pos -= len;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1473 break;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1474 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1475

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1476 pos--;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1477 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1478

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1479 n++;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1480 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1481

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1482 stop:

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1483 if (n == 0)

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1484 {

21117

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1485 if (forward)

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1486 set_search_regs ((multibyte ? pos_byte : pos) - len_byte, len_byte);

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1487 else

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1488 set_search_regs (multibyte ? pos_byte : pos, len_byte);

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1489

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1490 return pos;

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1491 }

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1492 else if (n > 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1493 return -n;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1494 else

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1495 return n;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1496 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1497

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1498 /* Do Boyer-Moore search N times for the string PAT,

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1499 whose length is LEN/LEN_BYTE,

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1500 from buffer position POS/POS_BYTE until LIM/LIM_BYTE.

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1501 DIRECTION says which direction we search in.

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1502 TRT and INVERSE_TRT are translation tables.

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1503

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1504 This kind of search works if all the characters in PAT that have

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1505 nontrivial translation are the same aside from the last byte. This

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1506 makes it possible to translate just the last byte of a character,

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1507 and do so after just a simple test of the context.

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1508

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1509 If that criterion is not satisfied, do not call this function. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1510

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1511 static int

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1512 boyer_moore (n, base_pat, len, len_byte, trt, inverse_trt,

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1513 pos, pos_byte, lim, lim_byte, charset_base)

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1514 int n;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1515 unsigned char *base_pat;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1516 int len, len_byte;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1517 Lisp_Object trt;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1518 Lisp_Object inverse_trt;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1519 int pos, pos_byte;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1520 int lim, lim_byte;

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1521 int charset_base;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1522 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1523 int direction = ((n > 0) ? 1 : -1);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1524 register int dirlen;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1525 int infinity, limit, k, stride_for_teases;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1526 register int *BM_tab;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1527 int *BM_tab_base;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1528 register unsigned char *cursor, *p_limit;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1529 register int i, j;

21945

bda081af77e7 (boyer_moore): Check more reliably for ptr[1] being

Richard M. Stallman <rms@gnu.org>

parents: 21915

diff changeset

1530 unsigned char *pat, *pat_end;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1531 int multibyte = ! NILP (current_buffer->enable_multibyte_characters);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1532

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1533 unsigned char simple_translate[0400];

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1534 int translate_prev_byte;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1535 int translate_anteprev_byte;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1536

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1537 #ifdef C_ALLOCA

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1538 int BM_tab_space[0400];

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1539 BM_tab = &BM_tab_space[0];

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1540 #else

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1541 BM_tab = (int *) alloca (0400 * sizeof (int));

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1542 #endif

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1543 /* The general approach is that we are going to maintain that we know */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1544 /* the first (closest to the present position, in whatever direction */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1545 /* we're searching) character that could possibly be the last */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1546 /* (furthest from present position) character of a valid match. We */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1547 /* advance the state of our knowledge by looking at that character */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1548 /* and seeing whether it indeed matches the last character of the */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1549 /* pattern. If it does, we take a closer look. If it does not, we */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1550 /* move our pointer (to putative last characters) as far as is */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1551 /* logically possible. This amount of movement, which I call a */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1552 /* stride, will be the length of the pattern if the actual character */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1553 /* appears nowhere in the pattern, otherwise it will be the distance */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1554 /* from the last occurrence of that character to the end of the */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1555 /* pattern. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1556 /* As a coding trick, an enormous stride is coded into the table for */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1557 /* characters that match the last character. This allows use of only */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1558 /* a single test, a test for having gone past the end of the */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1559 /* permissible match region, to test for both possible matches (when */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1560 /* the stride goes past the end immediately) and failure to */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1561 /* match (where you get nudged past the end one stride at a time). */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1562

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1563 /* Here we make a "mickey mouse" BM table. The stride of the search */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1564 /* is determined only by the last character of the putative match. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1565 /* If that character does not match, we will stride the proper */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1566 /* distance to propose a match that superimposes it on the last */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1567 /* instance of a character that matches it (per trt), or misses */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1568 /* it entirely if there is none. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1569

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1570 dirlen = len_byte * direction;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1571 infinity = dirlen - (lim_byte + pos_byte + len_byte + len_byte) * direction;

21945

bda081af77e7 (boyer_moore): Check more reliably for ptr[1] being

Richard M. Stallman <rms@gnu.org>

parents: 21915

diff changeset

1572

bda081af77e7 (boyer_moore): Check more reliably for ptr[1] being

Richard M. Stallman <rms@gnu.org>

parents: 21915

diff changeset

1573 /* Record position after the end of the pattern. */

bda081af77e7 (boyer_moore): Check more reliably for ptr[1] being

Richard M. Stallman <rms@gnu.org>

parents: 21915

diff changeset

1574 pat_end = base_pat + len_byte;

bda081af77e7 (boyer_moore): Check more reliably for ptr[1] being

Richard M. Stallman <rms@gnu.org>

parents: 21915

diff changeset

1575 /* BASE_PAT points to a character that we start scanning from.

bda081af77e7 (boyer_moore): Check more reliably for ptr[1] being

Richard M. Stallman <rms@gnu.org>

parents: 21915

diff changeset

1576 It is the first character in a forward search,

bda081af77e7 (boyer_moore): Check more reliably for ptr[1] being

Richard M. Stallman <rms@gnu.org>

parents: 21915

diff changeset

1577 the last character in a backward search. */

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1578 if (direction < 0)

21945

bda081af77e7 (boyer_moore): Check more reliably for ptr[1] being

Richard M. Stallman <rms@gnu.org>

parents: 21915

diff changeset

1579 base_pat = pat_end - 1;

bda081af77e7 (boyer_moore): Check more reliably for ptr[1] being

Richard M. Stallman <rms@gnu.org>

parents: 21915

diff changeset

1580

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1581 BM_tab_base = BM_tab;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1582 BM_tab += 0400;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1583 j = dirlen; /* to get it in a register */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1584 /* A character that does not appear in the pattern induces a */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1585 /* stride equal to the pattern length. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1586 while (BM_tab_base != BM_tab)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1587 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1588 *--BM_tab = j;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1589 *--BM_tab = j;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1590 *--BM_tab = j;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1591 *--BM_tab = j;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1592 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1593

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1594 /* We use this for translation, instead of TRT itself.

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1595 We fill this in to handle the characters that actually

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1596 occur in the pattern. Others don't matter anyway! */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1597 bzero (simple_translate, sizeof simple_translate);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1598 for (i = 0; i < 0400; i++)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1599 simple_translate[i] = i;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1600

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1601 i = 0;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1602 while (i != infinity)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1603 {

21945

bda081af77e7 (boyer_moore): Check more reliably for ptr[1] being

Richard M. Stallman <rms@gnu.org>

parents: 21915

diff changeset

1604 unsigned char *ptr = base_pat + i;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1605 i += direction;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1606 if (i == dirlen)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1607 i = infinity;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1608 if (! NILP (trt))

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1609 {

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1610 int ch;

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1611 int untranslated;

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1612 int this_translated = 1;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1613

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1614 if (multibyte

21945

bda081af77e7 (boyer_moore): Check more reliably for ptr[1] being

Richard M. Stallman <rms@gnu.org>

parents: 21915

diff changeset

1615 /* Is *PTR the last byte of a character? */

bda081af77e7 (boyer_moore): Check more reliably for ptr[1] being

Richard M. Stallman <rms@gnu.org>

parents: 21915

diff changeset

1616 && (pat_end - ptr == 1 || CHAR_HEAD_P (ptr[1])))

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1617 {

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1618 unsigned char *charstart = ptr;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1619 while (! CHAR_HEAD_P (*charstart))

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1620 charstart--;

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1621 untranslated = STRING_CHAR (charstart, ptr - charstart + 1);

24716

ceeb1f1d1a88 (boyer_moore): Get charset base value of `untranslated'

Kenichi Handa <handa@m17n.org>

parents: 24433

diff changeset

1622 if (charset_base == (untranslated & ~CHAR_FIELD3_MASK))

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1623 {

21117

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1624 TRANSLATE (ch, trt, untranslated);

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1625 if (! CHAR_HEAD_P (*ptr))

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1626 {

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1627 translate_prev_byte = ptr[-1];

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1628 if (! CHAR_HEAD_P (translate_prev_byte))

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1629 translate_anteprev_byte = ptr[-2];

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1630 }

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1631 }

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1632 else

21117

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1633 {

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1634 this_translated = 0;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1635 ch = *ptr;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1636 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1637 }

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1638 else if (!multibyte)

20898

f69969e35e78 (simple_search): Call set_search_regs.

Richard M. Stallman <rms@gnu.org>

parents: 20875

diff changeset

1639 TRANSLATE (ch, trt, *ptr);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1640 else

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1641 {

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1642 ch = *ptr;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1643 this_translated = 0;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1644 }

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1645

21117

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1646 if (ch > 0400)

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1647 j = ((unsigned char) ch) | 0200;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1648 else

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1649 j = (unsigned char) ch;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1650

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1651 if (i == infinity)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1652 stride_for_teases = BM_tab[j];

21117

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1653

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1654 BM_tab[j] = dirlen - i;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1655 /* A translation table is accompanied by its inverse -- see */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1656 /* comment following downcase_table for details */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1657 if (this_translated)

21117

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1658 {

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1659 int starting_ch = ch;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1660 int starting_j = j;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1661 while (1)

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1662 {

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1663 TRANSLATE (ch, inverse_trt, ch);

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1664 if (ch > 0400)

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1665 j = ((unsigned char) ch) | 0200;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1666 else

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1667 j = (unsigned char) ch;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1668

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1669 /* For all the characters that map into CH,

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1670 set up simple_translate to map the last byte

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1671 into STARTING_J. */

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1672 simple_translate[j] = starting_j;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1673 if (ch == starting_ch)

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1674 break;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1675 BM_tab[j] = dirlen - i;

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1676 }

a88d2c555a06 (simple_search): Don't count a character until it matches!

Richard M. Stallman <rms@gnu.org>

parents: 20965

diff changeset

1677 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1678 }

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1679 else

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1680 {

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1681 j = *ptr;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1682

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1683 if (i == infinity)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1684 stride_for_teases = BM_tab[j];

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1685 BM_tab[j] = dirlen - i;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1686 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1687 /* stride_for_teases tells how much to stride if we get a */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1688 /* match on the far character but are subsequently */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1689 /* disappointed, by recording what the stride would have been */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1690 /* for that character if the last character had been */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1691 /* different. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1692 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1693 infinity = dirlen - infinity;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1694 pos_byte += dirlen - ((direction > 0) ? direction : 0);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1695 /* loop invariant - POS_BYTE points at where last char (first

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1696 char if reverse) of pattern would align in a possible match. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1697 while (n != 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1698 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1699 int tail_end;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1700 unsigned char *tail_end_ptr;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1701

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1702 /* It's been reported that some (broken) compiler thinks that

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1703 Boolean expressions in an arithmetic context are unsigned.

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1704 Using an explicit ?1:0 prevents this. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1705 if ((lim_byte - pos_byte - ((direction > 0) ? 1 : 0)) * direction

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1706 < 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1707 return (n * (0 - direction));

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1708 /* First we do the part we can by pointers (maybe nothing) */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1709 QUIT;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1710 pat = base_pat;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1711 limit = pos_byte - dirlen + direction;

21457

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1712 if (direction > 0)

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1713 {

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1714 limit = BUFFER_CEILING_OF (limit);

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1715 /* LIMIT is now the last (not beyond-last!) value POS_BYTE

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1716 can take on without hitting edge of buffer or the gap. */

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1717 limit = min (limit, pos_byte + 20000);

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1718 limit = min (limit, lim_byte - 1);

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1719 }

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1720 else

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1721 {

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1722 limit = BUFFER_FLOOR_OF (limit);

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1723 /* LIMIT is now the last (not beyond-last!) value POS_BYTE

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1724 can take on without hitting edge of buffer or the gap. */

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1725 limit = max (limit, pos_byte - 20000);

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1726 limit = max (limit, lim_byte);

8c6ea32aadfa (min, max): Make these macros, not functions.

Karl Heuer <kwzh@gnu.org>

parents: 21248

diff changeset

1727 }

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1728 tail_end = BUFFER_CEILING_OF (pos_byte) + 1;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1729 tail_end_ptr = BYTE_POS_ADDR (tail_end);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1730

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1731 if ((limit - pos_byte) * direction > 20)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1732 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1733 unsigned char *p2;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1734

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1735 p_limit = BYTE_POS_ADDR (limit);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1736 p2 = (cursor = BYTE_POS_ADDR (pos_byte));

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1737 /* In this loop, pos + cursor - p2 is the surrogate for pos */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1738 while (1) /* use one cursor setting as long as i can */

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1739 {

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1740 if (direction > 0) /* worth duplicating */

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1741 {

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1742 /* Use signed comparison if appropriate

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1743 to make cursor+infinity sure to be > p_limit.

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1744 Assuming that the buffer lies in a range of addresses

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1745 that are all "positive" (as ints) or all "negative",

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1746 either kind of comparison will work as long

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1747 as we don't step by infinity. So pick the kind

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1748 that works when we do step by infinity. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1749 if ((EMACS_INT) (p_limit + infinity) > (EMACS_INT) p_limit)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1750 while ((EMACS_INT) cursor <= (EMACS_INT) p_limit)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1751 cursor += BM_tab[*cursor];

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1752 else

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1753 while ((EMACS_UINT) cursor <= (EMACS_UINT) p_limit)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1754 cursor += BM_tab[*cursor];

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1755 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1756 else

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1757 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1758 if ((EMACS_INT) (p_limit + infinity) < (EMACS_INT) p_limit)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1759 while ((EMACS_INT) cursor >= (EMACS_INT) p_limit)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1760 cursor += BM_tab[*cursor];

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1761 else

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1762 while ((EMACS_UINT) cursor >= (EMACS_UINT) p_limit)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1763 cursor += BM_tab[*cursor];

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1764 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1765 /* If you are here, cursor is beyond the end of the searched region. */

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1766 /* This can happen if you match on the far character of the pattern, */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1767 /* because the "stride" of that character is infinity, a number able */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1768 /* to throw you well beyond the end of the search. It can also */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1769 /* happen if you fail to match within the permitted region and would */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1770 /* otherwise try a character beyond that region */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1771 if ((cursor - p_limit) * direction <= len_byte)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1772 break; /* a small overrun is genuine */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1773 cursor -= infinity; /* large overrun = hit */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1774 i = dirlen - direction;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1775 if (! NILP (trt))

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1776 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1777 while ((i -= direction) + direction != 0)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1778 {

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1779 int ch;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1780 cursor -= direction;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1781 /* Translate only the last byte of a character. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1782 if (! multibyte

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1783 || ((cursor == tail_end_ptr

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1784 || CHAR_HEAD_P (cursor[1]))

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1785 && (CHAR_HEAD_P (cursor[0])

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1786 || (translate_prev_byte == cursor[-1]

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1787 && (CHAR_HEAD_P (translate_prev_byte)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1788 || translate_anteprev_byte == cursor[-2])))))

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1789 ch = simple_translate[*cursor];

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1790 else

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1791 ch = *cursor;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1792 if (pat[i] != ch)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1793 break;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1794 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1795 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1796 else

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1797 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1798 while ((i -= direction) + direction != 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1799 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1800 cursor -= direction;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1801 if (pat[i] != *cursor)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1802 break;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1803 }

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1804 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1805 cursor += dirlen - i - direction; /* fix cursor */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1806 if (i + direction == 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1807 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1808 int position;

708

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

1809

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1810 cursor -= direction;

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1811

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1812 position = pos_byte + cursor - p2 + ((direction > 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1813 ? 1 - len_byte : 0);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1814 set_search_regs (position, len_byte);

708

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

1815

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1816 if ((n -= direction) != 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1817 cursor += dirlen; /* to resume search */

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1818 else

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1819 return ((direction > 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1820 ? search_regs.end[0] : search_regs.start[0]);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1821 }

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1822 else

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1823 cursor += stride_for_teases; /* <sigh> we lose - */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1824 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1825 pos_byte += cursor - p2;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1826 }

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1827 else

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1828 /* Now we'll pick up a clump that has to be done the hard */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1829 /* way because it covers a discontinuity */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1830 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1831 limit = ((direction > 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1832 ? BUFFER_CEILING_OF (pos_byte - dirlen + 1)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1833 : BUFFER_FLOOR_OF (pos_byte - dirlen - 1));

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1834 limit = ((direction > 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1835 ? min (limit + len_byte, lim_byte - 1)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1836 : max (limit - len_byte, lim_byte));

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1837 /* LIMIT is now the last value POS_BYTE can have

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1838 and still be valid for a possible match. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1839 while (1)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1840 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1841 /* This loop can be coded for space rather than */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1842 /* speed because it will usually run only once. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1843 /* (the reach is at most len + 21, and typically */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1844 /* does not exceed len) */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1845 while ((limit - pos_byte) * direction >= 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1846 pos_byte += BM_tab[FETCH_BYTE (pos_byte)];

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1847 /* now run the same tests to distinguish going off the */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1848 /* end, a match or a phony match. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1849 if ((pos_byte - limit) * direction <= len_byte)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1850 break; /* ran off the end */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1851 /* Found what might be a match.

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1852 Set POS_BYTE back to last (first if reverse) pos. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1853 pos_byte -= infinity;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1854 i = dirlen - direction;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1855 while ((i -= direction) + direction != 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1856 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1857 int ch;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1858 unsigned char *ptr;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1859 pos_byte -= direction;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1860 ptr = BYTE_POS_ADDR (pos_byte);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1861 /* Translate only the last byte of a character. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1862 if (! multibyte

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1863 || ((ptr == tail_end_ptr

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1864 || CHAR_HEAD_P (ptr[1]))

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1865 && (CHAR_HEAD_P (ptr[0])

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1866 || (translate_prev_byte == ptr[-1]

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1867 && (CHAR_HEAD_P (translate_prev_byte)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1868 || translate_anteprev_byte == ptr[-2])))))

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1869 ch = simple_translate[*ptr];

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1870 else

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1871 ch = *ptr;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1872 if (pat[i] != ch)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1873 break;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1874 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1875 /* Above loop has moved POS_BYTE part or all the way

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1876 back to the first pos (last pos if reverse).

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1877 Set it once again at the last (first if reverse) char. */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1878 pos_byte += dirlen - i- direction;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1879 if (i + direction == 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1880 {

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1881 int position;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1882 pos_byte -= direction;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1883

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1884 position = pos_byte + ((direction > 0) ? 1 - len_byte : 0);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1885

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1886 set_search_regs (position, len_byte);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1887

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1888 if ((n -= direction) != 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1889 pos_byte += dirlen; /* to resume search */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1890 else

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1891 return ((direction > 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1892 ? search_regs.end[0] : search_regs.start[0]);

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1893 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1894 else

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1895 pos_byte += stride_for_teases;

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1896 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1897 }

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1898 /* We have done one clump. Can we continue? */

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1899 if ((lim_byte - pos_byte) * direction < 0)

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1900 return ((0 - n) * direction);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1901 }

20869

c9f608f889b4 (boyer_moore, simple_search): New subroutines.

Richard M. Stallman <rms@gnu.org>

parents: 20824

diff changeset

1902 return BYTE_TO_CHAR (pos_byte);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1903 }

5556

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1904

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1905 /* Record beginning BEG_BYTE and end BEG_BYTE + NBYTES

22082

84bcdbc46d71 (search_buffer): Set search regs for all success with an empty string.

Richard M. Stallman <rms@gnu.org>

parents: 21988

diff changeset

1906 for the overall match just found in the current buffer.

84bcdbc46d71 (search_buffer): Set search regs for all success with an empty string.

Richard M. Stallman <rms@gnu.org>

parents: 21988

diff changeset

1907 Also clear out the match data for registers 1 and up. */

5556

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1908

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1909 static void

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1910 set_search_regs (beg_byte, nbytes)

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1911 int beg_byte, nbytes;

5556

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1912 {

22082

84bcdbc46d71 (search_buffer): Set search regs for all success with an empty string.

Richard M. Stallman <rms@gnu.org>

parents: 21988

diff changeset

1913 int i;

84bcdbc46d71 (search_buffer): Set search regs for all success with an empty string.

Richard M. Stallman <rms@gnu.org>

parents: 21988

diff changeset

1914

5556

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1915 /* Make sure we have registers in which to store

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1916 the match position. */

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1917 if (search_regs.num_regs == 0)

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1918 {

10250

422c3b96efda (set_search_regs): Really set search_regs.start and .end.

Richard M. Stallman <rms@gnu.org>

parents: 10141

diff changeset

1919 search_regs.start = (regoff_t *) xmalloc (2 * sizeof (regoff_t));

422c3b96efda (set_search_regs): Really set search_regs.start and .end.

Richard M. Stallman <rms@gnu.org>

parents: 10141

diff changeset

1920 search_regs.end = (regoff_t *) xmalloc (2 * sizeof (regoff_t));

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

1921 search_regs.num_regs = 2;

5556

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1922 }

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1923

22082

84bcdbc46d71 (search_buffer): Set search regs for all success with an empty string.

Richard M. Stallman <rms@gnu.org>

parents: 21988

diff changeset

1924 /* Clear out the other registers. */

84bcdbc46d71 (search_buffer): Set search regs for all success with an empty string.

Richard M. Stallman <rms@gnu.org>

parents: 21988

diff changeset

1925 for (i = 1; i < search_regs.num_regs; i++)

84bcdbc46d71 (search_buffer): Set search regs for all success with an empty string.

Richard M. Stallman <rms@gnu.org>

parents: 21988

diff changeset

1926 {

84bcdbc46d71 (search_buffer): Set search regs for all success with an empty string.

Richard M. Stallman <rms@gnu.org>

parents: 21988

diff changeset

1927 search_regs.start[i] = -1;

84bcdbc46d71 (search_buffer): Set search regs for all success with an empty string.

Richard M. Stallman <rms@gnu.org>

parents: 21988

diff changeset

1928 search_regs.end[i] = -1;

84bcdbc46d71 (search_buffer): Set search regs for all success with an empty string.

Richard M. Stallman <rms@gnu.org>

parents: 21988

diff changeset

1929 }

84bcdbc46d71 (search_buffer): Set search regs for all success with an empty string.

Richard M. Stallman <rms@gnu.org>

parents: 21988

diff changeset

1930

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1931 search_regs.start[0] = BYTE_TO_CHAR (beg_byte);

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

1932 search_regs.end[0] = BYTE_TO_CHAR (beg_byte + nbytes);

9278

f2138d548313 (Flooking_at, skip_chars, search_buffer, set_search_regs, Fstore_match_data):

Karl Heuer <kwzh@gnu.org>

parents: 9113

diff changeset

1933 XSETBUFFER (last_thing_searched, current_buffer);

5556

14161cfec24a (set_search_regs): New subroutine.

Richard M. Stallman <rms@gnu.org>

parents: 4954

diff changeset

1934 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1935

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1936 /* Given a string of words separated by word delimiters,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1937 compute a regexp that matches those exact words

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1938 separated by arbitrary punctuation. */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1939

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1940 static Lisp_Object

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1941 wordify (string)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1942 Lisp_Object string;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1943 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1944 register unsigned char *p, *o;

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1945 register int i, i_byte, len, punct_count = 0, word_count = 0;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1946 Lisp_Object val;

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1947 int prev_c = 0;

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1948 int adjust;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1949

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1950 CHECK_STRING (string, 0);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1951 p = XSTRING (string)->data;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1952 len = XSTRING (string)->size;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1953

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1954 for (i = 0, i_byte = 0; i < len; )

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1955 {

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1956 int c;

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1957

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1958 if (STRING_MULTIBYTE (string))

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1959 FETCH_STRING_CHAR_ADVANCE (c, string, i, i_byte);

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1960 else

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1961 c = XSTRING (string)->data[i++];

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1962

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1963 if (SYNTAX (c) != Sword)

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1964 {

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1965 punct_count++;

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1966 if (i > 0 && SYNTAX (prev_c) == Sword)

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1967 word_count++;

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1968 }

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1969

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1970 prev_c = c;

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1971 }

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1972

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1973 if (SYNTAX (prev_c) == Sword)

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1974 word_count++;

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1975 if (!word_count)

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1976 return build_string ("");

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1977

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

1978 adjust = - punct_count + 5 * (word_count - 1) + 4;

22640

929ad308aba6 (wordify): Fix i_byte even in unibyte case for copy loop.

Richard M. Stallman <rms@gnu.org>

parents: 22533

diff changeset

1979 if (STRING_MULTIBYTE (string))

929ad308aba6 (wordify): Fix i_byte even in unibyte case for copy loop.

Richard M. Stallman <rms@gnu.org>

parents: 22533

diff changeset

1980 val = make_uninit_multibyte_string (len + adjust,

929ad308aba6 (wordify): Fix i_byte even in unibyte case for copy loop.

Richard M. Stallman <rms@gnu.org>

parents: 22533

diff changeset

1981 STRING_BYTES (XSTRING (string))

929ad308aba6 (wordify): Fix i_byte even in unibyte case for copy loop.

Richard M. Stallman <rms@gnu.org>

parents: 22533

diff changeset

1982 + adjust);

929ad308aba6 (wordify): Fix i_byte even in unibyte case for copy loop.

Richard M. Stallman <rms@gnu.org>

parents: 22533

diff changeset

1983 else

929ad308aba6 (wordify): Fix i_byte even in unibyte case for copy loop.

Richard M. Stallman <rms@gnu.org>

parents: 22533

diff changeset

1984 val = make_uninit_string (len + adjust);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1985

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1986 o = XSTRING (val)->data;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1987 *o++ = '\\';

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1988 *o++ = 'b';

21887

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

1989 prev_c = 0;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

1990

21887

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

1991 for (i = 0, i_byte = 0; i < len; )

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

1992 {

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

1993 int c;

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

1994 int i_byte_orig = i_byte;

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

1995

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

1996 if (STRING_MULTIBYTE (string))

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

1997 FETCH_STRING_CHAR_ADVANCE (c, string, i, i_byte);

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

1998 else

22640

929ad308aba6 (wordify): Fix i_byte even in unibyte case for copy loop.

Richard M. Stallman <rms@gnu.org>

parents: 22533

diff changeset

1999 {

929ad308aba6 (wordify): Fix i_byte even in unibyte case for copy loop.

Richard M. Stallman <rms@gnu.org>

parents: 22533

diff changeset

2000 c = XSTRING (string)->data[i++];

929ad308aba6 (wordify): Fix i_byte even in unibyte case for copy loop.

Richard M. Stallman <rms@gnu.org>

parents: 22533

diff changeset

2001 i_byte++;

929ad308aba6 (wordify): Fix i_byte even in unibyte case for copy loop.

Richard M. Stallman <rms@gnu.org>

parents: 22533

diff changeset

2002 }

21887

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2003

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2004 if (SYNTAX (c) == Sword)

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2005 {

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2006 bcopy (&XSTRING (string)->data[i_byte_orig], o,

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2007 i_byte - i_byte_orig);

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2008 o += i_byte - i_byte_orig;

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2009 }

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2010 else if (i > 0 && SYNTAX (prev_c) == Sword && --word_count)

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2011 {

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2012 *o++ = '\\';

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2013 *o++ = 'W';

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2014 *o++ = '\\';

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2015 *o++ = 'W';

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2016 *o++ = '*';

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2017 }

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2018

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2019 prev_c = c;

1c9f20274f76 (wordify): Do the second loop by chars, not by bytes.

Richard M. Stallman <rms@gnu.org>

parents: 21531

diff changeset

2020 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2021

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2022 *o++ = '\\';

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2023 *o++ = 'b';

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2024

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2025 return val;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2026 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2027

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2028 DEFUN ("search-backward", Fsearch_backward, Ssearch_backward, 1, 4,

19541

e7876a076881 (Fsearch_backward): Inherit the current input method on

Kenichi Handa <handa@m17n.org>

parents: 18762

diff changeset

2029 "MSearch backward: ",

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2030 "Search backward from point for STRING.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2031 Set point to the beginning of the occurrence found, and return point.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2032 An optional second argument bounds the search; it is a buffer position.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2033 The match found must not extend before that position.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2034 Optional third argument, if t, means if fail just return nil (no error).\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2035 If not nil and not t, position at limit of search and return nil.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2036 Optional fourth argument is repeat count--search for successive occurrences.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2037 See also the functions `match-beginning', `match-end' and `replace-match'.")

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2038 (string, bound, noerror, count)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2039 Lisp_Object string, bound, noerror, count;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2040 {

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2041 return search_command (string, bound, noerror, count, -1, 0, 0);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2042 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2043

19541

e7876a076881 (Fsearch_backward): Inherit the current input method on

Kenichi Handa <handa@m17n.org>

parents: 18762

diff changeset

2044 DEFUN ("search-forward", Fsearch_forward, Ssearch_forward, 1, 4, "MSearch: ",

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2045 "Search forward from point for STRING.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2046 Set point to the end of the occurrence found, and return point.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2047 An optional second argument bounds the search; it is a buffer position.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2048 The match found must not extend after that position. nil is equivalent\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2049 to (point-max).\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2050 Optional third argument, if t, means if fail just return nil (no error).\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2051 If not nil and not t, move to limit of search and return nil.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2052 Optional fourth argument is repeat count--search for successive occurrences.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2053 See also the functions `match-beginning', `match-end' and `replace-match'.")

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2054 (string, bound, noerror, count)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2055 Lisp_Object string, bound, noerror, count;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2056 {

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2057 return search_command (string, bound, noerror, count, 1, 0, 0);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2058 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2059

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2060 DEFUN ("word-search-backward", Fword_search_backward, Sword_search_backward, 1, 4,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2061 "sWord search backward: ",

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2062 "Search backward from point for STRING, ignoring differences in punctuation.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2063 Set point to the beginning of the occurrence found, and return point.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2064 An optional second argument bounds the search; it is a buffer position.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2065 The match found must not extend before that position.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2066 Optional third argument, if t, means if fail just return nil (no error).\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2067 If not nil and not t, move to limit of search and return nil.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2068 Optional fourth argument is repeat count--search for successive occurrences.")

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2069 (string, bound, noerror, count)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2070 Lisp_Object string, bound, noerror, count;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2071 {

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2072 return search_command (wordify (string), bound, noerror, count, -1, 1, 0);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2073 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2074

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2075 DEFUN ("word-search-forward", Fword_search_forward, Sword_search_forward, 1, 4,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2076 "sWord search: ",

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2077 "Search forward from point for STRING, ignoring differences in punctuation.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2078 Set point to the end of the occurrence found, and return point.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2079 An optional second argument bounds the search; it is a buffer position.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2080 The match found must not extend after that position.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2081 Optional third argument, if t, means if fail just return nil (no error).\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2082 If not nil and not t, move to limit of search and return nil.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2083 Optional fourth argument is repeat count--search for successive occurrences.")

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2084 (string, bound, noerror, count)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2085 Lisp_Object string, bound, noerror, count;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2086 {

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2087 return search_command (wordify (string), bound, noerror, count, 1, 1, 0);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2088 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2089

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2090 DEFUN ("re-search-backward", Fre_search_backward, Sre_search_backward, 1, 4,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2091 "sRE search backward: ",

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2092 "Search backward from point for match for regular expression REGEXP.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2093 Set point to the beginning of the match, and return point.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2094 The match found is the one starting last in the buffer\n\

6297

b44907fd0ff0 (Fre_search_forward, Fre_search_backward): Doc fix.

Karl Heuer <kwzh@gnu.org>

parents: 6196

diff changeset

2095 and yet ending before the origin of the search.\n\

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2096 An optional second argument bounds the search; it is a buffer position.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2097 The match found must start at or after that position.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2098 Optional third argument, if t, means if fail just return nil (no error).\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2099 If not nil and not t, move to limit of search and return nil.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2100 Optional fourth argument is repeat count--search for successive occurrences.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2101 See also the functions `match-beginning', `match-end' and `replace-match'.")

6297

b44907fd0ff0 (Fre_search_forward, Fre_search_backward): Doc fix.

Karl Heuer <kwzh@gnu.org>

parents: 6196

diff changeset

2102 (regexp, bound, noerror, count)

b44907fd0ff0 (Fre_search_forward, Fre_search_backward): Doc fix.

Karl Heuer <kwzh@gnu.org>

parents: 6196

diff changeset

2103 Lisp_Object regexp, bound, noerror, count;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2104 {

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2105 return search_command (regexp, bound, noerror, count, -1, 1, 0);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2106 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2107

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2108 DEFUN ("re-search-forward", Fre_search_forward, Sre_search_forward, 1, 4,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2109 "sRE search: ",

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2110 "Search forward from point for regular expression REGEXP.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2111 Set point to the end of the occurrence found, and return point.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2112 An optional second argument bounds the search; it is a buffer position.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2113 The match found must not extend after that position.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2114 Optional third argument, if t, means if fail just return nil (no error).\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2115 If not nil and not t, move to limit of search and return nil.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2116 Optional fourth argument is repeat count--search for successive occurrences.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2117 See also the functions `match-beginning', `match-end' and `replace-match'.")

6297

b44907fd0ff0 (Fre_search_forward, Fre_search_backward): Doc fix.

Karl Heuer <kwzh@gnu.org>

parents: 6196

diff changeset

2118 (regexp, bound, noerror, count)

b44907fd0ff0 (Fre_search_forward, Fre_search_backward): Doc fix.

Karl Heuer <kwzh@gnu.org>

parents: 6196

diff changeset

2119 Lisp_Object regexp, bound, noerror, count;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2120 {

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2121 return search_command (regexp, bound, noerror, count, 1, 1, 0);

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2122 }

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2123

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2124 DEFUN ("posix-search-backward", Fposix_search_backward, Sposix_search_backward, 1, 4,

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2125 "sPosix search backward: ",

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2126 "Search backward from point for match for regular expression REGEXP.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2127 Find the longest match in accord with Posix regular expression rules.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2128 Set point to the beginning of the match, and return point.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2129 The match found is the one starting last in the buffer\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2130 and yet ending before the origin of the search.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2131 An optional second argument bounds the search; it is a buffer position.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2132 The match found must start at or after that position.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2133 Optional third argument, if t, means if fail just return nil (no error).\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2134 If not nil and not t, move to limit of search and return nil.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2135 Optional fourth argument is repeat count--search for successive occurrences.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2136 See also the functions `match-beginning', `match-end' and `replace-match'.")

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2137 (regexp, bound, noerror, count)

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2138 Lisp_Object regexp, bound, noerror, count;

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2139 {

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2140 return search_command (regexp, bound, noerror, count, -1, 1, 1);

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2141 }

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2142

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2143 DEFUN ("posix-search-forward", Fposix_search_forward, Sposix_search_forward, 1, 4,

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2144 "sPosix search: ",

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2145 "Search forward from point for regular expression REGEXP.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2146 Find the longest match in accord with Posix regular expression rules.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2147 Set point to the end of the occurrence found, and return point.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2148 An optional second argument bounds the search; it is a buffer position.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2149 The match found must not extend after that position.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2150 Optional third argument, if t, means if fail just return nil (no error).\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2151 If not nil and not t, move to limit of search and return nil.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2152 Optional fourth argument is repeat count--search for successive occurrences.\n\

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2153 See also the functions `match-beginning', `match-end' and `replace-match'.")

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2154 (regexp, bound, noerror, count)

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2155 Lisp_Object regexp, bound, noerror, count;

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2156 {

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2157 return search_command (regexp, bound, noerror, count, 1, 1, 1);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2158 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2159

12807

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2160 DEFUN ("replace-match", Freplace_match, Sreplace_match, 1, 5, 0,

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2161 "Replace text matched by last search with NEWTEXT.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2162 If second arg FIXEDCASE is non-nil, do not alter case of replacement text.\n\

6543

33032ee16c7c (Freplace_match): Doc fix.

Richard M. Stallman <rms@gnu.org>

parents: 6343

diff changeset

2163 Otherwise maybe capitalize the whole text, or maybe just word initials,\n\

33032ee16c7c (Freplace_match): Doc fix.

Richard M. Stallman <rms@gnu.org>

parents: 6343

diff changeset

2164 based on the replaced text.\n\

33032ee16c7c (Freplace_match): Doc fix.

Richard M. Stallman <rms@gnu.org>

parents: 6343

diff changeset

2165 If the replaced text has only capital letters\n\

33032ee16c7c (Freplace_match): Doc fix.

Richard M. Stallman <rms@gnu.org>

parents: 6343

diff changeset

2166 and has at least one multiletter word, convert NEWTEXT to all caps.\n\

33032ee16c7c (Freplace_match): Doc fix.

Richard M. Stallman <rms@gnu.org>

parents: 6343

diff changeset

2167 If the replaced text has at least one word starting with a capital letter,\n\

33032ee16c7c (Freplace_match): Doc fix.

Richard M. Stallman <rms@gnu.org>

parents: 6343

diff changeset

2168 then capitalize each word in NEWTEXT.\n\n\

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2169 If third arg LITERAL is non-nil, insert NEWTEXT literally.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2170 Otherwise treat `\\' as special:\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2171 `\\&' in NEWTEXT means substitute original matched text.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2172 `\\N' means substitute what matched the Nth `\$...\$'.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2173 If Nth parens didn't match, substitute nothing.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2174 `\\\\' means insert one `\\'.\n\

708

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2175 FIXEDCASE and LITERAL are optional arguments.\n\

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2176 Leaves point at end of replacement text.\n\

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2177 \n\

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2178 The optional fourth argument STRING can be a string to modify.\n\

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2179 In that case, this function creates and returns a new string\n\

12807

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2180 which is made by replacing the part of STRING that was matched.\n\

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2181 \n\

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2182 The optional fifth argument SUBEXP specifies a subexpression of the match.\n\

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2183 It says to replace just that subexpression instead of the whole match.\n\

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2184 This is useful only after a regular expression search or match\n\

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2185 since only regular expressions have distinguished subexpressions.")

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2186 (newtext, fixedcase, literal, string, subexp)

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2187 Lisp_Object newtext, fixedcase, literal, string, subexp;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2188 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2189 enum { nochange, all_caps, cap_initial } case_action;

22533

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2190 register int pos, pos_byte;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2191 int some_multiletter_word;

2393

a35d2c5cbb3b (Freplace_match): Clean up criterion about converting case.

Richard M. Stallman <rms@gnu.org>

parents: 1926

diff changeset

2192 int some_lowercase;

7674

947d24fefd9e (Freplace_match): Improve capitalization heuristics.

Karl Heuer <kwzh@gnu.org>

parents: 7673

diff changeset

2193 int some_uppercase;

8526

2b7b23059f1b (Freplace_match): Treat caseless initial like a lowercase initial.

Richard M. Stallman <rms@gnu.org>

parents: 7891

diff changeset

2194 int some_nonuppercase_initial;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2195 register int c, prevc;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2196 int inslen;

12807

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2197 int sub;

18081

300068b4fcef (Freplace_match): Fix previous change.

Richard M. Stallman <rms@gnu.org>

parents: 18077

diff changeset

2198 int opoint, newpoint;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2199

4882

8c09f87f5087 (Freplace_match): Fix argument names to match doc string.

Brian Fox <bfox@gnu.org>

parents: 4832

diff changeset

2200 CHECK_STRING (newtext, 0);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2201

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2202 if (! NILP (string))

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2203 CHECK_STRING (string, 4);

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2204

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2205 case_action = nochange; /* We tried an initialization */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2206 /* but some C compilers blew it */

621

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2207

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2208 if (search_regs.num_regs <= 0)

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2209 error ("replace-match called before any match found");

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2210

12807

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2211 if (NILP (subexp))

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2212 sub = 0;

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2213 else

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2214 {

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2215 CHECK_NUMBER (subexp, 3);

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2216 sub = XINT (subexp);

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2217 if (sub < 0 || sub >= search_regs.num_regs)

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2218 args_out_of_range (subexp, make_number (search_regs.num_regs));

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2219 }

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2220

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2221 if (NILP (string))

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2222 {

12807

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2223 if (search_regs.start[sub] < BEGV

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2224 || search_regs.start[sub] > search_regs.end[sub]

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2225 || search_regs.end[sub] > ZV)

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2226 args_out_of_range (make_number (search_regs.start[sub]),

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2227 make_number (search_regs.end[sub]));

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2228 }

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2229 else

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2230 {

12807

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2231 if (search_regs.start[sub] < 0

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2232 || search_regs.start[sub] > search_regs.end[sub]

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2233 || search_regs.end[sub] > XSTRING (string)->size)

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2234 args_out_of_range (make_number (search_regs.start[sub]),

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2235 make_number (search_regs.end[sub]));

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2236 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2237

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2238 if (NILP (fixedcase))

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2239 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2240 /* Decide how to casify by examining the matched text. */

22533

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2241 int last;

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2242

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2243 pos = search_regs.start[sub];

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2244 last = search_regs.end[sub];

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2245

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

2246 if (NILP (string))

22533

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2247 pos_byte = CHAR_TO_BYTE (pos);

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

2248 else

22533

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2249 pos_byte = string_char_to_byte (string, pos);

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

2250

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2251 prevc = '\n';

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2252 case_action = all_caps;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2253

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2254 /* some_multiletter_word is set nonzero if any original word

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2255 is more than one letter long. */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2256 some_multiletter_word = 0;

2393

a35d2c5cbb3b (Freplace_match): Clean up criterion about converting case.

Richard M. Stallman <rms@gnu.org>

parents: 1926

diff changeset

2257 some_lowercase = 0;

8526

2b7b23059f1b (Freplace_match): Treat caseless initial like a lowercase initial.

Richard M. Stallman <rms@gnu.org>

parents: 7891

diff changeset

2258 some_nonuppercase_initial = 0;

7674

947d24fefd9e (Freplace_match): Improve capitalization heuristics.

Karl Heuer <kwzh@gnu.org>

parents: 7673

diff changeset

2259 some_uppercase = 0;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2260

22533

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2261 while (pos < last)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2262 {

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2263 if (NILP (string))

22533

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2264 {

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2265 c = FETCH_CHAR (pos_byte);

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2266 INC_BOTH (pos, pos_byte);

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2267 }

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2268 else

22533

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2269 FETCH_STRING_CHAR_ADVANCE (c, string, pos, pos_byte);

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2270

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2271 if (LOWERCASEP (c))

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2272 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2273 /* Cannot be all caps if any original char is lower case */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2274

2393

a35d2c5cbb3b (Freplace_match): Clean up criterion about converting case.

Richard M. Stallman <rms@gnu.org>

parents: 1926

diff changeset

2275 some_lowercase = 1;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2276 if (SYNTAX (prevc) != Sword)

8526

2b7b23059f1b (Freplace_match): Treat caseless initial like a lowercase initial.

Richard M. Stallman <rms@gnu.org>

parents: 7891

diff changeset

2277 some_nonuppercase_initial = 1;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2278 else

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2279 some_multiletter_word = 1;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2280 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2281 else if (!NOCASEP (c))

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2282 {

7674

947d24fefd9e (Freplace_match): Improve capitalization heuristics.

Karl Heuer <kwzh@gnu.org>

parents: 7673

diff changeset

2283 some_uppercase = 1;

2393

a35d2c5cbb3b (Freplace_match): Clean up criterion about converting case.

Richard M. Stallman <rms@gnu.org>

parents: 1926

diff changeset

2284 if (SYNTAX (prevc) != Sword)

6679

490b7e2db978 (Freplace_match): Don't capitalize unless all matched words are capitalized.

Karl Heuer <kwzh@gnu.org>

parents: 6543

diff changeset

2285 ;

2393

a35d2c5cbb3b (Freplace_match): Clean up criterion about converting case.

Richard M. Stallman <rms@gnu.org>

parents: 1926

diff changeset

2286 else

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2287 some_multiletter_word = 1;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2288 }

8526

2b7b23059f1b (Freplace_match): Treat caseless initial like a lowercase initial.

Richard M. Stallman <rms@gnu.org>

parents: 7891

diff changeset

2289 else

2b7b23059f1b (Freplace_match): Treat caseless initial like a lowercase initial.

Richard M. Stallman <rms@gnu.org>

parents: 7891

diff changeset

2290 {

2b7b23059f1b (Freplace_match): Treat caseless initial like a lowercase initial.

Richard M. Stallman <rms@gnu.org>

parents: 7891

diff changeset

2291 /* If the initial is a caseless word constituent,

2b7b23059f1b (Freplace_match): Treat caseless initial like a lowercase initial.

Richard M. Stallman <rms@gnu.org>

parents: 7891

diff changeset

2292 treat that like a lowercase initial. */

2b7b23059f1b (Freplace_match): Treat caseless initial like a lowercase initial.

Richard M. Stallman <rms@gnu.org>

parents: 7891

diff changeset

2293 if (SYNTAX (prevc) != Sword)

2b7b23059f1b (Freplace_match): Treat caseless initial like a lowercase initial.

Richard M. Stallman <rms@gnu.org>

parents: 7891

diff changeset

2294 some_nonuppercase_initial = 1;

2b7b23059f1b (Freplace_match): Treat caseless initial like a lowercase initial.

Richard M. Stallman <rms@gnu.org>

parents: 7891

diff changeset

2295 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2296

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2297 prevc = c;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2298 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2299

2393

a35d2c5cbb3b (Freplace_match): Clean up criterion about converting case.

Richard M. Stallman <rms@gnu.org>

parents: 1926

diff changeset

2300 /* Convert to all caps if the old text is all caps

a35d2c5cbb3b (Freplace_match): Clean up criterion about converting case.

Richard M. Stallman <rms@gnu.org>

parents: 1926

diff changeset

2301 and has at least one multiletter word. */

a35d2c5cbb3b (Freplace_match): Clean up criterion about converting case.

Richard M. Stallman <rms@gnu.org>

parents: 1926

diff changeset

2302 if (! some_lowercase && some_multiletter_word)

a35d2c5cbb3b (Freplace_match): Clean up criterion about converting case.

Richard M. Stallman <rms@gnu.org>

parents: 1926

diff changeset

2303 case_action = all_caps;

6679

490b7e2db978 (Freplace_match): Don't capitalize unless all matched words are capitalized.

Karl Heuer <kwzh@gnu.org>

parents: 6543

diff changeset

2304 /* Capitalize each word, if the old text has all capitalized words. */

8526

2b7b23059f1b (Freplace_match): Treat caseless initial like a lowercase initial.

Richard M. Stallman <rms@gnu.org>

parents: 7891

diff changeset

2305 else if (!some_nonuppercase_initial && some_multiletter_word)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2306 case_action = cap_initial;

8526

2b7b23059f1b (Freplace_match): Treat caseless initial like a lowercase initial.

Richard M. Stallman <rms@gnu.org>

parents: 7891

diff changeset

2307 else if (!some_nonuppercase_initial && some_uppercase)

7674

947d24fefd9e (Freplace_match): Improve capitalization heuristics.

Karl Heuer <kwzh@gnu.org>

parents: 7673

diff changeset

2308 /* Should x -> yz, operating on X, give Yz or YZ?

947d24fefd9e (Freplace_match): Improve capitalization heuristics.

Karl Heuer <kwzh@gnu.org>

parents: 7673

diff changeset

2309 We'll assume the latter. */

947d24fefd9e (Freplace_match): Improve capitalization heuristics.

Karl Heuer <kwzh@gnu.org>

parents: 7673

diff changeset

2310 case_action = all_caps;

2393

a35d2c5cbb3b (Freplace_match): Clean up criterion about converting case.

Richard M. Stallman <rms@gnu.org>

parents: 1926

diff changeset

2311 else

a35d2c5cbb3b (Freplace_match): Clean up criterion about converting case.

Richard M. Stallman <rms@gnu.org>

parents: 1926

diff changeset

2312 case_action = nochange;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2313 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2314

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2315 /* Do replacement in a string. */

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2316 if (!NILP (string))

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2317 {

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2318 Lisp_Object before, after;

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2319

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2320 before = Fsubstring (string, make_number (0),

12807

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2321 make_number (search_regs.start[sub]));

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2322 after = Fsubstring (string, make_number (search_regs.end[sub]), Qnil);

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2323

17225

739e41eed8b6 (Freplace_match): Give error if

Richard M. Stallman <rms@gnu.org>

parents: 17102

diff changeset

2324 /* Substitute parts of the match into NEWTEXT

739e41eed8b6 (Freplace_match): Give error if

Richard M. Stallman <rms@gnu.org>

parents: 17102

diff changeset

2325 if desired. */

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2326 if (NILP (literal))

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2327 {

21988

8cf3bbc89c3c (Freplace_match): Fix the loop for copying text

Richard M. Stallman <rms@gnu.org>

parents: 21945

diff changeset

2328 int lastpos = 0;

8cf3bbc89c3c (Freplace_match): Fix the loop for copying text

Richard M. Stallman <rms@gnu.org>

parents: 21945

diff changeset

2329 int lastpos_byte = 0;

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2330 /* We build up the substituted string in ACCUM. */

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2331 Lisp_Object accum;

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2332 Lisp_Object middle;

22533

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2333 int length = STRING_BYTES (XSTRING (newtext));

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2334

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2335 accum = Qnil;

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2336

22533

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2337 for (pos_byte = 0, pos = 0; pos_byte < length;)

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2338 {

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2339 int substart = -1;

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2340 int subend;

12148

a1c38b9b0f73 (Freplace_match): Do the right thing with backslash.

Karl Heuer <kwzh@gnu.org>

parents: 12147

diff changeset

2341 int delbackslash = 0;

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2342

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

2343 FETCH_STRING_CHAR_ADVANCE (c, newtext, pos, pos_byte);

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

2344

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2345 if (c == '\\')

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2346 {

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

2347 FETCH_STRING_CHAR_ADVANCE (c, newtext, pos, pos_byte);

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2348 if (c == '&')

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2349 {

12807

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2350 substart = search_regs.start[sub];

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2351 subend = search_regs.end[sub];

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2352 }

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2353 else if (c >= '1' && c <= '9' && c <= search_regs.num_regs + '0')

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2354 {

12147

9200a0e153d3 (Freplace_match): Fix check for valid reg in string replace.

Karl Heuer <kwzh@gnu.org>

parents: 12092

diff changeset

2355 if (search_regs.start[c - '0'] >= 0)

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2356 {

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2357 substart = search_regs.start[c - '0'];

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2358 subend = search_regs.end[c - '0'];

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2359 }

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2360 }

12148

a1c38b9b0f73 (Freplace_match): Do the right thing with backslash.

Karl Heuer <kwzh@gnu.org>

parents: 12147

diff changeset

2361 else if (c == '\\')

a1c38b9b0f73 (Freplace_match): Do the right thing with backslash.

Karl Heuer <kwzh@gnu.org>

parents: 12147

diff changeset

2362 delbackslash = 1;

17225

739e41eed8b6 (Freplace_match): Give error if

Richard M. Stallman <rms@gnu.org>

parents: 17102

diff changeset

2363 else

739e41eed8b6 (Freplace_match): Give error if

Richard M. Stallman <rms@gnu.org>

parents: 17102

diff changeset

2364 error ("Invalid use of `\\' in replacement text");

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2365 }

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2366 if (substart >= 0)

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2367 {

21988

8cf3bbc89c3c (Freplace_match): Fix the loop for copying text

Richard M. Stallman <rms@gnu.org>

parents: 21945

diff changeset

2368 if (pos - 2 != lastpos)

8cf3bbc89c3c (Freplace_match): Fix the loop for copying text

Richard M. Stallman <rms@gnu.org>

parents: 21945

diff changeset

2369 middle = substring_both (newtext, lastpos,

8cf3bbc89c3c (Freplace_match): Fix the loop for copying text

Richard M. Stallman <rms@gnu.org>

parents: 21945

diff changeset

2370 lastpos_byte,

8cf3bbc89c3c (Freplace_match): Fix the loop for copying text

Richard M. Stallman <rms@gnu.org>

parents: 21945

diff changeset

2371 pos - 2, pos_byte - 2);

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2372 else

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2373 middle = Qnil;

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2374 accum = concat3 (accum, middle,

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

2375 Fsubstring (string,

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

2376 make_number (substart),

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2377 make_number (subend)));

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2378 lastpos = pos;

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

2379 lastpos_byte = pos_byte;

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2380 }

12148

a1c38b9b0f73 (Freplace_match): Do the right thing with backslash.

Karl Heuer <kwzh@gnu.org>

parents: 12147

diff changeset

2381 else if (delbackslash)

a1c38b9b0f73 (Freplace_match): Do the right thing with backslash.

Karl Heuer <kwzh@gnu.org>

parents: 12147

diff changeset

2382 {

21988

8cf3bbc89c3c (Freplace_match): Fix the loop for copying text

Richard M. Stallman <rms@gnu.org>

parents: 21945

diff changeset

2383 middle = substring_both (newtext, lastpos,

8cf3bbc89c3c (Freplace_match): Fix the loop for copying text

Richard M. Stallman <rms@gnu.org>

parents: 21945

diff changeset

2384 lastpos_byte,

8cf3bbc89c3c (Freplace_match): Fix the loop for copying text

Richard M. Stallman <rms@gnu.org>

parents: 21945

diff changeset

2385 pos - 1, pos_byte - 1);

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

2386

12148

a1c38b9b0f73 (Freplace_match): Do the right thing with backslash.

Karl Heuer <kwzh@gnu.org>

parents: 12147

diff changeset

2387 accum = concat2 (accum, middle);

a1c38b9b0f73 (Freplace_match): Do the right thing with backslash.

Karl Heuer <kwzh@gnu.org>

parents: 12147

diff changeset

2388 lastpos = pos;

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

2389 lastpos_byte = pos_byte;

12148

a1c38b9b0f73 (Freplace_match): Do the right thing with backslash.

Karl Heuer <kwzh@gnu.org>

parents: 12147

diff changeset

2390 }

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2391 }

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2392

21988

8cf3bbc89c3c (Freplace_match): Fix the loop for copying text

Richard M. Stallman <rms@gnu.org>

parents: 21945

diff changeset

2393 if (pos != lastpos)

8cf3bbc89c3c (Freplace_match): Fix the loop for copying text

Richard M. Stallman <rms@gnu.org>

parents: 21945

diff changeset

2394 middle = substring_both (newtext, lastpos,

8cf3bbc89c3c (Freplace_match): Fix the loop for copying text

Richard M. Stallman <rms@gnu.org>

parents: 21945

diff changeset

2395 lastpos_byte,

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

2396 pos, pos_byte);

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2397 else

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2398 middle = Qnil;

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2399

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2400 newtext = concat2 (accum, middle);

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2401 }

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2402

17225

739e41eed8b6 (Freplace_match): Give error if

Richard M. Stallman <rms@gnu.org>

parents: 17102

diff changeset

2403 /* Do case substitution in NEWTEXT if desired. */

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2404 if (case_action == all_caps)

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2405 newtext = Fupcase (newtext);

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2406 else if (case_action == cap_initial)

12092

b932b2ed40f5 (Freplace_match): Calls to upcase_initials and upcase_initials_region changed

Karl Heuer <kwzh@gnu.org>

parents: 12069

diff changeset

2407 newtext = Fupcase_initials (newtext);

9029

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2408

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2409 return concat3 (before, newtext, after);

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2410 }

f0d89b62dd27 (Freplace_match): New 4th arg OBJECT can specify string to replace in.

Richard M. Stallman <rms@gnu.org>

parents: 8950

diff changeset

2411

18077

27a0ced43e7e (Freplace_match): Use move_if_not_intangible

Richard M. Stallman <rms@gnu.org>

parents: 17463

diff changeset

2412 /* Record point, the move (quietly) to the start of the match. */

23790

c1dbb92db43e (Freplace_match): Set OPOINT clearly for the case

Richard M. Stallman <rms@gnu.org>

parents: 22640

diff changeset

2413 if (PT >= search_regs.end[sub])

18077

27a0ced43e7e (Freplace_match): Use move_if_not_intangible

Richard M. Stallman <rms@gnu.org>

parents: 17463

diff changeset

2414 opoint = PT - ZV;

23790

c1dbb92db43e (Freplace_match): Set OPOINT clearly for the case

Richard M. Stallman <rms@gnu.org>

parents: 22640

diff changeset

2415 else if (PT > search_regs.start[sub])

c1dbb92db43e (Freplace_match): Set OPOINT clearly for the case

Richard M. Stallman <rms@gnu.org>

parents: 22640

diff changeset

2416 opoint = search_regs.end[sub] - ZV;

18077

27a0ced43e7e (Freplace_match): Use move_if_not_intangible

Richard M. Stallman <rms@gnu.org>

parents: 17463

diff changeset

2417 else

27a0ced43e7e (Freplace_match): Use move_if_not_intangible

Richard M. Stallman <rms@gnu.org>

parents: 17463

diff changeset

2418 opoint = PT;

27a0ced43e7e (Freplace_match): Use move_if_not_intangible

Richard M. Stallman <rms@gnu.org>

parents: 17463

diff changeset

2419

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

2420 TEMP_SET_PT (search_regs.start[sub]);

18077

27a0ced43e7e (Freplace_match): Use move_if_not_intangible

Richard M. Stallman <rms@gnu.org>

parents: 17463

diff changeset

2421

2655

594a33ffed85 * search.c (Freplace_match): Arrange for markers sitting at the

Jim Blandy <jimb@redhat.com>

parents: 2475

diff changeset

2422 /* We insert the replacement text before the old text, and then

594a33ffed85 * search.c (Freplace_match): Arrange for markers sitting at the

Jim Blandy <jimb@redhat.com>

parents: 2475

diff changeset

2423 delete the original text. This means that markers at the

594a33ffed85 * search.c (Freplace_match): Arrange for markers sitting at the

Jim Blandy <jimb@redhat.com>

parents: 2475

diff changeset

2424 beginning or end of the original will float to the corresponding

594a33ffed85 * search.c (Freplace_match): Arrange for markers sitting at the

Jim Blandy <jimb@redhat.com>

parents: 2475

diff changeset

2425 position in the replacement. */

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2426 if (!NILP (literal))

4882

8c09f87f5087 (Freplace_match): Fix argument names to match doc string.

Brian Fox <bfox@gnu.org>

parents: 4832

diff changeset

2427 Finsert_and_inherit (1, &newtext);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2428 else

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2429 {

22533

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2430 int length = STRING_BYTES (XSTRING (newtext));

26982

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2431 unsigned char *substed;

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2432 int substed_alloc_size, substed_len;

22533

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2433

26982

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2434 substed_alloc_size = length * 2 + 100;

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2435 substed = (unsigned char *) xmalloc (substed_alloc_size + 1);

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2436 substed_len = 0;

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2437

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2438 /* Go thru NEWTEXT, producing the actual text to insert in SUBSTED. */

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2439

22533

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2440 for (pos_byte = 0, pos = 0; pos_byte < length;)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2441 {

26982

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2442 unsigned char str[MAX_MULTIBYTE_LENGTH];

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2443 unsigned char *add_stuff;

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2444 int add_len;

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2445 int idx = -1;

2655

594a33ffed85 * search.c (Freplace_match): Arrange for markers sitting at the

Jim Blandy <jimb@redhat.com>

parents: 2475

diff changeset

2446

22533

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2447 FETCH_STRING_CHAR_ADVANCE (c, newtext, pos, pos_byte);

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2448

26982

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2449 /* Either set ADD_STUFF and ADD_LEN to the text to put in SUBSTED,

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2450 or set IDX to a match index, which means put that part

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2451 of the buffer text into SUBSTED. */

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2452

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2453 if (c == '\\')

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2454 {

22533

6eae236a4f01 (Freplace_match): Work by chars, not by bytes,

Karl Heuer <kwzh@gnu.org>

parents: 22221

diff changeset

2455 FETCH_STRING_CHAR_ADVANCE (c, newtext, pos, pos_byte);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2456 if (c == '&')

26982

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2457 idx = sub;

7856

9687141f6264 (Freplace_match): Be sure not to treat non-digit like digit.

Richard M. Stallman <rms@gnu.org>

parents: 7674

diff changeset

2458 else if (c >= '1' && c <= '9' && c <= search_regs.num_regs + '0')

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2459 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2460 if (search_regs.start[c - '0'] >= 1)

26982

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2461 idx = c - '0';

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2462 }

17225

739e41eed8b6 (Freplace_match): Give error if

Richard M. Stallman <rms@gnu.org>

parents: 17102

diff changeset

2463 else if (c == '\\')

26982

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2464 add_len = 1, add_stuff = "\\";

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2465 else

17225

739e41eed8b6 (Freplace_match): Give error if

Richard M. Stallman <rms@gnu.org>

parents: 17102

diff changeset

2466 error ("Invalid use of `\\' in replacement text");

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2467 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2468 else

26982

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2469 {

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2470 add_len = CHAR_STRING (c, str);

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2471 add_stuff = str;

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2472 }

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2473

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2474 /* If we want to copy part of a previous match,

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2475 set up ADD_STUFF and ADD_LEN to point to it. */

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2476 if (idx >= 0)

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2477 {

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2478 int begbyte = CHAR_TO_BYTE (search_regs.start[idx]);

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2479 add_len = CHAR_TO_BYTE (search_regs.end[idx]) - begbyte;

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2480 if (search_regs.start[idx] < GPT && GPT < search_regs.end[idx])

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2481 move_gap (search_regs.start[idx]);

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2482 add_stuff = BYTE_POS_ADDR (begbyte);

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2483 }

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2484

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2485 /* Now the stuff we want to add to SUBSTED

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2486 is invariably ADD_LEN bytes starting at ADD_STUFF. */

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2487

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2488 /* Make sure SUBSTED is big enough. */

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2489 if (substed_len + add_len >= substed_alloc_size)

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2490 {

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2491 substed_alloc_size = substed_len + add_len + 500;

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2492 substed = (unsigned char *) xrealloc (substed,

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2493 substed_alloc_size + 1);

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2494 }

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2495

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2496 /* Now add to the end of SUBSTED. */

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2497 bcopy (add_stuff, substed + substed_len, add_len);

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2498 substed_len += add_len;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2499 }

26982

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2500

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2501 /* Now insert what we accumulated. */

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2502 insert_and_inherit (substed, substed_len);

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2503

3527c131b069 (Freplace_match): For nonliteral replacement,

Richard M. Stallman <rms@gnu.org>

parents: 26869

diff changeset

2504 xfree (substed);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2505 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2506

16039

855c8d8ba0f0 Change all references from point to PT.

Karl Heuer <kwzh@gnu.org>

parents: 15667

diff changeset

2507 inslen = PT - (search_regs.start[sub]);

12807

34d269b30df1 (Freplace_match): New arg SUBEXP.

Richard M. Stallman <rms@gnu.org>

parents: 12244

diff changeset

2508 del_range (search_regs.start[sub] + inslen, search_regs.end[sub] + inslen);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2509

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2510 if (case_action == all_caps)

16039

855c8d8ba0f0 Change all references from point to PT.

Karl Heuer <kwzh@gnu.org>

parents: 15667

diff changeset

2511 Fupcase_region (make_number (PT - inslen), make_number (PT));

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2512 else if (case_action == cap_initial)

16039

855c8d8ba0f0 Change all references from point to PT.

Karl Heuer <kwzh@gnu.org>

parents: 15667

diff changeset

2513 Fupcase_initials_region (make_number (PT - inslen), make_number (PT));

18077

27a0ced43e7e (Freplace_match): Use move_if_not_intangible

Richard M. Stallman <rms@gnu.org>

parents: 17463

diff changeset

2514

18081

300068b4fcef (Freplace_match): Fix previous change.

Richard M. Stallman <rms@gnu.org>

parents: 18077

diff changeset

2515 newpoint = PT;

300068b4fcef (Freplace_match): Fix previous change.

Richard M. Stallman <rms@gnu.org>

parents: 18077

diff changeset

2516

18077

27a0ced43e7e (Freplace_match): Use move_if_not_intangible

Richard M. Stallman <rms@gnu.org>

parents: 17463

diff changeset

2517 /* Put point back where it was in the text. */

18124

6f2c80d2425a (Freplace_match): If opoint is 0, that's relative to ZV.

Richard M. Stallman <rms@gnu.org>

parents: 18112

diff changeset

2518 if (opoint <= 0)

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

2519 TEMP_SET_PT (opoint + ZV);

18077

27a0ced43e7e (Freplace_match): Use move_if_not_intangible

Richard M. Stallman <rms@gnu.org>

parents: 17463

diff changeset

2520 else

20545

c20c92ff4055 (looking_at_1): Use bytepos to call re_search_2.

Richard M. Stallman <rms@gnu.org>

parents: 20347

diff changeset

2521 TEMP_SET_PT (opoint);

18077

27a0ced43e7e (Freplace_match): Use move_if_not_intangible

Richard M. Stallman <rms@gnu.org>

parents: 17463

diff changeset

2522

27a0ced43e7e (Freplace_match): Use move_if_not_intangible

Richard M. Stallman <rms@gnu.org>

parents: 17463

diff changeset

2523 /* Now move point "officially" to the start of the inserted replacement. */

18081

300068b4fcef (Freplace_match): Fix previous change.

Richard M. Stallman <rms@gnu.org>

parents: 18077

diff changeset

2524 move_if_not_intangible (newpoint);

18077

27a0ced43e7e (Freplace_match): Use move_if_not_intangible

Richard M. Stallman <rms@gnu.org>

parents: 17463

diff changeset

2525

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2526 return Qnil;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2527 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2528

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2529 static Lisp_Object

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2530 match_limit (num, beginningp)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2531 Lisp_Object num;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2532 int beginningp;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2533 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2534 register int n;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2535

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2536 CHECK_NUMBER (num, 0);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2537 n = XINT (num);

621

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2538 if (n < 0 || n >= search_regs.num_regs)

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2539 args_out_of_range (num, make_number (search_regs.num_regs));

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2540 if (search_regs.num_regs <= 0

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2541 || search_regs.start[n] < 0)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2542 return Qnil;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2543 return (make_number ((beginningp) ? search_regs.start[n]

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2544 : search_regs.end[n]));

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2545 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2546

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2547 DEFUN ("match-beginning", Fmatch_beginning, Smatch_beginning, 1, 1, 0,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2548 "Return position of start of text matched by last search.\n\

14086

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2549 SUBEXP, a number, specifies which parenthesized expression in the last\n\

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2550 regexp.\n\

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2551 Value is nil if SUBEXPth pair didn't match, or there were less than\n\

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2552 SUBEXP pairs.\n\

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2553 Zero means the entire text matched by the whole regexp or whole string.")

14086

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2554 (subexp)

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2555 Lisp_Object subexp;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2556 {

14086

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2557 return match_limit (subexp, 1);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2558 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2559

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2560 DEFUN ("match-end", Fmatch_end, Smatch_end, 1, 1, 0,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2561 "Return position of end of text matched by last search.\n\

14086

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2562 SUBEXP, a number, specifies which parenthesized expression in the last\n\

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2563 regexp.\n\

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2564 Value is nil if SUBEXPth pair didn't match, or there were less than\n\

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2565 SUBEXP pairs.\n\

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2566 Zero means the entire text matched by the whole regexp or whole string.")

14086

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2567 (subexp)

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2568 Lisp_Object subexp;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2569 {

14086

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2570 return match_limit (subexp, 0);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2571 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2572

16724

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2573 DEFUN ("match-data", Fmatch_data, Smatch_data, 0, 2, 0,

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2574 "Return a list containing all info on what the last search matched.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2575 Element 2N is `(match-beginning N)'; element 2N + 1 is `(match-end N)'.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2576 All the elements are markers or nil (nil if the Nth pair didn't match)\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2577 if the last match was on a buffer; integers or nil if a string was matched.\n\

16724

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2578 Use `store-match-data' to reinstate the data in this list.\n\

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2579 \n\

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2580 If INTEGERS (the optional first argument) is non-nil, always use integers\n\

16731

039ef6e74d3a (Fmatch_data): Doc fix.

Richard M. Stallman <rms@gnu.org>

parents: 16724

diff changeset

2581 \(rather than markers) to represent buffer positions.\n\

16724

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2582 If REUSE is a list, reuse it as part of the value. If REUSE is long enough\n\

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2583 to hold all the values, and if INTEGERS is non-nil, no consing is done.")

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2584 (integers, reuse)

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2585 Lisp_Object integers, reuse;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2586 {

16724

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2587 Lisp_Object tail, prev;

621

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2588 Lisp_Object *data;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2589 int i, len;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2590

727

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2591 if (NILP (last_thing_searched))

15667

9531c03134b6 (Fmatch_data): If no matching done yet, return Qnil.

Karl Heuer <kwzh@gnu.org>

parents: 14186

diff changeset

2592 return Qnil;

727

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2593

621

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2594 data = (Lisp_Object *) alloca ((2 * search_regs.num_regs)

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2595 * sizeof (Lisp_Object));

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2596

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2597 len = -1;

621

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2598 for (i = 0; i < search_regs.num_regs; i++)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2599 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2600 int start = search_regs.start[i];

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2601 if (start >= 0)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2602 {

16724

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2603 if (EQ (last_thing_searched, Qt)

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2604 || ! NILP (integers))

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2605 {

9319

7969182b6cc6 (skip_chars, Fmatch_data, Fstore_match_data): Don't use XFASTINT as an lvalue.

Karl Heuer <kwzh@gnu.org>

parents: 9278

diff changeset

2606 XSETFASTINT (data[2 * i], start);

7969182b6cc6 (skip_chars, Fmatch_data, Fstore_match_data): Don't use XFASTINT as an lvalue.

Karl Heuer <kwzh@gnu.org>

parents: 9278

diff changeset

2607 XSETFASTINT (data[2 * i + 1], search_regs.end[i]);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2608 }

9113

766b6288e0f2 (Fmatch_data, Fstore_match_data): Use type test macros.

Karl Heuer <kwzh@gnu.org>

parents: 9029

diff changeset

2609 else if (BUFFERP (last_thing_searched))

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2610 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2611 data[2 * i] = Fmake_marker ();

727

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2612 Fset_marker (data[2 * i],

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2613 make_number (start),

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2614 last_thing_searched);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2615 data[2 * i + 1] = Fmake_marker ();

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2616 Fset_marker (data[2 * i + 1],

727

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2617 make_number (search_regs.end[i]),

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2618 last_thing_searched);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2619 }

727

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2620 else

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2621 /* last_thing_searched must always be Qt, a buffer, or Qnil. */

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2622 abort ();

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2623

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2624 len = i;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2625 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2626 else

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2627 data[2 * i] = data [2 * i + 1] = Qnil;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2628 }

16724

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2629

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2630 /* If REUSE is not usable, cons up the values and return them. */

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2631 if (! CONSP (reuse))

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2632 return Flist (2 * len + 2, data);

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2633

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2634 /* If REUSE is a list, store as many value elements as will fit

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2635 into the elements of REUSE. */

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2636 for (i = 0, tail = reuse; CONSP (tail);

25663

a5eaace0fa01 Use XCAR and XCDR instead of explicit member access.

Ken Raeburn <raeburn@raeburn.org>

parents: 25441

diff changeset

2637 i++, tail = XCDR (tail))

16724

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2638 {

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2639 if (i < 2 * len + 2)

25663

a5eaace0fa01 Use XCAR and XCDR instead of explicit member access.

Ken Raeburn <raeburn@raeburn.org>

parents: 25441

diff changeset

2640 XCAR (tail) = data[i];

16724

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2641 else

25663

a5eaace0fa01 Use XCAR and XCDR instead of explicit member access.

Ken Raeburn <raeburn@raeburn.org>

parents: 25441

diff changeset

2642 XCAR (tail) = Qnil;

16724

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2643 prev = tail;

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2644 }

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2645

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2646 /* If we couldn't fit all value elements into REUSE,

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2647 cons up the rest of them and add them to the end of REUSE. */

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2648 if (i < 2 * len + 2)

25663

a5eaace0fa01 Use XCAR and XCDR instead of explicit member access.

Ken Raeburn <raeburn@raeburn.org>

parents: 25441

diff changeset

2649 XCDR (prev) = Flist (2 * len + 2 - i, data + i);

16724

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2650

4b1fb372a4fe (Fmatch_data): New args INTEGERS and REUSE.

Richard M. Stallman <rms@gnu.org>

parents: 16275

diff changeset

2651 return reuse;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2652 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2653

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2654

21171

60f6085df198 (Fset_match_data): Renamed from Fstore_match_data.

Richard M. Stallman <rms@gnu.org>

parents: 21117

diff changeset

2655 DEFUN ("set-match-data", Fset_match_data, Sset_match_data, 1, 1, 0,

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2656 "Set internal data on last search match from elements of LIST.\n\

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2657 LIST should have been created by calling `match-data' previously.")

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2658 (list)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2659 register Lisp_Object list;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2660 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2661 register int i;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2662 register Lisp_Object marker;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2663

10032

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2664 if (running_asynch_code)

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2665 save_search_regs ();

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2666

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2667 if (!CONSP (list) && !NILP (list))

1926

952f2a18f83d * callint.c (Fcall_interactively): Pass the correct number of

Jim Blandy <jimb@redhat.com>

parents: 1896

diff changeset

2668 list = wrong_type_argument (Qconsp, list);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2669

727

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2670 /* Unless we find a marker with a buffer in LIST, assume that this

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2671 match data came from a string. */

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2672 last_thing_searched = Qt;

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2673

621

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2674 /* Allocate registers if they don't already exist. */

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2675 {

1523

bd61aaa7828b * search.c (Fstore_match_data): Don't assume Flength returns an

Jim Blandy <jimb@redhat.com>

parents: 1413

diff changeset

2676 int length = XFASTINT (Flength (list)) / 2;

621

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2677

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2678 if (length > search_regs.num_regs)

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2679 {

708

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2680 if (search_regs.num_regs == 0)

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2681 {

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2682 search_regs.start

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2683 = (regoff_t *) xmalloc (length * sizeof (regoff_t));

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2684 search_regs.end

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2685 = (regoff_t *) xmalloc (length * sizeof (regoff_t));

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2686 }

621

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2687 else

708

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2688 {

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2689 search_regs.start

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2690 = (regoff_t *) xrealloc (search_regs.start,

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2691 length * sizeof (regoff_t));

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2692 search_regs.end

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2693 = (regoff_t *) xrealloc (search_regs.end,

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2694 length * sizeof (regoff_t));

030fb4635335 *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 648

diff changeset

2695 }

621

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2696

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

2697 search_regs.num_regs = length;

621

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2698 }

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2699 }

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2700

eca8812e61cd *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 605

diff changeset

2701 for (i = 0; i < search_regs.num_regs; i++)

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2702 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2703 marker = Fcar (list);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2704 if (NILP (marker))

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2705 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2706 search_regs.start[i] = -1;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2707 list = Fcdr (list);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2708 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2709 else

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2710 {

9113

766b6288e0f2 (Fmatch_data, Fstore_match_data): Use type test macros.

Karl Heuer <kwzh@gnu.org>

parents: 9029

diff changeset

2711 if (MARKERP (marker))

727

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2712 {

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2713 if (XMARKER (marker)->buffer == 0)

9319

7969182b6cc6 (skip_chars, Fmatch_data, Fstore_match_data): Don't use XFASTINT as an lvalue.

Karl Heuer <kwzh@gnu.org>

parents: 9278

diff changeset

2714 XSETFASTINT (marker, 0);

727

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2715 else

9278

f2138d548313 (Flooking_at, skip_chars, search_buffer, set_search_regs, Fstore_match_data):

Karl Heuer <kwzh@gnu.org>

parents: 9113

diff changeset

2716 XSETBUFFER (last_thing_searched, XMARKER (marker)->buffer);

727

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2717 }

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2718

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2719 CHECK_NUMBER_COERCE_MARKER (marker, 0);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2720 search_regs.start[i] = XINT (marker);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2721 list = Fcdr (list);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2722

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2723 marker = Fcar (list);

9113

766b6288e0f2 (Fmatch_data, Fstore_match_data): Use type test macros.

Karl Heuer <kwzh@gnu.org>

parents: 9029

diff changeset

2724 if (MARKERP (marker) && XMARKER (marker)->buffer == 0)

9319

7969182b6cc6 (skip_chars, Fmatch_data, Fstore_match_data): Don't use XFASTINT as an lvalue.

Karl Heuer <kwzh@gnu.org>

parents: 9278

diff changeset

2725 XSETFASTINT (marker, 0);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2726

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2727 CHECK_NUMBER_COERCE_MARKER (marker, 0);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2728 search_regs.end[i] = XINT (marker);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2729 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2730 list = Fcdr (list);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2731 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2732

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2733 return Qnil;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2734 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2735

10032

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2736 /* If non-zero the match data have been saved in saved_search_regs

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2737 during the execution of a sentinel or filter. */

10128

59ccd063e016 (search_regs_saved): Delete initializer.

Richard M. Stallman <rms@gnu.org>

parents: 10055

diff changeset

2738 static int search_regs_saved;

10032

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2739 static struct re_registers saved_search_regs;

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2740

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2741 /* Called from Flooking_at, Fstring_match, search_buffer, Fstore_match_data

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2742 if asynchronous code (filter or sentinel) is running. */

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2743 static void

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2744 save_search_regs ()

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2745 {

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2746 if (!search_regs_saved)

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2747 {

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2748 saved_search_regs.num_regs = search_regs.num_regs;

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2749 saved_search_regs.start = search_regs.start;

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2750 saved_search_regs.end = search_regs.end;

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2751 search_regs.num_regs = 0;

10250

422c3b96efda (set_search_regs): Really set search_regs.start and .end.

Richard M. Stallman <rms@gnu.org>

parents: 10141

diff changeset

2752 search_regs.start = 0;

422c3b96efda (set_search_regs): Really set search_regs.start and .end.

Richard M. Stallman <rms@gnu.org>

parents: 10141

diff changeset

2753 search_regs.end = 0;

10032

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2754

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2755 search_regs_saved = 1;

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2756 }

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2757 }

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2758

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2759 /* Called upon exit from filters and sentinels. */

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2760 void

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2761 restore_match_data ()

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2762 {

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2763 if (search_regs_saved)

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2764 {

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2765 if (search_regs.num_regs > 0)

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2766 {

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2767 xfree (search_regs.start);

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2768 xfree (search_regs.end);

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2769 }

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2770 search_regs.num_regs = saved_search_regs.num_regs;

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2771 search_regs.start = saved_search_regs.start;

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2772 search_regs.end = saved_search_regs.end;

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2773

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2774 search_regs_saved = 0;

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2775 }

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2776 }

f689803caa92 Added code for automatically saving and restoring the match data

Francesco Potortì <pot@gnu.org>

parents: 10020

diff changeset

2777

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2778 /* Quote a string to inactivate reg-expr chars */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2779

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2780 DEFUN ("regexp-quote", Fregexp_quote, Sregexp_quote, 1, 1, 0,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2781 "Return a regexp string which matches exactly STRING and nothing else.")

14086

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2782 (string)

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2783 Lisp_Object string;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2784 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2785 register unsigned char *in, *out, *end;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2786 register unsigned char *temp;

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

2787 int backslashes_added = 0;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2788

14086

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2789 CHECK_STRING (string, 0);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2790

21244

50929073a0ba Use STRING_BYTES and SET_STRING_BYTES.

Richard M. Stallman <rms@gnu.org>

parents: 21171

diff changeset

2791 temp = (unsigned char *) alloca (STRING_BYTES (XSTRING (string)) * 2);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2792

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2793 /* Now copy the data into the new string, inserting escapes. */

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2794

14086

a410808fda15 (Fmatch_end, Fregexp_quote): Harmonize arguments with documentation.

Erik Naggum <erik@naggum.no>

parents: 14036

diff changeset

2795 in = XSTRING (string)->data;

21244

50929073a0ba Use STRING_BYTES and SET_STRING_BYTES.

Richard M. Stallman <rms@gnu.org>

parents: 21171

diff changeset

2796 end = in + STRING_BYTES (XSTRING (string));

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2797 out = temp;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2798

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2799 for (; in != end; in++)

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2800 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2801 if (*in == '[' || *in == ']'

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2802 || *in == '*' || *in == '.' || *in == '\\'

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2803 || *in == '?' || *in == '+'

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2804 || *in == '^' || *in == '$')

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

2805 *out++ = '\\', backslashes_added++;

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2806 *out++ = *in;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2807 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2808

21248

aba5e1c3328b (Fregexp_quote): Use make_specified_string.

Richard M. Stallman <rms@gnu.org>

parents: 21244

diff changeset

2809 return make_specified_string (temp,

20588

138c95482e6b (search_buffer): Handle bytes vs chars in non-RE case.

Richard M. Stallman <rms@gnu.org>

parents: 20547

diff changeset

2810 XSTRING (string)->size + backslashes_added,

21248

aba5e1c3328b (Fregexp_quote): Use make_specified_string.

Richard M. Stallman <rms@gnu.org>

parents: 21244

diff changeset

2811 out - temp,

aba5e1c3328b (Fregexp_quote): Use make_specified_string.

Richard M. Stallman <rms@gnu.org>

parents: 21244

diff changeset

2812 STRING_MULTIBYTE (string));

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2813 }

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2814

21514

fa9ff387d260 Fix -Wimplicit warnings.

Andreas Schwab <schwab@suse.de>

parents: 21457

diff changeset

2815 void

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2816 syms_of_search ()

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2817 {

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2818 register int i;

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2819

9605

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

2820 for (i = 0; i < REGEXP_CACHE_SIZE; ++i)

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

2821 {

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

2822 searchbufs[i].buf.allocated = 100;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

2823 searchbufs[i].buf.buffer = (unsigned char *) malloc (100);

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

2824 searchbufs[i].buf.fastmap = searchbufs[i].fastmap;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

2825 searchbufs[i].regexp = Qnil;

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

2826 staticpro (&searchbufs[i].regexp);

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

2827 searchbufs[i].next = (i == REGEXP_CACHE_SIZE-1 ? 0 : &searchbufs[i+1]);

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

2828 }

cf97e75d8e02 (searchbufs): New variable, replaces searchbuf and last_regexp and

Karl Heuer <kwzh@gnu.org>

parents: 9452

diff changeset

2829 searchbuf_head = &searchbufs[0];

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2830

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2831 Qsearch_failed = intern ("search-failed");

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2832 staticpro (&Qsearch_failed);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2833 Qinvalid_regexp = intern ("invalid-regexp");

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2834 staticpro (&Qinvalid_regexp);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2835

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2836 Fput (Qsearch_failed, Qerror_conditions,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2837 Fcons (Qsearch_failed, Fcons (Qerror, Qnil)));

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2838 Fput (Qsearch_failed, Qerror_message,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2839 build_string ("Search failed"));

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2840

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2841 Fput (Qinvalid_regexp, Qerror_conditions,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2842 Fcons (Qinvalid_regexp, Fcons (Qerror, Qnil)));

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2843 Fput (Qinvalid_regexp, Qerror_message,

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2844 build_string ("Invalid regexp"));

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2845

727

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2846 last_thing_searched = Qnil;

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2847 staticpro (&last_thing_searched);

540b047ece4d *** empty log message ***

Jim Blandy <jimb@redhat.com>

parents: 708

diff changeset

2848

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2849 defsubr (&Slooking_at);

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2850 defsubr (&Sposix_looking_at);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2851 defsubr (&Sstring_match);

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2852 defsubr (&Sposix_string_match);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2853 defsubr (&Ssearch_forward);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2854 defsubr (&Ssearch_backward);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2855 defsubr (&Sword_search_forward);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2856 defsubr (&Sword_search_backward);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2857 defsubr (&Sre_search_forward);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2858 defsubr (&Sre_search_backward);

10020

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2859 defsubr (&Sposix_search_forward);

c41ce96785a8 (struct regexp_cache): New field `posix'.

Richard M. Stallman <rms@gnu.org>

parents: 9605

diff changeset

2860 defsubr (&Sposix_search_backward);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2861 defsubr (&Sreplace_match);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2862 defsubr (&Smatch_beginning);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2863 defsubr (&Smatch_end);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2864 defsubr (&Smatch_data);

21171

60f6085df198 (Fset_match_data): Renamed from Fstore_match_data.

Richard M. Stallman <rms@gnu.org>

parents: 21117

diff changeset

2865 defsubr (&Sset_match_data);

603

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2866 defsubr (&Sregexp_quote);

470f556a9453 Initial revision

Jim Blandy <jimb@redhat.com>

parents:

diff changeset

2867 }

Mercurial > emacs

annotate src/search.c @ 27491:f39592a09195