annotate src/unexencap.c @ 4407:4ee73bbe4f8e

Always use boyer_moore in ASCII or Latin-1 buffers with ASCII search strings. 2007-12-26 Aidan Kehoe <kehoea@parhasard.net> * casetab.c: Extend and correct some case table documentation. * search.c (search_buffer): Correct a bug where only the first entry for a character in the case equivalence table was examined in determining if the Boyer-Moore search algorithm is appropriate. If there are case mappings outside of the charset and row of the characters specified in the search string, those case mappings can be safely ignored (and Boyer-Moore search can be used) if we know from the buffer statistics that the corresponding characters cannot occur. * search.c (boyer_moore): Assert that we haven't been passed a string with varying character sets or rows within character sets. That's what simple_search is for. In the very rare event that a character in the search string has a canonical case mapping that is not in the same character set and row, don't try to search for the canonical character, search for some other character that is in the desired character set and row. Assert that the case table isn't corrupt. Do not search for any character case mappings that cannot possibly occur in the buffer, given the buffer metadata about its contents.
author Aidan Kehoe <kehoea@parhasard.net>
date Wed, 26 Dec 2007 17:30:16 +0100
parents 04bc9d2f42c7
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
1 /* Waiting for papers! */
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
2
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
3 /* Synched up with: FSF 19.31. */
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
4
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
5 /*
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
6 * Do an unexec() for coff encapsulation. Uses the approach I took
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
7 * for AKCL, so don't be surprised if it doesn't look too much like
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
8 * the other unexec() routines. Assumes NO_REMAP. Should be easy to
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
9 * adapt to the emacs style unexec() if that is desired, but this works
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
10 * just fine for me with GCC/GAS/GLD under System V. - Jordan
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
11 */
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
12
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
13 #include <sys/types.h>
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
14 #include <sys/fcntl.h>
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
15 #include <sys/file.h>
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
16 #include <stdio.h>
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
17 #include "/usr/gnu/lib/gcc/gcc-include/a.out.h"
2286
04bc9d2f42c7 [xemacs-hg @ 2004-09-20 19:18:55 by james]
james
parents: 0
diff changeset
18 #include "compiler.h"
0
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
19
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
/* Copy N bytes from the current position of FROM to the current
   position of TO, going through a BUFSIZ-sized stack buffer.

   A non-positive N copies nothing.  If FROM runs out of data early,
   the bytes that were actually read are still written, and nothing
   beyond them is (a short read never causes stale buffer contents to
   be emitted).

   Returns 0 when all N bytes were copied, -1 on a short read or a
   short write.  */
int
filecpy (FILE *to, FILE *from, int n)
{
  char buffer[BUFSIZ];

  while (n > 0)
    {
      size_t want = n > BUFSIZ ? (size_t) BUFSIZ : (size_t) n;
      size_t got = fread (buffer, 1, want, from);

      /* Only ever write what fread really delivered.  */
      if (got > 0 && fwrite (buffer, 1, got, to) != got)
        return -1;

      /* EOF or read error before the requested count was reached.  */
      if (got < want)
        return -1;

      n -= (int) got;
    }

  return 0;
}
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
38 /* ****************************************************************
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
39 * unexec
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
40 *
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
41 * driving logic.
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
42 * ****************************************************************/
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
43 unexec (new_name, a_name, data_start, bss_start, entry_address)
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
44 char *new_name, *a_name;
2286
04bc9d2f42c7 [xemacs-hg @ 2004-09-20 19:18:55 by james]
james
parents: 0
diff changeset
45 unsigned UNUSED (data_start);
04bc9d2f42c7 [xemacs-hg @ 2004-09-20 19:18:55 by james]
james
parents: 0
diff changeset
46 unsigned UNUSED (bss_start);
04bc9d2f42c7 [xemacs-hg @ 2004-09-20 19:18:55 by james]
james
parents: 0
diff changeset
47 unsigned UNUSED (entry_address);
0
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
48 {
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
49 struct coffheader header1;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
50 struct coffscn *tp, *dp, *bp;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
51 struct exec header;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
52 int stsize;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
53 char *original_file = a_name;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
54 char *save_file = new_name;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
55
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
56 char *data_begin, *data_end;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
57 int original_data;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
58 FILE *original, *save;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
59 int n;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
60 char *p;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
61 extern char *sbrk();
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
62 char stdin_buf[BUFSIZ], stdout_buf[BUFSIZ];
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
63
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
64
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
65 fclose(stdin);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
66 original = fopen(original_file, "r");
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
67 if (stdin != original || original->_file != 0) {
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
68 fprintf(stderr, "unexec: Can't open the original file.\n");
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
69 exit(1);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
70 }
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
71 setbuf(original, stdin_buf);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
72 fclose(stdout);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
73 unlink(save_file);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
74 n = open (save_file, O_CREAT|O_WRONLY, 0777);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
75 if (n != 1 || (save = fdopen(n, "w")) != stdout) {
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
76 fprintf(stderr, "unexec: Can't open the save file.\n");
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
77 exit(1);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
78 }
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
79 setbuf(save, stdout_buf);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
80
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
81 fread(&header1, sizeof(header1), 1, original);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
82 tp = &header1.scns[0];
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
83 dp = &header1.scns[1];
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
84 bp = &header1.scns[2];
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
85 fread(&header, sizeof(header), 1, original);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
86 data_begin=(char *)N_DATADDR(header);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
87 data_end = sbrk(0);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
88 original_data = header.a_data;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
89 header.a_data = data_end - data_begin;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
90 header.a_bss = 0;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
91 dp->s_size = header.a_data;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
92 bp->s_paddr = dp->s_vaddr + dp->s_size;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
93 bp->s_vaddr = bp->s_paddr;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
94 bp->s_size = 0;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
95 header1.tsize = tp->s_size;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
96 header1.dsize = dp->s_size;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
97 header1.bsize = bp->s_size;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
98 fwrite(&header1, sizeof(header1), 1, save);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
99 fwrite(&header, sizeof(header), 1, save);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
100
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
101 filecpy(save, original, header.a_text);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
102
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
103 for (n = header.a_data, p = data_begin; ; n -= BUFSIZ, p += BUFSIZ)
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
104 if (n > BUFSIZ)
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
105 fwrite(p, BUFSIZ, 1, save);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
106 else if (n > 0) {
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
107 fwrite(p, 1, n, save);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
108 break;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
109 } else
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
110 break;
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
111
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
112 fseek(original, original_data, 1);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
113
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
114 filecpy(save, original, header.a_syms+header.a_trsize+header.a_drsize);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
115 fread(&stsize, sizeof(stsize), 1, original);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
116 fwrite(&stsize, sizeof(stsize), 1, save);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
117 filecpy(save, original, stsize - sizeof(stsize));
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
118
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
119 fclose(original);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
120 fclose(save);
376386a54a3c Import from CVS: tag r19-14
cvs
parents:
diff changeset
121 }