xemacs-beta: src/tests.c comparison

comparison src/tests.c @ 5776:65d65b52d608

Pass character count from coding systems to buffer insertion code. src/ChangeLog addition: 2014-01-16 Aidan Kehoe <kehoea@parhasard.net> Pass character count information from the no-conversion and unicode coding systems to the buffer insertion code, making #'find-file on large buffers a little snappier (if ERROR_CHECK_TEXT is not defined). * file-coding.c: * file-coding.c (coding_character_tell): New. * file-coding.c (conversion_coding_stream_description): New. * file-coding.c (no_conversion_convert): Update characters_seen when decoding. * file-coding.c (no_conversion_character_tell): New. * file-coding.c (lstream_type_create_file_coding): Create the no_conversion type with data. * file-coding.c (coding_system_type_create): Make the character_tell method available here. * file-coding.h: * file-coding.h (struct coding_system_methods): Add a new character_tell() method, passing charcount information from the coding systems to the buffer code, avoiding duplicate bytecount-to-charcount work especially with large buffers. * fileio.c (Finsert_file_contents_internal): Update this to pass charcount information to buffer_insert_string_1(), if that is available from the lstream code. * insdel.c: * insdel.c (buffer_insert_string_1): Add a new CCLEN argument, giving the character count of the string to insert. It can be -1 to indicate that te function should work it out itself using bytecount_to_charcount(), as it used to. * insdel.c (buffer_insert_raw_string_1): * insdel.c (buffer_insert_lisp_string_1): * insdel.c (buffer_insert_ascstring_1): * insdel.c (buffer_insert_emacs_char_1): * insdel.c (buffer_insert_from_buffer_1): * insdel.c (buffer_replace_char): Update these functions to use the new calling convention. * insdel.h: * insdel.h (buffer_insert_string): Update this header to reflect the new buffer_insert_string_1() argument. * lstream.c (Lstream_character_tell): New. Return the number of characters *read* and seen by the consumer so far, taking into account the unget buffer, and buffered reading. * lstream.c (Lstream_unread): Update unget_character_count here as appropriate. * lstream.c (Lstream_rewind): Reset unget_character_count here too. * lstream.h: * lstream.h (struct lstream): Provide the character_tell method, add a new field, unget_character_count, giving the number of characters ever passed to Lstream_unread(). Declare Lstream_character_tell(). Make Lstream_ungetc(), which happens to be unused, an inline function rather than a macro, in the course of updating it to modify unget_character_count. * print.c (output_string): Use the new argument to buffer_insert_string_1(). * tests.c: * tests.c (Ftest_character_tell): New test function. * tests.c (syms_of_tests): Make it available. * unicode.c: * unicode.c (struct unicode_coding_stream): * unicode.c (unicode_character_tell): New method. * unicode.c (unicode_convert): Update the character counter as appropriate. * unicode.c (coding_system_type_create_unicode): Make the character_tell method available.

author	Aidan Kehoe <kehoea@parhasard.net>
date	Thu, 16 Jan 2014 16:27:52 +0000
parents	56144c8593a8
children	e2fae7783046

comparison

equal deleted inserted replaced

-:4004c3266c09
+:65d65b52d608
 DFC_CHECK_DATA (ptr, len, ext_dos, "DOS Lisp opaque, ALLOCA, binary");
 NUNGCPRO;
 UNGCPRO;
 return conversion_result;
+}
+DEFUN ("test-character-tell", Ftest_character_tell, 0, 0, "", /*
+Return list of results of tests of the stream character offset code.
+For use by the automated test suite.  See tests/automated/c-tests.
+Each element is a list (DESCRIPTION, STATUS, REASON).
+DESCRIPTION is a string describing the test.
+STATUS is a symbol, either t (pass) or nil (fail).
+REASON is nil or a string describing the failure (not required).
+*/
+())
+{
+Extbyte ext_unix[]= "\n\nfoo\nbar\n\nf\372b\343\340\nfoo\nbar\n";
+/* Previous string in UTF-8. */
+Extbyte ext_utf_8_unix[]
+= "\n\nfoo\nbar\n\nf\303\272b\303\243\303\240\nfoo\nbar\n";
+Charcount ext_utf_8_unix_char_len = 25;
+Ibyte shortbuf[13], longbuf[512];
+Lisp_Object stream =
+make_fixed_buffer_input_stream (ext_unix, sizeof (ext_unix) - 1);
+Lisp_Object result = Qnil, string = Qnil;
+Charcount count;
+Bytecount bytecount;
+struct gcpro gcpro1, gcpro2, gcpro3;
+#define CHARACTER_TELL_ASSERT(assertion, description, failing_case) \
+do                                                                \
+{                                                               \
+if (assertion)                                                  \
+result = Fcons (list3 (build_cistring (description),          \
+Qt, Qnil), result);                    \
+else                                                            \
+result = Fcons (list3 (build_cistring (description),          \
+Qnil, build_ascstring (failing_case)), \
+result);                                      \
+}                                                               \
+while (0)
+GCPRO3 (stream, result, string);
+Lstream_set_buffering (XLSTREAM (stream), LSTREAM_BLOCKN_BUFFERED, 65536);
+stream = make_coding_input_stream
+(XLSTREAM (stream), Ffind_coding_system (intern ("no-conversion-unix")),
+CODING_DECODE, 0);
+Lstream_set_buffering (XLSTREAM (stream), LSTREAM_BLOCKN_BUFFERED, 65536);
+bytecount = Lstream_read (XLSTREAM (stream), longbuf, sizeof (longbuf));
+CHARACTER_TELL_ASSERT (Lstream_character_tell (XLSTREAM (stream))
+== sizeof (ext_unix) -1,
+"basic character tell, no-conversion-unix",
+"basic character tell failed");
+string = build_extstring (ext_unix,
+Ffind_coding_system (intern
+("no-conversion-unix")));
+CHARACTER_TELL_ASSERT (Lstream_character_tell (XLSTREAM (stream))
+== string_char_length (string),
+"repeat basic character tell, no-conversion-unix",
+"repeat basic character tell failed with string");
+count = Lstream_character_tell (XLSTREAM (stream));
+Lstream_unread (XLSTREAM (stream), "r\n", 2);
+/* This should give the same result as before the unread. */
+CHARACTER_TELL_ASSERT (Lstream_character_tell (XLSTREAM (stream))
+== count, "checking post-unread character tell",
+"post-unread character tell failed");
+bytecount += Lstream_read (XLSTREAM (stream), longbuf + bytecount,
+sizeof (longbuf) - bytecount);
+CHARACTER_TELL_ASSERT (Lstream_character_tell (XLSTREAM (stream))
+== count + 2,
+"checking post-unread+read character tell",
+"post-unread+read character tell failed");
+/* This seems to be buggy for my purposes. */
+/* Lstream_rewind (XLSTREAM (stream)); */
+Lstream_close (XLSTREAM (stream));
+Lstream_delete (XLSTREAM (stream));
+stream = make_fixed_buffer_input_stream (ext_unix, sizeof (ext_unix) - 1);
+Lstream_set_buffering (XLSTREAM (stream), LSTREAM_BLOCKN_BUFFERED, 65536);
+Lstream_unset_character_mode (XLSTREAM (stream));
+stream = make_coding_input_stream
+(XLSTREAM (stream), Ffind_coding_system (intern ("no-conversion-unix")),
+CODING_DECODE, 0);
+Lstream_set_buffering (XLSTREAM (stream), LSTREAM_BLOCKN_BUFFERED, 65536);
+Lstream_unset_character_mode (XLSTREAM (stream));
+bytecount = Lstream_read (XLSTREAM (stream), shortbuf, sizeof (shortbuf));
+CHARACTER_TELL_ASSERT (Lstream_character_tell (XLSTREAM (stream))
+/* This should be equal to sizeof (shortbuf) on
+non-mule. */
+== sizeof (shortbuf) - !(byte_ascii_p (0xff)),
+"character tell with short read, no-conversion-unix",
+"short read character tell failed");
+Lstream_close (XLSTREAM (stream));
+Lstream_delete (XLSTREAM (stream));
+stream
+= make_fixed_buffer_input_stream (ext_utf_8_unix,
+sizeof (ext_utf_8_unix) - 1);
+Lstream_set_buffering (XLSTREAM (stream), LSTREAM_BLOCKN_BUFFERED, 65536);
+stream = make_coding_input_stream
+(XLSTREAM (stream), Ffind_coding_system (intern ("utf-8-unix")),
+CODING_DECODE, 0);
+Lstream_set_buffering (XLSTREAM (stream), LSTREAM_BLOCKN_BUFFERED, 65536);
+bytecount = Lstream_read (XLSTREAM (stream), longbuf, sizeof (longbuf));
+CHARACTER_TELL_ASSERT (Lstream_character_tell (XLSTREAM (stream))
+== ext_utf_8_unix_char_len,
+"utf-8 character tell, utf-8-unix",
+"utf-8 character tell failed");
+string = build_extstring (ext_utf_8_unix,
+Ffind_coding_system (intern
+("utf-8-unix")));
+CHARACTER_TELL_ASSERT (Lstream_character_tell (XLSTREAM (stream))
+== string_char_length (string),
+"repeat utf-8 character tell, utf-8-unix",
+"repeat utf-8 character tell failed with string");
+count = Lstream_character_tell (XLSTREAM (stream));
+Lstream_unread (XLSTREAM (stream), "r\n", 2);
+/* This should give the same result as before the unread. */
+CHARACTER_TELL_ASSERT (Lstream_character_tell (XLSTREAM (stream))
+== count, "checking post-unread utf-8 tell",
+"post-unread utf-8 tell failed");
+bytecount += Lstream_read (XLSTREAM (stream), longbuf + bytecount,
+sizeof (longbuf) - bytecount);
+CHARACTER_TELL_ASSERT (Lstream_character_tell (XLSTREAM (stream))
+== count + 2,
+"checking post-unread+read utf-8 tell",
+"post-unread+read utf-8 tell failed");
+/* This seems to be buggy for my purposes. */
+/* Lstream_rewind (XLSTREAM (stream)); */
+Lstream_close (XLSTREAM (stream));
+Lstream_delete (XLSTREAM (stream));
+stream = make_fixed_buffer_input_stream (ext_utf_8_unix, sizeof (ext_utf_8_unix) - 1);
+Lstream_set_buffering (XLSTREAM (stream), LSTREAM_BLOCKN_BUFFERED, 65536);
+Lstream_set_character_mode (XLSTREAM (stream));
+stream = make_coding_input_stream
+(XLSTREAM (stream), Ffind_coding_system (intern ("utf-8-unix")),
+CODING_DECODE, 0);
+Lstream_set_buffering (XLSTREAM (stream), LSTREAM_BLOCKN_BUFFERED, 65536);
+Lstream_set_character_mode (XLSTREAM (stream));
+bytecount = Lstream_read (XLSTREAM (stream), shortbuf, sizeof (shortbuf));
+CHARACTER_TELL_ASSERT
+(bytecount == (sizeof (shortbuf) - 1),
+"utf-8 Lstream_read, character mode, checking partial char not read",
+"partial char appars to have been read when it shouldn't");
+CHARACTER_TELL_ASSERT
+(Lstream_character_tell (XLSTREAM (stream))
+/* This is shorter, because it's in the middle of a character. */
+== sizeof (shortbuf) - 1,
+"utf-8 tell with short read, character mode, utf-8-unix",
+"utf-8 read character tell, character mode failed");
+Lstream_close (XLSTREAM (stream));
+Lstream_delete (XLSTREAM (stream));
+UNGCPRO;
+return result;
 }
 /* Hash Table testing */
 syms_of_tests (void)
 {
 Vtest_function_list = Qnil;
 TESTS_DEFSUBR (Ftest_data_format_conversion);
+TESTS_DEFSUBR (Ftest_character_tell);
 TESTS_DEFSUBR (Ftest_hash_tables);
 TESTS_DEFSUBR (Ftest_store_void_in_lisp);
 /* Add other test functions here with TESTS_DEFSUBR */
 }

Mercurial > hg > xemacs-beta

comparison src/tests.c @ 5776:65d65b52d608