/* Lisp parsing and input streams.

Copyright (C) 1985-1989, 1993-1995, 1997-2016 Free Software Foundation,
Inc.

This file is part of GNU Emacs.

GNU Emacs is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or (at
your option) any later version.

GNU Emacs is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with GNU Emacs.  If not, see <http://www.gnu.org/licenses/>.  */

21 22
/* Tell globals.h to define tables needed by init_obarray.  */
#define DEFINE_SYMBOLS
Jim Blandy's avatar
Jim Blandy committed
23

Richard M. Stallman's avatar
Richard M. Stallman committed
24
#include <config.h>
25
#include "sysstdio.h"
Jim Blandy's avatar
Jim Blandy committed
26 27 28
#include <sys/types.h>
#include <sys/stat.h>
#include <sys/file.h>
29
#include <errno.h>
30
#include <math.h>
31
#include <stat-time.h>
Jim Blandy's avatar
Jim Blandy committed
32
#include "lisp.h"
33
#include "dispextern.h"
34
#include "intervals.h"
Kenichi Handa's avatar
Kenichi Handa committed
35
#include "character.h"
36
#include "buffer.h"
Karl Heuer's avatar
Karl Heuer committed
37
#include "charset.h"
38
#include <epaths.h>
Jim Blandy's avatar
Jim Blandy committed
39
#include "commands.h"
Jim Blandy's avatar
Jim Blandy committed
40
#include "keyboard.h"
41
#include "systime.h"
42
#include "termhooks.h"
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
43
#include "blockinput.h"
44
#include <c-ctype.h>
Jim Blandy's avatar
Jim Blandy committed
45

46 47
#ifdef MSDOS
#include "msdos.h"
Eli Zaretskii's avatar
Eli Zaretskii committed
48 49 50 51
#if __DJGPP__ == 2 && __DJGPP_MINOR__ < 5
# define INFINITY  __builtin_inf()
# define NAN       __builtin_nan("")
#endif
52 53
#endif

54 55 56 57
#ifdef HAVE_NS
#include "nsterm.h"
#endif

Andreas Schwab's avatar
Andreas Schwab committed
58
#include <unistd.h>
Jim Blandy's avatar
Jim Blandy committed
59

Richard M. Stallman's avatar
Richard M. Stallman committed
60 61 62 63
#ifdef HAVE_SETLOCALE
#include <locale.h>
#endif /* HAVE_SETLOCALE */

Dave Love's avatar
Dave Love committed
64
#include <fcntl.h>
Richard M. Stallman's avatar
Richard M. Stallman committed
65

66
#ifdef HAVE_FSEEKO
67 68 69 70 71 72 73
#define file_offset off_t
#define file_tell ftello
#else
#define file_offset long
#define file_tell ftell
#endif

74 75 76 77
/* The association list of objects read with the #n=object form.
   Each member of the list has the form (n . object), and is used to
   look up the object for the corresponding #n# construct.
   It must be set to nil before all top-level calls to read0.  */
78
static Lisp_Object read_objects;
79

80
/* File for get_file_char to read from.  Used by load.  */
Jim Blandy's avatar
Jim Blandy committed
81 82
static FILE *instream;

83
/* For use within read-from-string (this reader is non-reentrant!!)  */
84 85 86
static ptrdiff_t read_from_string_index;
static ptrdiff_t read_from_string_index_byte;
static ptrdiff_t read_from_string_limit;
87

88
/* Number of characters read in the current call to Fread or
89
   Fread_from_string.  */
90
static EMACS_INT readchar_count;
91

92
/* This contains the last string skipped with #@.  */
93 94
static char *saved_doc_string;
/* Length of buffer allocated in saved_doc_string.  */
95
static ptrdiff_t saved_doc_string_size;
96
/* Length of actual data in saved_doc_string.  */
97
static ptrdiff_t saved_doc_string_length;
98
/* This is the file position that string came from.  */
99
static file_offset saved_doc_string_position;
100

101 102 103 104 105
/* This contains the previous string skipped with #@.
   We copy it from saved_doc_string when a new string
   is put in saved_doc_string.  */
static char *prev_saved_doc_string;
/* Length of buffer allocated in prev_saved_doc_string.  */
106
static ptrdiff_t prev_saved_doc_string_size;
107
/* Length of actual data in prev_saved_doc_string.  */
108
static ptrdiff_t prev_saved_doc_string_length;
109
/* This is the file position that string came from.  */
110
static file_offset prev_saved_doc_string_position;
111

112
/* True means inside a new-style backquote
113
   with no surrounding parentheses.
114
   Fread initializes this to false, so we need not specbind it
115
   or worry about what happens to it when there is an error.  */
116
static bool new_backquote_flag;
117 118 119 120

/* A list of file names for files being loaded in Fload.  Used to
   check for recursive loads.  */

Lute Kamstra's avatar
Lute Kamstra committed
121
static Lisp_Object Vloads_in_progress;
122

123 124
static int read_emacs_mule_char (int, int (*) (int, Lisp_Object),
                                 Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
125

126
static void readevalloop (Lisp_Object, FILE *, Lisp_Object, bool,
127 128
                          Lisp_Object, Lisp_Object,
                          Lisp_Object, Lisp_Object);
Jim Blandy's avatar
Jim Blandy committed
129

Kenichi Handa's avatar
Kenichi Handa committed
130 131 132 133 134 135
/* Functions that read one byte from the current source READCHARFUN
   or unread one byte.  If the integer argument C is -1, the function
   returns the byte it read, or -1 when there are no more bytes in the
   source.  If C is 0 or positive, the function unreads C, and the
   return value is not meaningful.  */

136 137 138
static int readbyte_for_lambda (int, Lisp_Object);
static int readbyte_from_file (int, Lisp_Object);
static int readbyte_from_string (int, Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
139

Jim Blandy's avatar
Jim Blandy committed
140 141
/* Handle unreading and rereading of characters.
   Write READCHAR to read a character,
Karl Heuer's avatar
Karl Heuer committed
142 143
   UNREAD(c) to unread c to be read again.

Kenichi Handa's avatar
Kenichi Handa committed
144
   These macros correctly read/unread multibyte characters.  */
Jim Blandy's avatar
Jim Blandy committed
145

146
#define READCHAR readchar (readcharfun, NULL)
Jim Blandy's avatar
Jim Blandy committed
147 148
#define UNREAD(c) unreadchar (readcharfun, c)

149 150 151
/* Same as READCHAR but set *MULTIBYTE to the multibyteness of the source.  */
#define READCHAR_REPORT_MULTIBYTE(multibyte) readchar (readcharfun, multibyte)

Kenichi Handa's avatar
Kenichi Handa committed
152
/* When READCHARFUN is Qget_file_char, Qget_emacs_mule_file_char,
Kenichi Handa's avatar
Kenichi Handa committed
153 154
   Qlambda, or a cons, we use this to keep an unread character because
   a file stream can't handle multibyte-char unreading.  The value -1
155
   means that there's no unread character.  */
Kenichi Handa's avatar
Kenichi Handa committed
156 157
static int unread_char;

Jim Blandy's avatar
Jim Blandy committed
158
static int
159
readchar (Lisp_Object readcharfun, bool *multibyte)
Jim Blandy's avatar
Jim Blandy committed
160 161
{
  Lisp_Object tem;
162
  register int c;
163
  int (*readbyte) (int, Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
164 165
  unsigned char buf[MAX_MULTIBYTE_LENGTH];
  int i, len;
166
  bool emacs_mule_encoding = 0;
Jim Blandy's avatar
Jim Blandy committed
167

168 169 170
  if (multibyte)
    *multibyte = 0;

171
  readchar_count++;
172

173
  if (BUFFERP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
174
    {
175
      register struct buffer *inbuffer = XBUFFER (readcharfun);
Jim Blandy's avatar
Jim Blandy committed
176

177
      ptrdiff_t pt_byte = BUF_PT_BYTE (inbuffer);
178

179 180 181
      if (! BUFFER_LIVE_P (inbuffer))
	return -1;

182 183
      if (pt_byte >= BUF_ZV_BYTE (inbuffer))
	return -1;
Jim Blandy's avatar
Jim Blandy committed
184

Tom Tromey's avatar
Tom Tromey committed
185
      if (! NILP (BVAR (inbuffer, enable_multibyte_characters)))
186
	{
187
	  /* Fetch the character code from the buffer.  */
188 189
	  unsigned char *p = BUF_BYTE_ADDRESS (inbuffer, pt_byte);
	  BUF_INC_POS (inbuffer, pt_byte);
190
	  c = STRING_CHAR (p);
191 192
	  if (multibyte)
	    *multibyte = 1;
193 194 195 196
	}
      else
	{
	  c = BUF_FETCH_BYTE (inbuffer, pt_byte);
197
	  if (! ASCII_CHAR_P (c))
Kenichi Handa's avatar
Kenichi Handa committed
198
	    c = BYTE8_TO_CHAR (c);
199
	  pt_byte++;
200
	}
201
      SET_BUF_PT_BOTH (inbuffer, BUF_PT (inbuffer) + 1, pt_byte);
202

203
      return c;
Jim Blandy's avatar
Jim Blandy committed
204
    }
205
  if (MARKERP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
206
    {
207
      register struct buffer *inbuffer = XMARKER (readcharfun)->buffer;
Jim Blandy's avatar
Jim Blandy committed
208

209
      ptrdiff_t bytepos = marker_byte_position (readcharfun);
210

211 212
      if (bytepos >= BUF_ZV_BYTE (inbuffer))
	return -1;
213

Tom Tromey's avatar
Tom Tromey committed
214
      if (! NILP (BVAR (inbuffer, enable_multibyte_characters)))
215
	{
216
	  /* Fetch the character code from the buffer.  */
217 218
	  unsigned char *p = BUF_BYTE_ADDRESS (inbuffer, bytepos);
	  BUF_INC_POS (inbuffer, bytepos);
219
	  c = STRING_CHAR (p);
220 221
	  if (multibyte)
	    *multibyte = 1;
222 223 224 225
	}
      else
	{
	  c = BUF_FETCH_BYTE (inbuffer, bytepos);
226
	  if (! ASCII_CHAR_P (c))
Kenichi Handa's avatar
Kenichi Handa committed
227
	    c = BYTE8_TO_CHAR (c);
228
	  bytepos++;
229 230
	}

231 232 233 234
      XMARKER (readcharfun)->bytepos = bytepos;
      XMARKER (readcharfun)->charpos++;

      return c;
Jim Blandy's avatar
Jim Blandy committed
235
    }
236 237

  if (EQ (readcharfun, Qlambda))
Kenichi Handa's avatar
Kenichi Handa committed
238 239 240 241
    {
      readbyte = readbyte_for_lambda;
      goto read_multibyte;
    }
242

Jim Blandy's avatar
Jim Blandy committed
243
  if (EQ (readcharfun, Qget_file_char))
244
    {
Kenichi Handa's avatar
Kenichi Handa committed
245 246
      readbyte = readbyte_from_file;
      goto read_multibyte;
247
    }
Jim Blandy's avatar
Jim Blandy committed
248

249
  if (STRINGP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
250
    {
251
      if (read_from_string_index >= read_from_string_limit)
Jim Blandy's avatar
Jim Blandy committed
252
	c = -1;
253 254 255 256 257 258 259 260
      else if (STRING_MULTIBYTE (readcharfun))
	{
	  if (multibyte)
	    *multibyte = 1;
	  FETCH_STRING_CHAR_ADVANCE_NO_CHECK (c, readcharfun,
					      read_from_string_index,
					      read_from_string_index_byte);
	}
261
      else
262 263 264 265 266
	{
	  c = SREF (readcharfun, read_from_string_index_byte);
	  read_from_string_index++;
	  read_from_string_index_byte++;
	}
Jim Blandy's avatar
Jim Blandy committed
267 268 269
      return c;
    }

270
  if (CONSP (readcharfun) && STRINGP (XCAR (readcharfun)))
Kenichi Handa's avatar
Kenichi Handa committed
271 272 273 274 275 276 277 278 279 280 281
    {
      /* This is the case that read_vector is reading from a unibyte
	 string that contains a byte sequence previously skipped
	 because of #@NUMBER.  The car part of readcharfun is that
	 string, and the cdr part is a value of readcharfun given to
	 read_vector.  */
      readbyte = readbyte_from_string;
      if (EQ (XCDR (readcharfun), Qget_emacs_mule_file_char))
	emacs_mule_encoding = 1;
      goto read_multibyte;
    }
Kenichi Handa's avatar
Kenichi Handa committed
282

Kenichi Handa's avatar
Kenichi Handa committed
283 284 285 286 287 288
  if (EQ (readcharfun, Qget_emacs_mule_file_char))
    {
      readbyte = readbyte_from_file;
      emacs_mule_encoding = 1;
      goto read_multibyte;
    }
Jim Blandy's avatar
Jim Blandy committed
289 290 291

  tem = call0 (readcharfun);

Jim Blandy's avatar
Jim Blandy committed
292
  if (NILP (tem))
Jim Blandy's avatar
Jim Blandy committed
293 294
    return -1;
  return XINT (tem);
Kenichi Handa's avatar
Kenichi Handa committed
295 296 297 298 299 300 301 302 303

 read_multibyte:
  if (unread_char >= 0)
    {
      c = unread_char;
      unread_char = -1;
      return c;
    }
  c = (*readbyte) (-1, readcharfun);
304
  if (c < 0)
305 306 307
    return c;
  if (multibyte)
    *multibyte = 1;
308
  if (ASCII_CHAR_P (c))
Kenichi Handa's avatar
Kenichi Handa committed
309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325
    return c;
  if (emacs_mule_encoding)
    return read_emacs_mule_char (c, readbyte, readcharfun);
  i = 0;
  buf[i++] = c;
  len = BYTES_BY_CHAR_HEAD (c);
  while (i < len)
    {
      c = (*readbyte) (-1, readcharfun);
      if (c < 0 || ! TRAILING_CODE_P (c))
	{
	  while (--i > 1)
	    (*readbyte) (buf[i], readcharfun);
	  return BYTE8_TO_CHAR (buf[0]);
	}
      buf[i++] = c;
    }
326
  return STRING_CHAR (buf);
Jim Blandy's avatar
Jim Blandy committed
327 328
}

Stefan Monnier's avatar
Stefan Monnier committed
329 330 331 332
/* True if READCHARFUN is one of the two symbols that readchar maps to
   readbyte_from_file, i.e. input is taken from INSTREAM.  READCHARFUN
   is evaluated twice.  */
#define FROM_FILE_P(readcharfun)			\
  (EQ (readcharfun, Qget_file_char)			\
   || EQ (readcharfun, Qget_emacs_mule_file_char))

333 334 335
/* Skip over a dynamic docstring (or dynamic byte-code) in the input
   READCHARFUN.  When reading from a file, seek N bytes forward in
   INSTREAM; otherwise consume characters up to and including the
   terminating \037, or up to end of input.  */

static void
skip_dyn_bytes (Lisp_Object readcharfun, ptrdiff_t n)
{
  if (! FROM_FILE_P (readcharfun))
    {
      /* We're not reading directly from a file.  In that case, it's
         difficult to reliably count bytes, since these are usually
         meant for the file's encoding, whereas we're now typically in
         the internal encoding.  But luckily, skip_dyn_bytes is used to
         skip over a single dynamic-docstring (or dynamic byte-code)
         which is always quoted such that \037 is the final char.  */
      for (;;)
        {
          int ch = READCHAR;
          if (ch < 0 || ch == '\037')
            break;
        }
      return;
    }

  block_input ();		/* FIXME: Not sure if it's needed.  */
  fseek (instream, n, SEEK_CUR);
  unblock_input ();
}

356 357 358 359 360 361 362 363 364 365 366 367 368
/* Discard the rest of the input READCHARFUN.  When reading from a
   file, seek INSTREAM to its end; otherwise read characters until
   READCHAR reports end of input.  */

static void
skip_dyn_eof (Lisp_Object readcharfun)
{
  if (! FROM_FILE_P (readcharfun))
    {
      while (READCHAR >= 0)
        continue;
      return;
    }

  block_input ();		/* FIXME: Not sure if it's needed.  */
  fseek (instream, 0, SEEK_END);
  unblock_input ();
}

Jim Blandy's avatar
Jim Blandy committed
369 370 371 372
/* Unread the character C in the way appropriate for the stream READCHARFUN.
   If the stream is a user function, call it with the char as argument.  */

static void
373
unreadchar (Lisp_Object readcharfun, int c)
Jim Blandy's avatar
Jim Blandy committed
374
{
375
  readchar_count--;
376 377 378 379
  if (c == -1)
    /* Don't back up the pointer if we're unreading the end-of-input mark,
       since readchar didn't advance it when we read it.  */
    ;
380
  else if (BUFFERP (readcharfun))
381
    {
382
      struct buffer *b = XBUFFER (readcharfun);
383 384
      ptrdiff_t charpos = BUF_PT (b);
      ptrdiff_t bytepos = BUF_PT_BYTE (b);
385

Tom Tromey's avatar
Tom Tromey committed
386
      if (! NILP (BVAR (b, enable_multibyte_characters)))
Kenichi Handa's avatar
Kenichi Handa committed
387
	BUF_DEC_POS (b, bytepos);
388
      else
Kenichi Handa's avatar
Kenichi Handa committed
389
	bytepos--;
390

391
      SET_BUF_PT_BOTH (b, charpos - 1, bytepos);
392
    }
393
  else if (MARKERP (readcharfun))
394
    {
395
      struct buffer *b = XMARKER (readcharfun)->buffer;
396
      ptrdiff_t bytepos = XMARKER (readcharfun)->bytepos;
397

Kenichi Handa's avatar
Kenichi Handa committed
398
      XMARKER (readcharfun)->charpos--;
Tom Tromey's avatar
Tom Tromey committed
399
      if (! NILP (BVAR (b, enable_multibyte_characters)))
Kenichi Handa's avatar
Kenichi Handa committed
400
	BUF_DEC_POS (b, bytepos);
401
      else
Kenichi Handa's avatar
Kenichi Handa committed
402
	bytepos--;
403

Kenichi Handa's avatar
Kenichi Handa committed
404
      XMARKER (readcharfun)->bytepos = bytepos;
405
    }
406
  else if (STRINGP (readcharfun))
407 408 409 410 411
    {
      read_from_string_index--;
      read_from_string_index_byte
	= string_char_to_byte (readcharfun, read_from_string_index);
    }
412
  else if (CONSP (readcharfun) && STRINGP (XCAR (readcharfun)))
Kenichi Handa's avatar
Kenichi Handa committed
413 414 415
    {
      unread_char = c;
    }
416
  else if (EQ (readcharfun, Qlambda))
Kenichi Handa's avatar
Kenichi Handa committed
417 418 419
    {
      unread_char = c;
    }
Stefan Monnier's avatar
Stefan Monnier committed
420
  else if (FROM_FILE_P (readcharfun))
Kenichi Handa's avatar
Kenichi Handa committed
421
    {
422
      unread_char = c;
Kenichi Handa's avatar
Kenichi Handa committed
423
    }
Jim Blandy's avatar
Jim Blandy committed
424 425 426 427
  else
    call1 (readcharfun, make_number (c));
}

Kenichi Handa's avatar
Kenichi Handa committed
428
static int
429
readbyte_for_lambda (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
430 431 432 433 434 435
{
  return read_bytecode_char (c >= 0);
}


static int
436
readbyte_from_file (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
437 438 439
{
  if (c >= 0)
    {
440
      block_input ();
Kenichi Handa's avatar
Kenichi Handa committed
441
      ungetc (c, instream);
442
      unblock_input ();
Kenichi Handa's avatar
Kenichi Handa committed
443 444 445
      return 0;
    }

446
  block_input ();
Kenichi Handa's avatar
Kenichi Handa committed
447
  c = getc (instream);
Miles Bader's avatar
Miles Bader committed
448

449
  /* Interrupted reads have been observed while reading over the network.  */
Miles Bader's avatar
Miles Bader committed
450 451
  while (c == EOF && ferror (instream) && errno == EINTR)
    {
452
      unblock_input ();
Miles Bader's avatar
Miles Bader committed
453
      QUIT;
454
      block_input ();
Miles Bader's avatar
Miles Bader committed
455
      clearerr (instream);
Miles Bader's avatar
Miles Bader committed
456
      c = getc (instream);
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
457
    }
Miles Bader's avatar
Miles Bader committed
458

459
  unblock_input ();
Miles Bader's avatar
Miles Bader committed
460

Kenichi Handa's avatar
Kenichi Handa committed
461 462 463 464
  return (c == EOF ? -1 : c);
}

static int
465
readbyte_from_string (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
466 467 468 469 470 471 472 473 474
{
  Lisp_Object string = XCAR (readcharfun);

  if (c >= 0)
    {
      read_from_string_index--;
      read_from_string_index_byte
	= string_char_to_byte (string, read_from_string_index);
    }
Kenichi Handa's avatar
Kenichi Handa committed
475

Kenichi Handa's avatar
Kenichi Handa committed
476 477 478 479 480 481 482 483 484 485 486 487 488 489 490
  if (read_from_string_index >= read_from_string_limit)
    c = -1;
  else
    FETCH_STRING_CHAR_ADVANCE (c, string,
			       read_from_string_index,
			       read_from_string_index_byte);
  return c;
}


/* Read one non-ASCII character from INSTREAM.  The character is
   encoded in `emacs-mule' and the first byte is already read in
   C.  */

static int
491
read_emacs_mule_char (int c, int (*readbyte) (int, Lisp_Object), Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519
{
  /* Emacs-mule coding uses at most 4-byte for one character.  */
  unsigned char buf[4];
  int len = emacs_mule_bytes[c];
  struct charset *charset;
  int i;
  unsigned code;

  if (len == 1)
    /* C is not a valid leading-code of `emacs-mule'.  */
    return BYTE8_TO_CHAR (c);

  i = 0;
  buf[i++] = c;
  while (i < len)
    {
      c = (*readbyte) (-1, readcharfun);
      if (c < 0xA0)
	{
	  while (--i > 1)
	    (*readbyte) (buf[i], readcharfun);
	  return BYTE8_TO_CHAR (buf[0]);
	}
      buf[i++] = c;
    }

  if (len == 2)
    {
520
      charset = CHARSET_FROM_ID (emacs_mule_charset[buf[0]]);
Kenichi Handa's avatar
Kenichi Handa committed
521 522 523 524 525 526 527
      code = buf[1] & 0x7F;
    }
  else if (len == 3)
    {
      if (buf[0] == EMACS_MULE_LEADING_CODE_PRIVATE_11
	  || buf[0] == EMACS_MULE_LEADING_CODE_PRIVATE_12)
	{
528
	  charset = CHARSET_FROM_ID (emacs_mule_charset[buf[1]]);
Kenichi Handa's avatar
Kenichi Handa committed
529 530 531 532
	  code = buf[2] & 0x7F;
	}
      else
	{
533
	  charset = CHARSET_FROM_ID (emacs_mule_charset[buf[0]]);
Kenichi Handa's avatar
Kenichi Handa committed
534 535 536 537 538
	  code = ((buf[1] << 8) | buf[2]) & 0x7F7F;
	}
    }
  else
    {
539
      charset = CHARSET_FROM_ID (emacs_mule_charset[buf[1]]);
Kenichi Handa's avatar
Kenichi Handa committed
540
      code = ((buf[2] << 8) | buf[3]) & 0x7F7F;
Kenichi Handa's avatar
Kenichi Handa committed
541 542 543 544
    }
  c = DECODE_CHAR (charset, code);
  if (c < 0)
    Fsignal (Qinvalid_read_syntax,
545
	     list1 (build_string ("invalid multibyte form")));
Kenichi Handa's avatar
Kenichi Handa committed
546 547 548 549
  return c;
}


550 551 552
static Lisp_Object read_internal_start (Lisp_Object, Lisp_Object,
                                        Lisp_Object);
static Lisp_Object read0 (Lisp_Object);
553
static Lisp_Object read1 (Lisp_Object, int *, bool);
554

555 556
static Lisp_Object read_list (bool, Lisp_Object);
static Lisp_Object read_vector (Lisp_Object, bool);
557

558 559 560 561 562
static Lisp_Object substitute_object_recurse (Lisp_Object, Lisp_Object,
                                              Lisp_Object);
static void substitute_object_in_subtree (Lisp_Object,
                                          Lisp_Object);
static void substitute_in_interval (INTERVAL, Lisp_Object);
563

Jim Blandy's avatar
Jim Blandy committed
564

565
/* Get a character from the tty.  */
Jim Blandy's avatar
Jim Blandy committed
566

567 568
/* Read input events until we get one that's acceptable for our purposes.

569
   If NO_SWITCH_FRAME, switch-frame events are stashed
570 571 572
   until we get a character we like, and then stuffed into
   unread_switch_frame.

573
   If ASCII_REQUIRED, check function key events to see
574 575 576
   if the unmodified version of the symbol has a Qascii_character
   property, and use that character, if present.

577 578 579
   If ERROR_NONASCII, signal an error if the input we
   get isn't an ASCII character with modifiers.  If it's false but
   ASCII_REQUIRED is true, just re-read until we get an ASCII
580 581
   character.

582
   If INPUT_METHOD, invoke the current input method
583 584
   if the character warrants that.

585
   If SECONDS is a number, wait that many seconds for input, and
586
   return Qnil if no input arrives within that time.  */
587

Andreas Schwab's avatar
Andreas Schwab committed
588
static Lisp_Object
589 590
read_filtered_event (bool no_switch_frame, bool ascii_required,
		     bool error_nonascii, bool input_method, Lisp_Object seconds)
591
{
592
  Lisp_Object val, delayed_switch_frame;
593
  struct timespec end_time;
594

595
#ifdef HAVE_WINDOW_SYSTEM
596 597
  if (display_hourglass_p)
    cancel_hourglass ();
598
#endif
599

600
  delayed_switch_frame = Qnil;
601

602 603 604
  /* Compute timeout.  */
  if (NUMBERP (seconds))
    {
605
      double duration = extract_float (seconds);
606 607
      struct timespec wait_time = dtotimespec (duration);
      end_time = timespec_add (current_timespec (), wait_time);
608 609
    }

610
  /* Read until we get an acceptable event.  */
611
 retry:
612
  do
613
    val = read_char (0, Qnil, (input_method ? Qnil : Qt), 0,
Karoly Lorentey's avatar
Karoly Lorentey committed
614
		     NUMBERP (seconds) ? &end_time : NULL);
615
  while (INTEGERP (val) && XINT (val) == -2); /* wrong_kboard_jmpbuf */
616

617
  if (BUFFERP (val))
618 619
    goto retry;

620
  /* `switch-frame' events are put off until after the next ASCII
Karl Heuer's avatar
Karl Heuer committed
621
     character.  This is better than signaling an error just because
622 623 624 625 626
     the last characters were typed to a separate minibuffer frame,
     for example.  Eventually, some code which can deal with
     switch-frame events will read it and process it.  */
  if (no_switch_frame
      && EVENT_HAS_PARAMETERS (val)
627
      && EQ (EVENT_HEAD_KIND (EVENT_HEAD (val)), Qswitch_frame))
628 629 630 631 632
    {
      delayed_switch_frame = val;
      goto retry;
    }

633
  if (ascii_required && !(NUMBERP (seconds) && NILP (val)))
634 635
    {
      /* Convert certain symbols to their ASCII equivalents.  */
636
      if (SYMBOLP (val))
637
	{
638
	  Lisp_Object tem, tem1;
639 640 641 642 643 644 645
	  tem = Fget (val, Qevent_symbol_element_mask);
	  if (!NILP (tem))
	    {
	      tem1 = Fget (Fcar (tem), Qascii_character);
	      /* Merge this symbol's modifier bits
		 with the ASCII equivalent of its basic code.  */
	      if (!NILP (tem1))
646
		XSETFASTINT (val, XINT (tem1) | XINT (Fcar (Fcdr (tem))));
647 648
	    }
	}
649

650
      /* If we don't have a character now, deal with it appropriately.  */
651
      if (!INTEGERP (val))
652 653 654
	{
	  if (error_nonascii)
	    {
655
	      Vunread_command_events = list1 (val);
656 657 658 659 660 661 662 663 664 665
	      error ("Non-character input-event");
	    }
	  else
	    goto retry;
	}
    }

  if (! NILP (delayed_switch_frame))
    unread_switch_frame = delayed_switch_frame;

666 667
#if 0

668
#ifdef HAVE_WINDOW_SYSTEM
669 670
  if (display_hourglass_p)
    start_hourglass ();
671
#endif
672 673 674

#endif

675 676 677
  return val;
}

Paul Eggert's avatar
Paul Eggert committed
678
DEFUN ("read-char", Fread_char, Sread_char, 0, 3, 0,
679 680
       doc: /* Read a character from the command input (keyboard or macro).
It is returned as a number.
681 682 683
If the character has modifiers, they are resolved and reflected to the
character code if possible (e.g. C-SPC -> 0).

684 685
If the user generates an event which is not a character (i.e. a mouse
click or function key event), `read-char' signals an error.  As an
686 687
exception, switch-frame events are put off until non-character events
can be read.
688 689 690 691 692 693
If you want to read non-character events, or ignore them, call
`read-event' or `read-char-exclusive' instead.

If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
694 695 696 697 698
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
699
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
700
{
701 702
  Lisp_Object val;

703 704
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
705
  val = read_filtered_event (1, 1, 1, ! NILP (inherit_input_method), seconds);
706 707 708

  return (NILP (val) ? Qnil
	  : make_number (char_resolve_modifier_mask (XINT (val))));
Jim Blandy's avatar
Jim Blandy committed
709 710
}

Paul Eggert's avatar
Paul Eggert committed
711
DEFUN ("read-event", Fread_event, Sread_event, 0, 3, 0,
712 713 714 715
       doc: /* Read an event object from the input stream.
If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
716 717 718 719 720
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
721
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
722
{
723 724
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
725
  return read_filtered_event (0, 0, 0, ! NILP (inherit_input_method), seconds);
Jim Blandy's avatar
Jim Blandy committed
726 727
}

728
DEFUN ("read-char-exclusive", Fread_char_exclusive, Sread_char_exclusive, 0, 3, 0,
729 730
       doc: /* Read a character from the command input (keyboard or macro).
It is returned as a number.  Non-character events are ignored.
731 732
If the character has modifiers, they are resolved and reflected to the
character code if possible (e.g. C-SPC -> 0).
733 734 735 736

If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
737 738 739 740 741
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
742
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
743
{
744 745
  Lisp_Object val;

746 747
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
748

749
  val = read_filtered_event (1, 1, 0, ! NILP (inherit_input_method), seconds);
750 751 752

  return (NILP (val) ? Qnil
	  : make_number (char_resolve_modifier_mask (XINT (val))));
Jim Blandy's avatar
Jim Blandy committed
753 754 755
}

DEFUN ("get-file-char", Fget_file_char, Sget_file_char, 0, 0, 0,
756
       doc: /* Don't use this yourself.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
757
  (void)
Jim Blandy's avatar
Jim Blandy committed
758 759
{
  register Lisp_Object val;
760
  block_input ();
761
  XSETINT (val, getc (instream));
762
  unblock_input ();
Jim Blandy's avatar
Jim Blandy committed
763 764
  return val;
}
765 766


767 768 769 770


/* Return true if the lisp code read using READCHARFUN defines a non-nil
   `lexical-binding' file variable.  After returning, the stream is
771 772
   positioned following the first line, if it is a comment or #! line,
   otherwise nothing is read.  */
773

774
static bool
Stefan Monnier's avatar
Stefan Monnier committed
775
lisp_file_lexically_bound_p (Lisp_Object readcharfun)
776 777
{
  int ch = READCHAR;
778 779 780 781 782 783 784 785 786 787 788 789 790

  if (ch == '#')
    {
      ch = READCHAR;
      if (ch != '!')
        {
          UNREAD (ch);
          UNREAD ('#');
          return 0;
        }
      while (ch != '\n' && ch != EOF)
        ch = READCHAR;
      if (ch == '\n') ch = READCHAR;
Glenn Morris's avatar
Comment  
Glenn Morris committed
791 792
      /* It is OK to leave the position after a #! line, since
         that is what read1 does.  */
793 794
    }

795 796 797 798 799 800 801 802 803
  if (ch != ';')
    /* The first line isn't a comment, just give up.  */
    {
      UNREAD (ch);
      return 0;
    }
  else
    /* Look for an appropriate file-variable in the first line.  */
    {
804
      bool rv = 0;
805
      enum {
Paul Eggert's avatar
Paul Eggert committed
806
	NOMINAL, AFTER_FIRST_DASH, AFTER_ASTERIX
807
      } beg_end_state = NOMINAL;
808
      bool in_file_vars = 0;
809

810 811 812 813 814 815 816 817 818 819
#define UPDATE_BEG_END_STATE(ch)				\
  if (beg_end_state == NOMINAL)					\
    beg_end_state = (ch == '-' ? AFTER_FIRST_DASH : NOMINAL);	\
  else if (beg_end_state == AFTER_FIRST_DASH)			\
    beg_end_state = (ch == '*' ? AFTER_ASTERIX : NOMINAL);	\
  else if (beg_end_state == AFTER_ASTERIX)			\
    {								\
      if (ch == '-')						\
	in_file_vars = !in_file_vars;				\
      beg_end_state = NOMINAL;					\
820 821 822 823 824 825 826 827 828 829 830 831
    }

      /* Skip until we get to the file vars, if any.  */
      do
	{
	  ch = READCHAR;
	  UPDATE_BEG_END_STATE (ch);
	}
      while (!in_file_vars && ch != '\n' && ch != EOF);

      while (in_file_vars)
	{
832
	  char var[100], val[100];
833
	  unsigned i;
834 835 836 837 838 839 840

	  ch = READCHAR;

	  /* Read a variable name.  */
	  while (ch == ' ' || ch == '\t')
	    ch = READCHAR;

841
	  i = 0;
842
	  while (ch != ':' && ch != '\n' && ch != EOF && in_file_vars)
843
	    {
844 845
	      if (i < sizeof var - 1)
		var[i++] = ch;
846 847 848
	      UPDATE_BEG_END_STATE (ch);
	      ch = READCHAR;
	    }
849

850
	  /* Stop scanning if no colon was found before end marker.  */
851
	  if (!in_file_vars || ch == '\n' || ch == EOF)
852 853
	    break;

854 855 856
	  while (i > 0 && (var[i - 1] == ' ' || var[i - 1] == '\t'))
	    i--;
	  var[i] = '\0';
857 858 859 860 861 862 863 864 865

	  if (ch == ':')
	    {
	      /* Read a variable value.  */
	      ch = READCHAR;

	      while (ch == ' ' || ch == '\t')
		ch = READCHAR;

866
	      i = 0;
867 868
	      while (ch != ';' && ch != '\n' && ch != EOF && in_file_vars)
		{
869 870
		  if (i < sizeof val - 1)
		    val[i++] = ch;
871 872 873 874
		  UPDATE_BEG_END_STATE (ch);
		  ch = READCHAR;
		}
	      if (! in_file_vars)
875
		/* The value was terminated by an end-marker, which remove.  */
876 877 878 879
		i -= 3;
	      while (i > 0 && (val[i - 1] == ' ' || val[i - 1] == '\t'))
		i--;
	      val[i] = '\0';
880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895

	      if (strcmp (var, "lexical-binding") == 0)
		/* This is it...  */
		{
		  rv = (strcmp (val, "nil") != 0);
		  break;
		}
	    }
	}

      while (ch != '\n' && ch != EOF)
	ch = READCHAR;

      return rv;
    }
}
896

Kenichi Handa's avatar
Kenichi Handa committed
897
/* Value is a version number of byte compiled code if the file
Miles Bader's avatar
Miles Bader committed
898
   associated with file descriptor FD is a compiled Lisp file that's
Kenichi Handa's avatar
Kenichi Handa committed
899 900 901
   safe to load.  Only files compiled with Emacs are safe to load.
   Files compiled with XEmacs can lead to a crash in Fbyte_code
   because of an incompatible change in the byte compiler.  */
902 903

static int
904
safe_to_load_version (int fd)
905 906 907
{
  char buf[512];
  int nbytes, i;
Kenichi Handa's avatar
Kenichi Handa committed
908
  int version = 1;
909 910 911

  /* Read the first few bytes from the file, and look for a line
     specifying the byte compiler version used.  */
912
  nbytes = emacs_read (fd, buf, sizeof buf);
913 914 915
  if (nbytes > 0)
    {
      /* Skip to the next newline, skipping over the initial `ELC'
Dave Love's avatar
Dave Love committed
916
	 with NUL bytes following it, but note the version.  */
917
      for (i = 0; i < nbytes && buf[i] != '\n'; ++i)
Dave Love's avatar
Dave Love committed
918
	if (i == 4)
Kenichi Handa's avatar
Kenichi Handa committed
919
	  version = buf[i];
920

921
      if (i >= nbytes
922
	  || fast_c_string_match_ignore_case (Vbytecomp_version_regexp,
923
					      buf + i, nbytes - i) < 0)
924
	version = 0;
925