lread.c 133 KB
Newer Older
Jim Blandy's avatar
Jim Blandy committed
1
/* Lisp parsing and input streams.
2

3
Copyright (C) 1985-1989, 1993-1995, 1997-2012  Free Software Foundation, Inc.
Jim Blandy's avatar
Jim Blandy committed
4 5 6

This file is part of GNU Emacs.

7
GNU Emacs is free software: you can redistribute it and/or modify
Jim Blandy's avatar
Jim Blandy committed
8
it under the terms of the GNU General Public License as published by
9 10
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
Jim Blandy's avatar
Jim Blandy committed
11 12 13 14 15 16 17

GNU Emacs is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
18
along with GNU Emacs.  If not, see <http://www.gnu.org/licenses/>.  */
Jim Blandy's avatar
Jim Blandy committed
19 20


Richard M. Stallman's avatar
Richard M. Stallman committed
21
#include <config.h>
Jim Blandy's avatar
Jim Blandy committed
22 23 24 25
#include <stdio.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <sys/file.h>
26
#include <errno.h>
27
#include <limits.h>	/* For CHAR_BIT.  */
28
#include <setjmp.h>
29
#include <stat-time.h>
Jim Blandy's avatar
Jim Blandy committed
30
#include "lisp.h"
31
#include "intervals.h"
Kenichi Handa's avatar
Kenichi Handa committed
32
#include "character.h"
33
#include "buffer.h"
Karl Heuer's avatar
Karl Heuer committed
34
#include "charset.h"
Kenichi Handa's avatar
Kenichi Handa committed
35
#include "coding.h"
36
#include <epaths.h>
Jim Blandy's avatar
Jim Blandy committed
37
#include "commands.h"
Jim Blandy's avatar
Jim Blandy committed
38
#include "keyboard.h"
39
#include "frame.h"
40
#include "termhooks.h"
41
#include "coding.h"
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
42
#include "blockinput.h"
Jim Blandy's avatar
Jim Blandy committed
43

44 45 46 47
#ifdef MSDOS
#include "msdos.h"
#endif

48 49 50 51
#ifdef HAVE_NS
#include "nsterm.h"
#endif

Andreas Schwab's avatar
Andreas Schwab committed
52
#include <unistd.h>
Jim Blandy's avatar
Jim Blandy committed
53 54
#include <math.h>

Richard M. Stallman's avatar
Richard M. Stallman committed
55 56 57 58
#ifdef HAVE_SETLOCALE
#include <locale.h>
#endif /* HAVE_SETLOCALE */

Dave Love's avatar
Dave Love committed
59
#include <fcntl.h>
Richard M. Stallman's avatar
Richard M. Stallman committed
60

61
#ifdef HAVE_FSEEKO
62 63 64 65 66 67 68
#define file_offset off_t
#define file_tell ftello
#else
#define file_offset long
#define file_tell ftell
#endif

69
/* Hash table read constants.  */
70 71 72 73 74 75 76 77
static Lisp_Object Qhash_table, Qdata;
static Lisp_Object Qtest, Qsize;
static Lisp_Object Qweakness;
static Lisp_Object Qrehash_size;
static Lisp_Object Qrehash_threshold;

static Lisp_Object Qread_char, Qget_file_char, Qcurrent_load_list;
Lisp_Object Qstandard_input;
78
Lisp_Object Qvariable_documentation;
79
static Lisp_Object Qascii_character, Qload, Qload_file_name;
80
Lisp_Object Qbackquote, Qcomma, Qcomma_at, Qcomma_dot, Qfunction;
81 82 83 84
static Lisp_Object Qinhibit_file_name_operation;
static Lisp_Object Qeval_buffer_list;
static Lisp_Object Qlexical_binding;
static Lisp_Object Qfile_truename, Qdo_after_load_evaluation; /* ACM 2006/5/16 */
85

Kenichi Handa's avatar
Kenichi Handa committed
86 87 88 89 90 91
/* Used instead of Qget_file_char while loading *.elc files compiled
   by Emacs 21 or older.  */
static Lisp_Object Qget_emacs_mule_file_char;

static Lisp_Object Qload_force_doc_strings;

92
extern Lisp_Object Qinternal_interpreter_environment;
Jim Blandy's avatar
Jim Blandy committed
93

94
static Lisp_Object Qload_in_progress;
Ken Raeburn's avatar
Ken Raeburn committed
95

96 97 98 99
/* The association list of objects read with the #n=object form.
   Each member of the list has the form (n . object), and is used to
   look up the object for the corresponding #n# construct.
   It must be set to nil before all top-level calls to read0.  */
100
static Lisp_Object read_objects;
101

Kenichi Handa's avatar
Kenichi Handa committed
102 103 104 105 106
/* Nonzero means READCHAR should read bytes one by one (not character)
   when READCHARFUN is Qget_file_char or Qget_emacs_mule_file_char.
   This is set to 1 by read1 temporarily while handling #@NUMBER.  */
static int load_each_byte;

107 108 109
/* List of descriptors now open for Fload.  */
static Lisp_Object load_descriptor_list;

110
/* File for get_file_char to read from.  Used by load.  */
Jim Blandy's avatar
Jim Blandy committed
111 112
static FILE *instream;

113
/* For use within read-from-string (this reader is non-reentrant!!)  */
114 115 116
static ptrdiff_t read_from_string_index;
static ptrdiff_t read_from_string_index_byte;
static ptrdiff_t read_from_string_limit;
117

118
/* Number of characters read in the current call to Fread or
119
   Fread_from_string.  */
120
static EMACS_INT readchar_count;
121

122
/* This contains the last string skipped with #@.  */
123 124
static char *saved_doc_string;
/* Length of buffer allocated in saved_doc_string.  */
125
static ptrdiff_t saved_doc_string_size;
126
/* Length of actual data in saved_doc_string.  */
127
static ptrdiff_t saved_doc_string_length;
128
/* This is the file position that string came from.  */
129
static file_offset saved_doc_string_position;
130

131 132 133 134 135
/* This contains the previous string skipped with #@.
   We copy it from saved_doc_string when a new string
   is put in saved_doc_string.  */
static char *prev_saved_doc_string;
/* Length of buffer allocated in prev_saved_doc_string.  */
136
static ptrdiff_t prev_saved_doc_string_size;
137
/* Length of actual data in prev_saved_doc_string.  */
138
static ptrdiff_t prev_saved_doc_string_length;
139
/* This is the file position that string came from.  */
140
static file_offset prev_saved_doc_string_position;
141

142 143 144 145 146
/* Nonzero means inside a new-style backquote
   with no surrounding parentheses.
   Fread initializes this to zero, so we need not specbind it
   or worry about what happens to it when there is an error.  */
static int new_backquote_flag;
147
static Lisp_Object Qold_style_backquotes;
148 149 150 151

/* A list of file names for files being loaded in Fload.  Used to
   check for recursive loads.  */

Lute Kamstra's avatar
Lute Kamstra committed
152
static Lisp_Object Vloads_in_progress;
153

154 155
static int read_emacs_mule_char (int, int (*) (int, Lisp_Object),
                                 Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
156

157
static void readevalloop (Lisp_Object, FILE*, Lisp_Object, int,
158 159 160 161
                          Lisp_Object, Lisp_Object,
                          Lisp_Object, Lisp_Object);
static Lisp_Object load_unwind (Lisp_Object);
static Lisp_Object load_descriptor_unwind (Lisp_Object);
Jim Blandy's avatar
Jim Blandy committed
162

Kenichi Handa's avatar
Kenichi Handa committed
163 164 165 166 167 168
/* Functions that read one byte from the current source READCHARFUN
   or unread one byte.  If the integer argument C is -1, the function
   returns one byte read from the source, or -1 when there are no more
   bytes in the source.  If C is 0 or positive, the function unreads C,
   and the return value is not interesting.  */

169 170 171
static int readbyte_for_lambda (int, Lisp_Object);
static int readbyte_from_file (int, Lisp_Object);
static int readbyte_from_string (int, Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
172

Jim Blandy's avatar
Jim Blandy committed
173 174
/* Handle unreading and rereading of characters.
   Write READCHAR to read a character,
Karl Heuer's avatar
Karl Heuer committed
175 176
   UNREAD(c) to unread c to be read again.

Kenichi Handa's avatar
Kenichi Handa committed
177
   These macros correctly read/unread multibyte characters.  */
Jim Blandy's avatar
Jim Blandy committed
178

179
#define READCHAR readchar (readcharfun, NULL)
Jim Blandy's avatar
Jim Blandy committed
180 181
#define UNREAD(c) unreadchar (readcharfun, c)

182 183 184
/* Same as READCHAR but set *MULTIBYTE to the multibyteness of the source.  */
#define READCHAR_REPORT_MULTIBYTE(multibyte) readchar (readcharfun, multibyte)

Kenichi Handa's avatar
Kenichi Handa committed
185
/* When READCHARFUN is Qget_file_char, Qget_emacs_mule_file_char,
Kenichi Handa's avatar
Kenichi Handa committed
186 187
   Qlambda, or a cons, we use this to keep an unread character because
   a file stream can't handle multibyte-char unreading.  The value -1
188
   means that there's no unread character.  */
Kenichi Handa's avatar
Kenichi Handa committed
189 190
static int unread_char;

Jim Blandy's avatar
Jim Blandy committed
191
static int
192
readchar (Lisp_Object readcharfun, int *multibyte)
Jim Blandy's avatar
Jim Blandy committed
193 194
{
  Lisp_Object tem;
195
  register int c;
196
  int (*readbyte) (int, Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
197 198 199
  unsigned char buf[MAX_MULTIBYTE_LENGTH];
  int i, len;
  int emacs_mule_encoding = 0;
Jim Blandy's avatar
Jim Blandy committed
200

201 202 203
  if (multibyte)
    *multibyte = 0;

204
  readchar_count++;
205

206
  if (BUFFERP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
207
    {
208
      register struct buffer *inbuffer = XBUFFER (readcharfun);
Jim Blandy's avatar
Jim Blandy committed
209

210
      ptrdiff_t pt_byte = BUF_PT_BYTE (inbuffer);
211

212 213
      if (pt_byte >= BUF_ZV_BYTE (inbuffer))
	return -1;
Jim Blandy's avatar
Jim Blandy committed
214

Tom Tromey's avatar
Tom Tromey committed
215
      if (! NILP (BVAR (inbuffer, enable_multibyte_characters)))
216
	{
217
	  /* Fetch the character code from the buffer.  */
218 219
	  unsigned char *p = BUF_BYTE_ADDRESS (inbuffer, pt_byte);
	  BUF_INC_POS (inbuffer, pt_byte);
220
	  c = STRING_CHAR (p);
221 222
	  if (multibyte)
	    *multibyte = 1;
223 224 225 226
	}
      else
	{
	  c = BUF_FETCH_BYTE (inbuffer, pt_byte);
Kenichi Handa's avatar
Kenichi Handa committed
227 228
	  if (! ASCII_BYTE_P (c))
	    c = BYTE8_TO_CHAR (c);
229
	  pt_byte++;
230
	}
231
      SET_BUF_PT_BOTH (inbuffer, BUF_PT (inbuffer) + 1, pt_byte);
232

233
      return c;
Jim Blandy's avatar
Jim Blandy committed
234
    }
235
  if (MARKERP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
236
    {
237
      register struct buffer *inbuffer = XMARKER (readcharfun)->buffer;
Jim Blandy's avatar
Jim Blandy committed
238

239
      ptrdiff_t bytepos = marker_byte_position (readcharfun);
240

241 242
      if (bytepos >= BUF_ZV_BYTE (inbuffer))
	return -1;
243

Tom Tromey's avatar
Tom Tromey committed
244
      if (! NILP (BVAR (inbuffer, enable_multibyte_characters)))
245
	{
246
	  /* Fetch the character code from the buffer.  */
247 248
	  unsigned char *p = BUF_BYTE_ADDRESS (inbuffer, bytepos);
	  BUF_INC_POS (inbuffer, bytepos);
249
	  c = STRING_CHAR (p);
250 251
	  if (multibyte)
	    *multibyte = 1;
252 253 254 255
	}
      else
	{
	  c = BUF_FETCH_BYTE (inbuffer, bytepos);
Kenichi Handa's avatar
Kenichi Handa committed
256 257
	  if (! ASCII_BYTE_P (c))
	    c = BYTE8_TO_CHAR (c);
258
	  bytepos++;
259 260
	}

261 262 263 264
      XMARKER (readcharfun)->bytepos = bytepos;
      XMARKER (readcharfun)->charpos++;

      return c;
Jim Blandy's avatar
Jim Blandy committed
265
    }
266 267

  if (EQ (readcharfun, Qlambda))
Kenichi Handa's avatar
Kenichi Handa committed
268 269 270 271
    {
      readbyte = readbyte_for_lambda;
      goto read_multibyte;
    }
272

Jim Blandy's avatar
Jim Blandy committed
273
  if (EQ (readcharfun, Qget_file_char))
274
    {
Kenichi Handa's avatar
Kenichi Handa committed
275 276
      readbyte = readbyte_from_file;
      goto read_multibyte;
277
    }
Jim Blandy's avatar
Jim Blandy committed
278

279
  if (STRINGP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
280
    {
281
      if (read_from_string_index >= read_from_string_limit)
Jim Blandy's avatar
Jim Blandy committed
282
	c = -1;
283 284 285 286 287 288 289 290
      else if (STRING_MULTIBYTE (readcharfun))
	{
	  if (multibyte)
	    *multibyte = 1;
	  FETCH_STRING_CHAR_ADVANCE_NO_CHECK (c, readcharfun,
					      read_from_string_index,
					      read_from_string_index_byte);
	}
291
      else
292 293 294 295 296
	{
	  c = SREF (readcharfun, read_from_string_index_byte);
	  read_from_string_index++;
	  read_from_string_index_byte++;
	}
Jim Blandy's avatar
Jim Blandy committed
297 298 299
      return c;
    }

Kenichi Handa's avatar
Kenichi Handa committed
300 301 302 303 304 305 306 307 308 309 310 311
  if (CONSP (readcharfun))
    {
      /* This is the case that read_vector is reading from a unibyte
	 string that contains a byte sequence previously skipped
	 because of #@NUMBER.  The car part of readcharfun is that
	 string, and the cdr part is a value of readcharfun given to
	 read_vector.  */
      readbyte = readbyte_from_string;
      if (EQ (XCDR (readcharfun), Qget_emacs_mule_file_char))
	emacs_mule_encoding = 1;
      goto read_multibyte;
    }
Kenichi Handa's avatar
Kenichi Handa committed
312

Kenichi Handa's avatar
Kenichi Handa committed
313 314 315 316 317 318
  if (EQ (readcharfun, Qget_emacs_mule_file_char))
    {
      readbyte = readbyte_from_file;
      emacs_mule_encoding = 1;
      goto read_multibyte;
    }
Jim Blandy's avatar
Jim Blandy committed
319 320 321

  tem = call0 (readcharfun);

Jim Blandy's avatar
Jim Blandy committed
322
  if (NILP (tem))
Jim Blandy's avatar
Jim Blandy committed
323 324
    return -1;
  return XINT (tem);
Kenichi Handa's avatar
Kenichi Handa committed
325 326 327 328 329 330 331 332 333

 read_multibyte:
  if (unread_char >= 0)
    {
      c = unread_char;
      unread_char = -1;
      return c;
    }
  c = (*readbyte) (-1, readcharfun);
334 335 336 337 338
  if (c < 0 || load_each_byte)
    return c;
  if (multibyte)
    *multibyte = 1;
  if (ASCII_BYTE_P (c))
Kenichi Handa's avatar
Kenichi Handa committed
339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355
    return c;
  if (emacs_mule_encoding)
    return read_emacs_mule_char (c, readbyte, readcharfun);
  i = 0;
  buf[i++] = c;
  len = BYTES_BY_CHAR_HEAD (c);
  while (i < len)
    {
      c = (*readbyte) (-1, readcharfun);
      if (c < 0 || ! TRAILING_CODE_P (c))
	{
	  while (--i > 1)
	    (*readbyte) (buf[i], readcharfun);
	  return BYTE8_TO_CHAR (buf[0]);
	}
      buf[i++] = c;
    }
356
  return STRING_CHAR (buf);
Jim Blandy's avatar
Jim Blandy committed
357 358 359 360 361 362
}

/* Unread the character C in the way appropriate for the stream READCHARFUN.
   If the stream is a user function, call it with the char as argument.  */

static void
363
unreadchar (Lisp_Object readcharfun, int c)
Jim Blandy's avatar
Jim Blandy committed
364
{
365
  readchar_count--;
366 367 368 369
  if (c == -1)
    /* Don't back up the pointer if we're unreading the end-of-input mark,
       since readchar didn't advance it when we read it.  */
    ;
370
  else if (BUFFERP (readcharfun))
371
    {
372
      struct buffer *b = XBUFFER (readcharfun);
373 374
      ptrdiff_t charpos = BUF_PT (b);
      ptrdiff_t bytepos = BUF_PT_BYTE (b);
375

Tom Tromey's avatar
Tom Tromey committed
376
      if (! NILP (BVAR (b, enable_multibyte_characters)))
Kenichi Handa's avatar
Kenichi Handa committed
377
	BUF_DEC_POS (b, bytepos);
378
      else
Kenichi Handa's avatar
Kenichi Handa committed
379
	bytepos--;
380

381
      SET_BUF_PT_BOTH (b, charpos - 1, bytepos);
382
    }
383
  else if (MARKERP (readcharfun))
384
    {
385
      struct buffer *b = XMARKER (readcharfun)->buffer;
386
      ptrdiff_t bytepos = XMARKER (readcharfun)->bytepos;
387

Kenichi Handa's avatar
Kenichi Handa committed
388
      XMARKER (readcharfun)->charpos--;
Tom Tromey's avatar
Tom Tromey committed
389
      if (! NILP (BVAR (b, enable_multibyte_characters)))
Kenichi Handa's avatar
Kenichi Handa committed
390
	BUF_DEC_POS (b, bytepos);
391
      else
Kenichi Handa's avatar
Kenichi Handa committed
392
	bytepos--;
393

Kenichi Handa's avatar
Kenichi Handa committed
394
      XMARKER (readcharfun)->bytepos = bytepos;
395
    }
396
  else if (STRINGP (readcharfun))
397 398 399 400 401
    {
      read_from_string_index--;
      read_from_string_index_byte
	= string_char_to_byte (readcharfun, read_from_string_index);
    }
Kenichi Handa's avatar
Kenichi Handa committed
402 403 404 405
  else if (CONSP (readcharfun))
    {
      unread_char = c;
    }
406
  else if (EQ (readcharfun, Qlambda))
Kenichi Handa's avatar
Kenichi Handa committed
407 408 409 410 411 412 413
    {
      unread_char = c;
    }
  else if (EQ (readcharfun, Qget_file_char)
	   || EQ (readcharfun, Qget_emacs_mule_file_char))
    {
      if (load_each_byte)
Miles Bader's avatar
Miles Bader committed
414 415 416 417 418
	{
	  BLOCK_INPUT;
	  ungetc (c, instream);
	  UNBLOCK_INPUT;
	}
Kenichi Handa's avatar
Kenichi Handa committed
419 420 421
      else
	unread_char = c;
    }
Jim Blandy's avatar
Jim Blandy committed
422 423 424 425
  else
    call1 (readcharfun, make_number (c));
}

Kenichi Handa's avatar
Kenichi Handa committed
426
static int
427
readbyte_for_lambda (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
428 429 430 431 432 433
{
  return read_bytecode_char (c >= 0);
}


static int
434
readbyte_from_file (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
435 436 437
{
  if (c >= 0)
    {
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
438
      BLOCK_INPUT;
Kenichi Handa's avatar
Kenichi Handa committed
439
      ungetc (c, instream);
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
440
      UNBLOCK_INPUT;
Kenichi Handa's avatar
Kenichi Handa committed
441 442 443
      return 0;
    }

Miles Bader's avatar
Miles Bader committed
444
  BLOCK_INPUT;
Kenichi Handa's avatar
Kenichi Handa committed
445
  c = getc (instream);
Miles Bader's avatar
Miles Bader committed
446

Kenichi Handa's avatar
Kenichi Handa committed
447
#ifdef EINTR
448
  /* Interrupted reads have been observed while reading over the network.  */
Miles Bader's avatar
Miles Bader committed
449 450
  while (c == EOF && ferror (instream) && errno == EINTR)
    {
Miles Bader's avatar
Miles Bader committed
451
      UNBLOCK_INPUT;
Miles Bader's avatar
Miles Bader committed
452 453
      QUIT;
      BLOCK_INPUT;
Miles Bader's avatar
Miles Bader committed
454
      clearerr (instream);
Miles Bader's avatar
Miles Bader committed
455
      c = getc (instream);
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
456
    }
Kenichi Handa's avatar
Kenichi Handa committed
457
#endif
Miles Bader's avatar
Miles Bader committed
458

Miles Bader's avatar
Miles Bader committed
459 460
  UNBLOCK_INPUT;

Kenichi Handa's avatar
Kenichi Handa committed
461 462 463 464
  return (c == EOF ? -1 : c);
}

static int
465
readbyte_from_string (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
466 467 468 469 470 471 472 473 474
{
  Lisp_Object string = XCAR (readcharfun);

  if (c >= 0)
    {
      read_from_string_index--;
      read_from_string_index_byte
	= string_char_to_byte (string, read_from_string_index);
    }
Kenichi Handa's avatar
Kenichi Handa committed
475

Kenichi Handa's avatar
Kenichi Handa committed
476 477 478 479 480 481 482 483 484 485 486 487 488 489 490
  if (read_from_string_index >= read_from_string_limit)
    c = -1;
  else
    FETCH_STRING_CHAR_ADVANCE (c, string,
			       read_from_string_index,
			       read_from_string_index_byte);
  return c;
}


/* Read one non-ASCII character from INSTREAM.  The character is
   encoded in `emacs-mule' and the first byte is already read in
   C.  */

static int
491
read_emacs_mule_char (int c, int (*readbyte) (int, Lisp_Object), Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519
{
  /* Emacs-mule coding uses at most 4-byte for one character.  */
  unsigned char buf[4];
  int len = emacs_mule_bytes[c];
  struct charset *charset;
  int i;
  unsigned code;

  if (len == 1)
    /* C is not a valid leading-code of `emacs-mule'.  */
    return BYTE8_TO_CHAR (c);

  i = 0;
  buf[i++] = c;
  while (i < len)
    {
      c = (*readbyte) (-1, readcharfun);
      if (c < 0xA0)
	{
	  while (--i > 1)
	    (*readbyte) (buf[i], readcharfun);
	  return BYTE8_TO_CHAR (buf[0]);
	}
      buf[i++] = c;
    }

  if (len == 2)
    {
520
      charset = CHARSET_FROM_ID (emacs_mule_charset[buf[0]]);
Kenichi Handa's avatar
Kenichi Handa committed
521 522 523 524 525 526 527
      code = buf[1] & 0x7F;
    }
  else if (len == 3)
    {
      if (buf[0] == EMACS_MULE_LEADING_CODE_PRIVATE_11
	  || buf[0] == EMACS_MULE_LEADING_CODE_PRIVATE_12)
	{
528
	  charset = CHARSET_FROM_ID (emacs_mule_charset[buf[1]]);
Kenichi Handa's avatar
Kenichi Handa committed
529 530 531 532
	  code = buf[2] & 0x7F;
	}
      else
	{
533
	  charset = CHARSET_FROM_ID (emacs_mule_charset[buf[0]]);
Kenichi Handa's avatar
Kenichi Handa committed
534 535 536 537 538
	  code = ((buf[1] << 8) | buf[2]) & 0x7F7F;
	}
    }
  else
    {
539
      charset = CHARSET_FROM_ID (emacs_mule_charset[buf[1]]);
Kenichi Handa's avatar
Kenichi Handa committed
540
      code = ((buf[2] << 8) | buf[3]) & 0x7F7F;
Kenichi Handa's avatar
Kenichi Handa committed
541 542 543 544 545 546 547 548 549
    }
  c = DECODE_CHAR (charset, code);
  if (c < 0)
    Fsignal (Qinvalid_read_syntax,
	     Fcons (build_string ("invalid multibyte form"), Qnil));
  return c;
}


550 551 552 553
static Lisp_Object read_internal_start (Lisp_Object, Lisp_Object,
                                        Lisp_Object);
static Lisp_Object read0 (Lisp_Object);
static Lisp_Object read1 (Lisp_Object, int *, int);
554

555 556
static Lisp_Object read_list (int, Lisp_Object);
static Lisp_Object read_vector (Lisp_Object, int);
557

558 559 560 561 562
static Lisp_Object substitute_object_recurse (Lisp_Object, Lisp_Object,
                                              Lisp_Object);
static void substitute_object_in_subtree (Lisp_Object,
                                          Lisp_Object);
static void substitute_in_interval (INTERVAL, Lisp_Object);
563

Jim Blandy's avatar
Jim Blandy committed
564

565
/* Get a character from the tty.  */
Jim Blandy's avatar
Jim Blandy committed
566

567 568 569 570 571 572 573 574 575 576 577 578 579
/* Read input events until we get one that's acceptable for our purposes.

   If NO_SWITCH_FRAME is non-zero, switch-frame events are stashed
   until we get a character we like, and then stuffed into
   unread_switch_frame.

   If ASCII_REQUIRED is non-zero, we check function key events to see
   if the unmodified version of the symbol has a Qascii_character
   property, and use that character, if present.

   If ERROR_NONASCII is non-zero, we signal an error if the input we
   get isn't an ASCII character with modifiers.  If it's zero but
   ASCII_REQUIRED is non-zero, we just re-read until we get an ASCII
580 581 582
   character.

   If INPUT_METHOD is nonzero, we invoke the current input method
583 584 585 586
   if the character warrants that.

   If SECONDS is a number, we wait that many seconds for input, and
   return Qnil if no input arrives within that time.  */
587

Andreas Schwab's avatar
Andreas Schwab committed
588
static Lisp_Object
Andreas Schwab's avatar
Andreas Schwab committed
589 590
read_filtered_event (int no_switch_frame, int ascii_required,
		     int error_nonascii, int input_method, Lisp_Object seconds)
591
{
592
  Lisp_Object val, delayed_switch_frame;
593
  EMACS_TIME end_time;
594

595
#ifdef HAVE_WINDOW_SYSTEM
596 597
  if (display_hourglass_p)
    cancel_hourglass ();
598
#endif
599

600
  delayed_switch_frame = Qnil;
601

602 603 604
  /* Compute timeout.  */
  if (NUMBERP (seconds))
    {
605
      double duration = extract_float (seconds);
606
      EMACS_TIME wait_time = EMACS_TIME_FROM_DOUBLE (duration);
607 608 609 610
      EMACS_GET_TIME (end_time);
      EMACS_ADD_TIME (end_time, end_time, wait_time);
    }

Karoly Lorentey's avatar
Karoly Lorentey committed
611
/* Read until we get an acceptable event.  */
612
 retry:
613
  do
Karoly Lorentey's avatar
Karoly Lorentey committed
614 615
    val = read_char (0, 0, 0, (input_method ? Qnil : Qt), 0,
		     NUMBERP (seconds) ? &end_time : NULL);
616
  while (INTEGERP (val) && XINT (val) == -2); /* wrong_kboard_jmpbuf */
617

618
  if (BUFFERP (val))
619 620
    goto retry;

621
  /* switch-frame events are put off until after the next ASCII
Karl Heuer's avatar
Karl Heuer committed
622
     character.  This is better than signaling an error just because
623 624 625 626 627
     the last characters were typed to a separate minibuffer frame,
     for example.  Eventually, some code which can deal with
     switch-frame events will read it and process it.  */
  if (no_switch_frame
      && EVENT_HAS_PARAMETERS (val)
628
      && EQ (EVENT_HEAD_KIND (EVENT_HEAD (val)), Qswitch_frame))
629 630 631 632 633
    {
      delayed_switch_frame = val;
      goto retry;
    }

634
  if (ascii_required && !(NUMBERP (seconds) && NILP (val)))
635 636
    {
      /* Convert certain symbols to their ASCII equivalents.  */
637
      if (SYMBOLP (val))
638
	{
639
	  Lisp_Object tem, tem1;
640 641 642 643 644 645 646
	  tem = Fget (val, Qevent_symbol_element_mask);
	  if (!NILP (tem))
	    {
	      tem1 = Fget (Fcar (tem), Qascii_character);
	      /* Merge this symbol's modifier bits
		 with the ASCII equivalent of its basic code.  */
	      if (!NILP (tem1))
647
		XSETFASTINT (val, XINT (tem1) | XINT (Fcar (Fcdr (tem))));
648 649
	    }
	}
650

651
      /* If we don't have a character now, deal with it appropriately.  */
652
      if (!INTEGERP (val))
653 654 655
	{
	  if (error_nonascii)
	    {
656
	      Vunread_command_events = Fcons (val, Qnil);
657 658 659 660 661 662 663 664 665 666
	      error ("Non-character input-event");
	    }
	  else
	    goto retry;
	}
    }

  if (! NILP (delayed_switch_frame))
    unread_switch_frame = delayed_switch_frame;

667 668
#if 0

669
#ifdef HAVE_WINDOW_SYSTEM
670 671
  if (display_hourglass_p)
    start_hourglass ();
672
#endif
673 674 675

#endif

676 677 678
  return val;
}

Paul Eggert's avatar
Paul Eggert committed
679
DEFUN ("read-char", Fread_char, Sread_char, 0, 3, 0,
680 681
       doc: /* Read a character from the command input (keyboard or macro).
It is returned as a number.
682 683 684
If the character has modifiers, they are resolved and reflected to the
character code if possible (e.g. C-SPC -> 0).

685 686
If the user generates an event which is not a character (i.e. a mouse
click or function key event), `read-char' signals an error.  As an
687 688
exception, switch-frame events are put off until non-character events
can be read.
689 690 691 692 693 694
If you want to read non-character events, or ignore them, call
`read-event' or `read-char-exclusive' instead.

If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
695 696 697 698 699
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
700
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
701
{
702 703
  Lisp_Object val;

704 705
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
706
  val = read_filtered_event (1, 1, 1, ! NILP (inherit_input_method), seconds);
707 708 709

  return (NILP (val) ? Qnil
	  : make_number (char_resolve_modifier_mask (XINT (val))));
Jim Blandy's avatar
Jim Blandy committed
710 711
}

Paul Eggert's avatar
Paul Eggert committed
712
DEFUN ("read-event", Fread_event, Sread_event, 0, 3, 0,
713 714 715 716
       doc: /* Read an event object from the input stream.
If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
717 718 719 720 721
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
722
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
723
{
724 725
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
726
  return read_filtered_event (0, 0, 0, ! NILP (inherit_input_method), seconds);
Jim Blandy's avatar
Jim Blandy committed
727 728
}

729
DEFUN ("read-char-exclusive", Fread_char_exclusive, Sread_char_exclusive, 0, 3, 0,
730 731
       doc: /* Read a character from the command input (keyboard or macro).
It is returned as a number.  Non-character events are ignored.
732 733
If the character has modifiers, they are resolved and reflected to the
character code if possible (e.g. C-SPC -> 0).
734 735 736 737

If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
738 739 740 741 742
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
743
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
744
{
745 746
  Lisp_Object val;

747 748
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
749

750
  val = read_filtered_event (1, 1, 0, ! NILP (inherit_input_method), seconds);
751 752 753

  return (NILP (val) ? Qnil
	  : make_number (char_resolve_modifier_mask (XINT (val))));
Jim Blandy's avatar
Jim Blandy committed
754 755 756
}

DEFUN ("get-file-char", Fget_file_char, Sget_file_char, 0, 0, 0,
757
       doc: /* Don't use this yourself.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
758
  (void)
Jim Blandy's avatar
Jim Blandy committed
759 760
{
  register Lisp_Object val;
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
761
  BLOCK_INPUT;
762
  XSETINT (val, getc (instream));
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
763
  UNBLOCK_INPUT;
Jim Blandy's avatar
Jim Blandy committed
764 765
  return val;
}
766 767


768 769 770 771 772 773 774 775


/* Return true if the lisp code read using READCHARFUN defines a non-nil
   `lexical-binding' file variable.  After returning, the stream is
   positioned following the first line, if it is a comment, otherwise
   nothing is read.  */

static int
Stefan Monnier's avatar
Stefan Monnier committed
776
lisp_file_lexically_bound_p (Lisp_Object readcharfun)
777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793
{
  int ch = READCHAR;
  if (ch != ';')
    /* The first line isn't a comment, just give up.  */
    {
      UNREAD (ch);
      return 0;
    }
  else
    /* Look for an appropriate file-variable in the first line.  */
    {
      int rv = 0;
      enum {
	NOMINAL, AFTER_FIRST_DASH, AFTER_ASTERIX,
      } beg_end_state = NOMINAL;
      int in_file_vars = 0;

794 795 796 797 798 799 800 801 802 803
#define UPDATE_BEG_END_STATE(ch)				\
  if (beg_end_state == NOMINAL)					\
    beg_end_state = (ch == '-' ? AFTER_FIRST_DASH : NOMINAL);	\
  else if (beg_end_state == AFTER_FIRST_DASH)			\
    beg_end_state = (ch == '*' ? AFTER_ASTERIX : NOMINAL);	\
  else if (beg_end_state == AFTER_ASTERIX)			\
    {								\
      if (ch == '-')						\
	in_file_vars = !in_file_vars;				\
      beg_end_state = NOMINAL;					\
804 805 806 807 808 809 810 811 812 813 814 815
    }

      /* Skip until we get to the file vars, if any.  */
      do
	{
	  ch = READCHAR;
	  UPDATE_BEG_END_STATE (ch);
	}
      while (!in_file_vars && ch != '\n' && ch != EOF);

      while (in_file_vars)
	{
816
	  char var[100], val[100];
817
	  unsigned i;
818 819 820 821 822 823 824

	  ch = READCHAR;

	  /* Read a variable name.  */
	  while (ch == ' ' || ch == '\t')
	    ch = READCHAR;

825
	  i = 0;
826
	  while (ch != ':' && ch != '\n' && ch != EOF && in_file_vars)
827
	    {
828 829
	      if (i < sizeof var - 1)
		var[i++] = ch;
830 831 832
	      UPDATE_BEG_END_STATE (ch);
	      ch = READCHAR;
	    }
833

834
	  /* Stop scanning if no colon was found before end marker.  */
835
	  if (!in_file_vars || ch == '\n' || ch == EOF)
836 837
	    break;

838 839 840
	  while (i > 0 && (var[i - 1] == ' ' || var[i - 1] == '\t'))
	    i--;
	  var[i] = '\0';
841 842 843 844 845 846 847 848 849

	  if (ch == ':')
	    {
	      /* Read a variable value.  */
	      ch = READCHAR;

	      while (ch == ' ' || ch == '\t')
		ch = READCHAR;

850
	      i = 0;
851 852
	      while (ch != ';' && ch != '\n' && ch != EOF && in_file_vars)
		{
853 854
		  if (i < sizeof val - 1)
		    val[i++] = ch;
855 856 857 858
		  UPDATE_BEG_END_STATE (ch);
		  ch = READCHAR;
		}
	      if (! in_file_vars)
859
		/* The value was terminated by an end-marker, which remove.  */
860 861 862 863
		i -= 3;
	      while (i > 0 && (val[i - 1] == ' ' || val[i - 1] == '\t'))
		i--;
	      val[i] = '\0';
864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879

	      if (strcmp (var, "lexical-binding") == 0)
		/* This is it...  */
		{
		  rv = (strcmp (val, "nil") != 0);
		  break;
		}
	    }
	}

      while (ch != '\n' && ch != EOF)
	ch = READCHAR;

      return rv;
    }
}
880

Kenichi Handa's avatar
Kenichi Handa committed
881
/* Value is a version number of byte compiled code if the file
Miles Bader's avatar
Miles Bader committed
882
   associated with file descriptor FD is a compiled Lisp file that's
Kenichi Handa's avatar
Kenichi Handa committed
883 884 885
   safe to load.  Only files compiled with Emacs are safe to load.
   Files compiled with XEmacs can lead to a crash in Fbyte_code
   because of an incompatible change in the byte compiler.  */
886 887

static int
888
safe_to_load_p (int fd)
889 890 891 892
{
  char buf[512];
  int nbytes, i;
  int safe_p = 1;
Kenichi Handa's avatar
Kenichi Handa committed
893
  int version = 1;
894 895 896 897 898 899 900 901 902

  /* Read the first few bytes from the file, and look for a line
     specifying the byte compiler version used.  */
  nbytes = emacs_read (fd, buf, sizeof buf - 1);
  if (nbytes > 0)
    {
      buf[nbytes] = '\0';

      /* Skip to the next newline, skipping over the initial `ELC'
Dave Love's avatar
Dave Love committed
903
	 with NUL bytes following it, but note the version.  */
904
      for (i = 0; i < nbytes && buf[i] != '\n'; ++i)
Dave Love's avatar
Dave Love committed
905
	if (i == 4)
Kenichi Handa's avatar
Kenichi Handa committed
906
	  version = buf[i];
907

908
      if (i >= nbytes
909
	  || fast_c_string_match_ignore_case (Vbytecomp_version_regexp,
910 911 912
					      buf + i) < 0)
	safe_p = 0;
    }
Dave Love's avatar
Dave Love committed
913 914
  if (safe_p)
    safe_p = version;
915 916 917 918 919 920

  lseek (fd, 0, SEEK_SET);
  return safe_p;
}


921 922 923 924
/* Callback for record_unwind_protect.  Restore the old load list OLD,
   after loading a file successfully.  */

static Lisp_Object
925
record_load_unwind (Lisp_Object old)
926 927 928 929
{
  return Vloads_in_progress = old;
}

930 931 932
/* This handler function is used via internal_condition_case_1.  */

static Lisp_Object
933
load_error_handler (Lisp_Object data)
934 935 936
{
  return Qnil;
}
937

938
static Lisp_Object
939
load_warn_old_style_backquotes (Lisp_Object file)
940 941 942
{