lread.c 134 KB
Newer Older
Jim Blandy's avatar
Jim Blandy committed
1
/* Lisp parsing and input streams.
2

3
Copyright (C) 1985-1989, 1993-1995, 1997-2012  Free Software Foundation, Inc.
Jim Blandy's avatar
Jim Blandy committed
4 5 6

This file is part of GNU Emacs.

7
GNU Emacs is free software: you can redistribute it and/or modify
Jim Blandy's avatar
Jim Blandy committed
8
it under the terms of the GNU General Public License as published by
9 10
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
Jim Blandy's avatar
Jim Blandy committed
11 12 13 14 15 16 17

GNU Emacs is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
18
along with GNU Emacs.  If not, see <http://www.gnu.org/licenses/>.  */
Jim Blandy's avatar
Jim Blandy committed
19 20


Richard M. Stallman's avatar
Richard M. Stallman committed
21
#include <config.h>
Jim Blandy's avatar
Jim Blandy committed
22 23 24 25
#include <stdio.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <sys/file.h>
26
#include <errno.h>
27
#include <limits.h>	/* For CHAR_BIT.  */
28
#include <stat-time.h>
Jim Blandy's avatar
Jim Blandy committed
29
#include "lisp.h"
30
#include "intervals.h"
Kenichi Handa's avatar
Kenichi Handa committed
31
#include "character.h"
32
#include "buffer.h"
Karl Heuer's avatar
Karl Heuer committed
33
#include "charset.h"
Kenichi Handa's avatar
Kenichi Handa committed
34
#include "coding.h"
35
#include <epaths.h>
Jim Blandy's avatar
Jim Blandy committed
36
#include "commands.h"
Jim Blandy's avatar
Jim Blandy committed
37
#include "keyboard.h"
38
#include "frame.h"
39
#include "termhooks.h"
40
#include "coding.h"
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
41
#include "blockinput.h"
Jim Blandy's avatar
Jim Blandy committed
42

43 44 45 46
#ifdef MSDOS
#include "msdos.h"
#endif

47 48 49 50
#ifdef HAVE_NS
#include "nsterm.h"
#endif

Andreas Schwab's avatar
Andreas Schwab committed
51
#include <unistd.h>
Jim Blandy's avatar
Jim Blandy committed
52

Richard M. Stallman's avatar
Richard M. Stallman committed
53 54 55 56
#ifdef HAVE_SETLOCALE
#include <locale.h>
#endif /* HAVE_SETLOCALE */

Dave Love's avatar
Dave Love committed
57
#include <fcntl.h>
Richard M. Stallman's avatar
Richard M. Stallman committed
58

59
#ifdef HAVE_FSEEKO
60 61 62 63 64 65 66
#define file_offset off_t
#define file_tell ftello
#else
#define file_offset long
#define file_tell ftell
#endif

67
/* Hash table read constants.  */
68 69 70 71 72 73 74 75
static Lisp_Object Qhash_table, Qdata;
static Lisp_Object Qtest, Qsize;
static Lisp_Object Qweakness;
static Lisp_Object Qrehash_size;
static Lisp_Object Qrehash_threshold;

static Lisp_Object Qread_char, Qget_file_char, Qcurrent_load_list;
Lisp_Object Qstandard_input;
76
Lisp_Object Qvariable_documentation;
77
static Lisp_Object Qascii_character, Qload, Qload_file_name;
78
Lisp_Object Qbackquote, Qcomma, Qcomma_at, Qcomma_dot, Qfunction;
79 80
static Lisp_Object Qinhibit_file_name_operation;
static Lisp_Object Qeval_buffer_list;
81
Lisp_Object Qlexical_binding;
82
static Lisp_Object Qfile_truename, Qdo_after_load_evaluation; /* ACM 2006/5/16 */
83

Kenichi Handa's avatar
Kenichi Handa committed
84 85 86 87 88 89
/* Used instead of Qget_file_char while loading *.elc files compiled
   by Emacs 21 or older.  */
static Lisp_Object Qget_emacs_mule_file_char;

static Lisp_Object Qload_force_doc_strings;

90
static Lisp_Object Qload_in_progress;
Ken Raeburn's avatar
Ken Raeburn committed
91

92 93 94 95
/* The association list of objects read with the #n=object form.
   Each member of the list has the form (n . object), and is used to
   look up the object for the corresponding #n# construct.
   It must be set to nil before all top-level calls to read0.  */
96
static Lisp_Object read_objects;
97

Kenichi Handa's avatar
Kenichi Handa committed
98 99 100 101 102
/* Nonzero means READCHAR should read bytes one by one (not character)
   when READCHARFUN is Qget_file_char or Qget_emacs_mule_file_char.
   This is set to 1 by read1 temporarily while handling #@NUMBER.  */
static int load_each_byte;

103 104 105
/* List of descriptors now open for Fload.  */
static Lisp_Object load_descriptor_list;

106
/* File for get_file_char to read from.  Used by load.  */
Jim Blandy's avatar
Jim Blandy committed
107 108
static FILE *instream;

109
/* For use within read-from-string (this reader is non-reentrant!!)  */
110 111 112
static ptrdiff_t read_from_string_index;
static ptrdiff_t read_from_string_index_byte;
static ptrdiff_t read_from_string_limit;
113

114
/* Number of characters read in the current call to Fread or
115
   Fread_from_string.  */
116
static EMACS_INT readchar_count;
117

118
/* This contains the last string skipped with #@.  */
119 120
static char *saved_doc_string;
/* Length of buffer allocated in saved_doc_string.  */
121
static ptrdiff_t saved_doc_string_size;
122
/* Length of actual data in saved_doc_string.  */
123
static ptrdiff_t saved_doc_string_length;
124
/* This is the file position that string came from.  */
125
static file_offset saved_doc_string_position;
126

127 128 129 130 131
/* This contains the previous string skipped with #@.
   We copy it from saved_doc_string when a new string
   is put in saved_doc_string.  */
static char *prev_saved_doc_string;
/* Length of buffer allocated in prev_saved_doc_string.  */
132
static ptrdiff_t prev_saved_doc_string_size;
133
/* Length of actual data in prev_saved_doc_string.  */
134
static ptrdiff_t prev_saved_doc_string_length;
135
/* This is the file position that string came from.  */
136
static file_offset prev_saved_doc_string_position;
137

138 139 140 141 142
/* Nonzero means inside a new-style backquote
   with no surrounding parentheses.
   Fread initializes this to zero, so we need not specbind it
   or worry about what happens to it when there is an error.  */
static int new_backquote_flag;
143
static Lisp_Object Qold_style_backquotes;
144 145 146 147

/* A list of file names for files being loaded in Fload.  Used to
   check for recursive loads.  */

Lute Kamstra's avatar
Lute Kamstra committed
148
static Lisp_Object Vloads_in_progress;
149

150 151
static int read_emacs_mule_char (int, int (*) (int, Lisp_Object),
                                 Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
152

153
static void readevalloop (Lisp_Object, FILE*, Lisp_Object, int,
154 155 156 157
                          Lisp_Object, Lisp_Object,
                          Lisp_Object, Lisp_Object);
static Lisp_Object load_unwind (Lisp_Object);
static Lisp_Object load_descriptor_unwind (Lisp_Object);
Jim Blandy's avatar
Jim Blandy committed
158

Kenichi Handa's avatar
Kenichi Handa committed
159 160 161 162 163 164
/* Functions that read one byte from the current source READCHARFUN
   or unread one byte.  If the integer argument C is -1, they return
   the byte read, or -1 when the source has no more bytes.  If C is 0
   or positive, they unread C, and the return value is not
   meaningful.  */

165 166 167
static int readbyte_for_lambda (int, Lisp_Object);
static int readbyte_from_file (int, Lisp_Object);
static int readbyte_from_string (int, Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
168

Jim Blandy's avatar
Jim Blandy committed
169 170
/* Handle unreading and rereading of characters.
   Write READCHAR to read a character,
Karl Heuer's avatar
Karl Heuer committed
171 172
   UNREAD(c) to unread c to be read again.

Kenichi Handa's avatar
Kenichi Handa committed
173
   These macros correctly read/unread multibyte characters.  */
Jim Blandy's avatar
Jim Blandy committed
174

175
#define READCHAR readchar (readcharfun, NULL)
Jim Blandy's avatar
Jim Blandy committed
176 177
#define UNREAD(c) unreadchar (readcharfun, c)

178 179 180
/* Same as READCHAR but set *MULTIBYTE to the multibyteness of the source.  */
#define READCHAR_REPORT_MULTIBYTE(multibyte) readchar (readcharfun, multibyte)

Kenichi Handa's avatar
Kenichi Handa committed
181
/* When READCHARFUN is Qget_file_char, Qget_emacs_mule_file_char,
Kenichi Handa's avatar
Kenichi Handa committed
182 183
   Qlambda, or a cons, we use this to keep an unread character because
   a file stream can't handle multibyte-char unreading.  The value -1
184
   means that there's no unread character.  */
Kenichi Handa's avatar
Kenichi Handa committed
185 186
static int unread_char;

Jim Blandy's avatar
Jim Blandy committed
187
static int
188
readchar (Lisp_Object readcharfun, bool *multibyte)
Jim Blandy's avatar
Jim Blandy committed
189 190
{
  Lisp_Object tem;
191
  register int c;
192
  int (*readbyte) (int, Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
193 194 195
  unsigned char buf[MAX_MULTIBYTE_LENGTH];
  int i, len;
  int emacs_mule_encoding = 0;
Jim Blandy's avatar
Jim Blandy committed
196

197 198 199
  if (multibyte)
    *multibyte = 0;

200
  readchar_count++;
201

202
  if (BUFFERP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
203
    {
204
      register struct buffer *inbuffer = XBUFFER (readcharfun);
Jim Blandy's avatar
Jim Blandy committed
205

206
      ptrdiff_t pt_byte = BUF_PT_BYTE (inbuffer);
207

208 209
      if (pt_byte >= BUF_ZV_BYTE (inbuffer))
	return -1;
Jim Blandy's avatar
Jim Blandy committed
210

Tom Tromey's avatar
Tom Tromey committed
211
      if (! NILP (BVAR (inbuffer, enable_multibyte_characters)))
212
	{
213
	  /* Fetch the character code from the buffer.  */
214 215
	  unsigned char *p = BUF_BYTE_ADDRESS (inbuffer, pt_byte);
	  BUF_INC_POS (inbuffer, pt_byte);
216
	  c = STRING_CHAR (p);
217 218
	  if (multibyte)
	    *multibyte = 1;
219 220 221 222
	}
      else
	{
	  c = BUF_FETCH_BYTE (inbuffer, pt_byte);
Kenichi Handa's avatar
Kenichi Handa committed
223 224
	  if (! ASCII_BYTE_P (c))
	    c = BYTE8_TO_CHAR (c);
225
	  pt_byte++;
226
	}
227
      SET_BUF_PT_BOTH (inbuffer, BUF_PT (inbuffer) + 1, pt_byte);
228

229
      return c;
Jim Blandy's avatar
Jim Blandy committed
230
    }
231
  if (MARKERP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
232
    {
233
      register struct buffer *inbuffer = XMARKER (readcharfun)->buffer;
Jim Blandy's avatar
Jim Blandy committed
234

235
      ptrdiff_t bytepos = marker_byte_position (readcharfun);
236

237 238
      if (bytepos >= BUF_ZV_BYTE (inbuffer))
	return -1;
239

Tom Tromey's avatar
Tom Tromey committed
240
      if (! NILP (BVAR (inbuffer, enable_multibyte_characters)))
241
	{
242
	  /* Fetch the character code from the buffer.  */
243 244
	  unsigned char *p = BUF_BYTE_ADDRESS (inbuffer, bytepos);
	  BUF_INC_POS (inbuffer, bytepos);
245
	  c = STRING_CHAR (p);
246 247
	  if (multibyte)
	    *multibyte = 1;
248 249 250 251
	}
      else
	{
	  c = BUF_FETCH_BYTE (inbuffer, bytepos);
Kenichi Handa's avatar
Kenichi Handa committed
252 253
	  if (! ASCII_BYTE_P (c))
	    c = BYTE8_TO_CHAR (c);
254
	  bytepos++;
255 256
	}

257 258 259 260
      XMARKER (readcharfun)->bytepos = bytepos;
      XMARKER (readcharfun)->charpos++;

      return c;
Jim Blandy's avatar
Jim Blandy committed
261
    }
262 263

  if (EQ (readcharfun, Qlambda))
Kenichi Handa's avatar
Kenichi Handa committed
264 265 266 267
    {
      readbyte = readbyte_for_lambda;
      goto read_multibyte;
    }
268

Jim Blandy's avatar
Jim Blandy committed
269
  if (EQ (readcharfun, Qget_file_char))
270
    {
Kenichi Handa's avatar
Kenichi Handa committed
271 272
      readbyte = readbyte_from_file;
      goto read_multibyte;
273
    }
Jim Blandy's avatar
Jim Blandy committed
274

275
  if (STRINGP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
276
    {
277
      if (read_from_string_index >= read_from_string_limit)
Jim Blandy's avatar
Jim Blandy committed
278
	c = -1;
279 280 281 282 283 284 285 286
      else if (STRING_MULTIBYTE (readcharfun))
	{
	  if (multibyte)
	    *multibyte = 1;
	  FETCH_STRING_CHAR_ADVANCE_NO_CHECK (c, readcharfun,
					      read_from_string_index,
					      read_from_string_index_byte);
	}
287
      else
288 289 290 291 292
	{
	  c = SREF (readcharfun, read_from_string_index_byte);
	  read_from_string_index++;
	  read_from_string_index_byte++;
	}
Jim Blandy's avatar
Jim Blandy committed
293 294 295
      return c;
    }

Kenichi Handa's avatar
Kenichi Handa committed
296 297 298 299 300 301 302 303 304 305 306 307
  if (CONSP (readcharfun))
    {
      /* This is the case that read_vector is reading from a unibyte
	 string that contains a byte sequence previously skipped
	 because of #@NUMBER.  The car part of readcharfun is that
	 string, and the cdr part is a value of readcharfun given to
	 read_vector.  */
      readbyte = readbyte_from_string;
      if (EQ (XCDR (readcharfun), Qget_emacs_mule_file_char))
	emacs_mule_encoding = 1;
      goto read_multibyte;
    }
Kenichi Handa's avatar
Kenichi Handa committed
308

Kenichi Handa's avatar
Kenichi Handa committed
309 310 311 312 313 314
  if (EQ (readcharfun, Qget_emacs_mule_file_char))
    {
      readbyte = readbyte_from_file;
      emacs_mule_encoding = 1;
      goto read_multibyte;
    }
Jim Blandy's avatar
Jim Blandy committed
315 316 317

  tem = call0 (readcharfun);

Jim Blandy's avatar
Jim Blandy committed
318
  if (NILP (tem))
Jim Blandy's avatar
Jim Blandy committed
319 320
    return -1;
  return XINT (tem);
Kenichi Handa's avatar
Kenichi Handa committed
321 322 323 324 325 326 327 328 329

 read_multibyte:
  if (unread_char >= 0)
    {
      c = unread_char;
      unread_char = -1;
      return c;
    }
  c = (*readbyte) (-1, readcharfun);
330 331 332 333 334
  if (c < 0 || load_each_byte)
    return c;
  if (multibyte)
    *multibyte = 1;
  if (ASCII_BYTE_P (c))
Kenichi Handa's avatar
Kenichi Handa committed
335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351
    return c;
  if (emacs_mule_encoding)
    return read_emacs_mule_char (c, readbyte, readcharfun);
  i = 0;
  buf[i++] = c;
  len = BYTES_BY_CHAR_HEAD (c);
  while (i < len)
    {
      c = (*readbyte) (-1, readcharfun);
      if (c < 0 || ! TRAILING_CODE_P (c))
	{
	  while (--i > 1)
	    (*readbyte) (buf[i], readcharfun);
	  return BYTE8_TO_CHAR (buf[0]);
	}
      buf[i++] = c;
    }
352
  return STRING_CHAR (buf);
Jim Blandy's avatar
Jim Blandy committed
353 354 355 356 357 358
}

/* Unread the character C in the way appropriate for the stream READCHARFUN.
   If the stream is a user function, call it with the char as argument.  */

static void
359
unreadchar (Lisp_Object readcharfun, int c)
Jim Blandy's avatar
Jim Blandy committed
360
{
361
  readchar_count--;
362 363 364 365
  if (c == -1)
    /* Don't back up the pointer if we're unreading the end-of-input mark,
       since readchar didn't advance it when we read it.  */
    ;
366
  else if (BUFFERP (readcharfun))
367
    {
368
      struct buffer *b = XBUFFER (readcharfun);
369 370
      ptrdiff_t charpos = BUF_PT (b);
      ptrdiff_t bytepos = BUF_PT_BYTE (b);
371

Tom Tromey's avatar
Tom Tromey committed
372
      if (! NILP (BVAR (b, enable_multibyte_characters)))
Kenichi Handa's avatar
Kenichi Handa committed
373
	BUF_DEC_POS (b, bytepos);
374
      else
Kenichi Handa's avatar
Kenichi Handa committed
375
	bytepos--;
376

377
      SET_BUF_PT_BOTH (b, charpos - 1, bytepos);
378
    }
379
  else if (MARKERP (readcharfun))
380
    {
381
      struct buffer *b = XMARKER (readcharfun)->buffer;
382
      ptrdiff_t bytepos = XMARKER (readcharfun)->bytepos;
383

Kenichi Handa's avatar
Kenichi Handa committed
384
      XMARKER (readcharfun)->charpos--;
Tom Tromey's avatar
Tom Tromey committed
385
      if (! NILP (BVAR (b, enable_multibyte_characters)))
Kenichi Handa's avatar
Kenichi Handa committed
386
	BUF_DEC_POS (b, bytepos);
387
      else
Kenichi Handa's avatar
Kenichi Handa committed
388
	bytepos--;
389

Kenichi Handa's avatar
Kenichi Handa committed
390
      XMARKER (readcharfun)->bytepos = bytepos;
391
    }
392
  else if (STRINGP (readcharfun))
393 394 395 396 397
    {
      read_from_string_index--;
      read_from_string_index_byte
	= string_char_to_byte (readcharfun, read_from_string_index);
    }
Kenichi Handa's avatar
Kenichi Handa committed
398 399 400 401
  else if (CONSP (readcharfun))
    {
      unread_char = c;
    }
402
  else if (EQ (readcharfun, Qlambda))
Kenichi Handa's avatar
Kenichi Handa committed
403 404 405 406 407 408 409
    {
      unread_char = c;
    }
  else if (EQ (readcharfun, Qget_file_char)
	   || EQ (readcharfun, Qget_emacs_mule_file_char))
    {
      if (load_each_byte)
Miles Bader's avatar
Miles Bader committed
410
	{
411
	  block_input ();
Miles Bader's avatar
Miles Bader committed
412
	  ungetc (c, instream);
413
	  unblock_input ();
Miles Bader's avatar
Miles Bader committed
414
	}
Kenichi Handa's avatar
Kenichi Handa committed
415 416 417
      else
	unread_char = c;
    }
Jim Blandy's avatar
Jim Blandy committed
418 419 420 421
  else
    call1 (readcharfun, make_number (c));
}

Kenichi Handa's avatar
Kenichi Handa committed
422
static int
423
readbyte_for_lambda (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
424 425 426 427 428 429
{
  return read_bytecode_char (c >= 0);
}


static int
430
readbyte_from_file (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
431 432 433
{
  if (c >= 0)
    {
434
      block_input ();
Kenichi Handa's avatar
Kenichi Handa committed
435
      ungetc (c, instream);
436
      unblock_input ();
Kenichi Handa's avatar
Kenichi Handa committed
437 438 439
      return 0;
    }

440
  block_input ();
Kenichi Handa's avatar
Kenichi Handa committed
441
  c = getc (instream);
Miles Bader's avatar
Miles Bader committed
442

Kenichi Handa's avatar
Kenichi Handa committed
443
#ifdef EINTR
444
  /* Interrupted reads have been observed while reading over the network.  */
Miles Bader's avatar
Miles Bader committed
445 446
  while (c == EOF && ferror (instream) && errno == EINTR)
    {
447
      unblock_input ();
Miles Bader's avatar
Miles Bader committed
448
      QUIT;
449
      block_input ();
Miles Bader's avatar
Miles Bader committed
450
      clearerr (instream);
Miles Bader's avatar
Miles Bader committed
451
      c = getc (instream);
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
452
    }
Kenichi Handa's avatar
Kenichi Handa committed
453
#endif
Miles Bader's avatar
Miles Bader committed
454

455
  unblock_input ();
Miles Bader's avatar
Miles Bader committed
456

Kenichi Handa's avatar
Kenichi Handa committed
457 458 459 460
  return (c == EOF ? -1 : c);
}

static int
461
readbyte_from_string (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
462 463 464 465 466 467 468 469 470
{
  Lisp_Object string = XCAR (readcharfun);

  if (c >= 0)
    {
      read_from_string_index--;
      read_from_string_index_byte
	= string_char_to_byte (string, read_from_string_index);
    }
Kenichi Handa's avatar
Kenichi Handa committed
471

Kenichi Handa's avatar
Kenichi Handa committed
472 473 474 475 476 477 478 479 480 481 482 483 484 485 486
  if (read_from_string_index >= read_from_string_limit)
    c = -1;
  else
    FETCH_STRING_CHAR_ADVANCE (c, string,
			       read_from_string_index,
			       read_from_string_index_byte);
  return c;
}


/* Read one non-ASCII character from INSTREAM.  The character is
   encoded in `emacs-mule' and the first byte is already read in
   C.  */

static int
487
read_emacs_mule_char (int c, int (*readbyte) (int, Lisp_Object), Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515
{
  /* Emacs-mule coding uses at most 4-byte for one character.  */
  unsigned char buf[4];
  int len = emacs_mule_bytes[c];
  struct charset *charset;
  int i;
  unsigned code;

  if (len == 1)
    /* C is not a valid leading-code of `emacs-mule'.  */
    return BYTE8_TO_CHAR (c);

  i = 0;
  buf[i++] = c;
  while (i < len)
    {
      c = (*readbyte) (-1, readcharfun);
      if (c < 0xA0)
	{
	  while (--i > 1)
	    (*readbyte) (buf[i], readcharfun);
	  return BYTE8_TO_CHAR (buf[0]);
	}
      buf[i++] = c;
    }

  if (len == 2)
    {
516
      charset = CHARSET_FROM_ID (emacs_mule_charset[buf[0]]);
Kenichi Handa's avatar
Kenichi Handa committed
517 518 519 520 521 522 523
      code = buf[1] & 0x7F;
    }
  else if (len == 3)
    {
      if (buf[0] == EMACS_MULE_LEADING_CODE_PRIVATE_11
	  || buf[0] == EMACS_MULE_LEADING_CODE_PRIVATE_12)
	{
524
	  charset = CHARSET_FROM_ID (emacs_mule_charset[buf[1]]);
Kenichi Handa's avatar
Kenichi Handa committed
525 526 527 528
	  code = buf[2] & 0x7F;
	}
      else
	{
529
	  charset = CHARSET_FROM_ID (emacs_mule_charset[buf[0]]);
Kenichi Handa's avatar
Kenichi Handa committed
530 531 532 533 534
	  code = ((buf[1] << 8) | buf[2]) & 0x7F7F;
	}
    }
  else
    {
535
      charset = CHARSET_FROM_ID (emacs_mule_charset[buf[1]]);
Kenichi Handa's avatar
Kenichi Handa committed
536
      code = ((buf[2] << 8) | buf[3]) & 0x7F7F;
Kenichi Handa's avatar
Kenichi Handa committed
537 538 539 540 541 542 543 544 545
    }
  c = DECODE_CHAR (charset, code);
  if (c < 0)
    Fsignal (Qinvalid_read_syntax,
	     Fcons (build_string ("invalid multibyte form"), Qnil));
  return c;
}


546 547 548 549
static Lisp_Object read_internal_start (Lisp_Object, Lisp_Object,
                                        Lisp_Object);
static Lisp_Object read0 (Lisp_Object);
static Lisp_Object read1 (Lisp_Object, int *, int);
550

551 552
static Lisp_Object read_list (int, Lisp_Object);
static Lisp_Object read_vector (Lisp_Object, int);
553

554 555 556 557 558
static Lisp_Object substitute_object_recurse (Lisp_Object, Lisp_Object,
                                              Lisp_Object);
static void substitute_object_in_subtree (Lisp_Object,
                                          Lisp_Object);
static void substitute_in_interval (INTERVAL, Lisp_Object);
559

Jim Blandy's avatar
Jim Blandy committed
560

561
/* Get a character from the tty.  */
Jim Blandy's avatar
Jim Blandy committed
562

563 564 565 566 567 568 569 570 571 572 573 574 575
/* Read input events until we get one that's acceptable for our purposes.

   If NO_SWITCH_FRAME is non-zero, switch-frame events are stashed
   until we get a character we like, and then stuffed into
   unread_switch_frame.

   If ASCII_REQUIRED is non-zero, we check function key events to see
   if the unmodified version of the symbol has a Qascii_character
   property, and use that character, if present.

   If ERROR_NONASCII is non-zero, we signal an error if the input we
   get isn't an ASCII character with modifiers.  If it's zero but
   ASCII_REQUIRED is non-zero, we just re-read until we get an ASCII
576 577 578
   character.

   If INPUT_METHOD is nonzero, we invoke the current input method
579 580 581 582
   if the character warrants that.

   If SECONDS is a number, we wait that many seconds for input, and
   return Qnil if no input arrives within that time.  */
583

Andreas Schwab's avatar
Andreas Schwab committed
584
static Lisp_Object
read_filtered_event (int no_switch_frame, int ascii_required,
                     int error_nonascii, int input_method, Lisp_Object seconds)
{
  Lisp_Object val;
  Lisp_Object delayed_switch_frame = Qnil;
  EMACS_TIME end_time;

#ifdef HAVE_WINDOW_SYSTEM
  if (display_hourglass_p)
    cancel_hourglass ();
#endif

  /* Turn the relative timeout into an absolute deadline.  */
  if (NUMBERP (seconds))
    {
      double timeout = extract_float (seconds);
      EMACS_TIME wait_time = EMACS_TIME_FROM_DOUBLE (timeout);
      end_time = add_emacs_time (current_emacs_time (), wait_time);
    }

  /* Keep reading until an acceptable event arrives; every `continue'
     below discards the current event and starts over.  */
  for (;;)
    {
      do
        val = read_char (0, 0, 0, (input_method ? Qnil : Qt), 0,
                         NUMBERP (seconds) ? &end_time : NULL);
      while (INTEGERP (val) && XINT (val) == -2); /* wrong_kboard_jmpbuf */

      if (BUFFERP (val))
        continue;

      /* switch-frame events are put off until after the next ASCII
         character.  This is better than signaling an error just because
         the last characters were typed to a separate minibuffer frame,
         for example.  Eventually, some code which can deal with
         switch-frame events will read it and process it.  */
      if (no_switch_frame
          && EVENT_HAS_PARAMETERS (val)
          && EQ (EVENT_HEAD_KIND (EVENT_HEAD (val)), Qswitch_frame))
        {
          delayed_switch_frame = val;
          continue;
        }

      /* A nil result under a timeout means the wait expired; pass it
         through without any character filtering.  */
      if (ascii_required && (! NUMBERP (seconds) || ! NILP (val)))
        {
          /* Convert certain symbols to their ASCII equivalents.  */
          if (SYMBOLP (val))
            {
              Lisp_Object parsed = Fget (val, Qevent_symbol_element_mask);

              if (! NILP (parsed))
                {
                  Lisp_Object ascii = Fget (Fcar (parsed), Qascii_character);

                  /* Merge this symbol's modifier bits
                     with the ASCII equivalent of its basic code.  */
                  if (! NILP (ascii))
                    XSETFASTINT (val,
                                 XINT (ascii) | XINT (Fcar (Fcdr (parsed))));
                }
            }

          /* If we don't have a character now, deal with it appropriately.  */
          if (! INTEGERP (val))
            {
              if (error_nonascii)
                {
                  Vunread_command_events = Fcons (val, Qnil);
                  error ("Non-character input-event");
                }
              else
                continue;
            }
        }

      break;
    }

  if (! NILP (delayed_switch_frame))
    unread_switch_frame = delayed_switch_frame;

#if 0

#ifdef HAVE_WINDOW_SYSTEM
  if (display_hourglass_p)
    start_hourglass ();
#endif

#endif

  return val;
}

Paul Eggert's avatar
Paul Eggert committed
674
DEFUN ("read-char", Fread_char, Sread_char, 0, 3, 0,
675 676
       doc: /* Read a character from the command input (keyboard or macro).
It is returned as a number.
677 678 679
If the character has modifiers, they are resolved and reflected to the
character code if possible (e.g. C-SPC -> 0).

680 681
If the user generates an event which is not a character (i.e. a mouse
click or function key event), `read-char' signals an error.  As an
682 683
exception, switch-frame events are put off until non-character events
can be read.
684 685 686 687 688 689
If you want to read non-character events, or ignore them, call
`read-event' or `read-char-exclusive' instead.

If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
690 691 692 693 694
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
695
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
696
{
697 698
  Lisp_Object val;

699 700
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
701
  val = read_filtered_event (1, 1, 1, ! NILP (inherit_input_method), seconds);
702 703 704

  return (NILP (val) ? Qnil
	  : make_number (char_resolve_modifier_mask (XINT (val))));
Jim Blandy's avatar
Jim Blandy committed
705 706
}

Paul Eggert's avatar
Paul Eggert committed
707
DEFUN ("read-event", Fread_event, Sread_event, 0, 3, 0,
708 709 710 711
       doc: /* Read an event object from the input stream.
If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
712 713 714 715 716
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
717
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
718
{
719 720
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
721
  return read_filtered_event (0, 0, 0, ! NILP (inherit_input_method), seconds);
Jim Blandy's avatar
Jim Blandy committed
722 723
}

724
DEFUN ("read-char-exclusive", Fread_char_exclusive, Sread_char_exclusive, 0, 3, 0,
725 726
       doc: /* Read a character from the command input (keyboard or macro).
It is returned as a number.  Non-character events are ignored.
727 728
If the character has modifiers, they are resolved and reflected to the
character code if possible (e.g. C-SPC -> 0).
729 730 731 732

If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
733 734 735 736 737
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
738
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
739
{
740 741
  Lisp_Object val;

742 743
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
744

745
  val = read_filtered_event (1, 1, 0, ! NILP (inherit_input_method), seconds);
746 747 748

  return (NILP (val) ? Qnil
	  : make_number (char_resolve_modifier_mask (XINT (val))));
Jim Blandy's avatar
Jim Blandy committed
749 750 751
}

DEFUN ("get-file-char", Fget_file_char, Sget_file_char, 0, 0, 0,
752
       doc: /* Don't use this yourself.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
753
  (void)
Jim Blandy's avatar
Jim Blandy committed
754 755
{
  register Lisp_Object val;
756
  block_input ();
757
  XSETINT (val, getc (instream));
758
  unblock_input ();
Jim Blandy's avatar
Jim Blandy committed
759 760
  return val;
}
761 762


763 764 765 766


/* Return true if the lisp code read using READCHARFUN defines a non-nil
   `lexical-binding' file variable.  After returning, the stream is
767 768
   positioned following the first line, if it is a comment or #! line,
   otherwise nothing is read.  */
769 770

static int
Stefan Monnier's avatar
Stefan Monnier committed
771
lisp_file_lexically_bound_p (Lisp_Object readcharfun)
772 773
{
  int ch = READCHAR;
774 775 776 777 778 779 780 781 782 783 784 785 786 787 788

  if (ch == '#')
    {
      ch = READCHAR;
      if (ch != '!')
        {
          UNREAD (ch);
          UNREAD ('#');
          return 0;
        }
      while (ch != '\n' && ch != EOF)
        ch = READCHAR;
      if (ch == '\n') ch = READCHAR;
    }

789 790 791 792 793 794 795 796 797 798 799 800 801 802 803
  if (ch != ';')
    /* The first line isn't a comment, just give up.  */
    {
      UNREAD (ch);
      return 0;
    }
  else
    /* Look for an appropriate file-variable in the first line.  */
    {
      int rv = 0;
      enum {
	NOMINAL, AFTER_FIRST_DASH, AFTER_ASTERIX,
      } beg_end_state = NOMINAL;
      int in_file_vars = 0;

804 805 806 807 808 809 810 811 812 813
#define UPDATE_BEG_END_STATE(ch)				\
  if (beg_end_state == NOMINAL)					\
    beg_end_state = (ch == '-' ? AFTER_FIRST_DASH : NOMINAL);	\
  else if (beg_end_state == AFTER_FIRST_DASH)			\
    beg_end_state = (ch == '*' ? AFTER_ASTERIX : NOMINAL);	\
  else if (beg_end_state == AFTER_ASTERIX)			\
    {								\
      if (ch == '-')						\
	in_file_vars = !in_file_vars;				\
      beg_end_state = NOMINAL;					\
814 815 816 817 818 819 820 821 822 823 824 825
    }

      /* Skip until we get to the file vars, if any.  */
      do
	{
	  ch = READCHAR;
	  UPDATE_BEG_END_STATE (ch);
	}
      while (!in_file_vars && ch != '\n' && ch != EOF);

      while (in_file_vars)
	{
826
	  char var[100], val[100];
827
	  unsigned i;
828 829 830 831 832 833 834

	  ch = READCHAR;

	  /* Read a variable name.  */
	  while (ch == ' ' || ch == '\t')
	    ch = READCHAR;

835
	  i = 0;
836
	  while (ch != ':' && ch != '\n' && ch != EOF && in_file_vars)
837
	    {
838 839
	      if (i < sizeof var - 1)
		var[i++] = ch;
840 841 842
	      UPDATE_BEG_END_STATE (ch);
	      ch = READCHAR;
	    }
843

844
	  /* Stop scanning if no colon was found before end marker.  */
845
	  if (!in_file_vars || ch == '\n' || ch == EOF)
846 847
	    break;

848 849 850
	  while (i > 0 && (var[i - 1] == ' ' || var[i - 1] == '\t'))
	    i--;
	  var[i] = '\0';
851 852 853 854 855 856 857 858 859

	  if (ch == ':')
	    {
	      /* Read a variable value.  */
	      ch = READCHAR;

	      while (ch == ' ' || ch == '\t')
		ch = READCHAR;

860
	      i = 0;
861 862
	      while (ch != ';' && ch != '\n' && ch != EOF && in_file_vars)
		{
863 864
		  if (i < sizeof val - 1)
		    val[i++] = ch;
865 866 867 868
		  UPDATE_BEG_END_STATE (ch);
		  ch = READCHAR;
		}
	      if (! in_file_vars)
869
		/* The value was terminated by an end-marker, which remove.  */
870 871 872 873
		i -= 3;
	      while (i > 0 && (val[i - 1] == ' ' || val[i - 1] == '\t'))
		i--;
	      val[i] = '\0';
874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889

	      if (strcmp (var, "lexical-binding") == 0)
		/* This is it...  */
		{
		  rv = (strcmp (val, "nil") != 0);
		  break;
		}
	    }
	}

      while (ch != '\n' && ch != EOF)
	ch = READCHAR;

      return rv;
    }
}
890

Kenichi Handa's avatar
Kenichi Handa committed
891
/* Value is a version number of byte compiled code if the file
Miles Bader's avatar
Miles Bader committed
892
   associated with file descriptor FD is a compiled Lisp file that's
Kenichi Handa's avatar
Kenichi Handa committed
893 894 895
   safe to load.  Only files compiled with Emacs are safe to load.
   Files compiled with XEmacs can lead to a crash in Fbyte_code
   because of an incompatible change in the byte compiler.  */
896 897

static int
898
safe_to_load_p (int fd)
899 900 901 902
{
  char buf[512];
  int nbytes, i;
  int safe_p = 1;
Kenichi Handa's avatar
Kenichi Handa committed
903
  int version = 1;
904 905 906 907 908 909 910 911 912

  /* Read the first few bytes from the file, and look for a line
     specifying the byte compiler version used.  */
  nbytes = emacs_read (fd, buf, sizeof buf - 1);
  if (nbytes > 0)
    {
      buf[nbytes] = '\0';

      /* Skip to the next newline, skipping over the initial `ELC'
Dave Love's avatar
Dave Love committed
913
	 with NUL bytes following it, but note the version.  */
914
      for (i = 0; i < nbytes && buf[i] != '\n'; ++i)
Dave Love's avatar
Dave Love committed
915
	if (i == 4)
Kenichi Handa's avatar
Kenichi Handa committed
916
	  version = buf[i];
917

918
      if (i >= nbytes
919
	  || fast_c_string_match_ignore_case (Vbytecomp_version_regexp,
920
					      buf + i, nbytes - i) < 0)
921 922
	safe_p = 0;
    }
Dave Love's avatar
Dave Love committed
923 924
  if (safe_p)
    safe_p = version;
925 926 927 928 929 930

  lseek (fd, 0, SEEK_SET);
  return safe_p;
}


931 932 933 934
/* Callback for record_unwind_protect.  Restore the old load list OLD,
   after loading a file successfully.  */

static Lisp_Object
935
record_load_unwind (Lisp_Object old)
936 937 938 939
{
  return Vloads_in_progress = old;
}

940 941 942
/* This handler function is used via internal_condition_case_1.  */

static Lisp_Object
943
load_error_handler (Lisp_Object data)
944 945 946
{
  return Qnil;
}
947

948
static Lisp_Object
949
load_warn_old_style_backquotes (Lisp_Object file)
950 951 952
{
  if (!NILP (Vold_style_backquotes))
    {
953
      Lisp_Object args[2];
954
      args[0] = build_string ("Loading `%s': old-style backquotes detected!");
955 956 957 958 959 960
      args[1] = file;
      Fmessage (2, args);
    }
  return Qnil;
}

Paul Eggert's avatar
Paul Eggert committed
961
DEFUN ("get-load-suffixes", Fget_load_suffixes, Sget_load_suffixes, 0, 0, 0,
962 963 964
       doc: /* Return the suffixes that `load' should try if a suffix is \
required.
This uses the variables `load-suffixes' and `load-file-rep-suffixes'.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
965
  (void)
966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982
{
  Lisp_Object lst = Qnil, suffixes = Vload_suffixes, suffix, ext;
  while (CONSP (suffixes))
    {
      Lisp_Object exts = Vload_file_rep_suffixes;
      suffix = XCAR (suffixes);
      suffixes = XCDR (suffixes);
      while (CONSP (exts))
	{
	  ext = XCAR (exts);
	  exts = XCDR (exts);
	  lst = Fcons (concat2 (suffix, ext), lst);
	}
    }
  return Fnreverse (lst);
}

Paul Eggert's avatar
Paul Eggert committed
983
DEFUN ("load", Fload, Sload, 1, 5, 0,
984 985
       doc: /* Execute a file of Lisp code named FILE.
First try FILE with `.elc' appended, then try with `.el',
986
then try FILE unmodified (the exact suffixes in the exact order are
987
determined by `load-suffixes').  Environment variable references in
988
FILE are replaced with their values by calling `substitute-in-file-name'.
989
This function searches the directories in `load-path'.
990

991
If optional second arg NOERROR is non-nil,
992
report no error if FILE doesn't exist.
993
Print messages at start and end of loading unless
994 995
optional third arg NOMESSAGE is non-nil (but `force-load-messages'
overrides that).
996
If optional fourth arg NOSUFFIX is non-nil, don't try adding
997
suffixes `.elc' or `.el' to the specified name FILE.
998
If optional fifth arg MUST-SUFFIX is non-nil, insist on
999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013
the suffix `.elc' or `.el'; don't accept just FILE unless
it ends in one of those suffixes or includes a directory name.

If this function fails to find a file, it may look for different
representations of that file before trying another file.
It does so by adding the non-empty suffixes in `load-file-rep-suffixes'
to the file name.  Emacs uses this feature mainly to find compressed
versions of files when Auto Compression mode is enabled.

The exact suffixes that this function tries out, in the exact order,
are given by the value of the variable `load-file-rep-suffixes' if
NOSUFFIX is non-nil and by the return value of the function
`get-load-suffixes' if MUST-SUFFIX is non-nil.  If both NOSUFFIX and
MUST-SUFFIX are nil, this function first tries out the latter suffixes
and then the former.
1014 1015 1016 1017 1018

Loading a file records its definitions, and its `provide' and
`require' calls, in an element of `load-history' whose
car is the file name loaded.  See `load-history'.

1019 1020 1021 1022
While the file is in the process of being loaded, the variable
`load-in-progress' is non-nil and the variable `load-file-name'
is bound to the file's name.

1023
Return t if the file exists and loads successfully.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
1024
  (Lisp_Object file, Lisp_Object noerror, Lisp_Object nomessage, Lisp_Object nosuffix, Lisp_Object must_suffix)
Jim Blandy's avatar
Jim Blandy committed
1025 1026 1027
{
  register FILE *stream;
  register int fd = -1;
1028
  ptrdiff_t count = SPECPDL_INDEX ();
1029 1030
  struct gcpro gcpro1, gcpro2, gcpro3;
  Lisp_Object found, efound, hist_file_name;
1031 1032 1033 1034
  /* 1 means we printed the ".el is newer" message.  */
  int newer = 0;
  /* 1 means we are loading a compiled file.  */
  int compiled = 0;
1035
  Lisp_Object handler;
1036
  int safe_p = 1;
1037
  const char *fmode = "r";
1038
  Lisp_Object tmp[2];
Kenichi Handa's avatar
Kenichi Handa committed
1039 1040
  int version;

1041
#ifdef DOS_NT
1042
  fmode = "rt";