lread.c 127 KB
Newer Older
Jim Blandy's avatar
Jim Blandy committed
1
/* Lisp parsing and input streams.
2

3
Copyright (C) 1985-1989, 1993-1995, 1997-2011  Free Software Foundation, Inc.
Jim Blandy's avatar
Jim Blandy committed
4 5 6

This file is part of GNU Emacs.

7
GNU Emacs is free software: you can redistribute it and/or modify
Jim Blandy's avatar
Jim Blandy committed
8
it under the terms of the GNU General Public License as published by
9 10
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
Jim Blandy's avatar
Jim Blandy committed
11 12 13 14 15 16 17

GNU Emacs is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
18
along with GNU Emacs.  If not, see <http://www.gnu.org/licenses/>.  */
Jim Blandy's avatar
Jim Blandy committed
19 20


Richard M. Stallman's avatar
Richard M. Stallman committed
21
#include <config.h>
Jim Blandy's avatar
Jim Blandy committed
22 23 24 25
#include <stdio.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <sys/file.h>
26
#include <errno.h>
27
#include <setjmp.h>
Jim Blandy's avatar
Jim Blandy committed
28
#include "lisp.h"
29
#include "intervals.h"
Jim Blandy's avatar
Jim Blandy committed
30
#include "buffer.h"
Kenichi Handa's avatar
Kenichi Handa committed
31
#include "character.h"
Karl Heuer's avatar
Karl Heuer committed
32
#include "charset.h"
Kenichi Handa's avatar
Kenichi Handa committed
33
#include "coding.h"
34
#include <epaths.h>
Jim Blandy's avatar
Jim Blandy committed
35
#include "commands.h"
Jim Blandy's avatar
Jim Blandy committed
36
#include "keyboard.h"
37
#include "frame.h"
38
#include "termhooks.h"
39
#include "coding.h"
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
40
#include "blockinput.h"
Jim Blandy's avatar
Jim Blandy committed
41

42 43 44 45
#ifdef MSDOS
#include "msdos.h"
#endif

Andreas Schwab's avatar
Andreas Schwab committed
46
#include <unistd.h>
Jim Blandy's avatar
Jim Blandy committed
47 48
#include <math.h>

Richard M. Stallman's avatar
Richard M. Stallman committed
49 50 51 52
#ifdef HAVE_SETLOCALE
#include <locale.h>
#endif /* HAVE_SETLOCALE */

Dave Love's avatar
Dave Love committed
53
#include <fcntl.h>
Richard M. Stallman's avatar
Richard M. Stallman committed
54

55
#ifdef HAVE_FSEEKO
56 57 58 59 60 61 62
#define file_offset off_t
#define file_tell ftello
#else
#define file_offset long
#define file_tell ftell
#endif

63
/* hash table read constants */
64 65 66 67 68 69 70 71
static Lisp_Object Qhash_table, Qdata;
static Lisp_Object Qtest, Qsize;
static Lisp_Object Qweakness;
static Lisp_Object Qrehash_size;
static Lisp_Object Qrehash_threshold;

static Lisp_Object Qread_char, Qget_file_char, Qcurrent_load_list;
Lisp_Object Qstandard_input;
72
Lisp_Object Qvariable_documentation;
73
static Lisp_Object Qascii_character, Qload, Qload_file_name;
74
Lisp_Object Qbackquote, Qcomma, Qcomma_at, Qcomma_dot, Qfunction;
75 76 77 78
static Lisp_Object Qinhibit_file_name_operation;
static Lisp_Object Qeval_buffer_list;
static Lisp_Object Qlexical_binding;
static Lisp_Object Qfile_truename, Qdo_after_load_evaluation; /* ACM 2006/5/16 */
79

Kenichi Handa's avatar
Kenichi Handa committed
80 81 82 83 84 85
/* Used instead of Qget_file_char while loading *.elc files compiled
   by Emacs 21 or older.  */
static Lisp_Object Qget_emacs_mule_file_char;

static Lisp_Object Qload_force_doc_strings;

86
extern Lisp_Object Qinternal_interpreter_environment;
Jim Blandy's avatar
Jim Blandy committed
87

88
static Lisp_Object Qload_in_progress;
Ken Raeburn's avatar
Ken Raeburn committed
89

90 91 92 93
/* The association list of objects read with the #n=object form.
   Each member of the list has the form (n . object), and is used to
   look up the object for the corresponding #n# construct.
   It must be set to nil before all top-level calls to read0.  */
94
static Lisp_Object read_objects;
95

Kenichi Handa's avatar
Kenichi Handa committed
96 97 98 99 100
/* Nonzero means READCHAR should read bytes one by one (not character)
   when READCHARFUN is Qget_file_char or Qget_emacs_mule_file_char.
   This is set to 1 by read1 temporarily while handling #@NUMBER.  */
static int load_each_byte;

101 102 103
/* List of descriptors now open for Fload.  */
static Lisp_Object load_descriptor_list;

104
/* File for get_file_char to read from.  Used by load.  */
Jim Blandy's avatar
Jim Blandy committed
105 106 107 108 109
static FILE *instream;

/* When nonzero, read conses in pure space */
static int read_pure;

110
/* For use within read-from-string (this reader is non-reentrant!!)  */
111 112 113
static EMACS_INT read_from_string_index;
static EMACS_INT read_from_string_index_byte;
static EMACS_INT read_from_string_limit;
114

115 116
/* Number of characters read in the current call to Fread or
   Fread_from_string. */
117
static EMACS_INT readchar_count;
118

119
/* This contains the last string skipped with #@.  */
120 121 122 123 124 125
static char *saved_doc_string;
/* Length of buffer allocated in saved_doc_string.  */
static int saved_doc_string_size;
/* Length of actual data in saved_doc_string.  */
static int saved_doc_string_length;
/* This is the file position that string came from.  */
126
static file_offset saved_doc_string_position;
127

128 129 130 131 132 133 134 135 136
/* This contains the previous string skipped with #@.
   We copy it from saved_doc_string when a new string
   is put in saved_doc_string.  */
static char *prev_saved_doc_string;
/* Length of buffer allocated in prev_saved_doc_string.  */
static int prev_saved_doc_string_size;
/* Length of actual data in prev_saved_doc_string.  */
static int prev_saved_doc_string_length;
/* This is the file position that string came from.  */
137
static file_offset prev_saved_doc_string_position;
138

139 140 141 142 143
/* Nonzero means inside a new-style backquote
   with no surrounding parentheses.
   Fread initializes this to zero, so we need not specbind it
   or worry about what happens to it when there is an error.  */
static int new_backquote_flag;
144
static Lisp_Object Qold_style_backquotes;
145 146 147 148

/* A list of file names for files being loaded in Fload.  Used to
   check for recursive loads.  */

Lute Kamstra's avatar
Lute Kamstra committed
149
static Lisp_Object Vloads_in_progress;
150

151 152
static int read_emacs_mule_char (int, int (*) (int, Lisp_Object),
                                 Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
153

154
static void readevalloop (Lisp_Object, FILE*, Lisp_Object, int,
155 156 157 158
                          Lisp_Object, Lisp_Object,
                          Lisp_Object, Lisp_Object);
static Lisp_Object load_unwind (Lisp_Object);
static Lisp_Object load_descriptor_unwind (Lisp_Object);
159

160
static void invalid_syntax (const char *, int) NO_RETURN;
161
static void end_of_file_error (void) NO_RETURN;
162

Jim Blandy's avatar
Jim Blandy committed
163

Kenichi Handa's avatar
Kenichi Handa committed
164 165 166 167 168 169
/* Functions that read one byte from the current source READCHARFUN
   or unread one byte.  If the integer argument C is -1, the function
   returns the byte it read, or -1 when there are no more bytes in the
   source.  If C is 0 or positive, the function unreads C, and the
   return value is not interesting.  */

170 171 172
static int readbyte_for_lambda (int, Lisp_Object);
static int readbyte_from_file (int, Lisp_Object);
static int readbyte_from_string (int, Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
173

Jim Blandy's avatar
Jim Blandy committed
174 175
/* Handle unreading and rereading of characters.
   Write READCHAR to read a character,
Karl Heuer's avatar
Karl Heuer committed
176 177
   UNREAD(c) to unread c to be read again.

Kenichi Handa's avatar
Kenichi Handa committed
178
   These macros correctly read/unread multibyte characters.  */
Jim Blandy's avatar
Jim Blandy committed
179

180
#define READCHAR readchar (readcharfun, NULL)
Jim Blandy's avatar
Jim Blandy committed
181 182
#define UNREAD(c) unreadchar (readcharfun, c)

183 184 185
/* Same as READCHAR but set *MULTIBYTE to the multibyteness of the source.  */
#define READCHAR_REPORT_MULTIBYTE(multibyte) readchar (readcharfun, multibyte)

Kenichi Handa's avatar
Kenichi Handa committed
186
/* When READCHARFUN is Qget_file_char, Qget_emacs_mule_file_char,
Kenichi Handa's avatar
Kenichi Handa committed
187 188
   Qlambda, or a cons, we use this to keep an unread character because
   a file stream can't handle multibyte-char unreading.  The value -1
Kenichi Handa's avatar
Kenichi Handa committed
189 190 191
   means that there's no unread character. */
static int unread_char;

Jim Blandy's avatar
Jim Blandy committed
192
static int
193
readchar (Lisp_Object readcharfun, int *multibyte)
Jim Blandy's avatar
Jim Blandy committed
194 195
{
  Lisp_Object tem;
196
  register int c;
197
  int (*readbyte) (int, Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
198 199 200
  unsigned char buf[MAX_MULTIBYTE_LENGTH];
  int i, len;
  int emacs_mule_encoding = 0;
Jim Blandy's avatar
Jim Blandy committed
201

202 203 204
  if (multibyte)
    *multibyte = 0;

205
  readchar_count++;
206

207
  if (BUFFERP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
208
    {
209
      register struct buffer *inbuffer = XBUFFER (readcharfun);
Jim Blandy's avatar
Jim Blandy committed
210

211
      EMACS_INT pt_byte = BUF_PT_BYTE (inbuffer);
212

213 214
      if (pt_byte >= BUF_ZV_BYTE (inbuffer))
	return -1;
Jim Blandy's avatar
Jim Blandy committed
215

Tom Tromey's avatar
Tom Tromey committed
216
      if (! NILP (BVAR (inbuffer, enable_multibyte_characters)))
217
	{
218
	  /* Fetch the character code from the buffer.  */
219 220
	  unsigned char *p = BUF_BYTE_ADDRESS (inbuffer, pt_byte);
	  BUF_INC_POS (inbuffer, pt_byte);
221
	  c = STRING_CHAR (p);
222 223
	  if (multibyte)
	    *multibyte = 1;
224 225 226 227
	}
      else
	{
	  c = BUF_FETCH_BYTE (inbuffer, pt_byte);
Kenichi Handa's avatar
Kenichi Handa committed
228 229
	  if (! ASCII_BYTE_P (c))
	    c = BYTE8_TO_CHAR (c);
230
	  pt_byte++;
231
	}
232
      SET_BUF_PT_BOTH (inbuffer, BUF_PT (inbuffer) + 1, pt_byte);
233

234
      return c;
Jim Blandy's avatar
Jim Blandy committed
235
    }
236
  if (MARKERP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
237
    {
238
      register struct buffer *inbuffer = XMARKER (readcharfun)->buffer;
Jim Blandy's avatar
Jim Blandy committed
239

240
      EMACS_INT bytepos = marker_byte_position (readcharfun);
241

242 243
      if (bytepos >= BUF_ZV_BYTE (inbuffer))
	return -1;
244

Tom Tromey's avatar
Tom Tromey committed
245
      if (! NILP (BVAR (inbuffer, enable_multibyte_characters)))
246
	{
247
	  /* Fetch the character code from the buffer.  */
248 249
	  unsigned char *p = BUF_BYTE_ADDRESS (inbuffer, bytepos);
	  BUF_INC_POS (inbuffer, bytepos);
250
	  c = STRING_CHAR (p);
251 252
	  if (multibyte)
	    *multibyte = 1;
253 254 255 256
	}
      else
	{
	  c = BUF_FETCH_BYTE (inbuffer, bytepos);
Kenichi Handa's avatar
Kenichi Handa committed
257 258
	  if (! ASCII_BYTE_P (c))
	    c = BYTE8_TO_CHAR (c);
259
	  bytepos++;
260 261
	}

262 263 264 265
      XMARKER (readcharfun)->bytepos = bytepos;
      XMARKER (readcharfun)->charpos++;

      return c;
Jim Blandy's avatar
Jim Blandy committed
266
    }
267 268

  if (EQ (readcharfun, Qlambda))
Kenichi Handa's avatar
Kenichi Handa committed
269 270 271 272
    {
      readbyte = readbyte_for_lambda;
      goto read_multibyte;
    }
273

Jim Blandy's avatar
Jim Blandy committed
274
  if (EQ (readcharfun, Qget_file_char))
275
    {
Kenichi Handa's avatar
Kenichi Handa committed
276 277
      readbyte = readbyte_from_file;
      goto read_multibyte;
278
    }
Jim Blandy's avatar
Jim Blandy committed
279

280
  if (STRINGP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
281
    {
282
      if (read_from_string_index >= read_from_string_limit)
Jim Blandy's avatar
Jim Blandy committed
283
	c = -1;
284 285 286 287 288 289 290 291
      else if (STRING_MULTIBYTE (readcharfun))
	{
	  if (multibyte)
	    *multibyte = 1;
	  FETCH_STRING_CHAR_ADVANCE_NO_CHECK (c, readcharfun,
					      read_from_string_index,
					      read_from_string_index_byte);
	}
292
      else
293 294 295 296 297
	{
	  c = SREF (readcharfun, read_from_string_index_byte);
	  read_from_string_index++;
	  read_from_string_index_byte++;
	}
Jim Blandy's avatar
Jim Blandy committed
298 299 300
      return c;
    }

Kenichi Handa's avatar
Kenichi Handa committed
301 302 303 304 305 306 307 308 309 310 311 312
  if (CONSP (readcharfun))
    {
      /* This is the case that read_vector is reading from a unibyte
	 string that contains a byte sequence previously skipped
	 because of #@NUMBER.  The car part of readcharfun is that
	 string, and the cdr part is a value of readcharfun given to
	 read_vector.  */
      readbyte = readbyte_from_string;
      if (EQ (XCDR (readcharfun), Qget_emacs_mule_file_char))
	emacs_mule_encoding = 1;
      goto read_multibyte;
    }
Kenichi Handa's avatar
Kenichi Handa committed
313

Kenichi Handa's avatar
Kenichi Handa committed
314 315 316 317 318 319
  if (EQ (readcharfun, Qget_emacs_mule_file_char))
    {
      readbyte = readbyte_from_file;
      emacs_mule_encoding = 1;
      goto read_multibyte;
    }
Jim Blandy's avatar
Jim Blandy committed
320 321 322

  tem = call0 (readcharfun);

Jim Blandy's avatar
Jim Blandy committed
323
  if (NILP (tem))
Jim Blandy's avatar
Jim Blandy committed
324 325
    return -1;
  return XINT (tem);
Kenichi Handa's avatar
Kenichi Handa committed
326 327 328 329 330 331 332 333 334

 read_multibyte:
  if (unread_char >= 0)
    {
      c = unread_char;
      unread_char = -1;
      return c;
    }
  c = (*readbyte) (-1, readcharfun);
335 336 337 338 339
  if (c < 0 || load_each_byte)
    return c;
  if (multibyte)
    *multibyte = 1;
  if (ASCII_BYTE_P (c))
Kenichi Handa's avatar
Kenichi Handa committed
340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356
    return c;
  if (emacs_mule_encoding)
    return read_emacs_mule_char (c, readbyte, readcharfun);
  i = 0;
  buf[i++] = c;
  len = BYTES_BY_CHAR_HEAD (c);
  while (i < len)
    {
      c = (*readbyte) (-1, readcharfun);
      if (c < 0 || ! TRAILING_CODE_P (c))
	{
	  while (--i > 1)
	    (*readbyte) (buf[i], readcharfun);
	  return BYTE8_TO_CHAR (buf[0]);
	}
      buf[i++] = c;
    }
357
  return STRING_CHAR (buf);
Jim Blandy's avatar
Jim Blandy committed
358 359 360 361 362 363
}

/* Unread the character C in the way appropriate for the stream READCHARFUN.
   If the stream is a user function, call it with the char as argument.  */

static void
364
unreadchar (Lisp_Object readcharfun, int c)
Jim Blandy's avatar
Jim Blandy committed
365
{
366
  readchar_count--;
367 368 369 370
  if (c == -1)
    /* Don't back up the pointer if we're unreading the end-of-input mark,
       since readchar didn't advance it when we read it.  */
    ;
371
  else if (BUFFERP (readcharfun))
372
    {
373
      struct buffer *b = XBUFFER (readcharfun);
374
      EMACS_INT charpos = BUF_PT (b);
375
      EMACS_INT bytepos = BUF_PT_BYTE (b);
376

Tom Tromey's avatar
Tom Tromey committed
377
      if (! NILP (BVAR (b, enable_multibyte_characters)))
Kenichi Handa's avatar
Kenichi Handa committed
378
	BUF_DEC_POS (b, bytepos);
379
      else
Kenichi Handa's avatar
Kenichi Handa committed
380
	bytepos--;
381

382
      SET_BUF_PT_BOTH (b, charpos - 1, bytepos);
383
    }
384
  else if (MARKERP (readcharfun))
385
    {
386
      struct buffer *b = XMARKER (readcharfun)->buffer;
387
      EMACS_INT bytepos = XMARKER (readcharfun)->bytepos;
388

Kenichi Handa's avatar
Kenichi Handa committed
389
      XMARKER (readcharfun)->charpos--;
Tom Tromey's avatar
Tom Tromey committed
390
      if (! NILP (BVAR (b, enable_multibyte_characters)))
Kenichi Handa's avatar
Kenichi Handa committed
391
	BUF_DEC_POS (b, bytepos);
392
      else
Kenichi Handa's avatar
Kenichi Handa committed
393
	bytepos--;
394

Kenichi Handa's avatar
Kenichi Handa committed
395
      XMARKER (readcharfun)->bytepos = bytepos;
396
    }
397
  else if (STRINGP (readcharfun))
398 399 400 401 402
    {
      read_from_string_index--;
      read_from_string_index_byte
	= string_char_to_byte (readcharfun, read_from_string_index);
    }
Kenichi Handa's avatar
Kenichi Handa committed
403 404 405 406
  else if (CONSP (readcharfun))
    {
      unread_char = c;
    }
407
  else if (EQ (readcharfun, Qlambda))
Kenichi Handa's avatar
Kenichi Handa committed
408 409 410 411 412 413 414
    {
      unread_char = c;
    }
  else if (EQ (readcharfun, Qget_file_char)
	   || EQ (readcharfun, Qget_emacs_mule_file_char))
    {
      if (load_each_byte)
Miles Bader's avatar
Miles Bader committed
415 416 417 418 419
	{
	  BLOCK_INPUT;
	  ungetc (c, instream);
	  UNBLOCK_INPUT;
	}
Kenichi Handa's avatar
Kenichi Handa committed
420 421 422
      else
	unread_char = c;
    }
Jim Blandy's avatar
Jim Blandy committed
423 424 425 426
  else
    call1 (readcharfun, make_number (c));
}

Kenichi Handa's avatar
Kenichi Handa committed
427
static int
428
readbyte_for_lambda (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
429 430 431 432 433 434
{
  return read_bytecode_char (c >= 0);
}


static int
435
readbyte_from_file (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
436 437 438
{
  if (c >= 0)
    {
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
439
      BLOCK_INPUT;
Kenichi Handa's avatar
Kenichi Handa committed
440
      ungetc (c, instream);
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
441
      UNBLOCK_INPUT;
Kenichi Handa's avatar
Kenichi Handa committed
442 443 444
      return 0;
    }

Miles Bader's avatar
Miles Bader committed
445
  BLOCK_INPUT;
Kenichi Handa's avatar
Kenichi Handa committed
446
  c = getc (instream);
Miles Bader's avatar
Miles Bader committed
447

Kenichi Handa's avatar
Kenichi Handa committed
448
#ifdef EINTR
Miles Bader's avatar
Miles Bader committed
449 450 451
  /* Interrupted reads have been observed while reading over the network */
  while (c == EOF && ferror (instream) && errno == EINTR)
    {
Miles Bader's avatar
Miles Bader committed
452
      UNBLOCK_INPUT;
Miles Bader's avatar
Miles Bader committed
453 454
      QUIT;
      BLOCK_INPUT;
Miles Bader's avatar
Miles Bader committed
455
      clearerr (instream);
Miles Bader's avatar
Miles Bader committed
456
      c = getc (instream);
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
457
    }
Kenichi Handa's avatar
Kenichi Handa committed
458
#endif
Miles Bader's avatar
Miles Bader committed
459

Miles Bader's avatar
Miles Bader committed
460 461
  UNBLOCK_INPUT;

Kenichi Handa's avatar
Kenichi Handa committed
462 463 464 465
  return (c == EOF ? -1 : c);
}

static int
466
readbyte_from_string (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
467 468 469 470 471 472 473 474 475
{
  Lisp_Object string = XCAR (readcharfun);

  if (c >= 0)
    {
      read_from_string_index--;
      read_from_string_index_byte
	= string_char_to_byte (string, read_from_string_index);
    }
Kenichi Handa's avatar
Kenichi Handa committed
476

Kenichi Handa's avatar
Kenichi Handa committed
477 478 479 480 481 482 483 484 485 486 487 488 489 490 491
  if (read_from_string_index >= read_from_string_limit)
    c = -1;
  else
    FETCH_STRING_CHAR_ADVANCE (c, string,
			       read_from_string_index,
			       read_from_string_index_byte);
  return c;
}


/* Read one non-ASCII character from INSTREAM.  The character is
   encoded in `emacs-mule' and the first byte is already read in
   C.  */

static int
492
read_emacs_mule_char (int c, int (*readbyte) (int, Lisp_Object), Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520
{
  /* Emacs-mule coding uses at most 4-byte for one character.  */
  unsigned char buf[4];
  int len = emacs_mule_bytes[c];
  struct charset *charset;
  int i;
  unsigned code;

  if (len == 1)
    /* C is not a valid leading-code of `emacs-mule'.  */
    return BYTE8_TO_CHAR (c);

  i = 0;
  buf[i++] = c;
  while (i < len)
    {
      c = (*readbyte) (-1, readcharfun);
      if (c < 0xA0)
	{
	  while (--i > 1)
	    (*readbyte) (buf[i], readcharfun);
	  return BYTE8_TO_CHAR (buf[0]);
	}
      buf[i++] = c;
    }

  if (len == 2)
    {
521
      charset = CHARSET_FROM_ID (emacs_mule_charset[buf[0]]);
Kenichi Handa's avatar
Kenichi Handa committed
522 523 524 525 526 527 528
      code = buf[1] & 0x7F;
    }
  else if (len == 3)
    {
      if (buf[0] == EMACS_MULE_LEADING_CODE_PRIVATE_11
	  || buf[0] == EMACS_MULE_LEADING_CODE_PRIVATE_12)
	{
529
	  charset = CHARSET_FROM_ID (emacs_mule_charset[buf[1]]);
Kenichi Handa's avatar
Kenichi Handa committed
530 531 532 533
	  code = buf[2] & 0x7F;
	}
      else
	{
534
	  charset = CHARSET_FROM_ID (emacs_mule_charset[buf[0]]);
Kenichi Handa's avatar
Kenichi Handa committed
535 536 537 538 539
	  code = ((buf[1] << 8) | buf[2]) & 0x7F7F;
	}
    }
  else
    {
540
      charset = CHARSET_FROM_ID (emacs_mule_charset[buf[1]]);
Kenichi Handa's avatar
Kenichi Handa committed
541
      code = ((buf[2] << 8) | buf[3]) & 0x7F7F;
Kenichi Handa's avatar
Kenichi Handa committed
542 543 544 545 546 547 548 549 550
    }
  c = DECODE_CHAR (charset, code);
  if (c < 0)
    Fsignal (Qinvalid_read_syntax,
	     Fcons (build_string ("invalid multibyte form"), Qnil));
  return c;
}


551 552 553 554
static Lisp_Object read_internal_start (Lisp_Object, Lisp_Object,
                                        Lisp_Object);
static Lisp_Object read0 (Lisp_Object);
static Lisp_Object read1 (Lisp_Object, int *, int);
555

556 557
static Lisp_Object read_list (int, Lisp_Object);
static Lisp_Object read_vector (Lisp_Object, int);
558

559 560 561 562 563
static Lisp_Object substitute_object_recurse (Lisp_Object, Lisp_Object,
                                              Lisp_Object);
static void substitute_object_in_subtree (Lisp_Object,
                                          Lisp_Object);
static void substitute_in_interval (INTERVAL, Lisp_Object);
564

Jim Blandy's avatar
Jim Blandy committed
565

566
/* Get a character from the tty.  */
Jim Blandy's avatar
Jim Blandy committed
567

568 569 570 571 572 573 574 575 576 577 578 579 580
/* Read input events until we get one that's acceptable for our purposes.

   If NO_SWITCH_FRAME is non-zero, switch-frame events are stashed
   until we get a character we like, and then stuffed into
   unread_switch_frame.

   If ASCII_REQUIRED is non-zero, we check function key events to see
   if the unmodified version of the symbol has a Qascii_character
   property, and use that character, if present.

   If ERROR_NONASCII is non-zero, we signal an error if the input we
   get isn't an ASCII character with modifiers.  If it's zero but
   ASCII_REQUIRED is non-zero, we just re-read until we get an ASCII
581 582 583
   character.

   If INPUT_METHOD is nonzero, we invoke the current input method
584 585 586 587
   if the character warrants that.

   If SECONDS is a number, we wait that many seconds for input, and
   return Qnil if no input arrives within that time.  */
588

Andreas Schwab's avatar
Andreas Schwab committed
589
static Lisp_Object
Andreas Schwab's avatar
Andreas Schwab committed
590 591
read_filtered_event (int no_switch_frame, int ascii_required,
		     int error_nonascii, int input_method, Lisp_Object seconds)
592
{
593
  Lisp_Object val, delayed_switch_frame;
594
  EMACS_TIME end_time;
595

596
#ifdef HAVE_WINDOW_SYSTEM
597 598
  if (display_hourglass_p)
    cancel_hourglass ();
599
#endif
600

601
  delayed_switch_frame = Qnil;
602

603 604 605 606 607
  /* Compute timeout.  */
  if (NUMBERP (seconds))
    {
      EMACS_TIME wait_time;
      int sec, usec;
608
      double duration = extract_float (seconds);
609 610 611 612 613 614 615 616

      sec  = (int) duration;
      usec = (duration - sec) * 1000000;
      EMACS_GET_TIME (end_time);
      EMACS_SET_SECS_USECS (wait_time, sec, usec);
      EMACS_ADD_TIME (end_time, end_time, wait_time);
    }

Karoly Lorentey's avatar
Karoly Lorentey committed
617
/* Read until we get an acceptable event.  */
618
 retry:
619
  do
Karoly Lorentey's avatar
Karoly Lorentey committed
620 621
    val = read_char (0, 0, 0, (input_method ? Qnil : Qt), 0,
		     NUMBERP (seconds) ? &end_time : NULL);
622
  while (INTEGERP (val) && XINT (val) == -2); /* wrong_kboard_jmpbuf */
623

624
  if (BUFFERP (val))
625 626
    goto retry;

627
  /* switch-frame events are put off until after the next ASCII
Karl Heuer's avatar
Karl Heuer committed
628
     character.  This is better than signaling an error just because
629 630 631 632 633
     the last characters were typed to a separate minibuffer frame,
     for example.  Eventually, some code which can deal with
     switch-frame events will read it and process it.  */
  if (no_switch_frame
      && EVENT_HAS_PARAMETERS (val)
634
      && EQ (EVENT_HEAD_KIND (EVENT_HEAD (val)), Qswitch_frame))
635 636 637 638 639
    {
      delayed_switch_frame = val;
      goto retry;
    }

640
  if (ascii_required && !(NUMBERP (seconds) && NILP (val)))
641 642
    {
      /* Convert certain symbols to their ASCII equivalents.  */
643
      if (SYMBOLP (val))
644
	{
645
	  Lisp_Object tem, tem1;
646 647 648 649 650 651 652
	  tem = Fget (val, Qevent_symbol_element_mask);
	  if (!NILP (tem))
	    {
	      tem1 = Fget (Fcar (tem), Qascii_character);
	      /* Merge this symbol's modifier bits
		 with the ASCII equivalent of its basic code.  */
	      if (!NILP (tem1))
653
		XSETFASTINT (val, XINT (tem1) | XINT (Fcar (Fcdr (tem))));
654 655
	    }
	}
656

657
      /* If we don't have a character now, deal with it appropriately.  */
658
      if (!INTEGERP (val))
659 660 661
	{
	  if (error_nonascii)
	    {
662
	      Vunread_command_events = Fcons (val, Qnil);
663 664 665 666 667 668 669 670 671 672
	      error ("Non-character input-event");
	    }
	  else
	    goto retry;
	}
    }

  if (! NILP (delayed_switch_frame))
    unread_switch_frame = delayed_switch_frame;

673 674
#if 0

675
#ifdef HAVE_WINDOW_SYSTEM
676 677
  if (display_hourglass_p)
    start_hourglass ();
678
#endif
679 680 681

#endif

682 683 684
  return val;
}

685
DEFUE ("read-char", Fread_char, Sread_char, 0, 3, 0,
686 687
       doc: /* Read a character from the command input (keyboard or macro).
It is returned as a number.
688 689 690
If the character has modifiers, they are resolved and reflected to the
character code if possible (e.g. C-SPC -> 0).

691 692
If the user generates an event which is not a character (i.e. a mouse
click or function key event), `read-char' signals an error.  As an
693 694
exception, switch-frame events are put off until non-character events
can be read.
695 696 697 698 699 700
If you want to read non-character events, or ignore them, call
`read-event' or `read-char-exclusive' instead.

If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
701 702 703 704 705
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
706
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
707
{
708 709
  Lisp_Object val;

710 711
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
712
  val = read_filtered_event (1, 1, 1, ! NILP (inherit_input_method), seconds);
713 714 715

  return (NILP (val) ? Qnil
	  : make_number (char_resolve_modifier_mask (XINT (val))));
Jim Blandy's avatar
Jim Blandy committed
716 717
}

718
DEFUE ("read-event", Fread_event, Sread_event, 0, 3, 0,
719 720 721 722
       doc: /* Read an event object from the input stream.
If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
723 724 725 726 727
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
728
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
729
{
730 731
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
732
  return read_filtered_event (0, 0, 0, ! NILP (inherit_input_method), seconds);
Jim Blandy's avatar
Jim Blandy committed
733 734
}

735
DEFUN ("read-char-exclusive", Fread_char_exclusive, Sread_char_exclusive, 0, 3, 0,
736 737
       doc: /* Read a character from the command input (keyboard or macro).
It is returned as a number.  Non-character events are ignored.
738 739
If the character has modifiers, they are resolved and reflected to the
character code if possible (e.g. C-SPC -> 0).
740 741 742 743

If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
744 745 746 747 748
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
749
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
750
{
751 752
  Lisp_Object val;

753 754
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
755

756
  val = read_filtered_event (1, 1, 0, ! NILP (inherit_input_method), seconds);
757 758 759

  return (NILP (val) ? Qnil
	  : make_number (char_resolve_modifier_mask (XINT (val))));
Jim Blandy's avatar
Jim Blandy committed
760 761 762
}

DEFUN ("get-file-char", Fget_file_char, Sget_file_char, 0, 0, 0,
763
       doc: /* Don't use this yourself.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
764
  (void)
Jim Blandy's avatar
Jim Blandy committed
765 766
{
  register Lisp_Object val;
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
767
  BLOCK_INPUT;
768
  XSETINT (val, getc (instream));
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
769
  UNBLOCK_INPUT;
Jim Blandy's avatar
Jim Blandy committed
770 771
  return val;
}
772 773


774 775 776 777 778 779 780 781


/* Return true if the lisp code read using READCHARFUN defines a non-nil
   `lexical-binding' file variable.  After returning, the stream is
   positioned following the first line, if it is a comment, otherwise
   nothing is read.  */

static int
Stefan Monnier's avatar
Stefan Monnier committed
782
lisp_file_lexically_bound_p (Lisp_Object readcharfun)
783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799
{
  int ch = READCHAR;
  if (ch != ';')
    /* The first line isn't a comment, just give up.  */
    {
      UNREAD (ch);
      return 0;
    }
  else
    /* Look for an appropriate file-variable in the first line.  */
    {
      int rv = 0;
      enum {
	NOMINAL, AFTER_FIRST_DASH, AFTER_ASTERIX,
      } beg_end_state = NOMINAL;
      int in_file_vars = 0;

800 801 802 803 804 805 806 807 808 809
#define UPDATE_BEG_END_STATE(ch)				\
  if (beg_end_state == NOMINAL)					\
    beg_end_state = (ch == '-' ? AFTER_FIRST_DASH : NOMINAL);	\
  else if (beg_end_state == AFTER_FIRST_DASH)			\
    beg_end_state = (ch == '*' ? AFTER_ASTERIX : NOMINAL);	\
  else if (beg_end_state == AFTER_ASTERIX)			\
    {								\
      if (ch == '-')						\
	in_file_vars = !in_file_vars;				\
      beg_end_state = NOMINAL;					\
810 811 812 813 814 815 816 817 818 819 820 821
    }

      /* Skip until we get to the file vars, if any.  */
      do
	{
	  ch = READCHAR;
	  UPDATE_BEG_END_STATE (ch);
	}
      while (!in_file_vars && ch != '\n' && ch != EOF);

      while (in_file_vars)
	{
822
	  char var[100], val[100];
823
	  unsigned i;
824 825 826 827 828 829 830

	  ch = READCHAR;

	  /* Read a variable name.  */
	  while (ch == ' ' || ch == '\t')
	    ch = READCHAR;

831
	  i = 0;
832 833
	  while (ch != ':' && ch != '\n' && ch != EOF)
	    {
834 835
	      if (i < sizeof var - 1)
		var[i++] = ch;
836 837 838
	      UPDATE_BEG_END_STATE (ch);
	      ch = READCHAR;
	    }
839

840 841 842
	  while (i > 0 && (var[i - 1] == ' ' || var[i - 1] == '\t'))
	    i--;
	  var[i] = '\0';
843 844 845 846 847 848 849 850 851

	  if (ch == ':')
	    {
	      /* Read a variable value.  */
	      ch = READCHAR;

	      while (ch == ' ' || ch == '\t')
		ch = READCHAR;

852
	      i = 0;
853 854
	      while (ch != ';' && ch != '\n' && ch != EOF && in_file_vars)
		{
855 856
		  if (i < sizeof val - 1)
		    val[i++] = ch;
857 858 859 860 861 862
		  UPDATE_BEG_END_STATE (ch);
		  ch = READCHAR;
		}
	      if (! in_file_vars)
		/* The value was terminated by an end-marker, which
		   remove.  */
863 864 865 866
		i -= 3;
	      while (i > 0 && (val[i - 1] == ' ' || val[i - 1] == '\t'))
		i--;
	      val[i] = '\0';
867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882

	      if (strcmp (var, "lexical-binding") == 0)
		/* This is it...  */
		{
		  rv = (strcmp (val, "nil") != 0);
		  break;
		}
	    }
	}

      while (ch != '\n' && ch != EOF)
	ch = READCHAR;

      return rv;
    }
}
883

Kenichi Handa's avatar
Kenichi Handa committed
884
/* Value is a version number of byte compiled code if the file
Miles Bader's avatar
Miles Bader committed
885
   associated with file descriptor FD is a compiled Lisp file that's
Kenichi Handa's avatar
Kenichi Handa committed
886 887 888
   safe to load.  Only files compiled with Emacs are safe to load.
   Files compiled with XEmacs can lead to a crash in Fbyte_code
   because of an incompatible change in the byte compiler.  */
889 890

static int
891
safe_to_load_p (int fd)
892 893 894 895
{
  char buf[512];
  int nbytes, i;
  int safe_p = 1;
Kenichi Handa's avatar
Kenichi Handa committed
896
  int version = 1;
897 898 899 900 901 902 903 904 905

  /* Read the first few bytes from the file, and look for a line
     specifying the byte compiler version used.  */
  nbytes = emacs_read (fd, buf, sizeof buf - 1);
  if (nbytes > 0)
    {
      buf[nbytes] = '\0';

      /* Skip to the next newline, skipping over the initial `ELC'
Dave Love's avatar
Dave Love committed
906
	 with NUL bytes following it, but note the version.  */
907
      for (i = 0; i < nbytes && buf[i] != '\n'; ++i)
Dave Love's avatar
Dave Love committed
908
	if (i == 4)
Kenichi Handa's avatar
Kenichi Handa committed
909
	  version = buf[i];
910

911
      if (i >= nbytes
912
	  || fast_c_string_match_ignore_case (Vbytecomp_version_regexp,
913 914 915
					      buf + i) < 0)
	safe_p = 0;
    }
Dave Love's avatar
Dave Love committed
916 917
  if (safe_p)
    safe_p = version;
918 919 920 921 922 923

  lseek (fd, 0, SEEK_SET);
  return safe_p;
}


924 925 926 927
/* Callback for record_unwind_protect.  Restore the old load list OLD,
   after loading a file successfully.  */

static Lisp_Object
928
record_load_unwind (Lisp_Object old)
929 930 931 932
{
  return Vloads_in_progress = old;
}

933 934 935
/* This handler function is used via internal_condition_case_1.  */

static Lisp_Object
936
load_error_handler (Lisp_Object data)
937 938 939
{
  return Qnil;
}
940

941
static Lisp_Object
942
load_warn_old_style_backquotes (Lisp_Object file)
943 944 945
{
  if (!NILP (Vold_style_backquotes))
    {
946
      Lisp_Object args[2];
947
      args[0] = build_string ("Loading `%s': old-style backquotes detected!");
948 949 950 951 952 953
      args[1] = file;
      Fmessage (2, args);
    }
  return Qnil;
}

954
DEFUE ("get-load-suffixes", Fget_load_suffixes, Sget_load_suffixes, 0, 0, 0,
955 956 957
       doc: /* Return the suffixes that `load' should try if a suffix is \
required.
This uses the variables `load-suffixes' and `load-file-rep-suffixes'.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
958
  (void)
959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975
{
  Lisp_Object lst = Qnil, suffixes = Vload_suffixes, suffix, ext;
  while (CONSP (suffixes))
    {
      Lisp_Object exts = Vload_file_rep_suffixes;
      suffix = XCAR (suffixes);
      suffixes = XCDR (suffixes);
      while (CONSP (exts))
	{
	  ext = XCAR (exts);
	  exts = XCDR (exts);
	  lst = Fcons (concat2 (suffix, ext), lst);
	}
    }
  return Fnreverse (lst);
}

976
DEFUE ("load", Fload, Sload, 1, 5, 0,
977 978
       doc: /* Execute a file of Lisp code named FILE.
First try FILE with `.elc' appended, then try with `.el',
979
then try FILE unmodified (the exact suffixes in the exact order are
980
determined by `load-suffixes').  Environment variable references in
981
FILE are replaced with their values by calling `substitute-in-file-name'.
982
This function searches the directories in `load-path'.
983

984
If optional second arg NOERROR is non-nil,
985
report no error if FILE doesn't exist.
986
Print messages at start and end of loading unless
987 988
optional third arg NOMESSAGE is non-nil (but `force-load-messages'
overrides that).
989
If optional fourth arg NOSUFFIX is non-nil, don't try adding
990
suffixes `.elc' or `.el' to the specified name FILE.
991
If optional fifth arg MUST-SUFFIX is non-nil, insist on
992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006
the suffix `.elc' or `.el'; don't accept just F