lread.c 132 KB
Newer Older
Jim Blandy's avatar
Jim Blandy committed
1
/* Lisp parsing and input streams.
2

3
Copyright (C) 1985-1989, 1993-1995, 1997-2012  Free Software Foundation, Inc.
Jim Blandy's avatar
Jim Blandy committed
4 5 6

This file is part of GNU Emacs.

7
GNU Emacs is free software: you can redistribute it and/or modify
Jim Blandy's avatar
Jim Blandy committed
8
it under the terms of the GNU General Public License as published by
9 10
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
Jim Blandy's avatar
Jim Blandy committed
11 12 13 14 15 16 17

GNU Emacs is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
18
along with GNU Emacs.  If not, see <http://www.gnu.org/licenses/>.  */
Jim Blandy's avatar
Jim Blandy committed
19 20


Richard M. Stallman's avatar
Richard M. Stallman committed
21
#include <config.h>
Jim Blandy's avatar
Jim Blandy committed
22 23 24 25
#include <stdio.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <sys/file.h>
26
#include <errno.h>
27
#include <limits.h>	/* For CHAR_BIT.  */
28
#include <setjmp.h>
Jim Blandy's avatar
Jim Blandy committed
29
#include "lisp.h"
30
#include "intervals.h"
Kenichi Handa's avatar
Kenichi Handa committed
31
#include "character.h"
32
#include "buffer.h"
Karl Heuer's avatar
Karl Heuer committed
33
#include "charset.h"
Kenichi Handa's avatar
Kenichi Handa committed
34
#include "coding.h"
35
#include <epaths.h>
Jim Blandy's avatar
Jim Blandy committed
36
#include "commands.h"
Jim Blandy's avatar
Jim Blandy committed
37
#include "keyboard.h"
38
#include "frame.h"
39
#include "termhooks.h"
40
#include "coding.h"
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
41
#include "blockinput.h"
Jim Blandy's avatar
Jim Blandy committed
42

43 44 45 46
#ifdef MSDOS
#include "msdos.h"
#endif

Andreas Schwab's avatar
Andreas Schwab committed
47
#include <unistd.h>
Jim Blandy's avatar
Jim Blandy committed
48 49
#include <math.h>

Richard M. Stallman's avatar
Richard M. Stallman committed
50 51 52 53
#ifdef HAVE_SETLOCALE
#include <locale.h>
#endif /* HAVE_SETLOCALE */

Dave Love's avatar
Dave Love committed
54
#include <fcntl.h>
Richard M. Stallman's avatar
Richard M. Stallman committed
55

56
/* Type of a stdio file position and the function used to query it.
   When HAVE_FSEEKO is defined the off_t-based pair is used; otherwise
   fall back to the long-based ftell.  */
#ifndef HAVE_FSEEKO
# define file_offset long
# define file_tell ftell
#else
# define file_offset off_t
# define file_tell ftello
#endif

64
/* Hash table read constants.  */
static Lisp_Object Qhash_table;
static Lisp_Object Qdata;
static Lisp_Object Qtest;
static Lisp_Object Qsize;
static Lisp_Object Qweakness;
static Lisp_Object Qrehash_size;
static Lisp_Object Qrehash_threshold;

static Lisp_Object Qread_char;
static Lisp_Object Qget_file_char;
static Lisp_Object Qcurrent_load_list;
Lisp_Object Qstandard_input;
Lisp_Object Qvariable_documentation;
static Lisp_Object Qascii_character;
static Lisp_Object Qload;
static Lisp_Object Qload_file_name;
Lisp_Object Qbackquote;
Lisp_Object Qcomma;
Lisp_Object Qcomma_at;
Lisp_Object Qcomma_dot;
Lisp_Object Qfunction;
static Lisp_Object Qinhibit_file_name_operation;
static Lisp_Object Qeval_buffer_list;
static Lisp_Object Qlexical_binding;
static Lisp_Object Qfile_truename;		/* ACM 2006/5/16 */
static Lisp_Object Qdo_after_load_evaluation;	/* ACM 2006/5/16 */

/* Stream designator used in place of Qget_file_char while loading
   *.elc files compiled by Emacs 21 or older.  */
static Lisp_Object Qget_emacs_mule_file_char;

static Lisp_Object Qload_force_doc_strings;

/* Defined in another file.  */
extern Lisp_Object Qinternal_interpreter_environment;

static Lisp_Object Qload_in_progress;
Ken Raeburn's avatar
Ken Raeburn committed
90

91 92 93 94
/* The association list of objects read with the #n=object form.
   Each member of the list has the form (n . object), and is used to
   look up the object for the corresponding #n# construct.
   It must be set to nil before all top-level calls to read0.  */
95
static Lisp_Object read_objects;
96

Kenichi Handa's avatar
Kenichi Handa committed
97 98 99 100 101
/* Nonzero means READCHAR should read bytes one by one (not character)
   when READCHARFUN is Qget_file_char or Qget_emacs_mule_file_char.
   This is set to 1 by read1 temporarily while handling #@NUMBER.  */
static int load_each_byte;

102 103 104
/* List of descriptors now open for Fload.  */
static Lisp_Object load_descriptor_list;

105
/* File for get_file_char to read from.  Use by load.  */
Jim Blandy's avatar
Jim Blandy committed
106 107
static FILE *instream;

108
/* For use within read-from-string (this reader is non-reentrant!!)  */
109 110 111
static ptrdiff_t read_from_string_index;
static ptrdiff_t read_from_string_index_byte;
static ptrdiff_t read_from_string_limit;
112

113
/* Number of characters read in the current call to Fread or
114
   Fread_from_string.  */
115
static EMACS_INT readchar_count;
116

117
/* This contains the last string skipped with #@.  */
118 119
static char *saved_doc_string;
/* Length of buffer allocated in saved_doc_string.  */
120
static ptrdiff_t saved_doc_string_size;
121
/* Length of actual data in saved_doc_string.  */
122
static ptrdiff_t saved_doc_string_length;
123
/* This is the file position that string came from.  */
124
static file_offset saved_doc_string_position;
125

126 127 128 129 130
/* This contains the previous string skipped with #@.
   We copy it from saved_doc_string when a new string
   is put in saved_doc_string.  */
static char *prev_saved_doc_string;
/* Length of buffer allocated in prev_saved_doc_string.  */
131
static ptrdiff_t prev_saved_doc_string_size;
132
/* Length of actual data in prev_saved_doc_string.  */
133
static ptrdiff_t prev_saved_doc_string_length;
134
/* This is the file position that string came from.  */
135
static file_offset prev_saved_doc_string_position;
136

137 138 139 140 141
/* Nonzero means inside a new-style backquote
   with no surrounding parentheses.
   Fread initializes this to zero, so we need not specbind it
   or worry about what happens to it when there is an error.  */
static int new_backquote_flag;
142
static Lisp_Object Qold_style_backquotes;
143 144 145 146

/* A list of file names for files being loaded in Fload.  Used to
   check for recursive loads.  */

Lute Kamstra's avatar
Lute Kamstra committed
147
static Lisp_Object Vloads_in_progress;
148

149 150
static int read_emacs_mule_char (int, int (*) (int, Lisp_Object),
                                 Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
151

152
static void readevalloop (Lisp_Object, FILE*, Lisp_Object, int,
153 154 155 156
                          Lisp_Object, Lisp_Object,
                          Lisp_Object, Lisp_Object);
static Lisp_Object load_unwind (Lisp_Object);
static Lisp_Object load_descriptor_unwind (Lisp_Object);
157

158
static void invalid_syntax (const char *) NO_RETURN;
159
static void end_of_file_error (void) NO_RETURN;
160

Jim Blandy's avatar
Jim Blandy committed
161

Kenichi Handa's avatar
Kenichi Handa committed
162 163 164 165 166 167
/* Functions that read one byte from the current source READCHARFUN
   or unreads one byte.  If the integer argument C is -1, it returns
   one read byte, or -1 when there's no more byte in the source.  If C
   is 0 or positive, it unreads C, and the return value is not
   interesting.  */

168 169 170
static int readbyte_for_lambda (int, Lisp_Object);
static int readbyte_from_file (int, Lisp_Object);
static int readbyte_from_string (int, Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
171

Jim Blandy's avatar
Jim Blandy committed
172 173
/* Reading and pushing back characters.
   READCHAR reads one character from the stream held in the local
   variable `readcharfun'; UNREAD (c) pushes C back so that the next
   READCHAR returns it again.

   Both macros handle multibyte characters correctly.  */

#define READCHAR readchar (readcharfun, NULL)
#define UNREAD(c) unreadchar (readcharfun, (c))

/* Like READCHAR, but additionally store the multibyteness of the
   source in *MULTIBYTE.  */
#define READCHAR_REPORT_MULTIBYTE(multibyte) \
  readchar (readcharfun, (multibyte))

/* One-character pushback slot, needed because a file stream cannot
   unread a multibyte character.  It is used when READCHARFUN is
   Qget_file_char, Qget_emacs_mule_file_char, Qlambda, or a cons.
   The value -1 means that no character is pending.  */
static int unread_char;

Jim Blandy's avatar
Jim Blandy committed
190
static int
191
readchar (Lisp_Object readcharfun, int *multibyte)
Jim Blandy's avatar
Jim Blandy committed
192 193
{
  Lisp_Object tem;
194
  register int c;
195
  int (*readbyte) (int, Lisp_Object);
Kenichi Handa's avatar
Kenichi Handa committed
196 197 198
  unsigned char buf[MAX_MULTIBYTE_LENGTH];
  int i, len;
  int emacs_mule_encoding = 0;
Jim Blandy's avatar
Jim Blandy committed
199

200 201 202
  if (multibyte)
    *multibyte = 0;

203
  readchar_count++;
204

205
  if (BUFFERP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
206
    {
207
      register struct buffer *inbuffer = XBUFFER (readcharfun);
Jim Blandy's avatar
Jim Blandy committed
208

209
      ptrdiff_t pt_byte = BUF_PT_BYTE (inbuffer);
210

211 212
      if (pt_byte >= BUF_ZV_BYTE (inbuffer))
	return -1;
Jim Blandy's avatar
Jim Blandy committed
213

Tom Tromey's avatar
Tom Tromey committed
214
      if (! NILP (BVAR (inbuffer, enable_multibyte_characters)))
215
	{
216
	  /* Fetch the character code from the buffer.  */
217 218
	  unsigned char *p = BUF_BYTE_ADDRESS (inbuffer, pt_byte);
	  BUF_INC_POS (inbuffer, pt_byte);
219
	  c = STRING_CHAR (p);
220 221
	  if (multibyte)
	    *multibyte = 1;
222 223 224 225
	}
      else
	{
	  c = BUF_FETCH_BYTE (inbuffer, pt_byte);
Kenichi Handa's avatar
Kenichi Handa committed
226 227
	  if (! ASCII_BYTE_P (c))
	    c = BYTE8_TO_CHAR (c);
228
	  pt_byte++;
229
	}
230
      SET_BUF_PT_BOTH (inbuffer, BUF_PT (inbuffer) + 1, pt_byte);
231

232
      return c;
Jim Blandy's avatar
Jim Blandy committed
233
    }
234
  if (MARKERP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
235
    {
236
      register struct buffer *inbuffer = XMARKER (readcharfun)->buffer;
Jim Blandy's avatar
Jim Blandy committed
237

238
      ptrdiff_t bytepos = marker_byte_position (readcharfun);
239

240 241
      if (bytepos >= BUF_ZV_BYTE (inbuffer))
	return -1;
242

Tom Tromey's avatar
Tom Tromey committed
243
      if (! NILP (BVAR (inbuffer, enable_multibyte_characters)))
244
	{
245
	  /* Fetch the character code from the buffer.  */
246 247
	  unsigned char *p = BUF_BYTE_ADDRESS (inbuffer, bytepos);
	  BUF_INC_POS (inbuffer, bytepos);
248
	  c = STRING_CHAR (p);
249 250
	  if (multibyte)
	    *multibyte = 1;
251 252 253 254
	}
      else
	{
	  c = BUF_FETCH_BYTE (inbuffer, bytepos);
Kenichi Handa's avatar
Kenichi Handa committed
255 256
	  if (! ASCII_BYTE_P (c))
	    c = BYTE8_TO_CHAR (c);
257
	  bytepos++;
258 259
	}

260 261 262 263
      XMARKER (readcharfun)->bytepos = bytepos;
      XMARKER (readcharfun)->charpos++;

      return c;
Jim Blandy's avatar
Jim Blandy committed
264
    }
265 266

  if (EQ (readcharfun, Qlambda))
Kenichi Handa's avatar
Kenichi Handa committed
267 268 269 270
    {
      readbyte = readbyte_for_lambda;
      goto read_multibyte;
    }
271

Jim Blandy's avatar
Jim Blandy committed
272
  if (EQ (readcharfun, Qget_file_char))
273
    {
Kenichi Handa's avatar
Kenichi Handa committed
274 275
      readbyte = readbyte_from_file;
      goto read_multibyte;
276
    }
Jim Blandy's avatar
Jim Blandy committed
277

278
  if (STRINGP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
279
    {
280
      if (read_from_string_index >= read_from_string_limit)
Jim Blandy's avatar
Jim Blandy committed
281
	c = -1;
282 283 284 285 286 287 288 289
      else if (STRING_MULTIBYTE (readcharfun))
	{
	  if (multibyte)
	    *multibyte = 1;
	  FETCH_STRING_CHAR_ADVANCE_NO_CHECK (c, readcharfun,
					      read_from_string_index,
					      read_from_string_index_byte);
	}
290
      else
291 292 293 294 295
	{
	  c = SREF (readcharfun, read_from_string_index_byte);
	  read_from_string_index++;
	  read_from_string_index_byte++;
	}
Jim Blandy's avatar
Jim Blandy committed
296 297 298
      return c;
    }

Kenichi Handa's avatar
Kenichi Handa committed
299 300 301 302 303 304 305 306 307 308 309 310
  if (CONSP (readcharfun))
    {
      /* This is the case that read_vector is reading from a unibyte
	 string that contains a byte sequence previously skipped
	 because of #@NUMBER.  The car part of readcharfun is that
	 string, and the cdr part is a value of readcharfun given to
	 read_vector.  */
      readbyte = readbyte_from_string;
      if (EQ (XCDR (readcharfun), Qget_emacs_mule_file_char))
	emacs_mule_encoding = 1;
      goto read_multibyte;
    }
Kenichi Handa's avatar
Kenichi Handa committed
311

Kenichi Handa's avatar
Kenichi Handa committed
312 313 314 315 316 317
  if (EQ (readcharfun, Qget_emacs_mule_file_char))
    {
      readbyte = readbyte_from_file;
      emacs_mule_encoding = 1;
      goto read_multibyte;
    }
Jim Blandy's avatar
Jim Blandy committed
318 319 320

  tem = call0 (readcharfun);

Jim Blandy's avatar
Jim Blandy committed
321
  if (NILP (tem))
Jim Blandy's avatar
Jim Blandy committed
322 323
    return -1;
  return XINT (tem);
Kenichi Handa's avatar
Kenichi Handa committed
324 325 326 327 328 329 330 331 332

 read_multibyte:
  if (unread_char >= 0)
    {
      c = unread_char;
      unread_char = -1;
      return c;
    }
  c = (*readbyte) (-1, readcharfun);
333 334 335 336 337
  if (c < 0 || load_each_byte)
    return c;
  if (multibyte)
    *multibyte = 1;
  if (ASCII_BYTE_P (c))
Kenichi Handa's avatar
Kenichi Handa committed
338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354
    return c;
  if (emacs_mule_encoding)
    return read_emacs_mule_char (c, readbyte, readcharfun);
  i = 0;
  buf[i++] = c;
  len = BYTES_BY_CHAR_HEAD (c);
  while (i < len)
    {
      c = (*readbyte) (-1, readcharfun);
      if (c < 0 || ! TRAILING_CODE_P (c))
	{
	  while (--i > 1)
	    (*readbyte) (buf[i], readcharfun);
	  return BYTE8_TO_CHAR (buf[0]);
	}
      buf[i++] = c;
    }
355
  return STRING_CHAR (buf);
Jim Blandy's avatar
Jim Blandy committed
356 357 358 359 360 361
}

/* Unread the character C in the way appropriate for the stream READCHARFUN.
   If the stream is a user function, call it with the char as argument.  */

static void
362
unreadchar (Lisp_Object readcharfun, int c)
Jim Blandy's avatar
Jim Blandy committed
363
{
364
  readchar_count--;
365 366 367 368
  if (c == -1)
    /* Don't back up the pointer if we're unreading the end-of-input mark,
       since readchar didn't advance it when we read it.  */
    ;
369
  else if (BUFFERP (readcharfun))
370
    {
371
      struct buffer *b = XBUFFER (readcharfun);
372 373
      ptrdiff_t charpos = BUF_PT (b);
      ptrdiff_t bytepos = BUF_PT_BYTE (b);
374

Tom Tromey's avatar
Tom Tromey committed
375
      if (! NILP (BVAR (b, enable_multibyte_characters)))
Kenichi Handa's avatar
Kenichi Handa committed
376
	BUF_DEC_POS (b, bytepos);
377
      else
Kenichi Handa's avatar
Kenichi Handa committed
378
	bytepos--;
379

380
      SET_BUF_PT_BOTH (b, charpos - 1, bytepos);
381
    }
382
  else if (MARKERP (readcharfun))
383
    {
384
      struct buffer *b = XMARKER (readcharfun)->buffer;
385
      ptrdiff_t bytepos = XMARKER (readcharfun)->bytepos;
386

Kenichi Handa's avatar
Kenichi Handa committed
387
      XMARKER (readcharfun)->charpos--;
Tom Tromey's avatar
Tom Tromey committed
388
      if (! NILP (BVAR (b, enable_multibyte_characters)))
Kenichi Handa's avatar
Kenichi Handa committed
389
	BUF_DEC_POS (b, bytepos);
390
      else
Kenichi Handa's avatar
Kenichi Handa committed
391
	bytepos--;
392

Kenichi Handa's avatar
Kenichi Handa committed
393
      XMARKER (readcharfun)->bytepos = bytepos;
394
    }
395
  else if (STRINGP (readcharfun))
396 397 398 399 400
    {
      read_from_string_index--;
      read_from_string_index_byte
	= string_char_to_byte (readcharfun, read_from_string_index);
    }
Kenichi Handa's avatar
Kenichi Handa committed
401 402 403 404
  else if (CONSP (readcharfun))
    {
      unread_char = c;
    }
405
  else if (EQ (readcharfun, Qlambda))
Kenichi Handa's avatar
Kenichi Handa committed
406 407 408 409 410 411 412
    {
      unread_char = c;
    }
  else if (EQ (readcharfun, Qget_file_char)
	   || EQ (readcharfun, Qget_emacs_mule_file_char))
    {
      if (load_each_byte)
Miles Bader's avatar
Miles Bader committed
413 414 415 416 417
	{
	  BLOCK_INPUT;
	  ungetc (c, instream);
	  UNBLOCK_INPUT;
	}
Kenichi Handa's avatar
Kenichi Handa committed
418 419 420
      else
	unread_char = c;
    }
Jim Blandy's avatar
Jim Blandy committed
421 422 423 424
  else
    call1 (readcharfun, make_number (c));
}

Kenichi Handa's avatar
Kenichi Handa committed
425
static int
426
readbyte_for_lambda (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
427 428 429 430 431 432
{
  return read_bytecode_char (c >= 0);
}


static int
433
readbyte_from_file (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
434 435 436
{
  if (c >= 0)
    {
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
437
      BLOCK_INPUT;
Kenichi Handa's avatar
Kenichi Handa committed
438
      ungetc (c, instream);
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
439
      UNBLOCK_INPUT;
Kenichi Handa's avatar
Kenichi Handa committed
440 441 442
      return 0;
    }

Miles Bader's avatar
Miles Bader committed
443
  BLOCK_INPUT;
Kenichi Handa's avatar
Kenichi Handa committed
444
  c = getc (instream);
Miles Bader's avatar
Miles Bader committed
445

Kenichi Handa's avatar
Kenichi Handa committed
446
#ifdef EINTR
447
  /* Interrupted reads have been observed while reading over the network.  */
Miles Bader's avatar
Miles Bader committed
448 449
  while (c == EOF && ferror (instream) && errno == EINTR)
    {
Miles Bader's avatar
Miles Bader committed
450
      UNBLOCK_INPUT;
Miles Bader's avatar
Miles Bader committed
451 452
      QUIT;
      BLOCK_INPUT;
Miles Bader's avatar
Miles Bader committed
453
      clearerr (instream);
Miles Bader's avatar
Miles Bader committed
454
      c = getc (instream);
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
455
    }
Kenichi Handa's avatar
Kenichi Handa committed
456
#endif
Miles Bader's avatar
Miles Bader committed
457

Miles Bader's avatar
Miles Bader committed
458 459
  UNBLOCK_INPUT;

Kenichi Handa's avatar
Kenichi Handa committed
460 461 462 463
  return (c == EOF ? -1 : c);
}

static int
464
readbyte_from_string (int c, Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
465 466 467 468 469 470 471 472 473
{
  Lisp_Object string = XCAR (readcharfun);

  if (c >= 0)
    {
      read_from_string_index--;
      read_from_string_index_byte
	= string_char_to_byte (string, read_from_string_index);
    }
Kenichi Handa's avatar
Kenichi Handa committed
474

Kenichi Handa's avatar
Kenichi Handa committed
475 476 477 478 479 480 481 482 483 484 485 486 487 488 489
  if (read_from_string_index >= read_from_string_limit)
    c = -1;
  else
    FETCH_STRING_CHAR_ADVANCE (c, string,
			       read_from_string_index,
			       read_from_string_index_byte);
  return c;
}


/* Read one non-ASCII character from INSTREAM.  The character is
   encoded in `emacs-mule' and the first byte is already read in
   C.  */

static int
490
read_emacs_mule_char (int c, int (*readbyte) (int, Lisp_Object), Lisp_Object readcharfun)
Kenichi Handa's avatar
Kenichi Handa committed
491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518
{
  /* Emacs-mule coding uses at most 4-byte for one character.  */
  unsigned char buf[4];
  int len = emacs_mule_bytes[c];
  struct charset *charset;
  int i;
  unsigned code;

  if (len == 1)
    /* C is not a valid leading-code of `emacs-mule'.  */
    return BYTE8_TO_CHAR (c);

  i = 0;
  buf[i++] = c;
  while (i < len)
    {
      c = (*readbyte) (-1, readcharfun);
      if (c < 0xA0)
	{
	  while (--i > 1)
	    (*readbyte) (buf[i], readcharfun);
	  return BYTE8_TO_CHAR (buf[0]);
	}
      buf[i++] = c;
    }

  if (len == 2)
    {
519
      charset = CHARSET_FROM_ID (emacs_mule_charset[buf[0]]);
Kenichi Handa's avatar
Kenichi Handa committed
520 521 522 523 524 525 526
      code = buf[1] & 0x7F;
    }
  else if (len == 3)
    {
      if (buf[0] == EMACS_MULE_LEADING_CODE_PRIVATE_11
	  || buf[0] == EMACS_MULE_LEADING_CODE_PRIVATE_12)
	{
527
	  charset = CHARSET_FROM_ID (emacs_mule_charset[buf[1]]);
Kenichi Handa's avatar
Kenichi Handa committed
528 529 530 531
	  code = buf[2] & 0x7F;
	}
      else
	{
532
	  charset = CHARSET_FROM_ID (emacs_mule_charset[buf[0]]);
Kenichi Handa's avatar
Kenichi Handa committed
533 534 535 536 537
	  code = ((buf[1] << 8) | buf[2]) & 0x7F7F;
	}
    }
  else
    {
538
      charset = CHARSET_FROM_ID (emacs_mule_charset[buf[1]]);
Kenichi Handa's avatar
Kenichi Handa committed
539
      code = ((buf[2] << 8) | buf[3]) & 0x7F7F;
Kenichi Handa's avatar
Kenichi Handa committed
540 541 542 543 544 545 546 547 548
    }
  c = DECODE_CHAR (charset, code);
  if (c < 0)
    Fsignal (Qinvalid_read_syntax,
	     Fcons (build_string ("invalid multibyte form"), Qnil));
  return c;
}


549 550 551 552
/* Forward declarations for the reader proper.  */
static Lisp_Object read_internal_start (Lisp_Object, Lisp_Object, Lisp_Object);
static Lisp_Object read0 (Lisp_Object);
static Lisp_Object read1 (Lisp_Object, int *, int);

static Lisp_Object read_list (int, Lisp_Object);
static Lisp_Object read_vector (Lisp_Object, int);

/* Forward declarations for object substitution.  */
static Lisp_Object substitute_object_recurse (Lisp_Object, Lisp_Object, Lisp_Object);
static void substitute_object_in_subtree (Lisp_Object, Lisp_Object);
static void substitute_in_interval (INTERVAL, Lisp_Object);
562

Jim Blandy's avatar
Jim Blandy committed
563

564
/* Get a character from the tty.  */
Jim Blandy's avatar
Jim Blandy committed
565

566 567 568 569 570 571 572 573 574 575 576 577 578
/* Read input events until we get one that's acceptable for our purposes.

   If NO_SWITCH_FRAME is non-zero, switch-frame events are stashed
   until we get a character we like, and then stuffed into
   unread_switch_frame.

   If ASCII_REQUIRED is non-zero, we check function key events to see
   if the unmodified version of the symbol has a Qascii_character
   property, and use that character, if present.

   If ERROR_NONASCII is non-zero, we signal an error if the input we
   get isn't an ASCII character with modifiers.  If it's zero but
   ASCII_REQUIRED is non-zero, we just re-read until we get an ASCII
579 580 581
   character.

   If INPUT_METHOD is nonzero, we invoke the current input method
582 583 584 585
   if the character warrants that.

   If SECONDS is a number, we wait that many seconds for input, and
   return Qnil if no input arrives within that time.  */
586

Andreas Schwab's avatar
Andreas Schwab committed
587
static Lisp_Object
Andreas Schwab's avatar
Andreas Schwab committed
588 589
read_filtered_event (int no_switch_frame, int ascii_required,
		     int error_nonascii, int input_method, Lisp_Object seconds)
590
{
591
  Lisp_Object val, delayed_switch_frame;
592
  EMACS_TIME end_time;
593

594
#ifdef HAVE_WINDOW_SYSTEM
595 596
  if (display_hourglass_p)
    cancel_hourglass ();
597
#endif
598

599
  delayed_switch_frame = Qnil;
600

601 602 603 604 605
  /* Compute timeout.  */
  if (NUMBERP (seconds))
    {
      EMACS_TIME wait_time;
      int sec, usec;
606
      double duration = extract_float (seconds);
607

608 609 610 611 612
      if (0 < duration)
	duration_to_sec_usec (duration, &sec, &usec);
      else
	sec = usec = 0;

613 614 615 616 617
      EMACS_GET_TIME (end_time);
      EMACS_SET_SECS_USECS (wait_time, sec, usec);
      EMACS_ADD_TIME (end_time, end_time, wait_time);
    }

Karoly Lorentey's avatar
Karoly Lorentey committed
618
/* Read until we get an acceptable event.  */
619
 retry:
620
  do
Karoly Lorentey's avatar
Karoly Lorentey committed
621 622
    val = read_char (0, 0, 0, (input_method ? Qnil : Qt), 0,
		     NUMBERP (seconds) ? &end_time : NULL);
623
  while (INTEGERP (val) && XINT (val) == -2); /* wrong_kboard_jmpbuf */
624

625
  if (BUFFERP (val))
626 627
    goto retry;

628
  /* switch-frame events are put off until after the next ASCII
Karl Heuer's avatar
Karl Heuer committed
629
     character.  This is better than signaling an error just because
630 631 632 633 634
     the last characters were typed to a separate minibuffer frame,
     for example.  Eventually, some code which can deal with
     switch-frame events will read it and process it.  */
  if (no_switch_frame
      && EVENT_HAS_PARAMETERS (val)
635
      && EQ (EVENT_HEAD_KIND (EVENT_HEAD (val)), Qswitch_frame))
636 637 638 639 640
    {
      delayed_switch_frame = val;
      goto retry;
    }

641
  if (ascii_required && !(NUMBERP (seconds) && NILP (val)))
642 643
    {
      /* Convert certain symbols to their ASCII equivalents.  */
644
      if (SYMBOLP (val))
645
	{
646
	  Lisp_Object tem, tem1;
647 648 649 650 651 652 653
	  tem = Fget (val, Qevent_symbol_element_mask);
	  if (!NILP (tem))
	    {
	      tem1 = Fget (Fcar (tem), Qascii_character);
	      /* Merge this symbol's modifier bits
		 with the ASCII equivalent of its basic code.  */
	      if (!NILP (tem1))
654
		XSETFASTINT (val, XINT (tem1) | XINT (Fcar (Fcdr (tem))));
655 656
	    }
	}
657

658
      /* If we don't have a character now, deal with it appropriately.  */
659
      if (!INTEGERP (val))
660 661 662
	{
	  if (error_nonascii)
	    {
663
	      Vunread_command_events = Fcons (val, Qnil);
664 665 666 667 668 669 670 671 672 673
	      error ("Non-character input-event");
	    }
	  else
	    goto retry;
	}
    }

  if (! NILP (delayed_switch_frame))
    unread_switch_frame = delayed_switch_frame;

674 675
#if 0

676
#ifdef HAVE_WINDOW_SYSTEM
677 678
  if (display_hourglass_p)
    start_hourglass ();
679
#endif
680 681 682

#endif

683 684 685
  return val;
}

Paul Eggert's avatar
Paul Eggert committed
686
DEFUN ("read-char", Fread_char, Sread_char, 0, 3, 0,
687 688
       doc: /* Read a character from the command input (keyboard or macro).
It is returned as a number.
689 690 691
If the character has modifiers, they are resolved and reflected to the
character code if possible (e.g. C-SPC -> 0).

692 693
If the user generates an event which is not a character (i.e. a mouse
click or function key event), `read-char' signals an error.  As an
694 695
exception, switch-frame events are put off until non-character events
can be read.
696 697 698 699 700 701
If you want to read non-character events, or ignore them, call
`read-event' or `read-char-exclusive' instead.

If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
702 703 704 705 706
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
707
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
708
{
709 710
  Lisp_Object val;

711 712
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
713
  val = read_filtered_event (1, 1, 1, ! NILP (inherit_input_method), seconds);
714 715 716

  return (NILP (val) ? Qnil
	  : make_number (char_resolve_modifier_mask (XINT (val))));
Jim Blandy's avatar
Jim Blandy committed
717 718
}

Paul Eggert's avatar
Paul Eggert committed
719
DEFUN ("read-event", Fread_event, Sread_event, 0, 3, 0,
720 721 722 723
       doc: /* Read an event object from the input stream.
If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
724 725 726 727 728
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
729
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
730
{
731 732
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
733
  return read_filtered_event (0, 0, 0, ! NILP (inherit_input_method), seconds);
Jim Blandy's avatar
Jim Blandy committed
734 735
}

736
DEFUN ("read-char-exclusive", Fread_char_exclusive, Sread_char_exclusive, 0, 3, 0,
737 738
       doc: /* Read a character from the command input (keyboard or macro).
It is returned as a number.  Non-character events are ignored.
739 740
If the character has modifiers, they are resolved and reflected to the
character code if possible (e.g. C-SPC -> 0).
741 742 743 744

If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
745 746 747 748 749
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
750
  (Lisp_Object prompt, Lisp_Object inherit_input_method, Lisp_Object seconds)
Jim Blandy's avatar
Jim Blandy committed
751
{
752 753
  Lisp_Object val;

754 755
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
756

757
  val = read_filtered_event (1, 1, 0, ! NILP (inherit_input_method), seconds);
758 759 760

  return (NILP (val) ? Qnil
	  : make_number (char_resolve_modifier_mask (XINT (val))));
Jim Blandy's avatar
Jim Blandy committed
761 762 763
}

DEFUN ("get-file-char", Fget_file_char, Sget_file_char, 0, 0, 0,
764
       doc: /* Don't use this yourself.  */)
Dan Nicolaescu's avatar
Dan Nicolaescu committed
765
  (void)
Jim Blandy's avatar
Jim Blandy committed
766 767
{
  register Lisp_Object val;
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
768
  BLOCK_INPUT;
769
  XSETINT (val, getc (instream));
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
770
  UNBLOCK_INPUT;
Jim Blandy's avatar
Jim Blandy committed
771 772
  return val;
}
773 774


775 776 777 778 779 780 781 782


/* Return true if the lisp code read using READCHARFUN defines a non-nil
   `lexical-binding' file variable.  After returning, the stream is
   positioned following the first line, if it is a comment, otherwise
   nothing is read.  */

static int
Stefan Monnier's avatar
Stefan Monnier committed
783
lisp_file_lexically_bound_p (Lisp_Object readcharfun)
784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800
{
  int ch = READCHAR;
  if (ch != ';')
    /* The first line isn't a comment, just give up.  */
    {
      UNREAD (ch);
      return 0;
    }
  else
    /* Look for an appropriate file-variable in the first line.  */
    {
      int rv = 0;
      enum {
	NOMINAL, AFTER_FIRST_DASH, AFTER_ASTERIX,
      } beg_end_state = NOMINAL;
      int in_file_vars = 0;

801 802 803 804 805 806 807 808 809 810
#define UPDATE_BEG_END_STATE(ch)				\
  if (beg_end_state == NOMINAL)					\
    beg_end_state = (ch == '-' ? AFTER_FIRST_DASH : NOMINAL);	\
  else if (beg_end_state == AFTER_FIRST_DASH)			\
    beg_end_state = (ch == '*' ? AFTER_ASTERIX : NOMINAL);	\
  else if (beg_end_state == AFTER_ASTERIX)			\
    {								\
      if (ch == '-')						\
	in_file_vars = !in_file_vars;				\
      beg_end_state = NOMINAL;					\
811 812 813 814 815 816 817 818 819 820 821 822
    }

      /* Skip until we get to the file vars, if any.  */
      do
	{
	  ch = READCHAR;
	  UPDATE_BEG_END_STATE (ch);
	}
      while (!in_file_vars && ch != '\n' && ch != EOF);

      while (in_file_vars)
	{
823
	  char var[100], val[100];
824
	  unsigned i;
825 826 827 828 829 830 831

	  ch = READCHAR;

	  /* Read a variable name.  */
	  while (ch == ' ' || ch == '\t')
	    ch = READCHAR;

832
	  i = 0;
833
	  while (ch != ':' && ch != '\n' && ch != EOF && in_file_vars)
834
	    {
835 836
	      if (i < sizeof var - 1)
		var[i++] = ch;
837 838 839
	      UPDATE_BEG_END_STATE (ch);
	      ch = READCHAR;
	    }
840

841
	  /* Stop scanning if no colon was found before end marker.  */
842
	  if (!in_file_vars || ch == '\n' || ch == EOF)
843 844
	    break;

845 846 847
	  while (i > 0 && (var[i - 1] == ' ' || var[i - 1] == '\t'))
	    i--;
	  var[i] = '\0';
848 849 850 851 852 853 854 855 856

	  if (ch == ':')
	    {
	      /* Read a variable value.  */
	      ch = READCHAR;

	      while (ch == ' ' || ch == '\t')
		ch = READCHAR;

857
	      i = 0;
858 859
	      while (ch != ';' && ch != '\n' && ch != EOF && in_file_vars)
		{
860 861
		  if (i < sizeof val - 1)
		    val[i++] = ch;
862 863 864 865
		  UPDATE_BEG_END_STATE (ch);
		  ch = READCHAR;
		}
	      if (! in_file_vars)
866
		/* The value was terminated by an end-marker, which remove.  */
867 868 869 870
		i -= 3;
	      while (i > 0 && (val[i - 1] == ' ' || val[i - 1] == '\t'))
		i--;
	      val[i] = '\0';
871 872 873 874 875 876 877 878 879 880 881 882 883 884 885 886

	      if (strcmp (var, "lexical-binding") == 0)
		/* This is it...  */
		{
		  rv = (strcmp (val, "nil") != 0);
		  break;
		}
	    }
	}

      while (ch != '\n' && ch != EOF)
	ch = READCHAR;

      return rv;
    }
}
887

Kenichi Handa's avatar
Kenichi Handa committed
888
/* Value is a version number of byte compiled code if the file
Miles Bader's avatar
Miles Bader committed
889
   associated with file descriptor FD is a compiled Lisp file that's
Kenichi Handa's avatar
Kenichi Handa committed
890 891 892
   safe to load.  Only files compiled with Emacs are safe to load.
   Files compiled with XEmacs can lead to a crash in Fbyte_code
   because of an incompatible change in the byte compiler.  */
893 894

static int
895
safe_to_load_p (int fd)
896 897 898 899
{
  char buf[512];
  int nbytes, i;
  int safe_p = 1;
Kenichi Handa's avatar
Kenichi Handa committed
900
  int version = 1;
901 902 903 904 905 906 907 908 909

  /* Read the first few bytes from the file, and look for a line
     specifying the byte compiler version used.  */
  nbytes = emacs_read (fd, buf, sizeof buf - 1);
  if (nbytes > 0)
    {
      buf[nbytes] = '\0';

      /* Skip to the next newline, skipping over the initial `ELC'
Dave Love's avatar
Dave Love committed
910
	 with NUL bytes following it, but note the version.  */
911
      for (i = 0; i < nbytes && buf[i] != '\n'; ++i)
Dave Love's avatar
Dave Love committed
912
	if (i == 4)
Kenichi Handa's avatar
Kenichi Handa committed
913
	  version = buf[i];
914

915
      if (i >= nbytes
916
	  || fast_c_string_match_ignore_case (Vbytecomp_version_regexp,
917 918 919
					      buf + i) < 0)
	safe_p = 0;
    }
Dave Love's avatar
Dave Love committed
920 921
  if (safe_p)
    safe_p = version;
922 923 924 925 926 927

  lseek (fd, 0, SEEK_SET);
  return safe_p;
}


928 929 930 931
/* Callback for record_unwind_protect.  Restore the old load list OLD,
   after loading a file successfully.  */

static Lisp_Object
932
record_load_unwind (Lisp_Object old)
933 934 935 936
{
  return Vloads_in_progress = old;
}

937 938 939
/* This handler function is used via internal_condition_case_1.  */

static Lisp_Object
940
load_error_handler (Lisp_Object data)
941 942 943
{
  return Qnil;
}