/* Lisp parsing and input streams.
   Copyright (C) 1985, 1986, 1987, 1988, 1989, 1993, 1994, 1995,
                 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
                 2005, 2006, 2007, 2008, 2009, 2010 Free Software Foundation, Inc.

This file is part of GNU Emacs.

GNU Emacs is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.

GNU Emacs is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with GNU Emacs.  If not, see <http://www.gnu.org/licenses/>.  */


#include <config.h>
#include <stdio.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <sys/file.h>
#include <errno.h>
#include <setjmp.h>
#include "lisp.h"
#include "intervals.h"
#include "buffer.h"
#include "character.h"
#include "charset.h"
#include "coding.h"
#include <epaths.h>
#include "commands.h"
#include "keyboard.h"
#include "frame.h"
#include "termhooks.h"
#include "blockinput.h"

#ifdef MSDOS
#include "msdos.h"
#endif

#ifdef HAVE_UNISTD_H
#include <unistd.h>
#endif

#include <math.h>

#ifdef HAVE_SETLOCALE
#include <locale.h>
#endif /* HAVE_SETLOCALE */

#ifdef HAVE_FCNTL_H
#include <fcntl.h>
#endif
#ifndef O_RDONLY
#define O_RDONLY 0
#endif

/* file_offset is the type used for positions in a stdio stream and
   file_tell the function that reports them: off_t/ftello when
   HAVE_FSEEKO is defined, long/ftell otherwise.  */
#ifdef HAVE_FSEEKO
#define file_offset off_t
#define file_tell ftello
#else
#define file_offset long
#define file_tell ftell
#endif

/* Hash table read constants.  */
Lisp_Object Qhash_table, Qdata;
Lisp_Object Qtest, Qsize;
Lisp_Object Qweakness;
Lisp_Object Qrehash_size;
Lisp_Object Qrehash_threshold;
extern Lisp_Object QCtest, QCsize, QCrehash_size, QCrehash_threshold, QCweakness;

Lisp_Object Qread_char, Qget_file_char, Qstandard_input, Qcurrent_load_list;
Lisp_Object Qvariable_documentation, Vvalues, Vstandard_input, Vafter_load_alist;
Lisp_Object Qascii_character, Qload, Qload_file_name;
Lisp_Object Qbackquote, Qcomma, Qcomma_at, Qcomma_dot, Qfunction;
Lisp_Object Qinhibit_file_name_operation;
Lisp_Object Qeval_buffer_list, Veval_buffer_list;
Lisp_Object Qfile_truename, Qdo_after_load_evaluation; /* ACM 2006/5/16 */

/* Used instead of Qget_file_char while loading *.elc files compiled
   by Emacs 21 or older.  */
static Lisp_Object Qget_emacs_mule_file_char;

static Lisp_Object Qload_force_doc_strings;

extern Lisp_Object Qevent_symbol_element_mask;
extern Lisp_Object Qfile_exists_p;

/* Non-zero if inside `load'.  */
int load_in_progress;
static Lisp_Object Qload_in_progress;
Ken Raeburn's avatar
Ken Raeburn committed
100

/* Directory in which the sources were found.  */
Lisp_Object Vsource_directory;

/* Search path and suffixes for files to be loaded.  */
Lisp_Object Vload_path, Vload_suffixes, Vload_file_rep_suffixes;

/* File name of user's init file.  */
Lisp_Object Vuser_init_file;

/* This is the user-visible association list that maps features to
   lists of defs in their load files.  */
Lisp_Object Vload_history;

/* This is used to build the load history.  */
Lisp_Object Vcurrent_load_list;

/* List of files that were preloaded.  */
Lisp_Object Vpreloaded_file_list;

/* Name of file actually being read by `load'.  */
Lisp_Object Vload_file_name;

/* Function to use for reading, in `load' and friends.  */
Lisp_Object Vload_read_function;

/* Non-nil means read recursive structures using #n= and #n# syntax.  */
Lisp_Object Vread_circle;

/* The association list of objects read with the #n=object form.
   Each member of the list has the form (n . object), and is used to
   look up the object for the corresponding #n# construct.
   It must be set to nil before all top-level calls to read0.  */
Lisp_Object read_objects;

/* Nonzero means load should forcibly load all dynamic doc strings.  */
static int load_force_doc_strings;

/* Nonzero means read should convert strings to unibyte.  */
static int load_convert_to_unibyte;

/* Nonzero means READCHAR should read bytes one by one (not characters)
   when READCHARFUN is Qget_file_char or Qget_emacs_mule_file_char.
   This is set to 1 by read1 temporarily while handling #@NUMBER.  */
static int load_each_byte;

/* Function to use for loading an Emacs Lisp source file (not
   compiled) instead of readevalloop.  */
Lisp_Object Vload_source_file_function;

/* List of all DEFVAR_BOOL variables.  Used by the byte optimizer.  */
Lisp_Object Vbyte_boolean_vars;

/* Whether or not to add a `read-positions' property to symbols
   read.  */
Lisp_Object Vread_with_symbol_positions;

/* List of (SYMBOL . POSITION) accumulated so far.  */
Lisp_Object Vread_symbol_positions_list;

/* List of descriptors now open for Fload.  */
static Lisp_Object load_descriptor_list;

163
/* File for get_file_char to read from.  Use by load.  */
Jim Blandy's avatar
Jim Blandy committed
164 165 166 167 168
static FILE *instream;

/* When nonzero, read conses in pure space */
static int read_pure;

169
/* For use within read-from-string (this reader is non-reentrant!!)  */
Jim Blandy's avatar
Jim Blandy committed
170
static int read_from_string_index;
171
static int read_from_string_index_byte;
Jim Blandy's avatar
Jim Blandy committed
172
static int read_from_string_limit;
173

174 175 176
/* Number of characters read in the current call to Fread or
   Fread_from_string. */
static int readchar_count;
177

178
/* This contains the last string skipped with #@.  */
179 180 181 182 183 184
static char *saved_doc_string;
/* Length of buffer allocated in saved_doc_string.  */
static int saved_doc_string_size;
/* Length of actual data in saved_doc_string.  */
static int saved_doc_string_length;
/* This is the file position that string came from.  */
185
static file_offset saved_doc_string_position;
186

187 188 189 190 191 192 193 194 195
/* This contains the previous string skipped with #@.
   We copy it from saved_doc_string when a new string
   is put in saved_doc_string.  */
static char *prev_saved_doc_string;
/* Length of buffer allocated in prev_saved_doc_string.  */
static int prev_saved_doc_string_size;
/* Length of actual data in prev_saved_doc_string.  */
static int prev_saved_doc_string_length;
/* This is the file position that string came from.  */
196
static file_offset prev_saved_doc_string_position;
197

198 199 200 201 202
/* Nonzero means inside a new-style backquote
   with no surrounding parentheses.
   Fread initializes this to zero, so we need not specbind it
   or worry about what happens to it when there is an error.  */
static int new_backquote_flag;
203
static Lisp_Object Vold_style_backquotes, Qold_style_backquotes;
204 205 206 207

/* A list of file names for files being loaded in Fload.  Used to
   check for recursive loads.  */

Lute Kamstra's avatar
Lute Kamstra committed
208
static Lisp_Object Vloads_in_progress;
209

/* Non-zero means load dangerous compiled Lisp files.  */

int load_dangerous_libraries;

/* Non-zero means force printing messages when loading Lisp files.  */

int force_load_messages;

/* A regular expression used to detect files compiled with Emacs.  */

static Lisp_Object Vbytecomp_version_regexp;

/* Forward declarations of functions defined later in this file.  */

static int read_emacs_mule_char P_ ((int, int (*) (int, Lisp_Object),
				     Lisp_Object));

static void readevalloop P_ ((Lisp_Object, FILE*, Lisp_Object,
			      Lisp_Object (*) (), int,
			      Lisp_Object, Lisp_Object,
			      Lisp_Object, Lisp_Object));
static Lisp_Object load_unwind P_ ((Lisp_Object));
static Lisp_Object load_descriptor_unwind P_ ((Lisp_Object));

static void invalid_syntax P_ ((const char *, int)) NO_RETURN;
static void end_of_file_error P_ (()) NO_RETURN;
234

Jim Blandy's avatar
Jim Blandy committed
235

/* Functions that read one byte from the current source READCHARFUN
   or unread one byte.  If the integer argument C is -1, the function
   returns one byte read, or -1 when there are no more bytes in the
   source.  If C is 0 or positive, it unreads C, and the return value
   is not interesting.  */

static int readbyte_for_lambda P_ ((int, Lisp_Object));
static int readbyte_from_file P_ ((int, Lisp_Object));
static int readbyte_from_string P_ ((int, Lisp_Object));

/* Handle unreading and rereading of characters.
   Write READCHAR to read a character,
   UNREAD(c) to unread c to be read again.

   These macros correctly read/unread multibyte characters.
   They expect a variable named `readcharfun' to be in scope.  */

#define READCHAR readchar (readcharfun, NULL)
#define UNREAD(c) unreadchar (readcharfun, (c))

/* Same as READCHAR but set *MULTIBYTE to the multibyteness of the source.  */
#define READCHAR_REPORT_MULTIBYTE(multibyte) readchar (readcharfun, (multibyte))

/* When READCHARFUN is Qget_file_char, Qget_emacs_mule_file_char,
   Qlambda, or a cons, we use this to keep an unread character because
   a file stream can't handle multibyte-char unreading.  The value -1
   means that there's no unread character.  */
static int unread_char;

Jim Blandy's avatar
Jim Blandy committed
264
static int
265
readchar (readcharfun, multibyte)
Jim Blandy's avatar
Jim Blandy committed
266
     Lisp_Object readcharfun;
267
     int *multibyte;
Jim Blandy's avatar
Jim Blandy committed
268 269
{
  Lisp_Object tem;
270
  register int c;
Kenichi Handa's avatar
Kenichi Handa committed
271 272 273 274
  int (*readbyte) P_ ((int, Lisp_Object));
  unsigned char buf[MAX_MULTIBYTE_LENGTH];
  int i, len;
  int emacs_mule_encoding = 0;
Jim Blandy's avatar
Jim Blandy committed
275

276 277 278
  if (multibyte)
    *multibyte = 0;

279
  readchar_count++;
280

281
  if (BUFFERP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
282
    {
283
      register struct buffer *inbuffer = XBUFFER (readcharfun);
Jim Blandy's avatar
Jim Blandy committed
284

285
      int pt_byte = BUF_PT_BYTE (inbuffer);
286

287 288
      if (pt_byte >= BUF_ZV_BYTE (inbuffer))
	return -1;
Jim Blandy's avatar
Jim Blandy committed
289

290 291
      if (! NILP (inbuffer->enable_multibyte_characters))
	{
292
	  /* Fetch the character code from the buffer.  */
293 294
	  unsigned char *p = BUF_BYTE_ADDRESS (inbuffer, pt_byte);
	  BUF_INC_POS (inbuffer, pt_byte);
295
	  c = STRING_CHAR (p);
296 297
	  if (multibyte)
	    *multibyte = 1;
298 299 300 301
	}
      else
	{
	  c = BUF_FETCH_BYTE (inbuffer, pt_byte);
Kenichi Handa's avatar
Kenichi Handa committed
302 303
	  if (! ASCII_BYTE_P (c))
	    c = BYTE8_TO_CHAR (c);
304
	  pt_byte++;
305
	}
306
      SET_BUF_PT_BOTH (inbuffer, BUF_PT (inbuffer) + 1, pt_byte);
307

308
      return c;
Jim Blandy's avatar
Jim Blandy committed
309
    }
310
  if (MARKERP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
311
    {
312
      register struct buffer *inbuffer = XMARKER (readcharfun)->buffer;
Jim Blandy's avatar
Jim Blandy committed
313

314
      int bytepos = marker_byte_position (readcharfun);
315

316 317
      if (bytepos >= BUF_ZV_BYTE (inbuffer))
	return -1;
318

319 320
      if (! NILP (inbuffer->enable_multibyte_characters))
	{
321
	  /* Fetch the character code from the buffer.  */
322 323
	  unsigned char *p = BUF_BYTE_ADDRESS (inbuffer, bytepos);
	  BUF_INC_POS (inbuffer, bytepos);
324
	  c = STRING_CHAR (p);
325 326
	  if (multibyte)
	    *multibyte = 1;
327 328 329 330
	}
      else
	{
	  c = BUF_FETCH_BYTE (inbuffer, bytepos);
Kenichi Handa's avatar
Kenichi Handa committed
331 332
	  if (! ASCII_BYTE_P (c))
	    c = BYTE8_TO_CHAR (c);
333
	  bytepos++;
334 335
	}

336 337 338 339
      XMARKER (readcharfun)->bytepos = bytepos;
      XMARKER (readcharfun)->charpos++;

      return c;
Jim Blandy's avatar
Jim Blandy committed
340
    }
341 342

  if (EQ (readcharfun, Qlambda))
Kenichi Handa's avatar
Kenichi Handa committed
343 344 345 346
    {
      readbyte = readbyte_for_lambda;
      goto read_multibyte;
    }
347

Jim Blandy's avatar
Jim Blandy committed
348
  if (EQ (readcharfun, Qget_file_char))
349
    {
Kenichi Handa's avatar
Kenichi Handa committed
350 351
      readbyte = readbyte_from_file;
      goto read_multibyte;
352
    }
Jim Blandy's avatar
Jim Blandy committed
353

354
  if (STRINGP (readcharfun))
Jim Blandy's avatar
Jim Blandy committed
355
    {
356
      if (read_from_string_index >= read_from_string_limit)
Jim Blandy's avatar
Jim Blandy committed
357
	c = -1;
358 359 360 361 362 363 364 365
      else if (STRING_MULTIBYTE (readcharfun))
	{
	  if (multibyte)
	    *multibyte = 1;
	  FETCH_STRING_CHAR_ADVANCE_NO_CHECK (c, readcharfun,
					      read_from_string_index,
					      read_from_string_index_byte);
	}
366
      else
367 368 369 370 371
	{
	  c = SREF (readcharfun, read_from_string_index_byte);
	  read_from_string_index++;
	  read_from_string_index_byte++;
	}
Jim Blandy's avatar
Jim Blandy committed
372 373 374
      return c;
    }

Kenichi Handa's avatar
Kenichi Handa committed
375 376 377 378 379 380 381 382 383 384 385 386
  if (CONSP (readcharfun))
    {
      /* This is the case that read_vector is reading from a unibyte
	 string that contains a byte sequence previously skipped
	 because of #@NUMBER.  The car part of readcharfun is that
	 string, and the cdr part is a value of readcharfun given to
	 read_vector.  */
      readbyte = readbyte_from_string;
      if (EQ (XCDR (readcharfun), Qget_emacs_mule_file_char))
	emacs_mule_encoding = 1;
      goto read_multibyte;
    }
Kenichi Handa's avatar
Kenichi Handa committed
387

Kenichi Handa's avatar
Kenichi Handa committed
388 389 390 391 392 393
  if (EQ (readcharfun, Qget_emacs_mule_file_char))
    {
      readbyte = readbyte_from_file;
      emacs_mule_encoding = 1;
      goto read_multibyte;
    }
Jim Blandy's avatar
Jim Blandy committed
394 395 396

  tem = call0 (readcharfun);

Jim Blandy's avatar
Jim Blandy committed
397
  if (NILP (tem))
Jim Blandy's avatar
Jim Blandy committed
398 399
    return -1;
  return XINT (tem);
Kenichi Handa's avatar
Kenichi Handa committed
400 401 402 403 404 405 406 407 408

 read_multibyte:
  if (unread_char >= 0)
    {
      c = unread_char;
      unread_char = -1;
      return c;
    }
  c = (*readbyte) (-1, readcharfun);
409 410 411 412 413
  if (c < 0 || load_each_byte)
    return c;
  if (multibyte)
    *multibyte = 1;
  if (ASCII_BYTE_P (c))
Kenichi Handa's avatar
Kenichi Handa committed
414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430
    return c;
  if (emacs_mule_encoding)
    return read_emacs_mule_char (c, readbyte, readcharfun);
  i = 0;
  buf[i++] = c;
  len = BYTES_BY_CHAR_HEAD (c);
  while (i < len)
    {
      c = (*readbyte) (-1, readcharfun);
      if (c < 0 || ! TRAILING_CODE_P (c))
	{
	  while (--i > 1)
	    (*readbyte) (buf[i], readcharfun);
	  return BYTE8_TO_CHAR (buf[0]);
	}
      buf[i++] = c;
    }
431
  return STRING_CHAR (buf);
Jim Blandy's avatar
Jim Blandy committed
432 433 434 435 436 437 438 439 440 441
}

/* Unread the character C in the way appropriate for the stream READCHARFUN.
   If the stream is a user function, call it with the char as argument.  */

static void
unreadchar (readcharfun, c)
     Lisp_Object readcharfun;
     int c;
{
442
  readchar_count--;
443 444 445 446
  if (c == -1)
    /* Don't back up the pointer if we're unreading the end-of-input mark,
       since readchar didn't advance it when we read it.  */
    ;
447
  else if (BUFFERP (readcharfun))
448
    {
449 450
      struct buffer *b = XBUFFER (readcharfun);
      int bytepos = BUF_PT_BYTE (b);
451

Kenichi Handa's avatar
Kenichi Handa committed
452 453 454
      BUF_PT (b)--;
      if (! NILP (b->enable_multibyte_characters))
	BUF_DEC_POS (b, bytepos);
455
      else
Kenichi Handa's avatar
Kenichi Handa committed
456
	bytepos--;
457

Kenichi Handa's avatar
Kenichi Handa committed
458
      BUF_PT_BYTE (b) = bytepos;
459
    }
460
  else if (MARKERP (readcharfun))
461
    {
462 463
      struct buffer *b = XMARKER (readcharfun)->buffer;
      int bytepos = XMARKER (readcharfun)->bytepos;
464

Kenichi Handa's avatar
Kenichi Handa committed
465 466 467
      XMARKER (readcharfun)->charpos--;
      if (! NILP (b->enable_multibyte_characters))
	BUF_DEC_POS (b, bytepos);
468
      else
Kenichi Handa's avatar
Kenichi Handa committed
469
	bytepos--;
470

Kenichi Handa's avatar
Kenichi Handa committed
471
      XMARKER (readcharfun)->bytepos = bytepos;
472
    }
473
  else if (STRINGP (readcharfun))
474 475 476 477 478
    {
      read_from_string_index--;
      read_from_string_index_byte
	= string_char_to_byte (readcharfun, read_from_string_index);
    }
Kenichi Handa's avatar
Kenichi Handa committed
479 480 481 482
  else if (CONSP (readcharfun))
    {
      unread_char = c;
    }
483
  else if (EQ (readcharfun, Qlambda))
Kenichi Handa's avatar
Kenichi Handa committed
484 485 486 487 488 489 490
    {
      unread_char = c;
    }
  else if (EQ (readcharfun, Qget_file_char)
	   || EQ (readcharfun, Qget_emacs_mule_file_char))
    {
      if (load_each_byte)
Miles Bader's avatar
Miles Bader committed
491 492 493 494 495
	{
	  BLOCK_INPUT;
	  ungetc (c, instream);
	  UNBLOCK_INPUT;
	}
Kenichi Handa's avatar
Kenichi Handa committed
496 497 498
      else
	unread_char = c;
    }
Jim Blandy's avatar
Jim Blandy committed
499 500 501 502
  else
    call1 (readcharfun, make_number (c));
}

Kenichi Handa's avatar
Kenichi Handa committed
503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518
/* Readbyte function used by readchar when READCHARFUN is Qlambda.
   Following the readbyte convention, C is -1 to read a byte and
   non-negative to unread one.  READCHARFUN itself is not used; the
   work is delegated to read_bytecode_char (defined outside this
   file), which is passed a nonzero flag for an unread request.  */
static int
readbyte_for_lambda (c, readcharfun)
     int c;
     Lisp_Object readcharfun;
{
  return read_bytecode_char (c >= 0);
}


static int
readbyte_from_file (c, readcharfun)
     int c;
     Lisp_Object readcharfun;
{
  if (c >= 0)
    {
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
519
      BLOCK_INPUT;
Kenichi Handa's avatar
Kenichi Handa committed
520
      ungetc (c, instream);
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
521
      UNBLOCK_INPUT;
Kenichi Handa's avatar
Kenichi Handa committed
522 523 524
      return 0;
    }

Miles Bader's avatar
Miles Bader committed
525
  BLOCK_INPUT;
Kenichi Handa's avatar
Kenichi Handa committed
526
  c = getc (instream);
Miles Bader's avatar
Miles Bader committed
527

Kenichi Handa's avatar
Kenichi Handa committed
528
#ifdef EINTR
Miles Bader's avatar
Miles Bader committed
529 530 531
  /* Interrupted reads have been observed while reading over the network */
  while (c == EOF && ferror (instream) && errno == EINTR)
    {
Miles Bader's avatar
Miles Bader committed
532
      UNBLOCK_INPUT;
Miles Bader's avatar
Miles Bader committed
533 534
      QUIT;
      BLOCK_INPUT;
Miles Bader's avatar
Miles Bader committed
535
      clearerr (instream);
Miles Bader's avatar
Miles Bader committed
536
      c = getc (instream);
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
537
    }
Kenichi Handa's avatar
Kenichi Handa committed
538
#endif
Miles Bader's avatar
Miles Bader committed
539

Miles Bader's avatar
Miles Bader committed
540 541
  UNBLOCK_INPUT;

Kenichi Handa's avatar
Kenichi Handa committed
542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557
  return (c == EOF ? -1 : c);
}

static int
readbyte_from_string (c, readcharfun)
     int c;
     Lisp_Object readcharfun;
{
  Lisp_Object string = XCAR (readcharfun);

  if (c >= 0)
    {
      read_from_string_index--;
      read_from_string_index_byte
	= string_char_to_byte (string, read_from_string_index);
    }
Kenichi Handa's avatar
Kenichi Handa committed
558

Kenichi Handa's avatar
Kenichi Handa committed
559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607
  if (read_from_string_index >= read_from_string_limit)
    c = -1;
  else
    FETCH_STRING_CHAR_ADVANCE (c, string,
			       read_from_string_index,
			       read_from_string_index_byte);
  return c;
}


/* Read one non-ASCII character encoded in `emacs-mule' and return
   its character code.  The first byte has already been read and is
   passed in C; the remaining bytes are obtained by calling READBYTE
   on READCHARFUN.

   If C is not a valid emacs-mule leading code, or the sequence is
   cut short by end of input or by a byte below 0xA0, the leading
   byte is returned as a raw 8-bit character and every byte read
   after it is given back to the source.

   Signals Qinvalid_read_syntax if the completed sequence does not
   decode to a character.  */

extern char emacs_mule_bytes[256];

static int
read_emacs_mule_char (c, readbyte, readcharfun)
     int c;
     int (*readbyte) P_ ((int, Lisp_Object));
     Lisp_Object readcharfun;
{
  /* Emacs-mule coding uses at most 4-byte for one character.  */
  unsigned char buf[4];
  int len = emacs_mule_bytes[c];
  struct charset *charset;
  int i;
  unsigned code;

  if (len == 1)
    /* C is not a valid leading-code of `emacs-mule'.  */
    return BYTE8_TO_CHAR (c);

  i = 0;
  buf[i++] = c;
  while (i < len)
    {
      c = (*readbyte) (-1, readcharfun);
      if (c < 0xA0)
	{
	  /* Broken sequence.  Push back the byte that ended it
	     (unless it is the end-of-input mark) and then the bytes
	     consumed after the leading code, most recent first, so
	     that no input is lost.  */
	  if (c >= 0)
	    (*readbyte) (c, readcharfun);
	  while (--i > 0)
	    (*readbyte) (buf[i], readcharfun);
	  return BYTE8_TO_CHAR (buf[0]);
	}
      buf[i++] = c;
    }

  /* Pick the charset and the code point out of the byte sequence;
     the layout depends on its length and on whether it starts with
     a private leading code.  */
  if (len == 2)
    {
      charset = emacs_mule_charset[buf[0]];
      code = buf[1] & 0x7F;
    }
  else if (len == 3)
    {
      if (buf[0] == EMACS_MULE_LEADING_CODE_PRIVATE_11
	  || buf[0] == EMACS_MULE_LEADING_CODE_PRIVATE_12)
	{
	  charset = emacs_mule_charset[buf[1]];
	  code = buf[2] & 0x7F;
	}
      else
	{
	  charset = emacs_mule_charset[buf[0]];
	  code = ((buf[1] << 8) | buf[2]) & 0x7F7F;
	}
    }
  else
    {
      charset = emacs_mule_charset[buf[1]];
      code = ((buf[2] << 8) | buf[3]) & 0x7F7F;
    }
  c = DECODE_CHAR (charset, code);
  if (c < 0)
    Fsignal (Qinvalid_read_syntax,
	     Fcons (build_string ("invalid multibyte form"), Qnil));
  return c;
}


/* Forward declarations for the reader functions defined later in
   this file.  */
static Lisp_Object read_internal_start P_ ((Lisp_Object, Lisp_Object,
					    Lisp_Object));
static Lisp_Object read0 P_ ((Lisp_Object));
static Lisp_Object read1 P_ ((Lisp_Object, int *, int));

static Lisp_Object read_list P_ ((int, Lisp_Object));
static Lisp_Object read_vector P_ ((Lisp_Object, int));

static Lisp_Object substitute_object_recurse P_ ((Lisp_Object, Lisp_Object,
						  Lisp_Object));
static void substitute_object_in_subtree P_ ((Lisp_Object,
					      Lisp_Object));
static void substitute_in_interval P_ ((INTERVAL, Lisp_Object));
651

Jim Blandy's avatar
Jim Blandy committed
652

653
/* Get a character from the tty.  */
Jim Blandy's avatar
Jim Blandy committed
654

655 656 657 658 659 660 661 662 663 664 665 666 667
/* Read input events until we get one that's acceptable for our purposes.

   If NO_SWITCH_FRAME is non-zero, switch-frame events are stashed
   until we get a character we like, and then stuffed into
   unread_switch_frame.

   If ASCII_REQUIRED is non-zero, we check function key events to see
   if the unmodified version of the symbol has a Qascii_character
   property, and use that character, if present.

   If ERROR_NONASCII is non-zero, we signal an error if the input we
   get isn't an ASCII character with modifiers.  If it's zero but
   ASCII_REQUIRED is non-zero, we just re-read until we get an ASCII
668 669 670
   character.

   If INPUT_METHOD is nonzero, we invoke the current input method
671 672 673 674
   if the character warrants that.

   If SECONDS is a number, we wait that many seconds for input, and
   return Qnil if no input arrives within that time.  */
675

676
Lisp_Object
677
read_filtered_event (no_switch_frame, ascii_required, error_nonascii,
678
		     input_method, seconds)
679
     int no_switch_frame, ascii_required, error_nonascii, input_method;
680
     Lisp_Object seconds;
681
{
682
  Lisp_Object val, delayed_switch_frame;
683
  EMACS_TIME end_time;
684

685
#ifdef HAVE_WINDOW_SYSTEM
686 687
  if (display_hourglass_p)
    cancel_hourglass ();
688
#endif
689

690
  delayed_switch_frame = Qnil;
691

692 693 694 695 696
  /* Compute timeout.  */
  if (NUMBERP (seconds))
    {
      EMACS_TIME wait_time;
      int sec, usec;
697
      double duration = extract_float (seconds);
698 699 700 701 702 703 704 705

      sec  = (int) duration;
      usec = (duration - sec) * 1000000;
      EMACS_GET_TIME (end_time);
      EMACS_SET_SECS_USECS (wait_time, sec, usec);
      EMACS_ADD_TIME (end_time, end_time, wait_time);
    }

Karoly Lorentey's avatar
Karoly Lorentey committed
706
/* Read until we get an acceptable event.  */
707
 retry:
708
  do
Karoly Lorentey's avatar
Karoly Lorentey committed
709 710
    val = read_char (0, 0, 0, (input_method ? Qnil : Qt), 0,
		     NUMBERP (seconds) ? &end_time : NULL);
711
  while (INTEGERP (val) && XINT (val) == -2); /* wrong_kboard_jmpbuf */
712

713
  if (BUFFERP (val))
714 715
    goto retry;

716
  /* switch-frame events are put off until after the next ASCII
Karl Heuer's avatar
Karl Heuer committed
717
     character.  This is better than signaling an error just because
718 719 720 721 722
     the last characters were typed to a separate minibuffer frame,
     for example.  Eventually, some code which can deal with
     switch-frame events will read it and process it.  */
  if (no_switch_frame
      && EVENT_HAS_PARAMETERS (val)
723
      && EQ (EVENT_HEAD_KIND (EVENT_HEAD (val)), Qswitch_frame))
724 725 726 727 728
    {
      delayed_switch_frame = val;
      goto retry;
    }

729
  if (ascii_required && !(NUMBERP (seconds) && NILP (val)))
730 731
    {
      /* Convert certain symbols to their ASCII equivalents.  */
732
      if (SYMBOLP (val))
733
	{
734
	  Lisp_Object tem, tem1;
735 736 737 738 739 740 741
	  tem = Fget (val, Qevent_symbol_element_mask);
	  if (!NILP (tem))
	    {
	      tem1 = Fget (Fcar (tem), Qascii_character);
	      /* Merge this symbol's modifier bits
		 with the ASCII equivalent of its basic code.  */
	      if (!NILP (tem1))
742
		XSETFASTINT (val, XINT (tem1) | XINT (Fcar (Fcdr (tem))));
743 744
	    }
	}
745

746
      /* If we don't have a character now, deal with it appropriately.  */
747
      if (!INTEGERP (val))
748 749 750
	{
	  if (error_nonascii)
	    {
751
	      Vunread_command_events = Fcons (val, Qnil);
752 753 754 755 756 757 758 759 760 761
	      error ("Non-character input-event");
	    }
	  else
	    goto retry;
	}
    }

  if (! NILP (delayed_switch_frame))
    unread_switch_frame = delayed_switch_frame;

762 763
#if 0

764
#ifdef HAVE_WINDOW_SYSTEM
765 766
  if (display_hourglass_p)
    start_hourglass ();
767
#endif
768 769 770

#endif

771 772 773
  return val;
}

774
DEFUN ("read-char", Fread_char, Sread_char, 0, 3, 0,
775 776
       doc: /* Read a character from the command input (keyboard or macro).
It is returned as a number.
777 778 779
If the character has modifiers, they are resolved and reflected to the
character code if possible (e.g. C-SPC -> 0).

780 781
If the user generates an event which is not a character (i.e. a mouse
click or function key event), `read-char' signals an error.  As an
782 783
exception, switch-frame events are put off until non-character events
can be read.
784 785 786 787 788 789
If you want to read non-character events, or ignore them, call
`read-event' or `read-char-exclusive' instead.

If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
790 791 792 793 794 795 796
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
     (prompt, inherit_input_method, seconds)
     Lisp_Object prompt, inherit_input_method, seconds;
Jim Blandy's avatar
Jim Blandy committed
797
{
798 799
  Lisp_Object val;

800 801
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
802
  val = read_filtered_event (1, 1, 1, ! NILP (inherit_input_method), seconds);
803 804 805

  return (NILP (val) ? Qnil
	  : make_number (char_resolve_modifier_mask (XINT (val))));
Jim Blandy's avatar
Jim Blandy committed
806 807
}

808
DEFUN ("read-event", Fread_event, Sread_event, 0, 3, 0,
809 810 811 812
       doc: /* Read an event object from the input stream.
If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
813 814 815 816 817 818 819
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
     (prompt, inherit_input_method, seconds)
     Lisp_Object prompt, inherit_input_method, seconds;
Jim Blandy's avatar
Jim Blandy committed
820
{
821 822
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
823
  return read_filtered_event (0, 0, 0, ! NILP (inherit_input_method), seconds);
Jim Blandy's avatar
Jim Blandy committed
824 825
}

826
DEFUN ("read-char-exclusive", Fread_char_exclusive, Sread_char_exclusive, 0, 3, 0,
827 828
       doc: /* Read a character from the command input (keyboard or macro).
It is returned as a number.  Non-character events are ignored.
829 830
If the character has modifiers, they are resolved and reflected to the
character code if possible (e.g. C-SPC -> 0).
831 832 833 834

If the optional argument PROMPT is non-nil, display that as a prompt.
If the optional argument INHERIT-INPUT-METHOD is non-nil and some
input method is turned on in the current buffer, that input method
835 836 837 838 839 840 841
is used for reading a character.
If the optional argument SECONDS is non-nil, it should be a number
specifying the maximum number of seconds to wait for input.  If no
input arrives in that time, return nil.  SECONDS may be a
floating-point value.  */)
     (prompt, inherit_input_method, seconds)
     Lisp_Object prompt, inherit_input_method, seconds;
Jim Blandy's avatar
Jim Blandy committed
842
{
843 844
  Lisp_Object val;

845 846
  if (! NILP (prompt))
    message_with_string ("%s", prompt, 0);
847

848
  val = read_filtered_event (1, 1, 0, ! NILP (inherit_input_method), seconds);
849 850 851

  return (NILP (val) ? Qnil
	  : make_number (char_resolve_modifier_mask (XINT (val))));
Jim Blandy's avatar
Jim Blandy committed
852 853 854
}

DEFUN ("get-file-char", Fget_file_char, Sget_file_char, 0, 0, 0,
855 856
       doc: /* Don't use this yourself.  */)
     ()
Jim Blandy's avatar
Jim Blandy committed
857 858
{
  register Lisp_Object val;
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
859
  BLOCK_INPUT;
860
  XSETINT (val, getc (instream));
YAMAMOTO Mitsuharu's avatar
YAMAMOTO Mitsuharu committed
861
  UNBLOCK_INPUT;
Jim Blandy's avatar
Jim Blandy committed
862 863
  return val;
}
864 865


866

Kenichi Handa's avatar
Kenichi Handa committed
867
/* Value is a version number of byte compiled code if the file
Miles Bader's avatar
Miles Bader committed
868
   associated with file descriptor FD is a compiled Lisp file that's
Kenichi Handa's avatar
Kenichi Handa committed
869 870 871
   safe to load.  Only files compiled with Emacs are safe to load.
   Files compiled with XEmacs can lead to a crash in Fbyte_code
   because of an incompatible change in the byte compiler.  */
872 873 874 875 876 877 878 879

static int
safe_to_load_p (fd)
     int fd;
{
  char buf[512];
  int nbytes, i;
  int safe_p = 1;
Kenichi Handa's avatar
Kenichi Handa committed
880
  int version = 1;
881 882 883 884 885 886 887 888 889

  /* Read the first few bytes from the file, and look for a line
     specifying the byte compiler version used.  */
  nbytes = emacs_read (fd, buf, sizeof buf - 1);
  if (nbytes > 0)
    {
      buf[nbytes] = '\0';

      /* Skip to the next newline, skipping over the initial `ELC'
Dave Love's avatar
Dave Love committed
890
	 with NUL bytes following it, but note the version.  */
891
      for (i = 0; i < nbytes && buf[i] != '\n'; ++i)
Dave Love's avatar
Dave Love committed
892
	if (i == 4)
Kenichi Handa's avatar
Kenichi Handa committed
893
	  version = buf[i];
894

895 896
      if (i == nbytes
	  || fast_c_string_match_ignore_case (Vbytecomp_version_regexp,
897 898 899
					      buf + i) < 0)
	safe_p = 0;
    }
Dave Love's avatar
Dave Love committed
900 901
  if (safe_p)
    safe_p = version;
902 903 904 905 906 907

  lseek (fd, 0, SEEK_SET);
  return safe_p;
}


908 909 910 911 912 913 914 915 916 917
/* Unwind callback for record_unwind_protect.  Store OLD, the saved
   load list, back into Vloads_in_progress, and return OLD.  */

static Lisp_Object
record_load_unwind (old)
     Lisp_Object old;
{
  Vloads_in_progress = old;
  return old;
}

918 919 920 921 922 923 924 925
/* This handler function is used via internal_condition_case_1.
   DATA, the argument supplied to the handler, is ignored; the
   handler simply yields Qnil, which Fload treats as "give up
   quietly" when it wraps Fsubstitute_in_file_name for a non-nil
   NOERROR.  */

static Lisp_Object
load_error_handler (data)
     Lisp_Object data;
{
  return Qnil;
}
926

927 928 929 930 931 932
/* If Vold_style_backquotes is non-nil, display a message saying that
   old-style backquotes were detected while loading FILE.  FILE is
   substituted for the `%s' in the message.  Always returns Qnil.  */

static Lisp_Object
load_warn_old_style_backquotes (file)
     Lisp_Object file;
{
  Lisp_Object args[2];

  /* Nothing was flagged, so there is nothing to report.  */
  if (NILP (Vold_style_backquotes))
    return Qnil;

  args[0] = build_string ("Loading `%s': old-style backquotes detected!");
  args[1] = file;
  Fmessage (2, args);

  return Qnil;
}

941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962
DEFUN ("get-load-suffixes", Fget_load_suffixes, Sget_load_suffixes, 0, 0, 0,
       doc: /* Return the suffixes that `load' should try if a suffix is \
required.
This uses the variables `load-suffixes' and `load-file-rep-suffixes'.  */)
     ()
{
  Lisp_Object result = Qnil;
  Lisp_Object suffix_tail, rep_tail;

  /* For each element of Vload_suffixes, in order, append every
     element of Vload_file_rep_suffixes to it, in order.  */
  for (suffix_tail = Vload_suffixes;
       CONSP (suffix_tail);
       suffix_tail = XCDR (suffix_tail))
    {
      Lisp_Object suffix = XCAR (suffix_tail);

      for (rep_tail = Vload_file_rep_suffixes;
	   CONSP (rep_tail);
	   rep_tail = XCDR (rep_tail))
	result = Fcons (concat2 (suffix, XCAR (rep_tail)), result);
    }

  /* Entries were pushed onto the front, so the list is backwards;
     reverse it in place to restore the order of generation.  */
  return Fnreverse (result);
}

963
DEFUN ("load", Fload, Sload, 1, 5, 0,
964 965
       doc: /* Execute a file of Lisp code named FILE.
First try FILE with `.elc' appended, then try with `.el',
966
then try FILE unmodified (the exact suffixes in the exact order are
967
determined by `load-suffixes').  Environment variable references in
968
FILE are replaced with their values by calling `substitute-in-file-name'.
969
This function searches the directories in `load-path'.
970

971
If optional second arg NOERROR is non-nil,
972
report no error if FILE doesn't exist.
973
Print messages at start and end of loading unless
974 975
optional third arg NOMESSAGE is non-nil (but `force-load-messages'
overrides that).
976
If optional fourth arg NOSUFFIX is non-nil, don't try adding
977
suffixes `.elc' or `.el' to the specified name FILE.
978
If optional fifth arg MUST-SUFFIX is non-nil, insist on
979 980 981 982 983 984 985 986 987 988 989 990 991 992 993
the suffix `.elc' or `.el'; don't accept just FILE unless
it ends in one of those suffixes or includes a directory name.

If this function fails to find a file, it may look for different
representations of that file before trying another file.
It does so by adding the non-empty suffixes in `load-file-rep-suffixes'
to the file name.  Emacs uses this feature mainly to find compressed
versions of files when Auto Compression mode is enabled.

The exact suffixes that this function tries out, in the exact order,
are given by the value of the variable `load-file-rep-suffixes' if
NOSUFFIX is non-nil and by the return value of the function
`get-load-suffixes' if MUST-SUFFIX is non-nil.  If both NOSUFFIX and
MUST-SUFFIX are nil, this function first tries out the latter suffixes
and then the former.
994 995 996 997 998

Loading a file records its definitions, and its `provide' and
`require' calls, in an element of `load-history' whose
car is the file name loaded.  See `load-history'.

999
Return t if the file exists and loads successfully.  */)
1000
     (file, noerror, nomessage, nosuffix, must_suffix)
1001
     Lisp_Object file, noerror, nomessage, nosuffix, must_suffix;
Jim Blandy's avatar
Jim Blandy committed
1002 1003 1004
{
  register FILE *stream;
  register int fd = -1;
Juanma Barranquero's avatar
Juanma Barranquero committed
1005
  int count = SPECPDL_INDEX ();
1006 1007
  struct gcpro gcpro1, gcpro2, gcpro3;
  Lisp_Object found, efound, hist_file_name;
1008 1009 1010 1011
  /* 1 means we printed the ".el is newer" message.  */
  int newer = 0;
  /* 1 means we are loading a compiled file.  */
  int compiled = 0;
1012
  Lisp_Object handler;
1013
  int safe_p = 1;
1014
  char *fmode = "r";
1015
  Lisp_Object tmp[2];
Kenichi Handa's avatar
Kenichi Handa committed
1016 1017
  int version;

1018
#ifdef DOS_NT
1019
  fmode = "rt";
1020
#endif /* DOS_NT */
Jim Blandy's avatar
Jim Blandy committed
1021

1022
  CHECK_STRING (file);
Jim Blandy's avatar
Jim Blandy committed
1023

1024
  /* If file name is magic, call the handler.  */
1025 1026 1027 1028
  /* This shouldn't be necessary any more now that `openp' handles it right.
    handler = Ffind_file_name_handler (file, Qload);
    if (!NILP (handler))
      return call5 (handler, Qload, file, noerror, nomessage, nosuffix); */
1029

1030 1031
  /* Do this after the handler to avoid
     the need to gcpro noerror, nomessage and nosuffix.
1032 1033
     (Below here, we care only whether they are nil or not.)
     The presence of this call is the result of a historical accident:
1034
     it used to be in every file-operation and when it got removed
1035 1036 1037
     everywhere, it accidentally stayed here.  Since then, enough people
     supposedly have things like (load "$PROJECT/foo.el") in their .emacs
     that it seemed risky to remove.  */
1038 1039 1040 1041 1042 1043 1044 1045 1046
  if (! NILP (noerror))
    {
      file = internal_condition_case_1 (Fsubstitute_in_file_name, file,
					Qt, load_error_handler);
      if (NILP (file))
	return Qnil;
    }
  else
    file = Fsubstitute_in_file_name (file);
1047

1048

Jim Blandy's avatar
Jim Blandy committed
1049 1050
  /* Avoid weird lossage with null string as arg,
     since it would try to load a directory as a Lisp file */
1051
  if (SCHARS (file) > 0)
Jim Blandy's avatar
Jim Blandy committed
1052
    {
1053
      int size = SBYTES (file);
1054

1055 1056
      found = Qnil;
      GCPRO2 (file, found);
1057 1058 1059 1060 1061

      if (! NILP (must_suffix))
	{
	  /* Don't insist on adding a suffix if FILE already ends with one.  */
	  if (size > 3
1062
	      && !strcmp (SDATA (file) + size - 3, ".el"))
1063 1064
	    must_suffix = Qnil;
	  else if (size > 4
1065
		   && !strcmp (SDATA (file) + size - 4, ".elc"))
1066 1067 1068 1069 1070 1071 1072
	    must_suffix = Qnil;
	  /* Don't insist on adding a suffix
	     if the argument includes a directory name.  */
	  else if (! NILP (Ffile_name_directory (file)))
	    must_suffix = Qnil;
	}

1073
      fd = openp (Vload_path, file,
1074
		  (!NILP (nosuffix) ? Qnil
1075 1076 1077
		   : !NILP (must_suffix) ? Fget_load_suffixes ()
		   : Fappend (2, (tmp[0] = Fget_load_suffixes (),
				  tmp[1] = Vload_file_rep_suffixes,
1078
				  tmp))),
1079
		  &found, Qnil);
1080
      UNGCPRO;
Jim Blandy's avatar
Jim Blandy committed
1081 1082
    }

1083
  if (fd == -1)
Jim Blandy's avatar
Jim Blandy committed
1084
    {
Jim Blandy's avatar
Jim Blandy committed
1085
      if (NILP (noerror))
1086 1087
	xsignal2 (Qfile_error, build_string ("Cannot open load file"), file);
      return Qnil;
Jim Blandy's avatar
Jim Blandy committed
1088 1089
    }

1090
  /* Tell startup.el whether or not we found the user's init file.  */
Karl Heuer's avatar
Karl Heuer committed
1091 1092 1093
  if (EQ (Qt, Vuser_init_file))
    Vuser_init_file = found;

1094 1095
  /* If FD is -2, that means openp found a magic file.  */
  if (fd == -2)
1096
    {
1097 1098 1099 1100 1101 1102 1103 1104 1105
      if (NILP (Fequal (found, file)))
	/* If FOUND is a different file name from FILE,
	   find its handler even if we have already inhibited
	   the `load' operation on FILE.  */
	handler = Ffind_file_name_handler (found, Qt);
      else
	handler = Ffind_file_name_handler (found, Qload);
      if (! NILP (handler))
	return call5 (handler, Qload, found, noerror, nomessage, Qt);
1106 1107
    }

1108 1109 1110 1111 1112
  /* Check if we're stuck in a recursive load cycle.

     2000-09-21: It's not possible to just check for the file loaded
     being a member of Vloads_in_progress.  This fails because of the
     way the byte compiler currently works; `provide's are not
Juanma Barranquero's avatar
Juanma Barranquero committed
1113
     evaluated, see font-lock.el/jit-lock.el as an example.  This
1114 1115 1116 1117
     leads to a certain amount of ``normal'' recursion.