summaryrefslogtreecommitdiff
path: root/rsc/source/rscpp/cpp2.c
blob: 2108f099d83dd0dcb00d5df44cdb98fd836e0a15 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
/*
 * This file is part of the LibreOffice project.
 *
 * This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this
 * file, You can obtain one at http://mozilla.org/MPL/2.0/.
 *
 * This file incorporates work covered by the following license notice:
 *
 *   Licensed to the Apache Software Foundation (ASF) under one or more
 *   contributor license agreements. See the NOTICE file distributed
 *   with this work for additional information regarding copyright
 *   ownership. The ASF licenses this file to you under the Apache
 *   License, Version 2.0 (the "License"); you may not use this file
 *   except in compliance with the License. You may obtain a copy of
 *   the License at http://www.apache.org/licenses/LICENSE-2.0 .
 */

#include <stdio.h>
#include <ctype.h>
#include "cppdef.h"
#include "cpp.h"

/*
 * Generate (by hand-inspection) a set of unique values for each control
 * operator.  Note that this is not guaranteed to work for non-Ascii
 * machines.  CPP won't compile if there are hash conflicts.
 */

#define L_assert        ('a' + ('s' << 1))
#define L_define        ('d' + ('f' << 1))
#define L_elif          ('e' + ('i' << 1))
#define L_else          ('e' + ('s' << 1))
#define L_endif         ('e' + ('d' << 1))
#define L_if            ('i' + (EOS << 1))
#define L_ifdef         ('i' + ('d' << 1))
#define L_ifndef        ('i' + ('n' << 1))
#define L_include       ('i' + ('c' << 1))
#define L_line          ('l' + ('n' << 1))
#define L_nogood        (EOS + (EOS << 1))      /* To catch #i          */
#define L_pragma        ('p' + ('a' << 1))
#define L_undef         ('u' + ('d' << 1))
#define L_error         ('e' + ('r' << 1))      /* BP 5.3.92, #error */
#if OSL_DEBUG_LEVEL > 1
#define L_debug         ('d' + ('b' << 1))      /* #debug               */
#define L_nodebug       ('n' + ('d' << 1))      /* #nodebug             */
#endif


/*
 * Process #control lines.  Simple commands are processed inline,
 * while complex commands have their own subroutines.
 *
 * The counter is used to force out a newline before #line and
 * #pragma commands.  This prevents these commands from ending up at
 * the end of the previous line if cpp is invoked with the -C option.
 *
 * Returns counter + 1 on every path; counter is first decremented when
 * a newline has been forced out ahead of a #line or #pragma.
 *
 * Several error labels (dump_line, else_seen_err, if_nest_err, nest_err)
 * live inside the switch statements below and are reached by goto from
 * other cases, so the order of the statements matters.
 */
int control(int counter)
{
    int c;
    char* tp;
    int hash;
    char* ep;

    c = skipws();
    if (c == '\n' || c == EOF_CHAR)     /* Empty "#" line: nothing to do */
        return counter + 1;
    if (!isdigit(c))
        scanid(c);                  /* Get #word to token[]         */
    else
    {
        unget();                    /* Hack -- allow #123 as a      */
        strcpy(token, "line");      /* synonym for #line 123        */
    }
    /*
     * Hash on the first and third characters (see the L_* macros).
     * One-character words have no third character and are rejected.
     */
    hash = (token[1] == EOS) ? L_nogood : (token[0] + (token[2] << 1));
    switch (hash)
    {
    case L_assert:  tp = "assert";          break;
    case L_define:  tp = "define";          break;
    case L_elif:    tp = "elif";            break;
    case L_else:    tp = "else";            break;
    case L_endif:   tp = "endif";           break;
    case L_if:      tp = "if";              break;
    case L_ifdef:   tp = "ifdef";           break;
    case L_ifndef:  tp = "ifndef";          break;
    case L_include: tp = "include";         break;
    case L_line:    tp = "line";            break;
    case L_pragma:  tp = "pragma";          break;
    case L_undef:   tp = "undef";           break;
    case L_error:   tp = "error";           break;
#if OSL_DEBUG_LEVEL > 1
    case L_debug:   tp = "debug";           break;
    case L_nodebug: tp = "nodebug";         break;
#endif
    default:        hash = L_nogood;
        /*fall-through*/
    case L_nogood:  tp = "";                break;
    }
    /*
     * The hash only looks at two characters, so confirm that the
     * whole word really is the keyword it hashed to.
     */
    if (!streq(tp, token))
        hash = L_nogood;
    /*
     * hash is set to a unique value corresponding to the
     * control keyword (or L_nogood if we think it's nonsense).
     */
    if (infile->fp == NULL)
        cwarn("Control line \"%s\" within macro expansion", token);
    if (!compiling)
    {                       /* Not compiling now    */
        /*
         * Keywords not listed here (#else, #elif, #endif and unknown
         * words) leave this switch and are handled by the main switch.
         */
        switch (hash)
        {
        case L_if:                          /* These can't turn     */
        case L_ifdef:                       /*  compilation on, but */
        case L_ifndef:                      /*   we must nest #if's */
            if (++ifptr >= &ifstack[BLK_NEST])
                goto if_nest_err;
            *ifptr = 0;                     /* !WAS_COMPILING       */
            /*fall-through*/
        case L_line:                        /* Many                 */
            /*
             * Are pragma's always processed?
             */
        case L_pragma:                      /*  options             */
        case L_include:                     /*   are uninteresting  */
        case L_define:                      /*    if we             */
        case L_undef:                       /*     aren't           */
        case L_assert:                      /*      compiling.      */
        case L_error:                       /* BP 5.3.92, #error */
        dump_line:      skipnl();                       /* Ignore rest of line  */
            return counter + 1;
        }
    }
    /*
     * Make sure that #line and #pragma are output on a fresh line.
     */
    if (counter > 0 && (hash == L_line || hash == L_pragma))
    {
        PUTCHAR('\n');
        counter--;
    }

    switch (hash)
    {
    case L_line:
        /*
         * Parse the line to update the line number and "progname"
         * field and line number for the next input line.
         * Set wrongline to force it out later.
         */
        c = skipws();
        workp = work;                       /* Save name in work    */
        while (c != '\n' && c != EOF_CHAR)
        {
            save(c);
            c = get();
        }
        unget();
        save(EOS);
        /*
         * Split #line argument into <line-number> and <name>
         * We subtract 1 as we want the number of the next line.
         */
        line = atoi(work) - 1;              /* Reset line number    */
        /*
         * Skip over digits and blanks.  The characters are converted
         * to unsigned char first: a plain char with the high bit set
         * may be negative, which is undefined for isdigit() and would
         * index in front of the type[] table.
         */
        for (tp = work;
             isdigit((unsigned char)*tp) || type[(unsigned char)*tp] == SPA;
             tp++)
            ;
        if (*tp != EOS)                     /* Got a filename, so:  */
        {
            if (*tp == '"' && (ep = strrchr(tp + 1, '"')) != NULL)
            {
                tp++;                       /* Skip over left quote */
                *ep = EOS;                  /* And ignore right one */
            }
            if (infile->progname != NULL)   /* Give up the old name */
                free(infile->progname);     /* if it's allocated.   */
            infile->progname = savestring(tp);
        }
        wrongline = TRUE;                   /* Force output later   */
        break;

    case L_include:
        doinclude();
        break;

    case L_define:
        dodefine();
        break;

    case L_undef:
        doundef();
        break;

    case L_else:
        if (ifptr == &ifstack[0])
            goto nest_err;
        else if ((*ifptr & ELSE_SEEN) != 0)
            goto else_seen_err;
        *ifptr |= ELSE_SEEN;
        /*
         * Only an #if that was opened while compiling can switch
         * compilation; the #else branch compiles when no earlier
         * branch of this #if has been taken.
         */
        if ((*ifptr & WAS_COMPILING) != 0)
        {
            if (compiling || (*ifptr & TRUE_SEEN) != 0)
                compiling = FALSE;
            else
            {
                compiling = TRUE;
            }
        }
        break;

    case L_elif:
        if (ifptr == &ifstack[0])
            goto nest_err;
        else if ((*ifptr & ELSE_SEEN) != 0)
        {
          else_seen_err:  cerror("#%s may not follow #else", token);
            goto dump_line;
        }
        /*
         * Evaluate the expression only if the enclosing #if was opened
         * while compiling and no branch of it has been taken yet.
         */
        if ((*ifptr & (WAS_COMPILING | TRUE_SEEN)) != WAS_COMPILING)
        {
            compiling = FALSE;              /* Done compiling stuff */
            goto dump_line;                 /* Skip this clause     */
        }
        doif(L_if);
        break;

    case L_if:
    case L_ifdef:
    case L_ifndef:
        if (++ifptr >= &ifstack[BLK_NEST])
          if_nest_err:    cfatal("Too many nested #%s statements", token);
        *ifptr = WAS_COMPILING;
        doif(hash);
        break;

    case L_endif:
        if (ifptr == &ifstack[0])
        {
          nest_err:       cerror("#%s must be in an #if", token);
            goto dump_line;
        }
        /* Leaving a skipped region: request a fresh line marker.   */
        if (!compiling && (*ifptr & WAS_COMPILING) != 0)
            wrongline = TRUE;
        compiling = ((*ifptr & WAS_COMPILING) != 0);
        --ifptr;
        break;

    case L_assert:
        if (eval() == 0)
            cerror("Preprocessor assertion failure", NULLST);
        break;

    case L_pragma:
        /*
         * #pragma is provided to pass "options" to later
         * passes of the compiler.  cpp doesn't have any yet.
         */
        fprintf( pCppOut, "#pragma ");
        while ((c = get()) != '\n' && c != EOF_CHAR)
            cput(c);
        unget();
        break;

#if OSL_DEBUG_LEVEL > 1
    case L_debug:
        if (debug == 0)
            dumpdef("debug set on");
        debug++;
        break;

    case L_nodebug:
        debug--;
        break;
#endif
    case L_error:                       /* BP 5.3.92, #error */
        /* Echo the message to the output and terminate the run.    */
        fprintf( pCppOut, "cpp: line %d, Error directive: ", line );
        while ((c = get()) != '\n' && c != EOF_CHAR)
            cput(c);
        fprintf( pCppOut, "\n" );
        exit( 1 );

    default:
        /*
         * Undefined #control keyword.
         * Note: the correct behavior may be to warn and
         * pass the line to a subsequent compiler pass.
         * This would allow #asm or similar extensions.
         */
        cerror("Illegal # command \"%s\"", token);
        break;
    }
    /*
     * Everything except #include must now be at end of line;
     * complain about and discard any trailing text.
     */
    if (hash != L_include)
    {
        if (skipws() != '\n')
        {
            cwarn("Unexpected text in #control line ignored", NULLST);
            skipnl();
        }
    }
    return counter + 1;
}

/*
 * Handle the condition of an #if, #ifdef, or #ifndef line.  #ifdef and
 * #ifndef only need a symbol table lookup; #if hands its expression to
 * eval().
 *
 * hash is one of L_if, L_ifdef or L_ifndef.  On success, compiling is
 * set according to the outcome and TRUE_SEEN is recorded in *ifptr when
 * the branch is taken.  A missing or malformed argument is reported and
 * the rest of the line is skipped.
 *
 * doif() is called only if compiling is TRUE.  If false, compilation
 * is always suppressed, so we don't need to evaluate anything.  This
 * suppresses unnecessary warnings.
 */
FILE_LOCAL void doif(int hash)
{
    int c;
    int satisfied;                  /* Non-zero if branch is taken  */

    c = skipws();
    if (c == '\n' || c == EOF_CHAR)
    {
        unget();                    /* Nothing follows the keyword  */
    }
    else if (hash == L_if || type[c] == LET)
    {
        if (hash == L_if)
        {
            unget();                /* Expression starts with c     */
            satisfied = (eval() != 0);
        }
        else
        {
            /* #ifdef wants the name defined, #ifndef wants it not. */
            satisfied = ((lookid(c) != NULL) == (hash == L_ifdef));
        }
        if (satisfied)
        {
            compiling = TRUE;
            *ifptr |= TRUE_SEEN;
        }
        else
        {
            compiling = FALSE;
        }
        return;
    }

    /* No argument, or #ifdef/#ifndef not followed by a letter.     */
    cerror("#if, #ifdef, or #ifndef without an argument", NULLST);
    skipnl();                               /* Prevent an extra     */
    unget();                                /* Error message        */
}

/*
 * Process the #include control line.
 * There are three variations:
 *      #include "file"         search somewhere relative to the
 *                              current source file, if not found,
 *                              treat as #include <file>.
 *      #include <file>         Search in an implementation-dependent
 *                              list of places.
 *      #include token          Expand the token, it must be one of
 *                              "file" or <file>, process as such.
 *
 * Note: the November 12 draft forbids '>' in the #include <file> format.
 * This restriction is unnecessary and not implemented.
 */
FILE_LOCAL void doinclude()
{
    int c;
    int delim;

    delim = macroid(skipws());
    if (delim != '<' && delim != '"')
        goto incerr;
    if (delim == '<')
        delim = '>';
    workp = work;
    instring = TRUE;                /* Accept all characters        */
#ifdef CONTROL_COMMENTS_NOT_ALLOWED
    while ((c = get()) != '\n' && c != EOF_CHAR)
        save(c);                    /* Put it away.                 */
    unget();                        /* Force nl after include      */
    /*
     * The draft is unclear if the following should be done.
     */
    while (--workp >= work && *workp == ' ')
        ;                           /* Trim blanks from filename    */
    if (*workp != delim)
        goto incerr;
#else
    while ((c = get()) != delim && c != EOF_CHAR)
        save(c);
#endif
    *workp = EOS;                   /* Terminate filename           */
    instring = FALSE;
    if (openinclude(work, (delim == '"')))
        return;
    /*
     * No sense continuing if #include file isn't there.
     */
    cfatal("Cannot open include file \"%s\"", work);

  incerr: cerror("#include syntax error", NULLST);
    return;
}

/*
 * Actually open an include file.  This routine is only called from
 * doinclude() above, but was written as a separate subroutine for
 * programmer convenience.  It searches the list of directories
 * and actually opens the file, linking it into the list of
 * active files.
 *
 *  filename     name taken from the #include line
 *  searchlocal  non-zero to try the directory of the current source
 *               file (or the name as given) before the include list
 *
 * Returns TRUE if the file was opened, FALSE if openinclude() fails.
 * No error message is printed for a file that is merely not found;
 * a name too long for the work buffer is reported through cfatal().
 */
FILE_LOCAL int openinclude(char* filename, int searchlocal)
{
    char** incptr;
    char tmpname[NFWORK]; /* Filename work area   */

    if (searchlocal)
    {
        /*
         * Look in local directory first
         */
        size_t dirlen = 0;          /* Length of directory prefix   */
        size_t namelen = strlen(filename);

#if HOST == SYS_UNIX
        /*
         * Try to open filename relative to the directory of the current
         * source file (as opposed to the current directory). (ARF, SCK).
         */
        if (filename[0] != '/' &&
            hasdirectory(infile->filename, tmpname, NFWORK))
        {
            dirlen = strlen(tmpname);
        }
#else
        if (!hasdirectory(filename, tmpname, NFWORK) &&
            hasdirectory(infile->filename, tmpname, NFWORK))
        {
            dirlen = strlen(tmpname);
        }
#endif
        /*
         * Append the name to the prefix (or overwrite tmpname when
         * there is no prefix), but only if name and terminator fit.
         * This check is applied on every host.
         */
        if (dirlen + namelen < (size_t)NFWORK)
        {
            memcpy(tmpname + dirlen, filename, namelen);
            tmpname[dirlen + namelen] = 0;
            if (openfile(tmpname))
                return TRUE;
        }
        else
        {
            cfatal("Filename work buffer overflow", NULLST);
        }
    }
    /*
     * Look in any directories specified by -I command line
     * arguments, then in the builtin search list.
     */
    for (incptr = incdir; incptr < incend; incptr++)
    {
        /* Leave room for the separator and the terminator.         */
        if (strlen(*incptr) + strlen(filename) >= (NFWORK - 1))
            cfatal("Filename work buffer overflow", NULLST);
        else
        {
#if HOST == SYS_UNIX
            if (filename[0] == '/')
                strcpy(tmpname, filename);
            else
                sprintf(tmpname, "%s/%s", *incptr, filename);

#elif HOST == SYS_UNKNOWN
            if (filename[0] == '\\')
                strcpy(tmpname, filename);
            else
                sprintf(tmpname, "%s\\%s", *incptr, filename);
#else
            /*
             * NOTE(review): when filename already has a directory part,
             * tmpname is left holding only that part -- confirm whether
             * the full filename was intended here.
             */
            if (!hasdirectory(filename, tmpname, NFWORK))
                sprintf(tmpname, "%s%s", *incptr, filename);
#endif
            if (openfile(tmpname))
                return TRUE;
        }
    }
    return FALSE;
}

/*
 * If a device or directory is found in the source filename string, the
 * node/device/directory part of the string is copied to result and
 * hasdirectory returns TRUE.  Else, nothing is copied and it returns FALSE.
 */
FILE_LOCAL int hasdirectory(char* source, char* result, int max)
{
#if HOST == SYS_UNIX
    char* tp;

    if ((tp = strrchr(source, '/')) == NULL)
        return FALSE;
    else
    {
        int len = (int)(tp - source);
        if(len < max)
        {
            memcpy(result, source, len);
            result[len] = 0;
        }
        else
        {
            cfatal("Filename work buffer overflow", NULLST);
        }
        return TRUE;
    }
#else
    /*
     * Random DEC operating system (RSTS/E)
     */
    char* tp;

    (void)max;

    if ((tp = strrchr(source, ']')) == NULL &&
        (tp = strrchr(source, ':')) == NULL)
    {
        return FALSE;
    }
    else
    {
        strncpy(result, source, tp - source + 1);
        result[tp - source + 1] = EOS;
        return TRUE;
    }
#endif
}

/* vim:set shiftwidth=4 softtabstop=4 expandtab: */