/* * PROGRAM: JRD Data Definition Language * MODULE: lex.cpp * DESCRIPTION: Lexical analyser * * The contents of this file are subject to the Interbase Public * License Version 1.0 (the "License"); you may not use this file * except in compliance with the License. You may obtain a copy * of the License at http://www.Inprise.com/IPL.html * * Software distributed under the License is distributed on an * "AS IS" basis, WITHOUT WARRANTY OF ANY KIND, either express * or implied. See the License for the specific language governing * rights and limitations under the License. * * The Original Code was created by Inprise Corporation * and its predecessors. Portions created by Inprise Corporation are * Copyright (C) Inprise Corporation. * * All Rights Reserved. * Contributor(s): ______________________________________. * * 2002.10.29 Sean Leyne - Removed obsolete "Netware" port * * 2002.10.30 Sean Leyne - Removed support for obsolete "PC_PLATFORM" define * */ #include "firebird.h" #include "../jrd/ib_stdio.h" #include #include #include #include "../jrd/y_ref.h" #include "../jrd/ibase.h" #include "../dudley/ddl.h" #include "../dudley/parse.h" #include "../dudley/ddl_proto.h" #include "../dudley/hsh_proto.h" #include "../dudley/lex_proto.h" #include "../jrd/gds_proto.h" #ifdef HAVE_UNISTD_H #include #endif #ifdef SMALL_FILE_NAMES const char* SCRATCH = "fb_q"; #else const char* SCRATCH = "fb_query_"; #endif extern const TEXT* DDL_prompt; static int nextchar(void); static void retchar(SSHORT); static int skip_white(void); /* Input line control */ static IB_FILE *input_file, *trace_file; static TEXT *DDL_char, DDL_buffer[256], trace_file_name[128]; enum chr_types { CHR_ident = 1, CHR_letter = 2, CHR_digit = 4, CHR_quote = 8, CHR_white = 16, CHR_eol = 32, CHR_IDENT = CHR_ident, CHR_LETTER = CHR_letter + CHR_ident, CHR_DIGIT = CHR_digit + CHR_ident, CHR_QUOTE = CHR_quote, CHR_WHITE = CHR_white, CHR_EOL = CHR_white }; static SCHAR classes[256] = { 0, 0, 0, 0, 0, 0, 0, 0, 0, CHR_WHITE, CHR_EOL, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, CHR_WHITE, 0, CHR_QUOTE, CHR_IDENT, CHR_IDENT, 0, 0, CHR_QUOTE, 0, 0, 0, 0, 0, 0, 0, 0, CHR_DIGIT, CHR_DIGIT, CHR_DIGIT, CHR_DIGIT, CHR_DIGIT, CHR_DIGIT, CHR_DIGIT, CHR_DIGIT, CHR_DIGIT, CHR_DIGIT, 0, 0, 0, 0, 0, 0, 0, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, 0, 0, 0, 0, CHR_LETTER, 0, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, CHR_LETTER, 0 }; TOK LEX_filename(void) { /************************************** * * L E X _ f i l e n a m e * ************************************** * * Functional description * Parse the next token as a filename. * **************************************/ TOK token; SSHORT c; TEXT *p; token = &DDL_token; p = token->tok_string; *p++ = c = skip_white(); if (DDL_eof) { token->tok_symbol = NULL; token->tok_keyword = KW_none; return NULL; } while (!(classes[c = nextchar()] & (CHR_white | CHR_eol))) *p++ = c; retchar(c); token->tok_length = p - token->tok_string; *p = 0; token->tok_symbol = NULL; token->tok_keyword = KW_none; return token; } void LEX_fini(void) { /************************************** * * L E X _ f i n i * ************************************** * * Functional description * Shut down LEX in a more or less clean way. * **************************************/ if (trace_file != NULL) ib_fclose(trace_file); if (trace_file_name[0]) unlink(trace_file_name); } void LEX_flush(void) { /************************************** * * L E X _ f l u s h * ************************************** * * Functional description * Flush the input stream after an error. For now, just look for * an end of line. * **************************************/ SSHORT c; while (!DDL_eof) { if ((c = nextchar()) == '\n') break; } *DDL_char = 0; } void LEX_get_text(UCHAR * buffer, TXT text) { /************************************** * * L E X _ g e t _ t e x t * ************************************** * * Functional description * Write text from the scratch trace file into a buffer. * **************************************/ SLONG start; int length; UCHAR *p; start = text->txt_position; length = text->txt_length; if (ib_fseek(trace_file, start, 0)) { ib_fseek(trace_file, (SLONG) 0, 2); DDL_err(275, NULL, NULL, NULL, NULL, NULL); /* msg 275: ib_fseek failed */ } p = buffer; while (length--) *p++ = ib_getc(trace_file); ib_fseek(trace_file, (SLONG) 0, 2); } void LEX_init( void *file) { /************************************** * * L E X _ i n i t * ************************************** * * Functional description * Initialize for lexical scanning. While we're at it, open a * scratch trace file to keep all input. * **************************************/ #if !(defined WIN_NT) trace_file = (IB_FILE*) gds__temp_file(TRUE, SCRATCH, 0); #else trace_file = (IB_FILE*) gds__temp_file(TRUE, SCRATCH, trace_file_name); #endif if (trace_file == (IB_FILE*) - 1) DDL_err(276, NULL, NULL, NULL, NULL, NULL); /* msg 276: couldn't open scratch file */ input_file = (IB_FILE*) file; DDL_char = DDL_buffer; DDL_token.tok_position = 0; DDL_description = false; DDL_line = 1; } void LEX_put_text (FRBRD *blob, TXT text) { /************************************** * * L E X _ p u t _ t e x t * ************************************** * * Functional description * Write text from the scratch trace file into a blob. * **************************************/ SLONG start; ISC_STATUS_ARRAY status_vector; int length; SSHORT l, c; TEXT buffer[1024], *p; start = text->txt_position; length = text->txt_length; if (ib_fseek(trace_file, start, 0)) { ib_fseek(trace_file, (SLONG) 0, 2); DDL_err(275, NULL, NULL, NULL, NULL, NULL); /* msg 275: ib_fseek failed */ } while (length) { p = buffer; while (length) { --length; *p++ = c = ib_getc(trace_file); if (c == '\n') break; } if (l = p - buffer) if (isc_put_segment(status_vector, &blob, l, buffer)) DDL_err(277, NULL, NULL, NULL, NULL, NULL); /* msg 277: isc_put_segment failed */ } ib_fseek(trace_file, (SLONG) 0, 2); } void LEX_real(void) { /************************************** * * L E X _ r e a l * ************************************** * * Functional description * If the token is an end of line, get the next token. * **************************************/ if (DDL_token.tok_string[0] != '\n') return; LEX_token(); } TOK LEX_token(void) { /************************************** * * L E X _ t o k e n * ************************************** * * Functional description * Parse and return the next token. * **************************************/ SSHORT c, next; SYM symbol; TOK token = &DDL_token; TEXT* p = token->tok_string; *p++ = c = skip_white(); /* On end of file, generate furious but phony end of line tokens */ TEXT char_class = classes[c]; if (DDL_eof) { p = token->tok_string; *p++ = '*'; *p++ = 'E'; *p++ = 'O'; *p++ = 'F'; *p++ = '*'; token->tok_symbol = NULL; token->tok_keyword = KW_none; token->tok_type = tok_eol; token->tok_length = p - token->tok_string; *p = '\0'; return NULL; } else if (char_class & CHR_letter) { while (classes[c = nextchar()] & CHR_ident) *p++ = c; retchar(c); token->tok_type = tok_ident; } else if (char_class & CHR_digit) { while (classes[c = nextchar()] & CHR_digit) *p++ = c; if (c == '.') { *p++ = c; while (classes[c = nextchar()] & CHR_digit) *p++ = c; } retchar(c); token->tok_type = tok_number; } else if ((char_class & CHR_quote) && !DDL_description) { token->tok_type = tok_quoted; do { if (!(next = nextchar()) || next == '\n') { DDL_err(278, NULL, NULL, NULL, NULL, NULL); /* msg 278: unterminated quoted string */ break; } *p++ = next; } while (next != c); } else if (c == '\n') token->tok_type = tok_eol; else { token->tok_type = tok_punct; *p++ = nextchar(); if (!HSH_lookup(token->tok_string, 2)) retchar(*--p); } token->tok_length = p - token->tok_string; *p = '\0'; token->tok_symbol = symbol = HSH_lookup(token->tok_string, token->tok_length); if (symbol && symbol->sym_type == SYM_keyword) token->tok_keyword = (enum kwwords) symbol->sym_keyword; else token->tok_keyword = KW_none; if (DDL_trace) ib_puts(token->tok_string); return token; } static int nextchar(void) { /************************************** * * n e x t c h a r * ************************************** * * Functional description * Get the next character from the input stream. * **************************************/ SSHORT c; SCHAR *end; /* mark the end of the buffer */ end = DDL_buffer + sizeof(DDL_buffer); /* If there isn't anything floating around, get a new line */ while (!(c = *DDL_char++)) { DDL_char = DDL_buffer; if (DDL_interactive) { ib_printf(DDL_prompt); if (DDL_service) ib_putc('\001', ib_stdout); ib_fflush(ib_stdout); } while (c = ib_getc(input_file)) { if (c == EOF && SYSCALL_INTERRUPTED(errno)) { errno = 0; continue; } if (c == EOF) break; if (DDL_char < end) *DDL_char++ = c; else DDL_err(279, NULL, NULL, NULL, NULL, NULL); /* msg 279: line too SLONG */ if (c == '\n') break; } *DDL_char = 0; if (c == EOF && DDL_char == DDL_buffer) { #ifdef UNIX if (DDL_interactive) ib_printf("\n"); #endif DDL_eof = true; return EOF; } DDL_char = DDL_buffer; ib_fputs(DDL_buffer, trace_file); } DDL_token.tok_position++; if (c == '\n') { ++DDL_line; #if (defined WIN_NT) /* need to account for extra linefeed on newline */ DDL_token.tok_position++; #endif } return c; } static void retchar( SSHORT c) { /************************************** * * r e t c h a r * ************************************** * * Functional description * Return a character to the input stream. * **************************************/ if (c == '\n') { --DDL_line; #if (defined WIN_NT) /* account for the extra linefeed in a newline */ --DDL_token.tok_position; #endif } --DDL_token.tok_position; --DDL_char; } static int skip_white(void) { /************************************** * * s k i p _ w h i t e * ************************************** * * Functional description * Skip over white space and comments in input stream * **************************************/ SSHORT c; while ((c = nextchar()) != EOF) { const SSHORT char_class = classes[c]; if (char_class & CHR_white) continue; if (c == '/') { SSHORT next = nextchar(); if (next != '*') { retchar(next); return c; } c = nextchar(); while ((next = nextchar()) && (next != EOF) && !(c == '*' && next == '/')) { c = next; } continue; } break; } return c; }