Mercurial > hg > octave-lyh
view libinterp/parse-tree/lex.h @ 16199:810a71122c25
move more global variables to octave_lexical_feedback class
* help.cc (raw_help_from_file): Don't protect and set
reading_script_file.
* octave.cc (likewise):
* oct_parse.in.yy (parse_fcn_file): Don't protect
reading_script_file.
* input.cc (get_debug_input): Don't protect and set reading_fcn_file,
reading_classdef_file, or reading_script_file.
* lex.h, lex.ll, input.h, input.cc (reading_fcn_file,
reading_classdef_file, reading_script_file): Declare as members of the
lexical_feedback class. Change all uses.
(lexical_feedback::lexical_feedback, lexical_feedback::reset):
Initialize and set them.
author | John W. Eaton <jwe@octave.org> |
---|---|
date | Tue, 05 Mar 2013 17:50:37 -0500 |
parents | b52d2f9294b6 |
children | 127cccb037bf |
line wrap: on
line source
/* Copyright (C) 1993-2012 John W. Eaton This file is part of Octave. Octave is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 3 of the License, or (at your option) any later version. Octave is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with Octave; see the file COPYING. If not, see <http://www.gnu.org/licenses/>. */ #if !defined (octave_lex_h) #define octave_lex_h 1 #include <list> #include <set> #include <stack> #include "input.h" extern OCTINTERP_API void cleanup_parser (void); // Is the given string a keyword? extern bool is_keyword (const std::string& s); class stream_reader { public: virtual int getc (void) = 0; virtual int ungetc (int c) = 0; protected: stream_reader (void) { } ~stream_reader (void) { } private: // No copying! stream_reader (const stream_reader&); stream_reader& operator = (const stream_reader&); }; // Forward decl for octave_lexer::token_stack. class token; // For communication between the lexer and parser. class lexical_feedback { public: // Did eat_whitespace or eat_continuation eat a space or tab, or a // newline, or both? // // Functions that return this type will return a logical OR of the // following values: // // NO_WHITESPACE no spaces to eat // SPACE_OR_TAB space or tab in input // NEWLINE bare new line in input enum whitespace_type { NO_WHITESPACE = 1, SPACE_OR_TAB = 2, NEWLINE = 4 }; // Track nesting of square brackets, curly braces, and parentheses. class bbp_nesting_level { private: enum bracket_type { BRACKET = 1, BRACE = 2, PAREN = 3 }; public: bbp_nesting_level (void) : context () { } bbp_nesting_level (const bbp_nesting_level& nl) : context (nl.context) { } bbp_nesting_level& operator = (const bbp_nesting_level& nl) { if (&nl != this) context = nl.context; return *this; } ~bbp_nesting_level (void) { } void reset (void) { while (! context.empty ()) context.pop (); } void bracket (void) { context.push (BRACKET); } bool is_bracket (void) { return ! context.empty () && context.top () == BRACKET; } void brace (void) { context.push (BRACE); } bool is_brace (void) { return ! context.empty () && context.top () == BRACE; } void paren (void) { context.push (PAREN); } bool is_paren (void) { return ! context.empty () && context.top () == PAREN; } bool is_bracket_or_brace (void) { return (! context.empty () && (context.top () == BRACKET || context.top () == BRACE)); } bool none (void) { return context.empty (); } void remove (void) { if (! context.empty ()) context.pop (); } void clear (void) { while (! context.empty ()) context.pop (); } private: std::stack<int> context; }; lexical_feedback (void) : end_of_input (false), convert_spaces_to_comma (true), do_comma_insert (false), at_beginning_of_statement (true), looking_at_anon_fcn_args (false), looking_at_return_list (false), looking_at_parameter_list (false), looking_at_decl_list (false), looking_at_initializer_expression (false), looking_at_matrix_or_assign_lhs (false), looking_for_object_index (false), looking_at_indirect_ref (false), parsing_class_method (false), maybe_classdef_get_set_method (false), parsing_classdef (false), quote_is_transpose (false), reading_fcn_file (false), reading_script_file (false), reading_classdef_file (false), input_line_number (1), current_input_column (1), bracketflag (0), braceflag (0), looping (0), defining_func (0), looking_at_function_handle (0), block_comment_nesting_level (0), looking_at_object_index (), parsed_function_name (), pending_local_variables (), nesting_level (), token_stack () { init (); } ~lexical_feedback (void); void init (void); void reset (void); // true means that we have encountered eof on the input stream. bool end_of_input; // true means that we should convert spaces to a comma inside a // matrix definition. bool convert_spaces_to_comma; // gag. stupid kludge so that [[1,2][3,4]] will work. bool do_comma_insert; // true means we are at the beginning of a statement, where a // command name is possible. bool at_beginning_of_statement; // true means we are parsing an anonymous function argument list. bool looking_at_anon_fcn_args; // true means we're parsing the return list for a function. bool looking_at_return_list; // true means we're parsing the parameter list for a function. bool looking_at_parameter_list; // true means we're parsing a declaration list (global or // persistent). bool looking_at_decl_list; // true means we are looking at the initializer expression for a // parameter list element. bool looking_at_initializer_expression; // true means we're parsing a matrix or the left hand side of // multi-value assignment statement. bool looking_at_matrix_or_assign_lhs; // object index not possible until we've seen something. bool looking_for_object_index; // true means we're looking at an indirect reference to a // structure element. bool looking_at_indirect_ref; // true means we are parsing a class method in function or classdef file. bool parsing_class_method; // true means we are parsing a class method declaration line in a // classdef file and can accept a property get or set method name. // for example, "get.propertyname" is recognized as a function name. bool maybe_classdef_get_set_method; // true means we are parsing a classdef file bool parsing_classdef; // return transpose or start a string? bool quote_is_transpose; // TRUE means we're parsing a function file. bool reading_fcn_file; // TRUE means we're parsing a script file. bool reading_script_file; // TRUE means we're parsing a classdef file. bool reading_classdef_file; // the current input line number. int input_line_number; // the column of the current token. int current_input_column; // square bracket level count. int bracketflag; // curly brace level count. int braceflag; // true means we're in the middle of defining a loop. int looping; // nonzero means we're in the middle of defining a function. int defining_func; // nonzero means we are parsing a function handle. int looking_at_function_handle; // nestng level for blcok comments. int block_comment_nesting_level; // if the front of the list is true, the closest paren, brace, or // bracket nesting is an index for an object. std::list<bool> looking_at_object_index; // if the top of the stack is true, then we've already seen the name // of the current function. should only matter if // current_function_level > 0 std::stack<bool> parsed_function_name; // set of identifiers that might be local variable names. std::set<std::string> pending_local_variables; // is the closest nesting level a square bracket, squiggly brace or // a paren? bbp_nesting_level nesting_level; // Stack to hold tokens so that we can delete them when the parser is // reset and avoid growing forever just because we are stashing some // information. std::stack <token*> token_stack; private: void reset_token_stack (void); // No copying! lexical_feedback (const lexical_feedback&); lexical_feedback& operator = (const lexical_feedback&); }; // octave_lexer inherits from lexical_feedback because we will // eventually have several different constructors and it is easier to // intialize if everything is grouped in a parent class rather than // listing all the members in the octave_lexer class. class octave_lexer : public lexical_feedback { public: // Handle buffering of input for lexer. class input_buffer { public: input_buffer (void) : buffer (), pos (0), chars_left (0), eof (false) { } void fill (const std::string& input, bool eof_arg); // Copy at most max_size characters to buf. int copy_chunk (char *buf, size_t max_size); bool empty (void) const { return chars_left == 0; } bool at_eof (void) const { return eof; } private: std::string buffer; const char *pos; size_t chars_left; bool eof; }; octave_lexer (void) : lexical_feedback (), scanner (0), input_buf (), input_reader () { init (); } octave_lexer (FILE *file) : lexical_feedback (), scanner (0), input_buf (), input_reader (file) { init (); } octave_lexer (const std::string& eval_string) : lexical_feedback (), scanner (0), input_buf (), input_reader (eval_string) { init (); } ~octave_lexer (void); void init (void); void reset (void); void prep_for_script_file (void); void prep_for_function_file (void); int read (char *buf, unsigned int max_size); int handle_end_of_input (void); char *flex_yytext (void); int flex_yyleng (void); void do_comma_insert_check (void); int text_yyinput (void); void xunput (char c, char *buf); void xunput (char c); void fixup_column_count (char *s); bool inside_any_object_index (void); int is_keyword_token (const std::string& s); bool is_variable (const std::string& name); std::string grab_block_comment (stream_reader& reader, bool& eof); std::string grab_comment_block (stream_reader& reader, bool at_bol, bool& eof); int process_comment (bool start_in_block, bool& eof); bool next_token_is_sep_op (void); bool next_token_is_postfix_unary_op (bool spc_prev); bool next_token_is_bin_op (bool spc_prev); void scan_for_comments (const char *text); int eat_whitespace (void); void handle_number (void); bool have_continuation (bool trailing_comments_ok = true); bool have_ellipsis_continuation (bool trailing_comments_ok = true); int eat_continuation (void); int handle_string (char delim); bool next_token_is_assign_op (void); bool next_token_is_index_op (void); int handle_close_bracket (bool spc_gobbled, int bracket_type); void maybe_unput_comma (int spc_gobbled); bool next_token_can_follow_bin_op (void); bool looks_like_command_arg (void); int handle_superclass_identifier (void); int handle_meta_identifier (void); int handle_identifier (void); void maybe_warn_separator_insert (char sep); void gripe_single_quote_string (void); void gripe_matlab_incompatible (const std::string& msg); void maybe_gripe_matlab_incompatible_comment (char c); void gripe_matlab_incompatible_continuation (void); void gripe_matlab_incompatible_operator (const std::string& op); void push_token (token *); token *current_token (void); void display_token (int tok); void fatal_error (const char *msg); void lexer_debug (const char *pattern, const char *text); // Internal state of the flex-generated lexer. void *scanner; // Object that reads and buffers input. input_buffer input_buf; octave_input_reader input_reader; std::string input_source (void) const { return input_reader.input_source (); } bool input_from_eval_string (void) const { return input_source () == "eval_string"; } // For unwind protect. static void cleanup (octave_lexer *lexer) { delete lexer; } private: // No copying! octave_lexer (const octave_lexer&); octave_lexer& operator = (const octave_lexer&); }; #endif