Wave: a Standard conformant C++ preprocessor library

Hartmut Kaiser

Rate me:

4.96/5 (58 votes)

10 Jan 2004 · 13 min read

399.2K

4.4K

Describes a free and fully Standard conformant C++ preprocessor library

wave_preprocessor_src.zip
- wave
  - doc
    - acknowledgements.html
    - class_reference_context.html
    - class_reference_fileposition.html
    - class_reference_inputpolicy.html
    - class_reference_lexer.html
    - class_reference_tokentype.html
    - class_reference_tracepolicy.html
    - compiletime_config.html
    - index.html
    - introduction.html
    - macro_expansion_process.html
    - predefined_macros.html
    - preface.html
    - preliminary_cpp0x_support.html
    - quickstart.html
    - references.html
    - supported_pragmas.html
    - theme
      - bkd.gif
      - bkd2.gif
      - bullet.gif
      - l_arr.gif
      - l_arr_disabled.gif
      - r_arr.gif
      - r_arr_disabled.gif
      - style.css
      - u_arr.gif
      - uc.gif
      - wave.gif
    - token_ids.html
    - tracing_facility.html
    - wave_driver.html
  - test
    - boost-build.jam
    - cpp_tokens
    - Jamfile.v2
    - list_includes
    - project-root.jam
    - wave.vcproj
    - wave
      - cpp.cpp
      - cpp.hpp
      - cpp_config.hpp
      - cpp_version.hpp
      - instantiate_cpp_exprgrammar.cpp
      - instantiate_cpp_grammar.cpp
      - instantiate_cpp_literalgrammars.cpp
      - instantiate_defined_grammar.cpp
      - instantiate_predef_macros.cpp
      - instantiate_re2c_idllexer.cpp
      - instantiate_re2c_lexer.cpp
      - instantiate_slex_lexer.cpp
      - Jamfile
      - Jamfile.v2
      - runtests.sh
      - test_files
        
        scope1.cpp
        
        scope10.cpp
        
        scope11.cpp
        
        scope12.cpp
        
        scope13.cpp
        
        scope14.cpp
        
        scope15.cpp
        
        scope16.cpp
        
        scope17.cpp
        
        scope18.cpp
        
        scope19.cpp
        
        scope2.cpp
        
        scope20.cpp
        
        scope21.cpp
        
        scope22.cpp
        
        scope23.cpp
        
        scope24.cpp
        
        scope25.cpp
        
        scope26.cpp
        
        scope27.cpp
        
        scope3.cpp
        
        scope4.cpp
        
        scope5.cpp
        
        scope6.cpp
        
        scope7.cpp
        
        scope8.cpp
        
        scope9.cpp
        
        test1.cpp
        
        test10.cpp
        
        test11.cpp
        
        test12.cpp
        
        test13.cpp
        
        test14.cpp
        
        test15.cpp
        
        test16.cpp
        
        test17.cpp
        
        test18.cpp
        
        test19.cpp
        
        test2.cpp
        
        test20.cpp
        
        test21.cpp
        
        test22.cpp
        
        test23.cpp
        
        test24.cpp
        
        test25.cpp
        
        test26.cpp
        
        test27.cpp
        
        test28.cpp
        
        test29.cpp
        
        test3.cpp
        
        test30.cpp
        
        test31.cpp
        
        test32.cpp
        
        test33.cpp
        
        test34.cpp
        
        test35.cpp
        
        test36.cpp
        
        test37.cpp
        
        test38.cpp
        
        test39.cpp
        
        test4.cpp
        
        test40.cpp
        
        test41.cpp
        
        test41_0.hpp
        
        test41_1.hpp
        
        test42.cpp
        
        test43.cpp
        
        test44.cpp
        
        test45.cpp
        
        test46.cpp
        
        test47.cpp
        
        test48.cpp
        
        test49.cpp
        
        test5.cpp
        
        test50.cpp
        
        test51.cpp
        
        test52.cpp
        
        test53.cpp
        
        test54.cpp
        
        test55.cpp
        
        test56.cpp
        
        test57.cpp
        
        test58.cpp
        
        test59.cpp
        
        test6.cpp
        
        test60.cpp
        
        test61.cpp
        
        test62.cpp
        
        test63.cpp
        
        test64.cpp
        
        test65.cpp
        
        test66.cpp
        
        test67.cpp
        
        test68.cpp
        
        test69.cpp
        
        test7.cpp
        
        test70.cpp
        
        test71.cpp
        
        test72.cpp
        
        test73.cpp
        
        test74.cpp
        
        test75.cpp
        
        test76.cpp
        
        test77.cpp
        
        test78.cpp
        
        test79.cpp
        
        test8.cpp
        
        test9.cpp
      - trace_macro_expansion.hpp
  - wave
    - cpp_context.hpp
    - cpp_exceptions.hpp
    - cpp_iteration_context.hpp
    - cpplexer
      - cpp_lex_interface.hpp
      - cpp_lex_iterator.hpp
      - cpp_lex_token.hpp
      - cpp_token_ids.hpp
      - cpplexer_exceptions.hpp
      - macro_scoping_tokens.hpp
      - re2c_functor.hpp
      - re2clex
        
        aq.cpp
        
        aq.hpp
        
        cpp.re
        
        cpp.re.cpp
        
        cpp_re2c_lexer.hpp
        
        scanner.hpp
        
        test
        
        lextest.in
        
        lextest.output
        
        run_tests.sh
        
        test_lexer.c
        
        test_lexer.in
        
        test_lexer.output
      - slex
        
        cpp_slex_lexer.hpp
      - slex_functor.hpp
      - test
        
        instantiate_re2c_lexer.cpp
        
        instantiate_slex_lexer.cpp
        
        lextest.in
        
        lextest.re2c.output
        
        lextest.slex.output
        
        run_tests.sh
        
        test_re2c_lexer.cpp
        
        test_re2c_lexer.hpp
        
        test_slex_lexer.cpp
        
        test_slex_lexer.hpp
      - validate_universal_char.hpp
    - grammars
    - idllexer
      - idl_lex_interface.hpp
      - idl_lex_iterator.hpp
      - idl_lex_token.hpp
      - idl_token_ids.hpp
      - re2clex
        
        aq.cpp
        
        aq.hpp
        
        idl.re
        
        idl.re.cpp
        
        idl_re2c_lexer.hpp
        
        scanner.hpp
    - language_support.hpp
    - lex_iterator.hpp
    - lex_token.hpp
    - token_ids.hpp
    - trace_policies.hpp
    - util
    - wave.hpp
    - wave_version.hpp
wave_preprocessor_demo.zip
- wave.exe
wave_preprocessor_src1.zip
- acknowledgements.html
- class_reference_context.html
- class_reference_fileposition.html
- class_reference_inputpolicy.html
- class_reference_lexer.html
- class_reference_tokentype.html
- class_reference_tracepolicy.html
- compiletime_config.html
- index.html
- introduction.html
- macro_expansion_process.html
- predefined_macros.html
- preface.html
- preliminary_cpp0x_support.html
- quickstart.html
- references.html
- supported_pragmas.html
- bkd.gif
- bkd2.gif
- bullet.gif
- l_arr.gif
- l_arr_disabled.gif
- r_arr.gif
- r_arr_disabled.gif
- style.css
- u_arr.gif
- uc.gif
- wave.gif
- token_ids.html
- tracing_facility.html
- wave_driver.html
- boost-build.jam
- cpp_tokens.cpp
- cpp_tokens_config.hpp
- instantiate_cpp_exprgrammar.cpp
- instantiate_cpp_grammar.cpp
- instantiate_cpp_literalgrammars.cpp
- instantiate_re2c_lexer.cpp
- instantiate_slex_lexer.cpp
- Jamfile.v2
- instantiate_cpp_exprgrammar.cpp
- instantiate_cpp_grammar.cpp
- instantiate_cpp_literalgrammars.cpp
- instantiate_re2c_lexer.cpp
- instantiate_slex_lexer.cpp
- list_includes.cpp
- list_includes.hpp
- list_includes_version.hpp
- Readme.txt
- project-root.jam
- wave.vcproj
- cpp.cpp
- cpp.hpp
- cpp_config.hpp
- cpp_version.hpp
- instantiate_cpp_exprgrammar.cpp
- instantiate_cpp_grammar.cpp
- instantiate_cpp_literalgrammars.cpp
- instantiate_defined_grammar.cpp
- instantiate_predef_macros.cpp
- instantiate_re2c_lexer.cpp
- instantiate_slex_lexer.cpp
- Jamfile
- Jamfile.v2
- runtests.sh
- test1.cpp
- test10.cpp
- test11.cpp
- test12.cpp
- test13.cpp
- test14.cpp
- test15.cpp
- test16.cpp
- test17.cpp
- test18.cpp
- test19.cpp
- test2.cpp
- test20.cpp
- test21.cpp
- test22.cpp
- test23.cpp
- test24.cpp
- test25.cpp
- test26.cpp
- test27.cpp
- test28.cpp
- test29.cpp
- test3.cpp
- test30.cpp
- test31.cpp
- test32.cpp
- test33.cpp
- test4.cpp
- test5.cpp
- test6.cpp
- test7.cpp
- test8.cpp
- test9.cpp
- trace_macro_expansion.hpp
- cpp_context.hpp
- cpp_exceptions.hpp
- cpp_iteration_context.hpp
- cpp_lex_interface.hpp
- cpp_lex_iterator.hpp
- cpp_lex_token.hpp
- cpp_token_ids.hpp
- cpplexer_exceptions.hpp
- macro_scoping_tokens.hpp
- re2c_functor.hpp
- aq.cpp
- aq.hpp
- cpp.re
- cpp.re.cpp
- cpp_re2c_lexer.hpp
- scanner.hpp
- lextest.in
- lextest.output
- run_tests.sh
- test_lexer.c
- test_lexer.in
- test_lexer.output
- cpp_slex_lexer.hpp
- slex_functor.hpp
- instantiate_re2c_lexer.cpp
- instantiate_slex_lexer.cpp
- lextest.in
- lextest.re2c.output
- lextest.slex.output
- run_tests.sh
- test_re2c_lexer.cpp
- test_re2c_lexer.hpp
- test_slex_lexer.cpp
- test_slex_lexer.hpp
- validate_universal_char.hpp
- cpp_chlit_grammar.hpp
- cpp_defined_grammar.hpp
- cpp_defined_grammar_gen.hpp
- cpp_expression_grammar.hpp
- cpp_expression_grammar_gen.hpp
- cpp_floatlit_grammar.hpp
- cpp_grammar.hpp
- cpp_grammar_gen.hpp
- cpp_intlit_grammar.hpp
- cpp_literal_grammar_gen.hpp
- cpp_predef_macros_gen.hpp
- cpp_predef_macros_grammar.hpp
- language_support.hpp
- macro_trace_policies.hpp
- cpp_ifblock.hpp
- cpp_include_pathes.hpp
- cpp_iterator.hpp
- cpp_macromap.hpp
- eat_whitespace.hpp
- file_position.hpp
- flex_string.hpp
- insert_whitespace_detection.hpp
- interpret_pragma.hpp
- iteration_context.hpp
- macro_definition.hpp
- macro_helpers.hpp
- pattern_parser.hpp
- symbol_table.hpp
- time_conversion_helper.hpp
- transform_iterator.hpp
- unput_queue_iterator.hpp
- wave_version.hpp
wave_preprocessor_demo1.zip
- wave.exe

/*=============================================================================
    Wave: A Standard compliant C++ preprocessor

    Detect the need to insert a whitespace token into the output stream
    
    Copyright (c) 2001-2004 Hartmut Kaiser
    http://spirit.sourceforge.net/

    Use, modification and distribution is subject to the Boost Software
    License, Version 1.0. (See accompanying file LICENSE_1_0.txt or copy at
    http://www.boost.org/LICENSE_1_0.txt)

    See Copyright.txt for full acknowledgements.
=============================================================================*/
#if !defined(INSERT_WHITESPACE_DETECTION_HPP_765EF77B_0513_4967_BDD6_6A38148C4C96_INCLUDED)
#define INSERT_WHITESPACE_DETECTION_HPP_765EF77B_0513_4967_BDD6_6A38148C4C96_INCLUDED

#include "wave/token_ids.hpp"   

///////////////////////////////////////////////////////////////////////////////
namespace wave {
namespace util {

namespace impl {

// T_IDENTIFIER
    // Tests whether an identifier spelling, if written directly behind a 
    // backslash, would be read back as a universal character name, i.e. 
    // \uXXXX (4 hex digits) or \UXXXXXXXX (8 hex digits), possibly followed 
    // by further characters.
    //
    //  value   the spelling of the identifier token to test
    //
    // Returns true if 'value' starts with 'u' followed by at least 4 hex 
    // digits or with 'U' followed by at least 8 hex digits, false otherwise 
    // (including for an empty 'value').
    template <typename StringT>
    inline bool
    would_form_universal_char (StringT const &value)
    {
        if (0 == value.size())
            return false;       // nothing to inspect, never index value[0]

    // number of hex digits which have to follow the leading 'u' or 'U'
    typename StringT::size_type required_digits = 0;

        if ('u' == value[0])
            required_digits = 4;
        else if ('U' == value[0])
            required_digits = 8;
        else
            return false;       // not a universal char prefix at all

        if (value.size() < required_digits + 1)
            return false;       // too short to hold all required digits

    typename StringT::size_type const pos = 
        value.find_first_not_of("0123456789abcdefABCDEF", 1);

        // The required digits occupy the positions [1, required_digits]. The
        // sequence forms a universal char as soon as the first non-hex 
        // character (if any) is located behind this range, e.g. the 'x' in
        // "u1234x" at position 5 still leaves \u1234 intact.
        return StringT::npos == pos || pos > required_digits;
    }
    // Decides whether a whitespace has to be emitted in front of an identifier
    // token, based on the token emitted immediately before it.
    //
    //  prev    id of the previously emitted token
    //  before  id of the token emitted before 'prev' (not consulted here)
    //  value   spelling of the identifier about to be emitted
    //
    // Returns the result of would_form_universal_char(value) if 'prev' is a 
    // single backslash. Otherwise returns true if 'prev' is T_IDENTIFIER, 
    // T_NONREPLACABLE_IDENTIFIER, T_INTLIT, T_FLOATLIT or - depending on 
    // WAVE_USE_RE2C_IDL_LEXER - one of the *_ALT operator tokens resp. 
    // T_FIXEDPOINTLIT, and false for any other token.
    template <typename StringT>
    inline bool 
    handle_identifier(WAVE_LEXER_NS::token_id prev, 
        WAVE_LEXER_NS::token_id before, StringT const &value)
    {
        using namespace WAVE_LEXER_NS;

        // avoid constructing universal characters (\u1234)
        if (TOKEN_FROM_ID('\\', UnknownTokenType) == prev)
            return would_form_universal_char(value);

        // tokens which would merge with a directly following identifier
        return T_IDENTIFIER == prev ||
            T_NONREPLACABLE_IDENTIFIER == prev ||
            T_INTLIT == prev ||
            T_FLOATLIT == prev ||
#if !defined(WAVE_USE_RE2C_IDL_LEXER)
            T_COMPL_ALT == prev ||
            T_OR_ALT == prev ||
            T_AND_ALT == prev ||
            T_NOT_ALT == prev ||
            T_XOR_ALT == prev ||
            T_ANDASSIGN_ALT == prev ||
            T_ORASSIGN_ALT == prev ||
            T_XORASSIGN_ALT == prev ||
            T_NOTEQUAL_ALT == prev;
#else
            T_FIXEDPOINTLIT == prev;
#endif // !defined(WAVE_USE_RE2C_IDL_LEXER)
    }
// T_INTLIT
    // Decides whether a whitespace has to be emitted in front of an integer
    // literal token.
    //
    //  prev    id of the previously emitted token
    //  before  id of the token emitted before 'prev' (not consulted here)
    //
    // Returns true if 'prev' is an identifier or a numeric literal token 
    // (T_FIXEDPOINTLIT is taken into account for the IDL lexer only), false 
    // otherwise.
    inline bool 
    handle_intlit(WAVE_LEXER_NS::token_id prev, WAVE_LEXER_NS::token_id before)
    {
        using namespace WAVE_LEXER_NS;

        if (T_IDENTIFIER == prev || T_NONREPLACABLE_IDENTIFIER == prev)
            return true;        // identifier directly followed by digits
        if (T_INTLIT == prev || T_FLOATLIT == prev)
            return true;        // two adjacent numeric literals
#if defined(WAVE_USE_RE2C_IDL_LEXER)
        if (T_FIXEDPOINTLIT == prev)
            return true;
#endif // defined(WAVE_USE_RE2C_IDL_LEXER)
        return false;
    }
// T_FLOATLIT
    // Decides whether a whitespace has to be emitted in front of a floating
    // point literal token.
    //
    //  prev    id of the previously emitted token
    //  before  id of the token emitted before 'prev' (not consulted here)
    //
    // Returns true if 'prev' is an identifier or a numeric literal token 
    // (T_FIXEDPOINTLIT is taken into account for the IDL lexer only), false 
    // otherwise.
    inline bool 
    handle_floatlit(WAVE_LEXER_NS::token_id prev, 
        WAVE_LEXER_NS::token_id before)
    {
        using namespace WAVE_LEXER_NS;

        bool const follows_identifier = 
            T_IDENTIFIER == prev || T_NONREPLACABLE_IDENTIFIER == prev;
        bool const follows_number = 
#if defined(WAVE_USE_RE2C_IDL_LEXER)
            T_FIXEDPOINTLIT == prev ||
#endif // defined(WAVE_USE_RE2C_IDL_LEXER)
            T_INTLIT == prev || T_FLOATLIT == prev;

        return follows_identifier || follows_number;
    }
#if !defined(WAVE_USE_RE2C_IDL_LEXER)
// <% T_LEFTBRACE
    // Decides whether a whitespace has to be emitted in front of the 
    // alternative left brace token '<%'.
    //
    //  prev    id of the previously emitted token
    //  before  id of the token emitted before 'prev' (not consulted here)
    //
    // Returns true if 'prev' is '<' (would yield '<<%') or '<<' (would yield
    // '<<<%'), false otherwise.
    inline bool 
    handle_alt_leftbrace(WAVE_LEXER_NS::token_id prev, 
        WAVE_LEXER_NS::token_id before)
    {
        using namespace WAVE_LEXER_NS;

        return T_LESS == prev           // <<%
            || T_SHIFTLEFT == prev;     // <<<%
    }
// <: T_LEFTBRACKET
    // Decides whether a whitespace has to be emitted in front of the 
    // alternative left bracket token '<:'.
    //
    //  prev    id of the previously emitted token
    //  before  id of the token emitted before 'prev' (not consulted here)
    //
    // Returns true if 'prev' is '<' (would yield '<<:') or '<<' (would yield
    // '<<<:'), false otherwise.
    inline bool 
    handle_alt_leftbracket(WAVE_LEXER_NS::token_id prev, 
        WAVE_LEXER_NS::token_id before)
    {
        using namespace WAVE_LEXER_NS;

        if (T_LESS == prev)             // <<:
            return true;
        return T_SHIFTLEFT == prev;     // <<<:
    }
#else
// T_FIXEDPOINTLIT
    // Decides whether a whitespace has to be emitted in front of a fixed 
    // point literal token (this function exists for the IDL lexer only).
    //
    //  prev    id of the previously emitted token
    //  before  id of the token emitted before 'prev' (not consulted here)
    //
    // Returns true if 'prev' is an identifier or any numeric literal token,
    // false otherwise.
    inline bool 
    handle_fixedpointlit(WAVE_LEXER_NS::token_id prev, 
        WAVE_LEXER_NS::token_id before)
    {
        using namespace WAVE_LEXER_NS;

        if (T_IDENTIFIER == prev || T_NONREPLACABLE_IDENTIFIER == prev)
            return true;        // identifier directly followed by a literal

        // two adjacent numeric literals
        return T_INTLIT == prev || T_FLOATLIT == prev || 
            T_FIXEDPOINTLIT == prev;
    }
#endif // !defined(WAVE_USE_RE2C_IDL_LEXER)
// T_DOT
    // Decides whether a whitespace has to be emitted in front of a '.' token.
    //
    //  prev    id of the previously emitted token
    //  before  id of the token emitted before 'prev'
    //
    // Returns true only if both preceding tokens are dots as well, i.e. if 
    // the three dots would be written as '...'; false otherwise.
    inline bool 
    handle_dot(WAVE_LEXER_NS::token_id prev, WAVE_LEXER_NS::token_id before)
    {
        using namespace WAVE_LEXER_NS;

        return T_DOT == prev && T_DOT == before;    // ...
    }
// T_QUESTION_MARK
    // Decides whether a whitespace has to be emitted in front of a '?' token.
    //
    //  prev    id of the previously emitted token
    //  before  id of the token emitted before 'prev' (not consulted here)
    //
    // Returns true if 'prev' is a single backslash (would yield '\?') or 
    // another question mark (would yield '??'), false otherwise.
    inline bool 
    handle_questionmark(WAVE_LEXER_NS::token_id prev, 
        WAVE_LEXER_NS::token_id before)
    {
        using namespace WAVE_LEXER_NS;

        if (TOKEN_FROM_ID('\\', UnknownTokenType) == prev)  // \?
            return true;
        return T_QUESTION_MARK == prev;                     // ??
    }
// T_NEWLINE
    // Decides whether a whitespace has to be emitted in front of a newline 
    // token.
    //
    //  prev    id of the previously emitted token
    //  before  id of the token emitted before 'prev'
    //
    // Returns true if 'prev' is either a single backslash or '/' and, at the 
    // same time, 'before' is a question mark (the sequence '?/' followed by a 
    // newline may be read as '\' followed by a newline); false otherwise.
    //
    // NOTE(review): a backslash in 'prev' is subject to the very same 
    // 'before' test as '/', so a plain '\' directly followed by a newline 
    // yields false - confirm that this is intended.
    inline bool
    handle_newline(WAVE_LEXER_NS::token_id prev, 
        WAVE_LEXER_NS::token_id before)
    {
        using namespace WAVE_LEXER_NS;

        bool const prev_is_slash_like = 
            TOKEN_FROM_ID('\\', UnknownTokenType) == prev ||    // \ \n
            T_DIVIDE == prev;

        // ?/\n     // may be \\n
        return prev_is_slash_like && T_QUESTION_MARK == before;
    }
    
}   // namespace impl

///////////////////////////////////////////////////////////////////////////////
//
//  insert_whitespace_detection
//
//      Keeps track of the ids of the last two tokens handed to shift_tokens()
//      and decides, for a given current token, whether a whitespace token 
//      has to be inserted in front of it. 
//
//      must_insert() only inspects the stored token ids, it never changes 
//      them; the history is advanced solely by shift_tokens(). Presumably 
//      the caller invokes shift_tokens() for every token it writes to the 
//      output - verify against the calling code.
//
///////////////////////////////////////////////////////////////////////////////
class insert_whitespace_detection 
{
public:
    // Initially both remembered tokens are set to T_EOF.
    insert_whitespace_detection() 
    :   prev(WAVE_LEXER_NS::T_EOF), beforeprev(WAVE_LEXER_NS::T_EOF) 
    {}
    
    // Tests whether a whitespace has to be inserted in front of the token 
    // 'current'.
    //
    //  current     id of the token about to be emitted
    //  value       spelling of this token (used for identifiers only, where 
    //              it is forwarded to impl::handle_identifier)
    //
    // Returns true if a whitespace is required, false otherwise. Token kinds
    // which have a dedicated impl::handle_...() function return its result
    // directly. All cases leaving the switch through 'break' (and all tokens 
    // not listed at all) are additionally subject to the generic operator 
    // rule at the end of the function.
    template <typename StringT>
    bool must_insert(WAVE_LEXER_NS::token_id current, StringT const &value)
    {
        using namespace WAVE_LEXER_NS;
        switch (current) {
        case T_NONREPLACABLE_IDENTIFIER:
        case T_IDENTIFIER: 
            return impl::handle_identifier(prev, beforeprev, value); 
        case T_INTLIT:
            return impl::handle_intlit(prev, beforeprev); 
        case T_FLOATLIT:
            return impl::handle_floatlit(prev, beforeprev); 
        case T_STRINGLIT:
            if (TOKEN_FROM_ID('L', UnknownTokenType) == prev)       // 'L'
                return true;
            break;
#if !defined(WAVE_USE_RE2C_IDL_LEXER)
        case T_LEFTBRACE_ALT:
            return impl::handle_alt_leftbrace(prev, beforeprev); 
        case T_LEFTBRACKET_ALT:
            return impl::handle_alt_leftbracket(prev, beforeprev); 
#else
        case T_FIXEDPOINTLIT:
            return impl::handle_fixedpointlit(prev, beforeprev); 
#endif // !defined(WAVE_USE_RE2C_IDL_LEXER)
        case T_DOT:
            return impl::handle_dot(prev, beforeprev); 
        case T_QUESTION_MARK:
            return impl::handle_questionmark(prev, beforeprev); 
        case T_NEWLINE:
            return impl::handle_newline(prev, beforeprev); 

        // punctuation directly following a paren/bracket/brace is never 
        // separated; the explicit 'return false' bypasses the operator rule 
        // at the end of this function
        case T_LEFTPAREN:
        case T_RIGHTPAREN:
        case T_LEFTBRACKET:
        case T_RIGHTBRACKET:
        case T_SEMICOLON:
        case T_COMMA:
        case T_COLON:
            switch (prev) {
            case T_LEFTPAREN:
            case T_RIGHTPAREN:
            case T_LEFTBRACKET:
            case T_RIGHTBRACKET:
            case T_LEFTBRACE:
            case T_RIGHTBRACE:
                return false;   // no insertion between parens/brackets/braces

            default:
                break;
            }        
            break;
            
        // braces are additionally left unseparated behind ';', ',' and ':', 
        // but need a whitespace if preceded by two question marks
        case T_LEFTBRACE:
        case T_RIGHTBRACE:
            switch (prev) {
            case T_LEFTPAREN:
            case T_RIGHTPAREN:
            case T_LEFTBRACKET:
            case T_RIGHTBRACKET:
            case T_LEFTBRACE:
            case T_RIGHTBRACE:
            case T_SEMICOLON:
            case T_COMMA:
            case T_COLON:
                return false;   // no insertion between parens/brackets/braces

            case T_QUESTION_MARK:
                if (T_QUESTION_MARK == beforeprev)
                    return true;
                break;
                
            default:
                break;
            }
            break;
                            
        // tokens which need a whitespace if preceded by two question marks
        // (presumably to avoid forming a trigraph sequence - confirm)
        case T_MINUS:
        case T_MINUSMINUS:
        case T_LESS:
        case T_EQUAL:
        case T_ASSIGN:
        case T_GREATER:
        case T_DIVIDE:
        case T_CHARLIT:
        case T_NOT:
        case T_NOTEQUAL:
#if !defined(WAVE_USE_RE2C_IDL_LEXER)
        case T_DIVIDEASSIGN:
        case T_MINUSASSIGN:
#endif // !defined(WAVE_USE_RE2C_IDL_LEXER)
            if (T_QUESTION_MARK == prev && T_QUESTION_MARK == beforeprev)
                return true;    // ??{op}
            break;

#if !defined(WAVE_USE_RE2C_IDL_LEXER)
        // the *_ALT operator tokens need a whitespace if they directly follow
        // an identifier or a token of the keyword category
        case T_COMPL_ALT:
        case T_OR_ALT:
        case T_AND_ALT:
        case T_NOT_ALT:
        case T_XOR_ALT:
        case T_ANDASSIGN_ALT:
        case T_ORASSIGN_ALT:
        case T_XORASSIGN_ALT:
        case T_NOTEQUAL_ALT:
            if (T_IDENTIFIER == prev || T_NONREPLACABLE_IDENTIFIER == prev ||
                IS_CATEGORY(prev, KeywordTokenType))
                return true;
            break;
#endif // !defined(WAVE_USE_RE2C_IDL_LEXER)
        }

    // else, handle operators separately
        if (IS_CATEGORY(current, OperatorTokenType) && 
            IS_CATEGORY(prev, OperatorTokenType))
        {
            return true;    // operators must be delimited always
        }
        return false;
    }

    // Advances the token history by one: the former previous token becomes 
    // the token before the previous one, 'next_id' becomes the new previous 
    // token.
    void shift_tokens (WAVE_LEXER_NS::token_id next_id)
    {
        beforeprev = prev;
        prev = next_id;
    }
    
private:
    WAVE_LEXER_NS::token_id prev;        // the previous analyzed token
    WAVE_LEXER_NS::token_id beforeprev;  // the token before the previous
};

///////////////////////////////////////////////////////////////////////////////
}   //  namespace util
}   //  namespace wave 

#endif // !defined(INSERT_WHITESPACE_DETECTION_HPP_765EF77B_0513_4967_BDD6_6A38148C4C96_INCLUDED)

By viewing downloads associated with this article you agree to the Terms of Service and the article's licence.

If a file you wish to view isn't highlighted, and is a text file (not binary), please let us know and we'll add colourisation support for it.

License

This article has no explicit license attached to it but may contain usage terms in the article text or the download files themselves. If in doubt please contact the author via the discussion board below.

A list of licenses authors might use can be found here

Written By

Hartmut Kaiser

United States

Actively involved in Boost and the development of the Spirit parser construction framework.

Wave: a Standard conformant C++ preprocessor library

License

Comments and Discussions