src/libclang/cxtokenizer.cpp

// Copyright (C) 2017-2023 Jonathan Müller and cppast contributors
// SPDX-License-Identifier: MIT

#include "cxtokenizer.hpp"

#include <cctype>

#include "libclang_visitor.hpp"
#include "parse_error.hpp"

using namespace cppast;

// Wraps a libclang token: stores the spelling libclang reports for `token` in the
// translation unit `tu_unit`, together with the token's kind.
detail::cxtoken::cxtoken(const CXTranslationUnit& tu_unit, const CXToken& token)
: value_(clang_getTokenSpelling(tu_unit, token)),
  kind_(clang_getTokenKind(token))
{}

namespace
{
// Whether `kind` denotes a function-like declaration: a free function, a member function,
// a constructor, a destructor or a conversion function.
bool cursor_is_function(CXCursorKind kind)
{
    switch (kind)
    {
    case CXCursor_FunctionDecl:
    case CXCursor_CXXMethod:
    case CXCursor_Constructor:
    case CXCursor_Destructor:
    case CXCursor_ConversionFunction:
        return true;

    default:
        return false;
    }
}

// Whether `kind` denotes a variable-like declaration: a variable or a field.
bool cursor_is_var(CXCursorKind kind)
{
    switch (kind)
    {
    case CXCursor_VarDecl:
    case CXCursor_FieldDecl:
        return true;

    default:
        return false;
    }
}

bool is_in_range(const CXSourceLocation& loc, const CXSourceRange& range)
{
    auto begin = clang_getRangeStart(range);
    auto end   = clang_getRangeEnd(range);

    CXFile   f_loc, f_begin, f_end;
    unsigned l_loc, l_begin, l_end;
    clang_getSpellingLocation(loc, &f_loc, &l_loc, nullptr, nullptr);
    clang_getSpellingLocation(begin, &f_begin, &l_begin, nullptr, nullptr);
    clang_getSpellingLocation(end, &f_end, &l_end, nullptr, nullptr);

    return l_loc >= l_begin && l_loc < l_end && clang_File_isEqual(f_loc, f_begin);
}

// Heuristic that detects a variable whose type is declared inline,
// i.e. `struct foo {} f`.
// It reports true if the declaration of the variable's type is located
// inside the extent of the variable declaration itself (see is_in_range()).
bool has_inline_type_definition(CXCursor var_decl)
{
    const auto declared_type = clang_getTypeDeclaration(clang_getCursorType(var_decl));
    if (!clang_Cursor_isNull(declared_type))
        return is_in_range(clang_getCursorLocation(declared_type),
                           clang_getCursorExtent(var_decl));

    // the type has no declaration cursor, so nothing can be inline
    return false;
}

class simple_tokenizer
{
public:
    explicit simple_tokenizer(const CXTranslationUnit& tu, const CXSourceRange& range) : tu_(tu)
    {
        clang_tokenize(tu, range, &tokens_, &no_);
    }

    ~simple_tokenizer()
    {
        clang_disposeTokens(tu_, tokens_, no_);
    }

    simple_tokenizer(const simple_tokenizer&)            = delete;
    simple_tokenizer& operator=(const simple_tokenizer&) = delete;

    unsigned size() const noexcept
    {
        return no_;
    }

    const CXToken& operator[](unsigned i) const noexcept
    {
        DEBUG_ASSERT(i < no_, detail::assert_handler{});
        return tokens_[i];
    }

    std::string get_spelling(std::size_t length) noexcept
    {
        // might need multiple tokens, because [[, for example, is treated as two separate tokens

        std::string result;
        for (auto cur = 0u; cur < no_; ++cur)
        {
            auto cur_spelling = detail::cxstring(clang_getTokenSpelling(tu_, tokens_[cur]));
            result += cur_spelling.c_str();
            if (result.length() >= length)
                return result;
        }
        return result;
    }

private:
    CXTranslationUnit tu_;
    CXToken*          tokens_;
    unsigned          no_;
};

// Returns the location in `file` whose offset is the offset of `loc` shifted by `inc` characters;
// a negative `inc` moves backwards.
// `loc` is asserted to be in the main file.
CXSourceLocation get_next_location_impl(const CXTranslationUnit& tu, CXFile file,
                                        const CXSourceLocation& loc, int inc = 1)
{
    DEBUG_ASSERT(clang_Location_isFromMainFile(loc), detail::assert_handler{});

    unsigned offset;
    clang_getSpellingLocation(loc, nullptr, nullptr, nullptr, &offset);

    // do the arithmetic in unsigned, the sign of inc only selects the direction
    const unsigned shifted = inc < 0 ? offset - unsigned(-inc) : offset + unsigned(inc);
    return clang_getLocationForOffset(tu, file, shifted);
}

// Returns the location `token_length` characters after `loc`.
CXSourceLocation get_next_location(const CXTranslationUnit& tu, const CXFile& file,
                                   const CXSourceLocation& loc, std::size_t token_length)
{
    // moving forward is a plain offset shift
    const auto shift = static_cast<int>(token_length);
    return get_next_location_impl(tu, file, loc, shift);
}

// Returns the location of the first character of the token that ends directly before `loc`,
// assuming that token is `token_length` characters long.
// Whitespace between the token and `loc` is skipped by walking backwards one character at a time.
// Returns a null location if the walk leaves the main file.
CXSourceLocation get_prev_location(const CXTranslationUnit& tu, const CXFile& file,
                                   const CXSourceLocation& loc, std::size_t token_length)
{
    for (auto inc = 1;; ++inc)
    {
        auto loc_before = get_next_location_impl(tu, file, loc, -inc);
        DEBUG_ASSERT(!clang_equalLocations(loc_before, loc), detail::assert_handler{});

        if (!clang_Location_isFromMainFile(loc_before))
            // out of range
            return clang_getNullLocation();

        simple_tokenizer tokenizer(tu, clang_getRange(loc_before, loc));
        if (tokenizer.size() == 0u)
            // nothing was tokenized for this range, so there is no first token to inspect;
            // keep walking backwards instead of reading a non-existent token
            continue;

        auto token_location = clang_getTokenLocation(tu, tokenizer[0]);
        if (clang_equalLocations(loc_before, token_location))
        {
            // actually found a new token and not just whitespace
            // loc_before is now the last character of the new token
            // need to move by token_length - 1 to get to the first character
            return get_next_location_impl(tu, file, loc, -1 * (inc + int(token_length) - 1));
        }
    }
}

// Whether the source text starting at `loc` tokenizes to exactly `token_str`.
// Returns false if the end of the candidate token would be outside of the main file.
bool token_at_is(const CXTranslationUnit& tu, const CXFile& file, const CXSourceLocation& loc,
                 const char* token_str)
{
    const auto length    = std::strlen(token_str);
    const auto range_end = get_next_location(tu, file, loc, length);

    if (clang_Location_isFromMainFile(range_end))
    {
        simple_tokenizer tokenizer(tu, clang_getRange(loc, range_end));
        return tokenizer.get_spelling(length) == token_str;
    }
    return false;
}

// Like token_at_is(), but on a match `loc` is additionally advanced past the token.
// `loc` is left untouched if the token does not match.
bool consume_if_token_at_is(const CXTranslationUnit& tu, const CXFile& file, CXSourceLocation& loc,
                            const char* token_str)
{
    const auto length    = std::strlen(token_str);
    const auto candidate = get_next_location(tu, file, loc, length);
    if (!clang_Location_isFromMainFile(candidate))
        return false;

    simple_tokenizer tokenizer(tu, clang_getRange(loc, candidate));
    const bool       matches = tokenizer.get_spelling(length) == token_str;
    if (matches)
        loc = candidate;
    return matches;
}

// Whether the token directly before `loc` (ignoring whitespace) is exactly `token_str`.
// Returns false if no location before `loc` could be determined inside the main file.
bool token_before_is(const CXTranslationUnit& tu, const CXFile& file, const CXSourceLocation& loc,
                     const char* token_str)
{
    const auto length      = std::strlen(token_str);
    const auto range_begin = get_prev_location(tu, file, loc, length);

    if (clang_Location_isFromMainFile(range_begin))
    {
        simple_tokenizer tokenizer(tu, clang_getRange(range_begin, loc));
        return tokenizer.get_spelling(length) == token_str;
    }
    return false;
}

// Like token_before_is(), but on a match `loc` is additionally moved back to the start of the
// token. `loc` is left untouched if the token does not match.
bool consume_if_token_before_is(const CXTranslationUnit& tu, const CXFile& file,
                                CXSourceLocation& loc, const char* token_str)
{
    const auto length    = std::strlen(token_str);
    const auto candidate = get_prev_location(tu, file, loc, length);
    if (!clang_Location_isFromMainFile(candidate))
        return false;

    simple_tokenizer tokenizer(tu, clang_getRange(candidate, loc));
    const bool       matches = tokenizer.get_spelling(length) == token_str;
    if (matches)
        loc = candidate;
    return matches;
}

// The source ranges that need to be tokenized for a cursor, as computed by get_extent().
struct Extent
{
    // the range to tokenize first
    CXSourceRange first_part;
    // an additional range to tokenize afterwards;
    // get_extent() sets it to a null range unless the type of a variable is defined inline,
    // in which case it covers the tokens after the type definition
    CXSourceRange second_part;
};

// clang_getCursorExtent() is somehow broken in various ways
// this function returns the actual CXSourceRange that covers all parts required for parsing
// might include more tokens
// this function is the reason you shouldn't use libclang
//
// Normally only first_part of the result is set and second_part is a null range.
// For a variable whose type is defined inline, the type definition is cut out:
// first_part covers everything before it and second_part everything after it.
Extent get_extent(const CXTranslationUnit& tu, const CXFile& file, const CXCursor& cur)
{
    auto extent = clang_getCursorExtent(cur);
    auto begin  = clang_getRangeStart(extent);
    auto end    = clang_getRangeEnd(extent);

    auto kind = clang_getCursorKind(cur);

    // first need to extend the range to capture attributes that are before the declaration
    if (cursor_is_function(kind) || cursor_is_function(clang_getTemplateCursorKind(cur))
        || kind == CXCursor_VarDecl || kind == CXCursor_FieldDecl || kind == CXCursor_ParmDecl
        || kind == CXCursor_NonTypeTemplateParameter)
    {
        while (token_before_is(tu, file, begin, "]]") || token_before_is(tu, file, begin, ")"))
        {
            // remembered so that a `)` that does not belong to alignas can be un-consumed
            auto save_begin = begin;
            if (consume_if_token_before_is(tu, file, begin, "]]"))
            {
                // C++11 attribute: walk backwards until the opening `[[` was consumed
                while (!consume_if_token_before_is(tu, file, begin, "[["))
                    begin = get_prev_location(tu, file, begin, 1);
            }
            else if (consume_if_token_before_is(tu, file, begin, ")"))
            {
                // maybe alignas specifier

                // walk backwards to the matching opening parenthesis
                auto paren_count = 1;
                for (auto last_begin = begin; paren_count != 0; last_begin = begin)
                {
                    if (token_before_is(tu, file, begin, "("))
                        --paren_count;
                    else if (token_before_is(tu, file, begin, ")"))
                        ++paren_count;

                    begin = get_prev_location(tu, file, begin, 1);
                    DEBUG_ASSERT(!clang_equalLocations(last_begin, begin),
                                 detail::parse_error_handler{}, cur,
                                 "infinite loop in alignas parsing");
                }

                if (!consume_if_token_before_is(tu, file, begin, "alignas"))
                {
                    // not alignas
                    begin = save_begin;
                    break;
                }
            }
        }
    }

    if (cursor_is_function(kind) || cursor_is_function(clang_getTemplateCursorKind(cur)))
    {
        if (clang_CXXMethod_isDefaulted(cur) || !clang_isCursorDefinition(cur))
        {
            // defaulted or declaration: extend until semicolon
            while (!token_at_is(tu, file, end, ";"))
                end = get_next_location(tu, file, end, 1);
        }
        else
        {
            // definition: remove body, we don't care about that
            // the range ends where the first body-like child starts
            auto has_children = false;
            detail::visit_children(cur, [&](const CXCursor& child) {
                if (has_children)
                    return;
                else if (clang_getCursorKind(child) == CXCursor_CompoundStmt
                         || clang_getCursorKind(child) == CXCursor_CXXTryStmt
                         || clang_getCursorKind(child) == CXCursor_InitListExpr)
                {
                    auto child_extent = clang_getCursorExtent(child);
                    end               = clang_getRangeStart(child_extent);
                    has_children      = true;
                }
            });
        }
    }
    else if (cursor_is_var(kind) || cursor_is_var(clang_getTemplateCursorKind(cur)))
    {
        // need to extend until the semicolon
        while (!token_at_is(tu, file, end, ";"))
            end = get_next_location(tu, file, end, 1);

        if (has_inline_type_definition(cur))
        {
            // the type is declared inline,
            // remove the type definition from the range
            auto type_cursor = clang_getTypeDeclaration(clang_getCursorType(cur));
            auto type_extent = clang_getCursorExtent(type_cursor);

            auto type_begin = clang_getRangeStart(type_extent);
            auto type_end   = clang_getRangeEnd(type_extent);

            return {clang_getRange(begin, type_begin), clang_getRange(type_end, end)};
        }
    }
    else if (kind == CXCursor_TemplateTypeParameter && token_at_is(tu, file, end, "("))
    {
        // if you have decltype as default argument for a type template parameter
        // libclang doesn't include the parameters
        // so skip forward until the parentheses are balanced again
        auto next = get_next_location(tu, file, end, 1);
        for (auto paren_count = 1; paren_count != 0; next = get_next_location(tu, file, next, 1))
        {
            if (token_at_is(tu, file, next, "("))
                ++paren_count;
            else if (token_at_is(tu, file, next, ")"))
                --paren_count;
        }
        end = next;
    }
    else if (kind == CXCursor_TemplateTemplateParameter && token_at_is(tu, file, end, "<"))
    {
        // if you have a template template parameter in a template template parameter,
        // the tokens are all messed up, only contain the `template`

        // first: skip to closing angle bracket
        // luckily no need to handle expressions here
        auto next = get_next_location(tu, file, end, 1);
        for (auto angle_count = 1; angle_count != 0; next = get_next_location(tu, file, next, 1))
        {
            if (token_at_is(tu, file, next, ">"))
                --angle_count;
            else if (token_at_is(tu, file, next, ">>"))
                angle_count -= 2;
            else if (token_at_is(tu, file, next, "<"))
                ++angle_count;
        }

        // second: skip until end of parameter
        // no need to handle default, so look for '>' or ','
        while (!token_at_is(tu, file, next, ">") && !token_at_is(tu, file, next, ","))
            next = get_next_location(tu, file, next, 1);
        // now we found the proper end of the token
        end = get_prev_location(tu, file, next, 1);
    }
    else if ((kind == CXCursor_TemplateTypeParameter || kind == CXCursor_NonTypeTemplateParameter
              || kind == CXCursor_TemplateTemplateParameter))
    {
        // variadic tokens in unnamed parameter not included
        consume_if_token_at_is(tu, file, end, "...");
    }
    else if (kind == CXCursor_EnumDecl && !token_at_is(tu, file, end, ";"))
    {
        // extend until the semicolon
        while (!token_at_is(tu, file, end, ";"))
            end = get_next_location(tu, file, end, 1);
    }
    else if (kind == CXCursor_EnumConstantDecl && !token_at_is(tu, file, end, ","))
    {
        // need to support attributes
        // just give up and extend the range to the range of the entire enum...
        auto parent = clang_getCursorLexicalParent(cur);
        end         = clang_getRangeEnd(clang_getCursorExtent(parent));
    }
    else if (kind == CXCursor_UnexposedDecl)
    {
        // include semicolon, if necessary
        if (token_at_is(tu, file, end, ";"))
            end = get_next_location(tu, file, end, 1);
    }

    return Extent{clang_getRange(begin, end), clang_getNullRange()};
}
} // namespace

// Collects all tokens that belong to the entity `cur`.
// The source range is determined by get_extent();
// if it consists of two parts, the tokens of both parts are stored one after the other.
detail::cxtokenizer::cxtokenizer(const CXTranslationUnit& tu, const CXFile& file,
                                 const CXCursor& cur)
{
    const auto extent = get_extent(tu, file, cur);

    // tokenizes `range` and appends every token to tokens_
    auto append_tokens = [&](const CXSourceRange& range) {
        simple_tokenizer tokenizer(tu, range);
        tokens_.reserve(tokens_.size() + tokenizer.size());
        for (unsigned idx = 0; idx < tokenizer.size(); ++idx)
            tokens_.emplace_back(tu, tokenizer[idx]);
    };

    append_tokens(extent.first_part);
    if (!clang_Range_isNull(extent.second_part))
        append_tokens(extent.second_part);
}

// Skips the token `str`, which is asserted to be the next token of the stream.
// An empty `str` is a no-op.
void detail::skip(detail::cxtoken_stream& stream, const char* str)
{
    if (*str == '\0')
        // nothing is expected
        return;

    DEBUG_ASSERT(!stream.done(), parse_error_handler{}, stream.cursor(),
                 format("expected '", str, "', got exhausted stream"));
    auto& next = stream.peek();
    DEBUG_ASSERT(next == str, parse_error_handler{}, stream.cursor(),
                 format("expected '", str, "', got '", next.c_str(), "'"));
    stream.bump();
}

namespace
{
// Checks whether `str` begins with the spelling of the token `t`.
// On success `str` is advanced past the spelling and any following spaces or tabs;
// on failure `str` is left unchanged.
bool starts_with(const char*& str, const detail::cxtoken& t)
{
    const auto token_length = t.value().length();
    if (std::strncmp(str, t.c_str(), token_length) == 0)
    {
        str += token_length;
        for (; *str == ' ' || *str == '\t'; ++str)
        {}
        return true;
    }
    return false;
}
} // namespace

// Skips `str` if the upcoming token(s) of the stream spell it, and reports whether it did so.
// Without `multi_token` a single token must spell all of `str`;
// with `multi_token`, `str` may be spread over several consecutive tokens,
// separated in `str` by spaces or tabs.
// An empty `str` always matches. On failure the stream position is restored.
bool detail::skip_if(detail::cxtoken_stream& stream, const char* str, bool multi_token)
{
    if (!*str)
        return true;
    else if (stream.done())
        return false;

    auto save = stream.cur();
    do
    {
        if (stream.done())
        {
            // ran out of tokens while part of str is still unmatched:
            // this is a mismatch, don't inspect tokens that are not there
            stream.set_cur(save);
            return false;
        }

        auto& token = stream.peek();
        if (!starts_with(str, token) || (!multi_token && *str != '\0'))
        {
            // either the token doesn't match,
            // or a single token was required but it only matched a prefix of str
            stream.set_cur(save);
            return false;
        }
        stream.bump();
    } while (multi_token && *str);
    return true;
}

namespace
{
// Whether or not the current angle bracket can be a comparison.
// `<` is treated as a comparison if the previous token was a literal,
// `>` if the following token is a literal; any other token is never a comparison.
// note: this is a heuristic I hope works often enough
bool is_comparison(CXTokenKind last_kind, const detail::cxtoken& cur, CXTokenKind next_kind)
{
    if (cur == "<")
        return last_kind == CXToken_Literal;
    if (cur == ">")
        return next_kind == CXToken_Literal;
    return false;
}
} // namespace

// Finds the bracket that closes the opening bracket the stream currently points to.
// The opening bracket must be one of `(`, `{`, `[` or `<`.
// The stream is taken by value, so the position of the caller's stream is not changed.
// The result holds the position of the closing bracket, the position after it,
// and a flag that is set if the closing bracket is the second half of a `>>` token.
detail::closing_bracket_pos detail::find_closing_bracket(detail::cxtoken_stream stream)
{
    auto        template_bracket = false;
    auto        open_bracket     = stream.peek().c_str();
    const char* close_bracket    = nullptr;
    if (skip_if(stream, "("))
        close_bracket = ")";
    else if (skip_if(stream, "{"))
        close_bracket = "}";
    else if (skip_if(stream, "["))
        close_bracket = "]";
    else if (skip_if(stream, "<"))
    {
        close_bracket    = ">";
        template_bracket = true;
    }
    else
        DEBUG_UNREACHABLE(parse_error_handler{}, stream.cursor(),
                          format("expected a bracket, got '", stream.peek().c_str(), "'"));

    // the opening bracket was already consumed above, so start at nesting level one
    auto bracket_count         = 1;
    auto paren_count           = 0; // internal nested parenthesis
    auto last_token            = CXToken_Comment;
    auto last_was_double_angle = false;
    while (!stream.done() && bracket_count != 0)
    {
        last_was_double_angle = false;

        auto& cur = stream.get();
        // brackets of the searched kind only count outside of other nested brackets,
        // and only if they are not considered a comparison operator
        if (paren_count == 0 && cur == open_bracket
            && !is_comparison(last_token, cur, stream.peek().kind()))
            ++bracket_count;
        else if (paren_count == 0 && cur == close_bracket
                 && !is_comparison(last_token, cur, stream.peek().kind()))
            --bracket_count;
        else if (paren_count == 0 && template_bracket && cur == ">>")
        {
            // maximal munch
            // a single `>>` token closes two template brackets
            bracket_count -= 2;
            last_was_double_angle = true;
        }
        else if (cur == "(" || cur == "{" || cur == "[")
            ++paren_count;
        else if (cur == ")" || cur == "}" || cur == "]")
            --paren_count;

        last_token = cur.kind();
    }
    DEBUG_ASSERT(bracket_count == 0 && paren_count == 0, parse_error_handler{}, stream.cursor(),
                 "find_closing_bracket() internal parse error");

    if (last_was_double_angle)
    {
        // the stream is now after the `>>` token;
        // that position is reported for both the bracket and the position after it
        return {stream.cur(), stream.cur(), true};
    }
    else
    {
        // the stream is now after the closing bracket, step back once to point at it
        auto after = stream.cur();
        stream.bump_back();
        return {stream.cur(), after, false};
    }
}

// Moves the stream from an opening bracket to the position after the matching closing bracket,
// as determined by find_closing_bracket().
void detail::skip_brackets(detail::cxtoken_stream& stream)
{
    auto bracket_pos = find_closing_bracket(stream);
    stream.set_cur(bracket_pos.after);
}

// Searches the remaining tokens of the stream for the token sequence [start, end).
// Two tokens are considered equal if both their value and their kind are equal.
// Returns the position of the first token of the first occurrence,
// or stream.end() if the sequence does not occur completely in the remaining tokens.
// The stream is taken by value, so the position of the caller's stream is not changed.
detail::cxtoken_iterator detail::find_sequence(detail::cxtoken_stream   stream,
                                               detail::cxtoken_iterator start,
                                               detail::cxtoken_iterator end)
{
    for (detail::cxtoken_iterator search_start = stream.cur(); search_start != stream.end();
         ++search_start)
    {
        detail::cxtoken_iterator search_iter = search_start;
        detail::cxtoken_iterator seq_iter    = start;

        // advance both iterators as long as the tokens agree
        while (search_iter != stream.end() && seq_iter != end)
        {
            if (search_iter->value() != seq_iter->value()
                || search_iter->kind() != seq_iter->kind())
                break;

            ++search_iter;
            ++seq_iter;
        }

        // only a fully consumed sequence is a match;
        // a prefix that merely ran into the end of the stream is not
        if (seq_iter == end)
            return search_start;
    }

    return stream.end();
}

namespace
{
// Parses the optional `using identifier :` prefix of an attribute list.
// Returns the identifier, or nullopt if the stream does not start with `using`.
type_safe::optional<std::string> parse_attribute_using(detail::cxtoken_stream& stream)
{
    if (!skip_if(stream, "using"))
        // no using prefix
        return type_safe::nullopt;

    // using identifier :
    //       ^
    DEBUG_ASSERT(stream.peek().kind() == CXToken_Identifier, detail::parse_error_handler{},
                 stream.cursor(), "expected identifier");
    auto using_scope = stream.get().value().std_str();
    skip(stream, ":");

    return using_scope;
}

// Maps the name of an attribute to its kind;
// names that are not in the table map to cpp_attribute_kind::unknown.
cpp_attribute_kind get_attribute_kind(const std::string& name)
{
    struct known_attribute
    {
        const char*        spelling;
        cpp_attribute_kind kind;
    };
    static const known_attribute known_attributes[] = {
        {"carries_dependency", cpp_attribute_kind::carries_dependency},
        {"deprecated", cpp_attribute_kind::deprecated},
        {"fallthrough", cpp_attribute_kind::fallthrough},
        {"maybe_unused", cpp_attribute_kind::maybe_unused},
        {"nodiscard", cpp_attribute_kind::nodiscard},
        {"noreturn", cpp_attribute_kind::noreturn},
    };

    for (const auto& attribute : known_attributes)
        if (name == attribute.spelling)
            return attribute.kind;

    return cpp_attribute_kind::unknown;
}

// Parses a parenthesized argument list `( some tokens )` starting at the opening parenthesis.
// Returns the tokens between the parentheses and leaves the stream after the closing one.
cpp_token_string parse_attribute_arguments(detail::cxtoken_stream& stream)
{
    // locate the closing parenthesis first, so everything in between can be taken verbatim
    auto closing = find_closing_bracket(stream);

    skip(stream, "(");
    auto argument_tokens = detail::to_string(stream, closing.bracket, closing.unmunch);
    stream.set_cur(closing.bracket);
    skip(stream, ")");

    return argument_tokens;
}

// Parses a single attribute of the form
// (identifier ::)_opt identifier ( '(' some tokens ')' )_opt ..._opt
// `scope` is the scope given by an attribute using prefix, if there was one;
// it must not be combined with an explicit scope on the attribute itself.
cpp_attribute parse_attribute_token(detail::cxtoken_stream&          stream,
                                    type_safe::optional<std::string> scope)
{
    // the first name is either the attribute name or its scope
    DEBUG_ASSERT(stream.peek().kind() == CXToken_Identifier
                     || stream.peek().kind() == CXToken_Keyword,
                 detail::parse_error_handler{}, stream.cursor(), "expected identifier");
    auto name = stream.get().value().std_str();

    if (skip_if(stream, "::"))
    {
        // what was parsed so far is the scope, the actual name follows
        DEBUG_ASSERT(!scope, detail::parse_error_handler{}, stream.cursor(),
                     "attribute using + scope not allowed");
        scope = std::move(name);

        DEBUG_ASSERT(stream.peek().kind() == CXToken_Identifier
                         || stream.peek().kind() == CXToken_Keyword,
                     detail::parse_error_handler{}, stream.cursor(), "expected identifier");
        name = stream.get().value().std_str();
    }

    // optional argument list
    type_safe::optional<cpp_token_string> arguments;
    if (stream.peek() == "(")
        arguments = parse_attribute_arguments(stream);

    // optional pack expansion
    const auto is_variadic = skip_if(stream, "...");

    // scoped attributes and unknown names are stored by name, the rest by kind
    const auto kind = get_attribute_kind(name);
    if (scope || kind == cpp_attribute_kind::unknown)
        return cpp_attribute(std::move(scope), std::move(name), std::move(arguments), is_variadic);
    return cpp_attribute(kind, std::move(arguments));
}

// Tries to parse one attribute specifier at the current position of the stream
// and appends the attributes it contains to `result`.
// Supported are C++11 attributes `[[...]]`, `alignas(...)`,
// GCC/clang `__attribute__((...))` and MSVC `__declspec(...)`.
// Returns true if a specifier was parsed.
// Returns false and leaves the stream where it was if there is no specifier.
bool parse_attribute_impl(cpp_attribute_list& result, detail::cxtoken_stream& stream)
{
    // remembered so a partially matched introducer can be un-consumed again
    auto start = stream.cur();

    if (skip_if(stream, "["))
    {
        if (stream.peek() == "[")
        {
            // C++11 attribute
            // [[<attribute>]]
            //  ^
            skip(stream, "[");

            auto scope = parse_attribute_using(stream);
            while (!skip_if(stream, "]"))
            {
                auto attribute = parse_attribute_token(stream, scope);
                result.push_back(std::move(attribute));
                detail::skip_if(stream, ",");
            }

            // [[<attribute>]]
            //               ^
            skip(stream, "]");
            return true;
        }

        // a single `[` doesn't start an attribute, don't swallow it
        stream.set_cur(start);
        return false;
    }
    else if (skip_if(stream, "alignas"))
    {
        // alignas specifier
        // alignas(<some arguments>)
        //        ^
        auto arguments = parse_attribute_arguments(stream);
        result.push_back(cpp_attribute(cpp_attribute_kind::alignas_, std::move(arguments)));
        // a specifier was consumed, so report success like every other branch
        return true;
    }
    else if (skip_if(stream, "__attribute__"))
    {
        if (stream.peek() == "(")
        {
            // GCC/clang attributes
            // __attribute__((<attribute>))
            //              ^^
            skip(stream, "(");
            skip(stream, "(");

            auto scope = parse_attribute_using(stream);
            while (!skip_if(stream, ")"))
            {
                auto attribute = parse_attribute_token(stream, scope);
                result.push_back(std::move(attribute));
                detail::skip_if(stream, ",");
            }

            skip(stream, ")");
            return true;
        }

        // `__attribute__` without argument list, don't swallow it
        stream.set_cur(start);
        return false;
    }
    else if (skip_if(stream, "__declspec"))
    {
        // MSVC declspec
        // __declspec(<attribute>)
        //           ^
        skip(stream, "(");
        auto scope = parse_attribute_using(stream);
        while (!skip_if(stream, ")"))
        {
            auto attribute = parse_attribute_token(stream, scope);
            result.push_back(std::move(attribute));
            detail::skip_if(stream, ",");
        }

        return true;
    }

    return false;
}
} // namespace

// Parses all consecutive attribute specifiers at the current position of the stream.
// If `skip_anway` is set and no specifier was found, the stream is advanced by one token.
cpp_attribute_list detail::parse_attributes(detail::cxtoken_stream& stream, bool skip_anway)
{
    cpp_attribute_list attributes;

    auto parsed_any = false;
    while (parse_attribute_impl(attributes, stream))
        parsed_any = true;

    // nothing was consumed, so skip a token if the caller asked for it
    if (skip_anway && !parsed_any)
        stream.bump();

    return attributes;
}

namespace
{
// Maps a libclang token to the corresponding cpp_token_kind.
// libclang has a single literal kind, so literals are classified by their spelling:
// numeric literals start with a digit or a '.', and are floating point if they contain a '.';
// of the remaining literals, those ending in a single quote are character literals
// and everything else is a string literal.
// Comment tokens are not expected and trigger the unreachable assertion.
cpp_token_kind get_kind(const detail::cxtoken& token)
{
    switch (token.kind())
    {
    case CXToken_Punctuation:
        return cpp_token_kind::punctuation;
    case CXToken_Keyword:
        return cpp_token_kind::keyword;
    case CXToken_Identifier:
        return cpp_token_kind::identifier;

    case CXToken_Literal: {
        auto spelling = token.value().std_str();

        // std::isdigit() requires a value representable as unsigned char
        const auto first = spelling.front();
        const bool is_numeric
            = first == '.' || std::isdigit(static_cast<unsigned char>(first)) != 0;

        // only numeric literals can be floating point;
        // a character literal such as '.' contains a dot as well
        if (is_numeric && spelling.find('.') != std::string::npos)
            return cpp_token_kind::float_literal;
        else if (is_numeric)
            return cpp_token_kind::int_literal;
        else if (spelling.back() == '\'')
            return cpp_token_kind::char_literal;
        else
            return cpp_token_kind::string_literal;
    }

    case CXToken_Comment:
        break;
    }

    DEBUG_UNREACHABLE(detail::assert_handler{});
    return cpp_token_kind::punctuation;
}
} // namespace

// Converts the tokens from the current position of the stream up to, but excluding, `end`
// into a cpp_token_string; the stream is advanced to `end`.
// If `unmunch` is set, unmunch() is applied to the builder before the result is created.
cpp_token_string detail::to_string(cxtoken_stream& stream, cxtoken_iterator end, bool unmunch)
{
    cpp_token_string::builder result;

    while (stream.cur() != end)
    {
        const auto& current = stream.get();
        result.add_token(cpp_token(get_kind(current), current.c_str()));
    }

    if (unmunch)
        result.unmunch();

    return result.finish();
}

// Consumes the next token(s) of the stream and appends them to the scope name `scope`,
// if they can be part of one: an identifier, `::` or a template argument list `<...>`.
// `scope` is cleared first if the new token doesn't continue it properly,
// i.e. an identifier that doesn't follow `::`, or a `::` that directly follows another `::`.
// For any other token `scope` is cleared, nothing is consumed and false is returned.
bool detail::append_scope(detail::cxtoken_stream& stream, std::string& scope)
{
    if (stream.peek().kind() == CXToken_Identifier)
    {
        // an identifier either starts a new scope or follows a "::"
        if (!scope.empty() && scope.back() != ':')
            scope.clear();
        scope += stream.get().c_str();
        return true;
    }

    if (stream.peek() == "::")
    {
        // two "::" in a row are a mismatch
        if (!scope.empty() && scope.back() == ':')
            scope.clear();
        scope += stream.get().c_str();
        return true;
    }

    if (stream.peek() == "<")
    {
        // template arguments: append everything up to the closing bracket verbatim
        auto closing = detail::find_closing_bracket(stream);
        scope += detail::to_string(stream, closing.bracket, closing.unmunch).as_string();
        if (!detail::skip_if(stream, ">>"))
            detail::skip(stream, ">");
        scope += ">";
        return true;
    }

    // anything else ends the scope
    scope.clear();
    return false;
}