zig/src/tokenizer.hpp
Andrew Kelley b581da41f8 remove compiler directives
* add `setFnTest`, `setFnVisible`, `setFnStaticEval`,
   `setFnNoInline` builtin functions to replace previous
   directive functionality
 * add `coldcc` and `nakedcc` as keywords which can be used as part
   of a function prototype.
 * `setDebugSafety` builtin can be used to set debug safety features
   at a per block scope level.
 * closes #169
2016-09-28 02:33:32 -04:00

174 lines
3.5 KiB
C++

/*
* Copyright (c) 2015 Andrew Kelley
*
* This file is part of zig, which is MIT licensed.
* See http://opensource.org/licenses/MIT
*/
#ifndef ZIG_TOKENIZER_HPP
#define ZIG_TOKENIZER_HPP
#include "buffer.hpp"
#include "bignum.hpp"
enum TokenId {
TokenIdEof,
TokenIdSymbol,
TokenIdKeywordFn,
TokenIdKeywordReturn,
TokenIdKeywordVar,
TokenIdKeywordConst,
TokenIdKeywordExtern,
TokenIdKeywordPub,
TokenIdKeywordUse,
TokenIdKeywordExport,
TokenIdKeywordTrue,
TokenIdKeywordFalse,
TokenIdKeywordIf,
TokenIdKeywordElse,
TokenIdKeywordGoto,
TokenIdKeywordAsm,
TokenIdKeywordVolatile,
TokenIdKeywordStruct,
TokenIdKeywordEnum,
TokenIdKeywordUnion,
TokenIdKeywordWhile,
TokenIdKeywordFor,
TokenIdKeywordContinue,
TokenIdKeywordBreak,
TokenIdKeywordNull,
TokenIdKeywordNoAlias,
TokenIdKeywordSwitch,
TokenIdKeywordUndefined,
TokenIdKeywordZeroes,
TokenIdKeywordError,
TokenIdKeywordType,
TokenIdKeywordInline,
TokenIdKeywordDefer,
TokenIdKeywordThis,
TokenIdKeywordColdCC,
TokenIdKeywordNakedCC,
TokenIdLParen,
TokenIdRParen,
TokenIdComma,
TokenIdStar,
TokenIdStarStar,
TokenIdLBrace,
TokenIdRBrace,
TokenIdLBracket,
TokenIdRBracket,
TokenIdStringLiteral,
TokenIdCharLiteral,
TokenIdSemicolon,
TokenIdNumberLiteral,
TokenIdPlus,
TokenIdPlusPlus,
TokenIdColon,
TokenIdArrow,
TokenIdFatArrow,
TokenIdDash,
TokenIdNumberSign,
TokenIdBoolOr,
TokenIdBoolAnd,
TokenIdBinOr,
TokenIdAmpersand,
TokenIdBinXor,
TokenIdEq,
TokenIdTimesEq,
TokenIdTimesPercent,
TokenIdTimesPercentEq,
TokenIdDivEq,
TokenIdModEq,
TokenIdPlusEq,
TokenIdPlusPercent,
TokenIdPlusPercentEq,
TokenIdMinusEq,
TokenIdMinusPercent,
TokenIdMinusPercentEq,
TokenIdBitShiftLeftEq,
TokenIdBitShiftLeftPercent,
TokenIdBitShiftLeftPercentEq,
TokenIdBitShiftRightEq,
TokenIdBitAndEq,
TokenIdBitXorEq,
TokenIdBitOrEq,
TokenIdBoolAndEq,
TokenIdBoolOrEq,
TokenIdCmpEq,
TokenIdBang,
TokenIdTilde,
TokenIdCmpNotEq,
TokenIdCmpLessThan,
TokenIdCmpGreaterThan,
TokenIdCmpLessOrEq,
TokenIdCmpGreaterOrEq,
TokenIdBitShiftLeft,
TokenIdBitShiftRight,
TokenIdSlash,
TokenIdPercent,
TokenIdPercentPercent,
TokenIdDot,
TokenIdEllipsis,
TokenIdMaybe,
TokenIdDoubleQuestion,
TokenIdMaybeAssign,
TokenIdAtSign,
TokenIdPercentDot,
};
struct TokenNumLit {
BigNum bignum;
// overflow is true if when parsing the number, we discovered it would not
// fit without losing data in a uint64_t or double
bool overflow;
};
struct TokenStrLit {
Buf str;
bool is_c_str;
};
struct TokenCharLit {
uint8_t c;
};
struct Token {
TokenId id;
size_t start_pos;
size_t end_pos;
size_t start_line;
size_t start_column;
union {
// TokenIdNumberLiteral
TokenNumLit num_lit;
// TokenIdStringLiteral or TokenIdSymbol
TokenStrLit str_lit;
// TokenIdCharLiteral
TokenCharLit char_lit;
} data;
};
struct Tokenization {
ZigList<Token> *tokens;
ZigList<size_t> *line_offsets;
// if an error occurred
Buf *err;
size_t err_line;
size_t err_column;
};
void tokenize(Buf *buf, Tokenization *out_tokenization);
void print_tokens(Buf *buf, ZigList<Token> *tokens);
const char * token_name(TokenId id);
bool valid_symbol_starter(uint8_t c);
bool is_zig_keyword(Buf *buf);
#endif