18 #include <unordered_map>
29 return (
'a' <= c && c <=
'z') || (
'A' <= c && c <=
'Z') || c ==
'_';
44 inline void error(
char *fmt, ...) {
47 vfprintf(stderr, fmt, ap);
48 fprintf(stderr,
"\n");
59 inline void error_at(
char *user_input,
char *loc,
char *fmt, ...) {
63 int pos = loc - user_input;
64 fprintf(stderr,
"%s\n", user_input);
65 fprintf(stderr,
"%*s", pos,
"");
66 fprintf(stderr,
"^ ");
67 vfprintf(stderr, fmt, ap);
68 fprintf(stderr,
"\n");
107 memcmp(token->
str, op, token->
len))
121 if (token->
kind != tok) {
152 memcmp(token->
str, op, token->
len)) {
153 char em[] =
"expected \"%s\"";
168 char em[] =
"expected a number";
171 float val = token->
val;
211 return memcmp(p, q, strlen(q)) == 0;
223 std::unordered_map<std::string, int> &var_counter) {
224 char *p = user_input;
252 if (strncmp(p,
"if", 2) == 0 && !
is_alnum(p[2])) {
258 if (strncmp(p,
"else", 4) == 0 && !
is_alnum(p[4])) {
264 if (strncmp(p,
"return", 6) == 0 && !
is_alnum(p[6])) {
271 if (strchr(
"+-*/()<>=;{}", *p)) {
277 if (isdigit(*p) || (*p ==
'.' && isdigit(p[1]))) {
280 cur->
val = strtof(p, &p);
290 char var_name[(p - q) + 1];
291 strncpy(var_name, q, (p - q));
292 var_name[p - q] =
'\0';
293 std::string var_name_s(var_name);
295 if (var_counter.find(var_name_s) == var_counter.end()) {
296 var_counter.emplace(var_name_s, (
int)var_counter.size());
300 cur->
var_id = var_counter[var_name_s];
313 char em[] =
"invalid token\n";
Definition: compiler.h:11
bool consume_tok(Token *&token, TokenKind tok)
Consumes the current token if it matches tok.
Definition: tokenizer.h:120
bool startswith(char *p, char *q)
Checks if the string p starts with the string q.
Definition: tokenizer.h:210
Token * new_token(TokenKind kind, Token *cur, char *str, int len)
Creates a new token and adds it as the next token of cur.
Definition: tokenizer.h:194
bool consume(Token *&token, char *op)
Consumes the current token if it matches op.
Definition: tokenizer.h:105
bool at_eof(Token *token)
Checks if the current token is at the end of the program.
Definition: tokenizer.h:183
void error_at(char *user_input, char *loc, char *fmt,...)
Reports an error location and exits the program.
Definition: tokenizer.h:59
float expect_number(Token *&token, char *user_input)
Ensures that the current token is a number.
Definition: tokenizer.h:166
TokenKind
Enumeration representing different token kinds.
Definition: tokenizer.h:75
@ TOKEN_NUM
Token representing integer literals.
Definition: tokenizer.h:82
@ TOKEN_ELSE
Token representing the 'else' keyword.
Definition: tokenizer.h:79
@ TOKEN_RETURN
Token representing the 'return' keyword.
Definition: tokenizer.h:77
@ TOKEN_EOF
Token representing end-of-file markers.
Definition: tokenizer.h:83
@ TOKEN_IDENT
Token representing an identifier.
Definition: tokenizer.h:81
@ TOKEN_IF
Token representing the 'if' keyword.
Definition: tokenizer.h:78
@ TOKEN_RESERVED
Keywords or punctuators.
Definition: tokenizer.h:76
@ TOKEN_FOR
Token representing the 'for' keyword.
Definition: tokenizer.h:80
Token * tokenize(char *user_input, std::unordered_map< std::string, int > &var_counter)
Tokenizes a given string and returns a linked list of tokens.
Definition: tokenizer.h:222
bool is_alnum(char c)
Checks if a character is an alphanumeric character.
Definition: tokenizer.h:37
bool is_alpha(char c)
Checks if a character is an alphabetical character or underscore.
Definition: tokenizer.h:28
void expect(Token *&token, char *user_input, char *op)
Ensures that the current token matches op.
Definition: tokenizer.h:150
Token * consume_ident(Token *&token)
Consumes the current token if it is an identifier.
Definition: tokenizer.h:135
void error(char *fmt,...)
Reports an error and exits the program.
Definition: tokenizer.h:44
char LETTER_NEQ[]
Array representing the inequality operator "!=".
Definition: parser.h:20
char LETTER_OR[]
Array representing the logical OR operator "||".
Definition: parser.h:70
char LETTER_LEQ[]
Array representing the less than or equal to operator "<=".
Definition: parser.h:30
char LETTER_EQ[]
Array representing the equality operator "==".
Definition: parser.h:15
char LETTER_GEQ[]
Array representing the greater than or equal to operator ">=".
Definition: parser.h:40
char LETTER_AND[]
Array representing the logical AND operator "&&".
Definition: parser.h:65
Structure representing a token.
Definition: tokenizer.h:89
TokenKind kind
Token kind.
Definition: tokenizer.h:90
int var_id
Variable ID.
Definition: tokenizer.h:95
char * str
Token string.
Definition: tokenizer.h:93
int len
Token length.
Definition: tokenizer.h:94
Token * next
Pointer to the next token in the sequence.
Definition: tokenizer.h:91
float val
If kind is TOKEN_NUM, its value.
Definition: tokenizer.h:92