chibicc/chibicc.h

188 lines
3.6 KiB
C
Raw Normal View History

2020-10-07 14:12:19 +03:00
#define _POSIX_C_SOURCE 200809L
2020-10-07 14:11:16 +03:00
#include <assert.h>
#include <ctype.h>
#include <stdarg.h>
#include <stdbool.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
2020-09-04 07:39:06 +03:00
typedef struct Type Type;
2020-10-07 14:12:19 +03:00
typedef struct Node Node;
2020-10-08 08:30:04 +03:00
//
// strings.c
//
char *format(char *fmt, ...);
2020-10-07 14:11:16 +03:00
//
// tokenize.c
//
2020-10-07 14:12:19 +03:00
// Token
2020-10-07 14:11:16 +03:00
typedef enum {
2020-10-07 14:12:57 +03:00
TK_IDENT, // Identifiers
TK_PUNCT, // Punctuators
TK_KEYWORD, // Keywords
2020-10-07 06:49:08 +03:00
TK_STR, // String literals
2020-10-07 14:12:57 +03:00
TK_NUM, // Numeric literals
TK_EOF, // End-of-file markers
2020-10-07 14:11:16 +03:00
} TokenKind;
// Token type
typedef struct Token Token;
struct Token {
TokenKind kind; // Token kind
Token *next; // Next token
int val; // If kind is TK_NUM, its value
char *loc; // Token location
int len; // Token length
2020-10-07 06:49:08 +03:00
Type *ty; // Used if TK_STR
char *str; // String literal contents including terminating '\0'
2020-10-07 14:11:16 +03:00
};
void error(char *fmt, ...);
void error_at(char *loc, char *fmt, ...);
void error_tok(Token *tok, char *fmt, ...);
bool equal(Token *tok, char *op);
Token *skip(Token *tok, char *op);
bool consume(Token **rest, Token *tok, char *str);
2020-10-07 14:11:16 +03:00
Token *tokenize(char *input);
//
// parse.c
//
// Variable or function
2020-10-07 14:12:19 +03:00
typedef struct Obj Obj;
struct Obj {
Obj *next;
char *name; // Variable name
Type *ty; // Type
bool is_local; // local or global/function
2020-10-07 14:12:19 +03:00
// Local variable
int offset;
// Global variable or function
bool is_function;
2020-10-07 06:49:08 +03:00
// Global variable
char *init_data;
// Function
Obj *params;
2020-10-07 14:12:19 +03:00
Node *body;
Obj *locals;
int stack_size;
};
// AST node
2020-10-07 14:11:16 +03:00
typedef enum {
ND_ADD, // +
ND_SUB, // -
ND_MUL, // *
ND_DIV, // /
ND_NEG, // unary -
ND_EQ, // ==
ND_NE, // !=
ND_LT, // <
ND_LE, // <=
2020-09-26 02:59:56 +03:00
ND_ASSIGN, // =
2019-08-05 15:12:44 +03:00
ND_ADDR, // unary &
ND_DEREF, // unary *
2020-10-07 14:12:57 +03:00
ND_RETURN, // "return"
2020-10-07 06:47:09 +03:00
ND_IF, // "if"
2019-08-04 11:24:03 +03:00
ND_FOR, // "for" or "while"
2020-09-04 07:38:41 +03:00
ND_BLOCK, // { ... }
2019-08-04 12:25:20 +03:00
ND_FUNCALL, // Function call
ND_EXPR_STMT, // Expression statement
2020-09-26 02:59:56 +03:00
ND_VAR, // Variable
ND_NUM, // Integer
2020-10-07 14:11:16 +03:00
} NodeKind;
// AST node type
struct Node {
NodeKind kind; // Node kind
Node *next; // Next node
2020-09-04 07:39:06 +03:00
Type *ty; // Type, e.g. int or pointer to int
Token *tok; // Representative token
2020-10-07 06:47:09 +03:00
2020-10-07 14:11:16 +03:00
Node *lhs; // Left-hand side
Node *rhs; // Right-hand side
2020-09-04 07:38:41 +03:00
2019-08-04 11:35:53 +03:00
// "if" or "for" statement
2020-10-07 06:47:09 +03:00
Node *cond;
Node *then;
Node *els;
2019-08-04 11:35:53 +03:00
Node *init;
Node *inc;
2020-10-07 06:47:09 +03:00
2020-09-04 07:38:41 +03:00
// Block
Node *body;
2019-08-04 12:25:20 +03:00
// Function call
char *funcname;
Node *args;
2019-08-04 12:25:20 +03:00
2020-10-07 14:12:19 +03:00
Obj *var; // Used if kind == ND_VAR
2020-10-07 14:11:16 +03:00
int val; // Used if kind == ND_NUM
};
Obj *parse(Token *tok);
2020-10-07 14:11:16 +03:00
2020-09-04 07:39:06 +03:00
//
// type.c
//
typedef enum {
2020-08-27 15:04:17 +03:00
TY_CHAR,
2020-09-04 07:39:06 +03:00
TY_INT,
TY_PTR,
2020-09-04 13:01:33 +03:00
TY_FUNC,
2020-09-26 04:15:32 +03:00
TY_ARRAY,
2020-09-04 07:39:06 +03:00
} TypeKind;
struct Type {
TypeKind kind;
2020-09-26 04:15:32 +03:00
int size; // sizeof() value
// Pointer-to or array-of type. We intentionally use the same member
// to represent pointer/array duality in C.
//
// In many contexts in which a pointer is expected, we examine this
// member instead of "kind" member to determine whether a type is a
// pointer or not. That means in many contexts "array of T" is
// naturally handled as if it were "pointer to T", as required by
// the C spec.
2020-09-04 07:39:06 +03:00
Type *base;
// Declaration
Token *name;
2020-09-04 13:01:33 +03:00
2020-09-26 04:15:32 +03:00
// Array
int array_len;
2020-09-04 13:01:33 +03:00
// Function type
Type *return_ty;
Type *params;
Type *next;
2020-09-04 07:39:06 +03:00
};
2020-08-27 15:04:17 +03:00
extern Type *ty_char;
2020-09-04 07:39:06 +03:00
extern Type *ty_int;
bool is_integer(Type *ty);
Type *copy_type(Type *ty);
Type *pointer_to(Type *base);
2020-09-04 13:01:33 +03:00
Type *func_type(Type *return_ty);
2020-09-26 04:15:32 +03:00
Type *array_of(Type *base, int size);
2020-09-04 07:39:06 +03:00
void add_type(Node *node);
2020-10-07 14:11:16 +03:00
//
// codegen.c
//
void codegen(Obj *prog);