@@ -1,441 +1,15 @@ | |||
/* Copyright (C) 2014-2015 Ben Kurtovic <ben.kurtovic@gmail.com> | |||
Released under the terms of the MIT License. See LICENSE for details. */ | |||
#include <libgen.h> | |||
#include <limits.h> | |||
#include <stdlib.h> | |||
#include <string.h> | |||
#include "assembler.h" | |||
#include "assembler/errors.h" | |||
#include "assembler/io.h" | |||
#include "assembler/preprocessor.h" | |||
#include "assembler/state.h" | |||
#include "logging.h" | |||
#define DIRECTIVE_MARKER '.' | |||
#define DIR_INCLUDE ".include" | |||
#define DIR_ORIGIN ".org" | |||
#define DIR_OPTIMIZER ".optimizer" | |||
#define DIR_ROM_SIZE ".rom_size" | |||
#define DIR_ROM_HEADER ".rom_header" | |||
#define DIR_ROM_CHECKSUM ".rom_checksum" | |||
#define DIR_ROM_PRODUCT ".rom_product" | |||
#define DIR_ROM_VERSION ".rom_version" | |||
#define DIR_ROM_REGION ".rom_region" | |||
#define DIR_ROM_DECLSIZE ".rom_declsize" | |||
#define DIRECTIVE_HAS_ARG(line, d) ((line)->length > strlen(d)) | |||
#define IS_DIRECTIVE(line, d) \ | |||
(((line)->length >= strlen(d)) && \ | |||
!strncmp((line)->data, d, strlen(d)) && \ | |||
(!DIRECTIVE_HAS_ARG(line, d) || (line)->data[strlen(d)] == ' ')) | |||
#define DIRECTIVE_OFFSET(line, d) \ | |||
(DIRECTIVE_HAS_ARG(line, d) ? strlen(d) : 0) | |||
/* | |||
Preprocess a single source line (source, length) into a normalized ASMLine. | |||
*Only* the data and length fields in the ASMLine object are populated. The | |||
normalization process converts tabs to spaces, lowercases all alphabetical | |||
characters, and removes runs of multiple spaces (outside of string | |||
literals), strips comments, and other things. | |||
Return NULL if an ASM line was not generated from the source, i.e. if it is | |||
blank after being stripped. | |||
*/ | |||
static ASMLine* normalize_line(const char *source, size_t length) | |||
{ | |||
char *data = malloc(sizeof(char) * length); | |||
if (!data) | |||
OUT_OF_MEMORY() | |||
size_t si, di, slashes = 0; | |||
bool has_content = false, space_pending = false, in_string = false; | |||
for (si = di = 0; si < length; si++) { | |||
char c = source[si]; | |||
if (c == '\\') | |||
slashes++; | |||
else | |||
slashes = 0; | |||
if (in_string) { | |||
if (c == '"' && (slashes % 2) == 0) | |||
in_string = false; | |||
data[di++] = c; | |||
} else { | |||
if (c == ';') | |||
break; | |||
if (c == '"' && (slashes % 2) == 0) | |||
in_string = true; | |||
if (c >= 'A' && c <= 'Z') | |||
c += 'a' - 'A'; | |||
if (c == ' ' || c == '\t') | |||
space_pending = true; | |||
else { | |||
if (space_pending) { | |||
if (has_content) | |||
data[di++] = ' '; | |||
space_pending = false; | |||
} | |||
has_content = true; | |||
data[di++] = c; | |||
} | |||
} | |||
} | |||
if (!has_content) { | |||
free(data); | |||
return NULL; | |||
} | |||
ASMLine *line = malloc(sizeof(ASMLine)); | |||
if (!line) | |||
OUT_OF_MEMORY() | |||
data = realloc(data, sizeof(char) * di); | |||
if (!data) | |||
OUT_OF_MEMORY() | |||
line->data = data; | |||
line->length = di; | |||
return line; | |||
} | |||
/* | |||
Read and return the target path from an include directive. | |||
This function allocates a buffer to store the filename; it must be free()'d | |||
after calling read_source_file(). If a syntax error occurs while trying to | |||
read the path, it returns NULL. | |||
*/ | |||
char* read_include_path(const ASMLine *line) | |||
{ | |||
size_t maxlen = strlen(line->filename) + line->length, i, start, slashes; | |||
if (maxlen >= INT_MAX) // Allows us to safely downcast to int later | |||
return NULL; | |||
char *path = malloc(sizeof(char) * maxlen); | |||
if (!path) | |||
OUT_OF_MEMORY() | |||
if (!(i = DIRECTIVE_OFFSET(line, DIR_INCLUDE))) | |||
goto error; | |||
if (line->length - i <= 4) // Not long enough to hold a non-zero argument | |||
goto error; | |||
if (line->data[i++] != ' ' || line->data[i++] != '"') | |||
goto error; | |||
// TODO: parse escaped characters properly | |||
for (start = i, slashes = 0; i < line->length; i++) { | |||
if (line->data[i] == '"' && (slashes % 2) == 0) | |||
break; | |||
if (line->data[i] == '\\') | |||
slashes++; | |||
else | |||
slashes = 0; | |||
} | |||
if (i != line->length - 1) // Junk present after closing quote | |||
goto error; | |||
char *dup = strdup(line->filename); | |||
if (!dup) | |||
OUT_OF_MEMORY() | |||
// TODO: should normalize filenames in some way to prevent accidental dupes | |||
snprintf(path, maxlen, "%s/%.*s", dirname(dup), (int) (i - start), | |||
line->data + start); | |||
free(dup); | |||
return path; | |||
error: | |||
free(path); | |||
return NULL; | |||
} | |||
/* | |||
Return whether the given path has already been loaded. | |||
*/ | |||
static bool path_has_been_loaded( | |||
const char *path, const LineBuffer *root, const ASMInclude *include) | |||
{ | |||
if (!strcmp(path, root->filename)) | |||
return true; | |||
while (include) { | |||
if (!strcmp(path, include->lines->filename)) | |||
return true; | |||
include = include->next; | |||
} | |||
return false; | |||
} | |||
/* | |||
Build a LineBuffer into a ASMLines, normalizing them along the way. | |||
This function operates recursively to handle includes, but handles no other | |||
preprocessor directives. | |||
On success, NULL is returned; *head points to the head of the new ASMLine | |||
list, and *tail to its tail (assuming it is non-NULL). On error, an | |||
ErrorInfo object is returned, and *head and *tail are not modified. | |||
*includes may be updated in either case. | |||
*/ | |||
static ErrorInfo* build_asm_lines( | |||
const LineBuffer *root, const LineBuffer *source, ASMLine **head, | |||
ASMLine **tail, ASMInclude **includes) | |||
{ | |||
ASMLine dummy = {.next = NULL}; | |||
ASMLine *line, *prev = &dummy; | |||
const Line *orig, *next_orig = source->lines; | |||
while ((orig = next_orig)) { | |||
line = normalize_line(orig->data, orig->length); | |||
next_orig = orig->next; | |||
if (!line) | |||
continue; | |||
// Populate ASMLine fields not set by normalize_line(): | |||
line->original = orig; | |||
line->filename = source->filename; | |||
line->next = NULL; | |||
if (IS_DIRECTIVE(line, DIR_INCLUDE)) { | |||
ErrorInfo *ei; | |||
char *path = read_include_path(line); | |||
if (!path) { | |||
ei = error_info_create(line, ET_INCLUDE, ED_INC_BAD_ARG); | |||
asm_lines_free(line); | |||
asm_lines_free(dummy.next); | |||
return ei; | |||
} | |||
if (path_has_been_loaded(path, root, *includes)) { | |||
ei = error_info_create(line, ET_INCLUDE, ED_INC_RECURSION); | |||
asm_lines_free(line); | |||
asm_lines_free(dummy.next); | |||
free(path); | |||
return ei; | |||
} | |||
DEBUG("- reading included file: %s", path) | |||
LineBuffer *incbuffer = read_source_file(path, false); | |||
free(path); | |||
if (!incbuffer) { | |||
ei = error_info_create(line, ET_INCLUDE, ED_INC_FILE_READ); | |||
asm_lines_free(line); | |||
asm_lines_free(dummy.next); | |||
return ei; | |||
} | |||
ASMInclude *include = malloc(sizeof(ASMInclude)); | |||
if (!include) | |||
OUT_OF_MEMORY() | |||
include->lines = incbuffer; | |||
include->next = *includes; | |||
*includes = include; | |||
ASMLine *inchead, *inctail; | |||
if ((ei = build_asm_lines(root, incbuffer, &inchead, &inctail, | |||
includes))) { | |||
error_info_append(ei, line); | |||
asm_lines_free(line); | |||
asm_lines_free(dummy.next); | |||
return ei; | |||
} | |||
prev->next = inchead; | |||
prev = inctail; | |||
asm_lines_free(line); // Destroy only the .include line | |||
} | |||
else { | |||
prev->next = line; | |||
prev = line; | |||
} | |||
} | |||
*head = dummy.next; | |||
if (tail) | |||
*tail = prev; | |||
return NULL; | |||
} | |||
/* | |||
Read in a boolean argument from the given line and store it in *result. | |||
auto_val is used if the argument's value is "auto". Return true on success | |||
and false on failure; in the latter case, *result is not modified. | |||
*/ | |||
static inline bool read_bool_argument( | |||
bool *result, const ASMLine *line, const char *directive, bool auto_val) | |||
{ | |||
const char *arg = line->data + (DIRECTIVE_OFFSET(line, directive) + 1); | |||
ssize_t len = line->length - (DIRECTIVE_OFFSET(line, directive) + 1); | |||
if (len <= 0 || len > 5) | |||
return false; | |||
switch (len) { | |||
case 1: // 0, 1 | |||
if (*arg == '0' || *arg == '1') | |||
return (*result = *arg - '0'), true; | |||
return false; | |||
case 2: // on | |||
if (!strncmp(arg, "on", 2)) | |||
return (*result = true), true; | |||
return false; | |||
case 3: // off | |||
if (!strncmp(arg, "off", 3)) | |||
return (*result = false), true; | |||
return false; | |||
case 4: // true, auto | |||
if (!strncmp(arg, "true", 4)) | |||
return (*result = true), true; | |||
if (!strncmp(arg, "auto", 4)) | |||
return (*result = auto_val), true; | |||
return false; | |||
case 5: // false | |||
if (!strncmp(arg, "false", 5)) | |||
return (*result = false), true; | |||
return false; | |||
} | |||
return false; | |||
} | |||
/* | |||
Preprocess the LineBuffer into ASMLines. Change some state along the way. | |||
This function processes include directives, so read_source_file() may be | |||
called multiple times (along with the implications that has), and | |||
state->includes may be modified. | |||
On success, NULL is returned. On error, an ErrorInfo object is returned. | |||
state->lines and state->includes may still be modified. | |||
*/ | |||
static ErrorInfo* preprocess(AssemblerState *state, const LineBuffer *source) | |||
{ | |||
// state->header.offset <-- check in list of acceptable values | |||
// state->header.product_code <-- range check | |||
// state->header.version <-- range check | |||
// state->header.region <-- string conversion, check | |||
// state->header.rom_size <-- value/range check | |||
// state->rom_size <-- value check | |||
// if giving rom size, check header offset is in rom size range | |||
// if giving reported and actual rom size, check reported is <= actual | |||
#define CATCH_DUPES(line, first, oldval, newval) \ | |||
if (first && oldval != newval) { \ | |||
ei = error_info_create(line, ET_PREPROC, ED_PP_DUPLICATE); \ | |||
error_info_append(ei, first); \ | |||
asm_lines_free(condemned); \ | |||
return ei; \ | |||
} \ | |||
oldval = newval; \ | |||
first = line; | |||
#define REQUIRE_ARG(line, d) \ | |||
if (!DIRECTIVE_HAS_ARG(line, d)) { \ | |||
asm_lines_free(condemned); \ | |||
return error_info_create(line, ET_PREPROC, ED_PP_NO_ARG); \ | |||
} | |||
#define VALIDATE(retval) \ | |||
if (!(retval)) { \ | |||
asm_lines_free(condemned); \ | |||
return error_info_create(line, ET_PREPROC, ED_PP_BAD_ARG); \ | |||
} | |||
DEBUG("Running preprocessor:") | |||
ErrorInfo* ei; | |||
if ((ei = build_asm_lines(source, source, &state->lines, NULL, | |||
&state->includes))) | |||
return ei; | |||
ASMLine dummy = {.next = state->lines}; | |||
ASMLine *prev, *line = &dummy, *next = state->lines, *condemned = NULL; | |||
const ASMLine *first_optimizer = NULL, *first_checksum = NULL; | |||
while ((prev = line, line = next)) { | |||
next = line->next; | |||
if (line->data[0] == DIRECTIVE_MARKER) { | |||
if (IS_DIRECTIVE(line, DIR_ORIGIN)) | |||
continue; // Origins are handled by tokenizer | |||
DEBUG("- handling directive: %.*s", (int) line->length, line->data) | |||
if (IS_DIRECTIVE(line, DIR_OPTIMIZER)) { | |||
REQUIRE_ARG(line, DIR_OPTIMIZER) | |||
bool arg; | |||
VALIDATE(read_bool_argument(&arg, line, DIR_OPTIMIZER, false)) | |||
CATCH_DUPES(line, first_optimizer, state->optimizer, arg) | |||
} | |||
else if (IS_DIRECTIVE(line, DIR_ROM_SIZE)) { | |||
// TODO | |||
} | |||
else if (IS_DIRECTIVE(line, DIR_ROM_HEADER)) { | |||
// TODO | |||
} | |||
else if (IS_DIRECTIVE(line, DIR_ROM_CHECKSUM)) { | |||
REQUIRE_ARG(line, DIR_ROM_CHECKSUM) | |||
bool arg; | |||
VALIDATE(read_bool_argument(&arg, line, DIR_ROM_CHECKSUM, true)) | |||
CATCH_DUPES(line, first_checksum, state->header.checksum, arg) | |||
} | |||
else if (IS_DIRECTIVE(line, DIR_ROM_PRODUCT)) { | |||
// TODO | |||
} | |||
else if (IS_DIRECTIVE(line, DIR_ROM_VERSION)) { | |||
// TODO | |||
} | |||
else if (IS_DIRECTIVE(line, DIR_ROM_REGION)) { | |||
// TODO | |||
} | |||
else if (IS_DIRECTIVE(line, DIR_ROM_DECLSIZE)) { | |||
// TODO | |||
} | |||
else { | |||
asm_lines_free(condemned); | |||
return error_info_create(line, ET_PREPROC, ED_PP_UNKNOWN); | |||
} | |||
// Remove directive from lines, and schedule it for deletion: | |||
line->next = condemned; | |||
condemned = line; | |||
prev->next = next; | |||
line = prev; | |||
} | |||
} | |||
state->rom_size = 8; // TODO | |||
asm_lines_free(condemned); | |||
state->lines = dummy.next; // Fix list head if first line was a directive | |||
#ifdef DEBUG_MODE | |||
DEBUG("Dumping ASMLines:") | |||
const ASMLine *temp = state->lines; | |||
while (temp) { | |||
DEBUG("- %-40.*s [%s:%02zu]", (int) temp->length, temp->data, | |||
temp->filename, temp->original->lineno) | |||
temp = temp->next; | |||
} | |||
#endif | |||
return NULL; | |||
#undef VALIDATE | |||
#undef REQUIRE_ARG | |||
#undef CATCH_DUPES | |||
} | |||
/* | |||
Tokenize ASMLines into ASMInstructions. | |||
@@ -0,0 +1,437 @@ | |||
/* Copyright (C) 2014-2015 Ben Kurtovic <ben.kurtovic@gmail.com> | |||
Released under the terms of the MIT License. See LICENSE for details. */ | |||
#include <libgen.h> | |||
#include <limits.h> | |||
#include <stdio.h> | |||
#include <stdlib.h> | |||
#include <string.h> | |||
#include "preprocessor.h" | |||
#include "errors.h" | |||
#include "io.h" | |||
#include "../logging.h" | |||
#define DIRECTIVE_MARKER '.' | |||
#define DIR_INCLUDE ".include" | |||
#define DIR_ORIGIN ".org" | |||
#define DIR_OPTIMIZER ".optimizer" | |||
#define DIR_ROM_SIZE ".rom_size" | |||
#define DIR_ROM_HEADER ".rom_header" | |||
#define DIR_ROM_CHECKSUM ".rom_checksum" | |||
#define DIR_ROM_PRODUCT ".rom_product" | |||
#define DIR_ROM_VERSION ".rom_version" | |||
#define DIR_ROM_REGION ".rom_region" | |||
#define DIR_ROM_DECLSIZE ".rom_declsize" | |||
#define DIRECTIVE_HAS_ARG(line, d) ((line)->length > strlen(d)) | |||
#define IS_DIRECTIVE(line, d) \ | |||
(((line)->length >= strlen(d)) && \ | |||
!strncmp((line)->data, d, strlen(d)) && \ | |||
(!DIRECTIVE_HAS_ARG(line, d) || (line)->data[strlen(d)] == ' ')) | |||
#define DIRECTIVE_OFFSET(line, d) \ | |||
(DIRECTIVE_HAS_ARG(line, d) ? strlen(d) : 0) | |||
/* | |||
Preprocess a single source line (source, length) into a normalized ASMLine. | |||
*Only* the data and length fields in the ASMLine object are populated. The | |||
normalization process converts tabs to spaces, lowercases all alphabetical | |||
characters, and removes runs of multiple spaces (outside of string | |||
literals), strips comments, and other things. | |||
Return NULL if an ASM line was not generated from the source, i.e. if it is | |||
blank after being stripped. | |||
*/ | |||
static ASMLine* normalize_line(const char *source, size_t length) | |||
{ | |||
char *data = malloc(sizeof(char) * length); | |||
if (!data) | |||
OUT_OF_MEMORY() | |||
size_t si, di, slashes = 0; | |||
bool has_content = false, space_pending = false, in_string = false; | |||
for (si = di = 0; si < length; si++) { | |||
char c = source[si]; | |||
if (c == '\\') | |||
slashes++; | |||
else | |||
slashes = 0; | |||
if (in_string) { | |||
if (c == '"' && (slashes % 2) == 0) | |||
in_string = false; | |||
data[di++] = c; | |||
} else { | |||
if (c == ';') | |||
break; | |||
if (c == '"' && (slashes % 2) == 0) | |||
in_string = true; | |||
if (c >= 'A' && c <= 'Z') | |||
c += 'a' - 'A'; | |||
if (c == ' ' || c == '\t') | |||
space_pending = true; | |||
else { | |||
if (space_pending) { | |||
if (has_content) | |||
data[di++] = ' '; | |||
space_pending = false; | |||
} | |||
has_content = true; | |||
data[di++] = c; | |||
} | |||
} | |||
} | |||
if (!has_content) { | |||
free(data); | |||
return NULL; | |||
} | |||
ASMLine *line = malloc(sizeof(ASMLine)); | |||
if (!line) | |||
OUT_OF_MEMORY() | |||
data = realloc(data, sizeof(char) * di); | |||
if (!data) | |||
OUT_OF_MEMORY() | |||
line->data = data; | |||
line->length = di; | |||
return line; | |||
} | |||
/* | |||
Read and return the target path from an include directive. | |||
This function allocates a buffer to store the filename; it must be free()'d | |||
after calling read_source_file(). If a syntax error occurs while trying to | |||
read the path, it returns NULL. | |||
*/ | |||
char* read_include_path(const ASMLine *line) | |||
{ | |||
size_t maxlen = strlen(line->filename) + line->length, i, start, slashes; | |||
if (maxlen >= INT_MAX) // Allows us to safely downcast to int later | |||
return NULL; | |||
char *path = malloc(sizeof(char) * maxlen); | |||
if (!path) | |||
OUT_OF_MEMORY() | |||
if (!(i = DIRECTIVE_OFFSET(line, DIR_INCLUDE))) | |||
goto error; | |||
if (line->length - i <= 4) // Not long enough to hold a non-zero argument | |||
goto error; | |||
if (line->data[i++] != ' ' || line->data[i++] != '"') | |||
goto error; | |||
// TODO: parse escaped characters properly | |||
for (start = i, slashes = 0; i < line->length; i++) { | |||
if (line->data[i] == '"' && (slashes % 2) == 0) | |||
break; | |||
if (line->data[i] == '\\') | |||
slashes++; | |||
else | |||
slashes = 0; | |||
} | |||
if (i != line->length - 1) // Junk present after closing quote | |||
goto error; | |||
char *dup = strdup(line->filename); | |||
if (!dup) | |||
OUT_OF_MEMORY() | |||
// TODO: should normalize filenames in some way to prevent accidental dupes | |||
snprintf(path, maxlen, "%s/%.*s", dirname(dup), (int) (i - start), | |||
line->data + start); | |||
free(dup); | |||
return path; | |||
error: | |||
free(path); | |||
return NULL; | |||
} | |||
/* | |||
Return whether the given path has already been loaded. | |||
*/ | |||
static bool path_has_been_loaded( | |||
const char *path, const LineBuffer *root, const ASMInclude *include) | |||
{ | |||
if (!strcmp(path, root->filename)) | |||
return true; | |||
while (include) { | |||
if (!strcmp(path, include->lines->filename)) | |||
return true; | |||
include = include->next; | |||
} | |||
return false; | |||
} | |||
/* | |||
Build a LineBuffer into a ASMLines, normalizing them along the way. | |||
This function operates recursively to handle includes, but handles no other | |||
preprocessor directives. | |||
On success, NULL is returned; *head points to the head of the new ASMLine | |||
list, and *tail to its tail (assuming it is non-NULL). On error, an | |||
ErrorInfo object is returned, and *head and *tail are not modified. | |||
*includes may be updated in either case. | |||
*/ | |||
static ErrorInfo* build_asm_lines( | |||
const LineBuffer *root, const LineBuffer *source, ASMLine **head, | |||
ASMLine **tail, ASMInclude **includes) | |||
{ | |||
ASMLine dummy = {.next = NULL}; | |||
ASMLine *line, *prev = &dummy; | |||
const Line *orig, *next_orig = source->lines; | |||
while ((orig = next_orig)) { | |||
line = normalize_line(orig->data, orig->length); | |||
next_orig = orig->next; | |||
if (!line) | |||
continue; | |||
// Populate ASMLine fields not set by normalize_line(): | |||
line->original = orig; | |||
line->filename = source->filename; | |||
line->next = NULL; | |||
if (IS_DIRECTIVE(line, DIR_INCLUDE)) { | |||
ErrorInfo *ei; | |||
char *path = read_include_path(line); | |||
if (!path) { | |||
ei = error_info_create(line, ET_INCLUDE, ED_INC_BAD_ARG); | |||
asm_lines_free(line); | |||
asm_lines_free(dummy.next); | |||
return ei; | |||
} | |||
if (path_has_been_loaded(path, root, *includes)) { | |||
ei = error_info_create(line, ET_INCLUDE, ED_INC_RECURSION); | |||
asm_lines_free(line); | |||
asm_lines_free(dummy.next); | |||
free(path); | |||
return ei; | |||
} | |||
DEBUG("- reading included file: %s", path) | |||
LineBuffer *incbuffer = read_source_file(path, false); | |||
free(path); | |||
if (!incbuffer) { | |||
ei = error_info_create(line, ET_INCLUDE, ED_INC_FILE_READ); | |||
asm_lines_free(line); | |||
asm_lines_free(dummy.next); | |||
return ei; | |||
} | |||
ASMInclude *include = malloc(sizeof(ASMInclude)); | |||
if (!include) | |||
OUT_OF_MEMORY() | |||
include->lines = incbuffer; | |||
include->next = *includes; | |||
*includes = include; | |||
ASMLine *inchead, *inctail; | |||
if ((ei = build_asm_lines(root, incbuffer, &inchead, &inctail, | |||
includes))) { | |||
error_info_append(ei, line); | |||
asm_lines_free(line); | |||
asm_lines_free(dummy.next); | |||
return ei; | |||
} | |||
prev->next = inchead; | |||
prev = inctail; | |||
asm_lines_free(line); // Destroy only the .include line | |||
} | |||
else { | |||
prev->next = line; | |||
prev = line; | |||
} | |||
} | |||
*head = dummy.next; | |||
if (tail) | |||
*tail = prev; | |||
return NULL; | |||
} | |||
/* | |||
Read in a boolean argument from the given line and store it in *result. | |||
auto_val is used if the argument's value is "auto". Return true on success | |||
and false on failure; in the latter case, *result is not modified. | |||
*/ | |||
static inline bool read_bool_argument( | |||
bool *result, const ASMLine *line, const char *directive, bool auto_val) | |||
{ | |||
const char *arg = line->data + (DIRECTIVE_OFFSET(line, directive) + 1); | |||
ssize_t len = line->length - (DIRECTIVE_OFFSET(line, directive) + 1); | |||
if (len <= 0 || len > 5) | |||
return false; | |||
switch (len) { | |||
case 1: // 0, 1 | |||
if (*arg == '0' || *arg == '1') | |||
return (*result = *arg - '0'), true; | |||
return false; | |||
case 2: // on | |||
if (!strncmp(arg, "on", 2)) | |||
return (*result = true), true; | |||
return false; | |||
case 3: // off | |||
if (!strncmp(arg, "off", 3)) | |||
return (*result = false), true; | |||
return false; | |||
case 4: // true, auto | |||
if (!strncmp(arg, "true", 4)) | |||
return (*result = true), true; | |||
if (!strncmp(arg, "auto", 4)) | |||
return (*result = auto_val), true; | |||
return false; | |||
case 5: // false | |||
if (!strncmp(arg, "false", 5)) | |||
return (*result = false), true; | |||
return false; | |||
} | |||
return false; | |||
} | |||
/* | |||
Preprocess the LineBuffer into ASMLines. Change some state along the way. | |||
This function processes include directives, so read_source_file() may be | |||
called multiple times (along with the implications that has), and | |||
state->includes may be modified. | |||
On success, NULL is returned. On error, an ErrorInfo object is returned. | |||
state->lines and state->includes may still be modified. | |||
*/ | |||
ErrorInfo* preprocess(AssemblerState *state, const LineBuffer *source) | |||
{ | |||
// state->header.offset <-- check in list of acceptable values | |||
// state->header.product_code <-- range check | |||
// state->header.version <-- range check | |||
// state->header.region <-- string conversion, check | |||
// state->header.rom_size <-- value/range check | |||
// state->rom_size <-- value check | |||
// if giving rom size, check header offset is in rom size range | |||
// if giving reported and actual rom size, check reported is <= actual | |||
#define CATCH_DUPES(line, first, oldval, newval) \ | |||
if (first && oldval != newval) { \ | |||
ei = error_info_create(line, ET_PREPROC, ED_PP_DUPLICATE); \ | |||
error_info_append(ei, first); \ | |||
asm_lines_free(condemned); \ | |||
return ei; \ | |||
} \ | |||
oldval = newval; \ | |||
first = line; | |||
#define REQUIRE_ARG(line, d) \ | |||
if (!DIRECTIVE_HAS_ARG(line, d)) { \ | |||
asm_lines_free(condemned); \ | |||
return error_info_create(line, ET_PREPROC, ED_PP_NO_ARG); \ | |||
} | |||
#define VALIDATE(retval) \ | |||
if (!(retval)) { \ | |||
asm_lines_free(condemned); \ | |||
return error_info_create(line, ET_PREPROC, ED_PP_BAD_ARG); \ | |||
} | |||
DEBUG("Running preprocessor:") | |||
ErrorInfo* ei; | |||
if ((ei = build_asm_lines(source, source, &state->lines, NULL, | |||
&state->includes))) | |||
return ei; | |||
ASMLine dummy = {.next = state->lines}; | |||
ASMLine *prev, *line = &dummy, *next = state->lines, *condemned = NULL; | |||
const ASMLine *first_optimizer = NULL, *first_checksum = NULL; | |||
while ((prev = line, line = next)) { | |||
next = line->next; | |||
if (line->data[0] == DIRECTIVE_MARKER) { | |||
if (IS_DIRECTIVE(line, DIR_ORIGIN)) | |||
continue; // Origins are handled by tokenizer | |||
DEBUG("- handling directive: %.*s", (int) line->length, line->data) | |||
if (IS_DIRECTIVE(line, DIR_OPTIMIZER)) { | |||
REQUIRE_ARG(line, DIR_OPTIMIZER) | |||
bool arg; | |||
VALIDATE(read_bool_argument(&arg, line, DIR_OPTIMIZER, false)) | |||
CATCH_DUPES(line, first_optimizer, state->optimizer, arg) | |||
} | |||
else if (IS_DIRECTIVE(line, DIR_ROM_SIZE)) { | |||
// TODO | |||
} | |||
else if (IS_DIRECTIVE(line, DIR_ROM_HEADER)) { | |||
// TODO | |||
} | |||
else if (IS_DIRECTIVE(line, DIR_ROM_CHECKSUM)) { | |||
REQUIRE_ARG(line, DIR_ROM_CHECKSUM) | |||
bool arg; | |||
VALIDATE(read_bool_argument(&arg, line, DIR_ROM_CHECKSUM, true)) | |||
CATCH_DUPES(line, first_checksum, state->header.checksum, arg) | |||
} | |||
else if (IS_DIRECTIVE(line, DIR_ROM_PRODUCT)) { | |||
// TODO | |||
} | |||
else if (IS_DIRECTIVE(line, DIR_ROM_VERSION)) { | |||
// TODO | |||
} | |||
else if (IS_DIRECTIVE(line, DIR_ROM_REGION)) { | |||
// TODO | |||
} | |||
else if (IS_DIRECTIVE(line, DIR_ROM_DECLSIZE)) { | |||
// TODO | |||
} | |||
else { | |||
asm_lines_free(condemned); | |||
return error_info_create(line, ET_PREPROC, ED_PP_UNKNOWN); | |||
} | |||
// Remove directive from lines, and schedule it for deletion: | |||
line->next = condemned; | |||
condemned = line; | |||
prev->next = next; | |||
line = prev; | |||
} | |||
} | |||
state->rom_size = 8; // TODO | |||
asm_lines_free(condemned); | |||
state->lines = dummy.next; // Fix list head if first line was a directive | |||
#ifdef DEBUG_MODE | |||
DEBUG("Dumping ASMLines:") | |||
const ASMLine *temp = state->lines; | |||
while (temp) { | |||
DEBUG("- %-40.*s [%s:%02zu]", (int) temp->length, temp->data, | |||
temp->filename, temp->original->lineno) | |||
temp = temp->next; | |||
} | |||
#endif | |||
return NULL; | |||
#undef VALIDATE | |||
#undef REQUIRE_ARG | |||
#undef CATCH_DUPES | |||
} |
@@ -0,0 +1,11 @@ | |||
/* Copyright (C) 2014-2015 Ben Kurtovic <ben.kurtovic@gmail.com> | |||
Released under the terms of the MIT License. See LICENSE for details. */ | |||
#pragma once | |||
#include "state.h" | |||
#include "../assembler.h" | |||
/* Functions */ | |||
ErrorInfo* preprocess(AssemblerState*, const LineBuffer*); |