An emulator, assembler, and disassembler for the Sega Game Gear
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 
 
 

397 lines
15 KiB

  1. /* Copyright (C) 2014-2015 Ben Kurtovic <ben.kurtovic@gmail.com>
  2. Released under the terms of the MIT License. See LICENSE for details. */
  3. #include <stdarg.h>
  4. #include <stdlib.h>
  5. #include "instructions.h"
  6. #include "inst_args.h"
  7. #include "parse_util.h"
  8. #include "../logging.h"
  9. /* Helper macros for get_inst_parser() */
  10. #define JOIN_(a, b, c, d) ((uint32_t) ((a << 24) + (b << 16) + (c << 8) + d))
  11. #define DISPATCH_(s, z) ( \
  12. (z) == 2 ? JOIN_(s[0], s[1], 0x00, 0x00) : \
  13. (z) == 3 ? JOIN_(s[0], s[1], s[2], 0x00) : \
  14. JOIN_(s[0], s[1], s[2], s[3])) \
  15. #define MAKE_CMP_(s) DISPATCH_(s, sizeof(s) / sizeof(char) - 1)
  16. #define HANDLE(m) if (key == MAKE_CMP_(#m)) return parse_inst_##m;
  17. /* Internal helper macros for instruction parsers */
  18. #define INST_ALLOC_(len) \
  19. *length = len; \
  20. if (!(*bytes = malloc(sizeof(uint8_t) * (len)))) \
  21. OUT_OF_MEMORY()
  22. #define INST_SET_(b, val) ((*bytes)[b] = val)
  23. #define INST_SET1_(b1) INST_SET_(0, b1)
  24. #define INST_SET2_(b1, b2) INST_SET1_(b1), INST_SET_(1, b2)
  25. #define INST_SET3_(b1, b2, b3) INST_SET2_(b1, b2), INST_SET_(2, b3)
  26. #define INST_SET4_(b1, b2, b3, b4) INST_SET3_(b1, b2, b3), INST_SET_(3, b4)
  27. #define INST_DISPATCH_(a, b, c, d, target, ...) target
  28. #define INST_FILL_BYTES_(len, ...) \
  29. ((len > 4) ? fill_bytes_variadic(*bytes, len, __VA_ARGS__) : \
  30. INST_DISPATCH_(__VA_ARGS__, INST_SET4_, INST_SET3_, INST_SET2_, \
  31. INST_SET1_, __VA_ARGS__)(__VA_ARGS__));
  32. #define INST_PREFIX_(reg) \
  33. (((reg) == REG_IX || (reg) == REG_IXH || (reg) == REG_IXL) ? 0xDD : 0xFD)
  34. /* Helper macros for instruction parsers */
  35. #define INST_FUNC(mnemonic) \
  36. static ASMErrorDesc parse_inst_##mnemonic( \
  37. uint8_t **bytes, size_t *length, char **symbol, ASMArgParseInfo ap_info) \
  38. #define INST_ERROR(desc) return ED_PS_##desc;
  39. #define INST_TAKES_NO_ARGS \
  40. if (ap_info.arg) \
  41. INST_ERROR(TOO_MANY_ARGS) \
  42. #define INST_TAKES_ARGS(lo, hi) \
  43. if (!ap_info.arg) \
  44. INST_ERROR(TOO_FEW_ARGS) \
  45. ASMInstArg args[3]; \
  46. size_t nargs = 0; \
  47. ASMErrorDesc err = parse_args(args, &nargs, ap_info); \
  48. if (err) \
  49. return err; \
  50. if (nargs < lo) \
  51. INST_ERROR(TOO_FEW_ARGS) \
  52. if (nargs > hi) \
  53. INST_ERROR(TOO_MANY_ARGS)
  54. #define INST_NARGS nargs
  55. #define INST_TYPE(n) args[n].type
  56. #define INST_REG(n) args[n].data.reg
  57. #define INST_IMM(n) args[n].data.imm
  58. #define INST_INDIRECT(n) args[n].data.indirect
  59. #define INST_INDEX(n) args[n].data.index
  60. #define INST_LABEL(n) args[n].data.label
  61. #define INST_COND(n) args[n].data.cond
  62. #define INST_FORCE_TYPE(n, t) { \
  63. if (INST_TYPE(n) != t) \
  64. INST_ERROR(ARG##n##_TYPE) \
  65. }
  66. #define INST_CHECK_IMM(n, m) { \
  67. if (!(INST_IMM(n).mask & (m))) \
  68. INST_ERROR(ARG##n##_RANGE) \
  69. }
  70. #define INST_INDIRECT_HL_ONLY(n) { \
  71. if (INST_INDIRECT(n).type != AT_REGISTER) \
  72. INST_ERROR(ARG##n##_TYPE) \
  73. if (INST_INDIRECT(n).addr.reg != REG_HL) \
  74. INST_ERROR(ARG##n##_BAD_REG) \
  75. }
  76. #define INST_RETURN(len, ...) { \
  77. (void) symbol; \
  78. INST_ALLOC_(len) \
  79. INST_FILL_BYTES_(len, __VA_ARGS__) \
  80. return ED_NONE; \
  81. }
  82. #define INST_RETURN_WITH_SYMBOL(len, label, ...) { \
  83. *symbol = strdup(label); \
  84. if (!(*symbol)) \
  85. OUT_OF_MEMORY() \
  86. INST_ALLOC_(len) \
  87. INST_FILL_BYTES_(len - 2, __VA_ARGS__) \
  88. return ED_NONE; \
  89. }
  90. #define INST_INDEX_PREFIX(n) INST_PREFIX_(INST_INDEX(n).reg)
  91. #define INST_INDEX_BYTES(n, b) \
  92. INST_INDEX_PREFIX(n), b, INST_INDEX(n).offset
  93. /*
  94. Fill an instruction's byte array with the given data.
  95. This internal function is only called for instructions longer than four
  96. bytes (of which there is only one: the fake emulator debugging/testing
  97. opcode with mnemonic "emu"), so it does not get used in normal situations.
  98. Return the value of the last byte inserted, for compatibility with the
  99. INST_SETn_ family of macros.
  100. */
  101. static uint8_t fill_bytes_variadic(uint8_t *bytes, size_t len, ...)
  102. {
  103. va_list vargs;
  104. va_start(vargs, len);
  105. for (size_t i = 0; i < len; i++)
  106. bytes[i] = va_arg(vargs, unsigned);
  107. va_end(vargs);
  108. return bytes[len - 1];
  109. }
  110. /*
  111. Parse a single instruction argument into an ASMInstArg object.
  112. Return ED_NONE (0) on success or an error code on failure.
  113. */
  114. static ASMErrorDesc parse_arg(
  115. ASMInstArg *arg, const char *str, size_t size, ASMDefineTable *deftable)
  116. {
  117. #define TRY_PARSER(func, argtype, field) \
  118. if (argparse_##func(&arg->data.field, info)) { \
  119. arg->type = argtype; \
  120. return ED_NONE; \
  121. }
  122. ASMArgParseInfo info = {.arg = str, .size = size, .deftable = deftable};
  123. TRY_PARSER(register, AT_REGISTER, reg)
  124. TRY_PARSER(immediate, AT_IMMEDIATE, imm)
  125. TRY_PARSER(indirect, AT_INDIRECT, indirect)
  126. TRY_PARSER(indexed, AT_INDEXED, index)
  127. TRY_PARSER(condition, AT_CONDITION, cond)
  128. TRY_PARSER(label, AT_LABEL, label)
  129. return ED_PS_ARG_SYNTAX;
  130. #undef TRY_PARSER
  131. }
  132. /*
  133. Parse an argument string into ASMInstArg objects.
  134. Return ED_NONE (0) on success or an error code on failure.
  135. */
  136. static ASMErrorDesc parse_args(
  137. ASMInstArg args[3], size_t *nargs, ASMArgParseInfo ap_info)
  138. {
  139. ASMErrorDesc err;
  140. ASMDefineTable *dt = ap_info.deftable;
  141. const char *str = ap_info.arg;
  142. size_t size = ap_info.size, start = 0, i = 0;
  143. while (i < size) {
  144. char c = str[i];
  145. if (c == ',') {
  146. if (i == start)
  147. return ED_PS_ARG_SYNTAX;
  148. if ((err = parse_arg(&args[*nargs], str + start, i - start, dt)))
  149. return err;
  150. (*nargs)++;
  151. i++;
  152. if (i < size && str[i] == ' ')
  153. i++;
  154. start = i;
  155. if (i == size)
  156. return ED_PS_ARG_SYNTAX;
  157. if (*nargs >= 3)
  158. return ED_PS_TOO_MANY_ARGS;
  159. } else {
  160. if ((c >= 'a' && c <= 'z') || (c >= '0' && c <= '9') ||
  161. c == ' ' || c == '+' || c == '-' || c == '(' || c == ')' ||
  162. c == '$' || c == '_' || c == '.')
  163. i++;
  164. else
  165. return ED_PS_ARG_SYNTAX;
  166. }
  167. }
  168. if (i > start) {
  169. if ((err = parse_arg(&args[*nargs], str + start, i - start, dt)))
  170. return err;
  171. (*nargs)++;
  172. }
  173. return ED_NONE;
  174. }
  175. /* Instruction parser functions */
  176. INST_FUNC(adc)
  177. {
  178. INST_TAKES_ARGS(2, 2)
  179. INST_FORCE_TYPE(0, AT_REGISTER)
  180. switch (INST_REG(0)) {
  181. case REG_A:
  182. switch (INST_TYPE(1)) {
  183. case AT_REGISTER:
  184. switch (INST_REG(1)) {
  185. case REG_A: INST_RETURN(1, 0x8F)
  186. case REG_B: INST_RETURN(1, 0x88)
  187. case REG_C: INST_RETURN(1, 0x89)
  188. case REG_D: INST_RETURN(1, 0x8A)
  189. case REG_E: INST_RETURN(1, 0x8B)
  190. case REG_H: INST_RETURN(1, 0x8C)
  191. case REG_L: INST_RETURN(1, 0x8D)
  192. case REG_IXH: INST_RETURN(2, 0xDD, 0x8C)
  193. case REG_IXL: INST_RETURN(2, 0xDD, 0x8D)
  194. case REG_IYH: INST_RETURN(2, 0xFD, 0x8C)
  195. case REG_IYL: INST_RETURN(2, 0xFD, 0x8D)
  196. default: INST_ERROR(ARG1_BAD_REG)
  197. }
  198. case AT_IMMEDIATE:
  199. INST_CHECK_IMM(1, IMM_U8)
  200. INST_RETURN(2, 0xCE, INST_IMM(1).uval)
  201. case AT_INDIRECT:
  202. INST_INDIRECT_HL_ONLY(1)
  203. INST_RETURN(1, 0x8E)
  204. case AT_INDEXED:
  205. INST_RETURN(3, INST_INDEX_BYTES(1, 0x8E))
  206. default:
  207. INST_ERROR(ARG1_TYPE)
  208. }
  209. case REG_HL:
  210. INST_FORCE_TYPE(1, AT_REGISTER)
  211. switch (INST_REG(1)) {
  212. case REG_BC: INST_RETURN(2, 0xED, 0x4A)
  213. case REG_DE: INST_RETURN(2, 0xED, 0x5A)
  214. case REG_HL: INST_RETURN(2, 0xED, 0x6A)
  215. case REG_SP: INST_RETURN(2, 0xED, 0x7A)
  216. default: INST_ERROR(ARG1_BAD_REG)
  217. }
  218. default:
  219. INST_ERROR(ARG0_TYPE)
  220. }
  221. }
  222. INST_FUNC(add)
  223. {
  224. INST_TAKES_ARGS(2, 2)
  225. INST_FORCE_TYPE(0, AT_REGISTER)
  226. switch (INST_REG(0)) {
  227. case REG_A:
  228. switch (INST_TYPE(1)) {
  229. case AT_REGISTER:
  230. switch (INST_REG(1)) {
  231. case REG_A: INST_RETURN(1, 0x87)
  232. case REG_B: INST_RETURN(1, 0x80)
  233. case REG_C: INST_RETURN(1, 0x81)
  234. case REG_D: INST_RETURN(1, 0x82)
  235. case REG_E: INST_RETURN(1, 0x83)
  236. case REG_H: INST_RETURN(1, 0x84)
  237. case REG_L: INST_RETURN(1, 0x85)
  238. case REG_IXH: INST_RETURN(2, 0xDD, 0x84)
  239. case REG_IXL: INST_RETURN(2, 0xDD, 0x85)
  240. case REG_IYH: INST_RETURN(2, 0xFD, 0x84)
  241. case REG_IYL: INST_RETURN(2, 0xFD, 0x85)
  242. default: INST_ERROR(ARG1_BAD_REG)
  243. }
  244. case AT_IMMEDIATE:
  245. INST_CHECK_IMM(1, IMM_U8)
  246. INST_RETURN(2, 0xC6, INST_IMM(1).uval)
  247. case AT_INDIRECT:
  248. INST_INDIRECT_HL_ONLY(1)
  249. INST_RETURN(1, 0x86)
  250. case AT_INDEXED:
  251. INST_RETURN(3, INST_INDEX_BYTES(1, 0x86))
  252. default:
  253. INST_ERROR(ARG1_TYPE)
  254. }
  255. case REG_HL:
  256. INST_FORCE_TYPE(1, AT_REGISTER)
  257. switch (INST_REG(1)) {
  258. case REG_BC: INST_RETURN(1, 0x09)
  259. case REG_DE: INST_RETURN(1, 0x19)
  260. case REG_HL: INST_RETURN(1, 0x29)
  261. case REG_SP: INST_RETURN(1, 0x39)
  262. default: INST_ERROR(ARG1_BAD_REG)
  263. }
  264. case REG_IX:
  265. case REG_IY:
  266. INST_FORCE_TYPE(1, AT_REGISTER)
  267. switch (INST_REG(1)) {
  268. case REG_BC: INST_RETURN(2, INST_INDEX_PREFIX(1), 0x09)
  269. case REG_DE: INST_RETURN(2, INST_INDEX_PREFIX(1), 0x19)
  270. case REG_IX:
  271. case REG_IY:
  272. if (INST_REG(0) != INST_REG(1))
  273. INST_ERROR(ARG1_BAD_REG)
  274. INST_RETURN(2, INST_INDEX_PREFIX(1), 0x29)
  275. case REG_SP: INST_RETURN(2, INST_INDEX_PREFIX(1), 0x39)
  276. default: INST_ERROR(ARG1_BAD_REG)
  277. }
  278. default:
  279. INST_ERROR(ARG0_TYPE)
  280. }
  281. }
  282. INST_FUNC(inc)
  283. {
  284. INST_TAKES_ARGS(1, 1)
  285. switch (INST_TYPE(0)) {
  286. case AT_REGISTER:
  287. switch (INST_REG(0)) {
  288. case REG_A: INST_RETURN(1, 0x3C)
  289. case REG_B: INST_RETURN(1, 0x04)
  290. case REG_C: INST_RETURN(1, 0x0C)
  291. case REG_D: INST_RETURN(1, 0x14)
  292. case REG_E: INST_RETURN(1, 0x1C)
  293. case REG_H: INST_RETURN(1, 0x24)
  294. case REG_L: INST_RETURN(1, 0x2C)
  295. case REG_BC: INST_RETURN(1, 0x03)
  296. case REG_DE: INST_RETURN(1, 0x13)
  297. case REG_HL: INST_RETURN(1, 0x23)
  298. case REG_SP: INST_RETURN(1, 0x33)
  299. case REG_IX: INST_RETURN(2, 0xDD, 0x23)
  300. case REG_IY: INST_RETURN(2, 0xFD, 0x23)
  301. case REG_IXH: INST_RETURN(2, 0xDD, 0x2C)
  302. case REG_IXL: INST_RETURN(2, 0xFD, 0x2C)
  303. case REG_IYH: INST_RETURN(2, 0xDD, 0x2C)
  304. case REG_IYL: INST_RETURN(2, 0xFD, 0x2C)
  305. default: INST_ERROR(ARG0_BAD_REG)
  306. }
  307. case AT_INDIRECT:
  308. INST_INDIRECT_HL_ONLY(0)
  309. INST_RETURN(1, 0x34)
  310. case AT_INDEXED:
  311. INST_RETURN(3, INST_INDEX_BYTES(0, 0x34))
  312. default:
  313. INST_ERROR(ARG0_TYPE)
  314. }
  315. }
  316. INST_FUNC(nop)
  317. {
  318. INST_TAKES_NO_ARGS
  319. INST_RETURN(1, 0x00)
  320. }
  321. INST_FUNC(reti)
  322. {
  323. INST_TAKES_NO_ARGS
  324. INST_RETURN(2, 0xED, 0x4D)
  325. }
  326. INST_FUNC(retn)
  327. {
  328. INST_TAKES_NO_ARGS
  329. INST_RETURN(2, 0xED, 0x45)
  330. }
  331. /*
  332. Return the relevant ASMInstParser function for a given mnemonic.
  333. NULL is returned if the mnemonic is not known.
  334. */
  335. ASMInstParser get_inst_parser(char mstr[MAX_MNEMONIC_SIZE])
  336. {
  337. // Exploit the fact that we can store the entire mnemonic string as a
  338. // single 32-bit value to do fast lookups:
  339. uint32_t key = (mstr[0] << 24) + (mstr[1] << 16) + (mstr[2] << 8) + mstr[3];
  340. HANDLE(adc)
  341. HANDLE(add)
  342. HANDLE(inc)
  343. HANDLE(nop)
  344. HANDLE(reti)
  345. HANDLE(retn)
  346. return NULL;
  347. }