Guest User

Untitled

a guest
Dec 14th, 2018
165
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 3.81 KB | None | 0 0
  1. // mandeljit.c
  2. #include <stdio.h>
  3. #include <stdlib.h>
  4. #include <sys/mman.h>
  5. #include <stdarg.h>
  /* Write cursor of the code generator: `dest` points at the location where
   * the next emitted machine-code byte will be stored. */
  struct microasm {
      char *dest;
  };
  typedef struct microasm microasm;
  9.  
  /* Identity macro: xmm(k) is simply k. It exists so that call sites read as
   * SSE register names rather than bare integers. */
  #define xmm(index) (index)
  12.  
  13. void asm_write(microasm *a, int n, ...) {
  14. va_list bytes;
  15. int i;
  16. va_start(bytes, n);
  17. for (i = 0; i < n; ++i) *(a->dest++) = (char) va_arg(bytes, int);
  18. va_end(bytes);
  19. }
  20.  
  21. void movsd_reg_memory(microasm *a, char reg, char disp)
  22. { asm_write(a, 5, 0xf2, 0x0f, 0x11, 0x47 | reg << 3, disp); }
  23.  
  24. void movsd_memory_reg(microasm *a, char disp, char reg)
  25. { asm_write(a, 5, 0xf2, 0x0f, 0x10, 0x47 | reg << 3, disp); }
  26.  
  27. void movsd_reg_reg(microasm *a, char src, char dst)
  28. { asm_write(a, 4, 0xf2, 0x0f, 0x11, 0xc0 | src << 3 | dst); }
  29.  
  30. void mulsd(microasm *a, char src, char dst)
  31. { asm_write(a, 4, 0xf2, 0x0f, 0x59, 0xc0 | dst << 3 | src); }
  32.  
  33. void addsd(microasm *a, char src, char dst)
  34. { asm_write(a, 4, 0xf2, 0x0f, 0x58, 0xc0 | dst << 3 | src); }
  35.  
  36. void subsd(microasm *a, char src, char dst)
  37. { asm_write(a, 4, 0xf2, 0x0f, 0x5c, 0xc0 | dst << 3 | src); }
  38.  
  39. void movpd_reg_memory(microasm *a, char reg, char disp)
  40. { asm_write(a, 5, 0x66, 0x0f, 0x11, 0x47 | reg << 3, disp); }
  41.  
  42. void movpd_memory_reg(microasm *a, char disp, char reg)
  43. { asm_write(a, 5, 0x66, 0x0f, 0x10, 0x47 | reg << 3, disp); }
  44.  
  45. void addpd_memory_reg(microasm *a, char disp, char reg)
  46. { asm_write(a, 5, 0x66, 0x0f, 0x58, 0x47 | reg << 3, disp); }
  47.  
  /* Square of an expression. The argument is evaluated twice, so it must not
   * have side effects. */
  #define sqr(value) ((value) * (value))
  49.  
  /* One complex-valued register of the JIT-compiled program. */
  typedef struct {
      double r;   /* real part */
      double i;   /* imaginary part */
  } complex;

  /* Signature of generated code: takes a pointer to the register array. */
  typedef void (*compiled)(complex *);
  52.  
  /* Use the standard offsetof instead of a hand-rolled macro that dereferences
   * a null pointer and shadows a standard-library name. */
  #include <stddef.h>
  54.  
  55. compiled compile(char *code) {
  56. char *memory = mmap(NULL, 4096, PROT_READ | PROT_WRITE | PROT_EXEC,
  57. MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
  58. microasm a = { .dest = memory };
  59. char src_dsp, dst_dsp;
  60. char const r = offsetof(complex, r);
  61. char const i = offsetof(complex, i);
  62.  
  63. for (; *code; code += 3) {
  64. src_dsp = sizeof(complex) * (code[1] - 'a');
  65. dst_dsp = sizeof(complex) * (code[2] - 'a');
  66. switch (*code) {
  67. case '=':
  68. movpd_memory_reg(&a, src_dsp, xmm(0));
  69. movpd_reg_memory(&a, xmm(0), dst_dsp);
  70. break;
  71.  
  72. case '+':
  73. movpd_memory_reg(&a, src_dsp, xmm(0));
  74. addpd_memory_reg(&a, dst_dsp, xmm(0));
  75. movpd_reg_memory(&a, xmm(0), dst_dsp);
  76. break;
  77.  
  78. case '*':
  79. movsd_memory_reg(&a, src_dsp + r, xmm(0));
  80. movsd_memory_reg(&a, src_dsp + i, xmm(1));
  81. movsd_memory_reg(&a, dst_dsp + r, xmm(2));
  82. movsd_memory_reg(&a, dst_dsp + i, xmm(3));
  83. movsd_reg_reg (&a, xmm(0), xmm(4));
  84. mulsd (&a, xmm(2), xmm(4));
  85. movsd_reg_reg (&a, xmm(1), xmm(5));
  86. mulsd (&a, xmm(3), xmm(5));
  87. subsd (&a, xmm(5), xmm(4));
  88. movsd_reg_memory(&a, xmm(4), dst_dsp + r);
  89.  
  90. mulsd (&a, xmm(0), xmm(3));
  91. mulsd (&a, xmm(1), xmm(2));
  92. addsd (&a, xmm(3), xmm(2));
  93. movsd_reg_memory(&a, xmm(2), dst_dsp + i);
  94. break;
  95.  
  96. default:
  97. fprintf(stderr, "undefined instruction %s (ASCII %x)\n", code, *code);
  98. exit(1);
  99. }
  100. }
  101.  
  102. // Return to caller (important! otherwise we'll segfault)
  103. asm_write(&a, 1, 0xc3);
  104.  
  105. return (compiled) memory;
  106. }
  107.  
  108. int main(int argc, char **argv) {
  109. compiled fn = compile(argv[1]);
  110. complex registers[4];
  111. int i, x, y;
  112. char line[1600];
  113. printf("P5\n%d %d\n%d\n", 1600, 900, 255);
  114. for (y = 0; y < 900; ++y) {
  115. for (x = 0; x < 1600; ++x) {
  116. registers[0].r = 2 * 1.6 * (x / 1600.0 - 0.5);
  117. registers[0].i = 2 * 0.9 * (y / 900.0 - 0.5);
  118. for (i = 1; i < 4; ++i) registers[i].r = registers[i].i = 0;
  119. for (i = 0; i < 256 && sqr(registers[1].r) + sqr(registers[1].i) < 4; ++i)
  120. (*fn)(registers);
  121. line[x] = i;
  122. }
  123. fwrite(line, 1, sizeof(line), stdout);
  124. }
  125. return 0;
  126. }
Add Comment
Please, Sign In to add comment